diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.292, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 116020, "_timestamp": 1646777259, "_step": 17851, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 21.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 5.0, 4.0, 1.0, 2.0, 7.0, 14.0, 29.0, 30270.0, 111.0, 20.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-701.0, -687.619140625, -674.23828125, -660.857421875, -647.4765625, -634.095703125, -620.71484375, -607.333984375, -593.953125, -580.572265625, -567.19140625, -553.810546875, -540.4296875, -527.048828125, -513.66796875, -500.287109375, -486.90625, -473.525390625, -460.14453125, -446.763671875, -433.3828125, -420.001953125, -406.62109375, -393.240234375, -379.859375, -366.478515625, -353.09765625, -339.716796875, -326.3359375, -312.955078125, -299.57421875, -286.193359375, -272.8125, -259.431640625, -246.05078125, -232.669921875, -219.2890625, -205.908203125, -192.52734375, -179.146484375, -165.765625, -152.384765625, -139.00390625, -125.623046875, -112.2421875, -98.861328125, -85.48046875, -72.099609375, -58.71875, -45.337890625, -31.95703125, -18.576171875, -5.1953125, 8.185546875, 21.56640625, 34.947265625, 48.328125, 61.708984375, 75.08984375, 88.470703125, 101.8515625, 115.232421875, 128.61328125, 141.994140625, 155.375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 12.0, 8.0, 5.0, 20.0, 8.0, 20.0, 29.0, 29.0, 35.0, 42.0, 47.0, 64.0, 55.0, 58.0, 58.0, 55.0, 71.0, 52.0, 41.0, 54.0, 44.0, 29.0, 31.0, 34.0, 16.0, 26.0, 18.0, 15.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-213.13580322265625, -208.03428649902344, -202.93275451660156, -197.83123779296875, -192.72970581054688, -187.62818908691406, -182.5266571044922, -177.42514038085938, -172.3236083984375, -167.2220916748047, -162.1205596923828, -157.01904296875, -151.91751098632812, -146.8159942626953, -141.71446228027344, -136.61294555664062, -131.5114288330078, -126.40990447998047, -121.30838012695312, -116.20685577392578, -111.10533142089844, -106.00381469726562, -100.90229034423828, -95.80076599121094, -90.6992416381836, -85.59771728515625, -80.4961929321289, -75.39466857910156, -70.29315185546875, -65.19161987304688, -60.09010314941406, -54.98857879638672, -49.88706970214844, -44.785545349121094, -39.68402099609375, -34.58250045776367, -29.480976104736328, -24.379451751708984, -19.277929306030273, -14.176406860351562, -9.074882507324219, -3.9733591079711914, 1.128164291381836, 6.229687690734863, 11.33121109008789, 16.432735443115234, 21.534257888793945, 26.635780334472656, 31.7373046875, 36.838829040527344, 41.94035339355469, 47.041873931884766, 52.14339828491211, 57.24492263793945, 62.34644317626953, 67.44796752929688, 72.54949188232422, 77.65101623535156, 82.7525405883789, 87.85406494140625, 92.95558166503906, 98.05711364746094, 103.15863037109375, 108.2601547241211, 113.36167907714844]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 7.0, 7.0, 12.0, 14.0, 24.0, 10.0, 25.0, 32.0, 41.0, 31.0, 27.0, 32.0, 44.0, 45.0, 43.0, 42.0, 45.0, 47.0, 49.0, 36.0, 32.0, 32.0, 27.0, 28.0, 30.0, 33.0, 27.0, 22.0, 22.0, 21.0, 14.0, 17.0, 13.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.2356185913086, -120.41963195800781, -116.60365295410156, -112.78766632080078, -108.9716796875, -105.15570068359375, -101.33971405029297, -97.52372741699219, -93.70774841308594, -89.89176177978516, -86.0757827758789, -82.25979614257812, -78.44381713867188, -74.6278305053711, -70.81184387207031, -66.99586486816406, -63.17987823486328, -59.363895416259766, -55.54791259765625, -51.73192596435547, -47.91594314575195, -44.09996032714844, -40.283973693847656, -36.46799087524414, -32.652008056640625, -28.83602523803711, -25.02004051208496, -21.204055786132812, -17.388072967529297, -13.572090148925781, -9.756105422973633, -5.940120697021484, -2.1241378784179688, 1.6918458938598633, 5.507829666137695, 9.323813438415527, 13.13979721069336, 16.955780029296875, 20.771764755249023, 24.587749481201172, 28.403732299804688, 32.2197151184082, 36.03569793701172, 39.8516845703125, 43.667667388916016, 47.48365020751953, 51.29963684082031, 55.11561965942383, 58.931602478027344, 62.74758529663086, 66.56356811523438, 70.37955474853516, 74.19554138183594, 78.01152038574219, 81.82750701904297, 85.64349365234375, 89.45947265625, 93.27545928955078, 97.09143829345703, 100.90742492675781, 104.72340393066406, 108.53939056396484, 112.35537719726562, 116.17135620117188, 119.98734283447266]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 18.0, 25.0, 27.0, 50.0, 81.0, 145.0, 194.0, 351.0, 504.0, 780.0, 1315.0, 2016.0, 3131.0, 4959.0, 7612.0, 11577.0, 16624.0, 24222.0, 33958.0, 45803.0, 60119.0, 75042.0, 89462.0, 101695.0, 127668.0, 97477.0, 83977.0, 69542.0, 54968.0, 41591.0, 29967.0, 21211.0, 14441.0, 9894.0, 6441.0, 4196.0, 2752.0, 1717.0, 1086.0, 735.0, 434.0, 274.0, 163.0, 113.0, 77.0, 35.0, 27.0, 14.0, 14.0, 11.0, 10.0, 6.0, 3.0, 1.0, 1.0], "bins": [-404.75, -392.6015625, -380.453125, -368.3046875, -356.15625, -344.0078125, -331.859375, -319.7109375, -307.5625, -295.4140625, -283.265625, -271.1171875, -258.96875, -246.8203125, -234.671875, -222.5234375, -210.375, -198.2265625, -186.078125, -173.9296875, -161.78125, -149.6328125, -137.484375, -125.3359375, -113.1875, -101.0390625, -88.890625, -76.7421875, -64.59375, -52.4453125, -40.296875, -28.1484375, -16.0, -3.8515625, 8.296875, 20.4453125, 32.59375, 44.7421875, 56.890625, 69.0390625, 81.1875, 93.3359375, 105.484375, 117.6328125, 129.78125, 141.9296875, 154.078125, 166.2265625, 178.375, 190.5234375, 202.671875, 214.8203125, 226.96875, 239.1171875, 251.265625, 263.4140625, 275.5625, 287.7109375, 299.859375, 312.0078125, 324.15625, 336.3046875, 348.453125, 360.6015625, 372.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 6.0, 8.0, 15.0, 9.0, 12.0, 14.0, 22.0, 18.0, 33.0, 18.0, 33.0, 19.0, 43.0, 42.0, 45.0, 43.0, 41.0, 41.0, 62.0, 42.0, 41.0, 45.0, 38.0, 38.0, 33.0, 27.0, 26.0, 27.0, 24.0, 28.0, 18.0, 12.0, 15.0, 13.0, 10.0, 10.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.875, -182.82421875, -176.7734375, -170.72265625, -164.671875, -158.62109375, -152.5703125, -146.51953125, -140.46875, -134.41796875, -128.3671875, -122.31640625, -116.265625, -110.21484375, -104.1640625, -98.11328125, -92.0625, -86.01171875, -79.9609375, -73.91015625, -67.859375, -61.80859375, -55.7578125, -49.70703125, -43.65625, -37.60546875, -31.5546875, -25.50390625, -19.453125, -13.40234375, -7.3515625, -1.30078125, 4.75, 10.80078125, 16.8515625, 22.90234375, 28.953125, 35.00390625, 41.0546875, 47.10546875, 53.15625, 59.20703125, 65.2578125, 71.30859375, 77.359375, 83.41015625, 89.4609375, 95.51171875, 101.5625, 107.61328125, 113.6640625, 119.71484375, 125.765625, 131.81640625, 137.8671875, 143.91796875, 149.96875, 156.01953125, 162.0703125, 168.12109375, 174.171875, 180.22265625, 186.2734375, 192.32421875, 198.375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 3.0, 6.0, 8.0, 14.0, 19.0, 13.0, 19.0, 24.0, 44.0, 31.0, 23.0, 44.0, 41.0, 49.0, 42.0, 52.0, 54.0, 43.0, 52.0, 55.0, 45.0, 43.0, 50.0, 36.0, 32.0, 24.0, 26.0, 20.0, 14.0, 20.0, 15.0, 11.0, 12.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.77110290527344, -142.3655548095703, -137.96002197265625, -133.55447387695312, -129.14894104003906, -124.74339294433594, -120.33785247802734, -115.93231201171875, -111.52677154541016, -107.12123107910156, -102.71569061279297, -98.31015014648438, -93.90460205078125, -89.49906921386719, -85.09352111816406, -80.68798065185547, -76.28244018554688, -71.87689971923828, -67.47135925292969, -63.06581497192383, -58.660274505615234, -54.25473403930664, -49.84918975830078, -45.44364929199219, -41.038108825683594, -36.632568359375, -32.227027893066406, -27.821483612060547, -23.415943145751953, -19.01040267944336, -14.604860305786133, -10.199317932128906, -5.793792724609375, -1.3882513046264648, 3.0172901153564453, 7.4228315353393555, 11.828372955322266, 16.23391342163086, 20.639455795288086, 25.044998168945312, 29.450538635253906, 33.8560791015625, 38.261619567871094, 42.66716384887695, 47.07270431518555, 51.47824478149414, 55.8837890625, 60.289329528808594, 64.69486999511719, 69.10041046142578, 73.50595092773438, 77.91149139404297, 82.31703186035156, 86.72257995605469, 91.12812042236328, 95.53366088867188, 99.93920135498047, 104.34474182128906, 108.75028228759766, 113.15582275390625, 117.56137084960938, 121.96690368652344, 126.37245178222656, 130.77798461914062, 135.18353271484375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 4.0, 9.0, 6.0, 7.0, 19.0, 17.0, 10.0, 24.0, 20.0, 25.0, 19.0, 22.0, 28.0, 40.0, 37.0, 28.0, 42.0, 48.0, 45.0, 38.0, 39.0, 46.0, 39.0, 47.0, 42.0, 35.0, 41.0, 38.0, 28.0, 27.0, 30.0, 16.0, 12.0, 13.0, 12.0, 14.0, 4.0, 8.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-136.23291015625, -132.0714569091797, -127.9100112915039, -123.7485580444336, -119.58710479736328, -115.4256591796875, -111.26420593261719, -107.10275268554688, -102.94129943847656, -98.77984619140625, -94.61840057373047, -90.45694732666016, -86.29549407958984, -82.13404846191406, -77.97259521484375, -73.81114196777344, -69.64969635009766, -65.48824310302734, -61.3267936706543, -57.16534423828125, -53.00389099121094, -48.84244155883789, -44.680992126464844, -40.51953887939453, -36.358089447021484, -32.19664001464844, -28.035186767578125, -23.873737335205078, -19.7122859954834, -15.550834655761719, -11.389385223388672, -7.227933883666992, -3.0664825439453125, 1.094968318939209, 5.2564191818237305, 9.417869567871094, 13.579320907592773, 17.740772247314453, 21.9022216796875, 26.06367301940918, 30.22512435913086, 34.386573791503906, 38.54802703857422, 42.709476470947266, 46.87092590332031, 51.032379150390625, 55.19382858276367, 59.35527801513672, 63.51673126220703, 67.67818450927734, 71.83963012695312, 76.00108337402344, 80.16253662109375, 84.32398986816406, 88.48543548583984, 92.64688873291016, 96.80833435058594, 100.96978759765625, 105.13123321533203, 109.29268646240234, 113.45413970947266, 117.61558532714844, 121.77703857421875, 125.93849182128906, 130.09994506835938]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 11.0, 12.0, 18.0, 19.0, 39.0, 56.0, 104.0, 204.0, 300.0, 481.0, 816.0, 1275.0, 2071.0, 3549.0, 5819.0, 9740.0, 16663.0, 28230.0, 47989.0, 82882.0, 144040.0, 251088.0, 432745.0, 714245.0, 885607.0, 642858.0, 385436.0, 224792.0, 130596.0, 75765.0, 43935.0, 25837.0, 15019.0, 8889.0, 5280.0, 3147.0, 1873.0, 1113.0, 662.0, 431.0, 261.0, 168.0, 83.0, 48.0, 31.0, 27.0, 15.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.375, -201.517578125, -194.66015625, -187.802734375, -180.9453125, -174.087890625, -167.23046875, -160.373046875, -153.515625, -146.658203125, -139.80078125, -132.943359375, -126.0859375, -119.228515625, -112.37109375, -105.513671875, -98.65625, -91.798828125, -84.94140625, -78.083984375, -71.2265625, -64.369140625, -57.51171875, -50.654296875, -43.796875, -36.939453125, -30.08203125, -23.224609375, -16.3671875, -9.509765625, -2.65234375, 4.205078125, 11.0625, 17.919921875, 24.77734375, 31.634765625, 38.4921875, 45.349609375, 52.20703125, 59.064453125, 65.921875, 72.779296875, 79.63671875, 86.494140625, 93.3515625, 100.208984375, 107.06640625, 113.923828125, 120.78125, 127.638671875, 134.49609375, 141.353515625, 148.2109375, 155.068359375, 161.92578125, 168.783203125, 175.640625, 182.498046875, 189.35546875, 196.212890625, 203.0703125, 209.927734375, 216.78515625, 223.642578125, 230.5]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 6.0, 8.0, 3.0, 6.0, 18.0, 17.0, 16.0, 10.0, 14.0, 24.0, 25.0, 30.0, 24.0, 27.0, 39.0, 48.0, 47.0, 36.0, 33.0, 41.0, 45.0, 44.0, 36.0, 41.0, 26.0, 49.0, 40.0, 35.0, 39.0, 18.0, 27.0, 28.0, 20.0, 11.0, 14.0, 12.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.0, -111.431640625, -107.86328125, -104.294921875, -100.7265625, -97.158203125, -93.58984375, -90.021484375, -86.453125, -82.884765625, -79.31640625, -75.748046875, -72.1796875, -68.611328125, -65.04296875, -61.474609375, -57.90625, -54.337890625, -50.76953125, -47.201171875, -43.6328125, -40.064453125, -36.49609375, -32.927734375, -29.359375, -25.791015625, -22.22265625, -18.654296875, -15.0859375, -11.517578125, -7.94921875, -4.380859375, -0.8125, 2.755859375, 6.32421875, 9.892578125, 13.4609375, 17.029296875, 20.59765625, 24.166015625, 27.734375, 31.302734375, 34.87109375, 38.439453125, 42.0078125, 45.576171875, 49.14453125, 52.712890625, 56.28125, 59.849609375, 63.41796875, 66.986328125, 70.5546875, 74.123046875, 77.69140625, 81.259765625, 84.828125, 88.396484375, 91.96484375, 95.533203125, 99.1015625, 102.669921875, 106.23828125, 109.806640625, 113.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 7.0, 14.0, 16.0, 18.0, 34.0, 72.0, 121.0, 154.0, 280.0, 479.0, 819.0, 1399.0, 2416.0, 3963.0, 7097.0, 12505.0, 22166.0, 38226.0, 66934.0, 113626.0, 191997.0, 312977.0, 481061.0, 672622.0, 730343.0, 568556.0, 380966.0, 239674.0, 144990.0, 85483.0, 49339.0, 28158.0, 16106.0, 9226.0, 5097.0, 2875.0, 1788.0, 1085.0, 632.0, 344.0, 221.0, 137.0, 87.0, 54.0, 39.0, 31.0, 19.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-144.25, -139.7734375, -135.296875, -130.8203125, -126.34375, -121.8671875, -117.390625, -112.9140625, -108.4375, -103.9609375, -99.484375, -95.0078125, -90.53125, -86.0546875, -81.578125, -77.1015625, -72.625, -68.1484375, -63.671875, -59.1953125, -54.71875, -50.2421875, -45.765625, -41.2890625, -36.8125, -32.3359375, -27.859375, -23.3828125, -18.90625, -14.4296875, -9.953125, -5.4765625, -1.0, 3.4765625, 7.953125, 12.4296875, 16.90625, 21.3828125, 25.859375, 30.3359375, 34.8125, 39.2890625, 43.765625, 48.2421875, 52.71875, 57.1953125, 61.671875, 66.1484375, 70.625, 75.1015625, 79.578125, 84.0546875, 88.53125, 93.0078125, 97.484375, 101.9609375, 106.4375, 110.9140625, 115.390625, 119.8671875, 124.34375, 128.8203125, 133.296875, 137.7734375, 142.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 12.0, 12.0, 12.0, 21.0, 14.0, 22.0, 20.0, 46.0, 57.0, 62.0, 88.0, 98.0, 131.0, 117.0, 153.0, 170.0, 210.0, 266.0, 260.0, 292.0, 290.0, 244.0, 251.0, 191.0, 167.0, 145.0, 164.0, 103.0, 90.0, 80.0, 60.0, 53.0, 38.0, 38.0, 14.0, 20.0, 24.0, 7.0, 12.0, 3.0, 5.0, 0.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.21875, -56.3203125, -54.421875, -52.5234375, -50.625, -48.7265625, -46.828125, -44.9296875, -43.03125, -41.1328125, -39.234375, -37.3359375, -35.4375, -33.5390625, -31.640625, -29.7421875, -27.84375, -25.9453125, -24.046875, -22.1484375, -20.25, -18.3515625, -16.453125, -14.5546875, -12.65625, -10.7578125, -8.859375, -6.9609375, -5.0625, -3.1640625, -1.265625, 0.6328125, 2.53125, 4.4296875, 6.328125, 8.2265625, 10.125, 12.0234375, 13.921875, 15.8203125, 17.71875, 19.6171875, 21.515625, 23.4140625, 25.3125, 27.2109375, 29.109375, 31.0078125, 32.90625, 34.8046875, 36.703125, 38.6015625, 40.5, 42.3984375, 44.296875, 46.1953125, 48.09375, 49.9921875, 51.890625, 53.7890625, 55.6875, 57.5859375, 59.484375, 61.3828125, 63.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 5.0, 3.0, 8.0, 14.0, 12.0, 20.0, 20.0, 26.0, 26.0, 33.0, 31.0, 43.0, 39.0, 56.0, 50.0, 49.0, 60.0, 62.0, 62.0, 38.0, 45.0, 36.0, 44.0, 32.0, 33.0, 30.0, 24.0, 25.0, 23.0, 11.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-166.92550659179688, -162.397705078125, -157.86990356445312, -153.34210205078125, -148.81430053710938, -144.28648376464844, -139.75868225097656, -135.2308807373047, -130.7030792236328, -126.17527770996094, -121.64747619628906, -117.11966705322266, -112.59186553955078, -108.0640640258789, -103.5362548828125, -99.00845336914062, -94.48065185546875, -89.95285034179688, -85.425048828125, -80.8972396850586, -76.36943817138672, -71.84163665771484, -67.31382751464844, -62.78602600097656, -58.25822448730469, -53.73042297363281, -49.20261764526367, -44.67481231689453, -40.147010803222656, -35.61920928955078, -31.09140396118164, -26.563600540161133, -22.035781860351562, -17.507978439331055, -12.980175018310547, -8.452371597290039, -3.9245681762695312, 0.6032352447509766, 5.131038665771484, 9.658842086791992, 14.1866455078125, 18.714448928833008, 23.242252349853516, 27.770055770874023, 32.29785919189453, 36.825660705566406, 41.35346603393555, 45.88127136230469, 50.40907287597656, 54.93687438964844, 59.46467971801758, 63.99248504638672, 68.5202865600586, 73.04808807373047, 77.57589721679688, 82.10369873046875, 86.63150024414062, 91.1593017578125, 95.68710327148438, 100.21491241455078, 104.74271392822266, 109.27051544189453, 113.79832458496094, 118.32612609863281, 122.85392761230469]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 10.0, 9.0, 7.0, 12.0, 18.0, 13.0, 14.0, 16.0, 15.0, 35.0, 27.0, 23.0, 34.0, 24.0, 49.0, 39.0, 32.0, 42.0, 47.0, 40.0, 43.0, 32.0, 37.0, 45.0, 30.0, 41.0, 32.0, 27.0, 27.0, 34.0, 25.0, 23.0, 19.0, 10.0, 16.0, 13.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.46715545654297, -115.53140258789062, -111.59565734863281, -107.65990447998047, -103.72415161132812, -99.78840637207031, -95.85265350341797, -91.91690063476562, -87.98115539550781, -84.04540252685547, -80.10965728759766, -76.17390441894531, -72.23815155029297, -68.30239868164062, -64.36665344238281, -60.43090057373047, -56.495147705078125, -52.55939865112305, -48.6236457824707, -44.687896728515625, -40.75214385986328, -36.8163948059082, -32.880645751953125, -28.944894790649414, -25.009143829345703, -21.073392868041992, -17.13764190673828, -13.201892852783203, -9.266141891479492, -5.330390930175781, -1.3946418762207031, 2.541109085083008, 6.4768524169921875, 10.412603378295898, 14.348353385925293, 18.284103393554688, 22.2198543548584, 26.15560531616211, 30.091354370117188, 34.02710723876953, 37.96285629272461, 41.89860534667969, 45.83435821533203, 49.77010726928711, 53.70585632324219, 57.64160919189453, 61.57735824584961, 65.51310729980469, 69.44886016845703, 73.38461303710938, 77.32035827636719, 81.25611114501953, 85.19186401367188, 89.12760925292969, 93.06336212158203, 96.99911499023438, 100.93486022949219, 104.87061309814453, 108.80635833740234, 112.74211120605469, 116.67786407470703, 120.61361694335938, 124.54936218261719, 128.485107421875, 132.42086791992188]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 3.0, 8.0, 6.0, 14.0, 25.0, 46.0, 54.0, 78.0, 123.0, 170.0, 289.0, 426.0, 753.0, 1063.0, 1747.0, 2700.0, 4267.0, 6539.0, 10310.0, 16185.0, 25888.0, 41322.0, 66798.0, 106493.0, 153691.0, 177951.0, 151808.0, 104255.0, 65440.0, 40768.0, 25368.0, 15885.0, 10177.0, 6536.0, 4114.0, 2565.0, 1673.0, 1069.0, 676.0, 444.0, 298.0, 162.0, 124.0, 84.0, 51.0, 36.0, 29.0, 21.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-193.75, -187.962890625, -182.17578125, -176.388671875, -170.6015625, -164.814453125, -159.02734375, -153.240234375, -147.453125, -141.666015625, -135.87890625, -130.091796875, -124.3046875, -118.517578125, -112.73046875, -106.943359375, -101.15625, -95.369140625, -89.58203125, -83.794921875, -78.0078125, -72.220703125, -66.43359375, -60.646484375, -54.859375, -49.072265625, -43.28515625, -37.498046875, -31.7109375, -25.923828125, -20.13671875, -14.349609375, -8.5625, -2.775390625, 3.01171875, 8.798828125, 14.5859375, 20.373046875, 26.16015625, 31.947265625, 37.734375, 43.521484375, 49.30859375, 55.095703125, 60.8828125, 66.669921875, 72.45703125, 78.244140625, 84.03125, 89.818359375, 95.60546875, 101.392578125, 107.1796875, 112.966796875, 118.75390625, 124.541015625, 130.328125, 136.115234375, 141.90234375, 147.689453125, 153.4765625, 159.263671875, 165.05078125, 170.837890625, 176.625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 8.0, 4.0, 10.0, 5.0, 22.0, 23.0, 18.0, 28.0, 25.0, 22.0, 24.0, 27.0, 26.0, 30.0, 36.0, 42.0, 44.0, 42.0, 34.0, 36.0, 30.0, 44.0, 41.0, 44.0, 42.0, 40.0, 35.0, 25.0, 26.0, 25.0, 19.0, 17.0, 16.0, 16.0, 11.0, 6.0, 16.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.4375, -89.125, -85.8125, -82.5, -79.1875, -75.875, -72.5625, -69.25, -65.9375, -62.625, -59.3125, -56.0, -52.6875, -49.375, -46.0625, -42.75, -39.4375, -36.125, -32.8125, -29.5, -26.1875, -22.875, -19.5625, -16.25, -12.9375, -9.625, -6.3125, -3.0, 0.3125, 3.625, 6.9375, 10.25, 13.5625, 16.875, 20.1875, 23.5, 26.8125, 30.125, 33.4375, 36.75, 40.0625, 43.375, 46.6875, 50.0, 53.3125, 56.625, 59.9375, 63.25, 66.5625, 69.875, 73.1875, 76.5, 79.8125, 83.125, 86.4375, 89.75, 93.0625, 96.375, 99.6875, 103.0, 106.3125, 109.625, 112.9375, 116.25, 119.5625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 12.0, 20.0, 44.0, 38.0, 68.0, 96.0, 112.0, 182.0, 267.0, 360.0, 517.0, 766.0, 1233.0, 2073.0, 3145.0, 5135.0, 8740.0, 15803.0, 29857.0, 61687.0, 141734.0, 294670.0, 258318.0, 113885.0, 50816.0, 25364.0, 13497.0, 7643.0, 4415.0, 2845.0, 1700.0, 1137.0, 757.0, 506.0, 324.0, 225.0, 190.0, 87.0, 85.0, 53.0, 38.0, 32.0, 24.0, 13.0, 6.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-319.0, -308.66796875, -298.3359375, -288.00390625, -277.671875, -267.33984375, -257.0078125, -246.67578125, -236.34375, -226.01171875, -215.6796875, -205.34765625, -195.015625, -184.68359375, -174.3515625, -164.01953125, -153.6875, -143.35546875, -133.0234375, -122.69140625, -112.359375, -102.02734375, -91.6953125, -81.36328125, -71.03125, -60.69921875, -50.3671875, -40.03515625, -29.703125, -19.37109375, -9.0390625, 1.29296875, 11.625, 21.95703125, 32.2890625, 42.62109375, 52.953125, 63.28515625, 73.6171875, 83.94921875, 94.28125, 104.61328125, 114.9453125, 125.27734375, 135.609375, 145.94140625, 156.2734375, 166.60546875, 176.9375, 187.26953125, 197.6015625, 207.93359375, 218.265625, 228.59765625, 238.9296875, 249.26171875, 259.59375, 269.92578125, 280.2578125, 290.58984375, 300.921875, 311.25390625, 321.5859375, 331.91796875, 342.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 7.0, 8.0, 8.0, 14.0, 15.0, 5.0, 18.0, 12.0, 27.0, 16.0, 23.0, 27.0, 35.0, 41.0, 42.0, 39.0, 41.0, 41.0, 53.0, 44.0, 40.0, 40.0, 42.0, 27.0, 40.0, 33.0, 33.0, 30.0, 25.0, 22.0, 14.0, 22.0, 18.0, 15.0, 19.0, 9.0, 13.0, 13.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -72.580078125, -70.09765625, -67.615234375, -65.1328125, -62.650390625, -60.16796875, -57.685546875, -55.203125, -52.720703125, -50.23828125, -47.755859375, -45.2734375, -42.791015625, -40.30859375, -37.826171875, -35.34375, -32.861328125, -30.37890625, -27.896484375, -25.4140625, -22.931640625, -20.44921875, -17.966796875, -15.484375, -13.001953125, -10.51953125, -8.037109375, -5.5546875, -3.072265625, -0.58984375, 1.892578125, 4.375, 6.857421875, 9.33984375, 11.822265625, 14.3046875, 16.787109375, 19.26953125, 21.751953125, 24.234375, 26.716796875, 29.19921875, 31.681640625, 34.1640625, 36.646484375, 39.12890625, 41.611328125, 44.09375, 46.576171875, 49.05859375, 51.541015625, 54.0234375, 56.505859375, 58.98828125, 61.470703125, 63.953125, 66.435546875, 68.91796875, 71.400390625, 73.8828125, 76.365234375, 78.84765625, 81.330078125, 83.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 38.0, 51.0, 73.0, 104.0, 154.0, 249.0, 368.0, 640.0, 1245.0, 3131.0, 13068.0, 101937.0, 652468.0, 240525.0, 25595.0, 5021.0, 1667.0, 825.0, 466.0, 276.0, 185.0, 114.0, 81.0, 52.0, 42.0, 26.0, 26.0, 17.0, 7.0, 7.0, 8.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.5, -337.5, -326.5, -315.5, -304.5, -293.5, -282.5, -271.5, -260.5, -249.5, -238.5, -227.5, -216.5, -205.5, -194.5, -183.5, -172.5, -161.5, -150.5, -139.5, -128.5, -117.5, -106.5, -95.5, -84.5, -73.5, -62.5, -51.5, -40.5, -29.5, -18.5, -7.5, 3.5, 14.5, 25.5, 36.5, 47.5, 58.5, 69.5, 80.5, 91.5, 102.5, 113.5, 124.5, 135.5, 146.5, 157.5, 168.5, 179.5, 190.5, 201.5, 212.5, 223.5, 234.5, 245.5, 256.5, 267.5, 278.5, 289.5, 300.5, 311.5, 322.5, 333.5, 344.5, 355.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 9.0, 9.0, 14.0, 25.0, 26.0, 50.0, 141.0, 228.0, 214.0, 147.0, 60.0, 32.0, 14.0, 15.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224151611328125, -0.021712303161621094, -0.021009445190429688, -0.02030658721923828, -0.019603729248046875, -0.01890087127685547, -0.018198013305664062, -0.017495155334472656, -0.01679229736328125, -0.016089439392089844, -0.015386581420898438, -0.014683723449707031, -0.013980865478515625, -0.013278007507324219, -0.012575149536132812, -0.011872291564941406, -0.01116943359375, -0.010466575622558594, -0.009763717651367188, -0.009060859680175781, -0.008358001708984375, -0.007655143737792969, -0.0069522857666015625, -0.006249427795410156, -0.00554656982421875, -0.004843711853027344, -0.0041408538818359375, -0.0034379959106445312, -0.002735137939453125, -0.0020322799682617188, -0.0013294219970703125, -0.0006265640258789062, 7.62939453125e-05, 0.0007791519165039062, 0.0014820098876953125, 0.0021848678588867188, 0.002887725830078125, 0.0035905838012695312, 0.0042934417724609375, 0.004996299743652344, 0.00569915771484375, 0.006402015686035156, 0.0071048736572265625, 0.007807731628417969, 0.008510589599609375, 0.009213447570800781, 0.009916305541992188, 0.010619163513183594, 0.011322021484375, 0.012024879455566406, 0.012727737426757812, 0.013430595397949219, 0.014133453369140625, 0.014836311340332031, 0.015539169311523438, 0.016242027282714844, 0.01694488525390625, 0.017647743225097656, 0.018350601196289062, 0.01905345916748047, 0.019756317138671875, 0.02045917510986328, 0.021162033081054688, 0.021864891052246094, 0.0225677490234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 14.0, 9.0, 13.0, 38.0, 39.0, 57.0, 73.0, 77.0, 113.0, 143.0, 153.0, 237.0, 274.0, 452.0, 642.0, 962.0, 1613.0, 3250.0, 7974.0, 23796.0, 78933.0, 222650.0, 355951.0, 228150.0, 81691.0, 24898.0, 8077.0, 3357.0, 1655.0, 868.0, 595.0, 456.0, 324.0, 252.0, 198.0, 139.0, 104.0, 77.0, 53.0, 47.0, 35.0, 31.0, 20.0, 19.0, 13.0, 7.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-213.625, -207.435546875, -201.24609375, -195.056640625, -188.8671875, -182.677734375, -176.48828125, -170.298828125, -164.109375, -157.919921875, -151.73046875, -145.541015625, -139.3515625, -133.162109375, -126.97265625, -120.783203125, -114.59375, -108.404296875, -102.21484375, -96.025390625, -89.8359375, -83.646484375, -77.45703125, -71.267578125, -65.078125, -58.888671875, -52.69921875, -46.509765625, -40.3203125, -34.130859375, -27.94140625, -21.751953125, -15.5625, -9.373046875, -3.18359375, 3.005859375, 9.1953125, 15.384765625, 21.57421875, 27.763671875, 33.953125, 40.142578125, 46.33203125, 52.521484375, 58.7109375, 64.900390625, 71.08984375, 77.279296875, 83.46875, 89.658203125, 95.84765625, 102.037109375, 108.2265625, 114.416015625, 120.60546875, 126.794921875, 132.984375, 139.173828125, 145.36328125, 151.552734375, 157.7421875, 163.931640625, 170.12109375, 176.310546875, 182.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 10.0, 18.0, 24.0, 25.0, 28.0, 34.0, 53.0, 52.0, 78.0, 88.0, 71.0, 81.0, 75.0, 80.0, 53.0, 56.0, 39.0, 43.0, 14.0, 14.0, 16.0, 7.0, 6.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-60.6875, -58.99365234375, -57.2998046875, -55.60595703125, -53.912109375, -52.21826171875, -50.5244140625, -48.83056640625, -47.13671875, -45.44287109375, -43.7490234375, -42.05517578125, -40.361328125, -38.66748046875, -36.9736328125, -35.27978515625, -33.5859375, -31.89208984375, -30.1982421875, -28.50439453125, -26.810546875, -25.11669921875, -23.4228515625, -21.72900390625, -20.03515625, -18.34130859375, -16.6474609375, -14.95361328125, -13.259765625, -11.56591796875, -9.8720703125, -8.17822265625, -6.484375, -4.79052734375, -3.0966796875, -1.40283203125, 0.291015625, 1.98486328125, 3.6787109375, 5.37255859375, 7.06640625, 8.76025390625, 10.4541015625, 12.14794921875, 13.841796875, 15.53564453125, 17.2294921875, 18.92333984375, 20.6171875, 22.31103515625, 24.0048828125, 25.69873046875, 27.392578125, 29.08642578125, 30.7802734375, 32.47412109375, 34.16796875, 35.86181640625, 37.5556640625, 39.24951171875, 40.943359375, 42.63720703125, 44.3310546875, 46.02490234375, 47.71875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 16.0, 16.0, 20.0, 15.0, 21.0, 28.0, 21.0, 48.0, 33.0, 45.0, 53.0, 47.0, 42.0, 43.0, 57.0, 39.0, 47.0, 60.0, 39.0, 37.0, 45.0, 29.0, 24.0, 19.0, 33.0, 11.0, 11.0, 12.0, 12.0, 7.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-123.48811340332031, -119.9590835571289, -116.43004608154297, -112.90101623535156, -109.37197875976562, -105.84294891357422, -102.31391906738281, -98.78488159179688, -95.25584411621094, -91.72681427001953, -88.1977767944336, -84.66874694824219, -81.13970947265625, -77.61067962646484, -74.08164978027344, -70.5526123046875, -67.0235824584961, -63.49454879760742, -59.96551513671875, -56.436485290527344, -52.907447814941406, -49.37841796875, -45.84938430786133, -42.320350646972656, -38.791316986083984, -35.26228332519531, -31.73324966430664, -28.2042179107666, -24.67518424987793, -21.146150588989258, -17.61711883544922, -14.088085174560547, -10.559043884277344, -7.03001070022583, -3.5009775161743164, 0.028055191040039062, 3.557088851928711, 7.086122512817383, 10.615154266357422, 14.144187927246094, 17.673221588134766, 21.202255249023438, 24.73128890991211, 28.26032066345215, 31.78935432434082, 35.318389892578125, 38.84741973876953, 42.3764533996582, 45.905487060546875, 49.43452072143555, 52.96355438232422, 56.492584228515625, 60.02162170410156, 63.55065155029297, 67.07968139648438, 70.60871887207031, 74.13775634765625, 77.66678619384766, 81.1958236694336, 84.724853515625, 88.25389099121094, 91.78292083740234, 95.31195068359375, 98.84098815917969, 102.3700180053711]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 8.0, 6.0, 12.0, 11.0, 13.0, 16.0, 17.0, 17.0, 29.0, 29.0, 36.0, 24.0, 35.0, 35.0, 52.0, 40.0, 39.0, 43.0, 29.0, 37.0, 40.0, 43.0, 35.0, 45.0, 34.0, 37.0, 37.0, 23.0, 28.0, 24.0, 14.0, 20.0, 14.0, 15.0, 13.0, 8.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.05889129638672, -110.54922485351562, -107.03955841064453, -103.52989196777344, -100.02022552490234, -96.51055908203125, -93.00089263916016, -89.49122619628906, -85.98155975341797, -82.47189331054688, -78.96222686767578, -75.45256042480469, -71.9428939819336, -68.4332275390625, -64.9235610961914, -61.41389465332031, -57.90422439575195, -54.39455795288086, -50.884891510009766, -47.37522506713867, -43.86555862426758, -40.35588836669922, -36.846221923828125, -33.33655548095703, -29.82689094543457, -26.317224502563477, -22.807558059692383, -19.297889709472656, -15.788224220275879, -12.278556823730469, -8.768890380859375, -5.259223937988281, -1.7495574951171875, 1.7601091861724854, 5.269775867462158, 8.77944278717041, 12.289109230041504, 15.798776626586914, 19.308443069458008, 22.8181095123291, 26.327775955200195, 29.83744239807129, 33.347110748291016, 36.85677719116211, 40.3664436340332, 43.8761100769043, 47.38577651977539, 50.895442962646484, 54.40510940551758, 57.91477584838867, 61.424442291259766, 64.93411254882812, 68.44377899169922, 71.95344543457031, 75.4631118774414, 78.9727783203125, 82.4824447631836, 85.99211120605469, 89.50177764892578, 93.01144409179688, 96.52111053466797, 100.03077697753906, 103.54044342041016, 107.05010986328125, 110.55977630615234]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 10.0, 16.0, 26.0, 45.0, 67.0, 100.0, 162.0, 245.0, 415.0, 665.0, 999.0, 1570.0, 2462.0, 3730.0, 5804.0, 8949.0, 13743.0, 20482.0, 29909.0, 42420.0, 57996.0, 75721.0, 93355.0, 106658.0, 111350.0, 106843.0, 94144.0, 77013.0, 59177.0, 43402.0, 30517.0, 20662.0, 13984.0, 9234.0, 6000.0, 3825.0, 2513.0, 1558.0, 1045.0, 609.0, 388.0, 246.0, 180.0, 120.0, 83.0, 41.0, 38.0, 17.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0], "bins": [-128.5, -124.7783203125, -121.056640625, -117.3349609375, -113.61328125, -109.8916015625, -106.169921875, -102.4482421875, -98.7265625, -95.0048828125, -91.283203125, -87.5615234375, -83.83984375, -80.1181640625, -76.396484375, -72.6748046875, -68.953125, -65.2314453125, -61.509765625, -57.7880859375, -54.06640625, -50.3447265625, -46.623046875, -42.9013671875, -39.1796875, -35.4580078125, -31.736328125, -28.0146484375, -24.29296875, -20.5712890625, -16.849609375, -13.1279296875, -9.40625, -5.6845703125, -1.962890625, 1.7587890625, 5.48046875, 9.2021484375, 12.923828125, 16.6455078125, 20.3671875, 24.0888671875, 27.810546875, 31.5322265625, 35.25390625, 38.9755859375, 42.697265625, 46.4189453125, 50.140625, 53.8623046875, 57.583984375, 61.3056640625, 65.02734375, 68.7490234375, 72.470703125, 76.1923828125, 79.9140625, 83.6357421875, 87.357421875, 91.0791015625, 94.80078125, 98.5224609375, 102.244140625, 105.9658203125, 109.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 3.0, 8.0, 7.0, 3.0, 7.0, 11.0, 10.0, 20.0, 18.0, 18.0, 23.0, 27.0, 26.0, 35.0, 36.0, 36.0, 51.0, 40.0, 42.0, 35.0, 46.0, 37.0, 33.0, 44.0, 41.0, 34.0, 43.0, 33.0, 34.0, 40.0, 25.0, 21.0, 20.0, 16.0, 13.0, 13.0, 11.0, 12.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.3125, -96.953125, -93.59375, -90.234375, -86.875, -83.515625, -80.15625, -76.796875, -73.4375, -70.078125, -66.71875, -63.359375, -60.0, -56.640625, -53.28125, -49.921875, -46.5625, -43.203125, -39.84375, -36.484375, -33.125, -29.765625, -26.40625, -23.046875, -19.6875, -16.328125, -12.96875, -9.609375, -6.25, -2.890625, 0.46875, 3.828125, 7.1875, 10.546875, 13.90625, 17.265625, 20.625, 23.984375, 27.34375, 30.703125, 34.0625, 37.421875, 40.78125, 44.140625, 47.5, 50.859375, 54.21875, 57.578125, 60.9375, 64.296875, 67.65625, 71.015625, 74.375, 77.734375, 81.09375, 84.453125, 87.8125, 91.171875, 94.53125, 97.890625, 101.25, 104.609375, 107.96875, 111.328125, 114.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 9.0, 16.0, 30.0, 57.0, 78.0, 126.0, 177.0, 329.0, 507.0, 848.0, 1282.0, 2054.0, 3007.0, 4726.0, 7360.0, 11442.0, 17330.0, 26307.0, 37483.0, 53059.0, 70238.0, 88302.0, 104195.0, 112638.0, 110688.0, 100270.0, 83339.0, 64655.0, 47858.0, 33491.0, 23198.0, 15260.0, 10139.0, 6412.0, 4179.0, 2718.0, 1725.0, 1113.0, 690.0, 468.0, 283.0, 167.0, 113.0, 75.0, 42.0, 31.0, 20.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-120.25, -116.697265625, -113.14453125, -109.591796875, -106.0390625, -102.486328125, -98.93359375, -95.380859375, -91.828125, -88.275390625, -84.72265625, -81.169921875, -77.6171875, -74.064453125, -70.51171875, -66.958984375, -63.40625, -59.853515625, -56.30078125, -52.748046875, -49.1953125, -45.642578125, -42.08984375, -38.537109375, -34.984375, -31.431640625, -27.87890625, -24.326171875, -20.7734375, -17.220703125, -13.66796875, -10.115234375, -6.5625, -3.009765625, 0.54296875, 4.095703125, 7.6484375, 11.201171875, 14.75390625, 18.306640625, 21.859375, 25.412109375, 28.96484375, 32.517578125, 36.0703125, 39.623046875, 43.17578125, 46.728515625, 50.28125, 53.833984375, 57.38671875, 60.939453125, 64.4921875, 68.044921875, 71.59765625, 75.150390625, 78.703125, 82.255859375, 85.80859375, 89.361328125, 92.9140625, 96.466796875, 100.01953125, 103.572265625, 107.125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 7.0, 17.0, 12.0, 17.0, 24.0, 27.0, 21.0, 22.0, 21.0, 36.0, 29.0, 34.0, 45.0, 41.0, 39.0, 52.0, 54.0, 45.0, 31.0, 43.0, 29.0, 42.0, 31.0, 40.0, 36.0, 23.0, 23.0, 20.0, 21.0, 15.0, 18.0, 13.0, 13.0, 8.0, 8.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.724609375, -65.38671875, -63.048828125, -60.7109375, -58.373046875, -56.03515625, -53.697265625, -51.359375, -49.021484375, -46.68359375, -44.345703125, -42.0078125, -39.669921875, -37.33203125, -34.994140625, -32.65625, -30.318359375, -27.98046875, -25.642578125, -23.3046875, -20.966796875, -18.62890625, -16.291015625, -13.953125, -11.615234375, -9.27734375, -6.939453125, -4.6015625, -2.263671875, 0.07421875, 2.412109375, 4.75, 7.087890625, 9.42578125, 11.763671875, 14.1015625, 16.439453125, 18.77734375, 21.115234375, 23.453125, 25.791015625, 28.12890625, 30.466796875, 32.8046875, 35.142578125, 37.48046875, 39.818359375, 42.15625, 44.494140625, 46.83203125, 49.169921875, 51.5078125, 53.845703125, 56.18359375, 58.521484375, 60.859375, 63.197265625, 65.53515625, 67.873046875, 70.2109375, 72.548828125, 74.88671875, 77.224609375, 79.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 12.0, 8.0, 22.0, 26.0, 46.0, 61.0, 95.0, 159.0, 248.0, 437.0, 656.0, 1043.0, 1769.0, 3079.0, 5282.0, 9518.0, 17000.0, 30473.0, 52508.0, 85355.0, 124592.0, 158090.0, 164186.0, 141159.0, 100504.0, 64472.0, 38083.0, 21639.0, 11928.0, 6684.0, 3827.0, 2181.0, 1285.0, 772.0, 463.0, 312.0, 202.0, 129.0, 76.0, 52.0, 39.0, 20.0, 32.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0], "bins": [-55.84375, -54.25732421875, -52.6708984375, -51.08447265625, -49.498046875, -47.91162109375, -46.3251953125, -44.73876953125, -43.15234375, -41.56591796875, -39.9794921875, -38.39306640625, -36.806640625, -35.22021484375, -33.6337890625, -32.04736328125, -30.4609375, -28.87451171875, -27.2880859375, -25.70166015625, -24.115234375, -22.52880859375, -20.9423828125, -19.35595703125, -17.76953125, -16.18310546875, -14.5966796875, -13.01025390625, -11.423828125, -9.83740234375, -8.2509765625, -6.66455078125, -5.078125, -3.49169921875, -1.9052734375, -0.31884765625, 1.267578125, 2.85400390625, 4.4404296875, 6.02685546875, 7.61328125, 9.19970703125, 10.7861328125, 12.37255859375, 13.958984375, 15.54541015625, 17.1318359375, 18.71826171875, 20.3046875, 21.89111328125, 23.4775390625, 25.06396484375, 26.650390625, 28.23681640625, 29.8232421875, 31.40966796875, 32.99609375, 34.58251953125, 36.1689453125, 37.75537109375, 39.341796875, 40.92822265625, 42.5146484375, 44.10107421875, 45.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 13.0, 10.0, 12.0, 11.0, 16.0, 30.0, 26.0, 19.0, 43.0, 24.0, 45.0, 58.0, 59.0, 50.0, 56.0, 70.0, 62.0, 46.0, 44.0, 42.0, 36.0, 42.0, 20.0, 24.0, 23.0, 29.0, 16.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.004869401454925537, -0.004714846611022949, -0.004560291767120361, -0.0044057369232177734, -0.0042511820793151855, -0.004096627235412598, -0.00394207239151001, -0.003787517547607422, -0.003632962703704834, -0.003478407859802246, -0.003323853015899658, -0.0031692981719970703, -0.0030147433280944824, -0.0028601884841918945, -0.0027056336402893066, -0.0025510787963867188, -0.002396523952484131, -0.002241969108581543, -0.002087414264678955, -0.0019328594207763672, -0.0017783045768737793, -0.0016237497329711914, -0.0014691948890686035, -0.0013146400451660156, -0.0011600852012634277, -0.0010055303573608398, -0.000850975513458252, -0.0006964206695556641, -0.0005418658256530762, -0.0003873109817504883, -0.0002327561378479004, -7.82012939453125e-05, 7.635354995727539e-05, 0.00023090839385986328, 0.00038546323776245117, 0.0005400180816650391, 0.000694572925567627, 0.0008491277694702148, 0.0010036826133728027, 0.0011582374572753906, 0.0013127923011779785, 0.0014673471450805664, 0.0016219019889831543, 0.0017764568328857422, 0.00193101167678833, 0.002085566520690918, 0.002240121364593506, 0.0023946762084960938, 0.0025492310523986816, 0.0027037858963012695, 0.0028583407402038574, 0.0030128955841064453, 0.003167450428009033, 0.003322005271911621, 0.003476560115814209, 0.003631114959716797, 0.0037856698036193848, 0.003940224647521973, 0.0040947794914245605, 0.0042493343353271484, 0.004403889179229736, 0.004558444023132324, 0.004712998867034912, 0.0048675537109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 11.0, 11.0, 15.0, 36.0, 57.0, 87.0, 137.0, 224.0, 339.0, 612.0, 945.0, 1485.0, 2461.0, 4082.0, 6315.0, 10539.0, 16916.0, 26703.0, 40596.0, 60094.0, 83482.0, 107337.0, 123756.0, 128587.0, 118232.0, 98046.0, 73392.0, 51555.0, 34181.0, 22071.0, 13922.0, 8645.0, 5290.0, 3233.0, 2011.0, 1208.0, 699.0, 495.0, 291.0, 166.0, 118.0, 61.0, 48.0, 27.0, 17.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-40.21875, -39.0458984375, -37.873046875, -36.7001953125, -35.52734375, -34.3544921875, -33.181640625, -32.0087890625, -30.8359375, -29.6630859375, -28.490234375, -27.3173828125, -26.14453125, -24.9716796875, -23.798828125, -22.6259765625, -21.453125, -20.2802734375, -19.107421875, -17.9345703125, -16.76171875, -15.5888671875, -14.416015625, -13.2431640625, -12.0703125, -10.8974609375, -9.724609375, -8.5517578125, -7.37890625, -6.2060546875, -5.033203125, -3.8603515625, -2.6875, -1.5146484375, -0.341796875, 0.8310546875, 2.00390625, 3.1767578125, 4.349609375, 5.5224609375, 6.6953125, 7.8681640625, 9.041015625, 10.2138671875, 11.38671875, 12.5595703125, 13.732421875, 14.9052734375, 16.078125, 17.2509765625, 18.423828125, 19.5966796875, 20.76953125, 21.9423828125, 23.115234375, 24.2880859375, 25.4609375, 26.6337890625, 27.806640625, 28.9794921875, 30.15234375, 31.3251953125, 32.498046875, 33.6708984375, 34.84375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 3.0, 12.0, 10.0, 11.0, 10.0, 16.0, 13.0, 20.0, 22.0, 35.0, 32.0, 38.0, 39.0, 35.0, 27.0, 42.0, 44.0, 43.0, 49.0, 52.0, 45.0, 32.0, 40.0, 36.0, 26.0, 29.0, 23.0, 35.0, 24.0, 23.0, 15.0, 16.0, 14.0, 19.0, 12.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1796875, -12.7508544921875, -12.322021484375, -11.8931884765625, -11.46435546875, -11.0355224609375, -10.606689453125, -10.1778564453125, -9.7490234375, -9.3201904296875, -8.891357421875, -8.4625244140625, -8.03369140625, -7.6048583984375, -7.176025390625, -6.7471923828125, -6.318359375, -5.8895263671875, -5.460693359375, -5.0318603515625, -4.60302734375, -4.1741943359375, -3.745361328125, -3.3165283203125, -2.8876953125, -2.4588623046875, -2.030029296875, -1.6011962890625, -1.17236328125, -0.7435302734375, -0.314697265625, 0.1141357421875, 0.54296875, 0.9718017578125, 1.400634765625, 1.8294677734375, 2.25830078125, 2.6871337890625, 3.115966796875, 3.5447998046875, 3.9736328125, 4.4024658203125, 4.831298828125, 5.2601318359375, 5.68896484375, 6.1177978515625, 6.546630859375, 6.9754638671875, 7.404296875, 7.8331298828125, 8.261962890625, 8.6907958984375, 9.11962890625, 9.5484619140625, 9.977294921875, 10.4061279296875, 10.8349609375, 11.2637939453125, 11.692626953125, 12.1214599609375, 12.55029296875, 12.9791259765625, 13.407958984375, 13.8367919921875, 14.265625]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 3.0, 6.0, 8.0, 9.0, 10.0, 20.0, 8.0, 20.0, 18.0, 20.0, 28.0, 39.0, 32.0, 41.0, 34.0, 52.0, 48.0, 33.0, 50.0, 50.0, 52.0, 32.0, 41.0, 43.0, 31.0, 25.0, 29.0, 35.0, 21.0, 23.0, 20.0, 22.0, 10.0, 13.0, 12.0, 9.0, 10.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.63424682617188, -102.45063018798828, -99.26700592041016, -96.08338928222656, -92.89977264404297, -89.71615600585938, -86.53253173828125, -83.34891510009766, -80.16529846191406, -76.98168182373047, -73.79805755615234, -70.61444091796875, -67.43082427978516, -64.24720764160156, -61.06358337402344, -57.879966735839844, -54.69634246826172, -51.51272201538086, -48.329105377197266, -45.145484924316406, -41.96186828613281, -38.77824783325195, -35.594627380371094, -32.4110107421875, -29.22739028930664, -26.043771743774414, -22.860153198242188, -19.676532745361328, -16.4929141998291, -13.309295654296875, -10.125675201416016, -6.942056655883789, -3.7584381103515625, -0.5748190879821777, 2.608799934387207, 5.79241943359375, 8.976037979125977, 12.159656524658203, 15.343276977539062, 18.52689552307129, 21.710514068603516, 24.894132614135742, 28.07775115966797, 31.261371612548828, 34.44499206542969, 37.62860870361328, 40.81222915649414, 43.995849609375, 47.179466247558594, 50.36308670043945, 53.54670333862305, 56.730323791503906, 59.9139404296875, 63.09756088256836, 66.28118133544922, 69.46479797363281, 72.64842224121094, 75.83203887939453, 79.01566314697266, 82.19927978515625, 85.38289642333984, 88.56651306152344, 91.75013732910156, 94.93375396728516, 98.11737060546875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 9.0, 4.0, 15.0, 8.0, 10.0, 5.0, 23.0, 17.0, 27.0, 34.0, 24.0, 28.0, 29.0, 37.0, 25.0, 33.0, 42.0, 42.0, 48.0, 39.0, 45.0, 47.0, 49.0, 34.0, 36.0, 25.0, 35.0, 33.0, 25.0, 28.0, 11.0, 22.0, 19.0, 20.0, 13.0, 8.0, 11.0, 6.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-103.10801696777344, -99.7562484741211, -96.40447998046875, -93.0527114868164, -89.70094299316406, -86.34918212890625, -82.9974136352539, -79.64564514160156, -76.29387664794922, -72.94210815429688, -69.59033966064453, -66.23857116699219, -62.88680648803711, -59.535037994384766, -56.18327331542969, -52.831504821777344, -49.479736328125, -46.127967834472656, -42.77619934082031, -39.424434661865234, -36.07266616821289, -32.72089767456055, -29.369131088256836, -26.017364501953125, -22.66559600830078, -19.313827514648438, -15.962060928344727, -12.6102933883667, -9.258525848388672, -5.906757354736328, -2.554990768432617, 0.7967758178710938, 4.148536682128906, 7.500304222106934, 10.852071762084961, 14.203839302062988, 17.555606842041016, 20.90737533569336, 24.25914192199707, 27.61090850830078, 30.962677001953125, 34.31444549560547, 37.66621398925781, 41.01797866821289, 44.369747161865234, 47.72151565551758, 51.073280334472656, 54.425048828125, 57.776817321777344, 61.12858581542969, 64.48035430908203, 67.83212280273438, 71.18388366699219, 74.53565979003906, 77.88742065429688, 81.23918914794922, 84.59095764160156, 87.9427261352539, 91.29449462890625, 94.6462631225586, 97.99803161621094, 101.34979248046875, 104.7015609741211, 108.05332946777344, 111.40509796142578]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 18.0, 16.0, 42.0, 55.0, 82.0, 124.0, 205.0, 284.0, 506.0, 839.0, 1201.0, 1915.0, 3001.0, 4740.0, 7415.0, 11432.0, 18164.0, 28515.0, 45302.0, 72567.0, 116309.0, 186892.0, 301315.0, 479835.0, 685372.0, 728753.0, 553730.0, 359369.0, 222573.0, 137114.0, 84601.0, 53004.0, 33094.0, 20608.0, 12945.0, 8387.0, 5061.0, 3299.0, 2095.0, 1281.0, 884.0, 483.0, 296.0, 198.0, 128.0, 74.0, 69.0, 31.0, 24.0, 12.0, 9.0, 5.0, 0.0, 2.0, 5.0], "bins": [-126.5, -122.7978515625, -119.095703125, -115.3935546875, -111.69140625, -107.9892578125, -104.287109375, -100.5849609375, -96.8828125, -93.1806640625, -89.478515625, -85.7763671875, -82.07421875, -78.3720703125, -74.669921875, -70.9677734375, -67.265625, -63.5634765625, -59.861328125, -56.1591796875, -52.45703125, -48.7548828125, -45.052734375, -41.3505859375, -37.6484375, -33.9462890625, -30.244140625, -26.5419921875, -22.83984375, -19.1376953125, -15.435546875, -11.7333984375, -8.03125, -4.3291015625, -0.626953125, 3.0751953125, 6.77734375, 10.4794921875, 14.181640625, 17.8837890625, 21.5859375, 25.2880859375, 28.990234375, 32.6923828125, 36.39453125, 40.0966796875, 43.798828125, 47.5009765625, 51.203125, 54.9052734375, 58.607421875, 62.3095703125, 66.01171875, 69.7138671875, 73.416015625, 77.1181640625, 80.8203125, 84.5224609375, 88.224609375, 91.9267578125, 95.62890625, 99.3310546875, 103.033203125, 106.7353515625, 110.4375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 7.0, 7.0, 7.0, 14.0, 7.0, 8.0, 19.0, 19.0, 25.0, 24.0, 23.0, 31.0, 31.0, 19.0, 40.0, 38.0, 27.0, 37.0, 37.0, 44.0, 49.0, 41.0, 43.0, 51.0, 40.0, 33.0, 29.0, 35.0, 31.0, 28.0, 22.0, 25.0, 11.0, 19.0, 12.0, 9.0, 9.0, 12.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.3154296875, -73.880859375, -71.4462890625, -69.01171875, -66.5771484375, -64.142578125, -61.7080078125, -59.2734375, -56.8388671875, -54.404296875, -51.9697265625, -49.53515625, -47.1005859375, -44.666015625, -42.2314453125, -39.796875, -37.3623046875, -34.927734375, -32.4931640625, -30.05859375, -27.6240234375, -25.189453125, -22.7548828125, -20.3203125, -17.8857421875, -15.451171875, -13.0166015625, -10.58203125, -8.1474609375, -5.712890625, -3.2783203125, -0.84375, 1.5908203125, 4.025390625, 6.4599609375, 8.89453125, 11.3291015625, 13.763671875, 16.1982421875, 18.6328125, 21.0673828125, 23.501953125, 25.9365234375, 28.37109375, 30.8056640625, 33.240234375, 35.6748046875, 38.109375, 40.5439453125, 42.978515625, 45.4130859375, 47.84765625, 50.2822265625, 52.716796875, 55.1513671875, 57.5859375, 60.0205078125, 62.455078125, 64.8896484375, 67.32421875, 69.7587890625, 72.193359375, 74.6279296875, 77.0625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 5.0, 15.0, 12.0, 17.0, 41.0, 61.0, 100.0, 147.0, 213.0, 379.0, 598.0, 894.0, 1312.0, 2177.0, 3169.0, 4970.0, 7807.0, 12269.0, 19277.0, 29765.0, 45658.0, 70772.0, 108606.0, 162912.0, 240745.0, 342966.0, 458233.0, 554155.0, 559100.0, 470688.0, 353240.0, 250162.0, 170511.0, 113501.0, 74304.0, 48075.0, 31156.0, 20133.0, 12762.0, 8481.0, 5268.0, 3437.0, 2309.0, 1345.0, 860.0, 566.0, 411.0, 267.0, 165.0, 95.0, 70.0, 40.0, 22.0, 15.0, 19.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-76.125, -73.75, -71.375, -69.0, -66.625, -64.25, -61.875, -59.5, -57.125, -54.75, -52.375, -50.0, -47.625, -45.25, -42.875, -40.5, -38.125, -35.75, -33.375, -31.0, -28.625, -26.25, -23.875, -21.5, -19.125, -16.75, -14.375, -12.0, -9.625, -7.25, -4.875, -2.5, -0.125, 2.25, 4.625, 7.0, 9.375, 11.75, 14.125, 16.5, 18.875, 21.25, 23.625, 26.0, 28.375, 30.75, 33.125, 35.5, 37.875, 40.25, 42.625, 45.0, 47.375, 49.75, 52.125, 54.5, 56.875, 59.25, 61.625, 64.0, 66.375, 68.75, 71.125, 73.5, 75.875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 6.0, 6.0, 10.0, 13.0, 14.0, 15.0, 35.0, 27.0, 33.0, 43.0, 40.0, 60.0, 69.0, 85.0, 95.0, 128.0, 157.0, 175.0, 186.0, 221.0, 214.0, 247.0, 260.0, 236.0, 214.0, 191.0, 155.0, 163.0, 166.0, 126.0, 115.0, 107.0, 81.0, 78.0, 64.0, 34.0, 37.0, 35.0, 33.0, 26.0, 17.0, 15.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.1875, -36.017578125, -34.84765625, -33.677734375, -32.5078125, -31.337890625, -30.16796875, -28.998046875, -27.828125, -26.658203125, -25.48828125, -24.318359375, -23.1484375, -21.978515625, -20.80859375, -19.638671875, -18.46875, -17.298828125, -16.12890625, -14.958984375, -13.7890625, -12.619140625, -11.44921875, -10.279296875, -9.109375, -7.939453125, -6.76953125, -5.599609375, -4.4296875, -3.259765625, -2.08984375, -0.919921875, 0.25, 1.419921875, 2.58984375, 3.759765625, 4.9296875, 6.099609375, 7.26953125, 8.439453125, 9.609375, 10.779296875, 11.94921875, 13.119140625, 14.2890625, 15.458984375, 16.62890625, 17.798828125, 18.96875, 20.138671875, 21.30859375, 22.478515625, 23.6484375, 24.818359375, 25.98828125, 27.158203125, 28.328125, 29.498046875, 30.66796875, 31.837890625, 33.0078125, 34.177734375, 35.34765625, 36.517578125, 37.6875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 6.0, 7.0, 3.0, 14.0, 9.0, 6.0, 11.0, 24.0, 23.0, 30.0, 33.0, 28.0, 34.0, 33.0, 48.0, 56.0, 55.0, 40.0, 48.0, 58.0, 49.0, 66.0, 46.0, 32.0, 40.0, 28.0, 23.0, 29.0, 28.0, 20.0, 29.0, 5.0, 10.0, 7.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-107.5115966796875, -104.39836883544922, -101.28514099121094, -98.17191314697266, -95.05868530273438, -91.9454574584961, -88.83222961425781, -85.718994140625, -82.60577392578125, -79.49254608154297, -76.37931823730469, -73.2660903930664, -70.15286254882812, -67.03963470458984, -63.9264030456543, -60.813175201416016, -57.69994354248047, -54.58671569824219, -51.473487854003906, -48.360260009765625, -45.247032165527344, -42.13380432128906, -39.020572662353516, -35.907344818115234, -32.79411697387695, -29.680889129638672, -26.56766128540039, -23.454431533813477, -20.341203689575195, -17.227975845336914, -14.11474609375, -11.001518249511719, -7.888282775878906, -4.775054454803467, -1.6618261337280273, 1.4514026641845703, 4.564630508422852, 7.677858352661133, 10.791088104248047, 13.904315948486328, 17.01754379272461, 20.13077163696289, 23.243999481201172, 26.357229232788086, 29.470457077026367, 32.58368682861328, 35.69691467285156, 38.810142517089844, 41.923370361328125, 45.036598205566406, 48.14982604980469, 51.26305389404297, 54.37628173828125, 57.48950958251953, 60.60274124145508, 63.71596908569336, 66.82919311523438, 69.94242095947266, 73.05564880371094, 76.16887664794922, 79.2821044921875, 82.39533233642578, 85.50856018066406, 88.62179565429688, 91.73502349853516]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 17.0, 9.0, 12.0, 18.0, 20.0, 15.0, 21.0, 28.0, 23.0, 29.0, 44.0, 26.0, 36.0, 27.0, 39.0, 38.0, 38.0, 41.0, 45.0, 52.0, 44.0, 35.0, 38.0, 36.0, 25.0, 36.0, 25.0, 23.0, 20.0, 10.0, 21.0, 19.0, 16.0, 12.0, 12.0, 6.0, 9.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.69476318359375, -85.98043060302734, -83.26609802246094, -80.55176544189453, -77.83743286132812, -75.12310028076172, -72.40876770019531, -69.69444274902344, -66.9801025390625, -64.2657699584961, -61.55143737792969, -58.83710479736328, -56.122772216796875, -53.40843963623047, -50.69411087036133, -47.97977828979492, -45.26544952392578, -42.551116943359375, -39.83678436279297, -37.12245178222656, -34.408119201660156, -31.693788528442383, -28.97945785522461, -26.265125274658203, -23.550792694091797, -20.83646011352539, -18.122127532958984, -15.407796859741211, -12.693464279174805, -9.979131698608398, -7.264801025390625, -4.550468444824219, -1.8361358642578125, 0.8781962394714355, 3.5925283432006836, 6.306859970092773, 9.02119255065918, 11.735525131225586, 14.44985580444336, 17.164188385009766, 19.878520965576172, 22.592853546142578, 25.307186126708984, 28.021516799926758, 30.735849380493164, 33.45018005371094, 36.164512634277344, 38.87884521484375, 41.593177795410156, 44.30751037597656, 47.02184295654297, 49.736175537109375, 52.45050811767578, 55.16484069824219, 57.87916946411133, 60.593502044677734, 63.30783462524414, 66.02216339111328, 68.73649597167969, 71.4508285522461, 74.1651611328125, 76.8794937133789, 79.59382629394531, 82.30815887451172, 85.02249145507812]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 8.0, 13.0, 10.0, 18.0, 24.0, 40.0, 75.0, 110.0, 162.0, 237.0, 319.0, 533.0, 775.0, 1206.0, 1866.0, 2795.0, 4185.0, 6224.0, 9631.0, 14216.0, 21871.0, 32120.0, 45296.0, 63159.0, 83099.0, 101993.0, 114397.0, 116141.0, 106513.0, 89964.0, 70189.0, 51239.0, 36426.0, 24771.0, 16721.0, 11045.0, 7268.0, 4724.0, 3102.0, 2070.0, 1365.0, 881.0, 558.0, 384.0, 272.0, 183.0, 137.0, 75.0, 50.0, 34.0, 20.0, 12.0, 12.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0], "bins": [-144.5, -140.0078125, -135.515625, -131.0234375, -126.53125, -122.0390625, -117.546875, -113.0546875, -108.5625, -104.0703125, -99.578125, -95.0859375, -90.59375, -86.1015625, -81.609375, -77.1171875, -72.625, -68.1328125, -63.640625, -59.1484375, -54.65625, -50.1640625, -45.671875, -41.1796875, -36.6875, -32.1953125, -27.703125, -23.2109375, -18.71875, -14.2265625, -9.734375, -5.2421875, -0.75, 3.7421875, 8.234375, 12.7265625, 17.21875, 21.7109375, 26.203125, 30.6953125, 35.1875, 39.6796875, 44.171875, 48.6640625, 53.15625, 57.6484375, 62.140625, 66.6328125, 71.125, 75.6171875, 80.109375, 84.6015625, 89.09375, 93.5859375, 98.078125, 102.5703125, 107.0625, 111.5546875, 116.046875, 120.5390625, 125.03125, 129.5234375, 134.015625, 138.5078125, 143.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 6.0, 7.0, 16.0, 16.0, 11.0, 21.0, 20.0, 24.0, 17.0, 27.0, 30.0, 30.0, 33.0, 38.0, 27.0, 30.0, 35.0, 53.0, 49.0, 49.0, 45.0, 40.0, 43.0, 37.0, 37.0, 26.0, 22.0, 27.0, 22.0, 19.0, 22.0, 18.0, 18.0, 15.0, 13.0, 11.0, 8.0, 12.0, 6.0, 2.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.875, -53.9306640625, -51.986328125, -50.0419921875, -48.09765625, -46.1533203125, -44.208984375, -42.2646484375, -40.3203125, -38.3759765625, -36.431640625, -34.4873046875, -32.54296875, -30.5986328125, -28.654296875, -26.7099609375, -24.765625, -22.8212890625, -20.876953125, -18.9326171875, -16.98828125, -15.0439453125, -13.099609375, -11.1552734375, -9.2109375, -7.2666015625, -5.322265625, -3.3779296875, -1.43359375, 0.5107421875, 2.455078125, 4.3994140625, 6.34375, 8.2880859375, 10.232421875, 12.1767578125, 14.12109375, 16.0654296875, 18.009765625, 19.9541015625, 21.8984375, 23.8427734375, 25.787109375, 27.7314453125, 29.67578125, 31.6201171875, 33.564453125, 35.5087890625, 37.453125, 39.3974609375, 41.341796875, 43.2861328125, 45.23046875, 47.1748046875, 49.119140625, 51.0634765625, 53.0078125, 54.9521484375, 56.896484375, 58.8408203125, 60.78515625, 62.7294921875, 64.673828125, 66.6181640625, 68.5625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 13.0, 14.0, 25.0, 25.0, 56.0, 78.0, 113.0, 154.0, 215.0, 333.0, 455.0, 683.0, 1003.0, 1581.0, 2488.0, 3983.0, 6339.0, 10862.0, 19018.0, 34540.0, 63644.0, 116296.0, 194703.0, 227364.0, 160084.0, 90650.0, 49290.0, 26208.0, 14921.0, 8748.0, 5227.0, 3234.0, 2094.0, 1320.0, 883.0, 603.0, 385.0, 276.0, 186.0, 130.0, 110.0, 57.0, 57.0, 23.0, 25.0, 16.0, 18.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-253.625, -246.005859375, -238.38671875, -230.767578125, -223.1484375, -215.529296875, -207.91015625, -200.291015625, -192.671875, -185.052734375, -177.43359375, -169.814453125, -162.1953125, -154.576171875, -146.95703125, -139.337890625, -131.71875, -124.099609375, -116.48046875, -108.861328125, -101.2421875, -93.623046875, -86.00390625, -78.384765625, -70.765625, -63.146484375, -55.52734375, -47.908203125, -40.2890625, -32.669921875, -25.05078125, -17.431640625, -9.8125, -2.193359375, 5.42578125, 13.044921875, 20.6640625, 28.283203125, 35.90234375, 43.521484375, 51.140625, 58.759765625, 66.37890625, 73.998046875, 81.6171875, 89.236328125, 96.85546875, 104.474609375, 112.09375, 119.712890625, 127.33203125, 134.951171875, 142.5703125, 150.189453125, 157.80859375, 165.427734375, 173.046875, 180.666015625, 188.28515625, 195.904296875, 203.5234375, 211.142578125, 218.76171875, 226.380859375, 234.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 10.0, 17.0, 11.0, 10.0, 17.0, 19.0, 25.0, 16.0, 32.0, 24.0, 33.0, 28.0, 24.0, 33.0, 37.0, 38.0, 42.0, 45.0, 41.0, 42.0, 39.0, 44.0, 38.0, 36.0, 34.0, 35.0, 33.0, 22.0, 19.0, 13.0, 13.0, 25.0, 15.0, 18.0, 13.0, 11.0, 7.0, 4.0, 6.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.375, -44.8154296875, -43.255859375, -41.6962890625, -40.13671875, -38.5771484375, -37.017578125, -35.4580078125, -33.8984375, -32.3388671875, -30.779296875, -29.2197265625, -27.66015625, -26.1005859375, -24.541015625, -22.9814453125, -21.421875, -19.8623046875, -18.302734375, -16.7431640625, -15.18359375, -13.6240234375, -12.064453125, -10.5048828125, -8.9453125, -7.3857421875, -5.826171875, -4.2666015625, -2.70703125, -1.1474609375, 0.412109375, 1.9716796875, 3.53125, 5.0908203125, 6.650390625, 8.2099609375, 9.76953125, 11.3291015625, 12.888671875, 14.4482421875, 16.0078125, 17.5673828125, 19.126953125, 20.6865234375, 22.24609375, 23.8056640625, 25.365234375, 26.9248046875, 28.484375, 30.0439453125, 31.603515625, 33.1630859375, 34.72265625, 36.2822265625, 37.841796875, 39.4013671875, 40.9609375, 42.5205078125, 44.080078125, 45.6396484375, 47.19921875, 48.7587890625, 50.318359375, 51.8779296875, 53.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 7.0, 11.0, 21.0, 31.0, 48.0, 66.0, 79.0, 110.0, 178.0, 247.0, 385.0, 568.0, 896.0, 1382.0, 2158.0, 3533.0, 5699.0, 10460.0, 21792.0, 58661.0, 205606.0, 466803.0, 174912.0, 50860.0, 19762.0, 9685.0, 5517.0, 3273.0, 2040.0, 1283.0, 846.0, 531.0, 340.0, 239.0, 151.0, 106.0, 80.0, 56.0, 36.0, 24.0, 23.0, 8.0, 7.0, 7.0, 4.0, 5.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-245.25, -237.44921875, -229.6484375, -221.84765625, -214.046875, -206.24609375, -198.4453125, -190.64453125, -182.84375, -175.04296875, -167.2421875, -159.44140625, -151.640625, -143.83984375, -136.0390625, -128.23828125, -120.4375, -112.63671875, -104.8359375, -97.03515625, -89.234375, -81.43359375, -73.6328125, -65.83203125, -58.03125, -50.23046875, -42.4296875, -34.62890625, -26.828125, -19.02734375, -11.2265625, -3.42578125, 4.375, 12.17578125, 19.9765625, 27.77734375, 35.578125, 43.37890625, 51.1796875, 58.98046875, 66.78125, 74.58203125, 82.3828125, 90.18359375, 97.984375, 105.78515625, 113.5859375, 121.38671875, 129.1875, 136.98828125, 144.7890625, 152.58984375, 160.390625, 168.19140625, 175.9921875, 183.79296875, 191.59375, 199.39453125, 207.1953125, 214.99609375, 222.796875, 230.59765625, 238.3984375, 246.19921875, 254.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 10.0, 15.0, 11.0, 24.0, 31.0, 34.0, 56.0, 60.0, 94.0, 99.0, 100.0, 103.0, 98.0, 57.0, 50.0, 36.0, 32.0, 13.0, 12.0, 10.0, 4.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0230712890625, -0.02243518829345703, -0.021799087524414062, -0.021162986755371094, -0.020526885986328125, -0.019890785217285156, -0.019254684448242188, -0.01861858367919922, -0.01798248291015625, -0.01734638214111328, -0.016710281372070312, -0.016074180603027344, -0.015438079833984375, -0.014801979064941406, -0.014165878295898438, -0.013529777526855469, -0.0128936767578125, -0.012257575988769531, -0.011621475219726562, -0.010985374450683594, -0.010349273681640625, -0.009713172912597656, -0.009077072143554688, -0.008440971374511719, -0.00780487060546875, -0.007168769836425781, -0.0065326690673828125, -0.005896568298339844, -0.005260467529296875, -0.004624366760253906, -0.0039882659912109375, -0.0033521652221679688, -0.002716064453125, -0.0020799636840820312, -0.0014438629150390625, -0.0008077621459960938, -0.000171661376953125, 0.00046443939208984375, 0.0011005401611328125, 0.0017366409301757812, 0.00237274169921875, 0.0030088424682617188, 0.0036449432373046875, 0.004281044006347656, 0.004917144775390625, 0.005553245544433594, 0.0061893463134765625, 0.006825447082519531, 0.0074615478515625, 0.008097648620605469, 0.008733749389648438, 0.009369850158691406, 0.010005950927734375, 0.010642051696777344, 0.011278152465820312, 0.011914253234863281, 0.01255035400390625, 0.013186454772949219, 0.013822555541992188, 0.014458656311035156, 0.015094757080078125, 0.015730857849121094, 0.016366958618164062, 0.01700305938720703, 0.01763916015625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 18.0, 16.0, 35.0, 36.0, 69.0, 95.0, 127.0, 184.0, 259.0, 387.0, 544.0, 768.0, 1225.0, 1772.0, 2759.0, 4394.0, 7298.0, 13809.0, 30660.0, 79612.0, 211850.0, 344514.0, 206924.0, 78026.0, 29707.0, 13659.0, 7199.0, 4261.0, 2768.0, 1750.0, 1282.0, 758.0, 531.0, 385.0, 266.0, 174.0, 135.0, 84.0, 59.0, 42.0, 39.0, 19.0, 15.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-147.75, -143.337890625, -138.92578125, -134.513671875, -130.1015625, -125.689453125, -121.27734375, -116.865234375, -112.453125, -108.041015625, -103.62890625, -99.216796875, -94.8046875, -90.392578125, -85.98046875, -81.568359375, -77.15625, -72.744140625, -68.33203125, -63.919921875, -59.5078125, -55.095703125, -50.68359375, -46.271484375, -41.859375, -37.447265625, -33.03515625, -28.623046875, -24.2109375, -19.798828125, -15.38671875, -10.974609375, -6.5625, -2.150390625, 2.26171875, 6.673828125, 11.0859375, 15.498046875, 19.91015625, 24.322265625, 28.734375, 33.146484375, 37.55859375, 41.970703125, 46.3828125, 50.794921875, 55.20703125, 59.619140625, 64.03125, 68.443359375, 72.85546875, 77.267578125, 81.6796875, 86.091796875, 90.50390625, 94.916015625, 99.328125, 103.740234375, 108.15234375, 112.564453125, 116.9765625, 121.388671875, 125.80078125, 130.212890625, 134.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 6.0, 13.0, 28.0, 38.0, 66.0, 84.0, 116.0, 128.0, 126.0, 106.0, 67.0, 66.0, 35.0, 28.0, 18.0, 9.0, 11.0, 5.0, 3.0, 1.0, 2.0, 8.0, 1.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.53125, -60.6923828125, -58.853515625, -57.0146484375, -55.17578125, -53.3369140625, -51.498046875, -49.6591796875, -47.8203125, -45.9814453125, -44.142578125, -42.3037109375, -40.46484375, -38.6259765625, -36.787109375, -34.9482421875, -33.109375, -31.2705078125, -29.431640625, -27.5927734375, -25.75390625, -23.9150390625, -22.076171875, -20.2373046875, -18.3984375, -16.5595703125, -14.720703125, -12.8818359375, -11.04296875, -9.2041015625, -7.365234375, -5.5263671875, -3.6875, -1.8486328125, -0.009765625, 1.8291015625, 3.66796875, 5.5068359375, 7.345703125, 9.1845703125, 11.0234375, 12.8623046875, 14.701171875, 16.5400390625, 18.37890625, 20.2177734375, 22.056640625, 23.8955078125, 25.734375, 27.5732421875, 29.412109375, 31.2509765625, 33.08984375, 34.9287109375, 36.767578125, 38.6064453125, 40.4453125, 42.2841796875, 44.123046875, 45.9619140625, 47.80078125, 49.6396484375, 51.478515625, 53.3173828125, 55.15625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 11.0, 13.0, 13.0, 15.0, 16.0, 20.0, 20.0, 31.0, 33.0, 27.0, 36.0, 57.0, 37.0, 51.0, 49.0, 46.0, 40.0, 50.0, 45.0, 55.0, 33.0, 43.0, 32.0, 30.0, 21.0, 26.0, 21.0, 20.0, 12.0, 14.0, 11.0, 5.0, 7.0, 14.0, 1.0, 3.0, 9.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.33639526367188, -70.1641845703125, -67.99197387695312, -65.81976318359375, -63.647552490234375, -61.475341796875, -59.30312728881836, -57.130916595458984, -54.95870590209961, -52.786495208740234, -50.61428451538086, -48.442073822021484, -46.269859313964844, -44.09764862060547, -41.925437927246094, -39.75322723388672, -37.581016540527344, -35.40880584716797, -33.236595153808594, -31.064382553100586, -28.89217185974121, -26.719961166381836, -24.547748565673828, -22.375537872314453, -20.203327178955078, -18.031116485595703, -15.858904838562012, -13.68669319152832, -11.514482498168945, -9.34227180480957, -7.170060157775879, -4.9978485107421875, -2.8256454467773438, -0.6534342765808105, 1.5187768936157227, 3.690988063812256, 5.863199234008789, 8.035409927368164, 10.207621574401855, 12.379833221435547, 14.552043914794922, 16.724254608154297, 18.896465301513672, 21.06867790222168, 23.240888595581055, 25.41309928894043, 27.585311889648438, 29.757522583007812, 31.929733276367188, 34.10194396972656, 36.27415466308594, 38.44636535644531, 40.61857604980469, 42.79078674316406, 44.9630012512207, 47.13521194458008, 49.30742263793945, 51.47963333129883, 53.6518440246582, 55.82405471801758, 57.99626922607422, 60.168479919433594, 62.34069061279297, 64.51290130615234, 66.68511199951172]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 6.0, 12.0, 13.0, 12.0, 14.0, 25.0, 20.0, 18.0, 24.0, 27.0, 31.0, 32.0, 27.0, 33.0, 42.0, 32.0, 41.0, 45.0, 48.0, 43.0, 40.0, 37.0, 33.0, 36.0, 26.0, 32.0, 34.0, 28.0, 19.0, 28.0, 21.0, 12.0, 16.0, 17.0, 22.0, 9.0, 8.0, 6.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-74.7188720703125, -72.49765014648438, -70.27642822265625, -68.05520629882812, -65.833984375, -63.612762451171875, -61.391536712646484, -59.17031478881836, -56.949092864990234, -54.72787094116211, -52.506649017333984, -50.28542709350586, -48.06420135498047, -45.842979431152344, -43.62175750732422, -41.400535583496094, -39.17931365966797, -36.958091735839844, -34.73686981201172, -32.515647888183594, -30.294424057006836, -28.07320213317871, -25.851978302001953, -23.630756378173828, -21.409534454345703, -19.188312530517578, -16.967090606689453, -14.745866775512695, -12.52464485168457, -10.303422927856445, -8.082200050354004, -5.8609771728515625, -3.6397552490234375, -1.4185328483581543, 0.8026895523071289, 3.023911952972412, 5.245134353637695, 7.46635627746582, 9.687579154968262, 11.908802032470703, 14.130023956298828, 16.351245880126953, 18.572467803955078, 20.793691635131836, 23.01491355895996, 25.236135482788086, 27.457359313964844, 29.67858123779297, 31.899803161621094, 34.12102508544922, 36.342247009277344, 38.56346893310547, 40.784690856933594, 43.00591278076172, 45.22713851928711, 47.448360443115234, 49.66958236694336, 51.890804290771484, 54.11202621459961, 56.333248138427734, 58.554473876953125, 60.77569580078125, 62.996917724609375, 65.2181396484375, 67.43936157226562]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 12.0, 24.0, 38.0, 56.0, 78.0, 118.0, 186.0, 297.0, 453.0, 709.0, 1081.0, 1822.0, 3001.0, 4544.0, 7477.0, 11655.0, 18677.0, 28747.0, 43543.0, 63891.0, 89948.0, 116111.0, 133377.0, 133466.0, 115317.0, 89295.0, 63516.0, 43298.0, 28446.0, 18325.0, 11753.0, 7213.0, 4430.0, 2819.0, 1817.0, 1094.0, 727.0, 438.0, 253.0, 161.0, 121.0, 80.0, 61.0, 24.0, 22.0, 14.0, 6.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-61.3125, -59.267578125, -57.22265625, -55.177734375, -53.1328125, -51.087890625, -49.04296875, -46.998046875, -44.953125, -42.908203125, -40.86328125, -38.818359375, -36.7734375, -34.728515625, -32.68359375, -30.638671875, -28.59375, -26.548828125, -24.50390625, -22.458984375, -20.4140625, -18.369140625, -16.32421875, -14.279296875, -12.234375, -10.189453125, -8.14453125, -6.099609375, -4.0546875, -2.009765625, 0.03515625, 2.080078125, 4.125, 6.169921875, 8.21484375, 10.259765625, 12.3046875, 14.349609375, 16.39453125, 18.439453125, 20.484375, 22.529296875, 24.57421875, 26.619140625, 28.6640625, 30.708984375, 32.75390625, 34.798828125, 36.84375, 38.888671875, 40.93359375, 42.978515625, 45.0234375, 47.068359375, 49.11328125, 51.158203125, 53.203125, 55.248046875, 57.29296875, 59.337890625, 61.3828125, 63.427734375, 65.47265625, 67.517578125, 69.5625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 6.0, 11.0, 6.0, 17.0, 15.0, 14.0, 22.0, 20.0, 18.0, 27.0, 30.0, 31.0, 31.0, 41.0, 48.0, 41.0, 44.0, 39.0, 43.0, 50.0, 42.0, 50.0, 36.0, 33.0, 39.0, 30.0, 26.0, 31.0, 24.0, 12.0, 18.0, 19.0, 15.0, 14.0, 14.0, 9.0, 9.0, 5.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.625, -70.4365234375, -68.248046875, -66.0595703125, -63.87109375, -61.6826171875, -59.494140625, -57.3056640625, -55.1171875, -52.9287109375, -50.740234375, -48.5517578125, -46.36328125, -44.1748046875, -41.986328125, -39.7978515625, -37.609375, -35.4208984375, -33.232421875, -31.0439453125, -28.85546875, -26.6669921875, -24.478515625, -22.2900390625, -20.1015625, -17.9130859375, -15.724609375, -13.5361328125, -11.34765625, -9.1591796875, -6.970703125, -4.7822265625, -2.59375, -0.4052734375, 1.783203125, 3.9716796875, 6.16015625, 8.3486328125, 10.537109375, 12.7255859375, 14.9140625, 17.1025390625, 19.291015625, 21.4794921875, 23.66796875, 25.8564453125, 28.044921875, 30.2333984375, 32.421875, 34.6103515625, 36.798828125, 38.9873046875, 41.17578125, 43.3642578125, 45.552734375, 47.7412109375, 49.9296875, 52.1181640625, 54.306640625, 56.4951171875, 58.68359375, 60.8720703125, 63.060546875, 65.2490234375, 67.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 11.0, 15.0, 20.0, 35.0, 37.0, 46.0, 96.0, 130.0, 186.0, 331.0, 433.0, 593.0, 969.0, 1316.0, 1964.0, 2848.0, 4191.0, 6259.0, 9320.0, 14155.0, 21104.0, 31531.0, 46057.0, 66168.0, 92208.0, 118402.0, 134560.0, 129536.0, 107743.0, 80742.0, 57574.0, 39456.0, 26401.0, 17748.0, 11854.0, 7807.0, 5331.0, 3657.0, 2418.0, 1649.0, 1176.0, 791.0, 508.0, 373.0, 267.0, 177.0, 128.0, 75.0, 49.0, 39.0, 28.0, 12.0, 6.0, 11.0, 3.0, 2.0, 2.0, 3.0], "bins": [-79.125, -76.7119140625, -74.298828125, -71.8857421875, -69.47265625, -67.0595703125, -64.646484375, -62.2333984375, -59.8203125, -57.4072265625, -54.994140625, -52.5810546875, -50.16796875, -47.7548828125, -45.341796875, -42.9287109375, -40.515625, -38.1025390625, -35.689453125, -33.2763671875, -30.86328125, -28.4501953125, -26.037109375, -23.6240234375, -21.2109375, -18.7978515625, -16.384765625, -13.9716796875, -11.55859375, -9.1455078125, -6.732421875, -4.3193359375, -1.90625, 0.5068359375, 2.919921875, 5.3330078125, 7.74609375, 10.1591796875, 12.572265625, 14.9853515625, 17.3984375, 19.8115234375, 22.224609375, 24.6376953125, 27.05078125, 29.4638671875, 31.876953125, 34.2900390625, 36.703125, 39.1162109375, 41.529296875, 43.9423828125, 46.35546875, 48.7685546875, 51.181640625, 53.5947265625, 56.0078125, 58.4208984375, 60.833984375, 63.2470703125, 65.66015625, 68.0732421875, 70.486328125, 72.8994140625, 75.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 11.0, 10.0, 12.0, 18.0, 15.0, 15.0, 22.0, 24.0, 28.0, 29.0, 39.0, 30.0, 36.0, 32.0, 35.0, 38.0, 39.0, 41.0, 28.0, 41.0, 40.0, 56.0, 32.0, 30.0, 31.0, 33.0, 29.0, 26.0, 21.0, 22.0, 17.0, 17.0, 18.0, 8.0, 9.0, 9.0, 10.0, 3.0, 2.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-57.59375, -55.91259765625, -54.2314453125, -52.55029296875, -50.869140625, -49.18798828125, -47.5068359375, -45.82568359375, -44.14453125, -42.46337890625, -40.7822265625, -39.10107421875, -37.419921875, -35.73876953125, -34.0576171875, -32.37646484375, -30.6953125, -29.01416015625, -27.3330078125, -25.65185546875, -23.970703125, -22.28955078125, -20.6083984375, -18.92724609375, -17.24609375, -15.56494140625, -13.8837890625, -12.20263671875, -10.521484375, -8.84033203125, -7.1591796875, -5.47802734375, -3.796875, -2.11572265625, -0.4345703125, 1.24658203125, 2.927734375, 4.60888671875, 6.2900390625, 7.97119140625, 9.65234375, 11.33349609375, 13.0146484375, 14.69580078125, 16.376953125, 18.05810546875, 19.7392578125, 21.42041015625, 23.1015625, 24.78271484375, 26.4638671875, 28.14501953125, 29.826171875, 31.50732421875, 33.1884765625, 34.86962890625, 36.55078125, 38.23193359375, 39.9130859375, 41.59423828125, 43.275390625, 44.95654296875, 46.6376953125, 48.31884765625, 50.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 9.0, 7.0, 15.0, 28.0, 32.0, 49.0, 52.0, 88.0, 148.0, 197.0, 287.0, 406.0, 529.0, 843.0, 1275.0, 1832.0, 2737.0, 3984.0, 6319.0, 9915.0, 16671.0, 28621.0, 51787.0, 97416.0, 172311.0, 229689.0, 183586.0, 105237.0, 55843.0, 30232.0, 17689.0, 10731.0, 6636.0, 4281.0, 2955.0, 1965.0, 1332.0, 851.0, 606.0, 413.0, 271.0, 200.0, 145.0, 100.0, 69.0, 52.0, 33.0, 26.0, 26.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.9375, -69.4189453125, -66.900390625, -64.3818359375, -61.86328125, -59.3447265625, -56.826171875, -54.3076171875, -51.7890625, -49.2705078125, -46.751953125, -44.2333984375, -41.71484375, -39.1962890625, -36.677734375, -34.1591796875, -31.640625, -29.1220703125, -26.603515625, -24.0849609375, -21.56640625, -19.0478515625, -16.529296875, -14.0107421875, -11.4921875, -8.9736328125, -6.455078125, -3.9365234375, -1.41796875, 1.1005859375, 3.619140625, 6.1376953125, 8.65625, 11.1748046875, 13.693359375, 16.2119140625, 18.73046875, 21.2490234375, 23.767578125, 26.2861328125, 28.8046875, 31.3232421875, 33.841796875, 36.3603515625, 38.87890625, 41.3974609375, 43.916015625, 46.4345703125, 48.953125, 51.4716796875, 53.990234375, 56.5087890625, 59.02734375, 61.5458984375, 64.064453125, 66.5830078125, 69.1015625, 71.6201171875, 74.138671875, 76.6572265625, 79.17578125, 81.6943359375, 84.212890625, 86.7314453125, 89.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 6.0, 8.0, 10.0, 5.0, 14.0, 22.0, 32.0, 48.0, 59.0, 87.0, 96.0, 126.0, 113.0, 93.0, 77.0, 58.0, 38.0, 34.0, 17.0, 11.0, 7.0, 12.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01236724853515625, -0.011964917182922363, -0.011562585830688477, -0.01116025447845459, -0.010757923126220703, -0.010355591773986816, -0.00995326042175293, -0.009550929069519043, -0.009148597717285156, -0.00874626636505127, -0.008343935012817383, -0.007941603660583496, -0.007539272308349609, -0.007136940956115723, -0.006734609603881836, -0.006332278251647949, -0.0059299468994140625, -0.005527615547180176, -0.005125284194946289, -0.004722952842712402, -0.004320621490478516, -0.003918290138244629, -0.003515958786010742, -0.0031136274337768555, -0.0027112960815429688, -0.002308964729309082, -0.0019066333770751953, -0.0015043020248413086, -0.0011019706726074219, -0.0006996393203735352, -0.00029730796813964844, 0.00010502338409423828, 0.000507354736328125, 0.0009096860885620117, 0.0013120174407958984, 0.0017143487930297852, 0.002116680145263672, 0.0025190114974975586, 0.0029213428497314453, 0.003323674201965332, 0.0037260055541992188, 0.0041283369064331055, 0.004530668258666992, 0.004932999610900879, 0.005335330963134766, 0.005737662315368652, 0.006139993667602539, 0.006542325019836426, 0.0069446563720703125, 0.007346987724304199, 0.007749319076538086, 0.008151650428771973, 0.00855398178100586, 0.008956313133239746, 0.009358644485473633, 0.00976097583770752, 0.010163307189941406, 0.010565638542175293, 0.01096796989440918, 0.011370301246643066, 0.011772632598876953, 0.01217496395111084, 0.012577295303344727, 0.012979626655578613, 0.0133819580078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 15.0, 8.0, 13.0, 19.0, 29.0, 40.0, 64.0, 83.0, 109.0, 187.0, 242.0, 371.0, 544.0, 843.0, 1214.0, 1889.0, 2840.0, 4486.0, 7143.0, 11606.0, 18710.0, 31895.0, 54584.0, 96629.0, 158445.0, 207203.0, 177132.0, 112300.0, 64831.0, 37063.0, 21812.0, 13054.0, 8234.0, 5100.0, 3349.0, 2167.0, 1425.0, 954.0, 659.0, 390.0, 260.0, 174.0, 137.0, 95.0, 73.0, 36.0, 31.0, 29.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-69.6875, -67.552734375, -65.41796875, -63.283203125, -61.1484375, -59.013671875, -56.87890625, -54.744140625, -52.609375, -50.474609375, -48.33984375, -46.205078125, -44.0703125, -41.935546875, -39.80078125, -37.666015625, -35.53125, -33.396484375, -31.26171875, -29.126953125, -26.9921875, -24.857421875, -22.72265625, -20.587890625, -18.453125, -16.318359375, -14.18359375, -12.048828125, -9.9140625, -7.779296875, -5.64453125, -3.509765625, -1.375, 0.759765625, 2.89453125, 5.029296875, 7.1640625, 9.298828125, 11.43359375, 13.568359375, 15.703125, 17.837890625, 19.97265625, 22.107421875, 24.2421875, 26.376953125, 28.51171875, 30.646484375, 32.78125, 34.916015625, 37.05078125, 39.185546875, 41.3203125, 43.455078125, 45.58984375, 47.724609375, 49.859375, 51.994140625, 54.12890625, 56.263671875, 58.3984375, 60.533203125, 62.66796875, 64.802734375, 66.9375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 6.0, 4.0, 16.0, 12.0, 10.0, 19.0, 16.0, 22.0, 24.0, 24.0, 38.0, 43.0, 49.0, 54.0, 63.0, 68.0, 64.0, 58.0, 59.0, 52.0, 45.0, 43.0, 48.0, 25.0, 26.0, 19.0, 25.0, 11.0, 11.0, 9.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.947998046875, -22.14599609375, -21.343994140625, -20.5419921875, -19.739990234375, -18.93798828125, -18.135986328125, -17.333984375, -16.531982421875, -15.72998046875, -14.927978515625, -14.1259765625, -13.323974609375, -12.52197265625, -11.719970703125, -10.91796875, -10.115966796875, -9.31396484375, -8.511962890625, -7.7099609375, -6.907958984375, -6.10595703125, -5.303955078125, -4.501953125, -3.699951171875, -2.89794921875, -2.095947265625, -1.2939453125, -0.491943359375, 0.31005859375, 1.112060546875, 1.9140625, 2.716064453125, 3.51806640625, 4.320068359375, 5.1220703125, 5.924072265625, 6.72607421875, 7.528076171875, 8.330078125, 9.132080078125, 9.93408203125, 10.736083984375, 11.5380859375, 12.340087890625, 13.14208984375, 13.944091796875, 14.74609375, 15.548095703125, 16.35009765625, 17.152099609375, 17.9541015625, 18.756103515625, 19.55810546875, 20.360107421875, 21.162109375, 21.964111328125, 22.76611328125, 23.568115234375, 24.3701171875, 25.172119140625, 25.97412109375, 26.776123046875, 27.578125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 7.0, 9.0, 11.0, 14.0, 14.0, 24.0, 23.0, 28.0, 24.0, 29.0, 28.0, 39.0, 37.0, 46.0, 41.0, 44.0, 45.0, 53.0, 50.0, 42.0, 40.0, 34.0, 36.0, 28.0, 33.0, 26.0, 30.0, 23.0, 28.0, 23.0, 15.0, 17.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.84236907958984, -68.74482727050781, -66.64729309082031, -64.54975128173828, -62.452213287353516, -60.35467529296875, -58.25713348388672, -56.15959548950195, -54.06205749511719, -51.96451950073242, -49.86697769165039, -47.769439697265625, -45.67190170288086, -43.574363708496094, -41.47682189941406, -39.3792839050293, -37.281742095947266, -35.1842041015625, -33.08666229248047, -30.989124298095703, -28.891586303710938, -26.79404640197754, -24.69650650024414, -22.598968505859375, -20.501428604125977, -18.403888702392578, -16.306350708007812, -14.208810806274414, -12.111271858215332, -10.01373291015625, -7.916193008422852, -5.8186540603637695, -3.7211151123046875, -1.6235759258270264, 0.47396326065063477, 2.571502685546875, 4.669041633605957, 6.766580581665039, 8.864120483398438, 10.96165943145752, 13.059198379516602, 15.156737327575684, 17.254276275634766, 19.351816177368164, 21.449356079101562, 23.546894073486328, 25.644433975219727, 27.741973876953125, 29.83951187133789, 31.93705177307129, 34.03459167480469, 36.13212966918945, 38.22966766357422, 40.32720947265625, 42.424747467041016, 44.52228546142578, 46.61982727050781, 48.71736526489258, 50.81490707397461, 52.912445068359375, 55.00998306274414, 57.107521057128906, 59.20506286621094, 61.3026008605957, 63.40013885498047]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 0.0, 3.0, 4.0, 8.0, 10.0, 14.0, 11.0, 15.0, 17.0, 18.0, 25.0, 31.0, 36.0, 21.0, 32.0, 36.0, 35.0, 38.0, 48.0, 35.0, 35.0, 48.0, 50.0, 40.0, 31.0, 41.0, 31.0, 35.0, 32.0, 24.0, 21.0, 37.0, 16.0, 22.0, 14.0, 15.0, 8.0, 13.0, 12.0, 6.0, 11.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-82.25519561767578, -79.89909362792969, -77.5429916381836, -75.1868896484375, -72.83078002929688, -70.47467803955078, -68.11857604980469, -65.7624740600586, -63.4063720703125, -61.050270080566406, -58.69416427612305, -56.33806228637695, -53.98196029663086, -51.6258544921875, -49.269752502441406, -46.91365051269531, -44.55754470825195, -42.20144271850586, -39.8453369140625, -37.489234924316406, -35.13313293457031, -32.77703094482422, -30.42092514038086, -28.064823150634766, -25.70871925354004, -23.352615356445312, -20.99651336669922, -18.640409469604492, -16.284305572509766, -13.928203582763672, -11.572099685668945, -9.215997695922852, -6.859893798828125, -4.503790855407715, -2.1476874351501465, 0.20841598510742188, 2.564518928527832, 4.920621871948242, 7.276725769042969, 9.632827758789062, 11.988931655883789, 14.3450345993042, 16.70113754272461, 19.057241439819336, 21.413345336914062, 23.769447326660156, 26.125551223754883, 28.481653213500977, 30.837757110595703, 33.1938591003418, 35.549964904785156, 37.90606689453125, 40.262168884277344, 42.61827087402344, 44.9743766784668, 47.33047866821289, 49.68658447265625, 52.042686462402344, 54.3987922668457, 56.7548942565918, 59.11099624633789, 61.46710205078125, 63.823204040527344, 66.17930603027344, 68.53540802001953]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 8.0, 9.0, 15.0, 28.0, 34.0, 55.0, 94.0, 144.0, 299.0, 537.0, 910.0, 1701.0, 3022.0, 5942.0, 11319.0, 22160.0, 44759.0, 92201.0, 196775.0, 425776.0, 817788.0, 1052723.0, 774938.0, 392618.0, 181550.0, 85167.0, 41000.0, 20661.0, 10382.0, 5406.0, 2776.0, 1512.0, 829.0, 459.0, 295.0, 143.0, 94.0, 50.0, 40.0, 26.0, 13.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.6875, -84.1708984375, -81.654296875, -79.1376953125, -76.62109375, -74.1044921875, -71.587890625, -69.0712890625, -66.5546875, -64.0380859375, -61.521484375, -59.0048828125, -56.48828125, -53.9716796875, -51.455078125, -48.9384765625, -46.421875, -43.9052734375, -41.388671875, -38.8720703125, -36.35546875, -33.8388671875, -31.322265625, -28.8056640625, -26.2890625, -23.7724609375, -21.255859375, -18.7392578125, -16.22265625, -13.7060546875, -11.189453125, -8.6728515625, -6.15625, -3.6396484375, -1.123046875, 1.3935546875, 3.91015625, 6.4267578125, 8.943359375, 11.4599609375, 13.9765625, 16.4931640625, 19.009765625, 21.5263671875, 24.04296875, 26.5595703125, 29.076171875, 31.5927734375, 34.109375, 36.6259765625, 39.142578125, 41.6591796875, 44.17578125, 46.6923828125, 49.208984375, 51.7255859375, 54.2421875, 56.7587890625, 59.275390625, 61.7919921875, 64.30859375, 66.8251953125, 69.341796875, 71.8583984375, 74.375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 16.0, 18.0, 21.0, 21.0, 22.0, 20.0, 28.0, 30.0, 35.0, 46.0, 47.0, 39.0, 32.0, 27.0, 47.0, 49.0, 47.0, 30.0, 39.0, 48.0, 35.0, 24.0, 28.0, 35.0, 26.0, 23.0, 25.0, 18.0, 21.0, 10.0, 11.0, 13.0, 10.0, 9.0, 8.0, 3.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.0625, -63.27490234375, -61.4873046875, -59.69970703125, -57.912109375, -56.12451171875, -54.3369140625, -52.54931640625, -50.76171875, -48.97412109375, -47.1865234375, -45.39892578125, -43.611328125, -41.82373046875, -40.0361328125, -38.24853515625, -36.4609375, -34.67333984375, -32.8857421875, -31.09814453125, -29.310546875, -27.52294921875, -25.7353515625, -23.94775390625, -22.16015625, -20.37255859375, -18.5849609375, -16.79736328125, -15.009765625, -13.22216796875, -11.4345703125, -9.64697265625, -7.859375, -6.07177734375, -4.2841796875, -2.49658203125, -0.708984375, 1.07861328125, 2.8662109375, 4.65380859375, 6.44140625, 8.22900390625, 10.0166015625, 11.80419921875, 13.591796875, 15.37939453125, 17.1669921875, 18.95458984375, 20.7421875, 22.52978515625, 24.3173828125, 26.10498046875, 27.892578125, 29.68017578125, 31.4677734375, 33.25537109375, 35.04296875, 36.83056640625, 38.6181640625, 40.40576171875, 42.193359375, 43.98095703125, 45.7685546875, 47.55615234375, 49.34375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 11.0, 14.0, 22.0, 45.0, 57.0, 128.0, 212.0, 392.0, 697.0, 1231.0, 2222.0, 4284.0, 7743.0, 14628.0, 27537.0, 52178.0, 98188.0, 182586.0, 330433.0, 552318.0, 778712.0, 792791.0, 579803.0, 350044.0, 195364.0, 104400.0, 55414.0, 29086.0, 15386.0, 8341.0, 4481.0, 2457.0, 1365.0, 729.0, 424.0, 230.0, 141.0, 85.0, 40.0, 22.0, 11.0, 11.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-75.5625, -73.40673828125, -71.2509765625, -69.09521484375, -66.939453125, -64.78369140625, -62.6279296875, -60.47216796875, -58.31640625, -56.16064453125, -54.0048828125, -51.84912109375, -49.693359375, -47.53759765625, -45.3818359375, -43.22607421875, -41.0703125, -38.91455078125, -36.7587890625, -34.60302734375, -32.447265625, -30.29150390625, -28.1357421875, -25.97998046875, -23.82421875, -21.66845703125, -19.5126953125, -17.35693359375, -15.201171875, -13.04541015625, -10.8896484375, -8.73388671875, -6.578125, -4.42236328125, -2.2666015625, -0.11083984375, 2.044921875, 4.20068359375, 6.3564453125, 8.51220703125, 10.66796875, 12.82373046875, 14.9794921875, 17.13525390625, 19.291015625, 21.44677734375, 23.6025390625, 25.75830078125, 27.9140625, 30.06982421875, 32.2255859375, 34.38134765625, 36.537109375, 38.69287109375, 40.8486328125, 43.00439453125, 45.16015625, 47.31591796875, 49.4716796875, 51.62744140625, 53.783203125, 55.93896484375, 58.0947265625, 60.25048828125, 62.40625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 9.0, 31.0, 28.0, 30.0, 38.0, 50.0, 52.0, 68.0, 92.0, 111.0, 142.0, 154.0, 169.0, 194.0, 199.0, 239.0, 284.0, 257.0, 274.0, 237.0, 208.0, 193.0, 176.0, 174.0, 127.0, 123.0, 70.0, 70.0, 52.0, 48.0, 34.0, 29.0, 20.0, 13.0, 13.0, 11.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.140625, -27.32080078125, -26.5009765625, -25.68115234375, -24.861328125, -24.04150390625, -23.2216796875, -22.40185546875, -21.58203125, -20.76220703125, -19.9423828125, -19.12255859375, -18.302734375, -17.48291015625, -16.6630859375, -15.84326171875, -15.0234375, -14.20361328125, -13.3837890625, -12.56396484375, -11.744140625, -10.92431640625, -10.1044921875, -9.28466796875, -8.46484375, -7.64501953125, -6.8251953125, -6.00537109375, -5.185546875, -4.36572265625, -3.5458984375, -2.72607421875, -1.90625, -1.08642578125, -0.2666015625, 0.55322265625, 1.373046875, 2.19287109375, 3.0126953125, 3.83251953125, 4.65234375, 5.47216796875, 6.2919921875, 7.11181640625, 7.931640625, 8.75146484375, 9.5712890625, 10.39111328125, 11.2109375, 12.03076171875, 12.8505859375, 13.67041015625, 14.490234375, 15.31005859375, 16.1298828125, 16.94970703125, 17.76953125, 18.58935546875, 19.4091796875, 20.22900390625, 21.048828125, 21.86865234375, 22.6884765625, 23.50830078125, 24.328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 9.0, 10.0, 11.0, 12.0, 18.0, 19.0, 26.0, 36.0, 31.0, 28.0, 37.0, 43.0, 35.0, 45.0, 48.0, 57.0, 49.0, 60.0, 43.0, 49.0, 45.0, 45.0, 36.0, 40.0, 32.0, 19.0, 28.0, 17.0, 12.0, 10.0, 13.0, 3.0, 13.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.50790023803711, -59.4245719909668, -57.341243743896484, -55.257911682128906, -53.174583435058594, -51.09125518798828, -49.00792694091797, -46.924598693847656, -44.841270446777344, -42.75794219970703, -40.67461395263672, -38.591285705566406, -36.50795364379883, -34.424625396728516, -32.3412971496582, -30.25796890258789, -28.174636840820312, -26.09130859375, -24.007978439331055, -21.924650192260742, -19.841320037841797, -17.757991790771484, -15.674663543701172, -13.591334342956543, -11.508005142211914, -9.424675941467285, -7.3413472175598145, -5.258018493652344, -3.174689292907715, -1.091360092163086, 0.9919681549072266, 3.0752973556518555, 5.158622741699219, 7.241951942443848, 9.325281143188477, 11.408609390258789, 13.491938591003418, 15.575267791748047, 17.65859603881836, 19.741924285888672, 21.825254440307617, 23.90858268737793, 25.991912841796875, 28.075241088867188, 30.1585693359375, 32.24189758300781, 34.325225830078125, 36.4085578918457, 38.491886138916016, 40.57521438598633, 42.65854263305664, 44.74187469482422, 46.82520294189453, 48.908531188964844, 50.991859436035156, 53.07518768310547, 55.15851593017578, 57.241844177246094, 59.325172424316406, 61.40850067138672, 63.4918327331543, 65.57516479492188, 67.65849304199219, 69.7418212890625, 71.82514953613281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 5.0, 7.0, 5.0, 7.0, 16.0, 11.0, 8.0, 15.0, 26.0, 29.0, 28.0, 24.0, 38.0, 38.0, 36.0, 34.0, 41.0, 38.0, 38.0, 35.0, 36.0, 41.0, 40.0, 29.0, 33.0, 39.0, 31.0, 37.0, 23.0, 38.0, 22.0, 13.0, 19.0, 19.0, 14.0, 6.0, 14.0, 12.0, 9.0, 6.0, 3.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-71.58344268798828, -69.53543853759766, -67.48743438720703, -65.43943786621094, -63.39143371582031, -61.34342956542969, -59.29542541503906, -57.24742126464844, -55.19942092895508, -53.15141677856445, -51.103416442871094, -49.05541229248047, -47.007408142089844, -44.959407806396484, -42.91140365600586, -40.8634033203125, -38.815399169921875, -36.76739501953125, -34.71939468383789, -32.671390533447266, -30.623388290405273, -28.57538604736328, -26.527381896972656, -24.479379653930664, -22.431377410888672, -20.38337516784668, -18.335372924804688, -16.287368774414062, -14.23936653137207, -12.191364288330078, -10.14336109161377, -8.095357894897461, -6.047351837158203, -3.9993491172790527, -1.9513463973999023, 0.09665632247924805, 2.1446590423583984, 4.192661285400391, 6.240664482116699, 8.288667678833008, 10.336669921875, 12.384672164916992, 14.4326753616333, 16.48067855834961, 18.5286808013916, 20.576683044433594, 22.62468719482422, 24.67268943786621, 26.720691680908203, 28.768693923950195, 30.816696166992188, 32.86470031738281, 34.91270446777344, 36.9607048034668, 39.00870895385742, 41.05670928955078, 43.104713439941406, 45.15271759033203, 47.20071792602539, 49.248722076416016, 51.296722412109375, 53.3447265625, 55.392730712890625, 57.44073486328125, 59.48873519897461]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 6.0, 14.0, 10.0, 18.0, 25.0, 35.0, 52.0, 75.0, 109.0, 149.0, 202.0, 326.0, 461.0, 686.0, 1141.0, 1852.0, 2952.0, 4841.0, 8641.0, 14481.0, 25283.0, 45857.0, 81637.0, 143225.0, 212320.0, 203014.0, 130139.0, 73959.0, 41175.0, 23126.0, 13162.0, 7566.0, 4505.0, 2699.0, 1664.0, 990.0, 693.0, 486.0, 307.0, 212.0, 143.0, 105.0, 56.0, 41.0, 43.0, 11.0, 16.0, 8.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-212.375, -205.921875, -199.46875, -193.015625, -186.5625, -180.109375, -173.65625, -167.203125, -160.75, -154.296875, -147.84375, -141.390625, -134.9375, -128.484375, -122.03125, -115.578125, -109.125, -102.671875, -96.21875, -89.765625, -83.3125, -76.859375, -70.40625, -63.953125, -57.5, -51.046875, -44.59375, -38.140625, -31.6875, -25.234375, -18.78125, -12.328125, -5.875, 0.578125, 7.03125, 13.484375, 19.9375, 26.390625, 32.84375, 39.296875, 45.75, 52.203125, 58.65625, 65.109375, 71.5625, 78.015625, 84.46875, 90.921875, 97.375, 103.828125, 110.28125, 116.734375, 123.1875, 129.640625, 136.09375, 142.546875, 149.0, 155.453125, 161.90625, 168.359375, 174.8125, 181.265625, 187.71875, 194.171875, 200.625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 14.0, 14.0, 26.0, 23.0, 23.0, 27.0, 34.0, 44.0, 37.0, 35.0, 41.0, 37.0, 27.0, 46.0, 44.0, 33.0, 39.0, 42.0, 37.0, 29.0, 32.0, 21.0, 35.0, 30.0, 22.0, 21.0, 13.0, 22.0, 17.0, 10.0, 12.0, 6.0, 6.0, 8.0, 6.0, 8.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.28125, -57.58837890625, -55.8955078125, -54.20263671875, -52.509765625, -50.81689453125, -49.1240234375, -47.43115234375, -45.73828125, -44.04541015625, -42.3525390625, -40.65966796875, -38.966796875, -37.27392578125, -35.5810546875, -33.88818359375, -32.1953125, -30.50244140625, -28.8095703125, -27.11669921875, -25.423828125, -23.73095703125, -22.0380859375, -20.34521484375, -18.65234375, -16.95947265625, -15.2666015625, -13.57373046875, -11.880859375, -10.18798828125, -8.4951171875, -6.80224609375, -5.109375, -3.41650390625, -1.7236328125, -0.03076171875, 1.662109375, 3.35498046875, 5.0478515625, 6.74072265625, 8.43359375, 10.12646484375, 11.8193359375, 13.51220703125, 15.205078125, 16.89794921875, 18.5908203125, 20.28369140625, 21.9765625, 23.66943359375, 25.3623046875, 27.05517578125, 28.748046875, 30.44091796875, 32.1337890625, 33.82666015625, 35.51953125, 37.21240234375, 38.9052734375, 40.59814453125, 42.291015625, 43.98388671875, 45.6767578125, 47.36962890625, 49.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 6.0, 1.0, 11.0, 12.0, 18.0, 22.0, 38.0, 53.0, 91.0, 123.0, 159.0, 266.0, 379.0, 608.0, 980.0, 1598.0, 2556.0, 4200.0, 7067.0, 12334.0, 22326.0, 41958.0, 82661.0, 170457.0, 279383.0, 206331.0, 101843.0, 50639.0, 26649.0, 14676.0, 8306.0, 4893.0, 2781.0, 1814.0, 1109.0, 764.0, 479.0, 295.0, 213.0, 138.0, 100.0, 70.0, 38.0, 36.0, 27.0, 11.0, 15.0, 12.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-225.125, -218.43359375, -211.7421875, -205.05078125, -198.359375, -191.66796875, -184.9765625, -178.28515625, -171.59375, -164.90234375, -158.2109375, -151.51953125, -144.828125, -138.13671875, -131.4453125, -124.75390625, -118.0625, -111.37109375, -104.6796875, -97.98828125, -91.296875, -84.60546875, -77.9140625, -71.22265625, -64.53125, -57.83984375, -51.1484375, -44.45703125, -37.765625, -31.07421875, -24.3828125, -17.69140625, -11.0, -4.30859375, 2.3828125, 9.07421875, 15.765625, 22.45703125, 29.1484375, 35.83984375, 42.53125, 49.22265625, 55.9140625, 62.60546875, 69.296875, 75.98828125, 82.6796875, 89.37109375, 96.0625, 102.75390625, 109.4453125, 116.13671875, 122.828125, 129.51953125, 136.2109375, 142.90234375, 149.59375, 156.28515625, 162.9765625, 169.66796875, 176.359375, 183.05078125, 189.7421875, 196.43359375, 203.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 9.0, 12.0, 13.0, 12.0, 21.0, 17.0, 32.0, 24.0, 27.0, 41.0, 38.0, 47.0, 39.0, 39.0, 48.0, 43.0, 46.0, 52.0, 46.0, 46.0, 35.0, 51.0, 44.0, 32.0, 27.0, 20.0, 20.0, 22.0, 17.0, 10.0, 11.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.75, -61.7626953125, -59.775390625, -57.7880859375, -55.80078125, -53.8134765625, -51.826171875, -49.8388671875, -47.8515625, -45.8642578125, -43.876953125, -41.8896484375, -39.90234375, -37.9150390625, -35.927734375, -33.9404296875, -31.953125, -29.9658203125, -27.978515625, -25.9912109375, -24.00390625, -22.0166015625, -20.029296875, -18.0419921875, -16.0546875, -14.0673828125, -12.080078125, -10.0927734375, -8.10546875, -6.1181640625, -4.130859375, -2.1435546875, -0.15625, 1.8310546875, 3.818359375, 5.8056640625, 7.79296875, 9.7802734375, 11.767578125, 13.7548828125, 15.7421875, 17.7294921875, 19.716796875, 21.7041015625, 23.69140625, 25.6787109375, 27.666015625, 29.6533203125, 31.640625, 33.6279296875, 35.615234375, 37.6025390625, 39.58984375, 41.5771484375, 43.564453125, 45.5517578125, 47.5390625, 49.5263671875, 51.513671875, 53.5009765625, 55.48828125, 57.4755859375, 59.462890625, 61.4501953125, 63.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 8.0, 9.0, 12.0, 16.0, 27.0, 35.0, 44.0, 66.0, 85.0, 121.0, 173.0, 290.0, 415.0, 585.0, 963.0, 1503.0, 2504.0, 4149.0, 7397.0, 14005.0, 27936.0, 60832.0, 150946.0, 348750.0, 247563.0, 95088.0, 40846.0, 19754.0, 10286.0, 5613.0, 3126.0, 1888.0, 1164.0, 739.0, 501.0, 331.0, 236.0, 136.0, 124.0, 79.0, 57.0, 41.0, 29.0, 29.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0], "bins": [-150.25, -145.9267578125, -141.603515625, -137.2802734375, -132.95703125, -128.6337890625, -124.310546875, -119.9873046875, -115.6640625, -111.3408203125, -107.017578125, -102.6943359375, -98.37109375, -94.0478515625, -89.724609375, -85.4013671875, -81.078125, -76.7548828125, -72.431640625, -68.1083984375, -63.78515625, -59.4619140625, -55.138671875, -50.8154296875, -46.4921875, -42.1689453125, -37.845703125, -33.5224609375, -29.19921875, -24.8759765625, -20.552734375, -16.2294921875, -11.90625, -7.5830078125, -3.259765625, 1.0634765625, 5.38671875, 9.7099609375, 14.033203125, 18.3564453125, 22.6796875, 27.0029296875, 31.326171875, 35.6494140625, 39.97265625, 44.2958984375, 48.619140625, 52.9423828125, 57.265625, 61.5888671875, 65.912109375, 70.2353515625, 74.55859375, 78.8818359375, 83.205078125, 87.5283203125, 91.8515625, 96.1748046875, 100.498046875, 104.8212890625, 109.14453125, 113.4677734375, 117.791015625, 122.1142578125, 126.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 2.0, 7.0, 7.0, 8.0, 16.0, 22.0, 16.0, 31.0, 51.0, 59.0, 87.0, 127.0, 120.0, 121.0, 83.0, 64.0, 43.0, 28.0, 12.0, 22.0, 15.0, 6.0, 8.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01058197021484375, -0.010209918022155762, -0.009837865829467773, -0.009465813636779785, -0.009093761444091797, -0.008721709251403809, -0.00834965705871582, -0.007977604866027832, -0.007605552673339844, -0.0072335004806518555, -0.006861448287963867, -0.006489396095275879, -0.006117343902587891, -0.005745291709899902, -0.005373239517211914, -0.005001187324523926, -0.0046291351318359375, -0.004257082939147949, -0.003885030746459961, -0.0035129785537719727, -0.0031409263610839844, -0.002768874168395996, -0.002396821975708008, -0.0020247697830200195, -0.0016527175903320312, -0.001280665397644043, -0.0009086132049560547, -0.0005365610122680664, -0.00016450881958007812, 0.00020754337310791016, 0.0005795955657958984, 0.0009516477584838867, 0.001323699951171875, 0.0016957521438598633, 0.0020678043365478516, 0.00243985652923584, 0.002811908721923828, 0.0031839609146118164, 0.0035560131072998047, 0.003928065299987793, 0.004300117492675781, 0.0046721696853637695, 0.005044221878051758, 0.005416274070739746, 0.005788326263427734, 0.006160378456115723, 0.006532430648803711, 0.006904482841491699, 0.0072765350341796875, 0.007648587226867676, 0.008020639419555664, 0.008392691612243652, 0.00876474380493164, 0.009136795997619629, 0.009508848190307617, 0.009880900382995605, 0.010252952575683594, 0.010625004768371582, 0.01099705696105957, 0.011369109153747559, 0.011741161346435547, 0.012113213539123535, 0.012485265731811523, 0.012857317924499512, 0.0132293701171875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 1.0, 10.0, 11.0, 13.0, 20.0, 29.0, 51.0, 56.0, 91.0, 114.0, 167.0, 241.0, 323.0, 499.0, 663.0, 926.0, 1420.0, 2112.0, 3354.0, 5621.0, 10124.0, 19827.0, 41169.0, 93400.0, 210790.0, 302237.0, 191986.0, 84172.0, 37122.0, 18013.0, 9376.0, 5170.0, 3052.0, 2000.0, 1354.0, 858.0, 626.0, 401.0, 326.0, 235.0, 166.0, 129.0, 75.0, 78.0, 46.0, 33.0, 29.0, 14.0, 14.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-115.375, -112.0244140625, -108.673828125, -105.3232421875, -101.97265625, -98.6220703125, -95.271484375, -91.9208984375, -88.5703125, -85.2197265625, -81.869140625, -78.5185546875, -75.16796875, -71.8173828125, -68.466796875, -65.1162109375, -61.765625, -58.4150390625, -55.064453125, -51.7138671875, -48.36328125, -45.0126953125, -41.662109375, -38.3115234375, -34.9609375, -31.6103515625, -28.259765625, -24.9091796875, -21.55859375, -18.2080078125, -14.857421875, -11.5068359375, -8.15625, -4.8056640625, -1.455078125, 1.8955078125, 5.24609375, 8.5966796875, 11.947265625, 15.2978515625, 18.6484375, 21.9990234375, 25.349609375, 28.7001953125, 32.05078125, 35.4013671875, 38.751953125, 42.1025390625, 45.453125, 48.8037109375, 52.154296875, 55.5048828125, 58.85546875, 62.2060546875, 65.556640625, 68.9072265625, 72.2578125, 75.6083984375, 78.958984375, 82.3095703125, 85.66015625, 89.0107421875, 92.361328125, 95.7119140625, 99.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 13.0, 15.0, 20.0, 19.0, 28.0, 32.0, 65.0, 52.0, 67.0, 98.0, 98.0, 94.0, 81.0, 53.0, 53.0, 44.0, 23.0, 26.0, 18.0, 16.0, 16.0, 6.0, 8.0, 8.0, 0.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.16845703125, -41.8056640625, -40.44287109375, -39.080078125, -37.71728515625, -36.3544921875, -34.99169921875, -33.62890625, -32.26611328125, -30.9033203125, -29.54052734375, -28.177734375, -26.81494140625, -25.4521484375, -24.08935546875, -22.7265625, -21.36376953125, -20.0009765625, -18.63818359375, -17.275390625, -15.91259765625, -14.5498046875, -13.18701171875, -11.82421875, -10.46142578125, -9.0986328125, -7.73583984375, -6.373046875, -5.01025390625, -3.6474609375, -2.28466796875, -0.921875, 0.44091796875, 1.8037109375, 3.16650390625, 4.529296875, 5.89208984375, 7.2548828125, 8.61767578125, 9.98046875, 11.34326171875, 12.7060546875, 14.06884765625, 15.431640625, 16.79443359375, 18.1572265625, 19.52001953125, 20.8828125, 22.24560546875, 23.6083984375, 24.97119140625, 26.333984375, 27.69677734375, 29.0595703125, 30.42236328125, 31.78515625, 33.14794921875, 34.5107421875, 35.87353515625, 37.236328125, 38.59912109375, 39.9619140625, 41.32470703125, 42.6875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 14.0, 18.0, 16.0, 38.0, 33.0, 35.0, 48.0, 39.0, 64.0, 52.0, 58.0, 66.0, 53.0, 56.0, 54.0, 44.0, 48.0, 40.0, 46.0, 25.0, 27.0, 26.0, 13.0, 11.0, 9.0, 11.0, 9.0, 4.0, 6.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23002624511719, -67.13697814941406, -65.04393768310547, -62.95089340209961, -60.85784912109375, -58.76480484008789, -56.67176055908203, -54.57871627807617, -52.48567199707031, -50.39262771606445, -48.299583435058594, -46.206539154052734, -44.113494873046875, -42.020450592041016, -39.927406311035156, -37.8343620300293, -35.74131774902344, -33.64827346801758, -31.55522918701172, -29.46218490600586, -27.369140625, -25.27609634399414, -23.18305206298828, -21.090007781982422, -18.996963500976562, -16.903919219970703, -14.810874938964844, -12.717830657958984, -10.624786376953125, -8.531742095947266, -6.438697814941406, -4.345653533935547, -2.2526168823242188, -0.15957260131835938, 1.9334716796875, 4.026515960693359, 6.119560241699219, 8.212604522705078, 10.305648803710938, 12.398693084716797, 14.491737365722656, 16.584781646728516, 18.677825927734375, 20.770870208740234, 22.863914489746094, 24.956958770751953, 27.050003051757812, 29.143047332763672, 31.23609161376953, 33.32913589477539, 35.42218017578125, 37.51522445678711, 39.60826873779297, 41.70131301879883, 43.79435729980469, 45.88740158081055, 47.980445861816406, 50.073490142822266, 52.166534423828125, 54.259578704833984, 56.352622985839844, 58.4456672668457, 60.53871154785156, 62.63175582885742, 64.72480010986328]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 8.0, 12.0, 16.0, 13.0, 16.0, 24.0, 17.0, 32.0, 32.0, 39.0, 39.0, 37.0, 35.0, 51.0, 45.0, 46.0, 56.0, 45.0, 44.0, 46.0, 52.0, 37.0, 33.0, 29.0, 31.0, 29.0, 18.0, 27.0, 16.0, 11.0, 15.0, 10.0, 6.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.37081909179688, -71.34426879882812, -69.3177261352539, -67.29117584228516, -65.2646255493164, -63.23807907104492, -61.21153259277344, -59.18498229980469, -57.15843200683594, -55.13188552856445, -53.1053352355957, -51.07878875732422, -49.05223846435547, -47.025691986083984, -44.9991455078125, -42.97259521484375, -40.946048736572266, -38.91950225830078, -36.89295196533203, -34.86640548706055, -32.8398551940918, -30.813308715820312, -28.786760330200195, -26.760211944580078, -24.73366355895996, -22.707115173339844, -20.680566787719727, -18.65401840209961, -16.627471923828125, -14.600922584533691, -12.57437515258789, -10.547826766967773, -8.521278381347656, -6.494729995727539, -4.46818208694458, -2.441634178161621, -0.4150857925415039, 1.6114625930786133, 3.638010025024414, 5.664558410644531, 7.691106796264648, 9.717655181884766, 11.744203567504883, 13.770750999450684, 15.7972993850708, 17.823848724365234, 19.85039520263672, 21.876943588256836, 23.903491973876953, 25.93004035949707, 27.956588745117188, 29.983135223388672, 32.00968551635742, 34.036231994628906, 36.062782287597656, 38.08932876586914, 40.115875244140625, 42.14242172241211, 44.16897201538086, 46.195518493652344, 48.222068786621094, 50.24861526489258, 52.27516174316406, 54.30171203613281, 56.32826232910156]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 14.0, 26.0, 35.0, 41.0, 66.0, 100.0, 157.0, 215.0, 340.0, 532.0, 671.0, 1036.0, 1562.0, 2443.0, 3686.0, 5468.0, 8493.0, 12559.0, 19438.0, 28922.0, 42544.0, 60025.0, 82178.0, 103700.0, 119772.0, 122973.0, 113078.0, 92472.0, 70804.0, 50452.0, 35098.0, 23602.0, 15647.0, 10376.0, 6709.0, 4525.0, 2933.0, 2003.0, 1223.0, 857.0, 559.0, 407.0, 257.0, 185.0, 112.0, 70.0, 68.0, 42.0, 29.0, 18.0, 9.0, 5.0, 5.0, 0.0, 4.0, 2.0], "bins": [-43.875, -42.55517578125, -41.2353515625, -39.91552734375, -38.595703125, -37.27587890625, -35.9560546875, -34.63623046875, -33.31640625, -31.99658203125, -30.6767578125, -29.35693359375, -28.037109375, -26.71728515625, -25.3974609375, -24.07763671875, -22.7578125, -21.43798828125, -20.1181640625, -18.79833984375, -17.478515625, -16.15869140625, -14.8388671875, -13.51904296875, -12.19921875, -10.87939453125, -9.5595703125, -8.23974609375, -6.919921875, -5.60009765625, -4.2802734375, -2.96044921875, -1.640625, -0.32080078125, 0.9990234375, 2.31884765625, 3.638671875, 4.95849609375, 6.2783203125, 7.59814453125, 8.91796875, 10.23779296875, 11.5576171875, 12.87744140625, 14.197265625, 15.51708984375, 16.8369140625, 18.15673828125, 19.4765625, 20.79638671875, 22.1162109375, 23.43603515625, 24.755859375, 26.07568359375, 27.3955078125, 28.71533203125, 30.03515625, 31.35498046875, 32.6748046875, 33.99462890625, 35.314453125, 36.63427734375, 37.9541015625, 39.27392578125, 40.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 12.0, 5.0, 7.0, 11.0, 17.0, 13.0, 17.0, 22.0, 19.0, 33.0, 38.0, 46.0, 37.0, 44.0, 48.0, 43.0, 45.0, 50.0, 54.0, 40.0, 55.0, 45.0, 35.0, 41.0, 39.0, 28.0, 30.0, 24.0, 16.0, 20.0, 13.0, 17.0, 11.0, 5.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-69.1875, -67.30078125, -65.4140625, -63.52734375, -61.640625, -59.75390625, -57.8671875, -55.98046875, -54.09375, -52.20703125, -50.3203125, -48.43359375, -46.546875, -44.66015625, -42.7734375, -40.88671875, -39.0, -37.11328125, -35.2265625, -33.33984375, -31.453125, -29.56640625, -27.6796875, -25.79296875, -23.90625, -22.01953125, -20.1328125, -18.24609375, -16.359375, -14.47265625, -12.5859375, -10.69921875, -8.8125, -6.92578125, -5.0390625, -3.15234375, -1.265625, 0.62109375, 2.5078125, 4.39453125, 6.28125, 8.16796875, 10.0546875, 11.94140625, 13.828125, 15.71484375, 17.6015625, 19.48828125, 21.375, 23.26171875, 25.1484375, 27.03515625, 28.921875, 30.80859375, 32.6953125, 34.58203125, 36.46875, 38.35546875, 40.2421875, 42.12890625, 44.015625, 45.90234375, 47.7890625, 49.67578125, 51.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 16.0, 25.0, 36.0, 68.0, 71.0, 116.0, 177.0, 246.0, 398.0, 637.0, 959.0, 1549.0, 2320.0, 3580.0, 5734.0, 9485.0, 15195.0, 24534.0, 40083.0, 64904.0, 101147.0, 142122.0, 165885.0, 153991.0, 115217.0, 75889.0, 47534.0, 28849.0, 17851.0, 10986.0, 6919.0, 4316.0, 2703.0, 1761.0, 1157.0, 723.0, 470.0, 267.0, 188.0, 145.0, 104.0, 67.0, 36.0, 31.0, 10.0, 15.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-58.5625, -56.77001953125, -54.9775390625, -53.18505859375, -51.392578125, -49.60009765625, -47.8076171875, -46.01513671875, -44.22265625, -42.43017578125, -40.6376953125, -38.84521484375, -37.052734375, -35.26025390625, -33.4677734375, -31.67529296875, -29.8828125, -28.09033203125, -26.2978515625, -24.50537109375, -22.712890625, -20.92041015625, -19.1279296875, -17.33544921875, -15.54296875, -13.75048828125, -11.9580078125, -10.16552734375, -8.373046875, -6.58056640625, -4.7880859375, -2.99560546875, -1.203125, 0.58935546875, 2.3818359375, 4.17431640625, 5.966796875, 7.75927734375, 9.5517578125, 11.34423828125, 13.13671875, 14.92919921875, 16.7216796875, 18.51416015625, 20.306640625, 22.09912109375, 23.8916015625, 25.68408203125, 27.4765625, 29.26904296875, 31.0615234375, 32.85400390625, 34.646484375, 36.43896484375, 38.2314453125, 40.02392578125, 41.81640625, 43.60888671875, 45.4013671875, 47.19384765625, 48.986328125, 50.77880859375, 52.5712890625, 54.36376953125, 56.15625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 0.0, 2.0, 9.0, 9.0, 13.0, 12.0, 19.0, 24.0, 15.0, 30.0, 27.0, 35.0, 30.0, 51.0, 40.0, 47.0, 48.0, 53.0, 63.0, 52.0, 41.0, 41.0, 53.0, 44.0, 43.0, 31.0, 31.0, 35.0, 13.0, 22.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.25, -53.6064453125, -51.962890625, -50.3193359375, -48.67578125, -47.0322265625, -45.388671875, -43.7451171875, -42.1015625, -40.4580078125, -38.814453125, -37.1708984375, -35.52734375, -33.8837890625, -32.240234375, -30.5966796875, -28.953125, -27.3095703125, -25.666015625, -24.0224609375, -22.37890625, -20.7353515625, -19.091796875, -17.4482421875, -15.8046875, -14.1611328125, -12.517578125, -10.8740234375, -9.23046875, -7.5869140625, -5.943359375, -4.2998046875, -2.65625, -1.0126953125, 0.630859375, 2.2744140625, 3.91796875, 5.5615234375, 7.205078125, 8.8486328125, 10.4921875, 12.1357421875, 13.779296875, 15.4228515625, 17.06640625, 18.7099609375, 20.353515625, 21.9970703125, 23.640625, 25.2841796875, 26.927734375, 28.5712890625, 30.21484375, 31.8583984375, 33.501953125, 35.1455078125, 36.7890625, 38.4326171875, 40.076171875, 41.7197265625, 43.36328125, 45.0068359375, 46.650390625, 48.2939453125, 49.9375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 13.0, 12.0, 26.0, 32.0, 44.0, 71.0, 83.0, 144.0, 199.0, 274.0, 404.0, 624.0, 885.0, 1424.0, 2237.0, 3713.0, 6424.0, 11413.0, 21477.0, 42368.0, 86334.0, 176113.0, 269101.0, 208176.0, 106242.0, 51545.0, 26173.0, 13593.0, 7571.0, 4494.0, 2602.0, 1568.0, 1046.0, 698.0, 439.0, 313.0, 221.0, 137.0, 88.0, 68.0, 47.0, 38.0, 25.0, 18.0, 11.0, 10.0, 2.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-82.625, -80.09375, -77.5625, -75.03125, -72.5, -69.96875, -67.4375, -64.90625, -62.375, -59.84375, -57.3125, -54.78125, -52.25, -49.71875, -47.1875, -44.65625, -42.125, -39.59375, -37.0625, -34.53125, -32.0, -29.46875, -26.9375, -24.40625, -21.875, -19.34375, -16.8125, -14.28125, -11.75, -9.21875, -6.6875, -4.15625, -1.625, 0.90625, 3.4375, 5.96875, 8.5, 11.03125, 13.5625, 16.09375, 18.625, 21.15625, 23.6875, 26.21875, 28.75, 31.28125, 33.8125, 36.34375, 38.875, 41.40625, 43.9375, 46.46875, 49.0, 51.53125, 54.0625, 56.59375, 59.125, 61.65625, 64.1875, 66.71875, 69.25, 71.78125, 74.3125, 76.84375, 79.375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 10.0, 8.0, 5.0, 12.0, 12.0, 22.0, 24.0, 20.0, 35.0, 42.0, 42.0, 54.0, 53.0, 49.0, 63.0, 65.0, 57.0, 53.0, 57.0, 41.0, 42.0, 34.0, 19.0, 25.0, 20.0, 21.0, 20.0, 12.0, 11.0, 9.0, 10.0, 1.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00479888916015625, -0.0046347975730896, -0.004470705986022949, -0.004306614398956299, -0.0041425228118896484, -0.003978431224822998, -0.0038143396377563477, -0.0036502480506896973, -0.003486156463623047, -0.0033220648765563965, -0.003157973289489746, -0.0029938817024230957, -0.0028297901153564453, -0.002665698528289795, -0.0025016069412231445, -0.002337515354156494, -0.0021734237670898438, -0.0020093321800231934, -0.001845240592956543, -0.0016811490058898926, -0.0015170574188232422, -0.0013529658317565918, -0.0011888742446899414, -0.001024782657623291, -0.0008606910705566406, -0.0006965994834899902, -0.0005325078964233398, -0.00036841630935668945, -0.00020432472229003906, -4.023313522338867e-05, 0.00012385845184326172, 0.0002879500389099121, 0.0004520416259765625, 0.0006161332130432129, 0.0007802248001098633, 0.0009443163871765137, 0.001108407974243164, 0.0012724995613098145, 0.0014365911483764648, 0.0016006827354431152, 0.0017647743225097656, 0.001928865909576416, 0.0020929574966430664, 0.002257049083709717, 0.002421140670776367, 0.0025852322578430176, 0.002749323844909668, 0.0029134154319763184, 0.0030775070190429688, 0.003241598606109619, 0.0034056901931762695, 0.00356978178024292, 0.0037338733673095703, 0.0038979649543762207, 0.004062056541442871, 0.0042261481285095215, 0.004390239715576172, 0.004554331302642822, 0.004718422889709473, 0.004882514476776123, 0.0050466060638427734, 0.005210697650909424, 0.005374789237976074, 0.005538880825042725, 0.005702972412109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 6.0, 12.0, 23.0, 23.0, 59.0, 72.0, 114.0, 172.0, 241.0, 414.0, 661.0, 1092.0, 2008.0, 3642.0, 6591.0, 12860.0, 26916.0, 58426.0, 130060.0, 259502.0, 274922.0, 144786.0, 65647.0, 29621.0, 14242.0, 7247.0, 3930.0, 2085.0, 1222.0, 730.0, 416.0, 256.0, 179.0, 111.0, 88.0, 58.0, 32.0, 27.0, 8.0, 17.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.8125, -85.07421875, -82.3359375, -79.59765625, -76.859375, -74.12109375, -71.3828125, -68.64453125, -65.90625, -63.16796875, -60.4296875, -57.69140625, -54.953125, -52.21484375, -49.4765625, -46.73828125, -44.0, -41.26171875, -38.5234375, -35.78515625, -33.046875, -30.30859375, -27.5703125, -24.83203125, -22.09375, -19.35546875, -16.6171875, -13.87890625, -11.140625, -8.40234375, -5.6640625, -2.92578125, -0.1875, 2.55078125, 5.2890625, 8.02734375, 10.765625, 13.50390625, 16.2421875, 18.98046875, 21.71875, 24.45703125, 27.1953125, 29.93359375, 32.671875, 35.41015625, 38.1484375, 40.88671875, 43.625, 46.36328125, 49.1015625, 51.83984375, 54.578125, 57.31640625, 60.0546875, 62.79296875, 65.53125, 68.26953125, 71.0078125, 73.74609375, 76.484375, 79.22265625, 81.9609375, 84.69921875, 87.4375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 20.0, 17.0, 10.0, 13.0, 17.0, 24.0, 30.0, 47.0, 46.0, 51.0, 67.0, 58.0, 66.0, 57.0, 48.0, 47.0, 52.0, 44.0, 44.0, 39.0, 30.0, 39.0, 19.0, 19.0, 12.0, 12.0, 12.0, 9.0, 12.0, 5.0, 2.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.40625, -20.74658203125, -20.0869140625, -19.42724609375, -18.767578125, -18.10791015625, -17.4482421875, -16.78857421875, -16.12890625, -15.46923828125, -14.8095703125, -14.14990234375, -13.490234375, -12.83056640625, -12.1708984375, -11.51123046875, -10.8515625, -10.19189453125, -9.5322265625, -8.87255859375, -8.212890625, -7.55322265625, -6.8935546875, -6.23388671875, -5.57421875, -4.91455078125, -4.2548828125, -3.59521484375, -2.935546875, -2.27587890625, -1.6162109375, -0.95654296875, -0.296875, 0.36279296875, 1.0224609375, 1.68212890625, 2.341796875, 3.00146484375, 3.6611328125, 4.32080078125, 4.98046875, 5.64013671875, 6.2998046875, 6.95947265625, 7.619140625, 8.27880859375, 8.9384765625, 9.59814453125, 10.2578125, 10.91748046875, 11.5771484375, 12.23681640625, 12.896484375, 13.55615234375, 14.2158203125, 14.87548828125, 15.53515625, 16.19482421875, 16.8544921875, 17.51416015625, 18.173828125, 18.83349609375, 19.4931640625, 20.15283203125, 20.8125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 11.0, 8.0, 10.0, 19.0, 11.0, 18.0, 19.0, 31.0, 32.0, 45.0, 45.0, 50.0, 53.0, 63.0, 57.0, 76.0, 51.0, 59.0, 45.0, 45.0, 59.0, 42.0, 31.0, 24.0, 19.0, 24.0, 15.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.30104064941406, -72.1893310546875, -70.07762145996094, -67.96591186523438, -65.85420227050781, -63.742496490478516, -61.63079071044922, -59.519081115722656, -57.407371520996094, -55.29566192626953, -53.18395233154297, -51.07224655151367, -48.96053695678711, -46.84882736206055, -44.73712158203125, -42.62541198730469, -40.513702392578125, -38.40199279785156, -36.290283203125, -34.1785774230957, -32.06686782836914, -29.955158233642578, -27.84345054626465, -25.73174285888672, -23.620033264160156, -21.508323669433594, -19.396615982055664, -17.284908294677734, -15.173198699951172, -13.061490058898926, -10.94978141784668, -8.838072776794434, -6.726371765136719, -4.614663124084473, -2.5029544830322266, -0.39124584197998047, 1.7204627990722656, 3.8321714401245117, 5.943880081176758, 8.055588722229004, 10.16729736328125, 12.279006004333496, 14.390714645385742, 16.502422332763672, 18.614131927490234, 20.725841522216797, 22.837549209594727, 24.949256896972656, 27.06096649169922, 29.17267608642578, 31.28438377380371, 33.39609146118164, 35.5078010559082, 37.619510650634766, 39.73121643066406, 41.842926025390625, 43.95463562011719, 46.06634521484375, 48.17805480957031, 50.28976058959961, 52.40147018432617, 54.513179779052734, 56.62488555908203, 58.736595153808594, 60.848304748535156]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 6.0, 4.0, 4.0, 7.0, 7.0, 7.0, 12.0, 18.0, 14.0, 23.0, 26.0, 30.0, 26.0, 31.0, 42.0, 34.0, 45.0, 32.0, 41.0, 52.0, 46.0, 48.0, 47.0, 41.0, 40.0, 47.0, 48.0, 32.0, 29.0, 19.0, 23.0, 26.0, 13.0, 17.0, 16.0, 11.0, 17.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.2049560546875, -68.05781555175781, -65.91067504882812, -63.76353454589844, -61.61639404296875, -59.46925354003906, -57.32210922241211, -55.17496871948242, -53.027828216552734, -50.88068771362305, -48.73354721069336, -46.58640670776367, -44.43926239013672, -42.29212188720703, -40.144981384277344, -37.997840881347656, -35.85070037841797, -33.70355987548828, -31.556419372558594, -29.409276962280273, -27.262136459350586, -25.1149959564209, -22.967853546142578, -20.82071304321289, -18.673572540283203, -16.526432037353516, -14.379290580749512, -12.232149124145508, -10.08500862121582, -7.937868118286133, -5.790726661682129, -3.643585205078125, -1.4964370727539062, 0.6507039070129395, 2.797844886779785, 4.944985866546631, 7.092126846313477, 9.239267349243164, 11.386408805847168, 13.533550262451172, 15.68069076538086, 17.827831268310547, 19.974971771240234, 22.122114181518555, 24.269254684448242, 26.41639518737793, 28.56353759765625, 30.710678100585938, 32.857818603515625, 35.00495910644531, 37.152099609375, 39.29924011230469, 41.446380615234375, 43.59352111816406, 45.740665435791016, 47.8878059387207, 50.03494644165039, 52.18208694458008, 54.329227447509766, 56.47636795043945, 58.623512268066406, 60.770652770996094, 62.91779327392578, 65.06493377685547, 67.21207427978516]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 13.0, 26.0, 36.0, 52.0, 104.0, 144.0, 198.0, 332.0, 473.0, 806.0, 1353.0, 2379.0, 3962.0, 6753.0, 11954.0, 20958.0, 37621.0, 70564.0, 133206.0, 259327.0, 491185.0, 779244.0, 879261.0, 674995.0, 391103.0, 201879.0, 103449.0, 54656.0, 29454.0, 16266.0, 9317.0, 5266.0, 3075.0, 1837.0, 1105.0, 705.0, 440.0, 278.0, 203.0, 91.0, 82.0, 33.0, 34.0, 16.0, 17.0, 12.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-49.09375, -47.66259765625, -46.2314453125, -44.80029296875, -43.369140625, -41.93798828125, -40.5068359375, -39.07568359375, -37.64453125, -36.21337890625, -34.7822265625, -33.35107421875, -31.919921875, -30.48876953125, -29.0576171875, -27.62646484375, -26.1953125, -24.76416015625, -23.3330078125, -21.90185546875, -20.470703125, -19.03955078125, -17.6083984375, -16.17724609375, -14.74609375, -13.31494140625, -11.8837890625, -10.45263671875, -9.021484375, -7.59033203125, -6.1591796875, -4.72802734375, -3.296875, -1.86572265625, -0.4345703125, 0.99658203125, 2.427734375, 3.85888671875, 5.2900390625, 6.72119140625, 8.15234375, 9.58349609375, 11.0146484375, 12.44580078125, 13.876953125, 15.30810546875, 16.7392578125, 18.17041015625, 19.6015625, 21.03271484375, 22.4638671875, 23.89501953125, 25.326171875, 26.75732421875, 28.1884765625, 29.61962890625, 31.05078125, 32.48193359375, 33.9130859375, 35.34423828125, 36.775390625, 38.20654296875, 39.6376953125, 41.06884765625, 42.5]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 5.0, 2.0, 11.0, 10.0, 17.0, 21.0, 19.0, 27.0, 32.0, 31.0, 34.0, 20.0, 35.0, 41.0, 40.0, 35.0, 48.0, 56.0, 49.0, 40.0, 39.0, 41.0, 37.0, 45.0, 39.0, 31.0, 27.0, 26.0, 20.0, 17.0, 14.0, 28.0, 13.0, 12.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-50.0625, -48.55517578125, -47.0478515625, -45.54052734375, -44.033203125, -42.52587890625, -41.0185546875, -39.51123046875, -38.00390625, -36.49658203125, -34.9892578125, -33.48193359375, -31.974609375, -30.46728515625, -28.9599609375, -27.45263671875, -25.9453125, -24.43798828125, -22.9306640625, -21.42333984375, -19.916015625, -18.40869140625, -16.9013671875, -15.39404296875, -13.88671875, -12.37939453125, -10.8720703125, -9.36474609375, -7.857421875, -6.35009765625, -4.8427734375, -3.33544921875, -1.828125, -0.32080078125, 1.1865234375, 2.69384765625, 4.201171875, 5.70849609375, 7.2158203125, 8.72314453125, 10.23046875, 11.73779296875, 13.2451171875, 14.75244140625, 16.259765625, 17.76708984375, 19.2744140625, 20.78173828125, 22.2890625, 23.79638671875, 25.3037109375, 26.81103515625, 28.318359375, 29.82568359375, 31.3330078125, 32.84033203125, 34.34765625, 35.85498046875, 37.3623046875, 38.86962890625, 40.376953125, 41.88427734375, 43.3916015625, 44.89892578125, 46.40625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 13.0, 9.0, 27.0, 42.0, 49.0, 75.0, 118.0, 172.0, 279.0, 415.0, 636.0, 1002.0, 1685.0, 2592.0, 4152.0, 6585.0, 11203.0, 18485.0, 30812.0, 51205.0, 86540.0, 146329.0, 241643.0, 382777.0, 565210.0, 698068.0, 654968.0, 486479.0, 317157.0, 194887.0, 116839.0, 69570.0, 41301.0, 24434.0, 14788.0, 8944.0, 5494.0, 3331.0, 2198.0, 1362.0, 850.0, 514.0, 376.0, 232.0, 137.0, 102.0, 69.0, 40.0, 33.0, 23.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.4375, -38.19677734375, -36.9560546875, -35.71533203125, -34.474609375, -33.23388671875, -31.9931640625, -30.75244140625, -29.51171875, -28.27099609375, -27.0302734375, -25.78955078125, -24.548828125, -23.30810546875, -22.0673828125, -20.82666015625, -19.5859375, -18.34521484375, -17.1044921875, -15.86376953125, -14.623046875, -13.38232421875, -12.1416015625, -10.90087890625, -9.66015625, -8.41943359375, -7.1787109375, -5.93798828125, -4.697265625, -3.45654296875, -2.2158203125, -0.97509765625, 0.265625, 1.50634765625, 2.7470703125, 3.98779296875, 5.228515625, 6.46923828125, 7.7099609375, 8.95068359375, 10.19140625, 11.43212890625, 12.6728515625, 13.91357421875, 15.154296875, 16.39501953125, 17.6357421875, 18.87646484375, 20.1171875, 21.35791015625, 22.5986328125, 23.83935546875, 25.080078125, 26.32080078125, 27.5615234375, 28.80224609375, 30.04296875, 31.28369140625, 32.5244140625, 33.76513671875, 35.005859375, 36.24658203125, 37.4873046875, 38.72802734375, 39.96875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 11.0, 18.0, 10.0, 19.0, 19.0, 24.0, 46.0, 52.0, 66.0, 58.0, 93.0, 120.0, 123.0, 138.0, 194.0, 198.0, 206.0, 243.0, 248.0, 246.0, 294.0, 228.0, 229.0, 221.0, 196.0, 164.0, 139.0, 105.0, 77.0, 72.0, 46.0, 36.0, 31.0, 22.0, 17.0, 16.0, 8.0, 7.0, 5.0, 7.0, 2.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.050537109375, -15.44482421875, -14.839111328125, -14.2333984375, -13.627685546875, -13.02197265625, -12.416259765625, -11.810546875, -11.204833984375, -10.59912109375, -9.993408203125, -9.3876953125, -8.781982421875, -8.17626953125, -7.570556640625, -6.96484375, -6.359130859375, -5.75341796875, -5.147705078125, -4.5419921875, -3.936279296875, -3.33056640625, -2.724853515625, -2.119140625, -1.513427734375, -0.90771484375, -0.302001953125, 0.3037109375, 0.909423828125, 1.51513671875, 2.120849609375, 2.7265625, 3.332275390625, 3.93798828125, 4.543701171875, 5.1494140625, 5.755126953125, 6.36083984375, 6.966552734375, 7.572265625, 8.177978515625, 8.78369140625, 9.389404296875, 9.9951171875, 10.600830078125, 11.20654296875, 11.812255859375, 12.41796875, 13.023681640625, 13.62939453125, 14.235107421875, 14.8408203125, 15.446533203125, 16.05224609375, 16.657958984375, 17.263671875, 17.869384765625, 18.47509765625, 19.080810546875, 19.6865234375, 20.292236328125, 20.89794921875, 21.503662109375, 22.109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 9.0, 23.0, 17.0, 17.0, 29.0, 38.0, 43.0, 42.0, 43.0, 69.0, 72.0, 63.0, 88.0, 55.0, 56.0, 59.0, 45.0, 52.0, 38.0, 22.0, 20.0, 13.0, 11.0, 17.0, 7.0, 7.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-70.68123626708984, -68.78840637207031, -66.89556884765625, -65.00273895263672, -63.10990905761719, -61.21707534790039, -59.324241638183594, -57.43141174316406, -55.538578033447266, -53.64574432373047, -51.75291442871094, -49.86008071899414, -47.967247009277344, -46.07441711425781, -44.181583404541016, -42.28874969482422, -40.39591979980469, -38.50308609008789, -36.61025619506836, -34.71742248535156, -32.82459259033203, -30.931758880615234, -29.038925170898438, -27.146093368530273, -25.25326156616211, -23.360429763793945, -21.46759796142578, -19.574764251708984, -17.68193244934082, -15.789100646972656, -13.896267890930176, -12.003435134887695, -10.110599517822266, -8.217767715454102, -6.324934959411621, -4.432102680206299, -2.5392704010009766, -0.6464385986328125, 1.246394157409668, 3.1392269134521484, 5.0320587158203125, 6.924890995025635, 8.817723274230957, 10.710556030273438, 12.603387832641602, 14.496219635009766, 16.389053344726562, 18.281885147094727, 20.17471694946289, 22.067548751831055, 23.96038055419922, 25.853214263916016, 27.74604606628418, 29.638877868652344, 31.53171157836914, 33.42454528808594, 35.31737518310547, 37.210208892822266, 39.1030387878418, 40.995872497558594, 42.888702392578125, 44.78153610229492, 46.67436981201172, 48.56719970703125, 50.46003341674805]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 10.0, 15.0, 18.0, 35.0, 24.0, 24.0, 27.0, 23.0, 38.0, 31.0, 25.0, 29.0, 43.0, 48.0, 48.0, 44.0, 42.0, 40.0, 47.0, 36.0, 38.0, 48.0, 30.0, 27.0, 20.0, 27.0, 23.0, 23.0, 23.0, 14.0, 16.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.50748062133789, -51.859893798828125, -50.212310791015625, -48.56472396850586, -46.917137145996094, -45.269554138183594, -43.62196731567383, -41.97438049316406, -40.32679748535156, -38.6792106628418, -37.0316276550293, -35.38404083251953, -33.73645782470703, -32.088871002197266, -30.4412841796875, -28.793699264526367, -27.146114349365234, -25.4985294342041, -23.85094451904297, -22.203357696533203, -20.55577278137207, -18.908187866210938, -17.260601043701172, -15.613016128540039, -13.965431213378906, -12.317846298217773, -10.670260429382324, -9.022674560546875, -7.375089645385742, -5.727504730224609, -4.07991886138916, -2.432332992553711, -0.7847480773925781, 0.8628373146057129, 2.510422706604004, 4.158008098602295, 5.805593490600586, 7.453178405761719, 9.100764274597168, 10.748350143432617, 12.39593505859375, 14.043519973754883, 15.691105842590332, 17.33869171142578, 18.986276626586914, 20.633861541748047, 22.281448364257812, 23.929033279418945, 25.576618194580078, 27.22420310974121, 28.871788024902344, 30.51937484741211, 32.166961669921875, 33.814544677734375, 35.46213150024414, 37.109718322753906, 38.757301330566406, 40.40488815307617, 42.05247116088867, 43.70005798339844, 45.34764099121094, 46.9952278137207, 48.64281463623047, 50.29039764404297, 51.937984466552734]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 10.0, 12.0, 21.0, 26.0, 37.0, 56.0, 57.0, 101.0, 134.0, 181.0, 297.0, 412.0, 624.0, 960.0, 1478.0, 2340.0, 3902.0, 6608.0, 12109.0, 24410.0, 57485.0, 151646.0, 330137.0, 266277.0, 105670.0, 40949.0, 18672.0, 9676.0, 5321.0, 3162.0, 1935.0, 1280.0, 793.0, 565.0, 374.0, 271.0, 174.0, 123.0, 87.0, 59.0, 38.0, 21.0, 17.0, 16.0, 8.0, 5.0, 8.0, 1.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-146.25, -141.50390625, -136.7578125, -132.01171875, -127.265625, -122.51953125, -117.7734375, -113.02734375, -108.28125, -103.53515625, -98.7890625, -94.04296875, -89.296875, -84.55078125, -79.8046875, -75.05859375, -70.3125, -65.56640625, -60.8203125, -56.07421875, -51.328125, -46.58203125, -41.8359375, -37.08984375, -32.34375, -27.59765625, -22.8515625, -18.10546875, -13.359375, -8.61328125, -3.8671875, 0.87890625, 5.625, 10.37109375, 15.1171875, 19.86328125, 24.609375, 29.35546875, 34.1015625, 38.84765625, 43.59375, 48.33984375, 53.0859375, 57.83203125, 62.578125, 67.32421875, 72.0703125, 76.81640625, 81.5625, 86.30859375, 91.0546875, 95.80078125, 100.546875, 105.29296875, 110.0390625, 114.78515625, 119.53125, 124.27734375, 129.0234375, 133.76953125, 138.515625, 143.26171875, 148.0078125, 152.75390625, 157.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 4.0, 12.0, 15.0, 23.0, 16.0, 20.0, 23.0, 26.0, 28.0, 23.0, 33.0, 27.0, 34.0, 38.0, 46.0, 50.0, 41.0, 49.0, 40.0, 34.0, 49.0, 42.0, 38.0, 36.0, 31.0, 34.0, 23.0, 25.0, 23.0, 17.0, 16.0, 17.0, 12.0, 13.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.8125, -47.3427734375, -45.873046875, -44.4033203125, -42.93359375, -41.4638671875, -39.994140625, -38.5244140625, -37.0546875, -35.5849609375, -34.115234375, -32.6455078125, -31.17578125, -29.7060546875, -28.236328125, -26.7666015625, -25.296875, -23.8271484375, -22.357421875, -20.8876953125, -19.41796875, -17.9482421875, -16.478515625, -15.0087890625, -13.5390625, -12.0693359375, -10.599609375, -9.1298828125, -7.66015625, -6.1904296875, -4.720703125, -3.2509765625, -1.78125, -0.3115234375, 1.158203125, 2.6279296875, 4.09765625, 5.5673828125, 7.037109375, 8.5068359375, 9.9765625, 11.4462890625, 12.916015625, 14.3857421875, 15.85546875, 17.3251953125, 18.794921875, 20.2646484375, 21.734375, 23.2041015625, 24.673828125, 26.1435546875, 27.61328125, 29.0830078125, 30.552734375, 32.0224609375, 33.4921875, 34.9619140625, 36.431640625, 37.9013671875, 39.37109375, 40.8408203125, 42.310546875, 43.7802734375, 45.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 21.0, 16.0, 25.0, 24.0, 29.0, 38.0, 49.0, 70.0, 99.0, 148.0, 198.0, 275.0, 403.0, 745.0, 1094.0, 1820.0, 3082.0, 5800.0, 11212.0, 23412.0, 58049.0, 184377.0, 450701.0, 195368.0, 61147.0, 24677.0, 11510.0, 5791.0, 3235.0, 1812.0, 1107.0, 694.0, 436.0, 266.0, 193.0, 178.0, 95.0, 83.0, 64.0, 55.0, 27.0, 28.0, 19.0, 18.0, 13.0, 8.0, 9.0, 2.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-177.5, -171.869140625, -166.23828125, -160.607421875, -154.9765625, -149.345703125, -143.71484375, -138.083984375, -132.453125, -126.822265625, -121.19140625, -115.560546875, -109.9296875, -104.298828125, -98.66796875, -93.037109375, -87.40625, -81.775390625, -76.14453125, -70.513671875, -64.8828125, -59.251953125, -53.62109375, -47.990234375, -42.359375, -36.728515625, -31.09765625, -25.466796875, -19.8359375, -14.205078125, -8.57421875, -2.943359375, 2.6875, 8.318359375, 13.94921875, 19.580078125, 25.2109375, 30.841796875, 36.47265625, 42.103515625, 47.734375, 53.365234375, 58.99609375, 64.626953125, 70.2578125, 75.888671875, 81.51953125, 87.150390625, 92.78125, 98.412109375, 104.04296875, 109.673828125, 115.3046875, 120.935546875, 126.56640625, 132.197265625, 137.828125, 143.458984375, 149.08984375, 154.720703125, 160.3515625, 165.982421875, 171.61328125, 177.244140625, 182.875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 13.0, 14.0, 12.0, 23.0, 32.0, 34.0, 44.0, 50.0, 62.0, 66.0, 93.0, 89.0, 66.0, 61.0, 54.0, 63.0, 48.0, 42.0, 31.0, 21.0, 11.0, 18.0, 15.0, 7.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.63623046875, -53.7724609375, -51.90869140625, -50.044921875, -48.18115234375, -46.3173828125, -44.45361328125, -42.58984375, -40.72607421875, -38.8623046875, -36.99853515625, -35.134765625, -33.27099609375, -31.4072265625, -29.54345703125, -27.6796875, -25.81591796875, -23.9521484375, -22.08837890625, -20.224609375, -18.36083984375, -16.4970703125, -14.63330078125, -12.76953125, -10.90576171875, -9.0419921875, -7.17822265625, -5.314453125, -3.45068359375, -1.5869140625, 0.27685546875, 2.140625, 4.00439453125, 5.8681640625, 7.73193359375, 9.595703125, 11.45947265625, 13.3232421875, 15.18701171875, 17.05078125, 18.91455078125, 20.7783203125, 22.64208984375, 24.505859375, 26.36962890625, 28.2333984375, 30.09716796875, 31.9609375, 33.82470703125, 35.6884765625, 37.55224609375, 39.416015625, 41.27978515625, 43.1435546875, 45.00732421875, 46.87109375, 48.73486328125, 50.5986328125, 52.46240234375, 54.326171875, 56.18994140625, 58.0537109375, 59.91748046875, 61.78125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 18.0, 12.0, 34.0, 54.0, 94.0, 160.0, 268.0, 476.0, 735.0, 1270.0, 2412.0, 4545.0, 9413.0, 22137.0, 62632.0, 240190.0, 470686.0, 156502.0, 44489.0, 16725.0, 7347.0, 3738.0, 1969.0, 1117.0, 592.0, 356.0, 206.0, 117.0, 80.0, 60.0, 36.0, 30.0, 18.0, 8.0, 7.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.625, -85.7978515625, -82.970703125, -80.1435546875, -77.31640625, -74.4892578125, -71.662109375, -68.8349609375, -66.0078125, -63.1806640625, -60.353515625, -57.5263671875, -54.69921875, -51.8720703125, -49.044921875, -46.2177734375, -43.390625, -40.5634765625, -37.736328125, -34.9091796875, -32.08203125, -29.2548828125, -26.427734375, -23.6005859375, -20.7734375, -17.9462890625, -15.119140625, -12.2919921875, -9.46484375, -6.6376953125, -3.810546875, -0.9833984375, 1.84375, 4.6708984375, 7.498046875, 10.3251953125, 13.15234375, 15.9794921875, 18.806640625, 21.6337890625, 24.4609375, 27.2880859375, 30.115234375, 32.9423828125, 35.76953125, 38.5966796875, 41.423828125, 44.2509765625, 47.078125, 49.9052734375, 52.732421875, 55.5595703125, 58.38671875, 61.2138671875, 64.041015625, 66.8681640625, 69.6953125, 72.5224609375, 75.349609375, 78.1767578125, 81.00390625, 83.8310546875, 86.658203125, 89.4853515625, 92.3125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 9.0, 3.0, 6.0, 2.0, 4.0, 6.0, 14.0, 13.0, 20.0, 24.0, 42.0, 97.0, 141.0, 178.0, 148.0, 109.0, 58.0, 41.0, 21.0, 22.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0064239501953125, -0.00625300407409668, -0.006082057952880859, -0.005911111831665039, -0.005740165710449219, -0.0055692195892333984, -0.005398273468017578, -0.005227327346801758, -0.0050563812255859375, -0.004885435104370117, -0.004714488983154297, -0.0045435428619384766, -0.004372596740722656, -0.004201650619506836, -0.004030704498291016, -0.0038597583770751953, -0.003688812255859375, -0.0035178661346435547, -0.0033469200134277344, -0.003175973892211914, -0.0030050277709960938, -0.0028340816497802734, -0.002663135528564453, -0.002492189407348633, -0.0023212432861328125, -0.002150297164916992, -0.001979351043701172, -0.0018084049224853516, -0.0016374588012695312, -0.001466512680053711, -0.0012955665588378906, -0.0011246204376220703, -0.00095367431640625, -0.0007827281951904297, -0.0006117820739746094, -0.00044083595275878906, -0.00026988983154296875, -9.894371032714844e-05, 7.200241088867188e-05, 0.0002429485321044922, 0.0004138946533203125, 0.0005848407745361328, 0.0007557868957519531, 0.0009267330169677734, 0.0010976791381835938, 0.001268625259399414, 0.0014395713806152344, 0.0016105175018310547, 0.001781463623046875, 0.0019524097442626953, 0.0021233558654785156, 0.002294301986694336, 0.0024652481079101562, 0.0026361942291259766, 0.002807140350341797, 0.002978086471557617, 0.0031490325927734375, 0.003319978713989258, 0.003490924835205078, 0.0036618709564208984, 0.0038328170776367188, 0.004003763198852539, 0.004174709320068359, 0.00434565544128418, 0.0045166015625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 9.0, 12.0, 18.0, 20.0, 31.0, 58.0, 82.0, 118.0, 151.0, 224.0, 349.0, 533.0, 819.0, 1255.0, 2040.0, 3329.0, 5468.0, 9783.0, 18869.0, 38845.0, 89453.0, 202259.0, 300046.0, 203097.0, 89200.0, 39088.0, 19007.0, 9854.0, 5610.0, 3155.0, 2026.0, 1263.0, 800.0, 552.0, 380.0, 253.0, 157.0, 99.0, 73.0, 47.0, 37.0, 26.0, 18.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-59.59375, -57.81494140625, -56.0361328125, -54.25732421875, -52.478515625, -50.69970703125, -48.9208984375, -47.14208984375, -45.36328125, -43.58447265625, -41.8056640625, -40.02685546875, -38.248046875, -36.46923828125, -34.6904296875, -32.91162109375, -31.1328125, -29.35400390625, -27.5751953125, -25.79638671875, -24.017578125, -22.23876953125, -20.4599609375, -18.68115234375, -16.90234375, -15.12353515625, -13.3447265625, -11.56591796875, -9.787109375, -8.00830078125, -6.2294921875, -4.45068359375, -2.671875, -0.89306640625, 0.8857421875, 2.66455078125, 4.443359375, 6.22216796875, 8.0009765625, 9.77978515625, 11.55859375, 13.33740234375, 15.1162109375, 16.89501953125, 18.673828125, 20.45263671875, 22.2314453125, 24.01025390625, 25.7890625, 27.56787109375, 29.3466796875, 31.12548828125, 32.904296875, 34.68310546875, 36.4619140625, 38.24072265625, 40.01953125, 41.79833984375, 43.5771484375, 45.35595703125, 47.134765625, 48.91357421875, 50.6923828125, 52.47119140625, 54.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 6.0, 7.0, 14.0, 11.0, 17.0, 23.0, 26.0, 41.0, 44.0, 61.0, 82.0, 82.0, 105.0, 85.0, 90.0, 71.0, 58.0, 41.0, 35.0, 23.0, 18.0, 12.0, 7.0, 4.0, 8.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -23.889404296875, -23.06005859375, -22.230712890625, -21.4013671875, -20.572021484375, -19.74267578125, -18.913330078125, -18.083984375, -17.254638671875, -16.42529296875, -15.595947265625, -14.7666015625, -13.937255859375, -13.10791015625, -12.278564453125, -11.44921875, -10.619873046875, -9.79052734375, -8.961181640625, -8.1318359375, -7.302490234375, -6.47314453125, -5.643798828125, -4.814453125, -3.985107421875, -3.15576171875, -2.326416015625, -1.4970703125, -0.667724609375, 0.16162109375, 0.990966796875, 1.8203125, 2.649658203125, 3.47900390625, 4.308349609375, 5.1376953125, 5.967041015625, 6.79638671875, 7.625732421875, 8.455078125, 9.284423828125, 10.11376953125, 10.943115234375, 11.7724609375, 12.601806640625, 13.43115234375, 14.260498046875, 15.08984375, 15.919189453125, 16.74853515625, 17.577880859375, 18.4072265625, 19.236572265625, 20.06591796875, 20.895263671875, 21.724609375, 22.553955078125, 23.38330078125, 24.212646484375, 25.0419921875, 25.871337890625, 26.70068359375, 27.530029296875, 28.359375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 2.0, 0.0, 6.0, 9.0, 14.0, 14.0, 16.0, 30.0, 22.0, 32.0, 38.0, 57.0, 54.0, 39.0, 58.0, 54.0, 72.0, 64.0, 57.0, 53.0, 56.0, 49.0, 46.0, 34.0, 22.0, 30.0, 18.0, 9.0, 6.0, 13.0, 5.0, 8.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.05623245239258, -48.432655334472656, -46.809078216552734, -45.18550109863281, -43.56192398071289, -41.93834686279297, -40.31477355957031, -38.69119644165039, -37.06761932373047, -35.44404220581055, -33.820465087890625, -32.1968879699707, -30.573312759399414, -28.949735641479492, -27.32615852355957, -25.70258331298828, -24.079004287719727, -22.455427169799805, -20.831850051879883, -19.208274841308594, -17.584697723388672, -15.96112060546875, -14.337543487548828, -12.713967323303223, -11.0903902053833, -9.466813087463379, -7.843236923217773, -6.219659805297852, -4.596083164215088, -2.972506523132324, -1.3489294052124023, 0.2746467590332031, 1.898223876953125, 3.5218005180358887, 5.145377159118652, 6.768954277038574, 8.39253044128418, 10.016107559204102, 11.639684677124023, 13.263260841369629, 14.88683795928955, 16.510414123535156, 18.133991241455078, 19.757568359375, 21.381145477294922, 23.004722595214844, 24.628299713134766, 26.251874923706055, 27.875452041625977, 29.4990291595459, 31.12260627746582, 32.74618148803711, 34.36975860595703, 35.99333572387695, 37.616912841796875, 39.2404899597168, 40.86406707763672, 42.48764419555664, 44.11122131347656, 45.734798431396484, 47.358375549316406, 48.98194885253906, 50.60552978515625, 52.229103088378906, 53.85268020629883]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 8.0, 11.0, 15.0, 12.0, 17.0, 22.0, 20.0, 32.0, 22.0, 27.0, 31.0, 24.0, 28.0, 41.0, 40.0, 50.0, 55.0, 27.0, 41.0, 41.0, 35.0, 28.0, 36.0, 36.0, 39.0, 23.0, 27.0, 29.0, 23.0, 21.0, 18.0, 15.0, 19.0, 13.0, 11.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-41.95718002319336, -40.70591735839844, -39.45465087890625, -38.20338821411133, -36.952125549316406, -35.700862884521484, -34.44960021972656, -33.198333740234375, -31.947071075439453, -30.69580841064453, -29.444543838500977, -28.193279266357422, -26.9420166015625, -25.690753936767578, -24.439489364624023, -23.18822479248047, -21.936962127685547, -20.685699462890625, -19.43443489074707, -18.183170318603516, -16.931907653808594, -15.680644035339355, -14.429380416870117, -13.178116798400879, -11.92685317993164, -10.675589561462402, -9.424325942993164, -8.173062324523926, -6.9217987060546875, -5.670535087585449, -4.419271469116211, -3.1680078506469727, -1.9167442321777344, -0.6654806137084961, 0.5857830047607422, 1.8370466232299805, 3.0883102416992188, 4.339573860168457, 5.590837478637695, 6.842101097106934, 8.093364715576172, 9.34462833404541, 10.595891952514648, 11.847155570983887, 13.098419189453125, 14.349682807922363, 15.600946426391602, 16.852210998535156, 18.103473663330078, 19.354736328125, 20.606000900268555, 21.85726547241211, 23.10852813720703, 24.359790802001953, 25.611055374145508, 26.862319946289062, 28.113582611083984, 29.364845275878906, 30.61610984802246, 31.867374420166016, 33.11863708496094, 34.36989974975586, 35.62116241455078, 36.87242889404297, 38.12369155883789]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 18.0, 29.0, 32.0, 56.0, 89.0, 120.0, 229.0, 321.0, 508.0, 769.0, 1218.0, 1986.0, 3195.0, 5218.0, 7978.0, 13360.0, 21682.0, 34792.0, 54989.0, 82508.0, 117315.0, 147298.0, 152921.0, 130741.0, 95787.0, 64495.0, 41984.0, 25982.0, 16393.0, 9931.0, 6185.0, 3803.0, 2401.0, 1495.0, 992.0, 608.0, 398.0, 248.0, 162.0, 110.0, 59.0, 60.0, 33.0, 12.0, 18.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-41.125, -39.88623046875, -38.6474609375, -37.40869140625, -36.169921875, -34.93115234375, -33.6923828125, -32.45361328125, -31.21484375, -29.97607421875, -28.7373046875, -27.49853515625, -26.259765625, -25.02099609375, -23.7822265625, -22.54345703125, -21.3046875, -20.06591796875, -18.8271484375, -17.58837890625, -16.349609375, -15.11083984375, -13.8720703125, -12.63330078125, -11.39453125, -10.15576171875, -8.9169921875, -7.67822265625, -6.439453125, -5.20068359375, -3.9619140625, -2.72314453125, -1.484375, -0.24560546875, 0.9931640625, 2.23193359375, 3.470703125, 4.70947265625, 5.9482421875, 7.18701171875, 8.42578125, 9.66455078125, 10.9033203125, 12.14208984375, 13.380859375, 14.61962890625, 15.8583984375, 17.09716796875, 18.3359375, 19.57470703125, 20.8134765625, 22.05224609375, 23.291015625, 24.52978515625, 25.7685546875, 27.00732421875, 28.24609375, 29.48486328125, 30.7236328125, 31.96240234375, 33.201171875, 34.43994140625, 35.6787109375, 36.91748046875, 38.15625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 7.0, 11.0, 6.0, 8.0, 21.0, 19.0, 14.0, 17.0, 19.0, 31.0, 23.0, 27.0, 31.0, 27.0, 37.0, 39.0, 37.0, 38.0, 45.0, 49.0, 39.0, 33.0, 36.0, 32.0, 41.0, 32.0, 33.0, 33.0, 24.0, 25.0, 26.0, 27.0, 18.0, 19.0, 13.0, 10.0, 3.0, 10.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-37.4375, -36.24951171875, -35.0615234375, -33.87353515625, -32.685546875, -31.49755859375, -30.3095703125, -29.12158203125, -27.93359375, -26.74560546875, -25.5576171875, -24.36962890625, -23.181640625, -21.99365234375, -20.8056640625, -19.61767578125, -18.4296875, -17.24169921875, -16.0537109375, -14.86572265625, -13.677734375, -12.48974609375, -11.3017578125, -10.11376953125, -8.92578125, -7.73779296875, -6.5498046875, -5.36181640625, -4.173828125, -2.98583984375, -1.7978515625, -0.60986328125, 0.578125, 1.76611328125, 2.9541015625, 4.14208984375, 5.330078125, 6.51806640625, 7.7060546875, 8.89404296875, 10.08203125, 11.27001953125, 12.4580078125, 13.64599609375, 14.833984375, 16.02197265625, 17.2099609375, 18.39794921875, 19.5859375, 20.77392578125, 21.9619140625, 23.14990234375, 24.337890625, 25.52587890625, 26.7138671875, 27.90185546875, 29.08984375, 30.27783203125, 31.4658203125, 32.65380859375, 33.841796875, 35.02978515625, 36.2177734375, 37.40576171875, 38.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 12.0, 11.0, 19.0, 23.0, 32.0, 71.0, 109.0, 139.0, 238.0, 316.0, 511.0, 736.0, 1154.0, 1763.0, 2675.0, 4248.0, 6646.0, 10092.0, 15752.0, 24521.0, 37484.0, 56261.0, 81122.0, 109266.0, 131553.0, 137465.0, 123154.0, 97196.0, 69339.0, 47437.0, 31581.0, 20340.0, 13259.0, 8595.0, 5374.0, 3503.0, 2245.0, 1526.0, 925.0, 639.0, 434.0, 266.0, 163.0, 126.0, 81.0, 45.0, 42.0, 16.0, 17.0, 8.0, 7.0, 8.0, 4.0, 7.0, 1.0, 3.0, 2.0], "bins": [-32.40625, -31.402587890625, -30.39892578125, -29.395263671875, -28.3916015625, -27.387939453125, -26.38427734375, -25.380615234375, -24.376953125, -23.373291015625, -22.36962890625, -21.365966796875, -20.3623046875, -19.358642578125, -18.35498046875, -17.351318359375, -16.34765625, -15.343994140625, -14.34033203125, -13.336669921875, -12.3330078125, -11.329345703125, -10.32568359375, -9.322021484375, -8.318359375, -7.314697265625, -6.31103515625, -5.307373046875, -4.3037109375, -3.300048828125, -2.29638671875, -1.292724609375, -0.2890625, 0.714599609375, 1.71826171875, 2.721923828125, 3.7255859375, 4.729248046875, 5.73291015625, 6.736572265625, 7.740234375, 8.743896484375, 9.74755859375, 10.751220703125, 11.7548828125, 12.758544921875, 13.76220703125, 14.765869140625, 15.76953125, 16.773193359375, 17.77685546875, 18.780517578125, 19.7841796875, 20.787841796875, 21.79150390625, 22.795166015625, 23.798828125, 24.802490234375, 25.80615234375, 26.809814453125, 27.8134765625, 28.817138671875, 29.82080078125, 30.824462890625, 31.828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 6.0, 13.0, 7.0, 15.0, 16.0, 16.0, 13.0, 21.0, 18.0, 25.0, 26.0, 37.0, 23.0, 27.0, 31.0, 45.0, 38.0, 38.0, 42.0, 48.0, 31.0, 38.0, 46.0, 44.0, 34.0, 29.0, 31.0, 29.0, 24.0, 13.0, 25.0, 24.0, 14.0, 17.0, 12.0, 12.0, 12.0, 7.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.921875, -21.212646484375, -20.50341796875, -19.794189453125, -19.0849609375, -18.375732421875, -17.66650390625, -16.957275390625, -16.248046875, -15.538818359375, -14.82958984375, -14.120361328125, -13.4111328125, -12.701904296875, -11.99267578125, -11.283447265625, -10.57421875, -9.864990234375, -9.15576171875, -8.446533203125, -7.7373046875, -7.028076171875, -6.31884765625, -5.609619140625, -4.900390625, -4.191162109375, -3.48193359375, -2.772705078125, -2.0634765625, -1.354248046875, -0.64501953125, 0.064208984375, 0.7734375, 1.482666015625, 2.19189453125, 2.901123046875, 3.6103515625, 4.319580078125, 5.02880859375, 5.738037109375, 6.447265625, 7.156494140625, 7.86572265625, 8.574951171875, 9.2841796875, 9.993408203125, 10.70263671875, 11.411865234375, 12.12109375, 12.830322265625, 13.53955078125, 14.248779296875, 14.9580078125, 15.667236328125, 16.37646484375, 17.085693359375, 17.794921875, 18.504150390625, 19.21337890625, 19.922607421875, 20.6318359375, 21.341064453125, 22.05029296875, 22.759521484375, 23.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 8.0, 5.0, 12.0, 20.0, 17.0, 27.0, 43.0, 46.0, 80.0, 93.0, 139.0, 168.0, 248.0, 352.0, 498.0, 770.0, 1068.0, 1859.0, 3158.0, 6060.0, 12692.0, 31188.0, 84872.0, 233400.0, 360935.0, 193120.0, 68165.0, 25631.0, 10820.0, 5189.0, 2798.0, 1664.0, 1090.0, 699.0, 426.0, 338.0, 214.0, 181.0, 133.0, 77.0, 55.0, 44.0, 45.0, 36.0, 15.0, 19.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.5625, -47.98388671875, -46.4052734375, -44.82666015625, -43.248046875, -41.66943359375, -40.0908203125, -38.51220703125, -36.93359375, -35.35498046875, -33.7763671875, -32.19775390625, -30.619140625, -29.04052734375, -27.4619140625, -25.88330078125, -24.3046875, -22.72607421875, -21.1474609375, -19.56884765625, -17.990234375, -16.41162109375, -14.8330078125, -13.25439453125, -11.67578125, -10.09716796875, -8.5185546875, -6.93994140625, -5.361328125, -3.78271484375, -2.2041015625, -0.62548828125, 0.953125, 2.53173828125, 4.1103515625, 5.68896484375, 7.267578125, 8.84619140625, 10.4248046875, 12.00341796875, 13.58203125, 15.16064453125, 16.7392578125, 18.31787109375, 19.896484375, 21.47509765625, 23.0537109375, 24.63232421875, 26.2109375, 27.78955078125, 29.3681640625, 30.94677734375, 32.525390625, 34.10400390625, 35.6826171875, 37.26123046875, 38.83984375, 40.41845703125, 41.9970703125, 43.57568359375, 45.154296875, 46.73291015625, 48.3115234375, 49.89013671875, 51.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 5.0, 7.0, 15.0, 26.0, 31.0, 60.0, 69.0, 90.0, 135.0, 138.0, 120.0, 93.0, 66.0, 40.0, 38.0, 19.0, 6.0, 14.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00440216064453125, -0.004246711730957031, -0.0040912628173828125, -0.003935813903808594, -0.003780364990234375, -0.0036249160766601562, -0.0034694671630859375, -0.0033140182495117188, -0.0031585693359375, -0.0030031204223632812, -0.0028476715087890625, -0.0026922225952148438, -0.002536773681640625, -0.0023813247680664062, -0.0022258758544921875, -0.0020704269409179688, -0.00191497802734375, -0.0017595291137695312, -0.0016040802001953125, -0.0014486312866210938, -0.001293182373046875, -0.0011377334594726562, -0.0009822845458984375, -0.0008268356323242188, -0.00067138671875, -0.0005159378051757812, -0.0003604888916015625, -0.00020503997802734375, -4.9591064453125e-05, 0.00010585784912109375, 0.0002613067626953125, 0.00041675567626953125, 0.00057220458984375, 0.0007276535034179688, 0.0008831024169921875, 0.0010385513305664062, 0.001194000244140625, 0.0013494491577148438, 0.0015048980712890625, 0.0016603469848632812, 0.0018157958984375, 0.0019712448120117188, 0.0021266937255859375, 0.0022821426391601562, 0.002437591552734375, 0.0025930404663085938, 0.0027484893798828125, 0.0029039382934570312, 0.00305938720703125, 0.0032148361206054688, 0.0033702850341796875, 0.0035257339477539062, 0.003681182861328125, 0.0038366317749023438, 0.0039920806884765625, 0.004147529602050781, 0.004302978515625, 0.004458427429199219, 0.0046138763427734375, 0.004769325256347656, 0.004924774169921875, 0.005080223083496094, 0.0052356719970703125, 0.005391120910644531, 0.00554656982421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 6.0, 13.0, 22.0, 32.0, 41.0, 58.0, 75.0, 116.0, 165.0, 279.0, 324.0, 506.0, 808.0, 1139.0, 1765.0, 2661.0, 4071.0, 6740.0, 11136.0, 18846.0, 32743.0, 57284.0, 97009.0, 149795.0, 188198.0, 172547.0, 122548.0, 74373.0, 43168.0, 24369.0, 14175.0, 8729.0, 5229.0, 3240.0, 2137.0, 1349.0, 951.0, 571.0, 418.0, 266.0, 204.0, 130.0, 109.0, 60.0, 52.0, 38.0, 14.0, 10.0, 19.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.183349609375, -22.42919921875, -21.675048828125, -20.9208984375, -20.166748046875, -19.41259765625, -18.658447265625, -17.904296875, -17.150146484375, -16.39599609375, -15.641845703125, -14.8876953125, -14.133544921875, -13.37939453125, -12.625244140625, -11.87109375, -11.116943359375, -10.36279296875, -9.608642578125, -8.8544921875, -8.100341796875, -7.34619140625, -6.592041015625, -5.837890625, -5.083740234375, -4.32958984375, -3.575439453125, -2.8212890625, -2.067138671875, -1.31298828125, -0.558837890625, 0.1953125, 0.949462890625, 1.70361328125, 2.457763671875, 3.2119140625, 3.966064453125, 4.72021484375, 5.474365234375, 6.228515625, 6.982666015625, 7.73681640625, 8.490966796875, 9.2451171875, 9.999267578125, 10.75341796875, 11.507568359375, 12.26171875, 13.015869140625, 13.77001953125, 14.524169921875, 15.2783203125, 16.032470703125, 16.78662109375, 17.540771484375, 18.294921875, 19.049072265625, 19.80322265625, 20.557373046875, 21.3115234375, 22.065673828125, 22.81982421875, 23.573974609375, 24.328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 9.0, 6.0, 8.0, 9.0, 14.0, 11.0, 16.0, 28.0, 33.0, 33.0, 33.0, 47.0, 50.0, 72.0, 71.0, 62.0, 78.0, 58.0, 54.0, 49.0, 44.0, 43.0, 27.0, 31.0, 25.0, 13.0, 12.0, 16.0, 12.0, 9.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.7421875, -10.4505615234375, -10.158935546875, -9.8673095703125, -9.57568359375, -9.2840576171875, -8.992431640625, -8.7008056640625, -8.4091796875, -8.1175537109375, -7.825927734375, -7.5343017578125, -7.24267578125, -6.9510498046875, -6.659423828125, -6.3677978515625, -6.076171875, -5.7845458984375, -5.492919921875, -5.2012939453125, -4.90966796875, -4.6180419921875, -4.326416015625, -4.0347900390625, -3.7431640625, -3.4515380859375, -3.159912109375, -2.8682861328125, -2.57666015625, -2.2850341796875, -1.993408203125, -1.7017822265625, -1.41015625, -1.1185302734375, -0.826904296875, -0.5352783203125, -0.24365234375, 0.0479736328125, 0.339599609375, 0.6312255859375, 0.9228515625, 1.2144775390625, 1.506103515625, 1.7977294921875, 2.08935546875, 2.3809814453125, 2.672607421875, 2.9642333984375, 3.255859375, 3.5474853515625, 3.839111328125, 4.1307373046875, 4.42236328125, 4.7139892578125, 5.005615234375, 5.2972412109375, 5.5888671875, 5.8804931640625, 6.172119140625, 6.4637451171875, 6.75537109375, 7.0469970703125, 7.338623046875, 7.6302490234375, 7.921875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 13.0, 20.0, 23.0, 23.0, 30.0, 35.0, 39.0, 53.0, 57.0, 49.0, 57.0, 79.0, 57.0, 65.0, 70.0, 62.0, 58.0, 40.0, 27.0, 26.0, 20.0, 20.0, 15.0, 7.0, 2.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.41061019897461, -48.828453063964844, -47.246299743652344, -45.66414260864258, -44.08198547363281, -42.49983215332031, -40.91767501831055, -39.33551788330078, -37.75336456298828, -36.171207427978516, -34.589054107666016, -33.00689697265625, -31.424741744995117, -29.842586517333984, -28.26042938232422, -26.678274154663086, -25.09611701965332, -23.513961791992188, -21.931804656982422, -20.34964942932129, -18.767494201660156, -17.18533706665039, -15.603181838989258, -14.021026611328125, -12.438870429992676, -10.856714248657227, -9.274559020996094, -7.6924028396606445, -6.1102471351623535, -4.5280914306640625, -2.9459352493286133, -1.3637800216674805, 0.21837615966796875, 1.8005319833755493, 3.38268780708313, 4.96484375, 6.546999454498291, 8.129155158996582, 9.711311340332031, 11.293466567993164, 12.875622749328613, 14.457778930664062, 16.039934158325195, 17.622089385986328, 19.204246520996094, 20.786401748657227, 22.36855697631836, 23.950714111328125, 25.532869338989258, 27.11502456665039, 28.697181701660156, 30.27933692932129, 31.861492156982422, 33.44364929199219, 35.02580261230469, 36.60795974731445, 38.19011688232422, 39.772274017333984, 41.354427337646484, 42.93658447265625, 44.518741607666016, 46.100894927978516, 47.68305206298828, 49.26520538330078, 50.84736251831055]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 4.0, 5.0, 12.0, 10.0, 9.0, 13.0, 20.0, 14.0, 25.0, 19.0, 20.0, 26.0, 36.0, 40.0, 30.0, 36.0, 47.0, 39.0, 39.0, 42.0, 26.0, 33.0, 41.0, 48.0, 37.0, 34.0, 32.0, 28.0, 39.0, 27.0, 22.0, 28.0, 20.0, 17.0, 15.0, 19.0, 12.0, 7.0, 4.0, 1.0, 4.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.945762634277344, -39.7737922668457, -38.60182189941406, -37.429847717285156, -36.257877349853516, -35.085906982421875, -33.913936614990234, -32.741966247558594, -31.56999397277832, -30.39802360534668, -29.226051330566406, -28.054080963134766, -26.882110595703125, -25.71013832092285, -24.53816795349121, -23.366195678710938, -22.194225311279297, -21.022254943847656, -19.850282669067383, -18.678312301635742, -17.50634002685547, -16.334369659423828, -15.162399291992188, -13.99042797088623, -12.818456649780273, -11.646485328674316, -10.47451400756836, -9.302543640136719, -8.130572319030762, -6.958600997924805, -5.786630153656006, -4.614659309387207, -3.44268798828125, -2.270716905593872, -1.0987458229064941, 0.07322525978088379, 1.2451963424682617, 2.4171676635742188, 3.5891385078430176, 4.761109352111816, 5.933080673217773, 7.1050519943237305, 8.277023315429688, 9.448993682861328, 10.620965003967285, 11.792936325073242, 12.964906692504883, 14.13687801361084, 15.308849334716797, 16.480819702148438, 17.65279197692871, 18.82476234436035, 19.996734619140625, 21.168704986572266, 22.340675354003906, 23.512645721435547, 24.68461799621582, 25.85658836364746, 27.028560638427734, 28.200531005859375, 29.372501373291016, 30.54447364807129, 31.71644401550293, 32.8884162902832, 34.060386657714844]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 30.0, 52.0, 75.0, 94.0, 171.0, 263.0, 385.0, 645.0, 949.0, 1478.0, 2152.0, 3267.0, 5214.0, 8384.0, 12862.0, 21182.0, 34367.0, 57172.0, 96861.0, 166869.0, 286547.0, 470811.0, 664112.0, 733194.0, 611312.0, 409949.0, 245962.0, 142854.0, 84457.0, 49803.0, 30466.0, 19128.0, 11910.0, 7491.0, 4870.0, 3087.0, 2018.0, 1289.0, 861.0, 536.0, 376.0, 242.0, 176.0, 133.0, 67.0, 52.0, 32.0, 22.0, 10.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-26.28125, -25.41552734375, -24.5498046875, -23.68408203125, -22.818359375, -21.95263671875, -21.0869140625, -20.22119140625, -19.35546875, -18.48974609375, -17.6240234375, -16.75830078125, -15.892578125, -15.02685546875, -14.1611328125, -13.29541015625, -12.4296875, -11.56396484375, -10.6982421875, -9.83251953125, -8.966796875, -8.10107421875, -7.2353515625, -6.36962890625, -5.50390625, -4.63818359375, -3.7724609375, -2.90673828125, -2.041015625, -1.17529296875, -0.3095703125, 0.55615234375, 1.421875, 2.28759765625, 3.1533203125, 4.01904296875, 4.884765625, 5.75048828125, 6.6162109375, 7.48193359375, 8.34765625, 9.21337890625, 10.0791015625, 10.94482421875, 11.810546875, 12.67626953125, 13.5419921875, 14.40771484375, 15.2734375, 16.13916015625, 17.0048828125, 17.87060546875, 18.736328125, 19.60205078125, 20.4677734375, 21.33349609375, 22.19921875, 23.06494140625, 23.9306640625, 24.79638671875, 25.662109375, 26.52783203125, 27.3935546875, 28.25927734375, 29.125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 3.0, 9.0, 9.0, 16.0, 15.0, 13.0, 15.0, 20.0, 18.0, 14.0, 23.0, 27.0, 25.0, 30.0, 32.0, 30.0, 35.0, 37.0, 37.0, 44.0, 32.0, 39.0, 35.0, 36.0, 23.0, 37.0, 29.0, 21.0, 34.0, 27.0, 44.0, 22.0, 24.0, 22.0, 19.0, 18.0, 17.0, 12.0, 12.0, 9.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0], "bins": [-26.0, -25.259033203125, -24.51806640625, -23.777099609375, -23.0361328125, -22.295166015625, -21.55419921875, -20.813232421875, -20.072265625, -19.331298828125, -18.59033203125, -17.849365234375, -17.1083984375, -16.367431640625, -15.62646484375, -14.885498046875, -14.14453125, -13.403564453125, -12.66259765625, -11.921630859375, -11.1806640625, -10.439697265625, -9.69873046875, -8.957763671875, -8.216796875, -7.475830078125, -6.73486328125, -5.993896484375, -5.2529296875, -4.511962890625, -3.77099609375, -3.030029296875, -2.2890625, -1.548095703125, -0.80712890625, -0.066162109375, 0.6748046875, 1.415771484375, 2.15673828125, 2.897705078125, 3.638671875, 4.379638671875, 5.12060546875, 5.861572265625, 6.6025390625, 7.343505859375, 8.08447265625, 8.825439453125, 9.56640625, 10.307373046875, 11.04833984375, 11.789306640625, 12.5302734375, 13.271240234375, 14.01220703125, 14.753173828125, 15.494140625, 16.235107421875, 16.97607421875, 17.717041015625, 18.4580078125, 19.198974609375, 19.93994140625, 20.680908203125, 21.421875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 13.0, 28.0, 36.0, 47.0, 74.0, 94.0, 163.0, 272.0, 367.0, 608.0, 961.0, 1476.0, 2503.0, 3905.0, 6369.0, 10576.0, 17554.0, 30280.0, 51555.0, 88417.0, 152494.0, 259206.0, 422624.0, 626253.0, 749351.0, 650134.0, 447870.0, 276649.0, 163944.0, 95059.0, 55061.0, 32055.0, 18930.0, 11283.0, 7012.0, 4055.0, 2524.0, 1575.0, 1047.0, 629.0, 427.0, 254.0, 180.0, 118.0, 74.0, 53.0, 38.0, 26.0, 15.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.507080078125, -26.57666015625, -25.646240234375, -24.7158203125, -23.785400390625, -22.85498046875, -21.924560546875, -20.994140625, -20.063720703125, -19.13330078125, -18.202880859375, -17.2724609375, -16.342041015625, -15.41162109375, -14.481201171875, -13.55078125, -12.620361328125, -11.68994140625, -10.759521484375, -9.8291015625, -8.898681640625, -7.96826171875, -7.037841796875, -6.107421875, -5.177001953125, -4.24658203125, -3.316162109375, -2.3857421875, -1.455322265625, -0.52490234375, 0.405517578125, 1.3359375, 2.266357421875, 3.19677734375, 4.127197265625, 5.0576171875, 5.988037109375, 6.91845703125, 7.848876953125, 8.779296875, 9.709716796875, 10.64013671875, 11.570556640625, 12.5009765625, 13.431396484375, 14.36181640625, 15.292236328125, 16.22265625, 17.153076171875, 18.08349609375, 19.013916015625, 19.9443359375, 20.874755859375, 21.80517578125, 22.735595703125, 23.666015625, 24.596435546875, 25.52685546875, 26.457275390625, 27.3876953125, 28.318115234375, 29.24853515625, 30.178955078125, 31.109375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 14.0, 11.0, 20.0, 27.0, 27.0, 28.0, 50.0, 54.0, 65.0, 82.0, 94.0, 93.0, 133.0, 157.0, 140.0, 195.0, 211.0, 230.0, 229.0, 235.0, 260.0, 200.0, 209.0, 183.0, 178.0, 144.0, 124.0, 131.0, 107.0, 72.0, 77.0, 55.0, 48.0, 30.0, 35.0, 15.0, 16.0, 19.0, 11.0, 9.0, 11.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.328125, -9.976806640625, -9.62548828125, -9.274169921875, -8.9228515625, -8.571533203125, -8.22021484375, -7.868896484375, -7.517578125, -7.166259765625, -6.81494140625, -6.463623046875, -6.1123046875, -5.760986328125, -5.40966796875, -5.058349609375, -4.70703125, -4.355712890625, -4.00439453125, -3.653076171875, -3.3017578125, -2.950439453125, -2.59912109375, -2.247802734375, -1.896484375, -1.545166015625, -1.19384765625, -0.842529296875, -0.4912109375, -0.139892578125, 0.21142578125, 0.562744140625, 0.9140625, 1.265380859375, 1.61669921875, 1.968017578125, 2.3193359375, 2.670654296875, 3.02197265625, 3.373291015625, 3.724609375, 4.075927734375, 4.42724609375, 4.778564453125, 5.1298828125, 5.481201171875, 5.83251953125, 6.183837890625, 6.53515625, 6.886474609375, 7.23779296875, 7.589111328125, 7.9404296875, 8.291748046875, 8.64306640625, 8.994384765625, 9.345703125, 9.697021484375, 10.04833984375, 10.399658203125, 10.7509765625, 11.102294921875, 11.45361328125, 11.804931640625, 12.15625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 3.0, 4.0, 7.0, 6.0, 8.0, 9.0, 14.0, 24.0, 23.0, 20.0, 29.0, 25.0, 36.0, 37.0, 46.0, 43.0, 63.0, 45.0, 69.0, 46.0, 51.0, 40.0, 51.0, 53.0, 40.0, 33.0, 24.0, 20.0, 20.0, 12.0, 20.0, 13.0, 9.0, 15.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.933067321777344, -34.862876892089844, -33.792686462402344, -32.72249221801758, -31.652301788330078, -30.582111358642578, -29.511919021606445, -28.441726684570312, -27.371536254882812, -26.301345825195312, -25.23115348815918, -24.160961151123047, -23.090770721435547, -22.020580291748047, -20.950387954711914, -19.88019561767578, -18.81000518798828, -17.73981475830078, -16.66962242126465, -15.599431037902832, -14.529239654541016, -13.4590482711792, -12.388856887817383, -11.318665504455566, -10.24847412109375, -9.178282737731934, -8.108091354370117, -7.037899971008301, -5.967708587646484, -4.897517204284668, -3.8273258209228516, -2.757134437561035, -1.6869392395019531, -0.6167478561401367, 0.4534435272216797, 1.523634910583496, 2.5938262939453125, 3.664017677307129, 4.734209060668945, 5.804400444030762, 6.874591827392578, 7.9447832107543945, 9.014974594116211, 10.085165977478027, 11.155357360839844, 12.22554874420166, 13.295740127563477, 14.365931510925293, 15.43612289428711, 16.50631332397461, 17.576505661010742, 18.646697998046875, 19.716888427734375, 20.787078857421875, 21.857271194458008, 22.92746353149414, 23.99765396118164, 25.06784439086914, 26.138036727905273, 27.208229064941406, 28.278419494628906, 29.348609924316406, 30.41880226135254, 31.488994598388672, 32.55918502807617]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 2.0, 10.0, 6.0, 8.0, 5.0, 16.0, 15.0, 27.0, 21.0, 24.0, 34.0, 29.0, 31.0, 36.0, 25.0, 34.0, 44.0, 46.0, 53.0, 31.0, 44.0, 50.0, 42.0, 38.0, 37.0, 40.0, 33.0, 29.0, 28.0, 25.0, 17.0, 13.0, 15.0, 17.0, 15.0, 10.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.264554977416992, -28.384599685668945, -27.5046443939209, -26.62468910217285, -25.744733810424805, -24.864778518676758, -23.984825134277344, -23.104869842529297, -22.22491455078125, -21.344959259033203, -20.465003967285156, -19.58504867553711, -18.705093383789062, -17.825138092041016, -16.94518280029297, -16.065227508544922, -15.185272216796875, -14.305316925048828, -13.425361633300781, -12.545406341552734, -11.665451049804688, -10.78549575805664, -9.90554141998291, -9.025586128234863, -8.145630836486816, -7.2656755447387695, -6.385720252990723, -5.505765438079834, -4.625810146331787, -3.7458548545837402, -2.8659000396728516, -1.9859447479248047, -1.1059894561767578, -0.2260342836380005, 0.6539208889007568, 1.5338759422302246, 2.4138312339782715, 3.2937865257263184, 4.173741340637207, 5.053696632385254, 5.933651924133301, 6.813607215881348, 7.6935625076293945, 8.573516845703125, 9.453472137451172, 10.333427429199219, 11.213382720947266, 12.093338012695312, 12.97329330444336, 13.853248596191406, 14.733203887939453, 15.6131591796875, 16.493114471435547, 17.373069763183594, 18.25302505493164, 19.132980346679688, 20.012935638427734, 20.89289093017578, 21.772846221923828, 22.652801513671875, 23.532756805419922, 24.41271209716797, 25.292667388916016, 26.172622680664062, 27.052576065063477]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 14.0, 35.0, 33.0, 60.0, 78.0, 108.0, 174.0, 271.0, 424.0, 650.0, 1033.0, 1687.0, 2799.0, 4627.0, 7967.0, 13674.0, 24296.0, 43021.0, 78120.0, 132827.0, 193216.0, 200139.0, 144819.0, 86150.0, 48282.0, 26953.0, 15204.0, 8608.0, 5130.0, 3081.0, 1923.0, 1169.0, 674.0, 430.0, 291.0, 197.0, 123.0, 99.0, 57.0, 33.0, 27.0, 13.0, 9.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.625, -42.306640625, -40.98828125, -39.669921875, -38.3515625, -37.033203125, -35.71484375, -34.396484375, -33.078125, -31.759765625, -30.44140625, -29.123046875, -27.8046875, -26.486328125, -25.16796875, -23.849609375, -22.53125, -21.212890625, -19.89453125, -18.576171875, -17.2578125, -15.939453125, -14.62109375, -13.302734375, -11.984375, -10.666015625, -9.34765625, -8.029296875, -6.7109375, -5.392578125, -4.07421875, -2.755859375, -1.4375, -0.119140625, 1.19921875, 2.517578125, 3.8359375, 5.154296875, 6.47265625, 7.791015625, 9.109375, 10.427734375, 11.74609375, 13.064453125, 14.3828125, 15.701171875, 17.01953125, 18.337890625, 19.65625, 20.974609375, 22.29296875, 23.611328125, 24.9296875, 26.248046875, 27.56640625, 28.884765625, 30.203125, 31.521484375, 32.83984375, 34.158203125, 35.4765625, 36.794921875, 38.11328125, 39.431640625, 40.75]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 8.0, 3.0, 5.0, 8.0, 11.0, 14.0, 13.0, 10.0, 26.0, 24.0, 19.0, 27.0, 19.0, 37.0, 32.0, 35.0, 32.0, 37.0, 43.0, 47.0, 49.0, 47.0, 42.0, 42.0, 42.0, 36.0, 35.0, 29.0, 19.0, 34.0, 20.0, 14.0, 33.0, 18.0, 14.0, 17.0, 8.0, 10.0, 8.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.78125, -27.923095703125, -27.06494140625, -26.206787109375, -25.3486328125, -24.490478515625, -23.63232421875, -22.774169921875, -21.916015625, -21.057861328125, -20.19970703125, -19.341552734375, -18.4833984375, -17.625244140625, -16.76708984375, -15.908935546875, -15.05078125, -14.192626953125, -13.33447265625, -12.476318359375, -11.6181640625, -10.760009765625, -9.90185546875, -9.043701171875, -8.185546875, -7.327392578125, -6.46923828125, -5.611083984375, -4.7529296875, -3.894775390625, -3.03662109375, -2.178466796875, -1.3203125, -0.462158203125, 0.39599609375, 1.254150390625, 2.1123046875, 2.970458984375, 3.82861328125, 4.686767578125, 5.544921875, 6.403076171875, 7.26123046875, 8.119384765625, 8.9775390625, 9.835693359375, 10.69384765625, 11.552001953125, 12.41015625, 13.268310546875, 14.12646484375, 14.984619140625, 15.8427734375, 16.700927734375, 17.55908203125, 18.417236328125, 19.275390625, 20.133544921875, 20.99169921875, 21.849853515625, 22.7080078125, 23.566162109375, 24.42431640625, 25.282470703125, 26.140625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 9.0, 7.0, 7.0, 19.0, 23.0, 30.0, 50.0, 64.0, 77.0, 118.0, 212.0, 289.0, 406.0, 665.0, 984.0, 1595.0, 2476.0, 4155.0, 7073.0, 12803.0, 26875.0, 64776.0, 179128.0, 371929.0, 224769.0, 81384.0, 32810.0, 15212.0, 8128.0, 4619.0, 2745.0, 1728.0, 1146.0, 760.0, 508.0, 330.0, 198.0, 140.0, 92.0, 54.0, 56.0, 41.0, 23.0, 19.0, 12.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.6220703125, -69.119140625, -66.6162109375, -64.11328125, -61.6103515625, -59.107421875, -56.6044921875, -54.1015625, -51.5986328125, -49.095703125, -46.5927734375, -44.08984375, -41.5869140625, -39.083984375, -36.5810546875, -34.078125, -31.5751953125, -29.072265625, -26.5693359375, -24.06640625, -21.5634765625, -19.060546875, -16.5576171875, -14.0546875, -11.5517578125, -9.048828125, -6.5458984375, -4.04296875, -1.5400390625, 0.962890625, 3.4658203125, 5.96875, 8.4716796875, 10.974609375, 13.4775390625, 15.98046875, 18.4833984375, 20.986328125, 23.4892578125, 25.9921875, 28.4951171875, 30.998046875, 33.5009765625, 36.00390625, 38.5068359375, 41.009765625, 43.5126953125, 46.015625, 48.5185546875, 51.021484375, 53.5244140625, 56.02734375, 58.5302734375, 61.033203125, 63.5361328125, 66.0390625, 68.5419921875, 71.044921875, 73.5478515625, 76.05078125, 78.5537109375, 81.056640625, 83.5595703125, 86.0625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 1.0, 6.0, 12.0, 6.0, 11.0, 19.0, 9.0, 17.0, 28.0, 14.0, 17.0, 22.0, 30.0, 23.0, 31.0, 34.0, 35.0, 52.0, 37.0, 43.0, 38.0, 50.0, 42.0, 31.0, 36.0, 35.0, 40.0, 34.0, 27.0, 26.0, 35.0, 16.0, 22.0, 21.0, 23.0, 12.0, 14.0, 9.0, 9.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.296875, -15.7578125, -15.21875, -14.6796875, -14.140625, -13.6015625, -13.0625, -12.5234375, -11.984375, -11.4453125, -10.90625, -10.3671875, -9.828125, -9.2890625, -8.75, -8.2109375, -7.671875, -7.1328125, -6.59375, -6.0546875, -5.515625, -4.9765625, -4.4375, -3.8984375, -3.359375, -2.8203125, -2.28125, -1.7421875, -1.203125, -0.6640625, -0.125, 0.4140625, 0.953125, 1.4921875, 2.03125, 2.5703125, 3.109375, 3.6484375, 4.1875, 4.7265625, 5.265625, 5.8046875, 6.34375, 6.8828125, 7.421875, 7.9609375, 8.5, 9.0390625, 9.578125, 10.1171875, 10.65625, 11.1953125, 11.734375, 12.2734375, 12.8125, 13.3515625, 13.890625, 14.4296875, 14.96875, 15.5078125, 16.046875, 16.5859375, 17.125, 17.6640625, 18.203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 14.0, 15.0, 19.0, 29.0, 43.0, 65.0, 85.0, 112.0, 203.0, 280.0, 502.0, 789.0, 1327.0, 2336.0, 4495.0, 8823.0, 17827.0, 38093.0, 86998.0, 192638.0, 301301.0, 211659.0, 97833.0, 42709.0, 19481.0, 9641.0, 4896.0, 2642.0, 1488.0, 812.0, 478.0, 300.0, 196.0, 127.0, 94.0, 66.0, 31.0, 30.0, 19.0, 15.0, 16.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-30.65625, -29.76953125, -28.8828125, -27.99609375, -27.109375, -26.22265625, -25.3359375, -24.44921875, -23.5625, -22.67578125, -21.7890625, -20.90234375, -20.015625, -19.12890625, -18.2421875, -17.35546875, -16.46875, -15.58203125, -14.6953125, -13.80859375, -12.921875, -12.03515625, -11.1484375, -10.26171875, -9.375, -8.48828125, -7.6015625, -6.71484375, -5.828125, -4.94140625, -4.0546875, -3.16796875, -2.28125, -1.39453125, -0.5078125, 0.37890625, 1.265625, 2.15234375, 3.0390625, 3.92578125, 4.8125, 5.69921875, 6.5859375, 7.47265625, 8.359375, 9.24609375, 10.1328125, 11.01953125, 11.90625, 12.79296875, 13.6796875, 14.56640625, 15.453125, 16.33984375, 17.2265625, 18.11328125, 19.0, 19.88671875, 20.7734375, 21.66015625, 22.546875, 23.43359375, 24.3203125, 25.20703125, 26.09375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 21.0, 30.0, 24.0, 34.0, 43.0, 66.0, 65.0, 73.0, 96.0, 94.0, 84.0, 54.0, 51.0, 39.0, 29.0, 23.0, 21.0, 19.0, 12.0, 11.0, 5.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0012836456298828125, -0.0012420117855072021, -0.0012003779411315918, -0.0011587440967559814, -0.001117110252380371, -0.0010754764080047607, -0.0010338425636291504, -0.00099220871925354, -0.0009505748748779297, -0.0009089410305023193, -0.000867307186126709, -0.0008256733417510986, -0.0007840394973754883, -0.0007424056529998779, -0.0007007718086242676, -0.0006591379642486572, -0.0006175041198730469, -0.0005758702754974365, -0.0005342364311218262, -0.0004926025867462158, -0.00045096874237060547, -0.0004093348979949951, -0.00036770105361938477, -0.0003260672092437744, -0.00028443336486816406, -0.0002427995204925537, -0.00020116567611694336, -0.000159531831741333, -0.00011789798736572266, -7.62641429901123e-05, -3.463029861450195e-05, 7.0035457611083984e-06, 4.863739013671875e-05, 9.02712345123291e-05, 0.00013190507888793945, 0.0001735389232635498, 0.00021517276763916016, 0.0002568066120147705, 0.00029844045639038086, 0.0003400743007659912, 0.00038170814514160156, 0.0004233419895172119, 0.00046497583389282227, 0.0005066096782684326, 0.000548243522644043, 0.0005898773670196533, 0.0006315112113952637, 0.000673145055770874, 0.0007147789001464844, 0.0007564127445220947, 0.0007980465888977051, 0.0008396804332733154, 0.0008813142776489258, 0.0009229481220245361, 0.0009645819664001465, 0.0010062158107757568, 0.0010478496551513672, 0.0010894834995269775, 0.0011311173439025879, 0.0011727511882781982, 0.0012143850326538086, 0.001256018877029419, 0.0012976527214050293, 0.0013392865657806396, 0.00138092041015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 5.0, 11.0, 7.0, 13.0, 27.0, 30.0, 48.0, 83.0, 102.0, 153.0, 256.0, 400.0, 646.0, 960.0, 1580.0, 2447.0, 3868.0, 5965.0, 9760.0, 15722.0, 25756.0, 41738.0, 66663.0, 100801.0, 138213.0, 159472.0, 148962.0, 114568.0, 78875.0, 50210.0, 30711.0, 18775.0, 11770.0, 7274.0, 4457.0, 2991.0, 1886.0, 1211.0, 788.0, 490.0, 298.0, 182.0, 139.0, 91.0, 48.0, 38.0, 33.0, 13.0, 13.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.114501953125, -12.60400390625, -12.093505859375, -11.5830078125, -11.072509765625, -10.56201171875, -10.051513671875, -9.541015625, -9.030517578125, -8.52001953125, -8.009521484375, -7.4990234375, -6.988525390625, -6.47802734375, -5.967529296875, -5.45703125, -4.946533203125, -4.43603515625, -3.925537109375, -3.4150390625, -2.904541015625, -2.39404296875, -1.883544921875, -1.373046875, -0.862548828125, -0.35205078125, 0.158447265625, 0.6689453125, 1.179443359375, 1.68994140625, 2.200439453125, 2.7109375, 3.221435546875, 3.73193359375, 4.242431640625, 4.7529296875, 5.263427734375, 5.77392578125, 6.284423828125, 6.794921875, 7.305419921875, 7.81591796875, 8.326416015625, 8.8369140625, 9.347412109375, 9.85791015625, 10.368408203125, 10.87890625, 11.389404296875, 11.89990234375, 12.410400390625, 12.9208984375, 13.431396484375, 13.94189453125, 14.452392578125, 14.962890625, 15.473388671875, 15.98388671875, 16.494384765625, 17.0048828125, 17.515380859375, 18.02587890625, 18.536376953125, 19.046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 6.0, 10.0, 12.0, 13.0, 20.0, 26.0, 34.0, 20.0, 40.0, 29.0, 43.0, 55.0, 53.0, 48.0, 58.0, 49.0, 53.0, 46.0, 45.0, 54.0, 40.0, 29.0, 26.0, 27.0, 25.0, 19.0, 23.0, 17.0, 20.0, 14.0, 7.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.515625, -5.32623291015625, -5.1368408203125, -4.94744873046875, -4.758056640625, -4.56866455078125, -4.3792724609375, -4.18988037109375, -4.00048828125, -3.81109619140625, -3.6217041015625, -3.43231201171875, -3.242919921875, -3.05352783203125, -2.8641357421875, -2.67474365234375, -2.4853515625, -2.29595947265625, -2.1065673828125, -1.91717529296875, -1.727783203125, -1.53839111328125, -1.3489990234375, -1.15960693359375, -0.97021484375, -0.78082275390625, -0.5914306640625, -0.40203857421875, -0.212646484375, -0.02325439453125, 0.1661376953125, 0.35552978515625, 0.544921875, 0.73431396484375, 0.9237060546875, 1.11309814453125, 1.302490234375, 1.49188232421875, 1.6812744140625, 1.87066650390625, 2.06005859375, 2.24945068359375, 2.4388427734375, 2.62823486328125, 2.817626953125, 3.00701904296875, 3.1964111328125, 3.38580322265625, 3.5751953125, 3.76458740234375, 3.9539794921875, 4.14337158203125, 4.332763671875, 4.52215576171875, 4.7115478515625, 4.90093994140625, 5.09033203125, 5.27972412109375, 5.4691162109375, 5.65850830078125, 5.847900390625, 6.03729248046875, 6.2266845703125, 6.41607666015625, 6.60546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 4.0, 4.0, 9.0, 10.0, 12.0, 12.0, 19.0, 15.0, 21.0, 23.0, 35.0, 41.0, 45.0, 60.0, 55.0, 40.0, 53.0, 54.0, 56.0, 47.0, 48.0, 43.0, 44.0, 38.0, 26.0, 26.0, 31.0, 23.0, 13.0, 11.0, 10.0, 8.0, 13.0, 3.0, 8.0, 8.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-35.86669921875, -34.82542419433594, -33.78415298461914, -32.74287796020508, -31.70160675048828, -30.66033172607422, -29.61905860900879, -28.57778549194336, -27.53651237487793, -26.4952392578125, -25.45396614074707, -24.41269302368164, -23.371417999267578, -22.33014678955078, -21.28887176513672, -20.24759864807129, -19.20632553100586, -18.16505241394043, -17.123779296875, -16.08250617980957, -15.041232109069824, -13.999958992004395, -12.958684921264648, -11.917411804199219, -10.876138687133789, -9.83486557006836, -8.79359245300293, -7.752318382263184, -6.711045265197754, -5.669772148132324, -4.628498554229736, -3.5872249603271484, -2.545949935913086, -1.5046765804290771, -0.46340322494506836, 0.5778701305389404, 1.6191434860229492, 2.660416603088379, 3.701690196990967, 4.742963790893555, 5.784236907958984, 6.825510025024414, 7.866783618927002, 8.90805721282959, 9.94933032989502, 10.99060344696045, 12.031877517700195, 13.073150634765625, 14.114423751831055, 15.155696868896484, 16.196969985961914, 17.238243103027344, 18.279518127441406, 19.320789337158203, 20.362064361572266, 21.403337478637695, 22.444610595703125, 23.485883712768555, 24.527156829833984, 25.568429946899414, 26.609703063964844, 27.650978088378906, 28.692251205444336, 29.733524322509766, 30.774797439575195]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 3.0, 9.0, 5.0, 4.0, 9.0, 9.0, 9.0, 6.0, 7.0, 19.0, 16.0, 22.0, 24.0, 29.0, 31.0, 31.0, 33.0, 33.0, 36.0, 37.0, 41.0, 45.0, 43.0, 43.0, 41.0, 40.0, 37.0, 43.0, 34.0, 36.0, 35.0, 28.0, 26.0, 20.0, 15.0, 21.0, 15.0, 18.0, 10.0, 9.0, 6.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-27.09512710571289, -26.266862869262695, -25.438600540161133, -24.610336303710938, -23.782072067260742, -22.953807830810547, -22.125545501708984, -21.29728126525879, -20.469017028808594, -19.6407527923584, -18.812490463256836, -17.98422622680664, -17.155961990356445, -16.32769775390625, -15.499435424804688, -14.671171188354492, -13.84290885925293, -13.01464557647705, -12.186381340026855, -11.358118057250977, -10.529853820800781, -9.701590538024902, -8.873327255249023, -8.045063018798828, -7.216799736022949, -6.388535976409912, -5.560272216796875, -4.732008934020996, -3.903745174407959, -3.075481414794922, -2.247218132019043, -1.4189543724060059, -0.5906925201416016, 0.237571120262146, 1.0658347606658936, 1.8940982818603516, 2.7223620414733887, 3.550625801086426, 4.378889083862305, 5.207152843475342, 6.035416603088379, 6.863680362701416, 7.691944122314453, 8.520207405090332, 9.348470687866211, 10.176734924316406, 11.004998207092285, 11.833261489868164, 12.66152572631836, 13.489789009094238, 14.318053245544434, 15.146316528320312, 15.974580764770508, 16.802845001220703, 17.631107330322266, 18.45937156677246, 19.287635803222656, 20.11590003967285, 20.944162368774414, 21.77242660522461, 22.600690841674805, 23.428955078125, 24.257217407226562, 25.085481643676758, 25.91374397277832]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 5.0, 8.0, 17.0, 21.0, 38.0, 67.0, 90.0, 106.0, 174.0, 261.0, 401.0, 574.0, 933.0, 1476.0, 2143.0, 3122.0, 4869.0, 7706.0, 11536.0, 17682.0, 26467.0, 39236.0, 57273.0, 78022.0, 101954.0, 119871.0, 126162.0, 117114.0, 97191.0, 74099.0, 52769.0, 36335.0, 24328.0, 16440.0, 10522.0, 6805.0, 4385.0, 2908.0, 1838.0, 1214.0, 808.0, 499.0, 346.0, 255.0, 157.0, 93.0, 82.0, 52.0, 41.0, 24.0, 18.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-24.65625, -23.844970703125, -23.03369140625, -22.222412109375, -21.4111328125, -20.599853515625, -19.78857421875, -18.977294921875, -18.166015625, -17.354736328125, -16.54345703125, -15.732177734375, -14.9208984375, -14.109619140625, -13.29833984375, -12.487060546875, -11.67578125, -10.864501953125, -10.05322265625, -9.241943359375, -8.4306640625, -7.619384765625, -6.80810546875, -5.996826171875, -5.185546875, -4.374267578125, -3.56298828125, -2.751708984375, -1.9404296875, -1.129150390625, -0.31787109375, 0.493408203125, 1.3046875, 2.115966796875, 2.92724609375, 3.738525390625, 4.5498046875, 5.361083984375, 6.17236328125, 6.983642578125, 7.794921875, 8.606201171875, 9.41748046875, 10.228759765625, 11.0400390625, 11.851318359375, 12.66259765625, 13.473876953125, 14.28515625, 15.096435546875, 15.90771484375, 16.718994140625, 17.5302734375, 18.341552734375, 19.15283203125, 19.964111328125, 20.775390625, 21.586669921875, 22.39794921875, 23.209228515625, 24.0205078125, 24.831787109375, 25.64306640625, 26.454345703125, 27.265625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 1.0, 7.0, 3.0, 9.0, 10.0, 11.0, 6.0, 10.0, 18.0, 20.0, 21.0, 17.0, 26.0, 31.0, 29.0, 36.0, 34.0, 32.0, 41.0, 43.0, 37.0, 38.0, 46.0, 49.0, 38.0, 40.0, 38.0, 46.0, 27.0, 33.0, 23.0, 24.0, 23.0, 16.0, 27.0, 10.0, 12.0, 16.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.53125, -25.72119140625, -24.9111328125, -24.10107421875, -23.291015625, -22.48095703125, -21.6708984375, -20.86083984375, -20.05078125, -19.24072265625, -18.4306640625, -17.62060546875, -16.810546875, -16.00048828125, -15.1904296875, -14.38037109375, -13.5703125, -12.76025390625, -11.9501953125, -11.14013671875, -10.330078125, -9.52001953125, -8.7099609375, -7.89990234375, -7.08984375, -6.27978515625, -5.4697265625, -4.65966796875, -3.849609375, -3.03955078125, -2.2294921875, -1.41943359375, -0.609375, 0.20068359375, 1.0107421875, 1.82080078125, 2.630859375, 3.44091796875, 4.2509765625, 5.06103515625, 5.87109375, 6.68115234375, 7.4912109375, 8.30126953125, 9.111328125, 9.92138671875, 10.7314453125, 11.54150390625, 12.3515625, 13.16162109375, 13.9716796875, 14.78173828125, 15.591796875, 16.40185546875, 17.2119140625, 18.02197265625, 18.83203125, 19.64208984375, 20.4521484375, 21.26220703125, 22.072265625, 22.88232421875, 23.6923828125, 24.50244140625, 25.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 7.0, 18.0, 29.0, 43.0, 78.0, 118.0, 165.0, 321.0, 520.0, 920.0, 1449.0, 2567.0, 4263.0, 7484.0, 12927.0, 22233.0, 37407.0, 61531.0, 94115.0, 131088.0, 156965.0, 154664.0, 127300.0, 89690.0, 57676.0, 35106.0, 20933.0, 11986.0, 7033.0, 4030.0, 2346.0, 1422.0, 811.0, 518.0, 324.0, 161.0, 115.0, 79.0, 42.0, 26.0, 14.0, 14.0, 5.0, 6.0, 2.0, 5.0, 3.0], "bins": [-35.4375, -34.50341796875, -33.5693359375, -32.63525390625, -31.701171875, -30.76708984375, -29.8330078125, -28.89892578125, -27.96484375, -27.03076171875, -26.0966796875, -25.16259765625, -24.228515625, -23.29443359375, -22.3603515625, -21.42626953125, -20.4921875, -19.55810546875, -18.6240234375, -17.68994140625, -16.755859375, -15.82177734375, -14.8876953125, -13.95361328125, -13.01953125, -12.08544921875, -11.1513671875, -10.21728515625, -9.283203125, -8.34912109375, -7.4150390625, -6.48095703125, -5.546875, -4.61279296875, -3.6787109375, -2.74462890625, -1.810546875, -0.87646484375, 0.0576171875, 0.99169921875, 1.92578125, 2.85986328125, 3.7939453125, 4.72802734375, 5.662109375, 6.59619140625, 7.5302734375, 8.46435546875, 9.3984375, 10.33251953125, 11.2666015625, 12.20068359375, 13.134765625, 14.06884765625, 15.0029296875, 15.93701171875, 16.87109375, 17.80517578125, 18.7392578125, 19.67333984375, 20.607421875, 21.54150390625, 22.4755859375, 23.40966796875, 24.34375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 2.0, 6.0, 8.0, 14.0, 9.0, 13.0, 11.0, 22.0, 16.0, 26.0, 32.0, 38.0, 38.0, 29.0, 33.0, 37.0, 54.0, 63.0, 52.0, 51.0, 43.0, 51.0, 33.0, 42.0, 43.0, 37.0, 22.0, 24.0, 29.0, 19.0, 19.0, 21.0, 11.0, 9.0, 11.0, 7.0, 4.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.335693359375, -19.74951171875, -19.163330078125, -18.5771484375, -17.990966796875, -17.40478515625, -16.818603515625, -16.232421875, -15.646240234375, -15.06005859375, -14.473876953125, -13.8876953125, -13.301513671875, -12.71533203125, -12.129150390625, -11.54296875, -10.956787109375, -10.37060546875, -9.784423828125, -9.1982421875, -8.612060546875, -8.02587890625, -7.439697265625, -6.853515625, -6.267333984375, -5.68115234375, -5.094970703125, -4.5087890625, -3.922607421875, -3.33642578125, -2.750244140625, -2.1640625, -1.577880859375, -0.99169921875, -0.405517578125, 0.1806640625, 0.766845703125, 1.35302734375, 1.939208984375, 2.525390625, 3.111572265625, 3.69775390625, 4.283935546875, 4.8701171875, 5.456298828125, 6.04248046875, 6.628662109375, 7.21484375, 7.801025390625, 8.38720703125, 8.973388671875, 9.5595703125, 10.145751953125, 10.73193359375, 11.318115234375, 11.904296875, 12.490478515625, 13.07666015625, 13.662841796875, 14.2490234375, 14.835205078125, 15.42138671875, 16.007568359375, 16.59375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 34.0, 30.0, 49.0, 52.0, 110.0, 143.0, 206.0, 283.0, 451.0, 665.0, 994.0, 1597.0, 2408.0, 3944.0, 6167.0, 10044.0, 16480.0, 27047.0, 44638.0, 70786.0, 108537.0, 147490.0, 166036.0, 147302.0, 107754.0, 70824.0, 44164.0, 26742.0, 16426.0, 9979.0, 6229.0, 3885.0, 2461.0, 1559.0, 1039.0, 639.0, 427.0, 285.0, 205.0, 128.0, 117.0, 48.0, 47.0, 31.0, 15.0, 13.0, 5.0, 10.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.43994140625, -16.8486328125, -16.25732421875, -15.666015625, -15.07470703125, -14.4833984375, -13.89208984375, -13.30078125, -12.70947265625, -12.1181640625, -11.52685546875, -10.935546875, -10.34423828125, -9.7529296875, -9.16162109375, -8.5703125, -7.97900390625, -7.3876953125, -6.79638671875, -6.205078125, -5.61376953125, -5.0224609375, -4.43115234375, -3.83984375, -3.24853515625, -2.6572265625, -2.06591796875, -1.474609375, -0.88330078125, -0.2919921875, 0.29931640625, 0.890625, 1.48193359375, 2.0732421875, 2.66455078125, 3.255859375, 3.84716796875, 4.4384765625, 5.02978515625, 5.62109375, 6.21240234375, 6.8037109375, 7.39501953125, 7.986328125, 8.57763671875, 9.1689453125, 9.76025390625, 10.3515625, 10.94287109375, 11.5341796875, 12.12548828125, 12.716796875, 13.30810546875, 13.8994140625, 14.49072265625, 15.08203125, 15.67333984375, 16.2646484375, 16.85595703125, 17.447265625, 18.03857421875, 18.6298828125, 19.22119140625, 19.8125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 5.0, 9.0, 12.0, 15.0, 16.0, 26.0, 28.0, 29.0, 34.0, 46.0, 47.0, 48.0, 60.0, 54.0, 55.0, 74.0, 69.0, 53.0, 41.0, 47.0, 42.0, 26.0, 20.0, 30.0, 19.0, 20.0, 11.0, 11.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001750946044921875, -0.0016855597496032715, -0.001620173454284668, -0.0015547871589660645, -0.001489400863647461, -0.0014240145683288574, -0.001358628273010254, -0.0012932419776916504, -0.0012278556823730469, -0.0011624693870544434, -0.0010970830917358398, -0.0010316967964172363, -0.0009663105010986328, -0.0009009242057800293, -0.0008355379104614258, -0.0007701516151428223, -0.0007047653198242188, -0.0006393790245056152, -0.0005739927291870117, -0.0005086064338684082, -0.0004432201385498047, -0.00037783384323120117, -0.00031244754791259766, -0.00024706125259399414, -0.00018167495727539062, -0.00011628866195678711, -5.0902366638183594e-05, 1.4483928680419922e-05, 7.987022399902344e-05, 0.00014525651931762695, 0.00021064281463623047, 0.000276029109954834, 0.0003414154052734375, 0.000406801700592041, 0.00047218799591064453, 0.000537574291229248, 0.0006029605865478516, 0.0006683468818664551, 0.0007337331771850586, 0.0007991194725036621, 0.0008645057678222656, 0.0009298920631408691, 0.0009952783584594727, 0.0010606646537780762, 0.0011260509490966797, 0.0011914372444152832, 0.0012568235397338867, 0.0013222098350524902, 0.0013875961303710938, 0.0014529824256896973, 0.0015183687210083008, 0.0015837550163269043, 0.0016491413116455078, 0.0017145276069641113, 0.0017799139022827148, 0.0018453001976013184, 0.0019106864929199219, 0.0019760727882385254, 0.002041459083557129, 0.0021068453788757324, 0.002172231674194336, 0.0022376179695129395, 0.002303004264831543, 0.0023683905601501465, 0.00243377685546875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 15.0, 16.0, 12.0, 26.0, 31.0, 53.0, 72.0, 103.0, 183.0, 242.0, 365.0, 590.0, 1011.0, 1546.0, 2629.0, 4405.0, 7418.0, 12127.0, 21011.0, 35351.0, 57625.0, 89821.0, 128291.0, 157968.0, 159453.0, 130251.0, 91224.0, 58536.0, 35638.0, 21352.0, 12477.0, 7357.0, 4421.0, 2571.0, 1614.0, 1011.0, 634.0, 384.0, 248.0, 156.0, 112.0, 64.0, 59.0, 23.0, 24.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.438720703125, -15.90869140625, -15.378662109375, -14.8486328125, -14.318603515625, -13.78857421875, -13.258544921875, -12.728515625, -12.198486328125, -11.66845703125, -11.138427734375, -10.6083984375, -10.078369140625, -9.54833984375, -9.018310546875, -8.48828125, -7.958251953125, -7.42822265625, -6.898193359375, -6.3681640625, -5.838134765625, -5.30810546875, -4.778076171875, -4.248046875, -3.718017578125, -3.18798828125, -2.657958984375, -2.1279296875, -1.597900390625, -1.06787109375, -0.537841796875, -0.0078125, 0.522216796875, 1.05224609375, 1.582275390625, 2.1123046875, 2.642333984375, 3.17236328125, 3.702392578125, 4.232421875, 4.762451171875, 5.29248046875, 5.822509765625, 6.3525390625, 6.882568359375, 7.41259765625, 7.942626953125, 8.47265625, 9.002685546875, 9.53271484375, 10.062744140625, 10.5927734375, 11.122802734375, 11.65283203125, 12.182861328125, 12.712890625, 13.242919921875, 13.77294921875, 14.302978515625, 14.8330078125, 15.363037109375, 15.89306640625, 16.423095703125, 16.953125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 9.0, 13.0, 14.0, 16.0, 17.0, 14.0, 35.0, 28.0, 27.0, 35.0, 49.0, 33.0, 59.0, 47.0, 58.0, 66.0, 41.0, 45.0, 47.0, 33.0, 34.0, 35.0, 35.0, 28.0, 19.0, 27.0, 20.0, 15.0, 14.0, 8.0, 7.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.890625, -5.71954345703125, -5.5484619140625, -5.37738037109375, -5.206298828125, -5.03521728515625, -4.8641357421875, -4.69305419921875, -4.52197265625, -4.35089111328125, -4.1798095703125, -4.00872802734375, -3.837646484375, -3.66656494140625, -3.4954833984375, -3.32440185546875, -3.1533203125, -2.98223876953125, -2.8111572265625, -2.64007568359375, -2.468994140625, -2.29791259765625, -2.1268310546875, -1.95574951171875, -1.78466796875, -1.61358642578125, -1.4425048828125, -1.27142333984375, -1.100341796875, -0.92926025390625, -0.7581787109375, -0.58709716796875, -0.416015625, -0.24493408203125, -0.0738525390625, 0.09722900390625, 0.268310546875, 0.43939208984375, 0.6104736328125, 0.78155517578125, 0.95263671875, 1.12371826171875, 1.2947998046875, 1.46588134765625, 1.636962890625, 1.80804443359375, 1.9791259765625, 2.15020751953125, 2.3212890625, 2.49237060546875, 2.6634521484375, 2.83453369140625, 3.005615234375, 3.17669677734375, 3.3477783203125, 3.51885986328125, 3.68994140625, 3.86102294921875, 4.0321044921875, 4.20318603515625, 4.374267578125, 4.54534912109375, 4.7164306640625, 4.88751220703125, 5.05859375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 5.0, 7.0, 10.0, 12.0, 16.0, 25.0, 22.0, 29.0, 26.0, 41.0, 55.0, 45.0, 60.0, 39.0, 67.0, 62.0, 71.0, 53.0, 51.0, 40.0, 38.0, 54.0, 22.0, 25.0, 24.0, 17.0, 11.0, 13.0, 12.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-38.23472595214844, -37.09128952026367, -35.94785690307617, -34.804420471191406, -33.66098403930664, -32.51755142211914, -31.374114990234375, -30.230680465698242, -29.08724594116211, -27.943811416625977, -26.80037498474121, -25.656940460205078, -24.513505935668945, -23.370071411132812, -22.226634979248047, -21.083200454711914, -19.93976402282715, -18.796329498291016, -17.65289306640625, -16.509458541870117, -15.366024017333984, -14.222588539123535, -13.079153060913086, -11.935718536376953, -10.792283058166504, -9.648847579956055, -8.505413055419922, -7.361977577209473, -6.218542575836182, -5.075107574462891, -3.9316720962524414, -2.7882375717163086, -1.6448020935058594, -0.5013669729232788, 0.6420681476593018, 1.7855033874511719, 2.928938388824463, 4.072373390197754, 5.215808868408203, 6.359243392944336, 7.502678871154785, 8.646114349365234, 9.789548873901367, 10.932984352111816, 12.076419830322266, 13.219854354858398, 14.363289833068848, 15.50672435760498, 16.65015983581543, 17.793594360351562, 18.937030792236328, 20.08046531677246, 21.223899841308594, 22.36733627319336, 23.510770797729492, 24.654205322265625, 25.79764175415039, 26.941076278686523, 28.08451271057129, 29.227947235107422, 30.371381759643555, 31.514816284179688, 32.65825271606445, 33.80168914794922, 34.94512176513672]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 9.0, 10.0, 13.0, 9.0, 9.0, 15.0, 16.0, 14.0, 22.0, 22.0, 26.0, 28.0, 35.0, 32.0, 33.0, 31.0, 37.0, 46.0, 40.0, 31.0, 32.0, 50.0, 51.0, 41.0, 35.0, 32.0, 36.0, 35.0, 31.0, 21.0, 20.0, 27.0, 17.0, 21.0, 10.0, 13.0, 7.0, 4.0, 9.0, 6.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.145259857177734, -25.346248626708984, -24.547239303588867, -23.748228073120117, -22.94921875, -22.15020751953125, -21.3511962890625, -20.552186965942383, -19.753177642822266, -18.954166412353516, -18.1551570892334, -17.35614585876465, -16.55713653564453, -15.758125305175781, -14.959115028381348, -14.160104751586914, -13.361093521118164, -12.56208324432373, -11.763072967529297, -10.964061737060547, -10.16505241394043, -9.36604118347168, -8.567030906677246, -7.7680206298828125, -6.969010353088379, -6.170000076293945, -5.370989799499512, -4.57197904586792, -3.7729687690734863, -2.9739584922790527, -2.174947738647461, -1.3759374618530273, -0.5769290924072266, 0.22208130359649658, 1.0210916996002197, 1.8201022148132324, 2.619112491607666, 3.4181227684020996, 4.217133522033691, 5.016143798828125, 5.815154075622559, 6.614164352416992, 7.413174629211426, 8.21218490600586, 9.01119613647461, 9.810205459594727, 10.609216690063477, 11.40822696685791, 12.207237243652344, 13.006247520446777, 13.805257797241211, 14.604269027709961, 15.403278350830078, 16.202289581298828, 17.001300811767578, 17.800310134887695, 18.599319458007812, 19.398330688476562, 20.19734001159668, 20.99635124206543, 21.795360565185547, 22.594371795654297, 23.393383026123047, 24.192392349243164, 24.991403579711914]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 12.0, 14.0, 23.0, 31.0, 58.0, 107.0, 147.0, 231.0, 387.0, 638.0, 1073.0, 1740.0, 2824.0, 4738.0, 8422.0, 14605.0, 26498.0, 48500.0, 94013.0, 186193.0, 373862.0, 682533.0, 926404.0, 808754.0, 489696.0, 250258.0, 126039.0, 65270.0, 35146.0, 19319.0, 10936.0, 6399.0, 3828.0, 2213.0, 1330.0, 804.0, 462.0, 298.0, 195.0, 117.0, 79.0, 31.0, 22.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.625, -27.75, -26.875, -26.0, -25.125, -24.25, -23.375, -22.5, -21.625, -20.75, -19.875, -19.0, -18.125, -17.25, -16.375, -15.5, -14.625, -13.75, -12.875, -12.0, -11.125, -10.25, -9.375, -8.5, -7.625, -6.75, -5.875, -5.0, -4.125, -3.25, -2.375, -1.5, -0.625, 0.25, 1.125, 2.0, 2.875, 3.75, 4.625, 5.5, 6.375, 7.25, 8.125, 9.0, 9.875, 10.75, 11.625, 12.5, 13.375, 14.25, 15.125, 16.0, 16.875, 17.75, 18.625, 19.5, 20.375, 21.25, 22.125, 23.0, 23.875, 24.75, 25.625, 26.5, 27.375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 5.0, 11.0, 9.0, 7.0, 20.0, 17.0, 15.0, 22.0, 23.0, 31.0, 27.0, 35.0, 46.0, 21.0, 38.0, 54.0, 36.0, 44.0, 42.0, 46.0, 46.0, 42.0, 32.0, 37.0, 34.0, 36.0, 28.0, 32.0, 21.0, 24.0, 14.0, 18.0, 16.0, 3.0, 10.0, 8.0, 13.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.459228515625, -18.87158203125, -18.283935546875, -17.6962890625, -17.108642578125, -16.52099609375, -15.933349609375, -15.345703125, -14.758056640625, -14.17041015625, -13.582763671875, -12.9951171875, -12.407470703125, -11.81982421875, -11.232177734375, -10.64453125, -10.056884765625, -9.46923828125, -8.881591796875, -8.2939453125, -7.706298828125, -7.11865234375, -6.531005859375, -5.943359375, -5.355712890625, -4.76806640625, -4.180419921875, -3.5927734375, -3.005126953125, -2.41748046875, -1.829833984375, -1.2421875, -0.654541015625, -0.06689453125, 0.520751953125, 1.1083984375, 1.696044921875, 2.28369140625, 2.871337890625, 3.458984375, 4.046630859375, 4.63427734375, 5.221923828125, 5.8095703125, 6.397216796875, 6.98486328125, 7.572509765625, 8.16015625, 8.747802734375, 9.33544921875, 9.923095703125, 10.5107421875, 11.098388671875, 11.68603515625, 12.273681640625, 12.861328125, 13.448974609375, 14.03662109375, 14.624267578125, 15.2119140625, 15.799560546875, 16.38720703125, 16.974853515625, 17.5625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 9.0, 15.0, 14.0, 30.0, 44.0, 68.0, 104.0, 136.0, 227.0, 380.0, 603.0, 928.0, 1490.0, 2511.0, 3920.0, 6602.0, 10990.0, 18038.0, 30446.0, 51085.0, 86409.0, 146994.0, 247335.0, 402288.0, 596026.0, 731272.0, 660557.0, 467094.0, 294986.0, 177286.0, 104770.0, 61044.0, 36241.0, 21470.0, 12802.0, 7831.0, 4640.0, 2825.0, 1767.0, 1088.0, 678.0, 450.0, 279.0, 177.0, 115.0, 81.0, 52.0, 32.0, 18.0, 15.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.5, -22.758056640625, -22.01611328125, -21.274169921875, -20.5322265625, -19.790283203125, -19.04833984375, -18.306396484375, -17.564453125, -16.822509765625, -16.08056640625, -15.338623046875, -14.5966796875, -13.854736328125, -13.11279296875, -12.370849609375, -11.62890625, -10.886962890625, -10.14501953125, -9.403076171875, -8.6611328125, -7.919189453125, -7.17724609375, -6.435302734375, -5.693359375, -4.951416015625, -4.20947265625, -3.467529296875, -2.7255859375, -1.983642578125, -1.24169921875, -0.499755859375, 0.2421875, 0.984130859375, 1.72607421875, 2.468017578125, 3.2099609375, 3.951904296875, 4.69384765625, 5.435791015625, 6.177734375, 6.919677734375, 7.66162109375, 8.403564453125, 9.1455078125, 9.887451171875, 10.62939453125, 11.371337890625, 12.11328125, 12.855224609375, 13.59716796875, 14.339111328125, 15.0810546875, 15.822998046875, 16.56494140625, 17.306884765625, 18.048828125, 18.790771484375, 19.53271484375, 20.274658203125, 21.0166015625, 21.758544921875, 22.50048828125, 23.242431640625, 23.984375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 6.0, 10.0, 15.0, 25.0, 34.0, 23.0, 37.0, 50.0, 50.0, 72.0, 83.0, 103.0, 100.0, 138.0, 155.0, 168.0, 192.0, 187.0, 223.0, 244.0, 222.0, 236.0, 248.0, 192.0, 173.0, 177.0, 143.0, 143.0, 126.0, 91.0, 75.0, 77.0, 55.0, 25.0, 33.0, 22.0, 24.0, 16.0, 7.0, 13.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-9.28125, -9.0115966796875, -8.741943359375, -8.4722900390625, -8.20263671875, -7.9329833984375, -7.663330078125, -7.3936767578125, -7.1240234375, -6.8543701171875, -6.584716796875, -6.3150634765625, -6.04541015625, -5.7757568359375, -5.506103515625, -5.2364501953125, -4.966796875, -4.6971435546875, -4.427490234375, -4.1578369140625, -3.88818359375, -3.6185302734375, -3.348876953125, -3.0792236328125, -2.8095703125, -2.5399169921875, -2.270263671875, -2.0006103515625, -1.73095703125, -1.4613037109375, -1.191650390625, -0.9219970703125, -0.65234375, -0.3826904296875, -0.113037109375, 0.1566162109375, 0.42626953125, 0.6959228515625, 0.965576171875, 1.2352294921875, 1.5048828125, 1.7745361328125, 2.044189453125, 2.3138427734375, 2.58349609375, 2.8531494140625, 3.122802734375, 3.3924560546875, 3.662109375, 3.9317626953125, 4.201416015625, 4.4710693359375, 4.74072265625, 5.0103759765625, 5.280029296875, 5.5496826171875, 5.8193359375, 6.0889892578125, 6.358642578125, 6.6282958984375, 6.89794921875, 7.1676025390625, 7.437255859375, 7.7069091796875, 7.9765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 15.0, 8.0, 18.0, 29.0, 36.0, 49.0, 45.0, 39.0, 47.0, 50.0, 55.0, 56.0, 61.0, 57.0, 44.0, 60.0, 50.0, 47.0, 36.0, 37.0, 20.0, 19.0, 14.0, 16.0, 13.0, 16.0, 7.0, 5.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-40.7682991027832, -39.72697448730469, -38.685646057128906, -37.644317626953125, -36.60299301147461, -35.561668395996094, -34.52033996582031, -33.47901153564453, -32.437686920166016, -31.396360397338867, -30.35503387451172, -29.31370735168457, -28.272380828857422, -27.231054306030273, -26.189727783203125, -25.148401260375977, -24.107074737548828, -23.06574821472168, -22.02442169189453, -20.983095169067383, -19.941768646240234, -18.900442123413086, -17.859115600585938, -16.81778907775879, -15.77646255493164, -14.735136032104492, -13.693809509277344, -12.652482986450195, -11.611156463623047, -10.569829940795898, -9.52850341796875, -8.487176895141602, -7.445850372314453, -6.404523849487305, -5.363197326660156, -4.321870803833008, -3.2805442810058594, -2.239217758178711, -1.1978912353515625, -0.15656471252441406, 0.8847618103027344, 1.9260883331298828, 2.9674148559570312, 4.00874137878418, 5.050067901611328, 6.091394424438477, 7.132720947265625, 8.174047470092773, 9.215373992919922, 10.25670051574707, 11.298027038574219, 12.339353561401367, 13.380680084228516, 14.422006607055664, 15.463333129882812, 16.50465965270996, 17.54598617553711, 18.587312698364258, 19.628639221191406, 20.669965744018555, 21.711292266845703, 22.75261878967285, 23.7939453125, 24.83527183532715, 25.876598358154297]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 12.0, 13.0, 10.0, 14.0, 14.0, 27.0, 23.0, 28.0, 29.0, 36.0, 43.0, 40.0, 35.0, 30.0, 48.0, 51.0, 41.0, 53.0, 55.0, 44.0, 48.0, 31.0, 30.0, 28.0, 29.0, 23.0, 28.0, 19.0, 24.0, 16.0, 13.0, 12.0, 5.0, 3.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.79245376586914, -22.08443832397461, -21.376422882080078, -20.668407440185547, -19.960390090942383, -19.25237464904785, -18.54435920715332, -17.83634376525879, -17.128328323364258, -16.420312881469727, -15.712296485900879, -15.004281044006348, -14.296265602111816, -13.588249206542969, -12.880233764648438, -12.172218322753906, -11.464201927185059, -10.756186485290527, -10.04817008972168, -9.340154647827148, -8.632139205932617, -7.924123287200928, -7.216107368469238, -6.508091926574707, -5.800076007843018, -5.092060089111328, -4.384044647216797, -3.6760287284851074, -2.968013048171997, -2.2599973678588867, -1.5519814491271973, -0.843966007232666, -0.13595008850097656, 0.5720656514167786, 1.2800813913345337, 1.9880971908569336, 2.696112871170044, 3.4041285514831543, 4.112144470214844, 4.820159912109375, 5.5281758308410645, 6.236191749572754, 6.944207191467285, 7.652223110198975, 8.360239028930664, 9.068254470825195, 9.776269912719727, 10.484285354614258, 11.192301750183105, 11.900317192077637, 12.608333587646484, 13.316349029541016, 14.024364471435547, 14.732379913330078, 15.440396308898926, 16.14841079711914, 16.856428146362305, 17.564443588256836, 18.272459030151367, 18.98047637939453, 19.688491821289062, 20.396507263183594, 21.104522705078125, 21.812538146972656, 22.520553588867188]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 7.0, 8.0, 5.0, 7.0, 9.0, 13.0, 29.0, 39.0, 43.0, 74.0, 111.0, 125.0, 165.0, 267.0, 374.0, 527.0, 760.0, 986.0, 1625.0, 2445.0, 4167.0, 7625.0, 15984.0, 36079.0, 87204.0, 191308.0, 285082.0, 220314.0, 106811.0, 44708.0, 19355.0, 9197.0, 4706.0, 2690.0, 1802.0, 1175.0, 781.0, 548.0, 411.0, 298.0, 218.0, 131.0, 85.0, 74.0, 56.0, 36.0, 28.0, 20.0, 13.0, 12.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40625, -40.00830078125, -38.6103515625, -37.21240234375, -35.814453125, -34.41650390625, -33.0185546875, -31.62060546875, -30.22265625, -28.82470703125, -27.4267578125, -26.02880859375, -24.630859375, -23.23291015625, -21.8349609375, -20.43701171875, -19.0390625, -17.64111328125, -16.2431640625, -14.84521484375, -13.447265625, -12.04931640625, -10.6513671875, -9.25341796875, -7.85546875, -6.45751953125, -5.0595703125, -3.66162109375, -2.263671875, -0.86572265625, 0.5322265625, 1.93017578125, 3.328125, 4.72607421875, 6.1240234375, 7.52197265625, 8.919921875, 10.31787109375, 11.7158203125, 13.11376953125, 14.51171875, 15.90966796875, 17.3076171875, 18.70556640625, 20.103515625, 21.50146484375, 22.8994140625, 24.29736328125, 25.6953125, 27.09326171875, 28.4912109375, 29.88916015625, 31.287109375, 32.68505859375, 34.0830078125, 35.48095703125, 36.87890625, 38.27685546875, 39.6748046875, 41.07275390625, 42.470703125, 43.86865234375, 45.2666015625, 46.66455078125, 48.0625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 2.0, 5.0, 9.0, 13.0, 14.0, 8.0, 13.0, 13.0, 15.0, 18.0, 33.0, 18.0, 26.0, 32.0, 38.0, 38.0, 41.0, 54.0, 34.0, 38.0, 42.0, 49.0, 48.0, 44.0, 31.0, 42.0, 31.0, 32.0, 33.0, 28.0, 24.0, 22.0, 19.0, 18.0, 9.0, 8.0, 7.0, 14.0, 11.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.234375, -20.55615234375, -19.8779296875, -19.19970703125, -18.521484375, -17.84326171875, -17.1650390625, -16.48681640625, -15.80859375, -15.13037109375, -14.4521484375, -13.77392578125, -13.095703125, -12.41748046875, -11.7392578125, -11.06103515625, -10.3828125, -9.70458984375, -9.0263671875, -8.34814453125, -7.669921875, -6.99169921875, -6.3134765625, -5.63525390625, -4.95703125, -4.27880859375, -3.6005859375, -2.92236328125, -2.244140625, -1.56591796875, -0.8876953125, -0.20947265625, 0.46875, 1.14697265625, 1.8251953125, 2.50341796875, 3.181640625, 3.85986328125, 4.5380859375, 5.21630859375, 5.89453125, 6.57275390625, 7.2509765625, 7.92919921875, 8.607421875, 9.28564453125, 9.9638671875, 10.64208984375, 11.3203125, 11.99853515625, 12.6767578125, 13.35498046875, 14.033203125, 14.71142578125, 15.3896484375, 16.06787109375, 16.74609375, 17.42431640625, 18.1025390625, 18.78076171875, 19.458984375, 20.13720703125, 20.8154296875, 21.49365234375, 22.171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 8.0, 10.0, 27.0, 31.0, 39.0, 62.0, 70.0, 109.0, 177.0, 237.0, 334.0, 482.0, 691.0, 1078.0, 1587.0, 2517.0, 3916.0, 6572.0, 12241.0, 24950.0, 57287.0, 142684.0, 302616.0, 273765.0, 120022.0, 48105.0, 21764.0, 10714.0, 6037.0, 3517.0, 2268.0, 1478.0, 1027.0, 632.0, 449.0, 293.0, 199.0, 175.0, 119.0, 75.0, 51.0, 35.0, 24.0, 20.0, 12.0, 20.0, 9.0, 1.0, 2.0, 3.0, 5.0, 4.0], "bins": [-54.65625, -53.09033203125, -51.5244140625, -49.95849609375, -48.392578125, -46.82666015625, -45.2607421875, -43.69482421875, -42.12890625, -40.56298828125, -38.9970703125, -37.43115234375, -35.865234375, -34.29931640625, -32.7333984375, -31.16748046875, -29.6015625, -28.03564453125, -26.4697265625, -24.90380859375, -23.337890625, -21.77197265625, -20.2060546875, -18.64013671875, -17.07421875, -15.50830078125, -13.9423828125, -12.37646484375, -10.810546875, -9.24462890625, -7.6787109375, -6.11279296875, -4.546875, -2.98095703125, -1.4150390625, 0.15087890625, 1.716796875, 3.28271484375, 4.8486328125, 6.41455078125, 7.98046875, 9.54638671875, 11.1123046875, 12.67822265625, 14.244140625, 15.81005859375, 17.3759765625, 18.94189453125, 20.5078125, 22.07373046875, 23.6396484375, 25.20556640625, 26.771484375, 28.33740234375, 29.9033203125, 31.46923828125, 33.03515625, 34.60107421875, 36.1669921875, 37.73291015625, 39.298828125, 40.86474609375, 42.4306640625, 43.99658203125, 45.5625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 6.0, 9.0, 14.0, 13.0, 17.0, 18.0, 22.0, 22.0, 31.0, 25.0, 29.0, 29.0, 28.0, 29.0, 32.0, 45.0, 56.0, 39.0, 34.0, 32.0, 36.0, 31.0, 32.0, 34.0, 32.0, 29.0, 30.0, 25.0, 31.0, 19.0, 23.0, 14.0, 21.0, 8.0, 17.0, 12.0, 13.0, 11.0, 5.0, 6.0, 7.0, 10.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-13.0546875, -12.6796875, -12.3046875, -11.9296875, -11.5546875, -11.1796875, -10.8046875, -10.4296875, -10.0546875, -9.6796875, -9.3046875, -8.9296875, -8.5546875, -8.1796875, -7.8046875, -7.4296875, -7.0546875, -6.6796875, -6.3046875, -5.9296875, -5.5546875, -5.1796875, -4.8046875, -4.4296875, -4.0546875, -3.6796875, -3.3046875, -2.9296875, -2.5546875, -2.1796875, -1.8046875, -1.4296875, -1.0546875, -0.6796875, -0.3046875, 0.0703125, 0.4453125, 0.8203125, 1.1953125, 1.5703125, 1.9453125, 2.3203125, 2.6953125, 3.0703125, 3.4453125, 3.8203125, 4.1953125, 4.5703125, 4.9453125, 5.3203125, 5.6953125, 6.0703125, 6.4453125, 6.8203125, 7.1953125, 7.5703125, 7.9453125, 8.3203125, 8.6953125, 9.0703125, 9.4453125, 9.8203125, 10.1953125, 10.5703125, 10.9453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 16.0, 31.0, 24.0, 39.0, 58.0, 78.0, 143.0, 205.0, 321.0, 432.0, 703.0, 1107.0, 1953.0, 3103.0, 5573.0, 9653.0, 17853.0, 34847.0, 70834.0, 149651.0, 262940.0, 238722.0, 125613.0, 59927.0, 29275.0, 15252.0, 8330.0, 4726.0, 2689.0, 1609.0, 1030.0, 634.0, 396.0, 252.0, 157.0, 105.0, 85.0, 48.0, 38.0, 22.0, 20.0, 13.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.0625, -20.421875, -19.78125, -19.140625, -18.5, -17.859375, -17.21875, -16.578125, -15.9375, -15.296875, -14.65625, -14.015625, -13.375, -12.734375, -12.09375, -11.453125, -10.8125, -10.171875, -9.53125, -8.890625, -8.25, -7.609375, -6.96875, -6.328125, -5.6875, -5.046875, -4.40625, -3.765625, -3.125, -2.484375, -1.84375, -1.203125, -0.5625, 0.078125, 0.71875, 1.359375, 2.0, 2.640625, 3.28125, 3.921875, 4.5625, 5.203125, 5.84375, 6.484375, 7.125, 7.765625, 8.40625, 9.046875, 9.6875, 10.328125, 10.96875, 11.609375, 12.25, 12.890625, 13.53125, 14.171875, 14.8125, 15.453125, 16.09375, 16.734375, 17.375, 18.015625, 18.65625, 19.296875, 19.9375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 16.0, 25.0, 50.0, 57.0, 82.0, 112.0, 121.0, 109.0, 125.0, 70.0, 52.0, 37.0, 32.0, 21.0, 10.0, 7.0, 9.0, 7.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0014095306396484375, -0.0013667196035385132, -0.0013239085674285889, -0.0012810975313186646, -0.0012382864952087402, -0.001195475459098816, -0.0011526644229888916, -0.0011098533868789673, -0.001067042350769043, -0.0010242313146591187, -0.0009814202785491943, -0.00093860924243927, -0.0008957982063293457, -0.0008529871702194214, -0.0008101761341094971, -0.0007673650979995728, -0.0007245540618896484, -0.0006817430257797241, -0.0006389319896697998, -0.0005961209535598755, -0.0005533099174499512, -0.0005104988813400269, -0.00046768784523010254, -0.0004248768091201782, -0.0003820657730102539, -0.0003392547369003296, -0.0002964437007904053, -0.00025363266468048096, -0.00021082162857055664, -0.00016801059246063232, -0.000125199556350708, -8.238852024078369e-05, -3.9577484130859375e-05, 3.2335519790649414e-06, 4.604458808898926e-05, 8.885562419891357e-05, 0.0001316666603088379, 0.0001744776964187622, 0.00021728873252868652, 0.00026009976863861084, 0.00030291080474853516, 0.00034572184085845947, 0.0003885328769683838, 0.0004313439130783081, 0.0004741549491882324, 0.0005169659852981567, 0.0005597770214080811, 0.0006025880575180054, 0.0006453990936279297, 0.000688210129737854, 0.0007310211658477783, 0.0007738322019577026, 0.000816643238067627, 0.0008594542741775513, 0.0009022653102874756, 0.0009450763463973999, 0.0009878873825073242, 0.0010306984186172485, 0.0010735094547271729, 0.0011163204908370972, 0.0011591315269470215, 0.0012019425630569458, 0.0012447535991668701, 0.0012875646352767944, 0.0013303756713867188]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 13.0, 26.0, 21.0, 34.0, 60.0, 65.0, 121.0, 189.0, 244.0, 377.0, 521.0, 862.0, 1385.0, 2165.0, 3383.0, 5693.0, 9110.0, 15594.0, 26905.0, 46359.0, 79305.0, 128325.0, 176929.0, 184791.0, 143344.0, 91472.0, 53960.0, 31248.0, 18001.0, 10778.0, 6510.0, 3864.0, 2398.0, 1493.0, 1010.0, 623.0, 438.0, 314.0, 199.0, 132.0, 86.0, 57.0, 35.0, 37.0, 16.0, 12.0, 15.0, 9.0, 7.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0], "bins": [-14.3984375, -13.950439453125, -13.50244140625, -13.054443359375, -12.6064453125, -12.158447265625, -11.71044921875, -11.262451171875, -10.814453125, -10.366455078125, -9.91845703125, -9.470458984375, -9.0224609375, -8.574462890625, -8.12646484375, -7.678466796875, -7.23046875, -6.782470703125, -6.33447265625, -5.886474609375, -5.4384765625, -4.990478515625, -4.54248046875, -4.094482421875, -3.646484375, -3.198486328125, -2.75048828125, -2.302490234375, -1.8544921875, -1.406494140625, -0.95849609375, -0.510498046875, -0.0625, 0.385498046875, 0.83349609375, 1.281494140625, 1.7294921875, 2.177490234375, 2.62548828125, 3.073486328125, 3.521484375, 3.969482421875, 4.41748046875, 4.865478515625, 5.3134765625, 5.761474609375, 6.20947265625, 6.657470703125, 7.10546875, 7.553466796875, 8.00146484375, 8.449462890625, 8.8974609375, 9.345458984375, 9.79345703125, 10.241455078125, 10.689453125, 11.137451171875, 11.58544921875, 12.033447265625, 12.4814453125, 12.929443359375, 13.37744140625, 13.825439453125, 14.2734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 8.0, 11.0, 11.0, 15.0, 24.0, 26.0, 26.0, 31.0, 42.0, 41.0, 56.0, 57.0, 66.0, 64.0, 64.0, 56.0, 49.0, 52.0, 44.0, 46.0, 35.0, 26.0, 26.0, 20.0, 18.0, 8.0, 12.0, 7.0, 2.0, 5.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.06640625, -4.90667724609375, -4.7469482421875, -4.58721923828125, -4.427490234375, -4.26776123046875, -4.1080322265625, -3.94830322265625, -3.78857421875, -3.62884521484375, -3.4691162109375, -3.30938720703125, -3.149658203125, -2.98992919921875, -2.8302001953125, -2.67047119140625, -2.5107421875, -2.35101318359375, -2.1912841796875, -2.03155517578125, -1.871826171875, -1.71209716796875, -1.5523681640625, -1.39263916015625, -1.23291015625, -1.07318115234375, -0.9134521484375, -0.75372314453125, -0.593994140625, -0.43426513671875, -0.2745361328125, -0.11480712890625, 0.044921875, 0.20465087890625, 0.3643798828125, 0.52410888671875, 0.683837890625, 0.84356689453125, 1.0032958984375, 1.16302490234375, 1.32275390625, 1.48248291015625, 1.6422119140625, 1.80194091796875, 1.961669921875, 2.12139892578125, 2.2811279296875, 2.44085693359375, 2.6005859375, 2.76031494140625, 2.9200439453125, 3.07977294921875, 3.239501953125, 3.39923095703125, 3.5589599609375, 3.71868896484375, 3.87841796875, 4.03814697265625, 4.1978759765625, 4.35760498046875, 4.517333984375, 4.67706298828125, 4.8367919921875, 4.99652099609375, 5.15625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 5.0, 8.0, 15.0, 15.0, 20.0, 29.0, 28.0, 37.0, 37.0, 50.0, 45.0, 53.0, 65.0, 50.0, 47.0, 53.0, 52.0, 52.0, 51.0, 34.0, 33.0, 40.0, 23.0, 25.0, 17.0, 14.0, 22.0, 16.0, 8.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-33.87684631347656, -32.922794342041016, -31.96874237060547, -31.014690399169922, -30.060638427734375, -29.106586456298828, -28.152536392211914, -27.198484420776367, -26.24443244934082, -25.290380477905273, -24.336328506469727, -23.38227653503418, -22.428226470947266, -21.47417449951172, -20.520122528076172, -19.566070556640625, -18.612018585205078, -17.65796661376953, -16.703914642333984, -15.749863624572754, -14.795811653137207, -13.84175968170166, -12.88770866394043, -11.933656692504883, -10.979604721069336, -10.025552749633789, -9.071500778198242, -8.117449760437012, -7.163397789001465, -6.209345817565918, -5.255294322967529, -4.301242828369141, -3.347188949584961, -2.393137216567993, -1.4390854835510254, -0.4850337505340576, 0.46901798248291016, 1.423069953918457, 2.3771214485168457, 3.3311729431152344, 4.285224914550781, 5.239276885986328, 6.193328380584717, 7.1473798751831055, 8.101431846618652, 9.0554838180542, 10.00953483581543, 10.963586807250977, 11.917638778686523, 12.87169075012207, 13.825742721557617, 14.779793739318848, 15.733845710754395, 16.687896728515625, 17.641948699951172, 18.59600067138672, 19.550052642822266, 20.504104614257812, 21.45815658569336, 22.412208557128906, 23.366260528564453, 24.3203125, 25.274362564086914, 26.22841453552246, 27.182466506958008]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 3.0, 5.0, 9.0, 10.0, 10.0, 16.0, 15.0, 10.0, 21.0, 24.0, 19.0, 35.0, 26.0, 35.0, 45.0, 42.0, 38.0, 40.0, 48.0, 50.0, 48.0, 50.0, 47.0, 47.0, 36.0, 34.0, 31.0, 41.0, 18.0, 29.0, 22.0, 22.0, 18.0, 15.0, 11.0, 8.0, 5.0, 11.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.00705337524414, -22.3016414642334, -21.596229553222656, -20.890817642211914, -20.185405731201172, -19.47999382019043, -18.774581909179688, -18.069169998168945, -17.363758087158203, -16.65834617614746, -15.952934265136719, -15.247522354125977, -14.542110443115234, -13.836698532104492, -13.13128662109375, -12.425874710083008, -11.720462799072266, -11.015050888061523, -10.309638977050781, -9.604227066040039, -8.898815155029297, -8.193403244018555, -7.4879913330078125, -6.78257942199707, -6.077167510986328, -5.371755599975586, -4.666343688964844, -3.9609317779541016, -3.2555198669433594, -2.550107955932617, -1.844696044921875, -1.1392841339111328, -0.4338722229003906, 0.27153968811035156, 0.9769515991210938, 1.682363510131836, 2.387775421142578, 3.0931873321533203, 3.7985992431640625, 4.504011154174805, 5.209423065185547, 5.914834976196289, 6.620246887207031, 7.325658798217773, 8.031070709228516, 8.736482620239258, 9.44189453125, 10.147306442260742, 10.852718353271484, 11.558130264282227, 12.263542175292969, 12.968954086303711, 13.674365997314453, 14.379777908325195, 15.085189819335938, 15.79060173034668, 16.496013641357422, 17.201425552368164, 17.906837463378906, 18.61224937438965, 19.31766128540039, 20.023073196411133, 20.728485107421875, 21.433897018432617, 22.13930892944336]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 4.0, 9.0, 14.0, 28.0, 26.0, 41.0, 57.0, 94.0, 149.0, 246.0, 385.0, 562.0, 862.0, 1314.0, 2100.0, 3304.0, 5366.0, 8192.0, 13061.0, 20516.0, 32183.0, 48693.0, 71432.0, 98800.0, 123633.0, 137162.0, 130374.0, 108574.0, 81289.0, 56197.0, 37341.0, 24092.0, 15359.0, 9992.0, 6255.0, 3984.0, 2432.0, 1569.0, 1011.0, 665.0, 389.0, 295.0, 183.0, 119.0, 84.0, 59.0, 23.0, 9.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-25.53125, -24.75, -23.96875, -23.1875, -22.40625, -21.625, -20.84375, -20.0625, -19.28125, -18.5, -17.71875, -16.9375, -16.15625, -15.375, -14.59375, -13.8125, -13.03125, -12.25, -11.46875, -10.6875, -9.90625, -9.125, -8.34375, -7.5625, -6.78125, -6.0, -5.21875, -4.4375, -3.65625, -2.875, -2.09375, -1.3125, -0.53125, 0.25, 1.03125, 1.8125, 2.59375, 3.375, 4.15625, 4.9375, 5.71875, 6.5, 7.28125, 8.0625, 8.84375, 9.625, 10.40625, 11.1875, 11.96875, 12.75, 13.53125, 14.3125, 15.09375, 15.875, 16.65625, 17.4375, 18.21875, 19.0, 19.78125, 20.5625, 21.34375, 22.125, 22.90625, 23.6875, 24.46875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 11.0, 16.0, 8.0, 20.0, 19.0, 25.0, 14.0, 24.0, 25.0, 40.0, 26.0, 38.0, 40.0, 38.0, 35.0, 34.0, 39.0, 59.0, 36.0, 52.0, 21.0, 44.0, 57.0, 33.0, 31.0, 25.0, 31.0, 14.0, 23.0, 29.0, 7.0, 14.0, 10.0, 15.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.9580078125, -21.291015625, -20.6240234375, -19.95703125, -19.2900390625, -18.623046875, -17.9560546875, -17.2890625, -16.6220703125, -15.955078125, -15.2880859375, -14.62109375, -13.9541015625, -13.287109375, -12.6201171875, -11.953125, -11.2861328125, -10.619140625, -9.9521484375, -9.28515625, -8.6181640625, -7.951171875, -7.2841796875, -6.6171875, -5.9501953125, -5.283203125, -4.6162109375, -3.94921875, -3.2822265625, -2.615234375, -1.9482421875, -1.28125, -0.6142578125, 0.052734375, 0.7197265625, 1.38671875, 2.0537109375, 2.720703125, 3.3876953125, 4.0546875, 4.7216796875, 5.388671875, 6.0556640625, 6.72265625, 7.3896484375, 8.056640625, 8.7236328125, 9.390625, 10.0576171875, 10.724609375, 11.3916015625, 12.05859375, 12.7255859375, 13.392578125, 14.0595703125, 14.7265625, 15.3935546875, 16.060546875, 16.7275390625, 17.39453125, 18.0615234375, 18.728515625, 19.3955078125, 20.0625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 7.0, 7.0, 10.0, 10.0, 16.0, 28.0, 51.0, 67.0, 96.0, 145.0, 195.0, 292.0, 424.0, 648.0, 990.0, 1471.0, 2098.0, 3047.0, 4485.0, 6724.0, 9939.0, 14267.0, 21146.0, 30029.0, 42714.0, 58114.0, 77550.0, 96020.0, 110873.0, 115247.0, 107571.0, 91567.0, 72209.0, 54139.0, 38919.0, 27525.0, 19130.0, 13129.0, 8837.0, 6051.0, 4039.0, 2768.0, 1915.0, 1305.0, 860.0, 599.0, 414.0, 271.0, 197.0, 124.0, 94.0, 57.0, 42.0, 31.0, 26.0, 13.0, 13.0, 4.0, 4.0, 4.0, 3.0, 1.0], "bins": [-18.703125, -18.10693359375, -17.5107421875, -16.91455078125, -16.318359375, -15.72216796875, -15.1259765625, -14.52978515625, -13.93359375, -13.33740234375, -12.7412109375, -12.14501953125, -11.548828125, -10.95263671875, -10.3564453125, -9.76025390625, -9.1640625, -8.56787109375, -7.9716796875, -7.37548828125, -6.779296875, -6.18310546875, -5.5869140625, -4.99072265625, -4.39453125, -3.79833984375, -3.2021484375, -2.60595703125, -2.009765625, -1.41357421875, -0.8173828125, -0.22119140625, 0.375, 0.97119140625, 1.5673828125, 2.16357421875, 2.759765625, 3.35595703125, 3.9521484375, 4.54833984375, 5.14453125, 5.74072265625, 6.3369140625, 6.93310546875, 7.529296875, 8.12548828125, 8.7216796875, 9.31787109375, 9.9140625, 10.51025390625, 11.1064453125, 11.70263671875, 12.298828125, 12.89501953125, 13.4912109375, 14.08740234375, 14.68359375, 15.27978515625, 15.8759765625, 16.47216796875, 17.068359375, 17.66455078125, 18.2607421875, 18.85693359375, 19.453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 8.0, 7.0, 15.0, 16.0, 15.0, 18.0, 23.0, 29.0, 23.0, 30.0, 39.0, 30.0, 38.0, 35.0, 49.0, 46.0, 32.0, 42.0, 36.0, 43.0, 39.0, 37.0, 41.0, 41.0, 29.0, 29.0, 29.0, 18.0, 20.0, 15.0, 22.0, 14.0, 12.0, 8.0, 10.0, 9.0, 4.0, 3.0, 2.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8671875, -14.431396484375, -13.99560546875, -13.559814453125, -13.1240234375, -12.688232421875, -12.25244140625, -11.816650390625, -11.380859375, -10.945068359375, -10.50927734375, -10.073486328125, -9.6376953125, -9.201904296875, -8.76611328125, -8.330322265625, -7.89453125, -7.458740234375, -7.02294921875, -6.587158203125, -6.1513671875, -5.715576171875, -5.27978515625, -4.843994140625, -4.408203125, -3.972412109375, -3.53662109375, -3.100830078125, -2.6650390625, -2.229248046875, -1.79345703125, -1.357666015625, -0.921875, -0.486083984375, -0.05029296875, 0.385498046875, 0.8212890625, 1.257080078125, 1.69287109375, 2.128662109375, 2.564453125, 3.000244140625, 3.43603515625, 3.871826171875, 4.3076171875, 4.743408203125, 5.17919921875, 5.614990234375, 6.05078125, 6.486572265625, 6.92236328125, 7.358154296875, 7.7939453125, 8.229736328125, 8.66552734375, 9.101318359375, 9.537109375, 9.972900390625, 10.40869140625, 10.844482421875, 11.2802734375, 11.716064453125, 12.15185546875, 12.587646484375, 13.0234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 10.0, 19.0, 14.0, 47.0, 55.0, 78.0, 154.0, 203.0, 347.0, 614.0, 959.0, 1581.0, 2669.0, 4686.0, 7927.0, 13739.0, 24533.0, 43465.0, 76888.0, 128276.0, 181770.0, 193883.0, 149005.0, 93865.0, 53679.0, 29865.0, 16946.0, 9617.0, 5550.0, 3213.0, 1887.0, 1133.0, 701.0, 401.0, 269.0, 174.0, 112.0, 75.0, 48.0, 24.0, 29.0, 12.0, 6.0, 8.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-21.4375, -20.810302734375, -20.18310546875, -19.555908203125, -18.9287109375, -18.301513671875, -17.67431640625, -17.047119140625, -16.419921875, -15.792724609375, -15.16552734375, -14.538330078125, -13.9111328125, -13.283935546875, -12.65673828125, -12.029541015625, -11.40234375, -10.775146484375, -10.14794921875, -9.520751953125, -8.8935546875, -8.266357421875, -7.63916015625, -7.011962890625, -6.384765625, -5.757568359375, -5.13037109375, -4.503173828125, -3.8759765625, -3.248779296875, -2.62158203125, -1.994384765625, -1.3671875, -0.739990234375, -0.11279296875, 0.514404296875, 1.1416015625, 1.768798828125, 2.39599609375, 3.023193359375, 3.650390625, 4.277587890625, 4.90478515625, 5.531982421875, 6.1591796875, 6.786376953125, 7.41357421875, 8.040771484375, 8.66796875, 9.295166015625, 9.92236328125, 10.549560546875, 11.1767578125, 11.803955078125, 12.43115234375, 13.058349609375, 13.685546875, 14.312744140625, 14.93994140625, 15.567138671875, 16.1943359375, 16.821533203125, 17.44873046875, 18.075927734375, 18.703125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 10.0, 8.0, 10.0, 14.0, 13.0, 23.0, 28.0, 41.0, 29.0, 31.0, 31.0, 42.0, 50.0, 40.0, 48.0, 62.0, 57.0, 53.0, 50.0, 49.0, 40.0, 44.0, 27.0, 35.0, 32.0, 13.0, 13.0, 12.0, 12.0, 11.0, 5.0, 6.0, 9.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0015411376953125, -0.0014872103929519653, -0.0014332830905914307, -0.001379355788230896, -0.0013254284858703613, -0.0012715011835098267, -0.001217573881149292, -0.0011636465787887573, -0.0011097192764282227, -0.001055791974067688, -0.0010018646717071533, -0.0009479373693466187, -0.000894010066986084, -0.0008400827646255493, -0.0007861554622650146, -0.00073222815990448, -0.0006783008575439453, -0.0006243735551834106, -0.000570446252822876, -0.0005165189504623413, -0.00046259164810180664, -0.00040866434574127197, -0.0003547370433807373, -0.00030080974102020264, -0.00024688243865966797, -0.0001929551362991333, -0.00013902783393859863, -8.510053157806396e-05, -3.11732292175293e-05, 2.275407314300537e-05, 7.668137550354004e-05, 0.0001306086778640747, 0.00018453598022460938, 0.00023846328258514404, 0.0002923905849456787, 0.0003463178873062134, 0.00040024518966674805, 0.0004541724920272827, 0.0005080997943878174, 0.000562027096748352, 0.0006159543991088867, 0.0006698817014694214, 0.0007238090038299561, 0.0007777363061904907, 0.0008316636085510254, 0.0008855909109115601, 0.0009395182132720947, 0.0009934455156326294, 0.001047372817993164, 0.0011013001203536987, 0.0011552274227142334, 0.001209154725074768, 0.0012630820274353027, 0.0013170093297958374, 0.001370936632156372, 0.0014248639345169067, 0.0014787912368774414, 0.001532718539237976, 0.0015866458415985107, 0.0016405731439590454, 0.00169450044631958, 0.0017484277486801147, 0.0018023550510406494, 0.001856282353401184, 0.0019102096557617188]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 10.0, 24.0, 37.0, 49.0, 61.0, 110.0, 182.0, 319.0, 535.0, 925.0, 1705.0, 3200.0, 5877.0, 10967.0, 20489.0, 38682.0, 71508.0, 123413.0, 182991.0, 203440.0, 161573.0, 101239.0, 56396.0, 29923.0, 16158.0, 8376.0, 4583.0, 2599.0, 1336.0, 757.0, 468.0, 227.0, 126.0, 72.0, 45.0, 40.0, 26.0, 14.0, 17.0, 11.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.487548828125, -17.89697265625, -17.306396484375, -16.7158203125, -16.125244140625, -15.53466796875, -14.944091796875, -14.353515625, -13.762939453125, -13.17236328125, -12.581787109375, -11.9912109375, -11.400634765625, -10.81005859375, -10.219482421875, -9.62890625, -9.038330078125, -8.44775390625, -7.857177734375, -7.2666015625, -6.676025390625, -6.08544921875, -5.494873046875, -4.904296875, -4.313720703125, -3.72314453125, -3.132568359375, -2.5419921875, -1.951416015625, -1.36083984375, -0.770263671875, -0.1796875, 0.410888671875, 1.00146484375, 1.592041015625, 2.1826171875, 2.773193359375, 3.36376953125, 3.954345703125, 4.544921875, 5.135498046875, 5.72607421875, 6.316650390625, 6.9072265625, 7.497802734375, 8.08837890625, 8.678955078125, 9.26953125, 9.860107421875, 10.45068359375, 11.041259765625, 11.6318359375, 12.222412109375, 12.81298828125, 13.403564453125, 13.994140625, 14.584716796875, 15.17529296875, 15.765869140625, 16.3564453125, 16.947021484375, 17.53759765625, 18.128173828125, 18.71875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 8.0, 3.0, 6.0, 10.0, 8.0, 16.0, 20.0, 32.0, 18.0, 20.0, 26.0, 43.0, 36.0, 50.0, 53.0, 57.0, 64.0, 66.0, 54.0, 59.0, 57.0, 49.0, 35.0, 42.0, 30.0, 24.0, 25.0, 20.0, 13.0, 12.0, 15.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.46875, -6.296875, -6.125, -5.953125, -5.78125, -5.609375, -5.4375, -5.265625, -5.09375, -4.921875, -4.75, -4.578125, -4.40625, -4.234375, -4.0625, -3.890625, -3.71875, -3.546875, -3.375, -3.203125, -3.03125, -2.859375, -2.6875, -2.515625, -2.34375, -2.171875, -2.0, -1.828125, -1.65625, -1.484375, -1.3125, -1.140625, -0.96875, -0.796875, -0.625, -0.453125, -0.28125, -0.109375, 0.0625, 0.234375, 0.40625, 0.578125, 0.75, 0.921875, 1.09375, 1.265625, 1.4375, 1.609375, 1.78125, 1.953125, 2.125, 2.296875, 2.46875, 2.640625, 2.8125, 2.984375, 3.15625, 3.328125, 3.5, 3.671875, 3.84375, 4.015625, 4.1875, 4.359375, 4.53125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 13.0, 8.0, 14.0, 17.0, 23.0, 35.0, 41.0, 35.0, 37.0, 60.0, 63.0, 52.0, 63.0, 61.0, 46.0, 71.0, 56.0, 49.0, 51.0, 39.0, 37.0, 19.0, 30.0, 12.0, 14.0, 6.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.52616882324219, -36.46769714355469, -35.40922546386719, -34.35075378417969, -33.29228210449219, -32.23381042480469, -31.175338745117188, -30.116867065429688, -29.058395385742188, -27.999923706054688, -26.941452026367188, -25.882980346679688, -24.824508666992188, -23.766036987304688, -22.707565307617188, -21.649093627929688, -20.590621948242188, -19.532150268554688, -18.473678588867188, -17.415206909179688, -16.356735229492188, -15.298263549804688, -14.239791870117188, -13.181320190429688, -12.122848510742188, -11.064376831054688, -10.005905151367188, -8.947433471679688, -7.8889617919921875, -6.8304901123046875, -5.7720184326171875, -4.7135467529296875, -3.655078887939453, -2.596607208251953, -1.5381355285644531, -0.4796638488769531, 0.5788078308105469, 1.6372795104980469, 2.695751190185547, 3.754222869873047, 4.812694549560547, 5.871166229248047, 6.929637908935547, 7.988109588623047, 9.046581268310547, 10.105052947998047, 11.163524627685547, 12.221996307373047, 13.280467987060547, 14.338939666748047, 15.397411346435547, 16.455883026123047, 17.514354705810547, 18.572826385498047, 19.631298065185547, 20.689769744873047, 21.748241424560547, 22.806713104248047, 23.865184783935547, 24.923656463623047, 25.982128143310547, 27.040599822998047, 28.099071502685547, 29.157543182373047, 30.216014862060547]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 9.0, 11.0, 10.0, 12.0, 10.0, 12.0, 16.0, 18.0, 28.0, 25.0, 23.0, 30.0, 36.0, 35.0, 21.0, 32.0, 28.0, 41.0, 64.0, 38.0, 39.0, 36.0, 39.0, 39.0, 40.0, 36.0, 29.0, 33.0, 27.0, 31.0, 24.0, 21.0, 11.0, 17.0, 17.0, 13.0, 11.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.468870162963867, -19.79831886291504, -19.12776756286621, -18.457216262817383, -17.786663055419922, -17.116111755371094, -16.445560455322266, -15.775009155273438, -15.10445785522461, -14.433906555175781, -13.763355255126953, -13.092803001403809, -12.42225170135498, -11.751700401306152, -11.081148147583008, -10.41059684753418, -9.740045547485352, -9.069494247436523, -8.398942947387695, -7.728390693664551, -7.057839393615723, -6.3872880935668945, -5.716736316680908, -5.046184539794922, -4.375633239746094, -3.7050817012786865, -3.0345301628112793, -2.363978624343872, -1.6934270858764648, -1.0228755474090576, -0.3523240089416504, 0.31822776794433594, 0.9887771606445312, 1.6593286991119385, 2.3298802375793457, 3.000431776046753, 3.67098331451416, 4.341534614562988, 5.012086391448975, 5.682638168334961, 6.353189468383789, 7.023740768432617, 7.6942925453186035, 8.36484432220459, 9.035395622253418, 9.705946922302246, 10.37649917602539, 11.047050476074219, 11.717601776123047, 12.388153076171875, 13.058704376220703, 13.729256629943848, 14.399807929992676, 15.070359230041504, 15.740911483764648, 16.411462783813477, 17.082014083862305, 17.752565383911133, 18.42311668395996, 19.09366798400879, 19.76422119140625, 20.434772491455078, 21.105323791503906, 21.775875091552734, 22.446426391601562]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 18.0, 32.0, 52.0, 73.0, 120.0, 154.0, 310.0, 503.0, 830.0, 1451.0, 2572.0, 4488.0, 8294.0, 15348.0, 29663.0, 59609.0, 127794.0, 284348.0, 631812.0, 1066958.0, 985485.0, 531654.0, 234427.0, 105595.0, 49829.0, 24729.0, 12691.0, 6735.0, 3591.0, 2138.0, 1192.0, 672.0, 426.0, 255.0, 157.0, 83.0, 65.0, 36.0, 22.0, 29.0, 12.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.890625, -31.02587890625, -30.1611328125, -29.29638671875, -28.431640625, -27.56689453125, -26.7021484375, -25.83740234375, -24.97265625, -24.10791015625, -23.2431640625, -22.37841796875, -21.513671875, -20.64892578125, -19.7841796875, -18.91943359375, -18.0546875, -17.18994140625, -16.3251953125, -15.46044921875, -14.595703125, -13.73095703125, -12.8662109375, -12.00146484375, -11.13671875, -10.27197265625, -9.4072265625, -8.54248046875, -7.677734375, -6.81298828125, -5.9482421875, -5.08349609375, -4.21875, -3.35400390625, -2.4892578125, -1.62451171875, -0.759765625, 0.10498046875, 0.9697265625, 1.83447265625, 2.69921875, 3.56396484375, 4.4287109375, 5.29345703125, 6.158203125, 7.02294921875, 7.8876953125, 8.75244140625, 9.6171875, 10.48193359375, 11.3466796875, 12.21142578125, 13.076171875, 13.94091796875, 14.8056640625, 15.67041015625, 16.53515625, 17.39990234375, 18.2646484375, 19.12939453125, 19.994140625, 20.85888671875, 21.7236328125, 22.58837890625, 23.453125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 8.0, 12.0, 8.0, 5.0, 16.0, 14.0, 10.0, 17.0, 10.0, 12.0, 18.0, 14.0, 23.0, 25.0, 17.0, 29.0, 30.0, 35.0, 28.0, 32.0, 28.0, 34.0, 29.0, 43.0, 33.0, 39.0, 36.0, 26.0, 35.0, 30.0, 28.0, 29.0, 33.0, 19.0, 34.0, 22.0, 19.0, 18.0, 20.0, 7.0, 17.0, 8.0, 5.0, 5.0, 5.0, 4.0, 10.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-13.1015625, -12.6968994140625, -12.292236328125, -11.8875732421875, -11.48291015625, -11.0782470703125, -10.673583984375, -10.2689208984375, -9.8642578125, -9.4595947265625, -9.054931640625, -8.6502685546875, -8.24560546875, -7.8409423828125, -7.436279296875, -7.0316162109375, -6.626953125, -6.2222900390625, -5.817626953125, -5.4129638671875, -5.00830078125, -4.6036376953125, -4.198974609375, -3.7943115234375, -3.3896484375, -2.9849853515625, -2.580322265625, -2.1756591796875, -1.77099609375, -1.3663330078125, -0.961669921875, -0.5570068359375, -0.15234375, 0.2523193359375, 0.656982421875, 1.0616455078125, 1.46630859375, 1.8709716796875, 2.275634765625, 2.6802978515625, 3.0849609375, 3.4896240234375, 3.894287109375, 4.2989501953125, 4.70361328125, 5.1082763671875, 5.512939453125, 5.9176025390625, 6.322265625, 6.7269287109375, 7.131591796875, 7.5362548828125, 7.94091796875, 8.3455810546875, 8.750244140625, 9.1549072265625, 9.5595703125, 9.9642333984375, 10.368896484375, 10.7735595703125, 11.17822265625, 11.5828857421875, 11.987548828125, 12.3922119140625, 12.796875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 11.0, 20.0, 36.0, 43.0, 60.0, 87.0, 173.0, 260.0, 418.0, 722.0, 1056.0, 1704.0, 2847.0, 4682.0, 7793.0, 13422.0, 23310.0, 41282.0, 74234.0, 136741.0, 249543.0, 445873.0, 719056.0, 870437.0, 678937.0, 410138.0, 227983.0, 124342.0, 67820.0, 38299.0, 21771.0, 12446.0, 7230.0, 4457.0, 2623.0, 1608.0, 1035.0, 588.0, 412.0, 261.0, 180.0, 130.0, 59.0, 58.0, 29.0, 17.0, 9.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-22.703125, -21.980712890625, -21.25830078125, -20.535888671875, -19.8134765625, -19.091064453125, -18.36865234375, -17.646240234375, -16.923828125, -16.201416015625, -15.47900390625, -14.756591796875, -14.0341796875, -13.311767578125, -12.58935546875, -11.866943359375, -11.14453125, -10.422119140625, -9.69970703125, -8.977294921875, -8.2548828125, -7.532470703125, -6.81005859375, -6.087646484375, -5.365234375, -4.642822265625, -3.92041015625, -3.197998046875, -2.4755859375, -1.753173828125, -1.03076171875, -0.308349609375, 0.4140625, 1.136474609375, 1.85888671875, 2.581298828125, 3.3037109375, 4.026123046875, 4.74853515625, 5.470947265625, 6.193359375, 6.915771484375, 7.63818359375, 8.360595703125, 9.0830078125, 9.805419921875, 10.52783203125, 11.250244140625, 11.97265625, 12.695068359375, 13.41748046875, 14.139892578125, 14.8623046875, 15.584716796875, 16.30712890625, 17.029541015625, 17.751953125, 18.474365234375, 19.19677734375, 19.919189453125, 20.6416015625, 21.364013671875, 22.08642578125, 22.808837890625, 23.53125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 4.0, 10.0, 8.0, 12.0, 22.0, 26.0, 37.0, 48.0, 72.0, 74.0, 102.0, 121.0, 141.0, 192.0, 214.0, 261.0, 253.0, 299.0, 294.0, 275.0, 269.0, 246.0, 226.0, 160.0, 151.0, 120.0, 81.0, 92.0, 50.0, 58.0, 43.0, 31.0, 25.0, 19.0, 7.0, 9.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.228271484375, -7.94873046875, -7.669189453125, -7.3896484375, -7.110107421875, -6.83056640625, -6.551025390625, -6.271484375, -5.991943359375, -5.71240234375, -5.432861328125, -5.1533203125, -4.873779296875, -4.59423828125, -4.314697265625, -4.03515625, -3.755615234375, -3.47607421875, -3.196533203125, -2.9169921875, -2.637451171875, -2.35791015625, -2.078369140625, -1.798828125, -1.519287109375, -1.23974609375, -0.960205078125, -0.6806640625, -0.401123046875, -0.12158203125, 0.157958984375, 0.4375, 0.717041015625, 0.99658203125, 1.276123046875, 1.5556640625, 1.835205078125, 2.11474609375, 2.394287109375, 2.673828125, 2.953369140625, 3.23291015625, 3.512451171875, 3.7919921875, 4.071533203125, 4.35107421875, 4.630615234375, 4.91015625, 5.189697265625, 5.46923828125, 5.748779296875, 6.0283203125, 6.307861328125, 6.58740234375, 6.866943359375, 7.146484375, 7.426025390625, 7.70556640625, 7.985107421875, 8.2646484375, 8.544189453125, 8.82373046875, 9.103271484375, 9.3828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 9.0, 8.0, 6.0, 17.0, 12.0, 20.0, 26.0, 32.0, 42.0, 50.0, 60.0, 62.0, 51.0, 85.0, 54.0, 61.0, 63.0, 59.0, 55.0, 41.0, 35.0, 30.0, 22.0, 20.0, 17.0, 17.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.959232330322266, -32.002872467041016, -31.0465087890625, -30.090147018432617, -29.133785247802734, -28.17742347717285, -27.22106170654297, -26.26470184326172, -25.308338165283203, -24.35197639465332, -23.395614624023438, -22.439252853393555, -21.482891082763672, -20.52652931213379, -19.570167541503906, -18.613807678222656, -17.657445907592773, -16.70108413696289, -15.744722366333008, -14.788360595703125, -13.831998825073242, -12.87563705444336, -11.919276237487793, -10.96291446685791, -10.006552696228027, -9.050190925598145, -8.093829154968262, -7.137467861175537, -6.181106090545654, -5.2247443199157715, -4.268383026123047, -3.312021255493164, -2.3556575775146484, -1.3992959260940552, -0.4429342746734619, 0.5134272575378418, 1.4697890281677246, 2.4261507987976074, 3.382512092590332, 4.338873863220215, 5.295235633850098, 6.2515974044799805, 7.207959175109863, 8.16431999206543, 9.120681762695312, 10.077043533325195, 11.033405303955078, 11.989767074584961, 12.946128845214844, 13.902490615844727, 14.85885238647461, 15.815214157104492, 16.771575927734375, 17.727937698364258, 18.68429946899414, 19.64065933227539, 20.597023010253906, 21.55338478088379, 22.509746551513672, 23.466108322143555, 24.422470092773438, 25.37883186340332, 26.335193634033203, 27.291553497314453, 28.247915267944336]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 12.0, 9.0, 14.0, 18.0, 13.0, 15.0, 17.0, 33.0, 33.0, 27.0, 40.0, 36.0, 32.0, 33.0, 45.0, 32.0, 37.0, 41.0, 48.0, 42.0, 35.0, 44.0, 45.0, 40.0, 33.0, 35.0, 29.0, 20.0, 19.0, 19.0, 17.0, 16.0, 14.0, 11.0, 7.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-19.292423248291016, -18.728939056396484, -18.16545295715332, -17.60196876525879, -17.038482666015625, -16.474998474121094, -15.911514282226562, -15.348029136657715, -14.784543991088867, -14.22105884552002, -13.657573699951172, -13.09408950805664, -12.530604362487793, -11.967119216918945, -11.403635025024414, -10.840149879455566, -10.276664733886719, -9.713179588317871, -9.149694442749023, -8.586210250854492, -8.022725105285645, -7.459239959716797, -6.895755290985107, -6.332270622253418, -5.76878547668457, -5.205300331115723, -4.641815662384033, -4.078330993652344, -3.514845848083496, -2.9513609409332275, -2.387876033782959, -1.8243911266326904, -1.2609062194824219, -0.6974213123321533, -0.13393640518188477, 0.4295485019683838, 0.9930334091186523, 1.556518316268921, 2.1200032234191895, 2.683488130569458, 3.2469730377197266, 3.810457944869995, 4.373942852020264, 4.937427520751953, 5.500912666320801, 6.064397811889648, 6.627882480621338, 7.191367149353027, 7.754852294921875, 8.318337440490723, 8.88182258605957, 9.445306777954102, 10.00879192352295, 10.572277069091797, 11.135761260986328, 11.699246406555176, 12.262731552124023, 12.826216697692871, 13.389701843261719, 13.95318603515625, 14.516671180725098, 15.080156326293945, 15.643640518188477, 16.20712661743164, 16.770610809326172]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 13.0, 21.0, 23.0, 38.0, 51.0, 87.0, 149.0, 198.0, 258.0, 416.0, 678.0, 1032.0, 1501.0, 2448.0, 3892.0, 6362.0, 10782.0, 18914.0, 33600.0, 61275.0, 109124.0, 172749.0, 208047.0, 170437.0, 107018.0, 59974.0, 33217.0, 18779.0, 10590.0, 6318.0, 3744.0, 2332.0, 1493.0, 1033.0, 675.0, 405.0, 267.0, 181.0, 144.0, 86.0, 68.0, 44.0, 26.0, 17.0, 12.0, 8.0, 13.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.390625, -22.623291015625, -21.85595703125, -21.088623046875, -20.3212890625, -19.553955078125, -18.78662109375, -18.019287109375, -17.251953125, -16.484619140625, -15.71728515625, -14.949951171875, -14.1826171875, -13.415283203125, -12.64794921875, -11.880615234375, -11.11328125, -10.345947265625, -9.57861328125, -8.811279296875, -8.0439453125, -7.276611328125, -6.50927734375, -5.741943359375, -4.974609375, -4.207275390625, -3.43994140625, -2.672607421875, -1.9052734375, -1.137939453125, -0.37060546875, 0.396728515625, 1.1640625, 1.931396484375, 2.69873046875, 3.466064453125, 4.2333984375, 5.000732421875, 5.76806640625, 6.535400390625, 7.302734375, 8.070068359375, 8.83740234375, 9.604736328125, 10.3720703125, 11.139404296875, 11.90673828125, 12.674072265625, 13.44140625, 14.208740234375, 14.97607421875, 15.743408203125, 16.5107421875, 17.278076171875, 18.04541015625, 18.812744140625, 19.580078125, 20.347412109375, 21.11474609375, 21.882080078125, 22.6494140625, 23.416748046875, 24.18408203125, 24.951416015625, 25.71875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 4.0, 10.0, 5.0, 7.0, 10.0, 15.0, 16.0, 15.0, 20.0, 27.0, 26.0, 33.0, 37.0, 31.0, 31.0, 36.0, 44.0, 39.0, 55.0, 36.0, 50.0, 30.0, 46.0, 46.0, 31.0, 40.0, 30.0, 33.0, 28.0, 29.0, 29.0, 21.0, 10.0, 10.0, 11.0, 9.0, 12.0, 8.0, 8.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.75, -20.166259765625, -19.58251953125, -18.998779296875, -18.4150390625, -17.831298828125, -17.24755859375, -16.663818359375, -16.080078125, -15.496337890625, -14.91259765625, -14.328857421875, -13.7451171875, -13.161376953125, -12.57763671875, -11.993896484375, -11.41015625, -10.826416015625, -10.24267578125, -9.658935546875, -9.0751953125, -8.491455078125, -7.90771484375, -7.323974609375, -6.740234375, -6.156494140625, -5.57275390625, -4.989013671875, -4.4052734375, -3.821533203125, -3.23779296875, -2.654052734375, -2.0703125, -1.486572265625, -0.90283203125, -0.319091796875, 0.2646484375, 0.848388671875, 1.43212890625, 2.015869140625, 2.599609375, 3.183349609375, 3.76708984375, 4.350830078125, 4.9345703125, 5.518310546875, 6.10205078125, 6.685791015625, 7.26953125, 7.853271484375, 8.43701171875, 9.020751953125, 9.6044921875, 10.188232421875, 10.77197265625, 11.355712890625, 11.939453125, 12.523193359375, 13.10693359375, 13.690673828125, 14.2744140625, 14.858154296875, 15.44189453125, 16.025634765625, 16.609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 8.0, 8.0, 10.0, 22.0, 29.0, 44.0, 80.0, 112.0, 152.0, 214.0, 362.0, 569.0, 820.0, 1457.0, 2630.0, 5186.0, 11282.0, 29827.0, 101025.0, 365164.0, 371429.0, 103709.0, 30946.0, 11532.0, 5281.0, 2727.0, 1406.0, 932.0, 568.0, 356.0, 192.0, 141.0, 103.0, 64.0, 54.0, 32.0, 20.0, 14.0, 13.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.0, -66.0576171875, -64.115234375, -62.1728515625, -60.23046875, -58.2880859375, -56.345703125, -54.4033203125, -52.4609375, -50.5185546875, -48.576171875, -46.6337890625, -44.69140625, -42.7490234375, -40.806640625, -38.8642578125, -36.921875, -34.9794921875, -33.037109375, -31.0947265625, -29.15234375, -27.2099609375, -25.267578125, -23.3251953125, -21.3828125, -19.4404296875, -17.498046875, -15.5556640625, -13.61328125, -11.6708984375, -9.728515625, -7.7861328125, -5.84375, -3.9013671875, -1.958984375, -0.0166015625, 1.92578125, 3.8681640625, 5.810546875, 7.7529296875, 9.6953125, 11.6376953125, 13.580078125, 15.5224609375, 17.46484375, 19.4072265625, 21.349609375, 23.2919921875, 25.234375, 27.1767578125, 29.119140625, 31.0615234375, 33.00390625, 34.9462890625, 36.888671875, 38.8310546875, 40.7734375, 42.7158203125, 44.658203125, 46.6005859375, 48.54296875, 50.4853515625, 52.427734375, 54.3701171875, 56.3125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 10.0, 12.0, 15.0, 12.0, 13.0, 17.0, 22.0, 22.0, 20.0, 35.0, 32.0, 44.0, 42.0, 34.0, 50.0, 45.0, 37.0, 46.0, 55.0, 44.0, 35.0, 39.0, 40.0, 41.0, 32.0, 29.0, 33.0, 16.0, 17.0, 23.0, 16.0, 9.0, 14.0, 6.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.522216796875, -11.13037109375, -10.738525390625, -10.3466796875, -9.954833984375, -9.56298828125, -9.171142578125, -8.779296875, -8.387451171875, -7.99560546875, -7.603759765625, -7.2119140625, -6.820068359375, -6.42822265625, -6.036376953125, -5.64453125, -5.252685546875, -4.86083984375, -4.468994140625, -4.0771484375, -3.685302734375, -3.29345703125, -2.901611328125, -2.509765625, -2.117919921875, -1.72607421875, -1.334228515625, -0.9423828125, -0.550537109375, -0.15869140625, 0.233154296875, 0.625, 1.016845703125, 1.40869140625, 1.800537109375, 2.1923828125, 2.584228515625, 2.97607421875, 3.367919921875, 3.759765625, 4.151611328125, 4.54345703125, 4.935302734375, 5.3271484375, 5.718994140625, 6.11083984375, 6.502685546875, 6.89453125, 7.286376953125, 7.67822265625, 8.070068359375, 8.4619140625, 8.853759765625, 9.24560546875, 9.637451171875, 10.029296875, 10.421142578125, 10.81298828125, 11.204833984375, 11.5966796875, 11.988525390625, 12.38037109375, 12.772216796875, 13.1640625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 6.0, 10.0, 10.0, 17.0, 24.0, 26.0, 42.0, 57.0, 57.0, 78.0, 114.0, 121.0, 166.0, 231.0, 343.0, 404.0, 679.0, 881.0, 1244.0, 1998.0, 3012.0, 5015.0, 8555.0, 15847.0, 32252.0, 73205.0, 173359.0, 318032.0, 225611.0, 97421.0, 42110.0, 20242.0, 10602.0, 5928.0, 3614.0, 2228.0, 1419.0, 961.0, 694.0, 486.0, 352.0, 272.0, 205.0, 134.0, 126.0, 90.0, 75.0, 46.0, 45.0, 39.0, 22.0, 17.0, 13.0, 13.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.21875, -18.592041015625, -17.96533203125, -17.338623046875, -16.7119140625, -16.085205078125, -15.45849609375, -14.831787109375, -14.205078125, -13.578369140625, -12.95166015625, -12.324951171875, -11.6982421875, -11.071533203125, -10.44482421875, -9.818115234375, -9.19140625, -8.564697265625, -7.93798828125, -7.311279296875, -6.6845703125, -6.057861328125, -5.43115234375, -4.804443359375, -4.177734375, -3.551025390625, -2.92431640625, -2.297607421875, -1.6708984375, -1.044189453125, -0.41748046875, 0.209228515625, 0.8359375, 1.462646484375, 2.08935546875, 2.716064453125, 3.3427734375, 3.969482421875, 4.59619140625, 5.222900390625, 5.849609375, 6.476318359375, 7.10302734375, 7.729736328125, 8.3564453125, 8.983154296875, 9.60986328125, 10.236572265625, 10.86328125, 11.489990234375, 12.11669921875, 12.743408203125, 13.3701171875, 13.996826171875, 14.62353515625, 15.250244140625, 15.876953125, 16.503662109375, 17.13037109375, 17.757080078125, 18.3837890625, 19.010498046875, 19.63720703125, 20.263916015625, 20.890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 15.0, 21.0, 40.0, 74.0, 152.0, 154.0, 189.0, 129.0, 81.0, 50.0, 26.0, 16.0, 7.0, 5.0, 6.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018215179443359375, -0.0017646849155426025, -0.0017078518867492676, -0.0016510188579559326, -0.0015941858291625977, -0.0015373528003692627, -0.0014805197715759277, -0.0014236867427825928, -0.0013668537139892578, -0.0013100206851959229, -0.0012531876564025879, -0.001196354627609253, -0.001139521598815918, -0.001082688570022583, -0.001025855541229248, -0.0009690225124359131, -0.0009121894836425781, -0.0008553564548492432, -0.0007985234260559082, -0.0007416903972625732, -0.0006848573684692383, -0.0006280243396759033, -0.0005711913108825684, -0.0005143582820892334, -0.00045752525329589844, -0.0004006922245025635, -0.0003438591957092285, -0.00028702616691589355, -0.0002301931381225586, -0.00017336010932922363, -0.00011652708053588867, -5.969405174255371e-05, -2.86102294921875e-06, 5.397200584411621e-05, 0.00011080503463745117, 0.00016763806343078613, 0.0002244710922241211, 0.00028130412101745605, 0.000338137149810791, 0.000394970178604126, 0.00045180320739746094, 0.0005086362361907959, 0.0005654692649841309, 0.0006223022937774658, 0.0006791353225708008, 0.0007359683513641357, 0.0007928013801574707, 0.0008496344089508057, 0.0009064674377441406, 0.0009633004665374756, 0.0010201334953308105, 0.0010769665241241455, 0.0011337995529174805, 0.0011906325817108154, 0.0012474656105041504, 0.0013042986392974854, 0.0013611316680908203, 0.0014179646968841553, 0.0014747977256774902, 0.0015316307544708252, 0.0015884637832641602, 0.0016452968120574951, 0.00170212984085083, 0.001758962869644165, 0.0018157958984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 12.0, 17.0, 25.0, 35.0, 37.0, 55.0, 88.0, 108.0, 188.0, 273.0, 371.0, 556.0, 876.0, 1487.0, 2583.0, 4644.0, 9812.0, 22382.0, 58083.0, 158866.0, 315917.0, 275410.0, 118389.0, 43577.0, 17204.0, 7813.0, 3912.0, 2135.0, 1297.0, 801.0, 499.0, 329.0, 216.0, 167.0, 91.0, 77.0, 44.0, 37.0, 31.0, 18.0, 25.0, 14.0, 15.0, 6.0, 6.0, 2.0, 0.0, 3.0], "bins": [-23.859375, -23.2119140625, -22.564453125, -21.9169921875, -21.26953125, -20.6220703125, -19.974609375, -19.3271484375, -18.6796875, -18.0322265625, -17.384765625, -16.7373046875, -16.08984375, -15.4423828125, -14.794921875, -14.1474609375, -13.5, -12.8525390625, -12.205078125, -11.5576171875, -10.91015625, -10.2626953125, -9.615234375, -8.9677734375, -8.3203125, -7.6728515625, -7.025390625, -6.3779296875, -5.73046875, -5.0830078125, -4.435546875, -3.7880859375, -3.140625, -2.4931640625, -1.845703125, -1.1982421875, -0.55078125, 0.0966796875, 0.744140625, 1.3916015625, 2.0390625, 2.6865234375, 3.333984375, 3.9814453125, 4.62890625, 5.2763671875, 5.923828125, 6.5712890625, 7.21875, 7.8662109375, 8.513671875, 9.1611328125, 9.80859375, 10.4560546875, 11.103515625, 11.7509765625, 12.3984375, 13.0458984375, 13.693359375, 14.3408203125, 14.98828125, 15.6357421875, 16.283203125, 16.9306640625, 17.578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 8.0, 5.0, 7.0, 9.0, 8.0, 11.0, 11.0, 16.0, 32.0, 32.0, 41.0, 48.0, 58.0, 69.0, 82.0, 73.0, 68.0, 90.0, 67.0, 58.0, 39.0, 37.0, 22.0, 16.0, 18.0, 15.0, 9.0, 6.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.828857421875, -4.68505859375, -4.541259765625, -4.3974609375, -4.253662109375, -4.10986328125, -3.966064453125, -3.822265625, -3.678466796875, -3.53466796875, -3.390869140625, -3.2470703125, -3.103271484375, -2.95947265625, -2.815673828125, -2.671875, -2.528076171875, -2.38427734375, -2.240478515625, -2.0966796875, -1.952880859375, -1.80908203125, -1.665283203125, -1.521484375, -1.377685546875, -1.23388671875, -1.090087890625, -0.9462890625, -0.802490234375, -0.65869140625, -0.514892578125, -0.37109375, -0.227294921875, -0.08349609375, 0.060302734375, 0.2041015625, 0.347900390625, 0.49169921875, 0.635498046875, 0.779296875, 0.923095703125, 1.06689453125, 1.210693359375, 1.3544921875, 1.498291015625, 1.64208984375, 1.785888671875, 1.9296875, 2.073486328125, 2.21728515625, 2.361083984375, 2.5048828125, 2.648681640625, 2.79248046875, 2.936279296875, 3.080078125, 3.223876953125, 3.36767578125, 3.511474609375, 3.6552734375, 3.799072265625, 3.94287109375, 4.086669921875, 4.23046875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 9.0, 15.0, 24.0, 26.0, 25.0, 39.0, 29.0, 41.0, 45.0, 61.0, 66.0, 75.0, 61.0, 64.0, 65.0, 59.0, 45.0, 52.0, 27.0, 25.0, 27.0, 24.0, 11.0, 13.0, 14.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.970867156982422, -31.039974212646484, -30.109081268310547, -29.17818832397461, -28.247295379638672, -27.316402435302734, -26.385509490966797, -25.45461654663086, -24.523723602294922, -23.592830657958984, -22.661937713623047, -21.73104476928711, -20.800151824951172, -19.869258880615234, -18.938365936279297, -18.00747299194336, -17.076580047607422, -16.145687103271484, -15.214794158935547, -14.28390121459961, -13.353008270263672, -12.422115325927734, -11.491222381591797, -10.56032943725586, -9.629434585571289, -8.698541641235352, -7.767648696899414, -6.836755752563477, -5.905862808227539, -4.974969387054443, -4.044076442718506, -3.1131834983825684, -2.182291030883789, -1.2513980865478516, -0.3205050230026245, 0.6103880405426025, 1.54128098487854, 2.4721741676330566, 3.403067111968994, 4.333960056304932, 5.264853000640869, 6.195745944976807, 7.126638889312744, 8.05753231048584, 8.988425254821777, 9.919318199157715, 10.850211143493652, 11.78110408782959, 12.711997032165527, 13.642889976501465, 14.573782920837402, 15.50467586517334, 16.435569763183594, 17.36646270751953, 18.29735565185547, 19.228248596191406, 20.159141540527344, 21.09003448486328, 22.02092742919922, 22.951820373535156, 23.882713317871094, 24.81360626220703, 25.74449920654297, 26.675392150878906, 27.606285095214844]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 14.0, 11.0, 13.0, 10.0, 18.0, 11.0, 22.0, 26.0, 20.0, 45.0, 32.0, 39.0, 27.0, 42.0, 31.0, 41.0, 35.0, 35.0, 36.0, 46.0, 45.0, 36.0, 43.0, 49.0, 33.0, 38.0, 17.0, 25.0, 24.0, 25.0, 20.0, 16.0, 15.0, 14.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-18.145809173583984, -17.60721206665039, -17.068614959716797, -16.530019760131836, -15.991422653198242, -15.452825546264648, -14.914229393005371, -14.375633239746094, -13.8370361328125, -13.298439025878906, -12.759842872619629, -12.221246719360352, -11.682649612426758, -11.144052505493164, -10.605456352233887, -10.06686019897461, -9.528263092041016, -8.989665985107422, -8.451069831848145, -7.912473201751709, -7.373876571655273, -6.835279941558838, -6.296683311462402, -5.758086681365967, -5.219490051269531, -4.680893421173096, -4.14229679107666, -3.6037001609802246, -3.065103530883789, -2.5265069007873535, -1.987910270690918, -1.4493136405944824, -0.9107189178466797, -0.37212228775024414, 0.1664743423461914, 0.705070972442627, 1.2436676025390625, 1.782264232635498, 2.3208608627319336, 2.859457492828369, 3.3980541229248047, 3.9366507530212402, 4.475247383117676, 5.013844013214111, 5.552440643310547, 6.091037273406982, 6.629633903503418, 7.1682305335998535, 7.706827163696289, 8.245424270629883, 8.78402042388916, 9.322616577148438, 9.861213684082031, 10.399810791015625, 10.938406944274902, 11.47700309753418, 12.015600204467773, 12.554197311401367, 13.092793464660645, 13.631389617919922, 14.169986724853516, 14.70858383178711, 15.247179985046387, 15.785776138305664, 16.324373245239258]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 14.0, 16.0, 16.0, 25.0, 45.0, 58.0, 79.0, 108.0, 172.0, 266.0, 396.0, 596.0, 998.0, 1451.0, 2503.0, 3734.0, 6284.0, 10698.0, 17478.0, 29304.0, 48740.0, 77279.0, 116948.0, 154322.0, 167137.0, 141915.0, 100627.0, 65354.0, 40144.0, 24464.0, 14424.0, 8743.0, 5369.0, 3277.0, 2002.0, 1253.0, 838.0, 498.0, 329.0, 196.0, 130.0, 101.0, 77.0, 58.0, 31.0, 20.0, 18.0, 11.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.34375, -22.621337890625, -21.89892578125, -21.176513671875, -20.4541015625, -19.731689453125, -19.00927734375, -18.286865234375, -17.564453125, -16.842041015625, -16.11962890625, -15.397216796875, -14.6748046875, -13.952392578125, -13.22998046875, -12.507568359375, -11.78515625, -11.062744140625, -10.34033203125, -9.617919921875, -8.8955078125, -8.173095703125, -7.45068359375, -6.728271484375, -6.005859375, -5.283447265625, -4.56103515625, -3.838623046875, -3.1162109375, -2.393798828125, -1.67138671875, -0.948974609375, -0.2265625, 0.495849609375, 1.21826171875, 1.940673828125, 2.6630859375, 3.385498046875, 4.10791015625, 4.830322265625, 5.552734375, 6.275146484375, 6.99755859375, 7.719970703125, 8.4423828125, 9.164794921875, 9.88720703125, 10.609619140625, 11.33203125, 12.054443359375, 12.77685546875, 13.499267578125, 14.2216796875, 14.944091796875, 15.66650390625, 16.388916015625, 17.111328125, 17.833740234375, 18.55615234375, 19.278564453125, 20.0009765625, 20.723388671875, 21.44580078125, 22.168212890625, 22.890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 3.0, 4.0, 8.0, 14.0, 14.0, 19.0, 18.0, 16.0, 25.0, 36.0, 40.0, 30.0, 37.0, 50.0, 51.0, 36.0, 45.0, 50.0, 60.0, 51.0, 37.0, 51.0, 45.0, 44.0, 28.0, 41.0, 31.0, 27.0, 26.0, 17.0, 9.0, 8.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.609375, -18.951171875, -18.29296875, -17.634765625, -16.9765625, -16.318359375, -15.66015625, -15.001953125, -14.34375, -13.685546875, -13.02734375, -12.369140625, -11.7109375, -11.052734375, -10.39453125, -9.736328125, -9.078125, -8.419921875, -7.76171875, -7.103515625, -6.4453125, -5.787109375, -5.12890625, -4.470703125, -3.8125, -3.154296875, -2.49609375, -1.837890625, -1.1796875, -0.521484375, 0.13671875, 0.794921875, 1.453125, 2.111328125, 2.76953125, 3.427734375, 4.0859375, 4.744140625, 5.40234375, 6.060546875, 6.71875, 7.376953125, 8.03515625, 8.693359375, 9.3515625, 10.009765625, 10.66796875, 11.326171875, 11.984375, 12.642578125, 13.30078125, 13.958984375, 14.6171875, 15.275390625, 15.93359375, 16.591796875, 17.25, 17.908203125, 18.56640625, 19.224609375, 19.8828125, 20.541015625, 21.19921875, 21.857421875, 22.515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 6.0, 19.0, 35.0, 43.0, 55.0, 108.0, 156.0, 241.0, 374.0, 593.0, 1005.0, 1577.0, 2650.0, 4147.0, 6965.0, 11021.0, 18442.0, 28703.0, 45381.0, 69061.0, 99694.0, 130789.0, 147207.0, 139926.0, 112702.0, 80903.0, 54508.0, 34617.0, 22066.0, 13531.0, 8324.0, 5238.0, 3180.0, 1981.0, 1296.0, 761.0, 448.0, 300.0, 160.0, 135.0, 86.0, 52.0, 25.0, 19.0, 13.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.65625, -17.099365234375, -16.54248046875, -15.985595703125, -15.4287109375, -14.871826171875, -14.31494140625, -13.758056640625, -13.201171875, -12.644287109375, -12.08740234375, -11.530517578125, -10.9736328125, -10.416748046875, -9.85986328125, -9.302978515625, -8.74609375, -8.189208984375, -7.63232421875, -7.075439453125, -6.5185546875, -5.961669921875, -5.40478515625, -4.847900390625, -4.291015625, -3.734130859375, -3.17724609375, -2.620361328125, -2.0634765625, -1.506591796875, -0.94970703125, -0.392822265625, 0.1640625, 0.720947265625, 1.27783203125, 1.834716796875, 2.3916015625, 2.948486328125, 3.50537109375, 4.062255859375, 4.619140625, 5.176025390625, 5.73291015625, 6.289794921875, 6.8466796875, 7.403564453125, 7.96044921875, 8.517333984375, 9.07421875, 9.631103515625, 10.18798828125, 10.744873046875, 11.3017578125, 11.858642578125, 12.41552734375, 12.972412109375, 13.529296875, 14.086181640625, 14.64306640625, 15.199951171875, 15.7568359375, 16.313720703125, 16.87060546875, 17.427490234375, 17.984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 17.0, 13.0, 17.0, 25.0, 25.0, 34.0, 36.0, 24.0, 39.0, 34.0, 34.0, 40.0, 45.0, 55.0, 50.0, 40.0, 48.0, 33.0, 41.0, 37.0, 39.0, 28.0, 29.0, 31.0, 21.0, 24.0, 18.0, 23.0, 18.0, 9.0, 13.0, 7.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.046875, -11.6805419921875, -11.314208984375, -10.9478759765625, -10.58154296875, -10.2152099609375, -9.848876953125, -9.4825439453125, -9.1162109375, -8.7498779296875, -8.383544921875, -8.0172119140625, -7.65087890625, -7.2845458984375, -6.918212890625, -6.5518798828125, -6.185546875, -5.8192138671875, -5.452880859375, -5.0865478515625, -4.72021484375, -4.3538818359375, -3.987548828125, -3.6212158203125, -3.2548828125, -2.8885498046875, -2.522216796875, -2.1558837890625, -1.78955078125, -1.4232177734375, -1.056884765625, -0.6905517578125, -0.32421875, 0.0421142578125, 0.408447265625, 0.7747802734375, 1.14111328125, 1.5074462890625, 1.873779296875, 2.2401123046875, 2.6064453125, 2.9727783203125, 3.339111328125, 3.7054443359375, 4.07177734375, 4.4381103515625, 4.804443359375, 5.1707763671875, 5.537109375, 5.9034423828125, 6.269775390625, 6.6361083984375, 7.00244140625, 7.3687744140625, 7.735107421875, 8.1014404296875, 8.4677734375, 8.8341064453125, 9.200439453125, 9.5667724609375, 9.93310546875, 10.2994384765625, 10.665771484375, 11.0321044921875, 11.3984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 22.0, 31.0, 51.0, 66.0, 99.0, 113.0, 175.0, 275.0, 353.0, 531.0, 847.0, 1348.0, 2094.0, 3087.0, 4952.0, 7676.0, 12482.0, 19936.0, 32705.0, 54208.0, 88267.0, 135683.0, 177069.0, 171387.0, 125971.0, 80762.0, 49143.0, 29690.0, 18351.0, 11241.0, 7040.0, 4406.0, 2805.0, 1895.0, 1206.0, 795.0, 561.0, 364.0, 242.0, 158.0, 124.0, 95.0, 56.0, 48.0, 32.0, 16.0, 16.0, 14.0, 13.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0], "bins": [-14.3359375, -13.8865966796875, -13.437255859375, -12.9879150390625, -12.53857421875, -12.0892333984375, -11.639892578125, -11.1905517578125, -10.7412109375, -10.2918701171875, -9.842529296875, -9.3931884765625, -8.94384765625, -8.4945068359375, -8.045166015625, -7.5958251953125, -7.146484375, -6.6971435546875, -6.247802734375, -5.7984619140625, -5.34912109375, -4.8997802734375, -4.450439453125, -4.0010986328125, -3.5517578125, -3.1024169921875, -2.653076171875, -2.2037353515625, -1.75439453125, -1.3050537109375, -0.855712890625, -0.4063720703125, 0.04296875, 0.4923095703125, 0.941650390625, 1.3909912109375, 1.84033203125, 2.2896728515625, 2.739013671875, 3.1883544921875, 3.6376953125, 4.0870361328125, 4.536376953125, 4.9857177734375, 5.43505859375, 5.8843994140625, 6.333740234375, 6.7830810546875, 7.232421875, 7.6817626953125, 8.131103515625, 8.5804443359375, 9.02978515625, 9.4791259765625, 9.928466796875, 10.3778076171875, 10.8271484375, 11.2764892578125, 11.725830078125, 12.1751708984375, 12.62451171875, 13.0738525390625, 13.523193359375, 13.9725341796875, 14.421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 7.0, 9.0, 5.0, 11.0, 20.0, 26.0, 39.0, 71.0, 85.0, 106.0, 122.0, 120.0, 75.0, 91.0, 69.0, 43.0, 26.0, 20.0, 10.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020427703857421875, -0.001950383186340332, -0.0018579959869384766, -0.001765608787536621, -0.0016732215881347656, -0.0015808343887329102, -0.0014884471893310547, -0.0013960599899291992, -0.0013036727905273438, -0.0012112855911254883, -0.0011188983917236328, -0.0010265111923217773, -0.0009341239929199219, -0.0008417367935180664, -0.0007493495941162109, -0.0006569623947143555, -0.0005645751953125, -0.00047218799591064453, -0.00037980079650878906, -0.0002874135971069336, -0.00019502639770507812, -0.00010263919830322266, -1.0251998901367188e-05, 8.213520050048828e-05, 0.00017452239990234375, 0.0002669095993041992, 0.0003592967987060547, 0.00045168399810791016, 0.0005440711975097656, 0.0006364583969116211, 0.0007288455963134766, 0.000821232795715332, 0.0009136199951171875, 0.001006007194519043, 0.0010983943939208984, 0.001190781593322754, 0.0012831687927246094, 0.0013755559921264648, 0.0014679431915283203, 0.0015603303909301758, 0.0016527175903320312, 0.0017451047897338867, 0.0018374919891357422, 0.0019298791885375977, 0.002022266387939453, 0.0021146535873413086, 0.002207040786743164, 0.0022994279861450195, 0.002391815185546875, 0.0024842023849487305, 0.002576589584350586, 0.0026689767837524414, 0.002761363983154297, 0.0028537511825561523, 0.002946138381958008, 0.0030385255813598633, 0.0031309127807617188, 0.0032232999801635742, 0.0033156871795654297, 0.003408074378967285, 0.0035004615783691406, 0.003592848777770996, 0.0036852359771728516, 0.003777623176574707, 0.0038700103759765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 17.0, 13.0, 21.0, 26.0, 29.0, 47.0, 85.0, 99.0, 150.0, 202.0, 290.0, 428.0, 618.0, 843.0, 1318.0, 1760.0, 2532.0, 3865.0, 5603.0, 8622.0, 13282.0, 20747.0, 32771.0, 52461.0, 81896.0, 120894.0, 155094.0, 160105.0, 130547.0, 91537.0, 58735.0, 36745.0, 23081.0, 14776.0, 9434.0, 6273.0, 4285.0, 2869.0, 1903.0, 1338.0, 931.0, 687.0, 498.0, 338.0, 242.0, 162.0, 115.0, 89.0, 42.0, 35.0, 31.0, 12.0, 20.0, 7.0, 8.0, 1.0, 5.0, 0.0, 1.0], "bins": [-12.1484375, -11.770263671875, -11.39208984375, -11.013916015625, -10.6357421875, -10.257568359375, -9.87939453125, -9.501220703125, -9.123046875, -8.744873046875, -8.36669921875, -7.988525390625, -7.6103515625, -7.232177734375, -6.85400390625, -6.475830078125, -6.09765625, -5.719482421875, -5.34130859375, -4.963134765625, -4.5849609375, -4.206787109375, -3.82861328125, -3.450439453125, -3.072265625, -2.694091796875, -2.31591796875, -1.937744140625, -1.5595703125, -1.181396484375, -0.80322265625, -0.425048828125, -0.046875, 0.331298828125, 0.70947265625, 1.087646484375, 1.4658203125, 1.843994140625, 2.22216796875, 2.600341796875, 2.978515625, 3.356689453125, 3.73486328125, 4.113037109375, 4.4912109375, 4.869384765625, 5.24755859375, 5.625732421875, 6.00390625, 6.382080078125, 6.76025390625, 7.138427734375, 7.5166015625, 7.894775390625, 8.27294921875, 8.651123046875, 9.029296875, 9.407470703125, 9.78564453125, 10.163818359375, 10.5419921875, 10.920166015625, 11.29833984375, 11.676513671875, 12.0546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 20.0, 17.0, 26.0, 23.0, 34.0, 39.0, 44.0, 55.0, 63.0, 52.0, 59.0, 72.0, 41.0, 48.0, 47.0, 47.0, 32.0, 26.0, 43.0, 17.0, 29.0, 24.0, 14.0, 12.0, 15.0, 13.0, 8.0, 5.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 3.0, 3.0], "bins": [-5.84765625, -5.699462890625, -5.55126953125, -5.403076171875, -5.2548828125, -5.106689453125, -4.95849609375, -4.810302734375, -4.662109375, -4.513916015625, -4.36572265625, -4.217529296875, -4.0693359375, -3.921142578125, -3.77294921875, -3.624755859375, -3.4765625, -3.328369140625, -3.18017578125, -3.031982421875, -2.8837890625, -2.735595703125, -2.58740234375, -2.439208984375, -2.291015625, -2.142822265625, -1.99462890625, -1.846435546875, -1.6982421875, -1.550048828125, -1.40185546875, -1.253662109375, -1.10546875, -0.957275390625, -0.80908203125, -0.660888671875, -0.5126953125, -0.364501953125, -0.21630859375, -0.068115234375, 0.080078125, 0.228271484375, 0.37646484375, 0.524658203125, 0.6728515625, 0.821044921875, 0.96923828125, 1.117431640625, 1.265625, 1.413818359375, 1.56201171875, 1.710205078125, 1.8583984375, 2.006591796875, 2.15478515625, 2.302978515625, 2.451171875, 2.599365234375, 2.74755859375, 2.895751953125, 3.0439453125, 3.192138671875, 3.34033203125, 3.488525390625, 3.63671875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 9.0, 18.0, 22.0, 21.0, 25.0, 21.0, 46.0, 45.0, 49.0, 49.0, 62.0, 58.0, 68.0, 76.0, 57.0, 59.0, 45.0, 63.0, 36.0, 34.0, 29.0, 29.0, 16.0, 8.0, 14.0, 8.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.97602081298828, -30.03790283203125, -29.09978485107422, -28.161666870117188, -27.223548889160156, -26.285430908203125, -25.347312927246094, -24.409194946289062, -23.47107696533203, -22.532958984375, -21.59484100341797, -20.656723022460938, -19.718605041503906, -18.780487060546875, -17.842369079589844, -16.904251098632812, -15.966133117675781, -15.02801513671875, -14.089897155761719, -13.151779174804688, -12.213661193847656, -11.275543212890625, -10.337425231933594, -9.399307250976562, -8.461189270019531, -7.5230712890625, -6.584953308105469, -5.6468353271484375, -4.708717346191406, -3.770599365234375, -2.8324813842773438, -1.8943634033203125, -0.9562473297119141, -0.018129348754882812, 0.9199886322021484, 1.8581066131591797, 2.796224594116211, 3.734342575073242, 4.672460556030273, 5.610578536987305, 6.548696517944336, 7.486814498901367, 8.424932479858398, 9.36305046081543, 10.301168441772461, 11.239286422729492, 12.177404403686523, 13.115522384643555, 14.053640365600586, 14.991758346557617, 15.929876327514648, 16.86799430847168, 17.80611228942871, 18.744230270385742, 19.682348251342773, 20.620466232299805, 21.558584213256836, 22.496702194213867, 23.4348201751709, 24.37293815612793, 25.31105613708496, 26.249174118041992, 27.187292098999023, 28.125410079956055, 29.063528060913086]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0, 4.0, 5.0, 7.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 24.0, 34.0, 20.0, 23.0, 31.0, 31.0, 45.0, 40.0, 33.0, 34.0, 45.0, 32.0, 37.0, 53.0, 50.0, 29.0, 44.0, 34.0, 33.0, 42.0, 18.0, 26.0, 27.0, 19.0, 20.0, 14.0, 13.0, 14.0, 2.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-17.848920822143555, -17.321720123291016, -16.79452133178711, -16.26732063293457, -15.740120887756348, -15.212921142578125, -14.685720443725586, -14.158520698547363, -13.63132095336914, -13.104121208190918, -12.576921463012695, -12.049720764160156, -11.522521018981934, -10.995321273803711, -10.468120574951172, -9.94092082977295, -9.413721084594727, -8.886521339416504, -8.359321594238281, -7.832120895385742, -7.3049211502075195, -6.777721405029297, -6.250521183013916, -5.723320960998535, -5.1961212158203125, -4.66892147064209, -4.141721248626709, -3.6145212650299072, -3.0873212814331055, -2.5601212978363037, -2.032921314239502, -1.5057213306427002, -0.9785223007202148, -0.4513223171234131, 0.07587766647338867, 0.6030776500701904, 1.1302776336669922, 1.657477617263794, 2.1846776008605957, 2.7118775844573975, 3.239077568054199, 3.766277551651001, 4.293477535247803, 4.820677757263184, 5.347877502441406, 5.875077247619629, 6.40227746963501, 6.929477691650391, 7.456677436828613, 7.983877182006836, 8.511077880859375, 9.038277626037598, 9.56547737121582, 10.092677116394043, 10.619876861572266, 11.147077560424805, 11.674277305603027, 12.20147705078125, 12.728677749633789, 13.255877494812012, 13.783077239990234, 14.310276985168457, 14.83747673034668, 15.364677429199219, 15.891877174377441]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 9.0, 22.0, 28.0, 38.0, 43.0, 98.0, 137.0, 217.0, 296.0, 468.0, 752.0, 1148.0, 1680.0, 2782.0, 4465.0, 7223.0, 11697.0, 20046.0, 34415.0, 61549.0, 111691.0, 211138.0, 403587.0, 699685.0, 898662.0, 747450.0, 447110.0, 237355.0, 125895.0, 68493.0, 38589.0, 22362.0, 13181.0, 8233.0, 5059.0, 3196.0, 1963.0, 1281.0, 795.0, 513.0, 335.0, 214.0, 131.0, 90.0, 62.0, 34.0, 24.0, 13.0, 10.0, 10.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-19.390625, -18.795654296875, -18.20068359375, -17.605712890625, -17.0107421875, -16.415771484375, -15.82080078125, -15.225830078125, -14.630859375, -14.035888671875, -13.44091796875, -12.845947265625, -12.2509765625, -11.656005859375, -11.06103515625, -10.466064453125, -9.87109375, -9.276123046875, -8.68115234375, -8.086181640625, -7.4912109375, -6.896240234375, -6.30126953125, -5.706298828125, -5.111328125, -4.516357421875, -3.92138671875, -3.326416015625, -2.7314453125, -2.136474609375, -1.54150390625, -0.946533203125, -0.3515625, 0.243408203125, 0.83837890625, 1.433349609375, 2.0283203125, 2.623291015625, 3.21826171875, 3.813232421875, 4.408203125, 5.003173828125, 5.59814453125, 6.193115234375, 6.7880859375, 7.383056640625, 7.97802734375, 8.572998046875, 9.16796875, 9.762939453125, 10.35791015625, 10.952880859375, 11.5478515625, 12.142822265625, 12.73779296875, 13.332763671875, 13.927734375, 14.522705078125, 15.11767578125, 15.712646484375, 16.3076171875, 16.902587890625, 17.49755859375, 18.092529296875, 18.6875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 8.0, 9.0, 7.0, 12.0, 12.0, 17.0, 18.0, 30.0, 22.0, 24.0, 31.0, 36.0, 40.0, 31.0, 40.0, 31.0, 43.0, 52.0, 34.0, 55.0, 41.0, 35.0, 35.0, 31.0, 38.0, 31.0, 33.0, 34.0, 29.0, 25.0, 19.0, 21.0, 14.0, 12.0, 11.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9088134765625, -10.528564453125, -10.1483154296875, -9.76806640625, -9.3878173828125, -9.007568359375, -8.6273193359375, -8.2470703125, -7.8668212890625, -7.486572265625, -7.1063232421875, -6.72607421875, -6.3458251953125, -5.965576171875, -5.5853271484375, -5.205078125, -4.8248291015625, -4.444580078125, -4.0643310546875, -3.68408203125, -3.3038330078125, -2.923583984375, -2.5433349609375, -2.1630859375, -1.7828369140625, -1.402587890625, -1.0223388671875, -0.64208984375, -0.2618408203125, 0.118408203125, 0.4986572265625, 0.87890625, 1.2591552734375, 1.639404296875, 2.0196533203125, 2.39990234375, 2.7801513671875, 3.160400390625, 3.5406494140625, 3.9208984375, 4.3011474609375, 4.681396484375, 5.0616455078125, 5.44189453125, 5.8221435546875, 6.202392578125, 6.5826416015625, 6.962890625, 7.3431396484375, 7.723388671875, 8.1036376953125, 8.48388671875, 8.8641357421875, 9.244384765625, 9.6246337890625, 10.0048828125, 10.3851318359375, 10.765380859375, 11.1456298828125, 11.52587890625, 11.9061279296875, 12.286376953125, 12.6666259765625, 13.046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 8.0, 25.0, 30.0, 42.0, 60.0, 101.0, 187.0, 292.0, 416.0, 651.0, 1018.0, 1564.0, 2576.0, 4263.0, 6923.0, 11905.0, 19841.0, 33560.0, 58908.0, 104026.0, 184420.0, 324443.0, 541175.0, 770886.0, 782593.0, 558549.0, 337277.0, 192609.0, 108068.0, 61466.0, 35211.0, 20470.0, 12014.0, 7128.0, 4374.0, 2712.0, 1628.0, 991.0, 682.0, 424.0, 270.0, 172.0, 100.0, 75.0, 53.0, 25.0, 25.0, 15.0, 16.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.08349609375, -16.4951171875, -15.90673828125, -15.318359375, -14.72998046875, -14.1416015625, -13.55322265625, -12.96484375, -12.37646484375, -11.7880859375, -11.19970703125, -10.611328125, -10.02294921875, -9.4345703125, -8.84619140625, -8.2578125, -7.66943359375, -7.0810546875, -6.49267578125, -5.904296875, -5.31591796875, -4.7275390625, -4.13916015625, -3.55078125, -2.96240234375, -2.3740234375, -1.78564453125, -1.197265625, -0.60888671875, -0.0205078125, 0.56787109375, 1.15625, 1.74462890625, 2.3330078125, 2.92138671875, 3.509765625, 4.09814453125, 4.6865234375, 5.27490234375, 5.86328125, 6.45166015625, 7.0400390625, 7.62841796875, 8.216796875, 8.80517578125, 9.3935546875, 9.98193359375, 10.5703125, 11.15869140625, 11.7470703125, 12.33544921875, 12.923828125, 13.51220703125, 14.1005859375, 14.68896484375, 15.27734375, 15.86572265625, 16.4541015625, 17.04248046875, 17.630859375, 18.21923828125, 18.8076171875, 19.39599609375, 19.984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 11.0, 14.0, 13.0, 19.0, 20.0, 28.0, 44.0, 48.0, 42.0, 61.0, 82.0, 94.0, 95.0, 120.0, 153.0, 162.0, 204.0, 194.0, 225.0, 236.0, 257.0, 215.0, 227.0, 192.0, 205.0, 181.0, 137.0, 133.0, 95.0, 92.0, 91.0, 76.0, 55.0, 55.0, 38.0, 23.0, 26.0, 13.0, 16.0, 14.0, 17.0, 7.0, 3.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0], "bins": [-5.875, -5.6947021484375, -5.514404296875, -5.3341064453125, -5.15380859375, -4.9735107421875, -4.793212890625, -4.6129150390625, -4.4326171875, -4.2523193359375, -4.072021484375, -3.8917236328125, -3.71142578125, -3.5311279296875, -3.350830078125, -3.1705322265625, -2.990234375, -2.8099365234375, -2.629638671875, -2.4493408203125, -2.26904296875, -2.0887451171875, -1.908447265625, -1.7281494140625, -1.5478515625, -1.3675537109375, -1.187255859375, -1.0069580078125, -0.82666015625, -0.6463623046875, -0.466064453125, -0.2857666015625, -0.10546875, 0.0748291015625, 0.255126953125, 0.4354248046875, 0.61572265625, 0.7960205078125, 0.976318359375, 1.1566162109375, 1.3369140625, 1.5172119140625, 1.697509765625, 1.8778076171875, 2.05810546875, 2.2384033203125, 2.418701171875, 2.5989990234375, 2.779296875, 2.9595947265625, 3.139892578125, 3.3201904296875, 3.50048828125, 3.6807861328125, 3.861083984375, 4.0413818359375, 4.2216796875, 4.4019775390625, 4.582275390625, 4.7625732421875, 4.94287109375, 5.1231689453125, 5.303466796875, 5.4837646484375, 5.6640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 7.0, 7.0, 6.0, 13.0, 15.0, 26.0, 28.0, 36.0, 41.0, 53.0, 51.0, 75.0, 86.0, 73.0, 88.0, 52.0, 74.0, 50.0, 48.0, 33.0, 32.0, 21.0, 26.0, 4.0, 16.0, 12.0, 7.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.978443145751953, -29.03729820251465, -28.09615135192871, -27.155006408691406, -26.2138614654541, -25.272716522216797, -24.33156967163086, -23.390424728393555, -22.44927978515625, -21.508134841918945, -20.566987991333008, -19.625843048095703, -18.6846981048584, -17.743553161621094, -16.802406311035156, -15.861261367797852, -14.920114517211914, -13.978968620300293, -13.037823677062988, -12.096677780151367, -11.155532836914062, -10.214386940002441, -9.27324104309082, -8.332096099853516, -7.3909502029418945, -6.449804782867432, -5.508659362792969, -4.567513465881348, -3.6263680458068848, -2.685222625732422, -1.7440767288208008, -0.8029313087463379, 0.1382160186767578, 1.0793615579605103, 2.0205070972442627, 2.9616527557373047, 3.9027981758117676, 4.8439435958862305, 5.785089492797852, 6.7262349128723145, 7.667380332946777, 8.608526229858398, 9.549671173095703, 10.490817070007324, 11.431962966918945, 12.37310791015625, 13.314253807067871, 14.255399703979492, 15.196544647216797, 16.1376895904541, 17.07883644104004, 18.019981384277344, 18.96112632751465, 19.902271270751953, 20.84341812133789, 21.784563064575195, 22.7257080078125, 23.666852951049805, 24.607999801635742, 25.549144744873047, 26.49028968811035, 27.431434631347656, 28.372581481933594, 29.3137264251709, 30.254873275756836]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 5.0, 14.0, 9.0, 20.0, 17.0, 22.0, 16.0, 32.0, 18.0, 24.0, 36.0, 31.0, 42.0, 38.0, 40.0, 41.0, 47.0, 47.0, 52.0, 50.0, 40.0, 38.0, 32.0, 40.0, 32.0, 29.0, 24.0, 23.0, 24.0, 16.0, 15.0, 16.0, 9.0, 9.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.447772026062012, -15.009613037109375, -14.571454048156738, -14.133295059204102, -13.695135116577148, -13.256977081298828, -12.818817138671875, -12.380658149719238, -11.942499160766602, -11.504340171813965, -11.066181182861328, -10.628022193908691, -10.189863204956055, -9.751703262329102, -9.313544273376465, -8.875385284423828, -8.437226295471191, -7.999067306518555, -7.560908317565918, -7.122748851776123, -6.684589862823486, -6.24643087387085, -5.808271408081055, -5.370112419128418, -4.931953430175781, -4.4937944412231445, -4.055635452270508, -3.617475986480713, -3.179316997528076, -2.7411580085754395, -2.3029987812042236, -1.8648395538330078, -1.426680564880371, -0.9885214567184448, -0.5503623485565186, -0.11220324039459229, 0.325955867767334, 0.7641148567199707, 1.2022740840911865, 1.6404333114624023, 2.078592300415039, 2.516751289367676, 2.9549105167388916, 3.3930697441101074, 3.831228733062744, 4.269387722015381, 4.707547187805176, 5.1457061767578125, 5.583865165710449, 6.022024154663086, 6.460183143615723, 6.898342609405518, 7.336501598358154, 7.774660587310791, 8.212820053100586, 8.650979042053223, 9.08913803100586, 9.527297019958496, 9.965456008911133, 10.40361499786377, 10.841773986816406, 11.27993392944336, 11.718092918395996, 12.156251907348633, 12.59441089630127]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 22.0, 30.0, 39.0, 68.0, 99.0, 138.0, 255.0, 418.0, 708.0, 1266.0, 2312.0, 4535.0, 9445.0, 19870.0, 42956.0, 88470.0, 161694.0, 228097.0, 212543.0, 137940.0, 71881.0, 34063.0, 15960.0, 7550.0, 3625.0, 2004.0, 1014.0, 584.0, 394.0, 186.0, 130.0, 71.0, 53.0, 25.0, 25.0, 23.0, 20.0, 6.0, 3.0, 7.0, 7.0, 3.0, 1.0], "bins": [-23.21875, -22.62109375, -22.0234375, -21.42578125, -20.828125, -20.23046875, -19.6328125, -19.03515625, -18.4375, -17.83984375, -17.2421875, -16.64453125, -16.046875, -15.44921875, -14.8515625, -14.25390625, -13.65625, -13.05859375, -12.4609375, -11.86328125, -11.265625, -10.66796875, -10.0703125, -9.47265625, -8.875, -8.27734375, -7.6796875, -7.08203125, -6.484375, -5.88671875, -5.2890625, -4.69140625, -4.09375, -3.49609375, -2.8984375, -2.30078125, -1.703125, -1.10546875, -0.5078125, 0.08984375, 0.6875, 1.28515625, 1.8828125, 2.48046875, 3.078125, 3.67578125, 4.2734375, 4.87109375, 5.46875, 6.06640625, 6.6640625, 7.26171875, 7.859375, 8.45703125, 9.0546875, 9.65234375, 10.25, 10.84765625, 11.4453125, 12.04296875, 12.640625, 13.23828125, 13.8359375, 14.43359375, 15.03125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 2.0, 9.0, 7.0, 10.0, 14.0, 17.0, 13.0, 24.0, 27.0, 23.0, 30.0, 25.0, 33.0, 34.0, 44.0, 32.0, 38.0, 46.0, 45.0, 48.0, 46.0, 40.0, 38.0, 40.0, 33.0, 32.0, 39.0, 24.0, 18.0, 31.0, 29.0, 20.0, 17.0, 17.0, 10.0, 4.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0], "bins": [-16.59375, -16.1480712890625, -15.702392578125, -15.2567138671875, -14.81103515625, -14.3653564453125, -13.919677734375, -13.4739990234375, -13.0283203125, -12.5826416015625, -12.136962890625, -11.6912841796875, -11.24560546875, -10.7999267578125, -10.354248046875, -9.9085693359375, -9.462890625, -9.0172119140625, -8.571533203125, -8.1258544921875, -7.68017578125, -7.2344970703125, -6.788818359375, -6.3431396484375, -5.8974609375, -5.4517822265625, -5.006103515625, -4.5604248046875, -4.11474609375, -3.6690673828125, -3.223388671875, -2.7777099609375, -2.33203125, -1.8863525390625, -1.440673828125, -0.9949951171875, -0.54931640625, -0.1036376953125, 0.342041015625, 0.7877197265625, 1.2333984375, 1.6790771484375, 2.124755859375, 2.5704345703125, 3.01611328125, 3.4617919921875, 3.907470703125, 4.3531494140625, 4.798828125, 5.2445068359375, 5.690185546875, 6.1358642578125, 6.58154296875, 7.0272216796875, 7.472900390625, 7.9185791015625, 8.3642578125, 8.8099365234375, 9.255615234375, 9.7012939453125, 10.14697265625, 10.5926513671875, 11.038330078125, 11.4840087890625, 11.9296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 2.0, 12.0, 12.0, 11.0, 27.0, 34.0, 51.0, 70.0, 120.0, 200.0, 327.0, 526.0, 982.0, 1755.0, 3346.0, 6190.0, 13110.0, 27371.0, 60249.0, 127837.0, 236837.0, 266083.0, 159365.0, 75566.0, 35308.0, 16326.0, 7895.0, 4046.0, 2102.0, 1132.0, 619.0, 373.0, 242.0, 169.0, 88.0, 48.0, 49.0, 19.0, 14.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.296875, -22.59423828125, -21.8916015625, -21.18896484375, -20.486328125, -19.78369140625, -19.0810546875, -18.37841796875, -17.67578125, -16.97314453125, -16.2705078125, -15.56787109375, -14.865234375, -14.16259765625, -13.4599609375, -12.75732421875, -12.0546875, -11.35205078125, -10.6494140625, -9.94677734375, -9.244140625, -8.54150390625, -7.8388671875, -7.13623046875, -6.43359375, -5.73095703125, -5.0283203125, -4.32568359375, -3.623046875, -2.92041015625, -2.2177734375, -1.51513671875, -0.8125, -0.10986328125, 0.5927734375, 1.29541015625, 1.998046875, 2.70068359375, 3.4033203125, 4.10595703125, 4.80859375, 5.51123046875, 6.2138671875, 6.91650390625, 7.619140625, 8.32177734375, 9.0244140625, 9.72705078125, 10.4296875, 11.13232421875, 11.8349609375, 12.53759765625, 13.240234375, 13.94287109375, 14.6455078125, 15.34814453125, 16.05078125, 16.75341796875, 17.4560546875, 18.15869140625, 18.861328125, 19.56396484375, 20.2666015625, 20.96923828125, 21.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 9.0, 8.0, 11.0, 12.0, 10.0, 19.0, 16.0, 17.0, 20.0, 20.0, 27.0, 27.0, 29.0, 29.0, 34.0, 32.0, 40.0, 38.0, 36.0, 42.0, 39.0, 32.0, 41.0, 34.0, 39.0, 37.0, 38.0, 37.0, 31.0, 27.0, 28.0, 20.0, 15.0, 14.0, 10.0, 8.0, 18.0, 8.0, 7.0, 3.0, 6.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.0711669921875, -6.829833984375, -6.5885009765625, -6.34716796875, -6.1058349609375, -5.864501953125, -5.6231689453125, -5.3818359375, -5.1405029296875, -4.899169921875, -4.6578369140625, -4.41650390625, -4.1751708984375, -3.933837890625, -3.6925048828125, -3.451171875, -3.2098388671875, -2.968505859375, -2.7271728515625, -2.48583984375, -2.2445068359375, -2.003173828125, -1.7618408203125, -1.5205078125, -1.2791748046875, -1.037841796875, -0.7965087890625, -0.55517578125, -0.3138427734375, -0.072509765625, 0.1688232421875, 0.41015625, 0.6514892578125, 0.892822265625, 1.1341552734375, 1.37548828125, 1.6168212890625, 1.858154296875, 2.0994873046875, 2.3408203125, 2.5821533203125, 2.823486328125, 3.0648193359375, 3.30615234375, 3.5474853515625, 3.788818359375, 4.0301513671875, 4.271484375, 4.5128173828125, 4.754150390625, 4.9954833984375, 5.23681640625, 5.4781494140625, 5.719482421875, 5.9608154296875, 6.2021484375, 6.4434814453125, 6.684814453125, 6.9261474609375, 7.16748046875, 7.4088134765625, 7.650146484375, 7.8914794921875, 8.1328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 14.0, 12.0, 26.0, 40.0, 70.0, 109.0, 170.0, 247.0, 388.0, 634.0, 1020.0, 1881.0, 3208.0, 5762.0, 10770.0, 21674.0, 45625.0, 100446.0, 214045.0, 293346.0, 185170.0, 84835.0, 38826.0, 18645.0, 9446.0, 5219.0, 2752.0, 1606.0, 964.0, 595.0, 354.0, 220.0, 155.0, 80.0, 60.0, 44.0, 23.0, 23.0, 7.0, 13.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.35302734375, -10.9794921875, -10.60595703125, -10.232421875, -9.85888671875, -9.4853515625, -9.11181640625, -8.73828125, -8.36474609375, -7.9912109375, -7.61767578125, -7.244140625, -6.87060546875, -6.4970703125, -6.12353515625, -5.75, -5.37646484375, -5.0029296875, -4.62939453125, -4.255859375, -3.88232421875, -3.5087890625, -3.13525390625, -2.76171875, -2.38818359375, -2.0146484375, -1.64111328125, -1.267578125, -0.89404296875, -0.5205078125, -0.14697265625, 0.2265625, 0.60009765625, 0.9736328125, 1.34716796875, 1.720703125, 2.09423828125, 2.4677734375, 2.84130859375, 3.21484375, 3.58837890625, 3.9619140625, 4.33544921875, 4.708984375, 5.08251953125, 5.4560546875, 5.82958984375, 6.203125, 6.57666015625, 6.9501953125, 7.32373046875, 7.697265625, 8.07080078125, 8.4443359375, 8.81787109375, 9.19140625, 9.56494140625, 9.9384765625, 10.31201171875, 10.685546875, 11.05908203125, 11.4326171875, 11.80615234375, 12.1796875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 8.0, 11.0, 7.0, 15.0, 8.0, 31.0, 33.0, 50.0, 46.0, 44.0, 64.0, 53.0, 73.0, 64.0, 66.0, 63.0, 52.0, 62.0, 54.0, 36.0, 25.0, 28.0, 22.0, 23.0, 14.0, 9.0, 5.0, 6.0, 3.0, 6.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004525184631347656, -0.0004387795925140381, -0.00042504072189331055, -0.000411301851272583, -0.00039756298065185547, -0.00038382411003112793, -0.0003700852394104004, -0.00035634636878967285, -0.0003426074981689453, -0.0003288686275482178, -0.00031512975692749023, -0.0003013908863067627, -0.00028765201568603516, -0.0002739131450653076, -0.0002601742744445801, -0.00024643540382385254, -0.000232696533203125, -0.00021895766258239746, -0.00020521879196166992, -0.00019147992134094238, -0.00017774105072021484, -0.0001640021800994873, -0.00015026330947875977, -0.00013652443885803223, -0.0001227855682373047, -0.00010904669761657715, -9.530782699584961e-05, -8.156895637512207e-05, -6.783008575439453e-05, -5.409121513366699e-05, -4.035234451293945e-05, -2.6613473892211914e-05, -1.2874603271484375e-05, 8.642673492431641e-07, 1.4603137969970703e-05, 2.8342008590698242e-05, 4.208087921142578e-05, 5.581974983215332e-05, 6.955862045288086e-05, 8.32974910736084e-05, 9.703636169433594e-05, 0.00011077523231506348, 0.00012451410293579102, 0.00013825297355651855, 0.0001519918441772461, 0.00016573071479797363, 0.00017946958541870117, 0.0001932084560394287, 0.00020694732666015625, 0.0002206861972808838, 0.00023442506790161133, 0.00024816393852233887, 0.0002619028091430664, 0.00027564167976379395, 0.0002893805503845215, 0.000303119421005249, 0.00031685829162597656, 0.0003305971622467041, 0.00034433603286743164, 0.0003580749034881592, 0.0003718137741088867, 0.00038555264472961426, 0.0003992915153503418, 0.00041303038597106934, 0.0004267692565917969]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 15.0, 17.0, 21.0, 32.0, 51.0, 68.0, 109.0, 175.0, 263.0, 444.0, 729.0, 1176.0, 1987.0, 3424.0, 5740.0, 10252.0, 18431.0, 33547.0, 59727.0, 101245.0, 153565.0, 188641.0, 172928.0, 123220.0, 75111.0, 42843.0, 23817.0, 13081.0, 7376.0, 4215.0, 2496.0, 1510.0, 816.0, 550.0, 356.0, 202.0, 123.0, 93.0, 45.0, 36.0, 24.0, 16.0, 12.0, 6.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.97613525390625, -6.7413330078125, -6.50653076171875, -6.271728515625, -6.03692626953125, -5.8021240234375, -5.56732177734375, -5.33251953125, -5.09771728515625, -4.8629150390625, -4.62811279296875, -4.393310546875, -4.15850830078125, -3.9237060546875, -3.68890380859375, -3.4541015625, -3.21929931640625, -2.9844970703125, -2.74969482421875, -2.514892578125, -2.28009033203125, -2.0452880859375, -1.81048583984375, -1.57568359375, -1.34088134765625, -1.1060791015625, -0.87127685546875, -0.636474609375, -0.40167236328125, -0.1668701171875, 0.06793212890625, 0.302734375, 0.53753662109375, 0.7723388671875, 1.00714111328125, 1.241943359375, 1.47674560546875, 1.7115478515625, 1.94635009765625, 2.18115234375, 2.41595458984375, 2.6507568359375, 2.88555908203125, 3.120361328125, 3.35516357421875, 3.5899658203125, 3.82476806640625, 4.0595703125, 4.29437255859375, 4.5291748046875, 4.76397705078125, 4.998779296875, 5.23358154296875, 5.4683837890625, 5.70318603515625, 5.93798828125, 6.17279052734375, 6.4075927734375, 6.64239501953125, 6.877197265625, 7.11199951171875, 7.3468017578125, 7.58160400390625, 7.81640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 12.0, 15.0, 18.0, 18.0, 25.0, 35.0, 43.0, 33.0, 38.0, 53.0, 47.0, 51.0, 59.0, 56.0, 54.0, 54.0, 54.0, 46.0, 33.0, 42.0, 29.0, 22.0, 22.0, 17.0, 16.0, 14.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.125, -2.058868408203125, -1.99273681640625, -1.926605224609375, -1.8604736328125, -1.794342041015625, -1.72821044921875, -1.662078857421875, -1.595947265625, -1.529815673828125, -1.46368408203125, -1.397552490234375, -1.3314208984375, -1.265289306640625, -1.19915771484375, -1.133026123046875, -1.06689453125, -1.000762939453125, -0.93463134765625, -0.868499755859375, -0.8023681640625, -0.736236572265625, -0.67010498046875, -0.603973388671875, -0.537841796875, -0.471710205078125, -0.40557861328125, -0.339447021484375, -0.2733154296875, -0.207183837890625, -0.14105224609375, -0.074920654296875, -0.0087890625, 0.057342529296875, 0.12347412109375, 0.189605712890625, 0.2557373046875, 0.321868896484375, 0.38800048828125, 0.454132080078125, 0.520263671875, 0.586395263671875, 0.65252685546875, 0.718658447265625, 0.7847900390625, 0.850921630859375, 0.91705322265625, 0.983184814453125, 1.04931640625, 1.115447998046875, 1.18157958984375, 1.247711181640625, 1.3138427734375, 1.379974365234375, 1.44610595703125, 1.512237548828125, 1.578369140625, 1.644500732421875, 1.71063232421875, 1.776763916015625, 1.8428955078125, 1.909027099609375, 1.97515869140625, 2.041290283203125, 2.107421875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 10.0, 8.0, 21.0, 42.0, 39.0, 46.0, 51.0, 69.0, 77.0, 84.0, 83.0, 71.0, 71.0, 60.0, 55.0, 37.0, 38.0, 29.0, 19.0, 16.0, 14.0, 14.0, 7.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.729543685913086, -28.753942489624023, -27.778343200683594, -26.80274200439453, -25.82714080810547, -24.85154151916504, -23.875940322875977, -22.900341033935547, -21.924739837646484, -20.949138641357422, -19.973539352416992, -18.99793815612793, -18.0223388671875, -17.046737670898438, -16.071136474609375, -15.095536231994629, -14.119935989379883, -13.144335746765137, -12.16873550415039, -11.193134307861328, -10.217534065246582, -9.241933822631836, -8.266332626342773, -7.290732383728027, -6.315132141113281, -5.339531898498535, -4.363931179046631, -3.3883306980133057, -2.4127302169799805, -1.4371299743652344, -0.4615292549133301, 0.5140714645385742, 1.4896736145019531, 2.4652740955352783, 3.4408745765686035, 4.416475296020508, 5.392075538635254, 6.36767578125, 7.343276500701904, 8.318877220153809, 9.294477462768555, 10.2700777053833, 11.245677947998047, 12.22127914428711, 13.196879386901855, 14.172479629516602, 15.148080825805664, 16.123680114746094, 17.099281311035156, 18.07488250732422, 19.05048179626465, 20.02608299255371, 21.00168228149414, 21.977283477783203, 22.952884674072266, 23.928485870361328, 24.904085159301758, 25.87968635559082, 26.85528564453125, 27.830886840820312, 28.806488037109375, 29.782087326049805, 30.757688522338867, 31.733287811279297, 32.70888900756836]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 6.0, 7.0, 18.0, 11.0, 22.0, 14.0, 25.0, 24.0, 26.0, 25.0, 34.0, 36.0, 38.0, 35.0, 51.0, 45.0, 55.0, 44.0, 42.0, 57.0, 49.0, 33.0, 33.0, 39.0, 37.0, 24.0, 21.0, 27.0, 20.0, 21.0, 11.0, 13.0, 6.0, 7.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.315722465515137, -14.86660099029541, -14.417479515075684, -13.968358039855957, -13.51923656463623, -13.070115089416504, -12.620992660522461, -12.171871185302734, -11.722749710083008, -11.273628234863281, -10.824506759643555, -10.375385284423828, -9.926263809204102, -9.477142333984375, -9.028020858764648, -8.578899383544922, -8.129777908325195, -7.680656433105469, -7.231534957885742, -6.782413482666016, -6.333292007446289, -5.8841705322265625, -5.435048580169678, -4.985927104949951, -4.536805629730225, -4.087684154510498, -3.6385626792907715, -3.189440965652466, -2.7403194904327393, -2.2911980152130127, -1.842076301574707, -1.3929548263549805, -0.9438333511352539, -0.49471181631088257, -0.04559028148651123, 0.4035313129425049, 0.8526527881622314, 1.301774263381958, 1.7508959770202637, 2.2000174522399902, 2.649138927459717, 3.0982604026794434, 3.54738187789917, 3.9965035915374756, 4.445625305175781, 4.894746780395508, 5.343868255615234, 5.792989730834961, 6.2421112060546875, 6.691232681274414, 7.140354156494141, 7.589475631713867, 8.038597106933594, 8.48771858215332, 8.936840057373047, 9.385961532592773, 9.8350830078125, 10.284204483032227, 10.733325958251953, 11.18244743347168, 11.631568908691406, 12.080690383911133, 12.52981185913086, 12.978933334350586, 13.428055763244629]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 10.0, 15.0, 26.0, 48.0, 51.0, 80.0, 124.0, 193.0, 292.0, 456.0, 691.0, 1115.0, 1617.0, 2578.0, 4171.0, 6560.0, 10701.0, 17148.0, 27464.0, 42696.0, 65214.0, 93633.0, 122722.0, 140931.0, 138732.0, 117389.0, 87851.0, 59754.0, 39667.0, 24731.0, 15712.0, 9706.0, 6121.0, 3695.0, 2378.0, 1527.0, 931.0, 652.0, 403.0, 253.0, 176.0, 113.0, 82.0, 44.0, 31.0, 14.0, 15.0, 8.0, 11.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.015625, -13.546875, -13.078125, -12.609375, -12.140625, -11.671875, -11.203125, -10.734375, -10.265625, -9.796875, -9.328125, -8.859375, -8.390625, -7.921875, -7.453125, -6.984375, -6.515625, -6.046875, -5.578125, -5.109375, -4.640625, -4.171875, -3.703125, -3.234375, -2.765625, -2.296875, -1.828125, -1.359375, -0.890625, -0.421875, 0.046875, 0.515625, 0.984375, 1.453125, 1.921875, 2.390625, 2.859375, 3.328125, 3.796875, 4.265625, 4.734375, 5.203125, 5.671875, 6.140625, 6.609375, 7.078125, 7.546875, 8.015625, 8.484375, 8.953125, 9.421875, 9.890625, 10.359375, 10.828125, 11.296875, 11.765625, 12.234375, 12.703125, 13.171875, 13.640625, 14.109375, 14.578125, 15.046875, 15.515625, 15.984375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 4.0, 3.0, 12.0, 8.0, 11.0, 13.0, 10.0, 20.0, 18.0, 31.0, 35.0, 28.0, 33.0, 45.0, 46.0, 33.0, 44.0, 43.0, 46.0, 50.0, 44.0, 41.0, 45.0, 29.0, 53.0, 38.0, 29.0, 36.0, 23.0, 24.0, 20.0, 11.0, 9.0, 15.0, 9.0, 10.0, 11.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.7265625, -15.252685546875, -14.77880859375, -14.304931640625, -13.8310546875, -13.357177734375, -12.88330078125, -12.409423828125, -11.935546875, -11.461669921875, -10.98779296875, -10.513916015625, -10.0400390625, -9.566162109375, -9.09228515625, -8.618408203125, -8.14453125, -7.670654296875, -7.19677734375, -6.722900390625, -6.2490234375, -5.775146484375, -5.30126953125, -4.827392578125, -4.353515625, -3.879638671875, -3.40576171875, -2.931884765625, -2.4580078125, -1.984130859375, -1.51025390625, -1.036376953125, -0.5625, -0.088623046875, 0.38525390625, 0.859130859375, 1.3330078125, 1.806884765625, 2.28076171875, 2.754638671875, 3.228515625, 3.702392578125, 4.17626953125, 4.650146484375, 5.1240234375, 5.597900390625, 6.07177734375, 6.545654296875, 7.01953125, 7.493408203125, 7.96728515625, 8.441162109375, 8.9150390625, 9.388916015625, 9.86279296875, 10.336669921875, 10.810546875, 11.284423828125, 11.75830078125, 12.232177734375, 12.7060546875, 13.179931640625, 13.65380859375, 14.127685546875, 14.6015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 14.0, 16.0, 23.0, 43.0, 52.0, 88.0, 123.0, 205.0, 302.0, 503.0, 800.0, 1264.0, 2087.0, 3510.0, 5626.0, 9451.0, 15523.0, 25340.0, 40597.0, 62940.0, 92275.0, 124003.0, 146159.0, 145156.0, 121007.0, 89633.0, 60298.0, 38837.0, 24407.0, 14975.0, 8894.0, 5638.0, 3381.0, 2025.0, 1204.0, 826.0, 498.0, 310.0, 187.0, 128.0, 79.0, 43.0, 33.0, 27.0, 7.0, 6.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.515625, -13.064453125, -12.61328125, -12.162109375, -11.7109375, -11.259765625, -10.80859375, -10.357421875, -9.90625, -9.455078125, -9.00390625, -8.552734375, -8.1015625, -7.650390625, -7.19921875, -6.748046875, -6.296875, -5.845703125, -5.39453125, -4.943359375, -4.4921875, -4.041015625, -3.58984375, -3.138671875, -2.6875, -2.236328125, -1.78515625, -1.333984375, -0.8828125, -0.431640625, 0.01953125, 0.470703125, 0.921875, 1.373046875, 1.82421875, 2.275390625, 2.7265625, 3.177734375, 3.62890625, 4.080078125, 4.53125, 4.982421875, 5.43359375, 5.884765625, 6.3359375, 6.787109375, 7.23828125, 7.689453125, 8.140625, 8.591796875, 9.04296875, 9.494140625, 9.9453125, 10.396484375, 10.84765625, 11.298828125, 11.75, 12.201171875, 12.65234375, 13.103515625, 13.5546875, 14.005859375, 14.45703125, 14.908203125, 15.359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 15.0, 10.0, 18.0, 16.0, 15.0, 18.0, 22.0, 29.0, 33.0, 16.0, 40.0, 41.0, 30.0, 34.0, 36.0, 37.0, 45.0, 41.0, 41.0, 39.0, 49.0, 39.0, 39.0, 39.0, 37.0, 29.0, 32.0, 20.0, 26.0, 18.0, 19.0, 9.0, 10.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.8173828125, -8.525390625, -8.2333984375, -7.94140625, -7.6494140625, -7.357421875, -7.0654296875, -6.7734375, -6.4814453125, -6.189453125, -5.8974609375, -5.60546875, -5.3134765625, -5.021484375, -4.7294921875, -4.4375, -4.1455078125, -3.853515625, -3.5615234375, -3.26953125, -2.9775390625, -2.685546875, -2.3935546875, -2.1015625, -1.8095703125, -1.517578125, -1.2255859375, -0.93359375, -0.6416015625, -0.349609375, -0.0576171875, 0.234375, 0.5263671875, 0.818359375, 1.1103515625, 1.40234375, 1.6943359375, 1.986328125, 2.2783203125, 2.5703125, 2.8623046875, 3.154296875, 3.4462890625, 3.73828125, 4.0302734375, 4.322265625, 4.6142578125, 4.90625, 5.1982421875, 5.490234375, 5.7822265625, 6.07421875, 6.3662109375, 6.658203125, 6.9501953125, 7.2421875, 7.5341796875, 7.826171875, 8.1181640625, 8.41015625, 8.7021484375, 8.994140625, 9.2861328125, 9.578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 12.0, 11.0, 19.0, 37.0, 54.0, 57.0, 109.0, 165.0, 291.0, 478.0, 902.0, 1643.0, 2913.0, 5765.0, 11628.0, 24338.0, 51876.0, 107984.0, 199469.0, 254920.0, 190259.0, 101953.0, 48566.0, 22503.0, 10823.0, 5396.0, 2775.0, 1572.0, 850.0, 466.0, 283.0, 172.0, 100.0, 54.0, 45.0, 27.0, 20.0, 11.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.1875, -14.7335205078125, -14.279541015625, -13.8255615234375, -13.37158203125, -12.9176025390625, -12.463623046875, -12.0096435546875, -11.5556640625, -11.1016845703125, -10.647705078125, -10.1937255859375, -9.73974609375, -9.2857666015625, -8.831787109375, -8.3778076171875, -7.923828125, -7.4698486328125, -7.015869140625, -6.5618896484375, -6.10791015625, -5.6539306640625, -5.199951171875, -4.7459716796875, -4.2919921875, -3.8380126953125, -3.384033203125, -2.9300537109375, -2.47607421875, -2.0220947265625, -1.568115234375, -1.1141357421875, -0.66015625, -0.2061767578125, 0.247802734375, 0.7017822265625, 1.15576171875, 1.6097412109375, 2.063720703125, 2.5177001953125, 2.9716796875, 3.4256591796875, 3.879638671875, 4.3336181640625, 4.78759765625, 5.2415771484375, 5.695556640625, 6.1495361328125, 6.603515625, 7.0574951171875, 7.511474609375, 7.9654541015625, 8.41943359375, 8.8734130859375, 9.327392578125, 9.7813720703125, 10.2353515625, 10.6893310546875, 11.143310546875, 11.5972900390625, 12.05126953125, 12.5052490234375, 12.959228515625, 13.4132080078125, 13.8671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 12.0, 7.0, 11.0, 25.0, 31.0, 37.0, 45.0, 40.0, 69.0, 69.0, 78.0, 82.0, 72.0, 83.0, 61.0, 57.0, 37.0, 32.0, 27.0, 27.0, 15.0, 10.0, 15.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015783309936523438, -0.0015366077423095703, -0.0014948844909667969, -0.0014531612396240234, -0.00141143798828125, -0.0013697147369384766, -0.0013279914855957031, -0.0012862682342529297, -0.0012445449829101562, -0.0012028217315673828, -0.0011610984802246094, -0.001119375228881836, -0.0010776519775390625, -0.001035928726196289, -0.0009942054748535156, -0.0009524822235107422, -0.0009107589721679688, -0.0008690357208251953, -0.0008273124694824219, -0.0007855892181396484, -0.000743865966796875, -0.0007021427154541016, -0.0006604194641113281, -0.0006186962127685547, -0.0005769729614257812, -0.0005352497100830078, -0.0004935264587402344, -0.00045180320739746094, -0.0004100799560546875, -0.00036835670471191406, -0.0003266334533691406, -0.0002849102020263672, -0.00024318695068359375, -0.0002014636993408203, -0.00015974044799804688, -0.00011801719665527344, -7.62939453125e-05, -3.457069396972656e-05, 7.152557373046875e-06, 4.887580871582031e-05, 9.059906005859375e-05, 0.0001323223114013672, 0.00017404556274414062, 0.00021576881408691406, 0.0002574920654296875, 0.00029921531677246094, 0.0003409385681152344, 0.0003826618194580078, 0.00042438507080078125, 0.0004661083221435547, 0.0005078315734863281, 0.0005495548248291016, 0.000591278076171875, 0.0006330013275146484, 0.0006747245788574219, 0.0007164478302001953, 0.0007581710815429688, 0.0007998943328857422, 0.0008416175842285156, 0.0008833408355712891, 0.0009250640869140625, 0.0009667873382568359, 0.0010085105895996094, 0.0010502338409423828, 0.0010919570922851562]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 4.0, 9.0, 16.0, 17.0, 25.0, 33.0, 61.0, 85.0, 128.0, 211.0, 284.0, 430.0, 688.0, 1051.0, 1741.0, 2922.0, 4852.0, 8167.0, 13799.0, 23679.0, 39870.0, 65667.0, 102419.0, 142858.0, 167724.0, 156435.0, 118234.0, 78251.0, 47995.0, 28806.0, 16846.0, 10083.0, 5976.0, 3456.0, 2083.0, 1318.0, 800.0, 512.0, 342.0, 202.0, 158.0, 92.0, 78.0, 40.0, 33.0, 22.0, 7.0, 11.0, 8.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8446044921875, -8.556396484375, -8.2681884765625, -7.97998046875, -7.6917724609375, -7.403564453125, -7.1153564453125, -6.8271484375, -6.5389404296875, -6.250732421875, -5.9625244140625, -5.67431640625, -5.3861083984375, -5.097900390625, -4.8096923828125, -4.521484375, -4.2332763671875, -3.945068359375, -3.6568603515625, -3.36865234375, -3.0804443359375, -2.792236328125, -2.5040283203125, -2.2158203125, -1.9276123046875, -1.639404296875, -1.3511962890625, -1.06298828125, -0.7747802734375, -0.486572265625, -0.1983642578125, 0.08984375, 0.3780517578125, 0.666259765625, 0.9544677734375, 1.24267578125, 1.5308837890625, 1.819091796875, 2.1072998046875, 2.3955078125, 2.6837158203125, 2.971923828125, 3.2601318359375, 3.54833984375, 3.8365478515625, 4.124755859375, 4.4129638671875, 4.701171875, 4.9893798828125, 5.277587890625, 5.5657958984375, 5.85400390625, 6.1422119140625, 6.430419921875, 6.7186279296875, 7.0068359375, 7.2950439453125, 7.583251953125, 7.8714599609375, 8.15966796875, 8.4478759765625, 8.736083984375, 9.0242919921875, 9.3125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 14.0, 10.0, 24.0, 29.0, 41.0, 42.0, 53.0, 67.0, 78.0, 88.0, 76.0, 73.0, 78.0, 65.0, 62.0, 56.0, 37.0, 27.0, 17.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5491943359375, -4.395263671875, -4.2413330078125, -4.08740234375, -3.9334716796875, -3.779541015625, -3.6256103515625, -3.4716796875, -3.3177490234375, -3.163818359375, -3.0098876953125, -2.85595703125, -2.7020263671875, -2.548095703125, -2.3941650390625, -2.240234375, -2.0863037109375, -1.932373046875, -1.7784423828125, -1.62451171875, -1.4705810546875, -1.316650390625, -1.1627197265625, -1.0087890625, -0.8548583984375, -0.700927734375, -0.5469970703125, -0.39306640625, -0.2391357421875, -0.085205078125, 0.0687255859375, 0.22265625, 0.3765869140625, 0.530517578125, 0.6844482421875, 0.83837890625, 0.9923095703125, 1.146240234375, 1.3001708984375, 1.4541015625, 1.6080322265625, 1.761962890625, 1.9158935546875, 2.06982421875, 2.2237548828125, 2.377685546875, 2.5316162109375, 2.685546875, 2.8394775390625, 2.993408203125, 3.1473388671875, 3.30126953125, 3.4552001953125, 3.609130859375, 3.7630615234375, 3.9169921875, 4.0709228515625, 4.224853515625, 4.3787841796875, 4.53271484375, 4.6866455078125, 4.840576171875, 4.9945068359375, 5.1484375]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 10.0, 18.0, 23.0, 26.0, 40.0, 34.0, 41.0, 56.0, 60.0, 79.0, 94.0, 75.0, 80.0, 47.0, 49.0, 49.0, 49.0, 37.0, 21.0, 25.0, 18.0, 13.0, 11.0, 8.0, 8.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.850130081176758, -27.93405532836914, -27.017980575561523, -26.101905822753906, -25.18583106994629, -24.269756317138672, -23.353683471679688, -22.437606811523438, -21.521533966064453, -20.605459213256836, -19.68938446044922, -18.7733097076416, -17.857234954833984, -16.941160202026367, -16.02508544921875, -15.10901165008545, -14.192935943603516, -13.276861190795898, -12.360786437988281, -11.444711685180664, -10.528636932373047, -9.61256217956543, -8.696488380432129, -7.780413627624512, -6.8643388748168945, -5.948264122009277, -5.03218936920166, -4.116115093231201, -3.200040340423584, -2.283965587615967, -1.3678913116455078, -0.4518165588378906, 0.4642601013183594, 1.380334734916687, 2.2964093685150146, 3.2124838829040527, 4.12855863571167, 5.044633388519287, 5.960707664489746, 6.876782417297363, 7.7928571701049805, 8.708931922912598, 9.625006675720215, 10.541080474853516, 11.457155227661133, 12.37322998046875, 13.289304733276367, 14.205379486083984, 15.121454238891602, 16.03752899169922, 16.953603744506836, 17.869678497314453, 18.78575325012207, 19.701828002929688, 20.617900848388672, 21.533977508544922, 22.450050354003906, 23.366125106811523, 24.28219985961914, 25.198274612426758, 26.114349365234375, 27.030424118041992, 27.94649887084961, 28.862571716308594, 29.778648376464844]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 8.0, 14.0, 11.0, 13.0, 25.0, 23.0, 25.0, 19.0, 35.0, 30.0, 29.0, 37.0, 40.0, 52.0, 42.0, 51.0, 45.0, 46.0, 38.0, 47.0, 34.0, 44.0, 49.0, 27.0, 31.0, 27.0, 26.0, 25.0, 11.0, 16.0, 15.0, 10.0, 9.0, 6.0, 9.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.063613891601562, -15.586197853088379, -15.108782768249512, -14.631366729736328, -14.153950691223145, -13.676534652709961, -13.199119567871094, -12.72170352935791, -12.244287490844727, -11.766871452331543, -11.289456367492676, -10.812040328979492, -10.334624290466309, -9.857208251953125, -9.379793167114258, -8.902377128601074, -8.42496109008789, -7.947545528411865, -7.470129489898682, -6.992713928222656, -6.515297889709473, -6.037882328033447, -5.560466766357422, -5.083050727844238, -4.605635643005371, -4.128220081329346, -3.650804042816162, -3.1733884811401367, -2.695972442626953, -2.2185568809509277, -1.7411410808563232, -1.2637252807617188, -0.7863092422485352, -0.30889347195625305, 0.16852229833602905, 0.6459380388259888, 1.1233538389205933, 1.6007695198059082, 2.0781853199005127, 2.555601119995117, 3.0330169200897217, 3.510432720184326, 3.9878485202789307, 4.465264320373535, 4.9426798820495605, 5.420095443725586, 5.8975114822387695, 6.374927520751953, 6.8523430824279785, 7.329758644104004, 7.8071746826171875, 8.284590721130371, 8.762005805969238, 9.239421844482422, 9.716837882995605, 10.194253921508789, 10.671669006347656, 11.14908504486084, 11.626500129699707, 12.10391616821289, 12.581332206726074, 13.058748245239258, 13.536163330078125, 14.013579368591309, 14.490995407104492]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 7.0, 4.0, 4.0, 10.0, 11.0, 22.0, 30.0, 41.0, 58.0, 84.0, 136.0, 178.0, 305.0, 460.0, 797.0, 1301.0, 2123.0, 3553.0, 6592.0, 12129.0, 22876.0, 45786.0, 96648.0, 215759.0, 501709.0, 1000826.0, 1121214.0, 640720.0, 278849.0, 122940.0, 57372.0, 28396.0, 14436.0, 7876.0, 4346.0, 2548.0, 1534.0, 897.0, 587.0, 373.0, 243.0, 185.0, 115.0, 64.0, 52.0, 31.0, 17.0, 20.0, 4.0, 10.0, 2.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.072509765625, -18.39501953125, -17.717529296875, -17.0400390625, -16.362548828125, -15.68505859375, -15.007568359375, -14.330078125, -13.652587890625, -12.97509765625, -12.297607421875, -11.6201171875, -10.942626953125, -10.26513671875, -9.587646484375, -8.91015625, -8.232666015625, -7.55517578125, -6.877685546875, -6.2001953125, -5.522705078125, -4.84521484375, -4.167724609375, -3.490234375, -2.812744140625, -2.13525390625, -1.457763671875, -0.7802734375, -0.102783203125, 0.57470703125, 1.252197265625, 1.9296875, 2.607177734375, 3.28466796875, 3.962158203125, 4.6396484375, 5.317138671875, 5.99462890625, 6.672119140625, 7.349609375, 8.027099609375, 8.70458984375, 9.382080078125, 10.0595703125, 10.737060546875, 11.41455078125, 12.092041015625, 12.76953125, 13.447021484375, 14.12451171875, 14.802001953125, 15.4794921875, 16.156982421875, 16.83447265625, 17.511962890625, 18.189453125, 18.866943359375, 19.54443359375, 20.221923828125, 20.8994140625, 21.576904296875, 22.25439453125, 22.931884765625, 23.609375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 4.0, 9.0, 5.0, 7.0, 12.0, 15.0, 22.0, 20.0, 26.0, 24.0, 24.0, 30.0, 31.0, 28.0, 30.0, 45.0, 43.0, 41.0, 42.0, 40.0, 37.0, 44.0, 47.0, 39.0, 35.0, 29.0, 31.0, 30.0, 30.0, 31.0, 25.0, 16.0, 16.0, 16.0, 10.0, 11.0, 7.0, 10.0, 9.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.3125, -11.003173828125, -10.69384765625, -10.384521484375, -10.0751953125, -9.765869140625, -9.45654296875, -9.147216796875, -8.837890625, -8.528564453125, -8.21923828125, -7.909912109375, -7.6005859375, -7.291259765625, -6.98193359375, -6.672607421875, -6.36328125, -6.053955078125, -5.74462890625, -5.435302734375, -5.1259765625, -4.816650390625, -4.50732421875, -4.197998046875, -3.888671875, -3.579345703125, -3.27001953125, -2.960693359375, -2.6513671875, -2.342041015625, -2.03271484375, -1.723388671875, -1.4140625, -1.104736328125, -0.79541015625, -0.486083984375, -0.1767578125, 0.132568359375, 0.44189453125, 0.751220703125, 1.060546875, 1.369873046875, 1.67919921875, 1.988525390625, 2.2978515625, 2.607177734375, 2.91650390625, 3.225830078125, 3.53515625, 3.844482421875, 4.15380859375, 4.463134765625, 4.7724609375, 5.081787109375, 5.39111328125, 5.700439453125, 6.009765625, 6.319091796875, 6.62841796875, 6.937744140625, 7.2470703125, 7.556396484375, 7.86572265625, 8.175048828125, 8.484375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 10.0, 7.0, 12.0, 37.0, 31.0, 63.0, 82.0, 129.0, 230.0, 305.0, 533.0, 819.0, 1419.0, 2346.0, 4012.0, 7208.0, 13144.0, 25066.0, 49075.0, 97280.0, 198694.0, 403904.0, 759442.0, 1038040.0, 770654.0, 412691.0, 202435.0, 99913.0, 49822.0, 25820.0, 13598.0, 7268.0, 4167.0, 2378.0, 1389.0, 887.0, 492.0, 309.0, 196.0, 126.0, 86.0, 59.0, 37.0, 29.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.551025390625, -19.89892578125, -19.246826171875, -18.5947265625, -17.942626953125, -17.29052734375, -16.638427734375, -15.986328125, -15.334228515625, -14.68212890625, -14.030029296875, -13.3779296875, -12.725830078125, -12.07373046875, -11.421630859375, -10.76953125, -10.117431640625, -9.46533203125, -8.813232421875, -8.1611328125, -7.509033203125, -6.85693359375, -6.204833984375, -5.552734375, -4.900634765625, -4.24853515625, -3.596435546875, -2.9443359375, -2.292236328125, -1.64013671875, -0.988037109375, -0.3359375, 0.316162109375, 0.96826171875, 1.620361328125, 2.2724609375, 2.924560546875, 3.57666015625, 4.228759765625, 4.880859375, 5.532958984375, 6.18505859375, 6.837158203125, 7.4892578125, 8.141357421875, 8.79345703125, 9.445556640625, 10.09765625, 10.749755859375, 11.40185546875, 12.053955078125, 12.7060546875, 13.358154296875, 14.01025390625, 14.662353515625, 15.314453125, 15.966552734375, 16.61865234375, 17.270751953125, 17.9228515625, 18.574951171875, 19.22705078125, 19.879150390625, 20.53125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 7.0, 9.0, 17.0, 24.0, 28.0, 31.0, 40.0, 62.0, 83.0, 110.0, 119.0, 157.0, 189.0, 231.0, 270.0, 283.0, 307.0, 290.0, 315.0, 272.0, 226.0, 188.0, 183.0, 127.0, 126.0, 76.0, 67.0, 56.0, 47.0, 30.0, 23.0, 23.0, 13.0, 22.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.7421875, -6.53192138671875, -6.3216552734375, -6.11138916015625, -5.901123046875, -5.69085693359375, -5.4805908203125, -5.27032470703125, -5.06005859375, -4.84979248046875, -4.6395263671875, -4.42926025390625, -4.218994140625, -4.00872802734375, -3.7984619140625, -3.58819580078125, -3.3779296875, -3.16766357421875, -2.9573974609375, -2.74713134765625, -2.536865234375, -2.32659912109375, -2.1163330078125, -1.90606689453125, -1.69580078125, -1.48553466796875, -1.2752685546875, -1.06500244140625, -0.854736328125, -0.64447021484375, -0.4342041015625, -0.22393798828125, -0.013671875, 0.19659423828125, 0.4068603515625, 0.61712646484375, 0.827392578125, 1.03765869140625, 1.2479248046875, 1.45819091796875, 1.66845703125, 1.87872314453125, 2.0889892578125, 2.29925537109375, 2.509521484375, 2.71978759765625, 2.9300537109375, 3.14031982421875, 3.3505859375, 3.56085205078125, 3.7711181640625, 3.98138427734375, 4.191650390625, 4.40191650390625, 4.6121826171875, 4.82244873046875, 5.03271484375, 5.24298095703125, 5.4532470703125, 5.66351318359375, 5.873779296875, 6.08404541015625, 6.2943115234375, 6.50457763671875, 6.71484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 4.0, 7.0, 9.0, 6.0, 31.0, 25.0, 33.0, 33.0, 39.0, 45.0, 38.0, 45.0, 56.0, 72.0, 48.0, 56.0, 53.0, 54.0, 38.0, 47.0, 37.0, 42.0, 28.0, 31.0, 16.0, 16.0, 15.0, 12.0, 6.0, 11.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.8176326751709, -19.158353805541992, -18.499074935913086, -17.839797973632812, -17.180519104003906, -16.521240234375, -15.861961364746094, -15.202682495117188, -14.543403625488281, -13.884124755859375, -13.224846839904785, -12.565567970275879, -11.906289100646973, -11.247011184692383, -10.587732315063477, -9.92845344543457, -9.26917552947998, -8.609896659851074, -7.950618267059326, -7.291339874267578, -6.632061004638672, -5.972782611846924, -5.313504219055176, -4.6542253494262695, -3.9949469566345215, -3.3356683254241943, -2.676389694213867, -2.017111301422119, -1.357832670211792, -0.6985540390014648, -0.0392756462097168, 0.6200032234191895, 1.2792816162109375, 1.9385602474212646, 2.597838878631592, 3.25711727142334, 3.916395902633667, 4.575674533843994, 5.234952926635742, 5.894231796264648, 6.5535101890563965, 7.2127885818481445, 7.872067451477051, 8.53134536743164, 9.190624237060547, 9.849903106689453, 10.50918197631836, 11.168460845947266, 11.827738761901855, 12.487017631530762, 13.146295547485352, 13.805574417114258, 14.464853286743164, 15.12413215637207, 15.78341007232666, 16.44268798828125, 17.101966857910156, 17.761245727539062, 18.42052459716797, 19.079803466796875, 19.73908042907715, 20.398359298706055, 21.05763816833496, 21.716917037963867, 22.376195907592773]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 9.0, 9.0, 13.0, 24.0, 17.0, 25.0, 31.0, 27.0, 38.0, 39.0, 32.0, 40.0, 50.0, 44.0, 50.0, 53.0, 44.0, 47.0, 51.0, 39.0, 37.0, 46.0, 43.0, 37.0, 25.0, 22.0, 13.0, 19.0, 18.0, 10.0, 10.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.765066146850586, -14.335415840148926, -13.905765533447266, -13.476116180419922, -13.046465873718262, -12.616815567016602, -12.187166213989258, -11.757515907287598, -11.327865600585938, -10.898215293884277, -10.468564987182617, -10.038915634155273, -9.609265327453613, -9.179615020751953, -8.74996566772461, -8.32031536102295, -7.890665054321289, -7.461014747619629, -7.031364917755127, -6.601715087890625, -6.172064781188965, -5.742414474487305, -5.312764644622803, -4.883114814758301, -4.453464508056641, -4.0238142013549805, -3.5941643714904785, -3.1645143032073975, -2.7348642349243164, -2.3052141666412354, -1.8755640983581543, -1.4459140300750732, -1.0162630081176758, -0.5866129398345947, -0.15696287155151367, 0.2726871967315674, 0.7023372650146484, 1.1319873332977295, 1.5616374015808105, 1.9912874698638916, 2.4209375381469727, 2.8505876064300537, 3.2802376747131348, 3.709887742996216, 4.139537811279297, 4.569188117980957, 4.998837947845459, 5.428487777709961, 5.858138084411621, 6.287788391113281, 6.717438220977783, 7.147088050842285, 7.576738357543945, 8.006388664245605, 8.436038970947266, 8.86568832397461, 9.29533863067627, 9.72498893737793, 10.154638290405273, 10.584288597106934, 11.013938903808594, 11.443589210510254, 11.873239517211914, 12.302888870239258, 12.732539176940918]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 16.0, 10.0, 23.0, 43.0, 56.0, 80.0, 107.0, 202.0, 307.0, 489.0, 860.0, 1445.0, 2606.0, 4678.0, 8738.0, 16421.0, 31892.0, 59183.0, 106245.0, 167913.0, 205160.0, 179278.0, 118160.0, 67541.0, 35649.0, 18966.0, 9910.0, 5389.0, 2977.0, 1691.0, 946.0, 580.0, 358.0, 201.0, 140.0, 94.0, 58.0, 42.0, 29.0, 20.0, 13.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.6875, -13.240234375, -12.79296875, -12.345703125, -11.8984375, -11.451171875, -11.00390625, -10.556640625, -10.109375, -9.662109375, -9.21484375, -8.767578125, -8.3203125, -7.873046875, -7.42578125, -6.978515625, -6.53125, -6.083984375, -5.63671875, -5.189453125, -4.7421875, -4.294921875, -3.84765625, -3.400390625, -2.953125, -2.505859375, -2.05859375, -1.611328125, -1.1640625, -0.716796875, -0.26953125, 0.177734375, 0.625, 1.072265625, 1.51953125, 1.966796875, 2.4140625, 2.861328125, 3.30859375, 3.755859375, 4.203125, 4.650390625, 5.09765625, 5.544921875, 5.9921875, 6.439453125, 6.88671875, 7.333984375, 7.78125, 8.228515625, 8.67578125, 9.123046875, 9.5703125, 10.017578125, 10.46484375, 10.912109375, 11.359375, 11.806640625, 12.25390625, 12.701171875, 13.1484375, 13.595703125, 14.04296875, 14.490234375, 14.9375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 9.0, 9.0, 9.0, 9.0, 10.0, 19.0, 19.0, 24.0, 29.0, 37.0, 26.0, 40.0, 41.0, 50.0, 36.0, 50.0, 61.0, 47.0, 56.0, 49.0, 51.0, 49.0, 43.0, 37.0, 43.0, 21.0, 32.0, 15.0, 20.0, 11.0, 11.0, 7.0, 6.0, 10.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.3125, -15.835205078125, -15.35791015625, -14.880615234375, -14.4033203125, -13.926025390625, -13.44873046875, -12.971435546875, -12.494140625, -12.016845703125, -11.53955078125, -11.062255859375, -10.5849609375, -10.107666015625, -9.63037109375, -9.153076171875, -8.67578125, -8.198486328125, -7.72119140625, -7.243896484375, -6.7666015625, -6.289306640625, -5.81201171875, -5.334716796875, -4.857421875, -4.380126953125, -3.90283203125, -3.425537109375, -2.9482421875, -2.470947265625, -1.99365234375, -1.516357421875, -1.0390625, -0.561767578125, -0.08447265625, 0.392822265625, 0.8701171875, 1.347412109375, 1.82470703125, 2.302001953125, 2.779296875, 3.256591796875, 3.73388671875, 4.211181640625, 4.6884765625, 5.165771484375, 5.64306640625, 6.120361328125, 6.59765625, 7.074951171875, 7.55224609375, 8.029541015625, 8.5068359375, 8.984130859375, 9.46142578125, 9.938720703125, 10.416015625, 10.893310546875, 11.37060546875, 11.847900390625, 12.3251953125, 12.802490234375, 13.27978515625, 13.757080078125, 14.234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 10.0, 17.0, 17.0, 20.0, 28.0, 49.0, 70.0, 111.0, 120.0, 200.0, 309.0, 519.0, 837.0, 1475.0, 2773.0, 5725.0, 12010.0, 27608.0, 64747.0, 148930.0, 282196.0, 265796.0, 132195.0, 56813.0, 24288.0, 10680.0, 4986.0, 2560.0, 1391.0, 753.0, 462.0, 280.0, 175.0, 116.0, 87.0, 63.0, 45.0, 23.0, 14.0, 21.0, 12.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.796875, -23.095458984375, -22.39404296875, -21.692626953125, -20.9912109375, -20.289794921875, -19.58837890625, -18.886962890625, -18.185546875, -17.484130859375, -16.78271484375, -16.081298828125, -15.3798828125, -14.678466796875, -13.97705078125, -13.275634765625, -12.57421875, -11.872802734375, -11.17138671875, -10.469970703125, -9.7685546875, -9.067138671875, -8.36572265625, -7.664306640625, -6.962890625, -6.261474609375, -5.56005859375, -4.858642578125, -4.1572265625, -3.455810546875, -2.75439453125, -2.052978515625, -1.3515625, -0.650146484375, 0.05126953125, 0.752685546875, 1.4541015625, 2.155517578125, 2.85693359375, 3.558349609375, 4.259765625, 4.961181640625, 5.66259765625, 6.364013671875, 7.0654296875, 7.766845703125, 8.46826171875, 9.169677734375, 9.87109375, 10.572509765625, 11.27392578125, 11.975341796875, 12.6767578125, 13.378173828125, 14.07958984375, 14.781005859375, 15.482421875, 16.183837890625, 16.88525390625, 17.586669921875, 18.2880859375, 18.989501953125, 19.69091796875, 20.392333984375, 21.09375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 7.0, 6.0, 9.0, 16.0, 11.0, 12.0, 22.0, 20.0, 32.0, 31.0, 33.0, 34.0, 32.0, 43.0, 39.0, 43.0, 54.0, 37.0, 40.0, 29.0, 46.0, 39.0, 34.0, 47.0, 33.0, 39.0, 32.0, 32.0, 19.0, 23.0, 15.0, 13.0, 15.0, 14.0, 12.0, 5.0, 8.0, 7.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.59375, -7.348388671875, -7.10302734375, -6.857666015625, -6.6123046875, -6.366943359375, -6.12158203125, -5.876220703125, -5.630859375, -5.385498046875, -5.14013671875, -4.894775390625, -4.6494140625, -4.404052734375, -4.15869140625, -3.913330078125, -3.66796875, -3.422607421875, -3.17724609375, -2.931884765625, -2.6865234375, -2.441162109375, -2.19580078125, -1.950439453125, -1.705078125, -1.459716796875, -1.21435546875, -0.968994140625, -0.7236328125, -0.478271484375, -0.23291015625, 0.012451171875, 0.2578125, 0.503173828125, 0.74853515625, 0.993896484375, 1.2392578125, 1.484619140625, 1.72998046875, 1.975341796875, 2.220703125, 2.466064453125, 2.71142578125, 2.956787109375, 3.2021484375, 3.447509765625, 3.69287109375, 3.938232421875, 4.18359375, 4.428955078125, 4.67431640625, 4.919677734375, 5.1650390625, 5.410400390625, 5.65576171875, 5.901123046875, 6.146484375, 6.391845703125, 6.63720703125, 6.882568359375, 7.1279296875, 7.373291015625, 7.61865234375, 7.864013671875, 8.109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 22.0, 25.0, 32.0, 63.0, 103.0, 143.0, 214.0, 279.0, 469.0, 742.0, 1140.0, 1861.0, 3040.0, 5050.0, 8580.0, 14966.0, 27423.0, 50385.0, 94088.0, 166886.0, 233633.0, 190601.0, 111753.0, 60696.0, 32906.0, 17959.0, 10080.0, 5884.0, 3526.0, 2117.0, 1414.0, 862.0, 534.0, 368.0, 234.0, 154.0, 114.0, 59.0, 44.0, 26.0, 27.0, 8.0, 20.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.34136962890625, -7.0850830078125, -6.82879638671875, -6.572509765625, -6.31622314453125, -6.0599365234375, -5.80364990234375, -5.54736328125, -5.29107666015625, -5.0347900390625, -4.77850341796875, -4.522216796875, -4.26593017578125, -4.0096435546875, -3.75335693359375, -3.4970703125, -3.24078369140625, -2.9844970703125, -2.72821044921875, -2.471923828125, -2.21563720703125, -1.9593505859375, -1.70306396484375, -1.44677734375, -1.19049072265625, -0.9342041015625, -0.67791748046875, -0.421630859375, -0.16534423828125, 0.0909423828125, 0.34722900390625, 0.603515625, 0.85980224609375, 1.1160888671875, 1.37237548828125, 1.628662109375, 1.88494873046875, 2.1412353515625, 2.39752197265625, 2.65380859375, 2.91009521484375, 3.1663818359375, 3.42266845703125, 3.678955078125, 3.93524169921875, 4.1915283203125, 4.44781494140625, 4.7041015625, 4.96038818359375, 5.2166748046875, 5.47296142578125, 5.729248046875, 5.98553466796875, 6.2418212890625, 6.49810791015625, 6.75439453125, 7.01068115234375, 7.2669677734375, 7.52325439453125, 7.779541015625, 8.03582763671875, 8.2921142578125, 8.54840087890625, 8.8046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 2.0, 9.0, 5.0, 8.0, 10.0, 12.0, 12.0, 23.0, 22.0, 31.0, 41.0, 49.0, 62.0, 80.0, 91.0, 85.0, 96.0, 74.0, 65.0, 48.0, 41.0, 34.0, 20.0, 24.0, 13.0, 10.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048279762268066406, -0.00046736374497413635, -0.00045192986726760864, -0.00043649598956108093, -0.0004210621118545532, -0.0004056282341480255, -0.0003901943564414978, -0.0003747604787349701, -0.0003593266010284424, -0.00034389272332191467, -0.00032845884561538696, -0.00031302496790885925, -0.00029759109020233154, -0.00028215721249580383, -0.0002667233347892761, -0.0002512894570827484, -0.0002358555793762207, -0.000220421701669693, -0.00020498782396316528, -0.00018955394625663757, -0.00017412006855010986, -0.00015868619084358215, -0.00014325231313705444, -0.00012781843543052673, -0.00011238455772399902, -9.695068001747131e-05, -8.15168023109436e-05, -6.60829246044159e-05, -5.0649046897888184e-05, -3.5215169191360474e-05, -1.9781291484832764e-05, -4.347413778305054e-06, 1.1086463928222656e-05, 2.6520341634750366e-05, 4.1954219341278076e-05, 5.7388097047805786e-05, 7.28219747543335e-05, 8.82558524608612e-05, 0.00010368973016738892, 0.00011912360787391663, 0.00013455748558044434, 0.00014999136328697205, 0.00016542524099349976, 0.00018085911870002747, 0.00019629299640655518, 0.00021172687411308289, 0.0002271607518196106, 0.0002425946295261383, 0.000258028507232666, 0.0002734623849391937, 0.00028889626264572144, 0.00030433014035224915, 0.00031976401805877686, 0.00033519789576530457, 0.0003506317734718323, 0.00036606565117836, 0.0003814995288848877, 0.0003969334065914154, 0.0004123672842979431, 0.0004278011620044708, 0.00044323503971099854, 0.00045866891741752625, 0.00047410279512405396, 0.0004895366728305817, 0.0005049705505371094]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 10.0, 17.0, 22.0, 26.0, 24.0, 52.0, 78.0, 101.0, 143.0, 212.0, 326.0, 494.0, 795.0, 1240.0, 1974.0, 3337.0, 5595.0, 8871.0, 15128.0, 25301.0, 42102.0, 68101.0, 104243.0, 144099.0, 165275.0, 152108.0, 113730.0, 76015.0, 47455.0, 28386.0, 17089.0, 10076.0, 6109.0, 3594.0, 2316.0, 1395.0, 898.0, 599.0, 391.0, 240.0, 189.0, 120.0, 87.0, 50.0, 37.0, 24.0, 24.0, 15.0, 16.0, 10.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.671875, -5.49249267578125, -5.3131103515625, -5.13372802734375, -4.954345703125, -4.77496337890625, -4.5955810546875, -4.41619873046875, -4.23681640625, -4.05743408203125, -3.8780517578125, -3.69866943359375, -3.519287109375, -3.33990478515625, -3.1605224609375, -2.98114013671875, -2.8017578125, -2.62237548828125, -2.4429931640625, -2.26361083984375, -2.084228515625, -1.90484619140625, -1.7254638671875, -1.54608154296875, -1.36669921875, -1.18731689453125, -1.0079345703125, -0.82855224609375, -0.649169921875, -0.46978759765625, -0.2904052734375, -0.11102294921875, 0.068359375, 0.24774169921875, 0.4271240234375, 0.60650634765625, 0.785888671875, 0.96527099609375, 1.1446533203125, 1.32403564453125, 1.50341796875, 1.68280029296875, 1.8621826171875, 2.04156494140625, 2.220947265625, 2.40032958984375, 2.5797119140625, 2.75909423828125, 2.9384765625, 3.11785888671875, 3.2972412109375, 3.47662353515625, 3.656005859375, 3.83538818359375, 4.0147705078125, 4.19415283203125, 4.37353515625, 4.55291748046875, 4.7322998046875, 4.91168212890625, 5.091064453125, 5.27044677734375, 5.4498291015625, 5.62921142578125, 5.80859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 1.0, 5.0, 8.0, 5.0, 6.0, 14.0, 6.0, 11.0, 25.0, 21.0, 19.0, 22.0, 35.0, 44.0, 30.0, 40.0, 45.0, 45.0, 41.0, 47.0, 51.0, 37.0, 54.0, 48.0, 45.0, 40.0, 39.0, 34.0, 30.0, 25.0, 21.0, 11.0, 23.0, 13.0, 8.0, 7.0, 7.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6396484375, -1.592010498046875, -1.54437255859375, -1.496734619140625, -1.4490966796875, -1.401458740234375, -1.35382080078125, -1.306182861328125, -1.258544921875, -1.210906982421875, -1.16326904296875, -1.115631103515625, -1.0679931640625, -1.020355224609375, -0.97271728515625, -0.925079345703125, -0.87744140625, -0.829803466796875, -0.78216552734375, -0.734527587890625, -0.6868896484375, -0.639251708984375, -0.59161376953125, -0.543975830078125, -0.496337890625, -0.448699951171875, -0.40106201171875, -0.353424072265625, -0.3057861328125, -0.258148193359375, -0.21051025390625, -0.162872314453125, -0.115234375, -0.067596435546875, -0.01995849609375, 0.027679443359375, 0.0753173828125, 0.122955322265625, 0.17059326171875, 0.218231201171875, 0.265869140625, 0.313507080078125, 0.36114501953125, 0.408782958984375, 0.4564208984375, 0.504058837890625, 0.55169677734375, 0.599334716796875, 0.64697265625, 0.694610595703125, 0.74224853515625, 0.789886474609375, 0.8375244140625, 0.885162353515625, 0.93280029296875, 0.980438232421875, 1.028076171875, 1.075714111328125, 1.12335205078125, 1.170989990234375, 1.2186279296875, 1.266265869140625, 1.31390380859375, 1.361541748046875, 1.4091796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 7.0, 3.0, 4.0, 7.0, 12.0, 9.0, 12.0, 19.0, 21.0, 32.0, 34.0, 35.0, 39.0, 44.0, 62.0, 54.0, 54.0, 58.0, 58.0, 59.0, 43.0, 38.0, 46.0, 48.0, 30.0, 39.0, 21.0, 24.0, 17.0, 11.0, 14.0, 9.0, 6.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.617773056030273, -18.964508056640625, -18.311241149902344, -17.657976150512695, -17.004711151123047, -16.351444244384766, -15.698179244995117, -15.044913291931152, -14.391647338867188, -13.738381385803223, -13.085115432739258, -12.43185043334961, -11.778584480285645, -11.12531852722168, -10.472053527832031, -9.818787574768066, -9.165521621704102, -8.512255668640137, -7.85899019241333, -7.205724716186523, -6.552458763122559, -5.899192810058594, -5.245927333831787, -4.5926618576049805, -3.9393959045410156, -3.28613018989563, -2.632864475250244, -1.9795987606048584, -1.3263330459594727, -0.6730673313140869, -0.019801616668701172, 0.6334638595581055, 1.2867317199707031, 1.9399974346160889, 2.5932631492614746, 3.2465288639068604, 3.899794578552246, 4.553060531616211, 5.206326007843018, 5.859591484069824, 6.512857437133789, 7.166123390197754, 7.8193888664245605, 8.472654342651367, 9.125920295715332, 9.779186248779297, 10.432451248168945, 11.08571720123291, 11.738983154296875, 12.39224910736084, 13.045515060424805, 13.698780059814453, 14.352046012878418, 15.005311965942383, 15.658576965332031, 16.311843872070312, 16.96510887145996, 17.61837387084961, 18.27164077758789, 18.92490577697754, 19.578170776367188, 20.23143768310547, 20.884702682495117, 21.537967681884766, 22.191234588623047]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 10.0, 6.0, 12.0, 10.0, 12.0, 19.0, 29.0, 24.0, 27.0, 37.0, 42.0, 34.0, 37.0, 39.0, 49.0, 49.0, 50.0, 54.0, 51.0, 46.0, 40.0, 43.0, 40.0, 45.0, 39.0, 31.0, 25.0, 18.0, 13.0, 22.0, 8.0, 5.0, 14.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.852544784545898, -14.425804138183594, -13.999063491821289, -13.572322845458984, -13.145581245422363, -12.718840599060059, -12.292099952697754, -11.86535930633545, -11.438618659973145, -11.01187801361084, -10.585137367248535, -10.158395767211914, -9.73165512084961, -9.304914474487305, -8.878173828125, -8.451433181762695, -8.02469253540039, -7.597951889038086, -7.171210765838623, -6.744470119476318, -6.317729473114014, -5.890988349914551, -5.464247703552246, -5.037507057189941, -4.61076545715332, -4.184024810791016, -3.757283926010132, -3.330543041229248, -2.9038023948669434, -2.4770615100860596, -2.050320625305176, -1.623579978942871, -1.1968393325805664, -0.7700985670089722, -0.34335774183273315, 0.08338308334350586, 0.5101238489151001, 0.9368646144866943, 1.3636054992675781, 1.7903461456298828, 2.2170870304107666, 2.6438279151916504, 3.070568561553955, 3.497309446334839, 3.9240503311157227, 4.350790977478027, 4.777531623840332, 5.204272270202637, 5.6310133934021, 6.057754039764404, 6.484495162963867, 6.911235809326172, 7.337976455688477, 7.764717102050781, 8.191457748413086, 8.61819839477539, 9.044939994812012, 9.471680641174316, 9.898421287536621, 10.325162887573242, 10.751903533935547, 11.178644180297852, 11.605384826660156, 12.032125473022461, 12.458866119384766]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 11.0, 6.0, 14.0, 21.0, 22.0, 42.0, 38.0, 61.0, 113.0, 123.0, 156.0, 248.0, 399.0, 626.0, 946.0, 1732.0, 2895.0, 5159.0, 9289.0, 17290.0, 31734.0, 56799.0, 96975.0, 147487.0, 182704.0, 175094.0, 131211.0, 82357.0, 46890.0, 25607.0, 14271.0, 7652.0, 4170.0, 2471.0, 1436.0, 862.0, 561.0, 352.0, 219.0, 146.0, 116.0, 73.0, 44.0, 33.0, 33.0, 17.0, 16.0, 11.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.703125, -16.178466796875, -15.65380859375, -15.129150390625, -14.6044921875, -14.079833984375, -13.55517578125, -13.030517578125, -12.505859375, -11.981201171875, -11.45654296875, -10.931884765625, -10.4072265625, -9.882568359375, -9.35791015625, -8.833251953125, -8.30859375, -7.783935546875, -7.25927734375, -6.734619140625, -6.2099609375, -5.685302734375, -5.16064453125, -4.635986328125, -4.111328125, -3.586669921875, -3.06201171875, -2.537353515625, -2.0126953125, -1.488037109375, -0.96337890625, -0.438720703125, 0.0859375, 0.610595703125, 1.13525390625, 1.659912109375, 2.1845703125, 2.709228515625, 3.23388671875, 3.758544921875, 4.283203125, 4.807861328125, 5.33251953125, 5.857177734375, 6.3818359375, 6.906494140625, 7.43115234375, 7.955810546875, 8.48046875, 9.005126953125, 9.52978515625, 10.054443359375, 10.5791015625, 11.103759765625, 11.62841796875, 12.153076171875, 12.677734375, 13.202392578125, 13.72705078125, 14.251708984375, 14.7763671875, 15.301025390625, 15.82568359375, 16.350341796875, 16.875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 9.0, 7.0, 13.0, 23.0, 23.0, 33.0, 35.0, 46.0, 64.0, 46.0, 40.0, 49.0, 49.0, 63.0, 48.0, 52.0, 60.0, 59.0, 37.0, 32.0, 36.0, 32.0, 28.0, 17.0, 12.0, 9.0, 13.0, 13.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.296875, -14.80712890625, -14.3173828125, -13.82763671875, -13.337890625, -12.84814453125, -12.3583984375, -11.86865234375, -11.37890625, -10.88916015625, -10.3994140625, -9.90966796875, -9.419921875, -8.93017578125, -8.4404296875, -7.95068359375, -7.4609375, -6.97119140625, -6.4814453125, -5.99169921875, -5.501953125, -5.01220703125, -4.5224609375, -4.03271484375, -3.54296875, -3.05322265625, -2.5634765625, -2.07373046875, -1.583984375, -1.09423828125, -0.6044921875, -0.11474609375, 0.375, 0.86474609375, 1.3544921875, 1.84423828125, 2.333984375, 2.82373046875, 3.3134765625, 3.80322265625, 4.29296875, 4.78271484375, 5.2724609375, 5.76220703125, 6.251953125, 6.74169921875, 7.2314453125, 7.72119140625, 8.2109375, 8.70068359375, 9.1904296875, 9.68017578125, 10.169921875, 10.65966796875, 11.1494140625, 11.63916015625, 12.12890625, 12.61865234375, 13.1083984375, 13.59814453125, 14.087890625, 14.57763671875, 15.0673828125, 15.55712890625, 16.046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 16.0, 19.0, 36.0, 44.0, 78.0, 108.0, 142.0, 250.0, 398.0, 697.0, 1073.0, 1875.0, 3167.0, 5568.0, 9994.0, 17554.0, 30909.0, 53229.0, 85670.0, 126711.0, 159577.0, 165628.0, 138669.0, 98334.0, 62301.0, 37481.0, 21139.0, 11958.0, 6654.0, 3865.0, 2167.0, 1278.0, 756.0, 475.0, 269.0, 148.0, 113.0, 72.0, 50.0, 33.0, 16.0, 10.0, 10.0, 6.0, 6.0, 2.0, 1.0, 0.0, 4.0], "bins": [-15.5859375, -15.1549072265625, -14.723876953125, -14.2928466796875, -13.86181640625, -13.4307861328125, -12.999755859375, -12.5687255859375, -12.1376953125, -11.7066650390625, -11.275634765625, -10.8446044921875, -10.41357421875, -9.9825439453125, -9.551513671875, -9.1204833984375, -8.689453125, -8.2584228515625, -7.827392578125, -7.3963623046875, -6.96533203125, -6.5343017578125, -6.103271484375, -5.6722412109375, -5.2412109375, -4.8101806640625, -4.379150390625, -3.9481201171875, -3.51708984375, -3.0860595703125, -2.655029296875, -2.2239990234375, -1.79296875, -1.3619384765625, -0.930908203125, -0.4998779296875, -0.06884765625, 0.3621826171875, 0.793212890625, 1.2242431640625, 1.6552734375, 2.0863037109375, 2.517333984375, 2.9483642578125, 3.37939453125, 3.8104248046875, 4.241455078125, 4.6724853515625, 5.103515625, 5.5345458984375, 5.965576171875, 6.3966064453125, 6.82763671875, 7.2586669921875, 7.689697265625, 8.1207275390625, 8.5517578125, 8.9827880859375, 9.413818359375, 9.8448486328125, 10.27587890625, 10.7069091796875, 11.137939453125, 11.5689697265625, 12.0]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 4.0, 6.0, 3.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 14.0, 25.0, 24.0, 21.0, 27.0, 27.0, 34.0, 30.0, 33.0, 48.0, 38.0, 43.0, 40.0, 32.0, 36.0, 41.0, 31.0, 33.0, 32.0, 34.0, 31.0, 25.0, 36.0, 26.0, 27.0, 27.0, 22.0, 18.0, 11.0, 11.0, 13.0, 7.0, 8.0, 4.0, 7.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.875, -6.6630859375, -6.451171875, -6.2392578125, -6.02734375, -5.8154296875, -5.603515625, -5.3916015625, -5.1796875, -4.9677734375, -4.755859375, -4.5439453125, -4.33203125, -4.1201171875, -3.908203125, -3.6962890625, -3.484375, -3.2724609375, -3.060546875, -2.8486328125, -2.63671875, -2.4248046875, -2.212890625, -2.0009765625, -1.7890625, -1.5771484375, -1.365234375, -1.1533203125, -0.94140625, -0.7294921875, -0.517578125, -0.3056640625, -0.09375, 0.1181640625, 0.330078125, 0.5419921875, 0.75390625, 0.9658203125, 1.177734375, 1.3896484375, 1.6015625, 1.8134765625, 2.025390625, 2.2373046875, 2.44921875, 2.6611328125, 2.873046875, 3.0849609375, 3.296875, 3.5087890625, 3.720703125, 3.9326171875, 4.14453125, 4.3564453125, 4.568359375, 4.7802734375, 4.9921875, 5.2041015625, 5.416015625, 5.6279296875, 5.83984375, 6.0517578125, 6.263671875, 6.4755859375, 6.6875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 6.0, 13.0, 13.0, 21.0, 37.0, 37.0, 72.0, 66.0, 98.0, 164.0, 223.0, 333.0, 512.0, 780.0, 1298.0, 2012.0, 3446.0, 6031.0, 10538.0, 19480.0, 35885.0, 65926.0, 113589.0, 171128.0, 199419.0, 167229.0, 109885.0, 62614.0, 34367.0, 18497.0, 10352.0, 5750.0, 3323.0, 1885.0, 1225.0, 738.0, 488.0, 319.0, 237.0, 159.0, 92.0, 84.0, 57.0, 29.0, 28.0, 16.0, 15.0, 14.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-9.046875, -8.7681884765625, -8.489501953125, -8.2108154296875, -7.93212890625, -7.6534423828125, -7.374755859375, -7.0960693359375, -6.8173828125, -6.5386962890625, -6.260009765625, -5.9813232421875, -5.70263671875, -5.4239501953125, -5.145263671875, -4.8665771484375, -4.587890625, -4.3092041015625, -4.030517578125, -3.7518310546875, -3.47314453125, -3.1944580078125, -2.915771484375, -2.6370849609375, -2.3583984375, -2.0797119140625, -1.801025390625, -1.5223388671875, -1.24365234375, -0.9649658203125, -0.686279296875, -0.4075927734375, -0.12890625, 0.1497802734375, 0.428466796875, 0.7071533203125, 0.98583984375, 1.2645263671875, 1.543212890625, 1.8218994140625, 2.1005859375, 2.3792724609375, 2.657958984375, 2.9366455078125, 3.21533203125, 3.4940185546875, 3.772705078125, 4.0513916015625, 4.330078125, 4.6087646484375, 4.887451171875, 5.1661376953125, 5.44482421875, 5.7235107421875, 6.002197265625, 6.2808837890625, 6.5595703125, 6.8382568359375, 7.116943359375, 7.3956298828125, 7.67431640625, 7.9530029296875, 8.231689453125, 8.5103759765625, 8.7890625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 9.0, 16.0, 8.0, 15.0, 18.0, 19.0, 25.0, 40.0, 32.0, 42.0, 63.0, 39.0, 48.0, 53.0, 60.0, 56.0, 67.0, 51.0, 46.0, 50.0, 36.0, 33.0, 26.0, 23.0, 27.0, 18.0, 20.0, 12.0, 9.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008192062377929688, -0.0007928088307380676, -0.0007664114236831665, -0.0007400140166282654, -0.0007136166095733643, -0.0006872192025184631, -0.000660821795463562, -0.0006344243884086609, -0.0006080269813537598, -0.0005816295742988586, -0.0005552321672439575, -0.0005288347601890564, -0.0005024373531341553, -0.00047603994607925415, -0.00044964253902435303, -0.0004232451319694519, -0.0003968477249145508, -0.00037045031785964966, -0.00034405291080474854, -0.0003176555037498474, -0.0002912580966949463, -0.00026486068964004517, -0.00023846328258514404, -0.00021206587553024292, -0.0001856684684753418, -0.00015927106142044067, -0.00013287365436553955, -0.00010647624731063843, -8.00788402557373e-05, -5.368143320083618e-05, -2.728402614593506e-05, -8.866190910339355e-07, 2.5510787963867188e-05, 5.190819501876831e-05, 7.830560207366943e-05, 0.00010470300912857056, 0.00013110041618347168, 0.0001574978232383728, 0.00018389523029327393, 0.00021029263734817505, 0.00023669004440307617, 0.0002630874514579773, 0.0002894848585128784, 0.00031588226556777954, 0.00034227967262268066, 0.0003686770796775818, 0.0003950744867324829, 0.00042147189378738403, 0.00044786930084228516, 0.0004742667078971863, 0.0005006641149520874, 0.0005270615220069885, 0.0005534589290618896, 0.0005798563361167908, 0.0006062537431716919, 0.000632651150226593, 0.0006590485572814941, 0.0006854459643363953, 0.0007118433713912964, 0.0007382407784461975, 0.0007646381855010986, 0.0007910355925559998, 0.0008174329996109009, 0.000843830406665802, 0.0008702278137207031]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 15.0, 24.0, 32.0, 34.0, 59.0, 95.0, 159.0, 231.0, 386.0, 602.0, 971.0, 1608.0, 2722.0, 4543.0, 7668.0, 13634.0, 23915.0, 41913.0, 72201.0, 117297.0, 164632.0, 182693.0, 154980.0, 106081.0, 64356.0, 37463.0, 21145.0, 12076.0, 6894.0, 3939.0, 2354.0, 1471.0, 842.0, 538.0, 342.0, 219.0, 143.0, 96.0, 62.0, 30.0, 26.0, 18.0, 8.0, 8.0, 6.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.03125, -7.775390625, -7.51953125, -7.263671875, -7.0078125, -6.751953125, -6.49609375, -6.240234375, -5.984375, -5.728515625, -5.47265625, -5.216796875, -4.9609375, -4.705078125, -4.44921875, -4.193359375, -3.9375, -3.681640625, -3.42578125, -3.169921875, -2.9140625, -2.658203125, -2.40234375, -2.146484375, -1.890625, -1.634765625, -1.37890625, -1.123046875, -0.8671875, -0.611328125, -0.35546875, -0.099609375, 0.15625, 0.412109375, 0.66796875, 0.923828125, 1.1796875, 1.435546875, 1.69140625, 1.947265625, 2.203125, 2.458984375, 2.71484375, 2.970703125, 3.2265625, 3.482421875, 3.73828125, 3.994140625, 4.25, 4.505859375, 4.76171875, 5.017578125, 5.2734375, 5.529296875, 5.78515625, 6.041015625, 6.296875, 6.552734375, 6.80859375, 7.064453125, 7.3203125, 7.576171875, 7.83203125, 8.087890625, 8.34375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 6.0, 15.0, 11.0, 14.0, 12.0, 17.0, 22.0, 27.0, 47.0, 35.0, 45.0, 53.0, 54.0, 55.0, 61.0, 75.0, 66.0, 49.0, 49.0, 40.0, 48.0, 29.0, 27.0, 25.0, 21.0, 13.0, 16.0, 12.0, 11.0, 3.0, 8.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.47100830078125, -2.3834228515625, -2.29583740234375, -2.208251953125, -2.12066650390625, -2.0330810546875, -1.94549560546875, -1.85791015625, -1.77032470703125, -1.6827392578125, -1.59515380859375, -1.507568359375, -1.41998291015625, -1.3323974609375, -1.24481201171875, -1.1572265625, -1.06964111328125, -0.9820556640625, -0.89447021484375, -0.806884765625, -0.71929931640625, -0.6317138671875, -0.54412841796875, -0.45654296875, -0.36895751953125, -0.2813720703125, -0.19378662109375, -0.106201171875, -0.01861572265625, 0.0689697265625, 0.15655517578125, 0.244140625, 0.33172607421875, 0.4193115234375, 0.50689697265625, 0.594482421875, 0.68206787109375, 0.7696533203125, 0.85723876953125, 0.94482421875, 1.03240966796875, 1.1199951171875, 1.20758056640625, 1.295166015625, 1.38275146484375, 1.4703369140625, 1.55792236328125, 1.6455078125, 1.73309326171875, 1.8206787109375, 1.90826416015625, 1.995849609375, 2.08343505859375, 2.1710205078125, 2.25860595703125, 2.34619140625, 2.43377685546875, 2.5213623046875, 2.60894775390625, 2.696533203125, 2.78411865234375, 2.8717041015625, 2.95928955078125, 3.046875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 9.0, 12.0, 18.0, 18.0, 22.0, 41.0, 37.0, 37.0, 54.0, 51.0, 82.0, 52.0, 77.0, 56.0, 68.0, 58.0, 50.0, 38.0, 37.0, 30.0, 27.0, 17.0, 19.0, 17.0, 11.0, 6.0, 8.0, 2.0, 12.0, 4.0, 0.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.460142135620117, -18.730737686157227, -18.001331329345703, -17.271926879882812, -16.542522430419922, -15.813116073608398, -15.083711624145508, -14.3543062210083, -13.624900817871094, -12.895495414733887, -12.16609001159668, -11.436685562133789, -10.707280158996582, -9.977874755859375, -9.248470306396484, -8.519064903259277, -7.78965950012207, -7.060254096984863, -6.3308491706848145, -5.601444244384766, -4.872038841247559, -4.142633438110352, -3.4132285118103027, -2.683823585510254, -1.9544181823730469, -1.225013017654419, -0.495607852935791, 0.23379731178283691, 0.9632024765014648, 1.6926076412200928, 2.4220128059387207, 3.1514177322387695, 3.8808231353759766, 4.610228538513184, 5.339633464813232, 6.069038391113281, 6.798443794250488, 7.527849197387695, 8.257253646850586, 8.986659049987793, 9.716064453125, 10.445469856262207, 11.174875259399414, 11.904279708862305, 12.633685111999512, 13.363090515136719, 14.09249496459961, 14.821900367736816, 15.551305770874023, 16.280710220336914, 17.010116577148438, 17.739521026611328, 18.46892547607422, 19.198331832885742, 19.927736282348633, 20.657142639160156, 21.386547088623047, 22.115951538085938, 22.84535789489746, 23.57476234436035, 24.304168701171875, 25.033573150634766, 25.762977600097656, 26.492382049560547, 27.22178840637207]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 4.0, 4.0, 8.0, 7.0, 13.0, 13.0, 11.0, 15.0, 8.0, 14.0, 26.0, 26.0, 24.0, 34.0, 44.0, 29.0, 25.0, 52.0, 43.0, 42.0, 51.0, 42.0, 49.0, 41.0, 39.0, 52.0, 37.0, 16.0, 30.0, 29.0, 27.0, 21.0, 24.0, 20.0, 13.0, 14.0, 14.0, 9.0, 7.0, 7.0, 12.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.368841171264648, -10.982305526733398, -10.595768928527832, -10.209233283996582, -9.822696685791016, -9.436161041259766, -9.049625396728516, -8.66308879852295, -8.2765531539917, -7.890017032623291, -7.503480911254883, -7.116945266723633, -6.730409145355225, -6.343873023986816, -5.957336902618408, -5.57080078125, -5.184264659881592, -4.797728538513184, -4.411192417144775, -4.024656295776367, -3.638120651245117, -3.251584529876709, -2.865048408508301, -2.4785125255584717, -2.0919764041900635, -1.7054404020309448, -1.3189043998718262, -0.932368278503418, -0.5458322763442993, -0.15929627418518066, 0.22723984718322754, 0.6137757301330566, 1.0003118515014648, 1.3868478536605835, 1.7733838558197021, 2.1599199771881104, 2.5464558601379395, 2.9329919815063477, 3.319528102874756, 3.706063985824585, 4.092599868774414, 4.479135990142822, 4.8656721115112305, 5.2522077560424805, 5.638743877410889, 6.025279998779297, 6.411816120147705, 6.798352241516113, 7.1848883628845215, 7.57142448425293, 7.957960605621338, 8.344496726989746, 8.731032371520996, 9.117568969726562, 9.504104614257812, 9.890640258789062, 10.277176856994629, 10.663712501525879, 11.050249099731445, 11.436784744262695, 11.823321342468262, 12.209856986999512, 12.596393585205078, 12.982929229736328, 13.369464874267578]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 13.0, 16.0, 26.0, 32.0, 51.0, 75.0, 89.0, 146.0, 202.0, 338.0, 479.0, 703.0, 1128.0, 1687.0, 2632.0, 4415.0, 7187.0, 12117.0, 21513.0, 37874.0, 69756.0, 133270.0, 262834.0, 522323.0, 881499.0, 946883.0, 620571.0, 317167.0, 159035.0, 83116.0, 44393.0, 24837.0, 14659.0, 8566.0, 5215.0, 3308.0, 1999.0, 1354.0, 933.0, 597.0, 387.0, 242.0, 192.0, 118.0, 100.0, 55.0, 39.0, 32.0, 17.0, 16.0, 9.0, 12.0, 7.0, 5.0, 3.0, 2.0], "bins": [-16.84375, -16.3355712890625, -15.827392578125, -15.3192138671875, -14.81103515625, -14.3028564453125, -13.794677734375, -13.2864990234375, -12.7783203125, -12.2701416015625, -11.761962890625, -11.2537841796875, -10.74560546875, -10.2374267578125, -9.729248046875, -9.2210693359375, -8.712890625, -8.2047119140625, -7.696533203125, -7.1883544921875, -6.68017578125, -6.1719970703125, -5.663818359375, -5.1556396484375, -4.6474609375, -4.1392822265625, -3.631103515625, -3.1229248046875, -2.61474609375, -2.1065673828125, -1.598388671875, -1.0902099609375, -0.58203125, -0.0738525390625, 0.434326171875, 0.9425048828125, 1.45068359375, 1.9588623046875, 2.467041015625, 2.9752197265625, 3.4833984375, 3.9915771484375, 4.499755859375, 5.0079345703125, 5.51611328125, 6.0242919921875, 6.532470703125, 7.0406494140625, 7.548828125, 8.0570068359375, 8.565185546875, 9.0733642578125, 9.58154296875, 10.0897216796875, 10.597900390625, 11.1060791015625, 11.6142578125, 12.1224365234375, 12.630615234375, 13.1387939453125, 13.64697265625, 14.1551513671875, 14.663330078125, 15.1715087890625, 15.6796875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 5.0, 2.0, 5.0, 11.0, 13.0, 13.0, 10.0, 10.0, 17.0, 15.0, 28.0, 25.0, 32.0, 33.0, 29.0, 32.0, 38.0, 39.0, 41.0, 42.0, 44.0, 35.0, 61.0, 50.0, 46.0, 42.0, 40.0, 38.0, 39.0, 27.0, 23.0, 21.0, 17.0, 17.0, 12.0, 6.0, 12.0, 11.0, 4.0, 3.0, 1.0, 5.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1640625, -8.87841796875, -8.5927734375, -8.30712890625, -8.021484375, -7.73583984375, -7.4501953125, -7.16455078125, -6.87890625, -6.59326171875, -6.3076171875, -6.02197265625, -5.736328125, -5.45068359375, -5.1650390625, -4.87939453125, -4.59375, -4.30810546875, -4.0224609375, -3.73681640625, -3.451171875, -3.16552734375, -2.8798828125, -2.59423828125, -2.30859375, -2.02294921875, -1.7373046875, -1.45166015625, -1.166015625, -0.88037109375, -0.5947265625, -0.30908203125, -0.0234375, 0.26220703125, 0.5478515625, 0.83349609375, 1.119140625, 1.40478515625, 1.6904296875, 1.97607421875, 2.26171875, 2.54736328125, 2.8330078125, 3.11865234375, 3.404296875, 3.68994140625, 3.9755859375, 4.26123046875, 4.546875, 4.83251953125, 5.1181640625, 5.40380859375, 5.689453125, 5.97509765625, 6.2607421875, 6.54638671875, 6.83203125, 7.11767578125, 7.4033203125, 7.68896484375, 7.974609375, 8.26025390625, 8.5458984375, 8.83154296875, 9.1171875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 15.0, 23.0, 45.0, 51.0, 77.0, 131.0, 160.0, 273.0, 401.0, 673.0, 1060.0, 1697.0, 2688.0, 4383.0, 7276.0, 12377.0, 21725.0, 38595.0, 69415.0, 128998.0, 237706.0, 434658.0, 720980.0, 896821.0, 696263.0, 413971.0, 226675.0, 121935.0, 66786.0, 37166.0, 20911.0, 12091.0, 6993.0, 4306.0, 2563.0, 1576.0, 1036.0, 623.0, 373.0, 269.0, 178.0, 112.0, 69.0, 45.0, 39.0, 22.0, 14.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0], "bins": [-17.78125, -17.2652587890625, -16.749267578125, -16.2332763671875, -15.71728515625, -15.2012939453125, -14.685302734375, -14.1693115234375, -13.6533203125, -13.1373291015625, -12.621337890625, -12.1053466796875, -11.58935546875, -11.0733642578125, -10.557373046875, -10.0413818359375, -9.525390625, -9.0093994140625, -8.493408203125, -7.9774169921875, -7.46142578125, -6.9454345703125, -6.429443359375, -5.9134521484375, -5.3974609375, -4.8814697265625, -4.365478515625, -3.8494873046875, -3.33349609375, -2.8175048828125, -2.301513671875, -1.7855224609375, -1.26953125, -0.7535400390625, -0.237548828125, 0.2784423828125, 0.79443359375, 1.3104248046875, 1.826416015625, 2.3424072265625, 2.8583984375, 3.3743896484375, 3.890380859375, 4.4063720703125, 4.92236328125, 5.4383544921875, 5.954345703125, 6.4703369140625, 6.986328125, 7.5023193359375, 8.018310546875, 8.5343017578125, 9.05029296875, 9.5662841796875, 10.082275390625, 10.5982666015625, 11.1142578125, 11.6302490234375, 12.146240234375, 12.6622314453125, 13.17822265625, 13.6942138671875, 14.210205078125, 14.7261962890625, 15.2421875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 16.0, 30.0, 26.0, 35.0, 43.0, 60.0, 88.0, 117.0, 147.0, 176.0, 215.0, 262.0, 278.0, 303.0, 321.0, 310.0, 280.0, 275.0, 222.0, 159.0, 165.0, 128.0, 109.0, 65.0, 61.0, 38.0, 33.0, 32.0, 20.0, 11.0, 5.0, 11.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -4.99627685546875, -4.8011474609375, -4.60601806640625, -4.410888671875, -4.21575927734375, -4.0206298828125, -3.82550048828125, -3.63037109375, -3.43524169921875, -3.2401123046875, -3.04498291015625, -2.849853515625, -2.65472412109375, -2.4595947265625, -2.26446533203125, -2.0693359375, -1.87420654296875, -1.6790771484375, -1.48394775390625, -1.288818359375, -1.09368896484375, -0.8985595703125, -0.70343017578125, -0.50830078125, -0.31317138671875, -0.1180419921875, 0.07708740234375, 0.272216796875, 0.46734619140625, 0.6624755859375, 0.85760498046875, 1.052734375, 1.24786376953125, 1.4429931640625, 1.63812255859375, 1.833251953125, 2.02838134765625, 2.2235107421875, 2.41864013671875, 2.61376953125, 2.80889892578125, 3.0040283203125, 3.19915771484375, 3.394287109375, 3.58941650390625, 3.7845458984375, 3.97967529296875, 4.1748046875, 4.36993408203125, 4.5650634765625, 4.76019287109375, 4.955322265625, 5.15045166015625, 5.3455810546875, 5.54071044921875, 5.73583984375, 5.93096923828125, 6.1260986328125, 6.32122802734375, 6.516357421875, 6.71148681640625, 6.9066162109375, 7.10174560546875, 7.296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 9.0, 9.0, 19.0, 15.0, 22.0, 23.0, 20.0, 45.0, 34.0, 48.0, 43.0, 66.0, 74.0, 67.0, 69.0, 62.0, 60.0, 46.0, 51.0, 34.0, 19.0, 18.0, 28.0, 16.0, 18.0, 12.0, 9.0, 7.0, 10.0, 6.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.273786544799805, -18.626934051513672, -17.98008155822754, -17.333229064941406, -16.686378479003906, -16.039525985717773, -15.39267349243164, -14.745820999145508, -14.098968505859375, -13.452116012573242, -12.80526351928711, -12.158411979675293, -11.51155948638916, -10.864706993103027, -10.217855453491211, -9.571002960205078, -8.924150466918945, -8.277297973632812, -7.630445957183838, -6.983593940734863, -6.3367414474487305, -5.689888954162598, -5.043036937713623, -4.396184921264648, -3.7493324279785156, -3.102480173110962, -2.455627918243408, -1.8087756633758545, -1.1619234085083008, -0.5150711536407471, 0.13178110122680664, 0.7786331176757812, 1.425485610961914, 2.0723378658294678, 2.7191901206970215, 3.366042375564575, 4.012894630432129, 4.659747123718262, 5.306599140167236, 5.953451156616211, 6.600303649902344, 7.247156143188477, 7.894008159637451, 8.540860176086426, 9.187712669372559, 9.834565162658691, 10.481416702270508, 11.12826919555664, 11.775121688842773, 12.421974182128906, 13.068826675415039, 13.715678215026855, 14.362530708312988, 15.009383201599121, 15.656234741210938, 16.30308723449707, 16.949939727783203, 17.596792221069336, 18.24364471435547, 18.8904972076416, 19.537349700927734, 20.184200286865234, 20.831052780151367, 21.4779052734375, 22.124757766723633]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 18.0, 12.0, 18.0, 12.0, 24.0, 24.0, 29.0, 25.0, 32.0, 33.0, 40.0, 43.0, 43.0, 49.0, 45.0, 41.0, 63.0, 44.0, 39.0, 37.0, 38.0, 42.0, 25.0, 25.0, 31.0, 30.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.629175186157227, -10.27098560333252, -9.912796020507812, -9.554606437683105, -9.196416854858398, -8.838227272033691, -8.480037689208984, -8.121848106384277, -7.76365852355957, -7.405468940734863, -7.047279357910156, -6.689089775085449, -6.330900192260742, -5.972710609436035, -5.614521026611328, -5.256331443786621, -4.898141860961914, -4.539952278137207, -4.1817626953125, -3.823573112487793, -3.465383529663086, -3.107193946838379, -2.749004364013672, -2.390814781188965, -2.032625198364258, -1.6744356155395508, -1.3162460327148438, -0.9580564498901367, -0.5998668670654297, -0.24167728424072266, 0.11651229858398438, 0.4747018814086914, 0.832890510559082, 1.191080093383789, 1.549269676208496, 1.9074592590332031, 2.26564884185791, 2.623838424682617, 2.982028007507324, 3.3402175903320312, 3.6984071731567383, 4.056596755981445, 4.414786338806152, 4.772975921630859, 5.131165504455566, 5.489355087280273, 5.8475446701049805, 6.2057342529296875, 6.5639238357543945, 6.922113418579102, 7.280303001403809, 7.638492584228516, 7.996682167053223, 8.35487174987793, 8.713061332702637, 9.071250915527344, 9.42944049835205, 9.787630081176758, 10.145819664001465, 10.504009246826172, 10.862198829650879, 11.220388412475586, 11.578577995300293, 11.936767578125, 12.294957160949707]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 12.0, 21.0, 34.0, 51.0, 65.0, 85.0, 112.0, 186.0, 279.0, 393.0, 526.0, 833.0, 1343.0, 2006.0, 3336.0, 5647.0, 9537.0, 16024.0, 28479.0, 49858.0, 87495.0, 140043.0, 185596.0, 183389.0, 135696.0, 83814.0, 48099.0, 27109.0, 15159.0, 9010.0, 5357.0, 3180.0, 1947.0, 1261.0, 834.0, 589.0, 333.0, 219.0, 172.0, 125.0, 67.0, 58.0, 46.0, 24.0, 34.0, 12.0, 5.0, 11.0, 8.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.9017333984375, -10.537841796875, -10.1739501953125, -9.81005859375, -9.4461669921875, -9.082275390625, -8.7183837890625, -8.3544921875, -7.9906005859375, -7.626708984375, -7.2628173828125, -6.89892578125, -6.5350341796875, -6.171142578125, -5.8072509765625, -5.443359375, -5.0794677734375, -4.715576171875, -4.3516845703125, -3.98779296875, -3.6239013671875, -3.260009765625, -2.8961181640625, -2.5322265625, -2.1683349609375, -1.804443359375, -1.4405517578125, -1.07666015625, -0.7127685546875, -0.348876953125, 0.0150146484375, 0.37890625, 0.7427978515625, 1.106689453125, 1.4705810546875, 1.83447265625, 2.1983642578125, 2.562255859375, 2.9261474609375, 3.2900390625, 3.6539306640625, 4.017822265625, 4.3817138671875, 4.74560546875, 5.1094970703125, 5.473388671875, 5.8372802734375, 6.201171875, 6.5650634765625, 6.928955078125, 7.2928466796875, 7.65673828125, 8.0206298828125, 8.384521484375, 8.7484130859375, 9.1123046875, 9.4761962890625, 9.840087890625, 10.2039794921875, 10.56787109375, 10.9317626953125, 11.295654296875, 11.6595458984375, 12.0234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 7.0, 17.0, 10.0, 17.0, 17.0, 25.0, 22.0, 34.0, 37.0, 32.0, 21.0, 41.0, 50.0, 58.0, 43.0, 43.0, 60.0, 45.0, 47.0, 49.0, 34.0, 30.0, 27.0, 26.0, 36.0, 30.0, 20.0, 20.0, 13.0, 15.0, 12.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1796875, -11.789306640625, -11.39892578125, -11.008544921875, -10.6181640625, -10.227783203125, -9.83740234375, -9.447021484375, -9.056640625, -8.666259765625, -8.27587890625, -7.885498046875, -7.4951171875, -7.104736328125, -6.71435546875, -6.323974609375, -5.93359375, -5.543212890625, -5.15283203125, -4.762451171875, -4.3720703125, -3.981689453125, -3.59130859375, -3.200927734375, -2.810546875, -2.420166015625, -2.02978515625, -1.639404296875, -1.2490234375, -0.858642578125, -0.46826171875, -0.077880859375, 0.3125, 0.702880859375, 1.09326171875, 1.483642578125, 1.8740234375, 2.264404296875, 2.65478515625, 3.045166015625, 3.435546875, 3.825927734375, 4.21630859375, 4.606689453125, 4.9970703125, 5.387451171875, 5.77783203125, 6.168212890625, 6.55859375, 6.948974609375, 7.33935546875, 7.729736328125, 8.1201171875, 8.510498046875, 8.90087890625, 9.291259765625, 9.681640625, 10.072021484375, 10.46240234375, 10.852783203125, 11.2431640625, 11.633544921875, 12.02392578125, 12.414306640625, 12.8046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 28.0, 35.0, 56.0, 80.0, 158.0, 203.0, 324.0, 658.0, 1134.0, 2046.0, 3939.0, 8433.0, 19049.0, 45334.0, 110973.0, 245685.0, 310000.0, 172985.0, 72177.0, 29856.0, 12864.0, 5904.0, 2912.0, 1556.0, 849.0, 499.0, 282.0, 159.0, 114.0, 83.0, 54.0, 23.0, 24.0, 20.0, 9.0, 3.0, 9.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.8115234375, -15.185546875, -14.5595703125, -13.93359375, -13.3076171875, -12.681640625, -12.0556640625, -11.4296875, -10.8037109375, -10.177734375, -9.5517578125, -8.92578125, -8.2998046875, -7.673828125, -7.0478515625, -6.421875, -5.7958984375, -5.169921875, -4.5439453125, -3.91796875, -3.2919921875, -2.666015625, -2.0400390625, -1.4140625, -0.7880859375, -0.162109375, 0.4638671875, 1.08984375, 1.7158203125, 2.341796875, 2.9677734375, 3.59375, 4.2197265625, 4.845703125, 5.4716796875, 6.09765625, 6.7236328125, 7.349609375, 7.9755859375, 8.6015625, 9.2275390625, 9.853515625, 10.4794921875, 11.10546875, 11.7314453125, 12.357421875, 12.9833984375, 13.609375, 14.2353515625, 14.861328125, 15.4873046875, 16.11328125, 16.7392578125, 17.365234375, 17.9912109375, 18.6171875, 19.2431640625, 19.869140625, 20.4951171875, 21.12109375, 21.7470703125, 22.373046875, 22.9990234375, 23.625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 18.0, 22.0, 20.0, 32.0, 29.0, 22.0, 39.0, 46.0, 41.0, 42.0, 47.0, 41.0, 44.0, 47.0, 46.0, 39.0, 41.0, 36.0, 40.0, 36.0, 41.0, 39.0, 27.0, 25.0, 28.0, 20.0, 17.0, 7.0, 9.0, 13.0, 11.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.7958984375, -6.560546875, -6.3251953125, -6.08984375, -5.8544921875, -5.619140625, -5.3837890625, -5.1484375, -4.9130859375, -4.677734375, -4.4423828125, -4.20703125, -3.9716796875, -3.736328125, -3.5009765625, -3.265625, -3.0302734375, -2.794921875, -2.5595703125, -2.32421875, -2.0888671875, -1.853515625, -1.6181640625, -1.3828125, -1.1474609375, -0.912109375, -0.6767578125, -0.44140625, -0.2060546875, 0.029296875, 0.2646484375, 0.5, 0.7353515625, 0.970703125, 1.2060546875, 1.44140625, 1.6767578125, 1.912109375, 2.1474609375, 2.3828125, 2.6181640625, 2.853515625, 3.0888671875, 3.32421875, 3.5595703125, 3.794921875, 4.0302734375, 4.265625, 4.5009765625, 4.736328125, 4.9716796875, 5.20703125, 5.4423828125, 5.677734375, 5.9130859375, 6.1484375, 6.3837890625, 6.619140625, 6.8544921875, 7.08984375, 7.3251953125, 7.560546875, 7.7958984375, 8.03125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 16.0, 13.0, 21.0, 44.0, 42.0, 60.0, 107.0, 180.0, 249.0, 393.0, 737.0, 1275.0, 2319.0, 4479.0, 9404.0, 20295.0, 45979.0, 109466.0, 240736.0, 309134.0, 171005.0, 73401.0, 31187.0, 13983.0, 6570.0, 3225.0, 1701.0, 964.0, 586.0, 319.0, 248.0, 119.0, 99.0, 55.0, 34.0, 29.0, 18.0, 17.0, 7.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.1015625, -8.8280029296875, -8.554443359375, -8.2808837890625, -8.00732421875, -7.7337646484375, -7.460205078125, -7.1866455078125, -6.9130859375, -6.6395263671875, -6.365966796875, -6.0924072265625, -5.81884765625, -5.5452880859375, -5.271728515625, -4.9981689453125, -4.724609375, -4.4510498046875, -4.177490234375, -3.9039306640625, -3.63037109375, -3.3568115234375, -3.083251953125, -2.8096923828125, -2.5361328125, -2.2625732421875, -1.989013671875, -1.7154541015625, -1.44189453125, -1.1683349609375, -0.894775390625, -0.6212158203125, -0.34765625, -0.0740966796875, 0.199462890625, 0.4730224609375, 0.74658203125, 1.0201416015625, 1.293701171875, 1.5672607421875, 1.8408203125, 2.1143798828125, 2.387939453125, 2.6614990234375, 2.93505859375, 3.2086181640625, 3.482177734375, 3.7557373046875, 4.029296875, 4.3028564453125, 4.576416015625, 4.8499755859375, 5.12353515625, 5.3970947265625, 5.670654296875, 5.9442138671875, 6.2177734375, 6.4913330078125, 6.764892578125, 7.0384521484375, 7.31201171875, 7.5855712890625, 7.859130859375, 8.1326904296875, 8.40625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 6.0, 17.0, 14.0, 17.0, 15.0, 20.0, 24.0, 38.0, 51.0, 54.0, 58.0, 79.0, 68.0, 64.0, 56.0, 79.0, 52.0, 62.0, 34.0, 40.0, 22.0, 20.0, 19.0, 12.0, 9.0, 17.0, 6.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002980232238769531, -0.0002882517874240875, -0.0002784803509712219, -0.0002687089145183563, -0.0002589374780654907, -0.0002491660416126251, -0.00023939460515975952, -0.00022962316870689392, -0.00021985173225402832, -0.00021008029580116272, -0.00020030885934829712, -0.00019053742289543152, -0.00018076598644256592, -0.00017099454998970032, -0.00016122311353683472, -0.00015145167708396912, -0.00014168024063110352, -0.00013190880417823792, -0.00012213736772537231, -0.00011236593127250671, -0.00010259449481964111, -9.282305836677551e-05, -8.305162191390991e-05, -7.328018546104431e-05, -6.350874900817871e-05, -5.373731255531311e-05, -4.396587610244751e-05, -3.419443964958191e-05, -2.442300319671631e-05, -1.4651566743850708e-05, -4.880130290985107e-06, 4.891306161880493e-06, 1.4662742614746094e-05, 2.4434179067611694e-05, 3.4205615520477295e-05, 4.3977051973342896e-05, 5.3748488426208496e-05, 6.35199248790741e-05, 7.32913613319397e-05, 8.30627977848053e-05, 9.28342342376709e-05, 0.0001026056706905365, 0.0001123771071434021, 0.0001221485435962677, 0.0001319199800491333, 0.0001416914165019989, 0.0001514628529548645, 0.0001612342894077301, 0.0001710057258605957, 0.0001807771623134613, 0.0001905485987663269, 0.0002003200352191925, 0.0002100914716720581, 0.0002198629081249237, 0.0002296343445777893, 0.0002394057810306549, 0.0002491772174835205, 0.0002589486539363861, 0.0002687200903892517, 0.0002784915268421173, 0.0002882629632949829, 0.0002980343997478485, 0.0003078058362007141, 0.0003175772726535797, 0.0003273487091064453]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 3.0, 11.0, 18.0, 13.0, 29.0, 34.0, 57.0, 91.0, 128.0, 191.0, 319.0, 387.0, 600.0, 947.0, 1563.0, 2632.0, 4654.0, 8422.0, 15615.0, 31224.0, 60140.0, 112702.0, 182010.0, 216921.0, 177022.0, 109268.0, 58458.0, 30101.0, 15393.0, 8206.0, 4475.0, 2617.0, 1478.0, 960.0, 634.0, 388.0, 273.0, 187.0, 121.0, 81.0, 60.0, 44.0, 20.0, 19.0, 16.0, 4.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.735107421875, -5.54052734375, -5.345947265625, -5.1513671875, -4.956787109375, -4.76220703125, -4.567626953125, -4.373046875, -4.178466796875, -3.98388671875, -3.789306640625, -3.5947265625, -3.400146484375, -3.20556640625, -3.010986328125, -2.81640625, -2.621826171875, -2.42724609375, -2.232666015625, -2.0380859375, -1.843505859375, -1.64892578125, -1.454345703125, -1.259765625, -1.065185546875, -0.87060546875, -0.676025390625, -0.4814453125, -0.286865234375, -0.09228515625, 0.102294921875, 0.296875, 0.491455078125, 0.68603515625, 0.880615234375, 1.0751953125, 1.269775390625, 1.46435546875, 1.658935546875, 1.853515625, 2.048095703125, 2.24267578125, 2.437255859375, 2.6318359375, 2.826416015625, 3.02099609375, 3.215576171875, 3.41015625, 3.604736328125, 3.79931640625, 3.993896484375, 4.1884765625, 4.383056640625, 4.57763671875, 4.772216796875, 4.966796875, 5.161376953125, 5.35595703125, 5.550537109375, 5.7451171875, 5.939697265625, 6.13427734375, 6.328857421875, 6.5234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 7.0, 2.0, 7.0, 3.0, 9.0, 15.0, 19.0, 16.0, 28.0, 32.0, 29.0, 32.0, 35.0, 45.0, 58.0, 53.0, 55.0, 54.0, 65.0, 57.0, 57.0, 59.0, 51.0, 51.0, 28.0, 30.0, 22.0, 19.0, 9.0, 7.0, 12.0, 9.0, 1.0, 9.0, 8.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.736328125, -1.67657470703125, -1.6168212890625, -1.55706787109375, -1.497314453125, -1.43756103515625, -1.3778076171875, -1.31805419921875, -1.25830078125, -1.19854736328125, -1.1387939453125, -1.07904052734375, -1.019287109375, -0.95953369140625, -0.8997802734375, -0.84002685546875, -0.7802734375, -0.72052001953125, -0.6607666015625, -0.60101318359375, -0.541259765625, -0.48150634765625, -0.4217529296875, -0.36199951171875, -0.30224609375, -0.24249267578125, -0.1827392578125, -0.12298583984375, -0.063232421875, -0.00347900390625, 0.0562744140625, 0.11602783203125, 0.17578125, 0.23553466796875, 0.2952880859375, 0.35504150390625, 0.414794921875, 0.47454833984375, 0.5343017578125, 0.59405517578125, 0.65380859375, 0.71356201171875, 0.7733154296875, 0.83306884765625, 0.892822265625, 0.95257568359375, 1.0123291015625, 1.07208251953125, 1.1318359375, 1.19158935546875, 1.2513427734375, 1.31109619140625, 1.370849609375, 1.43060302734375, 1.4903564453125, 1.55010986328125, 1.60986328125, 1.66961669921875, 1.7293701171875, 1.78912353515625, 1.848876953125, 1.90863037109375, 1.9683837890625, 2.02813720703125, 2.087890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 3.0, 4.0, 11.0, 15.0, 11.0, 17.0, 22.0, 19.0, 43.0, 32.0, 35.0, 52.0, 63.0, 63.0, 72.0, 69.0, 71.0, 61.0, 57.0, 46.0, 50.0, 22.0, 18.0, 27.0, 23.0, 17.0, 8.0, 10.0, 11.0, 9.0, 6.0, 0.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.129344940185547, -19.466495513916016, -18.803647994995117, -18.140798568725586, -17.477951049804688, -16.815101623535156, -16.152254104614258, -15.489404678344727, -14.826556205749512, -14.163707733154297, -13.500859260559082, -12.838010787963867, -12.175161361694336, -11.512313842773438, -10.849464416503906, -10.186615943908691, -9.523767471313477, -8.860918998718262, -8.198070526123047, -7.535221576690674, -6.872373104095459, -6.209524631500244, -5.546675682067871, -4.883827209472656, -4.220978736877441, -3.5581302642822266, -2.8952815532684326, -2.2324328422546387, -1.5695843696594238, -0.906735897064209, -0.24388718605041504, 0.4189615249633789, 1.081808090209961, 1.7446566820144653, 2.4075052738189697, 3.0703539848327637, 3.7332024574279785, 4.396050930023193, 5.058899879455566, 5.721748352050781, 6.384596824645996, 7.047445297241211, 7.710293769836426, 8.37314224243164, 9.035991668701172, 9.69883918762207, 10.361688613891602, 11.024537086486816, 11.687385559082031, 12.350234031677246, 13.013082504272461, 13.675930976867676, 14.33877944946289, 15.001628875732422, 15.664477348327637, 16.32732582092285, 16.99017333984375, 17.65302276611328, 18.31587028503418, 18.97871971130371, 19.64156723022461, 20.30441665649414, 20.96726417541504, 21.63011360168457, 22.2929630279541]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 13.0, 14.0, 10.0, 15.0, 18.0, 25.0, 23.0, 25.0, 25.0, 26.0, 34.0, 38.0, 38.0, 34.0, 48.0, 40.0, 48.0, 48.0, 41.0, 37.0, 44.0, 37.0, 32.0, 38.0, 29.0, 25.0, 19.0, 33.0, 20.0, 25.0, 14.0, 14.0, 17.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.874702453613281, -9.548356056213379, -9.22200870513916, -8.895662307739258, -8.569314956665039, -8.242968559265137, -7.916621208190918, -7.590274810791016, -7.263927459716797, -6.937580585479736, -6.611233711242676, -6.284886837005615, -5.958539962768555, -5.632193088531494, -5.305846214294434, -4.979499816894531, -4.653152942657471, -4.32680606842041, -4.00045919418335, -3.674112319946289, -3.3477654457092285, -3.021418571472168, -2.6950719356536865, -2.368725061416626, -2.0423781871795654, -1.7160313129425049, -1.3896844387054443, -1.0633376836776733, -0.7369908094406128, -0.41064393520355225, -0.08429718017578125, 0.2420496940612793, 0.5683965682983398, 0.8947434425354004, 1.221090316772461, 1.547437071800232, 1.8737839460372925, 2.2001309394836426, 2.526477575302124, 2.8528244495391846, 3.179171323776245, 3.5055181980133057, 3.831865072250366, 4.158211708068848, 4.484558582305908, 4.810905456542969, 5.137252330780029, 5.46359920501709, 5.78994607925415, 6.116292953491211, 6.4426398277282715, 6.768986701965332, 7.095333576202393, 7.421680450439453, 7.7480268478393555, 8.074374198913574, 8.400720596313477, 8.727066993713379, 9.053414344787598, 9.3797607421875, 9.706108093261719, 10.032454490661621, 10.35880184173584, 10.685148239135742, 11.011495590209961]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 16.0, 26.0, 30.0, 55.0, 87.0, 135.0, 208.0, 371.0, 628.0, 1163.0, 2228.0, 4489.0, 8944.0, 18498.0, 37723.0, 73628.0, 129921.0, 191645.0, 208267.0, 163324.0, 100287.0, 53934.0, 26745.0, 13099.0, 6321.0, 3101.0, 1570.0, 860.0, 517.0, 272.0, 150.0, 107.0, 63.0, 43.0, 27.0, 22.0, 13.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.40625, -15.88134765625, -15.3564453125, -14.83154296875, -14.306640625, -13.78173828125, -13.2568359375, -12.73193359375, -12.20703125, -11.68212890625, -11.1572265625, -10.63232421875, -10.107421875, -9.58251953125, -9.0576171875, -8.53271484375, -8.0078125, -7.48291015625, -6.9580078125, -6.43310546875, -5.908203125, -5.38330078125, -4.8583984375, -4.33349609375, -3.80859375, -3.28369140625, -2.7587890625, -2.23388671875, -1.708984375, -1.18408203125, -0.6591796875, -0.13427734375, 0.390625, 0.91552734375, 1.4404296875, 1.96533203125, 2.490234375, 3.01513671875, 3.5400390625, 4.06494140625, 4.58984375, 5.11474609375, 5.6396484375, 6.16455078125, 6.689453125, 7.21435546875, 7.7392578125, 8.26416015625, 8.7890625, 9.31396484375, 9.8388671875, 10.36376953125, 10.888671875, 11.41357421875, 11.9384765625, 12.46337890625, 12.98828125, 13.51318359375, 14.0380859375, 14.56298828125, 15.087890625, 15.61279296875, 16.1376953125, 16.66259765625, 17.1875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 7.0, 10.0, 12.0, 16.0, 21.0, 19.0, 27.0, 29.0, 22.0, 19.0, 27.0, 33.0, 28.0, 39.0, 43.0, 42.0, 45.0, 50.0, 33.0, 34.0, 36.0, 40.0, 39.0, 27.0, 31.0, 28.0, 26.0, 27.0, 25.0, 24.0, 25.0, 18.0, 8.0, 19.0, 12.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.953125, -9.6209716796875, -9.288818359375, -8.9566650390625, -8.62451171875, -8.2923583984375, -7.960205078125, -7.6280517578125, -7.2958984375, -6.9637451171875, -6.631591796875, -6.2994384765625, -5.96728515625, -5.6351318359375, -5.302978515625, -4.9708251953125, -4.638671875, -4.3065185546875, -3.974365234375, -3.6422119140625, -3.31005859375, -2.9779052734375, -2.645751953125, -2.3135986328125, -1.9814453125, -1.6492919921875, -1.317138671875, -0.9849853515625, -0.65283203125, -0.3206787109375, 0.011474609375, 0.3436279296875, 0.67578125, 1.0079345703125, 1.340087890625, 1.6722412109375, 2.00439453125, 2.3365478515625, 2.668701171875, 3.0008544921875, 3.3330078125, 3.6651611328125, 3.997314453125, 4.3294677734375, 4.66162109375, 4.9937744140625, 5.325927734375, 5.6580810546875, 5.990234375, 6.3223876953125, 6.654541015625, 6.9866943359375, 7.31884765625, 7.6510009765625, 7.983154296875, 8.3153076171875, 8.6474609375, 8.9796142578125, 9.311767578125, 9.6439208984375, 9.97607421875, 10.3082275390625, 10.640380859375, 10.9725341796875, 11.3046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 13.0, 26.0, 38.0, 48.0, 57.0, 69.0, 119.0, 165.0, 246.0, 446.0, 746.0, 1339.0, 2816.0, 6710.0, 17135.0, 44537.0, 109220.0, 216825.0, 278653.0, 203763.0, 98627.0, 39959.0, 15401.0, 5980.0, 2592.0, 1230.0, 678.0, 410.0, 239.0, 145.0, 105.0, 64.0, 41.0, 24.0, 17.0, 21.0, 14.0, 9.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.09375, -18.42236328125, -17.7509765625, -17.07958984375, -16.408203125, -15.73681640625, -15.0654296875, -14.39404296875, -13.72265625, -13.05126953125, -12.3798828125, -11.70849609375, -11.037109375, -10.36572265625, -9.6943359375, -9.02294921875, -8.3515625, -7.68017578125, -7.0087890625, -6.33740234375, -5.666015625, -4.99462890625, -4.3232421875, -3.65185546875, -2.98046875, -2.30908203125, -1.6376953125, -0.96630859375, -0.294921875, 0.37646484375, 1.0478515625, 1.71923828125, 2.390625, 3.06201171875, 3.7333984375, 4.40478515625, 5.076171875, 5.74755859375, 6.4189453125, 7.09033203125, 7.76171875, 8.43310546875, 9.1044921875, 9.77587890625, 10.447265625, 11.11865234375, 11.7900390625, 12.46142578125, 13.1328125, 13.80419921875, 14.4755859375, 15.14697265625, 15.818359375, 16.48974609375, 17.1611328125, 17.83251953125, 18.50390625, 19.17529296875, 19.8466796875, 20.51806640625, 21.189453125, 21.86083984375, 22.5322265625, 23.20361328125, 23.875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 11.0, 9.0, 10.0, 29.0, 7.0, 14.0, 17.0, 29.0, 18.0, 28.0, 28.0, 32.0, 31.0, 34.0, 38.0, 31.0, 35.0, 31.0, 38.0, 40.0, 31.0, 41.0, 20.0, 29.0, 37.0, 31.0, 29.0, 23.0, 18.0, 33.0, 24.0, 26.0, 13.0, 19.0, 18.0, 17.0, 12.0, 4.0, 17.0, 3.0, 2.0, 5.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.84765625, -5.6590576171875, -5.470458984375, -5.2818603515625, -5.09326171875, -4.9046630859375, -4.716064453125, -4.5274658203125, -4.3388671875, -4.1502685546875, -3.961669921875, -3.7730712890625, -3.58447265625, -3.3958740234375, -3.207275390625, -3.0186767578125, -2.830078125, -2.6414794921875, -2.452880859375, -2.2642822265625, -2.07568359375, -1.8870849609375, -1.698486328125, -1.5098876953125, -1.3212890625, -1.1326904296875, -0.944091796875, -0.7554931640625, -0.56689453125, -0.3782958984375, -0.189697265625, -0.0010986328125, 0.1875, 0.3760986328125, 0.564697265625, 0.7532958984375, 0.94189453125, 1.1304931640625, 1.319091796875, 1.5076904296875, 1.6962890625, 1.8848876953125, 2.073486328125, 2.2620849609375, 2.45068359375, 2.6392822265625, 2.827880859375, 3.0164794921875, 3.205078125, 3.3936767578125, 3.582275390625, 3.7708740234375, 3.95947265625, 4.1480712890625, 4.336669921875, 4.5252685546875, 4.7138671875, 4.9024658203125, 5.091064453125, 5.2796630859375, 5.46826171875, 5.6568603515625, 5.845458984375, 6.0340576171875, 6.22265625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 34.0, 34.0, 72.0, 105.0, 162.0, 234.0, 380.0, 559.0, 812.0, 1227.0, 1916.0, 3071.0, 4616.0, 7441.0, 11793.0, 19078.0, 30929.0, 50086.0, 78853.0, 117520.0, 151793.0, 161875.0, 137070.0, 98691.0, 63892.0, 39782.0, 24915.0, 15192.0, 9467.0, 5995.0, 3804.0, 2477.0, 1651.0, 1011.0, 647.0, 462.0, 297.0, 198.0, 129.0, 82.0, 45.0, 37.0, 31.0, 16.0, 6.0, 7.0, 10.0, 1.0, 4.0, 4.0], "bins": [-6.22265625, -6.04620361328125, -5.8697509765625, -5.69329833984375, -5.516845703125, -5.34039306640625, -5.1639404296875, -4.98748779296875, -4.81103515625, -4.63458251953125, -4.4581298828125, -4.28167724609375, -4.105224609375, -3.92877197265625, -3.7523193359375, -3.57586669921875, -3.3994140625, -3.22296142578125, -3.0465087890625, -2.87005615234375, -2.693603515625, -2.51715087890625, -2.3406982421875, -2.16424560546875, -1.98779296875, -1.81134033203125, -1.6348876953125, -1.45843505859375, -1.281982421875, -1.10552978515625, -0.9290771484375, -0.75262451171875, -0.576171875, -0.39971923828125, -0.2232666015625, -0.04681396484375, 0.129638671875, 0.30609130859375, 0.4825439453125, 0.65899658203125, 0.83544921875, 1.01190185546875, 1.1883544921875, 1.36480712890625, 1.541259765625, 1.71771240234375, 1.8941650390625, 2.07061767578125, 2.2470703125, 2.42352294921875, 2.5999755859375, 2.77642822265625, 2.952880859375, 3.12933349609375, 3.3057861328125, 3.48223876953125, 3.65869140625, 3.83514404296875, 4.0115966796875, 4.18804931640625, 4.364501953125, 4.54095458984375, 4.7174072265625, 4.89385986328125, 5.0703125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 15.0, 24.0, 21.0, 32.0, 53.0, 48.0, 62.0, 77.0, 78.0, 91.0, 81.0, 89.0, 65.0, 45.0, 41.0, 29.0, 30.0, 24.0, 11.0, 11.0, 11.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006399154663085938, -0.0006174445152282715, -0.0005949735641479492, -0.000572502613067627, -0.0005500316619873047, -0.0005275607109069824, -0.0005050897598266602, -0.0004826188087463379, -0.0004601478576660156, -0.00043767690658569336, -0.0004152059555053711, -0.00039273500442504883, -0.00037026405334472656, -0.0003477931022644043, -0.00032532215118408203, -0.00030285120010375977, -0.0002803802490234375, -0.00025790929794311523, -0.00023543834686279297, -0.0002129673957824707, -0.00019049644470214844, -0.00016802549362182617, -0.0001455545425415039, -0.00012308359146118164, -0.00010061264038085938, -7.814168930053711e-05, -5.5670738220214844e-05, -3.319978713989258e-05, -1.0728836059570312e-05, 1.1742115020751953e-05, 3.421306610107422e-05, 5.6684017181396484e-05, 7.915496826171875e-05, 0.00010162591934204102, 0.00012409687042236328, 0.00014656782150268555, 0.0001690387725830078, 0.00019150972366333008, 0.00021398067474365234, 0.0002364516258239746, 0.0002589225769042969, 0.00028139352798461914, 0.0003038644790649414, 0.00032633543014526367, 0.00034880638122558594, 0.0003712773323059082, 0.00039374828338623047, 0.00041621923446655273, 0.000438690185546875, 0.00046116113662719727, 0.00048363208770751953, 0.0005061030387878418, 0.0005285739898681641, 0.0005510449409484863, 0.0005735158920288086, 0.0005959868431091309, 0.0006184577941894531, 0.0006409287452697754, 0.0006633996963500977, 0.0006858706474304199, 0.0007083415985107422, 0.0007308125495910645, 0.0007532835006713867, 0.000775754451751709, 0.0007982254028320312]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 14.0, 23.0, 43.0, 40.0, 72.0, 103.0, 144.0, 214.0, 329.0, 519.0, 773.0, 1227.0, 1827.0, 2921.0, 4758.0, 7813.0, 12918.0, 21635.0, 36179.0, 59153.0, 92919.0, 134716.0, 163554.0, 159542.0, 125429.0, 85667.0, 53640.0, 32240.0, 19526.0, 11549.0, 7157.0, 4279.0, 2658.0, 1743.0, 1075.0, 728.0, 434.0, 325.0, 183.0, 144.0, 106.0, 57.0, 46.0, 40.0, 23.0, 11.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0], "bins": [-5.80859375, -5.63201904296875, -5.4554443359375, -5.27886962890625, -5.102294921875, -4.92572021484375, -4.7491455078125, -4.57257080078125, -4.39599609375, -4.21942138671875, -4.0428466796875, -3.86627197265625, -3.689697265625, -3.51312255859375, -3.3365478515625, -3.15997314453125, -2.9833984375, -2.80682373046875, -2.6302490234375, -2.45367431640625, -2.277099609375, -2.10052490234375, -1.9239501953125, -1.74737548828125, -1.57080078125, -1.39422607421875, -1.2176513671875, -1.04107666015625, -0.864501953125, -0.68792724609375, -0.5113525390625, -0.33477783203125, -0.158203125, 0.01837158203125, 0.1949462890625, 0.37152099609375, 0.548095703125, 0.72467041015625, 0.9012451171875, 1.07781982421875, 1.25439453125, 1.43096923828125, 1.6075439453125, 1.78411865234375, 1.960693359375, 2.13726806640625, 2.3138427734375, 2.49041748046875, 2.6669921875, 2.84356689453125, 3.0201416015625, 3.19671630859375, 3.373291015625, 3.54986572265625, 3.7264404296875, 3.90301513671875, 4.07958984375, 4.25616455078125, 4.4327392578125, 4.60931396484375, 4.785888671875, 4.96246337890625, 5.1390380859375, 5.31561279296875, 5.4921875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 18.0, 13.0, 11.0, 21.0, 23.0, 21.0, 23.0, 30.0, 49.0, 46.0, 46.0, 50.0, 69.0, 53.0, 56.0, 54.0, 35.0, 70.0, 45.0, 41.0, 29.0, 35.0, 14.0, 27.0, 21.0, 18.0, 21.0, 10.0, 10.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.81781005859375, -1.7586669921875, -1.69952392578125, -1.640380859375, -1.58123779296875, -1.5220947265625, -1.46295166015625, -1.40380859375, -1.34466552734375, -1.2855224609375, -1.22637939453125, -1.167236328125, -1.10809326171875, -1.0489501953125, -0.98980712890625, -0.9306640625, -0.87152099609375, -0.8123779296875, -0.75323486328125, -0.694091796875, -0.63494873046875, -0.5758056640625, -0.51666259765625, -0.45751953125, -0.39837646484375, -0.3392333984375, -0.28009033203125, -0.220947265625, -0.16180419921875, -0.1026611328125, -0.04351806640625, 0.015625, 0.07476806640625, 0.1339111328125, 0.19305419921875, 0.252197265625, 0.31134033203125, 0.3704833984375, 0.42962646484375, 0.48876953125, 0.54791259765625, 0.6070556640625, 0.66619873046875, 0.725341796875, 0.78448486328125, 0.8436279296875, 0.90277099609375, 0.9619140625, 1.02105712890625, 1.0802001953125, 1.13934326171875, 1.198486328125, 1.25762939453125, 1.3167724609375, 1.37591552734375, 1.43505859375, 1.49420166015625, 1.5533447265625, 1.61248779296875, 1.671630859375, 1.73077392578125, 1.7899169921875, 1.84906005859375, 1.908203125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 7.0, 9.0, 10.0, 19.0, 18.0, 26.0, 30.0, 41.0, 50.0, 50.0, 61.0, 75.0, 57.0, 72.0, 81.0, 71.0, 59.0, 55.0, 46.0, 25.0, 18.0, 21.0, 15.0, 17.0, 12.0, 10.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.58266830444336, -21.86414337158203, -21.145618438720703, -20.427093505859375, -19.708568572998047, -18.99004364013672, -18.27151870727539, -17.552993774414062, -16.834468841552734, -16.115943908691406, -15.397418975830078, -14.67889404296875, -13.960369110107422, -13.241844177246094, -12.523320198059082, -11.804795265197754, -11.086271286010742, -10.367746353149414, -9.649221420288086, -8.930696487426758, -8.21217155456543, -7.49364709854126, -6.77512264251709, -6.056597709655762, -5.338072776794434, -4.6195478439331055, -3.9010231494903564, -3.1824984550476074, -2.4639735221862793, -1.7454485893249512, -1.0269241333007812, -0.3083992004394531, 0.410125732421875, 1.1286505460739136, 1.8471753597259521, 2.565700054168701, 3.2842249870300293, 4.002749919891357, 4.721274375915527, 5.4397993087768555, 6.158324241638184, 6.876849174499512, 7.59537410736084, 8.313898086547852, 9.03242301940918, 9.750947952270508, 10.469472885131836, 11.187997817993164, 11.906522750854492, 12.62504768371582, 13.343572616577148, 14.062097549438477, 14.780622482299805, 15.499147415161133, 16.217670440673828, 16.936195373535156, 17.654720306396484, 18.373245239257812, 19.09177017211914, 19.81029510498047, 20.528820037841797, 21.247344970703125, 21.965869903564453, 22.68439483642578, 23.40291976928711]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 11.0, 7.0, 7.0, 4.0, 9.0, 11.0, 15.0, 18.0, 24.0, 23.0, 18.0, 26.0, 32.0, 29.0, 44.0, 46.0, 47.0, 37.0, 27.0, 45.0, 37.0, 38.0, 45.0, 45.0, 39.0, 28.0, 44.0, 27.0, 25.0, 23.0, 20.0, 18.0, 21.0, 21.0, 19.0, 13.0, 9.0, 11.0, 12.0, 4.0, 2.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.802571296691895, -8.481050491333008, -8.159530639648438, -7.838009834289551, -7.516489505767822, -7.194969177246094, -6.873448371887207, -6.5519280433654785, -6.23040771484375, -5.9088873863220215, -5.587367057800293, -5.265846252441406, -4.944325923919678, -4.622805595397949, -4.3012847900390625, -3.979764461517334, -3.6582441329956055, -3.336723804473877, -3.0152032375335693, -2.6936826705932617, -2.372162342071533, -2.0506420135498047, -1.729121446609497, -1.4076008796691895, -1.086080551147461, -0.7645601034164429, -0.4430396556854248, -0.12151920795440674, 0.20000123977661133, 0.5215216875076294, 0.8430421352386475, 1.164562702178955, 1.4860830307006836, 1.8076034784317017, 2.1291239261627197, 2.4506444931030273, 2.772164821624756, 3.0936851501464844, 3.415205717086792, 3.7367262840270996, 4.058246612548828, 4.379766941070557, 4.701287269592285, 5.022808074951172, 5.3443284034729, 5.665848731994629, 5.987369537353516, 6.308889865875244, 6.630410194396973, 6.951930522918701, 7.27345085144043, 7.594971656799316, 7.916491985321045, 8.238012313842773, 8.55953311920166, 8.881053924560547, 9.202573776245117, 9.524094581604004, 9.845614433288574, 10.167135238647461, 10.488655090332031, 10.810175895690918, 11.131696701049805, 11.453216552734375, 11.774737358093262]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 11.0, 12.0, 16.0, 25.0, 23.0, 50.0, 72.0, 113.0, 171.0, 284.0, 417.0, 785.0, 1408.0, 2520.0, 5214.0, 10711.0, 22889.0, 51782.0, 124898.0, 331470.0, 902695.0, 1436223.0, 808525.0, 293911.0, 111810.0, 46490.0, 20726.0, 9949.0, 5024.0, 2524.0, 1424.0, 796.0, 474.0, 299.0, 169.0, 126.0, 78.0, 44.0, 37.0, 27.0, 14.0, 20.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-23.953125, -23.23681640625, -22.5205078125, -21.80419921875, -21.087890625, -20.37158203125, -19.6552734375, -18.93896484375, -18.22265625, -17.50634765625, -16.7900390625, -16.07373046875, -15.357421875, -14.64111328125, -13.9248046875, -13.20849609375, -12.4921875, -11.77587890625, -11.0595703125, -10.34326171875, -9.626953125, -8.91064453125, -8.1943359375, -7.47802734375, -6.76171875, -6.04541015625, -5.3291015625, -4.61279296875, -3.896484375, -3.18017578125, -2.4638671875, -1.74755859375, -1.03125, -0.31494140625, 0.4013671875, 1.11767578125, 1.833984375, 2.55029296875, 3.2666015625, 3.98291015625, 4.69921875, 5.41552734375, 6.1318359375, 6.84814453125, 7.564453125, 8.28076171875, 8.9970703125, 9.71337890625, 10.4296875, 11.14599609375, 11.8623046875, 12.57861328125, 13.294921875, 14.01123046875, 14.7275390625, 15.44384765625, 16.16015625, 16.87646484375, 17.5927734375, 18.30908203125, 19.025390625, 19.74169921875, 20.4580078125, 21.17431640625, 21.890625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 12.0, 18.0, 13.0, 23.0, 10.0, 27.0, 19.0, 33.0, 37.0, 39.0, 45.0, 37.0, 48.0, 55.0, 51.0, 59.0, 43.0, 47.0, 40.0, 46.0, 38.0, 39.0, 33.0, 30.0, 26.0, 22.0, 23.0, 15.0, 14.0, 8.0, 11.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.4146728515625, -7.134033203125, -6.8533935546875, -6.57275390625, -6.2921142578125, -6.011474609375, -5.7308349609375, -5.4501953125, -5.1695556640625, -4.888916015625, -4.6082763671875, -4.32763671875, -4.0469970703125, -3.766357421875, -3.4857177734375, -3.205078125, -2.9244384765625, -2.643798828125, -2.3631591796875, -2.08251953125, -1.8018798828125, -1.521240234375, -1.2406005859375, -0.9599609375, -0.6793212890625, -0.398681640625, -0.1180419921875, 0.16259765625, 0.4432373046875, 0.723876953125, 1.0045166015625, 1.28515625, 1.5657958984375, 1.846435546875, 2.1270751953125, 2.40771484375, 2.6883544921875, 2.968994140625, 3.2496337890625, 3.5302734375, 3.8109130859375, 4.091552734375, 4.3721923828125, 4.65283203125, 4.9334716796875, 5.214111328125, 5.4947509765625, 5.775390625, 6.0560302734375, 6.336669921875, 6.6173095703125, 6.89794921875, 7.1785888671875, 7.459228515625, 7.7398681640625, 8.0205078125, 8.3011474609375, 8.581787109375, 8.8624267578125, 9.14306640625, 9.4237060546875, 9.704345703125, 9.9849853515625, 10.265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 8.0, 15.0, 9.0, 11.0, 28.0, 37.0, 57.0, 84.0, 129.0, 183.0, 321.0, 526.0, 856.0, 1400.0, 2266.0, 4026.0, 6829.0, 12496.0, 22174.0, 41410.0, 78777.0, 152526.0, 294826.0, 557030.0, 893641.0, 906856.0, 575189.0, 306470.0, 156697.0, 82111.0, 43095.0, 23434.0, 12884.0, 7114.0, 4230.0, 2509.0, 1529.0, 923.0, 601.0, 339.0, 211.0, 120.0, 98.0, 63.0, 56.0, 30.0, 22.0, 14.0, 10.0, 2.0, 6.0, 2.0, 4.0, 4.0], "bins": [-18.609375, -18.078125, -17.546875, -17.015625, -16.484375, -15.953125, -15.421875, -14.890625, -14.359375, -13.828125, -13.296875, -12.765625, -12.234375, -11.703125, -11.171875, -10.640625, -10.109375, -9.578125, -9.046875, -8.515625, -7.984375, -7.453125, -6.921875, -6.390625, -5.859375, -5.328125, -4.796875, -4.265625, -3.734375, -3.203125, -2.671875, -2.140625, -1.609375, -1.078125, -0.546875, -0.015625, 0.515625, 1.046875, 1.578125, 2.109375, 2.640625, 3.171875, 3.703125, 4.234375, 4.765625, 5.296875, 5.828125, 6.359375, 6.890625, 7.421875, 7.953125, 8.484375, 9.015625, 9.546875, 10.078125, 10.609375, 11.140625, 11.671875, 12.203125, 12.734375, 13.265625, 13.796875, 14.328125, 14.859375, 15.390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 18.0, 14.0, 16.0, 34.0, 35.0, 71.0, 64.0, 104.0, 150.0, 164.0, 195.0, 274.0, 272.0, 351.0, 322.0, 342.0, 308.0, 259.0, 253.0, 203.0, 177.0, 123.0, 91.0, 67.0, 51.0, 34.0, 20.0, 18.0, 13.0, 5.0, 4.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7525634765625, -5.552001953125, -5.3514404296875, -5.15087890625, -4.9503173828125, -4.749755859375, -4.5491943359375, -4.3486328125, -4.1480712890625, -3.947509765625, -3.7469482421875, -3.54638671875, -3.3458251953125, -3.145263671875, -2.9447021484375, -2.744140625, -2.5435791015625, -2.343017578125, -2.1424560546875, -1.94189453125, -1.7413330078125, -1.540771484375, -1.3402099609375, -1.1396484375, -0.9390869140625, -0.738525390625, -0.5379638671875, -0.33740234375, -0.1368408203125, 0.063720703125, 0.2642822265625, 0.46484375, 0.6654052734375, 0.865966796875, 1.0665283203125, 1.26708984375, 1.4676513671875, 1.668212890625, 1.8687744140625, 2.0693359375, 2.2698974609375, 2.470458984375, 2.6710205078125, 2.87158203125, 3.0721435546875, 3.272705078125, 3.4732666015625, 3.673828125, 3.8743896484375, 4.074951171875, 4.2755126953125, 4.47607421875, 4.6766357421875, 4.877197265625, 5.0777587890625, 5.2783203125, 5.4788818359375, 5.679443359375, 5.8800048828125, 6.08056640625, 6.2811279296875, 6.481689453125, 6.6822509765625, 6.8828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 16.0, 15.0, 14.0, 26.0, 34.0, 43.0, 52.0, 71.0, 57.0, 71.0, 90.0, 86.0, 78.0, 67.0, 59.0, 45.0, 35.0, 30.0, 26.0, 17.0, 15.0, 9.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.007352828979492, -24.204038619995117, -23.400724411010742, -22.597408294677734, -21.79409408569336, -20.990779876708984, -20.18746566772461, -19.384151458740234, -18.58083724975586, -17.777523040771484, -16.97420883178711, -16.170894622802734, -15.367578506469727, -14.564264297485352, -13.760950088500977, -12.957635879516602, -12.154319763183594, -11.351005554199219, -10.547690391540527, -9.744376182556152, -8.941061019897461, -8.137746810913086, -7.334432601928711, -6.531117916107178, -5.7278032302856445, -4.924488544464111, -4.121173858642578, -3.317859649658203, -2.51454496383667, -1.7112302780151367, -0.9079160690307617, -0.10460138320922852, 0.6987133026123047, 1.5020278692245483, 2.305342435836792, 3.108656883239746, 3.9119715690612793, 4.7152862548828125, 5.5186004638671875, 6.321915149688721, 7.125229835510254, 7.928544521331787, 8.73185920715332, 9.535173416137695, 10.33848762512207, 11.141802787780762, 11.945116996765137, 12.748432159423828, 13.551746368408203, 14.355060577392578, 15.15837574005127, 15.961689949035645, 16.765005111694336, 17.56831932067871, 18.371633529663086, 19.17494773864746, 19.97826385498047, 20.781578063964844, 21.58489227294922, 22.388206481933594, 23.1915225982666, 23.994836807250977, 24.79815101623535, 25.601465225219727, 26.4047794342041]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 5.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 12.0, 18.0, 11.0, 18.0, 21.0, 23.0, 17.0, 23.0, 27.0, 33.0, 29.0, 41.0, 36.0, 37.0, 38.0, 36.0, 47.0, 46.0, 40.0, 29.0, 34.0, 39.0, 34.0, 34.0, 33.0, 26.0, 28.0, 22.0, 24.0, 14.0, 21.0, 16.0, 13.0, 8.0, 6.0, 7.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.131150245666504, -7.8515729904174805, -7.571995258331299, -7.292417526245117, -7.012840270996094, -6.73326301574707, -6.453685283660889, -6.174107551574707, -5.894530296325684, -5.61495304107666, -5.3353753089904785, -5.055797576904297, -4.776220321655273, -4.49664306640625, -4.217065334320068, -3.937487840652466, -3.6579103469848633, -3.3783328533172607, -3.098755359649658, -2.8191778659820557, -2.539600372314453, -2.2600228786468506, -1.980445384979248, -1.7008678913116455, -1.421290397644043, -1.1417129039764404, -0.8621354103088379, -0.5825579166412354, -0.3029804229736328, -0.023402929306030273, 0.25617456436157227, 0.5357520580291748, 0.8153285980224609, 1.0949060916900635, 1.374483585357666, 1.6540610790252686, 1.933638572692871, 2.2132160663604736, 2.492793560028076, 2.7723710536956787, 3.0519485473632812, 3.331526041030884, 3.6111035346984863, 3.890681028366089, 4.170258522033691, 4.449835777282715, 4.7294135093688965, 5.008991241455078, 5.288568496704102, 5.568145751953125, 5.847723484039307, 6.127301216125488, 6.406878471374512, 6.686455726623535, 6.966033458709717, 7.245611190795898, 7.525188446044922, 7.804765701293945, 8.084342956542969, 8.363921165466309, 8.643498420715332, 8.923075675964355, 9.202653884887695, 9.482231140136719, 9.761808395385742]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 16.0, 15.0, 25.0, 37.0, 66.0, 85.0, 136.0, 185.0, 298.0, 443.0, 734.0, 1094.0, 1830.0, 2947.0, 5176.0, 8993.0, 16064.0, 28659.0, 51849.0, 91063.0, 146598.0, 193830.0, 183685.0, 132459.0, 79369.0, 44749.0, 24849.0, 13913.0, 7709.0, 4474.0, 2701.0, 1610.0, 1045.0, 631.0, 410.0, 273.0, 166.0, 129.0, 83.0, 50.0, 36.0, 20.0, 17.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-11.4453125, -11.09716796875, -10.7490234375, -10.40087890625, -10.052734375, -9.70458984375, -9.3564453125, -9.00830078125, -8.66015625, -8.31201171875, -7.9638671875, -7.61572265625, -7.267578125, -6.91943359375, -6.5712890625, -6.22314453125, -5.875, -5.52685546875, -5.1787109375, -4.83056640625, -4.482421875, -4.13427734375, -3.7861328125, -3.43798828125, -3.08984375, -2.74169921875, -2.3935546875, -2.04541015625, -1.697265625, -1.34912109375, -1.0009765625, -0.65283203125, -0.3046875, 0.04345703125, 0.3916015625, 0.73974609375, 1.087890625, 1.43603515625, 1.7841796875, 2.13232421875, 2.48046875, 2.82861328125, 3.1767578125, 3.52490234375, 3.873046875, 4.22119140625, 4.5693359375, 4.91748046875, 5.265625, 5.61376953125, 5.9619140625, 6.31005859375, 6.658203125, 7.00634765625, 7.3544921875, 7.70263671875, 8.05078125, 8.39892578125, 8.7470703125, 9.09521484375, 9.443359375, 9.79150390625, 10.1396484375, 10.48779296875, 10.8359375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 7.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 15.0, 17.0, 18.0, 20.0, 30.0, 28.0, 45.0, 36.0, 39.0, 52.0, 38.0, 48.0, 46.0, 53.0, 45.0, 33.0, 42.0, 51.0, 42.0, 34.0, 33.0, 29.0, 24.0, 27.0, 25.0, 16.0, 20.0, 15.0, 5.0, 4.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.74853515625, -10.3876953125, -10.02685546875, -9.666015625, -9.30517578125, -8.9443359375, -8.58349609375, -8.22265625, -7.86181640625, -7.5009765625, -7.14013671875, -6.779296875, -6.41845703125, -6.0576171875, -5.69677734375, -5.3359375, -4.97509765625, -4.6142578125, -4.25341796875, -3.892578125, -3.53173828125, -3.1708984375, -2.81005859375, -2.44921875, -2.08837890625, -1.7275390625, -1.36669921875, -1.005859375, -0.64501953125, -0.2841796875, 0.07666015625, 0.4375, 0.79833984375, 1.1591796875, 1.52001953125, 1.880859375, 2.24169921875, 2.6025390625, 2.96337890625, 3.32421875, 3.68505859375, 4.0458984375, 4.40673828125, 4.767578125, 5.12841796875, 5.4892578125, 5.85009765625, 6.2109375, 6.57177734375, 6.9326171875, 7.29345703125, 7.654296875, 8.01513671875, 8.3759765625, 8.73681640625, 9.09765625, 9.45849609375, 9.8193359375, 10.18017578125, 10.541015625, 10.90185546875, 11.2626953125, 11.62353515625, 11.984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 5.0, 13.0, 17.0, 22.0, 34.0, 40.0, 71.0, 98.0, 150.0, 233.0, 329.0, 523.0, 770.0, 1208.0, 2249.0, 3675.0, 6694.0, 12547.0, 24503.0, 49178.0, 99288.0, 189977.0, 259609.0, 192228.0, 101399.0, 49804.0, 24625.0, 12881.0, 6754.0, 3843.0, 2170.0, 1291.0, 820.0, 492.0, 330.0, 224.0, 147.0, 92.0, 67.0, 41.0, 35.0, 19.0, 19.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.4375, -14.976806640625, -14.51611328125, -14.055419921875, -13.5947265625, -13.134033203125, -12.67333984375, -12.212646484375, -11.751953125, -11.291259765625, -10.83056640625, -10.369873046875, -9.9091796875, -9.448486328125, -8.98779296875, -8.527099609375, -8.06640625, -7.605712890625, -7.14501953125, -6.684326171875, -6.2236328125, -5.762939453125, -5.30224609375, -4.841552734375, -4.380859375, -3.920166015625, -3.45947265625, -2.998779296875, -2.5380859375, -2.077392578125, -1.61669921875, -1.156005859375, -0.6953125, -0.234619140625, 0.22607421875, 0.686767578125, 1.1474609375, 1.608154296875, 2.06884765625, 2.529541015625, 2.990234375, 3.450927734375, 3.91162109375, 4.372314453125, 4.8330078125, 5.293701171875, 5.75439453125, 6.215087890625, 6.67578125, 7.136474609375, 7.59716796875, 8.057861328125, 8.5185546875, 8.979248046875, 9.43994140625, 9.900634765625, 10.361328125, 10.822021484375, 11.28271484375, 11.743408203125, 12.2041015625, 12.664794921875, 13.12548828125, 13.586181640625, 14.046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 3.0, 8.0, 11.0, 8.0, 14.0, 8.0, 15.0, 20.0, 28.0, 35.0, 22.0, 28.0, 29.0, 31.0, 37.0, 43.0, 47.0, 43.0, 52.0, 48.0, 53.0, 44.0, 33.0, 40.0, 43.0, 38.0, 32.0, 28.0, 29.0, 28.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 10.0, 4.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-8.046875, -7.83538818359375, -7.6239013671875, -7.41241455078125, -7.200927734375, -6.98944091796875, -6.7779541015625, -6.56646728515625, -6.35498046875, -6.14349365234375, -5.9320068359375, -5.72052001953125, -5.509033203125, -5.29754638671875, -5.0860595703125, -4.87457275390625, -4.6630859375, -4.45159912109375, -4.2401123046875, -4.02862548828125, -3.817138671875, -3.60565185546875, -3.3941650390625, -3.18267822265625, -2.97119140625, -2.75970458984375, -2.5482177734375, -2.33673095703125, -2.125244140625, -1.91375732421875, -1.7022705078125, -1.49078369140625, -1.279296875, -1.06781005859375, -0.8563232421875, -0.64483642578125, -0.433349609375, -0.22186279296875, -0.0103759765625, 0.20111083984375, 0.41259765625, 0.62408447265625, 0.8355712890625, 1.04705810546875, 1.258544921875, 1.47003173828125, 1.6815185546875, 1.89300537109375, 2.1044921875, 2.31597900390625, 2.5274658203125, 2.73895263671875, 2.950439453125, 3.16192626953125, 3.3734130859375, 3.58489990234375, 3.79638671875, 4.00787353515625, 4.2193603515625, 4.43084716796875, 4.642333984375, 4.85382080078125, 5.0653076171875, 5.27679443359375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 9.0, 16.0, 14.0, 19.0, 31.0, 39.0, 64.0, 72.0, 129.0, 167.0, 235.0, 389.0, 581.0, 937.0, 1626.0, 3160.0, 7230.0, 20510.0, 70277.0, 269987.0, 451755.0, 156382.0, 40970.0, 13134.0, 4986.0, 2328.0, 1243.0, 739.0, 457.0, 347.0, 223.0, 135.0, 105.0, 67.0, 59.0, 32.0, 26.0, 18.0, 13.0, 12.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.4375, -13.0213623046875, -12.605224609375, -12.1890869140625, -11.77294921875, -11.3568115234375, -10.940673828125, -10.5245361328125, -10.1083984375, -9.6922607421875, -9.276123046875, -8.8599853515625, -8.44384765625, -8.0277099609375, -7.611572265625, -7.1954345703125, -6.779296875, -6.3631591796875, -5.947021484375, -5.5308837890625, -5.11474609375, -4.6986083984375, -4.282470703125, -3.8663330078125, -3.4501953125, -3.0340576171875, -2.617919921875, -2.2017822265625, -1.78564453125, -1.3695068359375, -0.953369140625, -0.5372314453125, -0.12109375, 0.2950439453125, 0.711181640625, 1.1273193359375, 1.54345703125, 1.9595947265625, 2.375732421875, 2.7918701171875, 3.2080078125, 3.6241455078125, 4.040283203125, 4.4564208984375, 4.87255859375, 5.2886962890625, 5.704833984375, 6.1209716796875, 6.537109375, 6.9532470703125, 7.369384765625, 7.7855224609375, 8.20166015625, 8.6177978515625, 9.033935546875, 9.4500732421875, 9.8662109375, 10.2823486328125, 10.698486328125, 11.1146240234375, 11.53076171875, 11.9468994140625, 12.363037109375, 12.7791748046875, 13.1953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 16.0, 12.0, 16.0, 20.0, 27.0, 37.0, 54.0, 70.0, 75.0, 84.0, 74.0, 77.0, 77.0, 65.0, 69.0, 57.0, 39.0, 36.0, 22.0, 20.0, 5.0, 12.0, 8.0, 9.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003781318664550781, -0.00036704540252685547, -0.0003559589385986328, -0.00034487247467041016, -0.0003337860107421875, -0.00032269954681396484, -0.0003116130828857422, -0.00030052661895751953, -0.0002894401550292969, -0.0002783536911010742, -0.00026726722717285156, -0.0002561807632446289, -0.00024509429931640625, -0.0002340078353881836, -0.00022292137145996094, -0.00021183490753173828, -0.00020074844360351562, -0.00018966197967529297, -0.0001785755157470703, -0.00016748905181884766, -0.000156402587890625, -0.00014531612396240234, -0.0001342296600341797, -0.00012314319610595703, -0.00011205673217773438, -0.00010097026824951172, -8.988380432128906e-05, -7.87973403930664e-05, -6.771087646484375e-05, -5.6624412536621094e-05, -4.553794860839844e-05, -3.445148468017578e-05, -2.3365020751953125e-05, -1.2278556823730469e-05, -1.1920928955078125e-06, 9.894371032714844e-06, 2.09808349609375e-05, 3.2067298889160156e-05, 4.315376281738281e-05, 5.424022674560547e-05, 6.532669067382812e-05, 7.641315460205078e-05, 8.749961853027344e-05, 9.85860824584961e-05, 0.00010967254638671875, 0.0001207590103149414, 0.00013184547424316406, 0.00014293193817138672, 0.00015401840209960938, 0.00016510486602783203, 0.0001761913299560547, 0.00018727779388427734, 0.0001983642578125, 0.00020945072174072266, 0.0002205371856689453, 0.00023162364959716797, 0.00024271011352539062, 0.0002537965774536133, 0.00026488304138183594, 0.0002759695053100586, 0.00028705596923828125, 0.0002981424331665039, 0.00030922889709472656, 0.0003203153610229492, 0.0003314018249511719]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 17.0, 14.0, 18.0, 24.0, 41.0, 46.0, 74.0, 96.0, 142.0, 191.0, 241.0, 385.0, 494.0, 774.0, 1179.0, 1901.0, 3252.0, 6626.0, 16370.0, 50743.0, 168097.0, 367367.0, 281941.0, 96675.0, 29704.0, 10269.0, 4659.0, 2524.0, 1528.0, 987.0, 640.0, 452.0, 315.0, 217.0, 151.0, 98.0, 87.0, 53.0, 46.0, 39.0, 20.0, 13.0, 15.0, 8.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.125, -10.7955322265625, -10.466064453125, -10.1365966796875, -9.80712890625, -9.4776611328125, -9.148193359375, -8.8187255859375, -8.4892578125, -8.1597900390625, -7.830322265625, -7.5008544921875, -7.17138671875, -6.8419189453125, -6.512451171875, -6.1829833984375, -5.853515625, -5.5240478515625, -5.194580078125, -4.8651123046875, -4.53564453125, -4.2061767578125, -3.876708984375, -3.5472412109375, -3.2177734375, -2.8883056640625, -2.558837890625, -2.2293701171875, -1.89990234375, -1.5704345703125, -1.240966796875, -0.9114990234375, -0.58203125, -0.2525634765625, 0.076904296875, 0.4063720703125, 0.73583984375, 1.0653076171875, 1.394775390625, 1.7242431640625, 2.0537109375, 2.3831787109375, 2.712646484375, 3.0421142578125, 3.37158203125, 3.7010498046875, 4.030517578125, 4.3599853515625, 4.689453125, 5.0189208984375, 5.348388671875, 5.6778564453125, 6.00732421875, 6.3367919921875, 6.666259765625, 6.9957275390625, 7.3251953125, 7.6546630859375, 7.984130859375, 8.3135986328125, 8.64306640625, 8.9725341796875, 9.302001953125, 9.6314697265625, 9.9609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 19.0, 32.0, 31.0, 37.0, 52.0, 62.0, 62.0, 74.0, 85.0, 83.0, 83.0, 79.0, 59.0, 63.0, 69.0, 24.0, 21.0, 20.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.171875, -2.101959228515625, -2.03204345703125, -1.962127685546875, -1.8922119140625, -1.822296142578125, -1.75238037109375, -1.682464599609375, -1.612548828125, -1.542633056640625, -1.47271728515625, -1.402801513671875, -1.3328857421875, -1.262969970703125, -1.19305419921875, -1.123138427734375, -1.05322265625, -0.983306884765625, -0.91339111328125, -0.843475341796875, -0.7735595703125, -0.703643798828125, -0.63372802734375, -0.563812255859375, -0.493896484375, -0.423980712890625, -0.35406494140625, -0.284149169921875, -0.2142333984375, -0.144317626953125, -0.07440185546875, -0.004486083984375, 0.0654296875, 0.135345458984375, 0.20526123046875, 0.275177001953125, 0.3450927734375, 0.415008544921875, 0.48492431640625, 0.554840087890625, 0.624755859375, 0.694671630859375, 0.76458740234375, 0.834503173828125, 0.9044189453125, 0.974334716796875, 1.04425048828125, 1.114166259765625, 1.18408203125, 1.253997802734375, 1.32391357421875, 1.393829345703125, 1.4637451171875, 1.533660888671875, 1.60357666015625, 1.673492431640625, 1.743408203125, 1.813323974609375, 1.88323974609375, 1.953155517578125, 2.0230712890625, 2.092987060546875, 2.16290283203125, 2.232818603515625, 2.302734375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 8.0, 7.0, 11.0, 18.0, 13.0, 24.0, 38.0, 52.0, 45.0, 65.0, 73.0, 74.0, 67.0, 95.0, 81.0, 66.0, 51.0, 50.0, 37.0, 29.0, 17.0, 20.0, 11.0, 10.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.588699340820312, -22.803377151489258, -22.018054962158203, -21.23273468017578, -20.447412490844727, -19.662090301513672, -18.87677001953125, -18.091447830200195, -17.30612564086914, -16.520803451538086, -15.735482215881348, -14.95016098022461, -14.164838790893555, -13.3795166015625, -12.594195365905762, -11.808874130249023, -11.023551940917969, -10.238229751586914, -9.452908515930176, -8.667587280273438, -7.882265090942383, -7.096943378448486, -6.31162166595459, -5.526299953460693, -4.740978240966797, -3.9556565284729004, -3.170334815979004, -2.3850131034851074, -1.599691390991211, -0.8143696784973145, -0.02904796600341797, 0.7562737464904785, 1.5415935516357422, 2.3269152641296387, 3.112236976623535, 3.8975586891174316, 4.682880401611328, 5.468202114105225, 6.253523826599121, 7.038845539093018, 7.824167251586914, 8.609489440917969, 9.394810676574707, 10.180131912231445, 10.9654541015625, 11.750776290893555, 12.536097526550293, 13.321418762207031, 14.106740951538086, 14.89206314086914, 15.677384376525879, 16.462705612182617, 17.248027801513672, 18.033349990844727, 18.81867218017578, 19.603992462158203, 20.389314651489258, 21.174636840820312, 21.959957122802734, 22.74527931213379, 23.530601501464844, 24.3159236907959, 25.101245880126953, 25.886566162109375, 26.67188835144043]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 11.0, 11.0, 10.0, 15.0, 21.0, 16.0, 26.0, 22.0, 16.0, 21.0, 31.0, 39.0, 28.0, 32.0, 36.0, 42.0, 48.0, 44.0, 43.0, 35.0, 28.0, 35.0, 33.0, 45.0, 38.0, 28.0, 27.0, 26.0, 23.0, 28.0, 13.0, 25.0, 14.0, 10.0, 16.0, 7.0, 3.0, 7.0, 12.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.110013008117676, -7.8352484703063965, -7.560483932495117, -7.285719394683838, -7.010954856872559, -6.736190319061279, -6.46142578125, -6.186661243438721, -5.911896705627441, -5.637132167816162, -5.362367630004883, -5.0876030921936035, -4.812838554382324, -4.538074016571045, -4.263309478759766, -3.9885449409484863, -3.713780403137207, -3.4390158653259277, -3.1642513275146484, -2.889486789703369, -2.61472225189209, -2.3399577140808105, -2.0651931762695312, -1.790428638458252, -1.5156641006469727, -1.2408995628356934, -0.9661350250244141, -0.6913704872131348, -0.41660594940185547, -0.14184141159057617, 0.13292312622070312, 0.4076876640319824, 0.6824531555175781, 0.9572176933288574, 1.2319822311401367, 1.506746768951416, 1.7815113067626953, 2.0562758445739746, 2.331040382385254, 2.605804920196533, 2.8805694580078125, 3.155333995819092, 3.430098533630371, 3.7048630714416504, 3.9796276092529297, 4.254392147064209, 4.529156684875488, 4.803921222686768, 5.078685760498047, 5.353450298309326, 5.6282148361206055, 5.902979373931885, 6.177743911743164, 6.452508449554443, 6.727272987365723, 7.002037525177002, 7.276802062988281, 7.5515666007995605, 7.82633113861084, 8.101095199584961, 8.375860214233398, 8.650625228881836, 8.925389289855957, 9.200153350830078, 9.474918365478516]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 15.0, 19.0, 33.0, 37.0, 73.0, 111.0, 131.0, 224.0, 384.0, 580.0, 983.0, 1653.0, 2765.0, 4598.0, 7844.0, 13847.0, 23744.0, 39975.0, 66761.0, 101297.0, 137819.0, 160017.0, 152763.0, 121325.0, 83439.0, 52792.0, 31319.0, 18258.0, 10496.0, 6038.0, 3546.0, 2153.0, 1324.0, 822.0, 523.0, 311.0, 179.0, 110.0, 85.0, 57.0, 26.0, 21.0, 20.0, 14.0, 4.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.1221923828125, -11.752197265625, -11.3822021484375, -11.01220703125, -10.6422119140625, -10.272216796875, -9.9022216796875, -9.5322265625, -9.1622314453125, -8.792236328125, -8.4222412109375, -8.05224609375, -7.6822509765625, -7.312255859375, -6.9422607421875, -6.572265625, -6.2022705078125, -5.832275390625, -5.4622802734375, -5.09228515625, -4.7222900390625, -4.352294921875, -3.9822998046875, -3.6123046875, -3.2423095703125, -2.872314453125, -2.5023193359375, -2.13232421875, -1.7623291015625, -1.392333984375, -1.0223388671875, -0.65234375, -0.2823486328125, 0.087646484375, 0.4576416015625, 0.82763671875, 1.1976318359375, 1.567626953125, 1.9376220703125, 2.3076171875, 2.6776123046875, 3.047607421875, 3.4176025390625, 3.78759765625, 4.1575927734375, 4.527587890625, 4.8975830078125, 5.267578125, 5.6375732421875, 6.007568359375, 6.3775634765625, 6.74755859375, 7.1175537109375, 7.487548828125, 7.8575439453125, 8.2275390625, 8.5975341796875, 8.967529296875, 9.3375244140625, 9.70751953125, 10.0775146484375, 10.447509765625, 10.8175048828125, 11.1875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 2.0, 10.0, 10.0, 15.0, 28.0, 23.0, 25.0, 27.0, 40.0, 44.0, 48.0, 49.0, 57.0, 42.0, 58.0, 54.0, 49.0, 56.0, 37.0, 40.0, 32.0, 44.0, 36.0, 37.0, 29.0, 19.0, 21.0, 11.0, 13.0, 2.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.0234375, -12.6182861328125, -12.213134765625, -11.8079833984375, -11.40283203125, -10.9976806640625, -10.592529296875, -10.1873779296875, -9.7822265625, -9.3770751953125, -8.971923828125, -8.5667724609375, -8.16162109375, -7.7564697265625, -7.351318359375, -6.9461669921875, -6.541015625, -6.1358642578125, -5.730712890625, -5.3255615234375, -4.92041015625, -4.5152587890625, -4.110107421875, -3.7049560546875, -3.2998046875, -2.8946533203125, -2.489501953125, -2.0843505859375, -1.67919921875, -1.2740478515625, -0.868896484375, -0.4637451171875, -0.05859375, 0.3465576171875, 0.751708984375, 1.1568603515625, 1.56201171875, 1.9671630859375, 2.372314453125, 2.7774658203125, 3.1826171875, 3.5877685546875, 3.992919921875, 4.3980712890625, 4.80322265625, 5.2083740234375, 5.613525390625, 6.0186767578125, 6.423828125, 6.8289794921875, 7.234130859375, 7.6392822265625, 8.04443359375, 8.4495849609375, 8.854736328125, 9.2598876953125, 9.6650390625, 10.0701904296875, 10.475341796875, 10.8804931640625, 11.28564453125, 11.6907958984375, 12.095947265625, 12.5010986328125, 12.90625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 12.0, 24.0, 25.0, 38.0, 52.0, 77.0, 128.0, 181.0, 233.0, 386.0, 568.0, 888.0, 1432.0, 2244.0, 3577.0, 5687.0, 9287.0, 14842.0, 23793.0, 37284.0, 57228.0, 83603.0, 113339.0, 135869.0, 140900.0, 125851.0, 97651.0, 68953.0, 45581.0, 29354.0, 18476.0, 11506.0, 7128.0, 4450.0, 2873.0, 1736.0, 1082.0, 804.0, 473.0, 313.0, 203.0, 135.0, 93.0, 61.0, 48.0, 35.0, 15.0, 18.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1953125, -9.868896484375, -9.54248046875, -9.216064453125, -8.8896484375, -8.563232421875, -8.23681640625, -7.910400390625, -7.583984375, -7.257568359375, -6.93115234375, -6.604736328125, -6.2783203125, -5.951904296875, -5.62548828125, -5.299072265625, -4.97265625, -4.646240234375, -4.31982421875, -3.993408203125, -3.6669921875, -3.340576171875, -3.01416015625, -2.687744140625, -2.361328125, -2.034912109375, -1.70849609375, -1.382080078125, -1.0556640625, -0.729248046875, -0.40283203125, -0.076416015625, 0.25, 0.576416015625, 0.90283203125, 1.229248046875, 1.5556640625, 1.882080078125, 2.20849609375, 2.534912109375, 2.861328125, 3.187744140625, 3.51416015625, 3.840576171875, 4.1669921875, 4.493408203125, 4.81982421875, 5.146240234375, 5.47265625, 5.799072265625, 6.12548828125, 6.451904296875, 6.7783203125, 7.104736328125, 7.43115234375, 7.757568359375, 8.083984375, 8.410400390625, 8.73681640625, 9.063232421875, 9.3896484375, 9.716064453125, 10.04248046875, 10.368896484375, 10.6953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 11.0, 17.0, 15.0, 15.0, 12.0, 25.0, 30.0, 25.0, 17.0, 41.0, 34.0, 34.0, 31.0, 44.0, 36.0, 37.0, 50.0, 52.0, 45.0, 35.0, 38.0, 35.0, 32.0, 32.0, 30.0, 23.0, 34.0, 27.0, 30.0, 19.0, 8.0, 7.0, 12.0, 9.0, 12.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9434814453125, -5.746337890625, -5.5491943359375, -5.35205078125, -5.1549072265625, -4.957763671875, -4.7606201171875, -4.5634765625, -4.3663330078125, -4.169189453125, -3.9720458984375, -3.77490234375, -3.5777587890625, -3.380615234375, -3.1834716796875, -2.986328125, -2.7891845703125, -2.592041015625, -2.3948974609375, -2.19775390625, -2.0006103515625, -1.803466796875, -1.6063232421875, -1.4091796875, -1.2120361328125, -1.014892578125, -0.8177490234375, -0.62060546875, -0.4234619140625, -0.226318359375, -0.0291748046875, 0.16796875, 0.3651123046875, 0.562255859375, 0.7593994140625, 0.95654296875, 1.1536865234375, 1.350830078125, 1.5479736328125, 1.7451171875, 1.9422607421875, 2.139404296875, 2.3365478515625, 2.53369140625, 2.7308349609375, 2.927978515625, 3.1251220703125, 3.322265625, 3.5194091796875, 3.716552734375, 3.9136962890625, 4.11083984375, 4.3079833984375, 4.505126953125, 4.7022705078125, 4.8994140625, 5.0965576171875, 5.293701171875, 5.4908447265625, 5.68798828125, 5.8851318359375, 6.082275390625, 6.2794189453125, 6.4765625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 22.0, 38.0, 67.0, 99.0, 114.0, 194.0, 298.0, 434.0, 687.0, 1191.0, 1947.0, 3256.0, 5255.0, 9074.0, 15267.0, 25542.0, 43012.0, 70742.0, 107777.0, 148180.0, 168641.0, 151307.0, 111548.0, 72578.0, 45162.0, 26746.0, 16000.0, 9287.0, 5417.0, 3335.0, 2074.0, 1172.0, 777.0, 470.0, 258.0, 177.0, 145.0, 69.0, 46.0, 32.0, 22.0, 25.0, 15.0, 12.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.3125, -5.14923095703125, -4.9859619140625, -4.82269287109375, -4.659423828125, -4.49615478515625, -4.3328857421875, -4.16961669921875, -4.00634765625, -3.84307861328125, -3.6798095703125, -3.51654052734375, -3.353271484375, -3.19000244140625, -3.0267333984375, -2.86346435546875, -2.7001953125, -2.53692626953125, -2.3736572265625, -2.21038818359375, -2.047119140625, -1.88385009765625, -1.7205810546875, -1.55731201171875, -1.39404296875, -1.23077392578125, -1.0675048828125, -0.90423583984375, -0.740966796875, -0.57769775390625, -0.4144287109375, -0.25115966796875, -0.087890625, 0.07537841796875, 0.2386474609375, 0.40191650390625, 0.565185546875, 0.72845458984375, 0.8917236328125, 1.05499267578125, 1.21826171875, 1.38153076171875, 1.5447998046875, 1.70806884765625, 1.871337890625, 2.03460693359375, 2.1978759765625, 2.36114501953125, 2.5244140625, 2.68768310546875, 2.8509521484375, 3.01422119140625, 3.177490234375, 3.34075927734375, 3.5040283203125, 3.66729736328125, 3.83056640625, 3.99383544921875, 4.1571044921875, 4.32037353515625, 4.483642578125, 4.64691162109375, 4.8101806640625, 4.97344970703125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 9.0, 7.0, 4.0, 23.0, 21.0, 19.0, 30.0, 36.0, 44.0, 53.0, 56.0, 76.0, 57.0, 71.0, 97.0, 62.0, 60.0, 57.0, 43.0, 37.0, 34.0, 25.0, 14.0, 20.0, 9.0, 10.0, 7.0, 8.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006604194641113281, -0.0006402879953384399, -0.0006201565265655518, -0.0006000250577926636, -0.0005798935890197754, -0.0005597621202468872, -0.000539630651473999, -0.0005194991827011108, -0.0004993677139282227, -0.00047923624515533447, -0.0004591047763824463, -0.0004389733076095581, -0.0004188418388366699, -0.00039871037006378174, -0.00037857890129089355, -0.00035844743251800537, -0.0003383159637451172, -0.000318184494972229, -0.0002980530261993408, -0.00027792155742645264, -0.00025779008865356445, -0.00023765861988067627, -0.00021752715110778809, -0.0001973956823348999, -0.00017726421356201172, -0.00015713274478912354, -0.00013700127601623535, -0.00011686980724334717, -9.673833847045898e-05, -7.66068696975708e-05, -5.647540092468262e-05, -3.6343932151794434e-05, -1.621246337890625e-05, 3.919005393981934e-06, 2.4050474166870117e-05, 4.41819429397583e-05, 6.431341171264648e-05, 8.444488048553467e-05, 0.00010457634925842285, 0.00012470781803131104, 0.00014483928680419922, 0.0001649707555770874, 0.00018510222434997559, 0.00020523369312286377, 0.00022536516189575195, 0.00024549663066864014, 0.0002656280994415283, 0.0002857595682144165, 0.0003058910369873047, 0.00032602250576019287, 0.00034615397453308105, 0.00036628544330596924, 0.0003864169120788574, 0.0004065483808517456, 0.0004266798496246338, 0.00044681131839752197, 0.00046694278717041016, 0.00048707425594329834, 0.0005072057247161865, 0.0005273371934890747, 0.0005474686622619629, 0.0005676001310348511, 0.0005877315998077393, 0.0006078630685806274, 0.0006279945373535156]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 5.0, 12.0, 17.0, 23.0, 39.0, 65.0, 103.0, 146.0, 220.0, 291.0, 505.0, 752.0, 1237.0, 1900.0, 2871.0, 4689.0, 7381.0, 11864.0, 19064.0, 30574.0, 48749.0, 74657.0, 108463.0, 140144.0, 154320.0, 137424.0, 105297.0, 72148.0, 47053.0, 29239.0, 18348.0, 11282.0, 7231.0, 4439.0, 2866.0, 1821.0, 1135.0, 725.0, 505.0, 341.0, 211.0, 147.0, 77.0, 63.0, 36.0, 23.0, 17.0, 11.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-4.84375, -4.69451904296875, -4.5452880859375, -4.39605712890625, -4.246826171875, -4.09759521484375, -3.9483642578125, -3.79913330078125, -3.64990234375, -3.50067138671875, -3.3514404296875, -3.20220947265625, -3.052978515625, -2.90374755859375, -2.7545166015625, -2.60528564453125, -2.4560546875, -2.30682373046875, -2.1575927734375, -2.00836181640625, -1.859130859375, -1.70989990234375, -1.5606689453125, -1.41143798828125, -1.26220703125, -1.11297607421875, -0.9637451171875, -0.81451416015625, -0.665283203125, -0.51605224609375, -0.3668212890625, -0.21759033203125, -0.068359375, 0.08087158203125, 0.2301025390625, 0.37933349609375, 0.528564453125, 0.67779541015625, 0.8270263671875, 0.97625732421875, 1.12548828125, 1.27471923828125, 1.4239501953125, 1.57318115234375, 1.722412109375, 1.87164306640625, 2.0208740234375, 2.17010498046875, 2.3193359375, 2.46856689453125, 2.6177978515625, 2.76702880859375, 2.916259765625, 3.06549072265625, 3.2147216796875, 3.36395263671875, 3.51318359375, 3.66241455078125, 3.8116455078125, 3.96087646484375, 4.110107421875, 4.25933837890625, 4.4085693359375, 4.55780029296875, 4.70703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 7.0, 12.0, 19.0, 24.0, 28.0, 34.0, 46.0, 64.0, 52.0, 62.0, 66.0, 75.0, 67.0, 56.0, 62.0, 48.0, 54.0, 55.0, 32.0, 20.0, 17.0, 19.0, 10.0, 10.0, 12.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7018890380859375, -1.639129638671875, -1.5763702392578125, -1.51361083984375, -1.4508514404296875, -1.388092041015625, -1.3253326416015625, -1.2625732421875, -1.1998138427734375, -1.137054443359375, -1.0742950439453125, -1.01153564453125, -0.9487762451171875, -0.886016845703125, -0.8232574462890625, -0.760498046875, -0.6977386474609375, -0.634979248046875, -0.5722198486328125, -0.50946044921875, -0.4467010498046875, -0.383941650390625, -0.3211822509765625, -0.2584228515625, -0.1956634521484375, -0.132904052734375, -0.0701446533203125, -0.00738525390625, 0.0553741455078125, 0.118133544921875, 0.1808929443359375, 0.24365234375, 0.3064117431640625, 0.369171142578125, 0.4319305419921875, 0.49468994140625, 0.5574493408203125, 0.620208740234375, 0.6829681396484375, 0.7457275390625, 0.8084869384765625, 0.871246337890625, 0.9340057373046875, 0.99676513671875, 1.0595245361328125, 1.122283935546875, 1.1850433349609375, 1.247802734375, 1.3105621337890625, 1.373321533203125, 1.4360809326171875, 1.49884033203125, 1.5615997314453125, 1.624359130859375, 1.6871185302734375, 1.7498779296875, 1.8126373291015625, 1.875396728515625, 1.9381561279296875, 2.00091552734375, 2.0636749267578125, 2.126434326171875, 2.1891937255859375, 2.251953125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 11.0, 11.0, 9.0, 27.0, 23.0, 41.0, 51.0, 62.0, 48.0, 68.0, 84.0, 70.0, 75.0, 73.0, 70.0, 57.0, 40.0, 35.0, 19.0, 28.0, 13.0, 18.0, 10.0, 6.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.393449783325195, -21.668926239013672, -20.94440269470215, -20.219879150390625, -19.49535369873047, -18.770830154418945, -18.046306610107422, -17.3217830657959, -16.597259521484375, -15.872735977172852, -15.148212432861328, -14.423687934875488, -13.699164390563965, -12.974640846252441, -12.250116348266602, -11.525592803955078, -10.801069259643555, -10.076545715332031, -9.352022171020508, -8.627497673034668, -7.9029741287231445, -7.178450584411621, -6.4539265632629395, -5.729402542114258, -5.004878997802734, -4.280355453491211, -3.5558314323425293, -2.8313076496124268, -2.106783866882324, -1.3822600841522217, -0.6577363014221191, 0.0667877197265625, 0.7913093566894531, 1.5158331394195557, 2.240356922149658, 2.9648807048797607, 3.6894044876098633, 4.413928031921387, 5.138452053070068, 5.86297607421875, 6.587499618530273, 7.312023162841797, 8.03654670715332, 8.76107120513916, 9.485594749450684, 10.210118293762207, 10.934642791748047, 11.65916633605957, 12.383689880371094, 13.108213424682617, 13.83273696899414, 14.55726146697998, 15.281785011291504, 16.006309509277344, 16.730833053588867, 17.45535659790039, 18.179880142211914, 18.904403686523438, 19.62892723083496, 20.353450775146484, 21.07797622680664, 21.802499771118164, 22.527023315429688, 23.25154685974121, 23.976070404052734]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 5.0, 5.0, 14.0, 17.0, 13.0, 14.0, 16.0, 20.0, 30.0, 24.0, 33.0, 31.0, 26.0, 43.0, 38.0, 38.0, 42.0, 52.0, 50.0, 44.0, 43.0, 54.0, 32.0, 40.0, 38.0, 34.0, 30.0, 20.0, 25.0, 24.0, 15.0, 23.0, 15.0, 9.0, 5.0, 13.0, 3.0, 8.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620841979980469, -9.307011604309082, -8.993182182312012, -8.679351806640625, -8.365522384643555, -8.051692008972168, -7.7378621101379395, -7.424032211303711, -7.110201835632324, -6.796371936798096, -6.482542037963867, -6.1687116622924805, -5.854881763458252, -5.541051864624023, -5.227221965789795, -4.913392066955566, -4.599562168121338, -4.285732269287109, -3.9719021320343018, -3.6580722332000732, -3.3442420959472656, -3.030412197113037, -2.7165822982788086, -2.402752161026001, -2.0889222621917725, -1.7750922441482544, -1.4612622261047363, -1.1474323272705078, -0.8336023092269897, -0.5197722911834717, -0.20594239234924316, 0.10788774490356445, 0.42171764373779297, 0.735547661781311, 1.049377679824829, 1.3632075786590576, 1.6770375967025757, 1.9908676147460938, 2.3046975135803223, 2.61852765083313, 2.9323575496673584, 3.246187448501587, 3.5600175857543945, 3.873847484588623, 4.187677383422852, 4.501507759094238, 4.815337181091309, 5.129167556762695, 5.442997455596924, 5.756827354431152, 6.070657253265381, 6.384487152099609, 6.698317527770996, 7.012147426605225, 7.325977325439453, 7.63980770111084, 7.95363712310791, 8.267467498779297, 8.581296920776367, 8.895127296447754, 9.208956718444824, 9.522787094116211, 9.836616516113281, 10.150446891784668, 10.464277267456055]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 12.0, 16.0, 36.0, 41.0, 41.0, 82.0, 119.0, 181.0, 329.0, 454.0, 760.0, 1269.0, 2154.0, 3628.0, 6808.0, 12233.0, 23108.0, 44323.0, 89697.0, 193065.0, 433588.0, 920256.0, 1160130.0, 707608.0, 313208.0, 140803.0, 67147.0, 33407.0, 17384.0, 9324.0, 5243.0, 2997.0, 1785.0, 1110.0, 671.0, 403.0, 288.0, 180.0, 119.0, 89.0, 51.0, 38.0, 30.0, 22.0, 9.0, 8.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-17.5, -16.958251953125, -16.41650390625, -15.874755859375, -15.3330078125, -14.791259765625, -14.24951171875, -13.707763671875, -13.166015625, -12.624267578125, -12.08251953125, -11.540771484375, -10.9990234375, -10.457275390625, -9.91552734375, -9.373779296875, -8.83203125, -8.290283203125, -7.74853515625, -7.206787109375, -6.6650390625, -6.123291015625, -5.58154296875, -5.039794921875, -4.498046875, -3.956298828125, -3.41455078125, -2.872802734375, -2.3310546875, -1.789306640625, -1.24755859375, -0.705810546875, -0.1640625, 0.377685546875, 0.91943359375, 1.461181640625, 2.0029296875, 2.544677734375, 3.08642578125, 3.628173828125, 4.169921875, 4.711669921875, 5.25341796875, 5.795166015625, 6.3369140625, 6.878662109375, 7.42041015625, 7.962158203125, 8.50390625, 9.045654296875, 9.58740234375, 10.129150390625, 10.6708984375, 11.212646484375, 11.75439453125, 12.296142578125, 12.837890625, 13.379638671875, 13.92138671875, 14.463134765625, 15.0048828125, 15.546630859375, 16.08837890625, 16.630126953125, 17.171875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 15.0, 11.0, 20.0, 21.0, 16.0, 26.0, 37.0, 28.0, 34.0, 38.0, 45.0, 51.0, 39.0, 54.0, 41.0, 50.0, 49.0, 52.0, 50.0, 47.0, 28.0, 33.0, 26.0, 31.0, 17.0, 24.0, 18.0, 15.0, 23.0, 6.0, 9.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.31622314453125, -8.0621337890625, -7.80804443359375, -7.553955078125, -7.29986572265625, -7.0457763671875, -6.79168701171875, -6.53759765625, -6.28350830078125, -6.0294189453125, -5.77532958984375, -5.521240234375, -5.26715087890625, -5.0130615234375, -4.75897216796875, -4.5048828125, -4.25079345703125, -3.9967041015625, -3.74261474609375, -3.488525390625, -3.23443603515625, -2.9803466796875, -2.72625732421875, -2.47216796875, -2.21807861328125, -1.9639892578125, -1.70989990234375, -1.455810546875, -1.20172119140625, -0.9476318359375, -0.69354248046875, -0.439453125, -0.18536376953125, 0.0687255859375, 0.32281494140625, 0.576904296875, 0.83099365234375, 1.0850830078125, 1.33917236328125, 1.59326171875, 1.84735107421875, 2.1014404296875, 2.35552978515625, 2.609619140625, 2.86370849609375, 3.1177978515625, 3.37188720703125, 3.6259765625, 3.88006591796875, 4.1341552734375, 4.38824462890625, 4.642333984375, 4.89642333984375, 5.1505126953125, 5.40460205078125, 5.65869140625, 5.91278076171875, 6.1668701171875, 6.42095947265625, 6.675048828125, 6.92913818359375, 7.1832275390625, 7.43731689453125, 7.69140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 15.0, 10.0, 18.0, 30.0, 38.0, 59.0, 101.0, 151.0, 191.0, 324.0, 529.0, 782.0, 1214.0, 1908.0, 3068.0, 5120.0, 8803.0, 15161.0, 26720.0, 48072.0, 88251.0, 163854.0, 303449.0, 546089.0, 846154.0, 864364.0, 569016.0, 318537.0, 171116.0, 92318.0, 50896.0, 28279.0, 15863.0, 9467.0, 5469.0, 3299.0, 1935.0, 1324.0, 792.0, 520.0, 343.0, 216.0, 119.0, 107.0, 81.0, 32.0, 29.0, 14.0, 14.0, 8.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.453125, -14.9708251953125, -14.488525390625, -14.0062255859375, -13.52392578125, -13.0416259765625, -12.559326171875, -12.0770263671875, -11.5947265625, -11.1124267578125, -10.630126953125, -10.1478271484375, -9.66552734375, -9.1832275390625, -8.700927734375, -8.2186279296875, -7.736328125, -7.2540283203125, -6.771728515625, -6.2894287109375, -5.80712890625, -5.3248291015625, -4.842529296875, -4.3602294921875, -3.8779296875, -3.3956298828125, -2.913330078125, -2.4310302734375, -1.94873046875, -1.4664306640625, -0.984130859375, -0.5018310546875, -0.01953125, 0.4627685546875, 0.945068359375, 1.4273681640625, 1.90966796875, 2.3919677734375, 2.874267578125, 3.3565673828125, 3.8388671875, 4.3211669921875, 4.803466796875, 5.2857666015625, 5.76806640625, 6.2503662109375, 6.732666015625, 7.2149658203125, 7.697265625, 8.1795654296875, 8.661865234375, 9.1441650390625, 9.62646484375, 10.1087646484375, 10.591064453125, 11.0733642578125, 11.5556640625, 12.0379638671875, 12.520263671875, 13.0025634765625, 13.48486328125, 13.9671630859375, 14.449462890625, 14.9317626953125, 15.4140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 10.0, 11.0, 23.0, 22.0, 23.0, 26.0, 31.0, 40.0, 60.0, 101.0, 105.0, 125.0, 150.0, 203.0, 244.0, 260.0, 281.0, 287.0, 295.0, 267.0, 289.0, 233.0, 195.0, 156.0, 145.0, 112.0, 70.0, 75.0, 54.0, 53.0, 34.0, 23.0, 14.0, 13.0, 13.0, 8.0, 3.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.875, -4.7135009765625, -4.552001953125, -4.3905029296875, -4.22900390625, -4.0675048828125, -3.906005859375, -3.7445068359375, -3.5830078125, -3.4215087890625, -3.260009765625, -3.0985107421875, -2.93701171875, -2.7755126953125, -2.614013671875, -2.4525146484375, -2.291015625, -2.1295166015625, -1.968017578125, -1.8065185546875, -1.64501953125, -1.4835205078125, -1.322021484375, -1.1605224609375, -0.9990234375, -0.8375244140625, -0.676025390625, -0.5145263671875, -0.35302734375, -0.1915283203125, -0.030029296875, 0.1314697265625, 0.29296875, 0.4544677734375, 0.615966796875, 0.7774658203125, 0.93896484375, 1.1004638671875, 1.261962890625, 1.4234619140625, 1.5849609375, 1.7464599609375, 1.907958984375, 2.0694580078125, 2.23095703125, 2.3924560546875, 2.553955078125, 2.7154541015625, 2.876953125, 3.0384521484375, 3.199951171875, 3.3614501953125, 3.52294921875, 3.6844482421875, 3.845947265625, 4.0074462890625, 4.1689453125, 4.3304443359375, 4.491943359375, 4.6534423828125, 4.81494140625, 4.9764404296875, 5.137939453125, 5.2994384765625, 5.4609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 11.0, 5.0, 11.0, 15.0, 23.0, 22.0, 29.0, 39.0, 45.0, 60.0, 71.0, 75.0, 82.0, 71.0, 70.0, 70.0, 57.0, 53.0, 30.0, 26.0, 33.0, 21.0, 16.0, 12.0, 10.0, 8.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.947229385375977, -22.237016677856445, -21.526803970336914, -20.816591262817383, -20.10637855529785, -19.39616584777832, -18.685951232910156, -17.975738525390625, -17.265525817871094, -16.555313110351562, -15.845100402832031, -15.1348876953125, -14.424674987792969, -13.714462280273438, -13.00424861907959, -12.294035911560059, -11.583824157714844, -10.873611450195312, -10.163398742675781, -9.45318603515625, -8.742973327636719, -8.032760620117188, -7.32254695892334, -6.612334251403809, -5.902121543884277, -5.191908836364746, -4.481696128845215, -3.7714829444885254, -3.061270236968994, -2.351057529449463, -1.6408443450927734, -0.9306316375732422, -0.22041893005371094, 0.48979389667510986, 1.2000067234039307, 1.910219669342041, 2.6204323768615723, 3.3306450843811035, 4.040858268737793, 4.751070976257324, 5.4612836837768555, 6.171496391296387, 6.881709098815918, 7.591922283172607, 8.302135467529297, 9.012348175048828, 9.72256088256836, 10.43277359008789, 11.142986297607422, 11.853199005126953, 12.563411712646484, 13.273624420166016, 13.983837127685547, 14.694049835205078, 15.404263496398926, 16.11447525024414, 16.824687957763672, 17.534900665283203, 18.245113372802734, 18.955326080322266, 19.665538787841797, 20.375751495361328, 21.08596420288086, 21.79617691040039, 22.506391525268555]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 16.0, 8.0, 14.0, 15.0, 17.0, 16.0, 28.0, 34.0, 37.0, 31.0, 47.0, 38.0, 35.0, 49.0, 43.0, 38.0, 50.0, 48.0, 56.0, 43.0, 36.0, 41.0, 30.0, 31.0, 27.0, 21.0, 21.0, 13.0, 17.0, 18.0, 16.0, 12.0, 7.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6331353187561035, -7.344013214111328, -7.054891109466553, -6.765769004821777, -6.476646900177002, -6.187524795532227, -5.898402214050293, -5.609280586242676, -5.320158004760742, -5.031035900115967, -4.741913795471191, -4.452791690826416, -4.163669586181641, -3.8745474815368652, -3.5854251384735107, -3.2963030338287354, -3.007181167602539, -2.7180590629577637, -2.4289369583129883, -2.139814853668213, -1.850692629814148, -1.5615705251693726, -1.2724483013153076, -0.9833261966705322, -0.6942040920257568, -0.40508195757865906, -0.11595982313156128, 0.1731623411178589, 0.4622844457626343, 0.7514065504074097, 1.0405287742614746, 1.32965087890625, 1.6187725067138672, 1.9078946113586426, 2.197016716003418, 2.4861388206481934, 2.7752609252929688, 3.064383029937744, 3.3535053730010986, 3.642627477645874, 3.9317495822906494, 4.220871925354004, 4.509994029998779, 4.799116134643555, 5.08823823928833, 5.3773603439331055, 5.666482448577881, 5.955604553222656, 6.244726657867432, 6.533848762512207, 6.822970867156982, 7.112092971801758, 7.401215076446533, 7.690337181091309, 7.979459762573242, 8.26858139038086, 8.557703971862793, 8.846826553344727, 9.135948181152344, 9.425070762634277, 9.714192390441895, 10.003314971923828, 10.292436599731445, 10.581559181213379, 10.870680809020996]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 11.0, 7.0, 17.0, 28.0, 53.0, 84.0, 121.0, 193.0, 248.0, 485.0, 780.0, 1408.0, 2515.0, 4650.0, 8796.0, 18493.0, 40494.0, 90993.0, 192971.0, 280828.0, 211845.0, 104424.0, 46298.0, 21047.0, 10101.0, 5193.0, 2635.0, 1558.0, 855.0, 527.0, 328.0, 181.0, 127.0, 99.0, 41.0, 29.0, 29.0, 18.0, 12.0, 10.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.6751708984375, -15.194091796875, -14.7130126953125, -14.23193359375, -13.7508544921875, -13.269775390625, -12.7886962890625, -12.3076171875, -11.8265380859375, -11.345458984375, -10.8643798828125, -10.38330078125, -9.9022216796875, -9.421142578125, -8.9400634765625, -8.458984375, -7.9779052734375, -7.496826171875, -7.0157470703125, -6.53466796875, -6.0535888671875, -5.572509765625, -5.0914306640625, -4.6103515625, -4.1292724609375, -3.648193359375, -3.1671142578125, -2.68603515625, -2.2049560546875, -1.723876953125, -1.2427978515625, -0.76171875, -0.2806396484375, 0.200439453125, 0.6815185546875, 1.16259765625, 1.6436767578125, 2.124755859375, 2.6058349609375, 3.0869140625, 3.5679931640625, 4.049072265625, 4.5301513671875, 5.01123046875, 5.4923095703125, 5.973388671875, 6.4544677734375, 6.935546875, 7.4166259765625, 7.897705078125, 8.3787841796875, 8.85986328125, 9.3409423828125, 9.822021484375, 10.3031005859375, 10.7841796875, 11.2652587890625, 11.746337890625, 12.2274169921875, 12.70849609375, 13.1895751953125, 13.670654296875, 14.1517333984375, 14.6328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 3.0, 10.0, 13.0, 12.0, 27.0, 19.0, 30.0, 28.0, 27.0, 38.0, 48.0, 49.0, 56.0, 50.0, 57.0, 44.0, 52.0, 47.0, 48.0, 42.0, 39.0, 40.0, 34.0, 28.0, 22.0, 28.0, 16.0, 22.0, 14.0, 14.0, 3.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.4588623046875, -10.097412109375, -9.7359619140625, -9.37451171875, -9.0130615234375, -8.651611328125, -8.2901611328125, -7.9287109375, -7.5672607421875, -7.205810546875, -6.8443603515625, -6.48291015625, -6.1214599609375, -5.760009765625, -5.3985595703125, -5.037109375, -4.6756591796875, -4.314208984375, -3.9527587890625, -3.59130859375, -3.2298583984375, -2.868408203125, -2.5069580078125, -2.1455078125, -1.7840576171875, -1.422607421875, -1.0611572265625, -0.69970703125, -0.3382568359375, 0.023193359375, 0.3846435546875, 0.74609375, 1.1075439453125, 1.468994140625, 1.8304443359375, 2.19189453125, 2.5533447265625, 2.914794921875, 3.2762451171875, 3.6376953125, 3.9991455078125, 4.360595703125, 4.7220458984375, 5.08349609375, 5.4449462890625, 5.806396484375, 6.1678466796875, 6.529296875, 6.8907470703125, 7.252197265625, 7.6136474609375, 7.97509765625, 8.3365478515625, 8.697998046875, 9.0594482421875, 9.4208984375, 9.7823486328125, 10.143798828125, 10.5052490234375, 10.86669921875, 11.2281494140625, 11.589599609375, 11.9510498046875, 12.3125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 11.0, 9.0, 17.0, 31.0, 31.0, 45.0, 71.0, 105.0, 174.0, 265.0, 446.0, 769.0, 1541.0, 3168.0, 7548.0, 19885.0, 61183.0, 204820.0, 430399.0, 217958.0, 64272.0, 21012.0, 7792.0, 3391.0, 1564.0, 811.0, 466.0, 269.0, 174.0, 100.0, 67.0, 37.0, 41.0, 25.0, 16.0, 6.0, 9.0, 10.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.703125, -26.92333984375, -26.1435546875, -25.36376953125, -24.583984375, -23.80419921875, -23.0244140625, -22.24462890625, -21.46484375, -20.68505859375, -19.9052734375, -19.12548828125, -18.345703125, -17.56591796875, -16.7861328125, -16.00634765625, -15.2265625, -14.44677734375, -13.6669921875, -12.88720703125, -12.107421875, -11.32763671875, -10.5478515625, -9.76806640625, -8.98828125, -8.20849609375, -7.4287109375, -6.64892578125, -5.869140625, -5.08935546875, -4.3095703125, -3.52978515625, -2.75, -1.97021484375, -1.1904296875, -0.41064453125, 0.369140625, 1.14892578125, 1.9287109375, 2.70849609375, 3.48828125, 4.26806640625, 5.0478515625, 5.82763671875, 6.607421875, 7.38720703125, 8.1669921875, 8.94677734375, 9.7265625, 10.50634765625, 11.2861328125, 12.06591796875, 12.845703125, 13.62548828125, 14.4052734375, 15.18505859375, 15.96484375, 16.74462890625, 17.5244140625, 18.30419921875, 19.083984375, 19.86376953125, 20.6435546875, 21.42333984375, 22.203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 10.0, 13.0, 12.0, 21.0, 22.0, 16.0, 15.0, 28.0, 24.0, 35.0, 29.0, 35.0, 43.0, 34.0, 52.0, 38.0, 45.0, 37.0, 44.0, 41.0, 45.0, 49.0, 45.0, 28.0, 27.0, 29.0, 22.0, 14.0, 19.0, 18.0, 19.0, 11.0, 12.0, 11.0, 8.0, 9.0, 6.0, 7.0, 4.0, 0.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.79559326171875, -5.6107177734375, -5.42584228515625, -5.240966796875, -5.05609130859375, -4.8712158203125, -4.68634033203125, -4.50146484375, -4.31658935546875, -4.1317138671875, -3.94683837890625, -3.761962890625, -3.57708740234375, -3.3922119140625, -3.20733642578125, -3.0224609375, -2.83758544921875, -2.6527099609375, -2.46783447265625, -2.282958984375, -2.09808349609375, -1.9132080078125, -1.72833251953125, -1.54345703125, -1.35858154296875, -1.1737060546875, -0.98883056640625, -0.803955078125, -0.61907958984375, -0.4342041015625, -0.24932861328125, -0.064453125, 0.12042236328125, 0.3052978515625, 0.49017333984375, 0.675048828125, 0.85992431640625, 1.0447998046875, 1.22967529296875, 1.41455078125, 1.59942626953125, 1.7843017578125, 1.96917724609375, 2.154052734375, 2.33892822265625, 2.5238037109375, 2.70867919921875, 2.8935546875, 3.07843017578125, 3.2633056640625, 3.44818115234375, 3.633056640625, 3.81793212890625, 4.0028076171875, 4.18768310546875, 4.37255859375, 4.55743408203125, 4.7423095703125, 4.92718505859375, 5.112060546875, 5.29693603515625, 5.4818115234375, 5.66668701171875, 5.8515625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 8.0, 3.0, 2.0, 4.0, 3.0, 12.0, 11.0, 13.0, 24.0, 21.0, 44.0, 57.0, 76.0, 111.0, 129.0, 212.0, 254.0, 399.0, 614.0, 900.0, 1261.0, 1837.0, 2755.0, 4360.0, 6861.0, 11031.0, 19325.0, 35062.0, 67905.0, 134879.0, 240356.0, 237161.0, 132465.0, 66318.0, 34541.0, 19108.0, 10954.0, 6591.0, 4291.0, 2729.0, 1797.0, 1224.0, 841.0, 583.0, 387.0, 277.0, 218.0, 165.0, 121.0, 66.0, 60.0, 39.0, 32.0, 18.0, 17.0, 14.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.671875, -6.4632568359375, -6.254638671875, -6.0460205078125, -5.83740234375, -5.6287841796875, -5.420166015625, -5.2115478515625, -5.0029296875, -4.7943115234375, -4.585693359375, -4.3770751953125, -4.16845703125, -3.9598388671875, -3.751220703125, -3.5426025390625, -3.333984375, -3.1253662109375, -2.916748046875, -2.7081298828125, -2.49951171875, -2.2908935546875, -2.082275390625, -1.8736572265625, -1.6650390625, -1.4564208984375, -1.247802734375, -1.0391845703125, -0.83056640625, -0.6219482421875, -0.413330078125, -0.2047119140625, 0.00390625, 0.2125244140625, 0.421142578125, 0.6297607421875, 0.83837890625, 1.0469970703125, 1.255615234375, 1.4642333984375, 1.6728515625, 1.8814697265625, 2.090087890625, 2.2987060546875, 2.50732421875, 2.7159423828125, 2.924560546875, 3.1331787109375, 3.341796875, 3.5504150390625, 3.759033203125, 3.9676513671875, 4.17626953125, 4.3848876953125, 4.593505859375, 4.8021240234375, 5.0107421875, 5.2193603515625, 5.427978515625, 5.6365966796875, 5.84521484375, 6.0538330078125, 6.262451171875, 6.4710693359375, 6.6796875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 6.0, 8.0, 11.0, 14.0, 20.0, 22.0, 30.0, 43.0, 75.0, 92.0, 93.0, 98.0, 115.0, 71.0, 69.0, 55.0, 47.0, 33.0, 19.0, 13.0, 13.0, 9.0, 6.0, 10.0, 4.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044727325439453125, -0.00043395906686782837, -0.0004206448793411255, -0.0004073306918144226, -0.0003940165042877197, -0.00038070231676101685, -0.00036738812923431396, -0.0003540739417076111, -0.0003407597541809082, -0.0003274455666542053, -0.00031413137912750244, -0.00030081719160079956, -0.0002875030040740967, -0.0002741888165473938, -0.0002608746290206909, -0.00024756044149398804, -0.00023424625396728516, -0.00022093206644058228, -0.0002076178789138794, -0.00019430369138717651, -0.00018098950386047363, -0.00016767531633377075, -0.00015436112880706787, -0.000141046941280365, -0.0001277327537536621, -0.00011441856622695923, -0.00010110437870025635, -8.779019117355347e-05, -7.447600364685059e-05, -6.11618161201477e-05, -4.7847628593444824e-05, -3.453344106674194e-05, -2.1219253540039062e-05, -7.905066013336182e-06, 5.409121513366699e-06, 1.872330904006958e-05, 3.203749656677246e-05, 4.535168409347534e-05, 5.866587162017822e-05, 7.19800591468811e-05, 8.529424667358398e-05, 9.860843420028687e-05, 0.00011192262172698975, 0.00012523680925369263, 0.0001385509967803955, 0.0001518651843070984, 0.00016517937183380127, 0.00017849355936050415, 0.00019180774688720703, 0.0002051219344139099, 0.0002184361219406128, 0.00023175030946731567, 0.00024506449699401855, 0.00025837868452072144, 0.0002716928720474243, 0.0002850070595741272, 0.0002983212471008301, 0.00031163543462753296, 0.00032494962215423584, 0.0003382638096809387, 0.0003515779972076416, 0.0003648921847343445, 0.00037820637226104736, 0.00039152055978775024, 0.0004048347473144531]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 19.0, 10.0, 21.0, 37.0, 48.0, 68.0, 98.0, 138.0, 249.0, 422.0, 649.0, 1106.0, 1869.0, 3178.0, 5576.0, 10281.0, 19984.0, 40492.0, 85818.0, 173048.0, 260451.0, 217306.0, 116015.0, 54510.0, 26711.0, 13590.0, 7106.0, 3923.0, 2201.0, 1383.0, 847.0, 505.0, 340.0, 194.0, 123.0, 80.0, 49.0, 38.0, 22.0, 16.0, 6.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.71112060546875, -6.4925537109375, -6.27398681640625, -6.055419921875, -5.83685302734375, -5.6182861328125, -5.39971923828125, -5.18115234375, -4.96258544921875, -4.7440185546875, -4.52545166015625, -4.306884765625, -4.08831787109375, -3.8697509765625, -3.65118408203125, -3.4326171875, -3.21405029296875, -2.9954833984375, -2.77691650390625, -2.558349609375, -2.33978271484375, -2.1212158203125, -1.90264892578125, -1.68408203125, -1.46551513671875, -1.2469482421875, -1.02838134765625, -0.809814453125, -0.59124755859375, -0.3726806640625, -0.15411376953125, 0.064453125, 0.28302001953125, 0.5015869140625, 0.72015380859375, 0.938720703125, 1.15728759765625, 1.3758544921875, 1.59442138671875, 1.81298828125, 2.03155517578125, 2.2501220703125, 2.46868896484375, 2.687255859375, 2.90582275390625, 3.1243896484375, 3.34295654296875, 3.5615234375, 3.78009033203125, 3.9986572265625, 4.21722412109375, 4.435791015625, 4.65435791015625, 4.8729248046875, 5.09149169921875, 5.31005859375, 5.52862548828125, 5.7471923828125, 5.96575927734375, 6.184326171875, 6.40289306640625, 6.6214599609375, 6.84002685546875, 7.05859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 6.0, 13.0, 4.0, 8.0, 5.0, 18.0, 19.0, 22.0, 21.0, 31.0, 38.0, 34.0, 67.0, 66.0, 62.0, 46.0, 64.0, 52.0, 47.0, 56.0, 42.0, 48.0, 32.0, 45.0, 27.0, 20.0, 10.0, 17.0, 16.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.384765625, -1.3418731689453125, -1.298980712890625, -1.2560882568359375, -1.21319580078125, -1.1703033447265625, -1.127410888671875, -1.0845184326171875, -1.0416259765625, -0.9987335205078125, -0.955841064453125, -0.9129486083984375, -0.87005615234375, -0.8271636962890625, -0.784271240234375, -0.7413787841796875, -0.698486328125, -0.6555938720703125, -0.612701416015625, -0.5698089599609375, -0.52691650390625, -0.4840240478515625, -0.441131591796875, -0.3982391357421875, -0.3553466796875, -0.3124542236328125, -0.269561767578125, -0.2266693115234375, -0.18377685546875, -0.1408843994140625, -0.097991943359375, -0.0550994873046875, -0.01220703125, 0.0306854248046875, 0.073577880859375, 0.1164703369140625, 0.15936279296875, 0.2022552490234375, 0.245147705078125, 0.2880401611328125, 0.3309326171875, 0.3738250732421875, 0.416717529296875, 0.4596099853515625, 0.50250244140625, 0.5453948974609375, 0.588287353515625, 0.6311798095703125, 0.674072265625, 0.7169647216796875, 0.759857177734375, 0.8027496337890625, 0.84564208984375, 0.8885345458984375, 0.931427001953125, 0.9743194580078125, 1.0172119140625, 1.0601043701171875, 1.102996826171875, 1.1458892822265625, 1.18878173828125, 1.2316741943359375, 1.274566650390625, 1.3174591064453125, 1.3603515625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 3.0, 13.0, 8.0, 10.0, 14.0, 21.0, 29.0, 37.0, 45.0, 51.0, 58.0, 81.0, 83.0, 77.0, 62.0, 71.0, 69.0, 53.0, 49.0, 36.0, 22.0, 23.0, 14.0, 11.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-25.621694564819336, -24.904603958129883, -24.18751335144043, -23.470422744750977, -22.753334045410156, -22.036243438720703, -21.31915283203125, -20.602062225341797, -19.884971618652344, -19.16788101196289, -18.450790405273438, -17.733699798583984, -17.01660919189453, -16.29952049255371, -15.582429885864258, -14.865339279174805, -14.148248672485352, -13.431158065795898, -12.714067459106445, -11.996977806091309, -11.279887199401855, -10.562796592712402, -9.845706939697266, -9.128616333007812, -8.41152572631836, -7.694435119628906, -6.977344989776611, -6.260254859924316, -5.543164253234863, -4.82607364654541, -4.108983516693115, -3.3918933868408203, -2.6748046875, -1.957714319229126, -1.240623950958252, -0.5235335826873779, 0.1935567855834961, 0.9106471538543701, 1.6277375221252441, 2.344827651977539, 3.061918258666992, 3.779008626937866, 4.49609899520874, 5.213189125061035, 5.930279731750488, 6.647370338439941, 7.364460468292236, 8.081550598144531, 8.798641204833984, 9.515731811523438, 10.23282241821289, 10.949912071228027, 11.66700267791748, 12.384093284606934, 13.10118293762207, 13.818273544311523, 14.535364151000977, 15.25245475769043, 15.969545364379883, 16.686635971069336, 17.403724670410156, 18.12081527709961, 18.837905883789062, 19.554996490478516, 20.27208709716797]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 6.0, 10.0, 8.0, 7.0, 12.0, 7.0, 24.0, 13.0, 13.0, 27.0, 31.0, 37.0, 38.0, 33.0, 36.0, 48.0, 36.0, 32.0, 40.0, 53.0, 46.0, 46.0, 46.0, 47.0, 36.0, 36.0, 31.0, 28.0, 25.0, 16.0, 22.0, 9.0, 20.0, 16.0, 18.0, 10.0, 9.0, 10.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.047958850860596, -6.774683952331543, -6.501409530639648, -6.228134632110596, -5.954859733581543, -5.68158483505249, -5.4083099365234375, -5.135035514831543, -4.86176061630249, -4.5884857177734375, -4.315211296081543, -4.04193639755249, -3.7686614990234375, -3.4953866004943848, -3.222111940383911, -2.9488372802734375, -2.6755623817443848, -2.402287483215332, -2.1290128231048584, -1.8557380437850952, -1.582463264465332, -1.3091884851455688, -1.0359137058258057, -0.7626389265060425, -0.4893641471862793, -0.2160893678665161, 0.05718541145324707, 0.33046019077301025, 0.6037349700927734, 0.8770097494125366, 1.1502845287322998, 1.423559308052063, 1.6968345642089844, 1.9701093435287476, 2.2433841228485107, 2.5166587829589844, 2.789933681488037, 3.06320858001709, 3.3364832401275635, 3.609757900238037, 3.88303279876709, 4.156307697296143, 4.429582595825195, 4.70285701751709, 4.976131916046143, 5.249406814575195, 5.52268123626709, 5.795956134796143, 6.069231033325195, 6.342505931854248, 6.615780830383301, 6.889055252075195, 7.162330150604248, 7.435605049133301, 7.708879470825195, 7.982154369354248, 8.2554292678833, 8.528703689575195, 8.801979064941406, 9.0752534866333, 9.348527908325195, 9.621803283691406, 9.8950777053833, 10.168353080749512, 10.441627502441406]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 12.0, 18.0, 22.0, 23.0, 42.0, 61.0, 94.0, 154.0, 230.0, 380.0, 624.0, 896.0, 1578.0, 2601.0, 4664.0, 7887.0, 14002.0, 24700.0, 43223.0, 72982.0, 115304.0, 158621.0, 175972.0, 153260.0, 109188.0, 68729.0, 39911.0, 22630.0, 12879.0, 7380.0, 4261.0, 2460.0, 1419.0, 868.0, 546.0, 321.0, 186.0, 123.0, 113.0, 54.0, 34.0, 27.0, 25.0, 12.0, 10.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.890625, -12.48046875, -12.0703125, -11.66015625, -11.25, -10.83984375, -10.4296875, -10.01953125, -9.609375, -9.19921875, -8.7890625, -8.37890625, -7.96875, -7.55859375, -7.1484375, -6.73828125, -6.328125, -5.91796875, -5.5078125, -5.09765625, -4.6875, -4.27734375, -3.8671875, -3.45703125, -3.046875, -2.63671875, -2.2265625, -1.81640625, -1.40625, -0.99609375, -0.5859375, -0.17578125, 0.234375, 0.64453125, 1.0546875, 1.46484375, 1.875, 2.28515625, 2.6953125, 3.10546875, 3.515625, 3.92578125, 4.3359375, 4.74609375, 5.15625, 5.56640625, 5.9765625, 6.38671875, 6.796875, 7.20703125, 7.6171875, 8.02734375, 8.4375, 8.84765625, 9.2578125, 9.66796875, 10.078125, 10.48828125, 10.8984375, 11.30859375, 11.71875, 12.12890625, 12.5390625, 12.94921875, 13.359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 1.0, 9.0, 10.0, 9.0, 7.0, 14.0, 16.0, 23.0, 25.0, 17.0, 36.0, 44.0, 40.0, 35.0, 36.0, 52.0, 39.0, 47.0, 49.0, 39.0, 39.0, 45.0, 47.0, 34.0, 43.0, 27.0, 34.0, 20.0, 25.0, 18.0, 16.0, 19.0, 13.0, 11.0, 13.0, 6.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0859375, -9.7691650390625, -9.452392578125, -9.1356201171875, -8.81884765625, -8.5020751953125, -8.185302734375, -7.8685302734375, -7.5517578125, -7.2349853515625, -6.918212890625, -6.6014404296875, -6.28466796875, -5.9678955078125, -5.651123046875, -5.3343505859375, -5.017578125, -4.7008056640625, -4.384033203125, -4.0672607421875, -3.75048828125, -3.4337158203125, -3.116943359375, -2.8001708984375, -2.4833984375, -2.1666259765625, -1.849853515625, -1.5330810546875, -1.21630859375, -0.8995361328125, -0.582763671875, -0.2659912109375, 0.05078125, 0.3675537109375, 0.684326171875, 1.0010986328125, 1.31787109375, 1.6346435546875, 1.951416015625, 2.2681884765625, 2.5849609375, 2.9017333984375, 3.218505859375, 3.5352783203125, 3.85205078125, 4.1688232421875, 4.485595703125, 4.8023681640625, 5.119140625, 5.4359130859375, 5.752685546875, 6.0694580078125, 6.38623046875, 6.7030029296875, 7.019775390625, 7.3365478515625, 7.6533203125, 7.9700927734375, 8.286865234375, 8.6036376953125, 8.92041015625, 9.2371826171875, 9.553955078125, 9.8707275390625, 10.1875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 12.0, 13.0, 36.0, 36.0, 62.0, 89.0, 152.0, 237.0, 419.0, 803.0, 1493.0, 2840.0, 5695.0, 11663.0, 24566.0, 49306.0, 95149.0, 159970.0, 210294.0, 197395.0, 135392.0, 76441.0, 39094.0, 18982.0, 8997.0, 4539.0, 2218.0, 1095.0, 614.0, 350.0, 199.0, 123.0, 99.0, 46.0, 36.0, 22.0, 25.0, 9.0, 14.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6640625, -15.1558837890625, -14.647705078125, -14.1395263671875, -13.63134765625, -13.1231689453125, -12.614990234375, -12.1068115234375, -11.5986328125, -11.0904541015625, -10.582275390625, -10.0740966796875, -9.56591796875, -9.0577392578125, -8.549560546875, -8.0413818359375, -7.533203125, -7.0250244140625, -6.516845703125, -6.0086669921875, -5.50048828125, -4.9923095703125, -4.484130859375, -3.9759521484375, -3.4677734375, -2.9595947265625, -2.451416015625, -1.9432373046875, -1.43505859375, -0.9268798828125, -0.418701171875, 0.0894775390625, 0.59765625, 1.1058349609375, 1.614013671875, 2.1221923828125, 2.63037109375, 3.1385498046875, 3.646728515625, 4.1549072265625, 4.6630859375, 5.1712646484375, 5.679443359375, 6.1876220703125, 6.69580078125, 7.2039794921875, 7.712158203125, 8.2203369140625, 8.728515625, 9.2366943359375, 9.744873046875, 10.2530517578125, 10.76123046875, 11.2694091796875, 11.777587890625, 12.2857666015625, 12.7939453125, 13.3021240234375, 13.810302734375, 14.3184814453125, 14.82666015625, 15.3348388671875, 15.843017578125, 16.3511962890625, 16.859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 12.0, 6.0, 23.0, 17.0, 24.0, 13.0, 20.0, 31.0, 35.0, 31.0, 33.0, 25.0, 38.0, 28.0, 39.0, 40.0, 38.0, 36.0, 41.0, 38.0, 40.0, 45.0, 44.0, 37.0, 28.0, 35.0, 31.0, 19.0, 21.0, 12.0, 14.0, 13.0, 9.0, 6.0, 15.0, 7.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.4765625, -4.296875, -4.1171875, -3.9375, -3.7578125, -3.578125, -3.3984375, -3.21875, -3.0390625, -2.859375, -2.6796875, -2.5, -2.3203125, -2.140625, -1.9609375, -1.78125, -1.6015625, -1.421875, -1.2421875, -1.0625, -0.8828125, -0.703125, -0.5234375, -0.34375, -0.1640625, 0.015625, 0.1953125, 0.375, 0.5546875, 0.734375, 0.9140625, 1.09375, 1.2734375, 1.453125, 1.6328125, 1.8125, 1.9921875, 2.171875, 2.3515625, 2.53125, 2.7109375, 2.890625, 3.0703125, 3.25, 3.4296875, 3.609375, 3.7890625, 3.96875, 4.1484375, 4.328125, 4.5078125, 4.6875, 4.8671875, 5.046875, 5.2265625, 5.40625, 5.5859375, 5.765625, 5.9453125, 6.125, 6.3046875, 6.484375, 6.6640625, 6.84375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 9.0, 23.0, 16.0, 26.0, 53.0, 58.0, 81.0, 95.0, 165.0, 220.0, 318.0, 510.0, 890.0, 1581.0, 2897.0, 5876.0, 13263.0, 31685.0, 80812.0, 186615.0, 295145.0, 236329.0, 112411.0, 44919.0, 18025.0, 7713.0, 3820.0, 2031.0, 1094.0, 626.0, 373.0, 273.0, 151.0, 129.0, 88.0, 61.0, 39.0, 27.0, 21.0, 14.0, 13.0, 14.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.15625, -9.854736328125, -9.55322265625, -9.251708984375, -8.9501953125, -8.648681640625, -8.34716796875, -8.045654296875, -7.744140625, -7.442626953125, -7.14111328125, -6.839599609375, -6.5380859375, -6.236572265625, -5.93505859375, -5.633544921875, -5.33203125, -5.030517578125, -4.72900390625, -4.427490234375, -4.1259765625, -3.824462890625, -3.52294921875, -3.221435546875, -2.919921875, -2.618408203125, -2.31689453125, -2.015380859375, -1.7138671875, -1.412353515625, -1.11083984375, -0.809326171875, -0.5078125, -0.206298828125, 0.09521484375, 0.396728515625, 0.6982421875, 0.999755859375, 1.30126953125, 1.602783203125, 1.904296875, 2.205810546875, 2.50732421875, 2.808837890625, 3.1103515625, 3.411865234375, 3.71337890625, 4.014892578125, 4.31640625, 4.617919921875, 4.91943359375, 5.220947265625, 5.5224609375, 5.823974609375, 6.12548828125, 6.427001953125, 6.728515625, 7.030029296875, 7.33154296875, 7.633056640625, 7.9345703125, 8.236083984375, 8.53759765625, 8.839111328125, 9.140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 7.0, 7.0, 12.0, 12.0, 29.0, 23.0, 29.0, 29.0, 36.0, 37.0, 45.0, 54.0, 60.0, 57.0, 62.0, 49.0, 55.0, 52.0, 56.0, 44.0, 43.0, 31.0, 33.0, 22.0, 20.0, 16.0, 10.0, 15.0, 14.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004963874816894531, -0.00047941505908966064, -0.00046244263648986816, -0.0004454702138900757, -0.0004284977912902832, -0.0004115253686904907, -0.00039455294609069824, -0.00037758052349090576, -0.0003606081008911133, -0.0003436356782913208, -0.0003266632556915283, -0.00030969083309173584, -0.00029271841049194336, -0.0002757459878921509, -0.0002587735652923584, -0.00024180114269256592, -0.00022482872009277344, -0.00020785629749298096, -0.00019088387489318848, -0.000173911452293396, -0.00015693902969360352, -0.00013996660709381104, -0.00012299418449401855, -0.00010602176189422607, -8.90493392944336e-05, -7.207691669464111e-05, -5.510449409484863e-05, -3.813207149505615e-05, -2.1159648895263672e-05, -4.187226295471191e-06, 1.2785196304321289e-05, 2.975761890411377e-05, 4.673004150390625e-05, 6.370246410369873e-05, 8.067488670349121e-05, 9.764730930328369e-05, 0.00011461973190307617, 0.00013159215450286865, 0.00014856457710266113, 0.0001655369997024536, 0.0001825094223022461, 0.00019948184490203857, 0.00021645426750183105, 0.00023342669010162354, 0.000250399112701416, 0.0002673715353012085, 0.000284343957901001, 0.00030131638050079346, 0.00031828880310058594, 0.0003352612257003784, 0.0003522336483001709, 0.0003692060708999634, 0.00038617849349975586, 0.00040315091609954834, 0.0004201233386993408, 0.0004370957612991333, 0.0004540681838989258, 0.00047104060649871826, 0.00048801302909851074, 0.0005049854516983032, 0.0005219578742980957, 0.0005389302968978882, 0.0005559027194976807, 0.0005728751420974731, 0.0005898475646972656]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 9.0, 2.0, 7.0, 8.0, 9.0, 16.0, 13.0, 18.0, 38.0, 49.0, 75.0, 107.0, 140.0, 211.0, 309.0, 510.0, 748.0, 1178.0, 1964.0, 3369.0, 6126.0, 10828.0, 20216.0, 37614.0, 67563.0, 114816.0, 168142.0, 193541.0, 165033.0, 110730.0, 65062.0, 35953.0, 19425.0, 10432.0, 5773.0, 3281.0, 1995.0, 1130.0, 725.0, 448.0, 294.0, 199.0, 139.0, 92.0, 66.0, 40.0, 29.0, 31.0, 18.0, 11.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.734375, -5.5521240234375, -5.369873046875, -5.1876220703125, -5.00537109375, -4.8231201171875, -4.640869140625, -4.4586181640625, -4.2763671875, -4.0941162109375, -3.911865234375, -3.7296142578125, -3.54736328125, -3.3651123046875, -3.182861328125, -3.0006103515625, -2.818359375, -2.6361083984375, -2.453857421875, -2.2716064453125, -2.08935546875, -1.9071044921875, -1.724853515625, -1.5426025390625, -1.3603515625, -1.1781005859375, -0.995849609375, -0.8135986328125, -0.63134765625, -0.4490966796875, -0.266845703125, -0.0845947265625, 0.09765625, 0.2799072265625, 0.462158203125, 0.6444091796875, 0.82666015625, 1.0089111328125, 1.191162109375, 1.3734130859375, 1.5556640625, 1.7379150390625, 1.920166015625, 2.1024169921875, 2.28466796875, 2.4669189453125, 2.649169921875, 2.8314208984375, 3.013671875, 3.1959228515625, 3.378173828125, 3.5604248046875, 3.74267578125, 3.9249267578125, 4.107177734375, 4.2894287109375, 4.4716796875, 4.6539306640625, 4.836181640625, 5.0184326171875, 5.20068359375, 5.3829345703125, 5.565185546875, 5.7474365234375, 5.9296875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 14.0, 9.0, 19.0, 20.0, 23.0, 33.0, 42.0, 40.0, 56.0, 69.0, 60.0, 79.0, 70.0, 76.0, 55.0, 46.0, 57.0, 43.0, 43.0, 37.0, 21.0, 18.0, 5.0, 15.0, 10.0, 3.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8626861572265625, -1.800567626953125, -1.7384490966796875, -1.67633056640625, -1.6142120361328125, -1.552093505859375, -1.4899749755859375, -1.4278564453125, -1.3657379150390625, -1.303619384765625, -1.2415008544921875, -1.17938232421875, -1.1172637939453125, -1.055145263671875, -0.9930267333984375, -0.930908203125, -0.8687896728515625, -0.806671142578125, -0.7445526123046875, -0.68243408203125, -0.6203155517578125, -0.558197021484375, -0.4960784912109375, -0.4339599609375, -0.3718414306640625, -0.309722900390625, -0.2476043701171875, -0.18548583984375, -0.1233673095703125, -0.061248779296875, 0.0008697509765625, 0.06298828125, 0.1251068115234375, 0.187225341796875, 0.2493438720703125, 0.31146240234375, 0.3735809326171875, 0.435699462890625, 0.4978179931640625, 0.5599365234375, 0.6220550537109375, 0.684173583984375, 0.7462921142578125, 0.80841064453125, 0.8705291748046875, 0.932647705078125, 0.9947662353515625, 1.056884765625, 1.1190032958984375, 1.181121826171875, 1.2432403564453125, 1.30535888671875, 1.3674774169921875, 1.429595947265625, 1.4917144775390625, 1.5538330078125, 1.6159515380859375, 1.678070068359375, 1.7401885986328125, 1.80230712890625, 1.8644256591796875, 1.926544189453125, 1.9886627197265625, 2.05078125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 3.0, 10.0, 10.0, 16.0, 16.0, 21.0, 28.0, 46.0, 50.0, 63.0, 74.0, 93.0, 79.0, 96.0, 64.0, 71.0, 66.0, 31.0, 36.0, 31.0, 27.0, 9.0, 12.0, 13.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.34234046936035, -26.557292938232422, -25.772245407104492, -24.987197875976562, -24.202150344848633, -23.417102813720703, -22.63205337524414, -21.847007751464844, -21.06195831298828, -20.27691078186035, -19.491863250732422, -18.706815719604492, -17.921768188476562, -17.136720657348633, -16.351673126220703, -15.566624641418457, -14.781578063964844, -13.996530532836914, -13.211483001708984, -12.426435470581055, -11.641387939453125, -10.856340408325195, -10.07129192352295, -9.28624439239502, -8.50119686126709, -7.71614933013916, -6.9311017990112305, -6.146053791046143, -5.361006259918213, -4.575958728790283, -3.7909107208251953, -3.0058631896972656, -2.220815658569336, -1.4357680082321167, -0.6507203578948975, 0.13432741165161133, 0.919374942779541, 1.7044224739074707, 2.4894704818725586, 3.2745180130004883, 4.059565544128418, 4.844613075256348, 5.629660606384277, 6.414708614349365, 7.199756145477295, 7.984803676605225, 8.769851684570312, 9.554899215698242, 10.339946746826172, 11.124994277954102, 11.910041809082031, 12.695089340209961, 13.48013687133789, 14.26518440246582, 15.050232887268066, 15.835280418395996, 16.62032699584961, 17.40537452697754, 18.19042205810547, 18.9754695892334, 19.760517120361328, 20.545564651489258, 21.330612182617188, 22.11566162109375, 22.90070915222168]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 12.0, 13.0, 13.0, 8.0, 23.0, 20.0, 20.0, 25.0, 23.0, 29.0, 40.0, 32.0, 52.0, 43.0, 38.0, 32.0, 46.0, 63.0, 42.0, 36.0, 40.0, 41.0, 46.0, 32.0, 34.0, 26.0, 28.0, 18.0, 22.0, 10.0, 6.0, 14.0, 15.0, 14.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.717850208282471, -7.419209957122803, -7.120569705963135, -6.821929454803467, -6.523289203643799, -6.224648952484131, -5.926008701324463, -5.627368450164795, -5.328728199005127, -5.030087947845459, -4.731447696685791, -4.432807445526123, -4.134167194366455, -3.835526943206787, -3.536886692047119, -3.238246440887451, -2.939606189727783, -2.6409659385681152, -2.3423256874084473, -2.0436854362487793, -1.7450451850891113, -1.4464049339294434, -1.1477646827697754, -0.8491244316101074, -0.5504841804504395, -0.2518439292907715, 0.046796321868896484, 0.34543657302856445, 0.6440768241882324, 0.9427170753479004, 1.2413573265075684, 1.5399975776672363, 1.838637351989746, 2.137277603149414, 2.435917854309082, 2.73455810546875, 3.033198356628418, 3.331838607788086, 3.630478858947754, 3.929119110107422, 4.22775936126709, 4.526399612426758, 4.825039863586426, 5.123680114746094, 5.422320365905762, 5.72096061706543, 6.019600868225098, 6.318241119384766, 6.616881370544434, 6.915521621704102, 7.2141618728637695, 7.5128021240234375, 7.8114423751831055, 8.110082626342773, 8.408722877502441, 8.70736312866211, 9.006003379821777, 9.304643630981445, 9.603283882141113, 9.901924133300781, 10.20056438446045, 10.499204635620117, 10.797844886779785, 11.096485137939453, 11.395125389099121]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 10.0, 19.0, 26.0, 40.0, 60.0, 95.0, 155.0, 223.0, 413.0, 637.0, 1182.0, 1927.0, 3337.0, 6259.0, 12609.0, 25167.0, 52574.0, 117310.0, 278734.0, 690717.0, 1276717.0, 981621.0, 420102.0, 173308.0, 77183.0, 35898.0, 17722.0, 9130.0, 4725.0, 2657.0, 1511.0, 859.0, 499.0, 319.0, 184.0, 131.0, 69.0, 50.0, 30.0, 19.0, 13.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.671875, -18.064208984375, -17.45654296875, -16.848876953125, -16.2412109375, -15.633544921875, -15.02587890625, -14.418212890625, -13.810546875, -13.202880859375, -12.59521484375, -11.987548828125, -11.3798828125, -10.772216796875, -10.16455078125, -9.556884765625, -8.94921875, -8.341552734375, -7.73388671875, -7.126220703125, -6.5185546875, -5.910888671875, -5.30322265625, -4.695556640625, -4.087890625, -3.480224609375, -2.87255859375, -2.264892578125, -1.6572265625, -1.049560546875, -0.44189453125, 0.165771484375, 0.7734375, 1.381103515625, 1.98876953125, 2.596435546875, 3.2041015625, 3.811767578125, 4.41943359375, 5.027099609375, 5.634765625, 6.242431640625, 6.85009765625, 7.457763671875, 8.0654296875, 8.673095703125, 9.28076171875, 9.888427734375, 10.49609375, 11.103759765625, 11.71142578125, 12.319091796875, 12.9267578125, 13.534423828125, 14.14208984375, 14.749755859375, 15.357421875, 15.965087890625, 16.57275390625, 17.180419921875, 17.7880859375, 18.395751953125, 19.00341796875, 19.611083984375, 20.21875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 12.0, 7.0, 13.0, 7.0, 13.0, 20.0, 17.0, 21.0, 27.0, 30.0, 24.0, 27.0, 37.0, 29.0, 41.0, 44.0, 48.0, 50.0, 41.0, 35.0, 52.0, 46.0, 33.0, 43.0, 48.0, 32.0, 33.0, 25.0, 20.0, 21.0, 21.0, 12.0, 13.0, 16.0, 11.0, 9.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.9002685546875, -5.675537109375, -5.4508056640625, -5.22607421875, -5.0013427734375, -4.776611328125, -4.5518798828125, -4.3271484375, -4.1024169921875, -3.877685546875, -3.6529541015625, -3.42822265625, -3.2034912109375, -2.978759765625, -2.7540283203125, -2.529296875, -2.3045654296875, -2.079833984375, -1.8551025390625, -1.63037109375, -1.4056396484375, -1.180908203125, -0.9561767578125, -0.7314453125, -0.5067138671875, -0.281982421875, -0.0572509765625, 0.16748046875, 0.3922119140625, 0.616943359375, 0.8416748046875, 1.06640625, 1.2911376953125, 1.515869140625, 1.7406005859375, 1.96533203125, 2.1900634765625, 2.414794921875, 2.6395263671875, 2.8642578125, 3.0889892578125, 3.313720703125, 3.5384521484375, 3.76318359375, 3.9879150390625, 4.212646484375, 4.4373779296875, 4.662109375, 4.8868408203125, 5.111572265625, 5.3363037109375, 5.56103515625, 5.7857666015625, 6.010498046875, 6.2352294921875, 6.4599609375, 6.6846923828125, 6.909423828125, 7.1341552734375, 7.35888671875, 7.5836181640625, 7.808349609375, 8.0330810546875, 8.2578125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 16.0, 19.0, 50.0, 73.0, 98.0, 178.0, 226.0, 390.0, 611.0, 1036.0, 1723.0, 2951.0, 5233.0, 9068.0, 15928.0, 28858.0, 53743.0, 102391.0, 197687.0, 382617.0, 694030.0, 959245.0, 785904.0, 453863.0, 235495.0, 121026.0, 63869.0, 33960.0, 18675.0, 10674.0, 6126.0, 3440.0, 1995.0, 1168.0, 722.0, 428.0, 270.0, 188.0, 100.0, 66.0, 43.0, 29.0, 13.0, 14.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.024658203125, -15.51806640625, -15.011474609375, -14.5048828125, -13.998291015625, -13.49169921875, -12.985107421875, -12.478515625, -11.971923828125, -11.46533203125, -10.958740234375, -10.4521484375, -9.945556640625, -9.43896484375, -8.932373046875, -8.42578125, -7.919189453125, -7.41259765625, -6.906005859375, -6.3994140625, -5.892822265625, -5.38623046875, -4.879638671875, -4.373046875, -3.866455078125, -3.35986328125, -2.853271484375, -2.3466796875, -1.840087890625, -1.33349609375, -0.826904296875, -0.3203125, 0.186279296875, 0.69287109375, 1.199462890625, 1.7060546875, 2.212646484375, 2.71923828125, 3.225830078125, 3.732421875, 4.239013671875, 4.74560546875, 5.252197265625, 5.7587890625, 6.265380859375, 6.77197265625, 7.278564453125, 7.78515625, 8.291748046875, 8.79833984375, 9.304931640625, 9.8115234375, 10.318115234375, 10.82470703125, 11.331298828125, 11.837890625, 12.344482421875, 12.85107421875, 13.357666015625, 13.8642578125, 14.370849609375, 14.87744140625, 15.384033203125, 15.890625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 23.0, 25.0, 33.0, 52.0, 62.0, 62.0, 87.0, 112.0, 127.0, 186.0, 206.0, 241.0, 265.0, 297.0, 274.0, 304.0, 276.0, 242.0, 215.0, 196.0, 161.0, 137.0, 127.0, 75.0, 69.0, 55.0, 31.0, 25.0, 21.0, 21.0, 10.0, 13.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.82391357421875, -4.6673583984375, -4.51080322265625, -4.354248046875, -4.19769287109375, -4.0411376953125, -3.88458251953125, -3.72802734375, -3.57147216796875, -3.4149169921875, -3.25836181640625, -3.101806640625, -2.94525146484375, -2.7886962890625, -2.63214111328125, -2.4755859375, -2.31903076171875, -2.1624755859375, -2.00592041015625, -1.849365234375, -1.69281005859375, -1.5362548828125, -1.37969970703125, -1.22314453125, -1.06658935546875, -0.9100341796875, -0.75347900390625, -0.596923828125, -0.44036865234375, -0.2838134765625, -0.12725830078125, 0.029296875, 0.18585205078125, 0.3424072265625, 0.49896240234375, 0.655517578125, 0.81207275390625, 0.9686279296875, 1.12518310546875, 1.28173828125, 1.43829345703125, 1.5948486328125, 1.75140380859375, 1.907958984375, 2.06451416015625, 2.2210693359375, 2.37762451171875, 2.5341796875, 2.69073486328125, 2.8472900390625, 3.00384521484375, 3.160400390625, 3.31695556640625, 3.4735107421875, 3.63006591796875, 3.78662109375, 3.94317626953125, 4.0997314453125, 4.25628662109375, 4.412841796875, 4.56939697265625, 4.7259521484375, 4.88250732421875, 5.0390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 13.0, 12.0, 23.0, 42.0, 46.0, 49.0, 63.0, 70.0, 68.0, 75.0, 87.0, 92.0, 64.0, 46.0, 46.0, 46.0, 34.0, 18.0, 20.0, 12.0, 15.0, 10.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.599149703979492, -23.857467651367188, -23.11578369140625, -22.374101638793945, -21.63241958618164, -20.890735626220703, -20.1490535736084, -19.407371520996094, -18.665687561035156, -17.92400550842285, -17.182321548461914, -16.44063949584961, -15.698956489562988, -14.957273483276367, -14.215591430664062, -13.473908424377441, -12.73222541809082, -11.9905424118042, -11.248859405517578, -10.507177352905273, -9.765494346618652, -9.023811340332031, -8.282129287719727, -7.5404462814331055, -6.798763275146484, -6.057080268859863, -5.3153977394104, -4.5737152099609375, -3.8320322036743164, -3.0903494358062744, -2.3486666679382324, -1.6069841384887695, -0.8652992248535156, -0.12361645698547363, 0.6180663108825684, 1.3597490787506104, 2.1014318466186523, 2.8431146144866943, 3.5847973823547363, 4.326479911804199, 5.06816291809082, 5.809845924377441, 6.551528453826904, 7.293210983276367, 8.034893989562988, 8.77657699584961, 9.518259048461914, 10.259942054748535, 11.001625061035156, 11.743308067321777, 12.484991073608398, 13.226673126220703, 13.968356132507324, 14.710039138793945, 15.45172119140625, 16.193405151367188, 16.935087203979492, 17.676769256591797, 18.418453216552734, 19.16013526916504, 19.901817321777344, 20.64350128173828, 21.385183334350586, 22.12686538696289, 22.868549346923828]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 12.0, 14.0, 11.0, 23.0, 19.0, 24.0, 31.0, 33.0, 30.0, 36.0, 32.0, 36.0, 45.0, 43.0, 49.0, 41.0, 38.0, 43.0, 38.0, 35.0, 46.0, 35.0, 25.0, 39.0, 28.0, 29.0, 28.0, 13.0, 14.0, 12.0, 15.0, 14.0, 10.0, 7.0, 6.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.250918388366699, -6.986877918243408, -6.722837924957275, -6.458797454833984, -6.194757461547852, -5.9307169914245605, -5.6666765213012695, -5.402636528015137, -5.138596057891846, -4.874555587768555, -4.610515594482422, -4.346475124359131, -4.08243465423584, -3.818394660949707, -3.554354190826416, -3.290313959121704, -3.026273727416992, -2.7622334957122803, -2.4981932640075684, -2.2341527938842773, -1.9701125621795654, -1.7060723304748535, -1.442031979560852, -1.1779916286468506, -0.9139513969421387, -0.649911105632782, -0.3858708143234253, -0.1218305230140686, 0.14220976829528809, 0.40625, 0.6702903509140015, 0.9343307018280029, 1.1983709335327148, 1.4624111652374268, 1.7264515161514282, 1.9904918670654297, 2.2545320987701416, 2.5185723304748535, 2.7826128005981445, 3.0466530323028564, 3.3106932640075684, 3.5747334957122803, 3.838773727416992, 4.102814197540283, 4.366854667663574, 4.630894660949707, 4.894935131072998, 5.158975601196289, 5.423015594482422, 5.687056064605713, 5.951096057891846, 6.215136528015137, 6.4791765213012695, 6.7432169914245605, 7.007257461547852, 7.271297454833984, 7.535337924957275, 7.799378395080566, 8.0634183883667, 8.327458381652832, 8.591499328613281, 8.855539321899414, 9.119579315185547, 9.383620262145996, 9.647660255432129]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 12.0, 23.0, 35.0, 33.0, 71.0, 100.0, 156.0, 265.0, 398.0, 658.0, 1006.0, 1662.0, 2859.0, 4652.0, 7814.0, 13232.0, 22623.0, 38257.0, 63084.0, 99364.0, 138930.0, 164313.0, 156854.0, 122564.0, 82549.0, 51940.0, 30649.0, 18110.0, 10438.0, 6334.0, 3639.0, 2228.0, 1350.0, 845.0, 539.0, 308.0, 216.0, 159.0, 85.0, 69.0, 46.0, 26.0, 32.0, 5.0, 9.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.560791015625, -6.32470703125, -6.088623046875, -5.8525390625, -5.616455078125, -5.38037109375, -5.144287109375, -4.908203125, -4.672119140625, -4.43603515625, -4.199951171875, -3.9638671875, -3.727783203125, -3.49169921875, -3.255615234375, -3.01953125, -2.783447265625, -2.54736328125, -2.311279296875, -2.0751953125, -1.839111328125, -1.60302734375, -1.366943359375, -1.130859375, -0.894775390625, -0.65869140625, -0.422607421875, -0.1865234375, 0.049560546875, 0.28564453125, 0.521728515625, 0.7578125, 0.993896484375, 1.22998046875, 1.466064453125, 1.7021484375, 1.938232421875, 2.17431640625, 2.410400390625, 2.646484375, 2.882568359375, 3.11865234375, 3.354736328125, 3.5908203125, 3.826904296875, 4.06298828125, 4.299072265625, 4.53515625, 4.771240234375, 5.00732421875, 5.243408203125, 5.4794921875, 5.715576171875, 5.95166015625, 6.187744140625, 6.423828125, 6.659912109375, 6.89599609375, 7.132080078125, 7.3681640625, 7.604248046875, 7.84033203125, 8.076416015625, 8.3125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 11.0, 14.0, 21.0, 26.0, 22.0, 26.0, 28.0, 32.0, 49.0, 34.0, 44.0, 48.0, 48.0, 47.0, 34.0, 58.0, 57.0, 46.0, 46.0, 39.0, 34.0, 34.0, 22.0, 28.0, 21.0, 17.0, 17.0, 20.0, 11.0, 5.0, 6.0, 11.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.9765625, -8.6484375, -8.3203125, -7.9921875, -7.6640625, -7.3359375, -7.0078125, -6.6796875, -6.3515625, -6.0234375, -5.6953125, -5.3671875, -5.0390625, -4.7109375, -4.3828125, -4.0546875, -3.7265625, -3.3984375, -3.0703125, -2.7421875, -2.4140625, -2.0859375, -1.7578125, -1.4296875, -1.1015625, -0.7734375, -0.4453125, -0.1171875, 0.2109375, 0.5390625, 0.8671875, 1.1953125, 1.5234375, 1.8515625, 2.1796875, 2.5078125, 2.8359375, 3.1640625, 3.4921875, 3.8203125, 4.1484375, 4.4765625, 4.8046875, 5.1328125, 5.4609375, 5.7890625, 6.1171875, 6.4453125, 6.7734375, 7.1015625, 7.4296875, 7.7578125, 8.0859375, 8.4140625, 8.7421875, 9.0703125, 9.3984375, 9.7265625, 10.0546875, 10.3828125, 10.7109375, 11.0390625, 11.3671875, 11.6953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 9.0, 22.0, 18.0, 30.0, 58.0, 79.0, 116.0, 172.0, 261.0, 363.0, 522.0, 853.0, 1271.0, 2013.0, 3348.0, 5513.0, 9028.0, 15156.0, 25262.0, 43311.0, 72413.0, 116794.0, 168501.0, 187242.0, 149228.0, 98188.0, 60020.0, 35883.0, 20650.0, 12379.0, 7545.0, 4644.0, 2745.0, 1803.0, 1110.0, 663.0, 412.0, 285.0, 215.0, 120.0, 92.0, 69.0, 41.0, 32.0, 22.0, 13.0, 15.0, 6.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-8.9140625, -8.63818359375, -8.3623046875, -8.08642578125, -7.810546875, -7.53466796875, -7.2587890625, -6.98291015625, -6.70703125, -6.43115234375, -6.1552734375, -5.87939453125, -5.603515625, -5.32763671875, -5.0517578125, -4.77587890625, -4.5, -4.22412109375, -3.9482421875, -3.67236328125, -3.396484375, -3.12060546875, -2.8447265625, -2.56884765625, -2.29296875, -2.01708984375, -1.7412109375, -1.46533203125, -1.189453125, -0.91357421875, -0.6376953125, -0.36181640625, -0.0859375, 0.18994140625, 0.4658203125, 0.74169921875, 1.017578125, 1.29345703125, 1.5693359375, 1.84521484375, 2.12109375, 2.39697265625, 2.6728515625, 2.94873046875, 3.224609375, 3.50048828125, 3.7763671875, 4.05224609375, 4.328125, 4.60400390625, 4.8798828125, 5.15576171875, 5.431640625, 5.70751953125, 5.9833984375, 6.25927734375, 6.53515625, 6.81103515625, 7.0869140625, 7.36279296875, 7.638671875, 7.91455078125, 8.1904296875, 8.46630859375, 8.7421875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 4.0, 11.0, 14.0, 14.0, 15.0, 18.0, 20.0, 21.0, 27.0, 29.0, 28.0, 41.0, 26.0, 38.0, 45.0, 45.0, 38.0, 38.0, 49.0, 44.0, 41.0, 39.0, 46.0, 42.0, 32.0, 35.0, 24.0, 25.0, 21.0, 25.0, 17.0, 12.0, 12.0, 13.0, 9.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.74652099609375, -4.5711669921875, -4.39581298828125, -4.220458984375, -4.04510498046875, -3.8697509765625, -3.69439697265625, -3.51904296875, -3.34368896484375, -3.1683349609375, -2.99298095703125, -2.817626953125, -2.64227294921875, -2.4669189453125, -2.29156494140625, -2.1162109375, -1.94085693359375, -1.7655029296875, -1.59014892578125, -1.414794921875, -1.23944091796875, -1.0640869140625, -0.88873291015625, -0.71337890625, -0.53802490234375, -0.3626708984375, -0.18731689453125, -0.011962890625, 0.16339111328125, 0.3387451171875, 0.51409912109375, 0.689453125, 0.86480712890625, 1.0401611328125, 1.21551513671875, 1.390869140625, 1.56622314453125, 1.7415771484375, 1.91693115234375, 2.09228515625, 2.26763916015625, 2.4429931640625, 2.61834716796875, 2.793701171875, 2.96905517578125, 3.1444091796875, 3.31976318359375, 3.4951171875, 3.67047119140625, 3.8458251953125, 4.02117919921875, 4.196533203125, 4.37188720703125, 4.5472412109375, 4.72259521484375, 4.89794921875, 5.07330322265625, 5.2486572265625, 5.42401123046875, 5.599365234375, 5.77471923828125, 5.9500732421875, 6.12542724609375, 6.30078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 16.0, 15.0, 22.0, 39.0, 77.0, 113.0, 161.0, 275.0, 406.0, 678.0, 1121.0, 1847.0, 2928.0, 4989.0, 8315.0, 14539.0, 25520.0, 45036.0, 79193.0, 137057.0, 202794.0, 202844.0, 136084.0, 79425.0, 44611.0, 25176.0, 14539.0, 8236.0, 4978.0, 2923.0, 1711.0, 1126.0, 629.0, 408.0, 253.0, 153.0, 100.0, 82.0, 46.0, 29.0, 25.0, 18.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9140625, -4.76513671875, -4.6162109375, -4.46728515625, -4.318359375, -4.16943359375, -4.0205078125, -3.87158203125, -3.72265625, -3.57373046875, -3.4248046875, -3.27587890625, -3.126953125, -2.97802734375, -2.8291015625, -2.68017578125, -2.53125, -2.38232421875, -2.2333984375, -2.08447265625, -1.935546875, -1.78662109375, -1.6376953125, -1.48876953125, -1.33984375, -1.19091796875, -1.0419921875, -0.89306640625, -0.744140625, -0.59521484375, -0.4462890625, -0.29736328125, -0.1484375, 0.00048828125, 0.1494140625, 0.29833984375, 0.447265625, 0.59619140625, 0.7451171875, 0.89404296875, 1.04296875, 1.19189453125, 1.3408203125, 1.48974609375, 1.638671875, 1.78759765625, 1.9365234375, 2.08544921875, 2.234375, 2.38330078125, 2.5322265625, 2.68115234375, 2.830078125, 2.97900390625, 3.1279296875, 3.27685546875, 3.42578125, 3.57470703125, 3.7236328125, 3.87255859375, 4.021484375, 4.17041015625, 4.3193359375, 4.46826171875, 4.6171875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 11.0, 5.0, 16.0, 11.0, 25.0, 25.0, 31.0, 41.0, 42.0, 53.0, 58.0, 64.0, 54.0, 65.0, 70.0, 50.0, 68.0, 54.0, 36.0, 37.0, 45.0, 21.0, 22.0, 15.0, 23.0, 14.0, 7.0, 10.0, 5.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002429485321044922, -0.00023453310132026672, -0.00022611767053604126, -0.0002177022397518158, -0.00020928680896759033, -0.00020087137818336487, -0.0001924559473991394, -0.00018404051661491394, -0.00017562508583068848, -0.000167209655046463, -0.00015879422426223755, -0.00015037879347801208, -0.00014196336269378662, -0.00013354793190956116, -0.0001251325011253357, -0.00011671707034111023, -0.00010830163955688477, -9.98862087726593e-05, -9.147077798843384e-05, -8.305534720420837e-05, -7.463991641998291e-05, -6.622448563575745e-05, -5.780905485153198e-05, -4.939362406730652e-05, -4.0978193283081055e-05, -3.256276249885559e-05, -2.4147331714630127e-05, -1.5731900930404663e-05, -7.316470146179199e-06, 1.0989606380462646e-06, 9.514391422271729e-06, 1.7929822206497192e-05, 2.6345252990722656e-05, 3.476068377494812e-05, 4.3176114559173584e-05, 5.159154534339905e-05, 6.000697612762451e-05, 6.842240691184998e-05, 7.683783769607544e-05, 8.52532684803009e-05, 9.366869926452637e-05, 0.00010208413004875183, 0.0001104995608329773, 0.00011891499161720276, 0.00012733042240142822, 0.0001357458531856537, 0.00014416128396987915, 0.00015257671475410461, 0.00016099214553833008, 0.00016940757632255554, 0.000177823007106781, 0.00018623843789100647, 0.00019465386867523193, 0.0002030692994594574, 0.00021148473024368286, 0.00021990016102790833, 0.0002283155918121338, 0.00023673102259635925, 0.0002451464533805847, 0.0002535618841648102, 0.00026197731494903564, 0.0002703927457332611, 0.00027880817651748657, 0.00028722360730171204, 0.0002956390380859375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 16.0, 24.0, 40.0, 53.0, 75.0, 110.0, 159.0, 231.0, 354.0, 624.0, 865.0, 1396.0, 2068.0, 3336.0, 5329.0, 8479.0, 13566.0, 20736.0, 32973.0, 51534.0, 77120.0, 107484.0, 136071.0, 146233.0, 131985.0, 102713.0, 72381.0, 48189.0, 30708.0, 19558.0, 12439.0, 7856.0, 4987.0, 3111.0, 2002.0, 1314.0, 851.0, 510.0, 361.0, 265.0, 135.0, 98.0, 65.0, 41.0, 20.0, 23.0, 16.0, 16.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-3.458984375, -3.352294921875, -3.24560546875, -3.138916015625, -3.0322265625, -2.925537109375, -2.81884765625, -2.712158203125, -2.60546875, -2.498779296875, -2.39208984375, -2.285400390625, -2.1787109375, -2.072021484375, -1.96533203125, -1.858642578125, -1.751953125, -1.645263671875, -1.53857421875, -1.431884765625, -1.3251953125, -1.218505859375, -1.11181640625, -1.005126953125, -0.8984375, -0.791748046875, -0.68505859375, -0.578369140625, -0.4716796875, -0.364990234375, -0.25830078125, -0.151611328125, -0.044921875, 0.061767578125, 0.16845703125, 0.275146484375, 0.3818359375, 0.488525390625, 0.59521484375, 0.701904296875, 0.80859375, 0.915283203125, 1.02197265625, 1.128662109375, 1.2353515625, 1.342041015625, 1.44873046875, 1.555419921875, 1.662109375, 1.768798828125, 1.87548828125, 1.982177734375, 2.0888671875, 2.195556640625, 2.30224609375, 2.408935546875, 2.515625, 2.622314453125, 2.72900390625, 2.835693359375, 2.9423828125, 3.049072265625, 3.15576171875, 3.262451171875, 3.369140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 10.0, 5.0, 12.0, 19.0, 10.0, 16.0, 26.0, 20.0, 27.0, 27.0, 34.0, 29.0, 55.0, 37.0, 34.0, 46.0, 48.0, 49.0, 46.0, 42.0, 37.0, 41.0, 46.0, 32.0, 33.0, 29.0, 34.0, 22.0, 20.0, 13.0, 12.0, 11.0, 16.0, 13.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.96728515625, -0.93695068359375, -0.9066162109375, -0.87628173828125, -0.845947265625, -0.81561279296875, -0.7852783203125, -0.75494384765625, -0.724609375, -0.69427490234375, -0.6639404296875, -0.63360595703125, -0.603271484375, -0.57293701171875, -0.5426025390625, -0.51226806640625, -0.48193359375, -0.45159912109375, -0.4212646484375, -0.39093017578125, -0.360595703125, -0.33026123046875, -0.2999267578125, -0.26959228515625, -0.2392578125, -0.20892333984375, -0.1785888671875, -0.14825439453125, -0.117919921875, -0.08758544921875, -0.0572509765625, -0.02691650390625, 0.00341796875, 0.03375244140625, 0.0640869140625, 0.09442138671875, 0.124755859375, 0.15509033203125, 0.1854248046875, 0.21575927734375, 0.24609375, 0.27642822265625, 0.3067626953125, 0.33709716796875, 0.367431640625, 0.39776611328125, 0.4281005859375, 0.45843505859375, 0.48876953125, 0.51910400390625, 0.5494384765625, 0.57977294921875, 0.610107421875, 0.64044189453125, 0.6707763671875, 0.70111083984375, 0.7314453125, 0.76177978515625, 0.7921142578125, 0.82244873046875, 0.852783203125, 0.88311767578125, 0.9134521484375, 0.94378662109375, 0.97412109375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 23.0, 16.0, 39.0, 46.0, 48.0, 59.0, 80.0, 50.0, 85.0, 87.0, 92.0, 64.0, 48.0, 43.0, 43.0, 30.0, 25.0, 19.0, 14.0, 12.0, 15.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.877593994140625, -23.158777236938477, -22.439960479736328, -21.721141815185547, -21.0023250579834, -20.28350830078125, -19.5646915435791, -18.845874786376953, -18.127058029174805, -17.408241271972656, -16.689424514770508, -15.970606803894043, -15.251790046691895, -14.53297233581543, -13.814155578613281, -13.095338821411133, -12.376521110534668, -11.65770435333252, -10.938886642456055, -10.220069885253906, -9.501253128051758, -8.78243637084961, -8.063618659973145, -7.344801902770996, -6.6259846687316895, -5.907167434692383, -5.188350677490234, -4.469533443450928, -3.7507164478302, -3.0318994522094727, -2.313082218170166, -1.5942654609680176, -0.8754482269287109, -0.15663117170333862, 0.5621858835220337, 1.2810029983520508, 1.9998199939727783, 2.718636989593506, 3.4374542236328125, 4.156270980834961, 4.875088214874268, 5.593905448913574, 6.312722206115723, 7.031539440155029, 7.750356674194336, 8.469173431396484, 9.187990188598633, 9.906806945800781, 10.625624656677246, 11.344441413879395, 12.06325912475586, 12.782075881958008, 13.500892639160156, 14.219709396362305, 14.93852710723877, 15.657343864440918, 16.376161575317383, 17.09497833251953, 17.81379508972168, 18.532611846923828, 19.25143051147461, 19.970247268676758, 20.689064025878906, 21.407880783081055, 22.126697540283203]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 14.0, 13.0, 12.0, 14.0, 20.0, 25.0, 24.0, 23.0, 41.0, 26.0, 40.0, 30.0, 39.0, 43.0, 54.0, 48.0, 45.0, 37.0, 34.0, 55.0, 29.0, 38.0, 31.0, 33.0, 23.0, 42.0, 26.0, 19.0, 17.0, 16.0, 11.0, 17.0, 12.0, 10.0, 9.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34538459777832, -7.082252025604248, -6.819119453430176, -6.555986404418945, -6.292853832244873, -6.029721260070801, -5.76658821105957, -5.503455638885498, -5.240323066711426, -4.9771904945373535, -4.714057922363281, -4.450924873352051, -4.1877923011779785, -3.9246597290039062, -3.661526918411255, -3.3983941078186035, -3.1352615356445312, -2.872128963470459, -2.6089961528778076, -2.3458633422851562, -2.082730770111084, -1.8195980787277222, -1.5564653873443604, -1.2933326959609985, -1.0302000045776367, -0.7670673131942749, -0.5039346218109131, -0.24080193042755127, 0.022330760955810547, 0.28546345233917236, 0.5485961437225342, 0.811728835105896, 1.0748615264892578, 1.3379942178726196, 1.6011269092559814, 1.8642596006393433, 2.127392292022705, 2.3905248641967773, 2.6536576747894287, 2.91679048538208, 3.1799230575561523, 3.4430556297302246, 3.706188440322876, 3.9693212509155273, 4.2324538230896, 4.495586395263672, 4.758719444274902, 5.021852016448975, 5.284984588623047, 5.548117160797119, 5.811249732971191, 6.074382781982422, 6.337515354156494, 6.600647926330566, 6.863780975341797, 7.126913547515869, 7.390046119689941, 7.653178691864014, 7.916311264038086, 8.179444313049316, 8.442577362060547, 8.705709457397461, 8.968842506408691, 9.231974601745605, 9.495107650756836]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 5.0, 10.0, 22.0, 30.0, 54.0, 74.0, 112.0, 199.0, 247.0, 409.0, 625.0, 994.0, 1522.0, 2279.0, 3680.0, 5735.0, 9338.0, 14549.0, 22630.0, 34685.0, 51624.0, 73368.0, 98198.0, 119614.0, 129898.0, 123666.0, 105216.0, 80975.0, 57704.0, 39409.0, 25789.0, 16776.0, 10669.0, 6813.0, 4224.0, 2660.0, 1695.0, 1038.0, 703.0, 438.0, 289.0, 198.0, 123.0, 82.0, 61.0, 38.0, 18.0, 21.0, 16.0, 7.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.4921875, -8.223876953125, -7.95556640625, -7.687255859375, -7.4189453125, -7.150634765625, -6.88232421875, -6.614013671875, -6.345703125, -6.077392578125, -5.80908203125, -5.540771484375, -5.2724609375, -5.004150390625, -4.73583984375, -4.467529296875, -4.19921875, -3.930908203125, -3.66259765625, -3.394287109375, -3.1259765625, -2.857666015625, -2.58935546875, -2.321044921875, -2.052734375, -1.784423828125, -1.51611328125, -1.247802734375, -0.9794921875, -0.711181640625, -0.44287109375, -0.174560546875, 0.09375, 0.362060546875, 0.63037109375, 0.898681640625, 1.1669921875, 1.435302734375, 1.70361328125, 1.971923828125, 2.240234375, 2.508544921875, 2.77685546875, 3.045166015625, 3.3134765625, 3.581787109375, 3.85009765625, 4.118408203125, 4.38671875, 4.655029296875, 4.92333984375, 5.191650390625, 5.4599609375, 5.728271484375, 5.99658203125, 6.264892578125, 6.533203125, 6.801513671875, 7.06982421875, 7.338134765625, 7.6064453125, 7.874755859375, 8.14306640625, 8.411376953125, 8.6796875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 3.0, 6.0, 6.0, 6.0, 13.0, 17.0, 18.0, 19.0, 26.0, 25.0, 19.0, 30.0, 29.0, 37.0, 34.0, 42.0, 45.0, 38.0, 51.0, 48.0, 42.0, 37.0, 41.0, 40.0, 38.0, 32.0, 32.0, 26.0, 30.0, 26.0, 19.0, 20.0, 18.0, 22.0, 9.0, 17.0, 8.0, 8.0, 4.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.98095703125, -8.6884765625, -8.39599609375, -8.103515625, -7.81103515625, -7.5185546875, -7.22607421875, -6.93359375, -6.64111328125, -6.3486328125, -6.05615234375, -5.763671875, -5.47119140625, -5.1787109375, -4.88623046875, -4.59375, -4.30126953125, -4.0087890625, -3.71630859375, -3.423828125, -3.13134765625, -2.8388671875, -2.54638671875, -2.25390625, -1.96142578125, -1.6689453125, -1.37646484375, -1.083984375, -0.79150390625, -0.4990234375, -0.20654296875, 0.0859375, 0.37841796875, 0.6708984375, 0.96337890625, 1.255859375, 1.54833984375, 1.8408203125, 2.13330078125, 2.42578125, 2.71826171875, 3.0107421875, 3.30322265625, 3.595703125, 3.88818359375, 4.1806640625, 4.47314453125, 4.765625, 5.05810546875, 5.3505859375, 5.64306640625, 5.935546875, 6.22802734375, 6.5205078125, 6.81298828125, 7.10546875, 7.39794921875, 7.6904296875, 7.98291015625, 8.275390625, 8.56787109375, 8.8603515625, 9.15283203125, 9.4453125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 20.0, 28.0, 40.0, 42.0, 77.0, 152.0, 240.0, 330.0, 626.0, 1063.0, 1812.0, 3182.0, 5370.0, 9127.0, 15484.0, 25758.0, 41363.0, 64579.0, 94519.0, 125005.0, 146018.0, 142799.0, 121592.0, 90267.0, 60896.0, 39372.0, 23786.0, 14295.0, 8634.0, 4927.0, 2900.0, 1739.0, 977.0, 571.0, 347.0, 201.0, 142.0, 98.0, 54.0, 32.0, 19.0, 17.0, 5.0, 16.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-10.703125, -10.3876953125, -10.072265625, -9.7568359375, -9.44140625, -9.1259765625, -8.810546875, -8.4951171875, -8.1796875, -7.8642578125, -7.548828125, -7.2333984375, -6.91796875, -6.6025390625, -6.287109375, -5.9716796875, -5.65625, -5.3408203125, -5.025390625, -4.7099609375, -4.39453125, -4.0791015625, -3.763671875, -3.4482421875, -3.1328125, -2.8173828125, -2.501953125, -2.1865234375, -1.87109375, -1.5556640625, -1.240234375, -0.9248046875, -0.609375, -0.2939453125, 0.021484375, 0.3369140625, 0.65234375, 0.9677734375, 1.283203125, 1.5986328125, 1.9140625, 2.2294921875, 2.544921875, 2.8603515625, 3.17578125, 3.4912109375, 3.806640625, 4.1220703125, 4.4375, 4.7529296875, 5.068359375, 5.3837890625, 5.69921875, 6.0146484375, 6.330078125, 6.6455078125, 6.9609375, 7.2763671875, 7.591796875, 7.9072265625, 8.22265625, 8.5380859375, 8.853515625, 9.1689453125, 9.484375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 6.0, 5.0, 0.0, 8.0, 9.0, 7.0, 12.0, 12.0, 21.0, 21.0, 18.0, 25.0, 29.0, 31.0, 25.0, 36.0, 37.0, 38.0, 37.0, 44.0, 47.0, 42.0, 47.0, 45.0, 60.0, 37.0, 29.0, 41.0, 33.0, 35.0, 27.0, 25.0, 15.0, 19.0, 19.0, 11.0, 8.0, 13.0, 11.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.15234375, -5.9656982421875, -5.779052734375, -5.5924072265625, -5.40576171875, -5.2191162109375, -5.032470703125, -4.8458251953125, -4.6591796875, -4.4725341796875, -4.285888671875, -4.0992431640625, -3.91259765625, -3.7259521484375, -3.539306640625, -3.3526611328125, -3.166015625, -2.9793701171875, -2.792724609375, -2.6060791015625, -2.41943359375, -2.2327880859375, -2.046142578125, -1.8594970703125, -1.6728515625, -1.4862060546875, -1.299560546875, -1.1129150390625, -0.92626953125, -0.7396240234375, -0.552978515625, -0.3663330078125, -0.1796875, 0.0069580078125, 0.193603515625, 0.3802490234375, 0.56689453125, 0.7535400390625, 0.940185546875, 1.1268310546875, 1.3134765625, 1.5001220703125, 1.686767578125, 1.8734130859375, 2.06005859375, 2.2467041015625, 2.433349609375, 2.6199951171875, 2.806640625, 2.9932861328125, 3.179931640625, 3.3665771484375, 3.55322265625, 3.7398681640625, 3.926513671875, 4.1131591796875, 4.2998046875, 4.4864501953125, 4.673095703125, 4.8597412109375, 5.04638671875, 5.2330322265625, 5.419677734375, 5.6063232421875, 5.79296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 11.0, 16.0, 26.0, 36.0, 85.0, 101.0, 176.0, 256.0, 407.0, 671.0, 1035.0, 1745.0, 2885.0, 4683.0, 7473.0, 12163.0, 19602.0, 31126.0, 48066.0, 71451.0, 99613.0, 127535.0, 141185.0, 134357.0, 110737.0, 80653.0, 55881.0, 36157.0, 22990.0, 14427.0, 8830.0, 5346.0, 3220.0, 2142.0, 1302.0, 844.0, 493.0, 303.0, 184.0, 128.0, 83.0, 40.0, 31.0, 12.0, 15.0, 11.0, 9.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.02734375, -3.904083251953125, -3.78082275390625, -3.657562255859375, -3.5343017578125, -3.411041259765625, -3.28778076171875, -3.164520263671875, -3.041259765625, -2.917999267578125, -2.79473876953125, -2.671478271484375, -2.5482177734375, -2.424957275390625, -2.30169677734375, -2.178436279296875, -2.05517578125, -1.931915283203125, -1.80865478515625, -1.685394287109375, -1.5621337890625, -1.438873291015625, -1.31561279296875, -1.192352294921875, -1.069091796875, -0.945831298828125, -0.82257080078125, -0.699310302734375, -0.5760498046875, -0.452789306640625, -0.32952880859375, -0.206268310546875, -0.0830078125, 0.040252685546875, 0.16351318359375, 0.286773681640625, 0.4100341796875, 0.533294677734375, 0.65655517578125, 0.779815673828125, 0.903076171875, 1.026336669921875, 1.14959716796875, 1.272857666015625, 1.3961181640625, 1.519378662109375, 1.64263916015625, 1.765899658203125, 1.88916015625, 2.012420654296875, 2.13568115234375, 2.258941650390625, 2.3822021484375, 2.505462646484375, 2.62872314453125, 2.751983642578125, 2.875244140625, 2.998504638671875, 3.12176513671875, 3.245025634765625, 3.3682861328125, 3.491546630859375, 3.61480712890625, 3.738067626953125, 3.861328125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 9.0, 10.0, 6.0, 11.0, 18.0, 32.0, 36.0, 37.0, 53.0, 60.0, 59.0, 81.0, 87.0, 69.0, 66.0, 70.0, 51.0, 47.0, 36.0, 36.0, 33.0, 27.0, 19.0, 11.0, 11.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005793571472167969, -0.0005607008934020996, -0.0005420446395874023, -0.0005233883857727051, -0.0005047321319580078, -0.00048607587814331055, -0.0004674196243286133, -0.000448763370513916, -0.00043010711669921875, -0.0004114508628845215, -0.0003927946090698242, -0.00037413835525512695, -0.0003554821014404297, -0.0003368258476257324, -0.00031816959381103516, -0.0002995133399963379, -0.0002808570861816406, -0.00026220083236694336, -0.0002435445785522461, -0.00022488832473754883, -0.00020623207092285156, -0.0001875758171081543, -0.00016891956329345703, -0.00015026330947875977, -0.0001316070556640625, -0.00011295080184936523, -9.429454803466797e-05, -7.56382942199707e-05, -5.698204040527344e-05, -3.832578659057617e-05, -1.9669532775878906e-05, -1.0132789611816406e-06, 1.7642974853515625e-05, 3.629922866821289e-05, 5.4955482482910156e-05, 7.361173629760742e-05, 9.226799011230469e-05, 0.00011092424392700195, 0.00012958049774169922, 0.00014823675155639648, 0.00016689300537109375, 0.00018554925918579102, 0.00020420551300048828, 0.00022286176681518555, 0.0002415180206298828, 0.0002601742744445801, 0.00027883052825927734, 0.0002974867820739746, 0.0003161430358886719, 0.00033479928970336914, 0.0003534555435180664, 0.00037211179733276367, 0.00039076805114746094, 0.0004094243049621582, 0.00042808055877685547, 0.00044673681259155273, 0.00046539306640625, 0.00048404932022094727, 0.0005027055740356445, 0.0005213618278503418, 0.0005400180816650391, 0.0005586743354797363, 0.0005773305892944336, 0.0005959868431091309, 0.0006146430969238281]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 13.0, 21.0, 33.0, 49.0, 69.0, 119.0, 161.0, 248.0, 386.0, 572.0, 892.0, 1328.0, 2153.0, 3243.0, 5030.0, 7392.0, 11436.0, 17523.0, 25975.0, 38533.0, 55562.0, 74980.0, 97310.0, 115445.0, 124092.0, 116973.0, 98997.0, 76793.0, 55767.0, 39222.0, 26252.0, 17850.0, 11809.0, 7772.0, 4915.0, 3418.0, 2237.0, 1398.0, 916.0, 547.0, 338.0, 274.0, 169.0, 112.0, 76.0, 57.0, 25.0, 17.0, 21.0, 13.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.5390625, -3.433502197265625, -3.32794189453125, -3.222381591796875, -3.1168212890625, -3.011260986328125, -2.90570068359375, -2.800140380859375, -2.694580078125, -2.589019775390625, -2.48345947265625, -2.377899169921875, -2.2723388671875, -2.166778564453125, -2.06121826171875, -1.955657958984375, -1.85009765625, -1.744537353515625, -1.63897705078125, -1.533416748046875, -1.4278564453125, -1.322296142578125, -1.21673583984375, -1.111175537109375, -1.005615234375, -0.900054931640625, -0.79449462890625, -0.688934326171875, -0.5833740234375, -0.477813720703125, -0.37225341796875, -0.266693115234375, -0.1611328125, -0.055572509765625, 0.04998779296875, 0.155548095703125, 0.2611083984375, 0.366668701171875, 0.47222900390625, 0.577789306640625, 0.683349609375, 0.788909912109375, 0.89447021484375, 1.000030517578125, 1.1055908203125, 1.211151123046875, 1.31671142578125, 1.422271728515625, 1.52783203125, 1.633392333984375, 1.73895263671875, 1.844512939453125, 1.9500732421875, 2.055633544921875, 2.16119384765625, 2.266754150390625, 2.372314453125, 2.477874755859375, 2.58343505859375, 2.688995361328125, 2.7945556640625, 2.900115966796875, 3.00567626953125, 3.111236572265625, 3.216796875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 5.0, 6.0, 8.0, 11.0, 13.0, 11.0, 15.0, 13.0, 32.0, 24.0, 20.0, 27.0, 26.0, 34.0, 45.0, 38.0, 39.0, 35.0, 47.0, 44.0, 50.0, 40.0, 47.0, 36.0, 34.0, 33.0, 27.0, 38.0, 27.0, 24.0, 21.0, 18.0, 13.0, 12.0, 13.0, 12.0, 10.0, 13.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1240234375, -1.089202880859375, -1.05438232421875, -1.019561767578125, -0.9847412109375, -0.949920654296875, -0.91510009765625, -0.880279541015625, -0.845458984375, -0.810638427734375, -0.77581787109375, -0.740997314453125, -0.7061767578125, -0.671356201171875, -0.63653564453125, -0.601715087890625, -0.56689453125, -0.532073974609375, -0.49725341796875, -0.462432861328125, -0.4276123046875, -0.392791748046875, -0.35797119140625, -0.323150634765625, -0.288330078125, -0.253509521484375, -0.21868896484375, -0.183868408203125, -0.1490478515625, -0.114227294921875, -0.07940673828125, -0.044586181640625, -0.009765625, 0.025054931640625, 0.05987548828125, 0.094696044921875, 0.1295166015625, 0.164337158203125, 0.19915771484375, 0.233978271484375, 0.268798828125, 0.303619384765625, 0.33843994140625, 0.373260498046875, 0.4080810546875, 0.442901611328125, 0.47772216796875, 0.512542724609375, 0.54736328125, 0.582183837890625, 0.61700439453125, 0.651824951171875, 0.6866455078125, 0.721466064453125, 0.75628662109375, 0.791107177734375, 0.825927734375, 0.860748291015625, 0.89556884765625, 0.930389404296875, 0.9652099609375, 1.000030517578125, 1.03485107421875, 1.069671630859375, 1.1044921875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 3.0, 5.0, 10.0, 15.0, 21.0, 27.0, 31.0, 43.0, 41.0, 66.0, 74.0, 83.0, 78.0, 77.0, 81.0, 65.0, 52.0, 51.0, 40.0, 32.0, 22.0, 12.0, 16.0, 15.0, 10.0, 7.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.025188446044922, -24.291629791259766, -23.558069229125977, -22.82451057434082, -22.09095001220703, -21.357391357421875, -20.62383270263672, -19.89027214050293, -19.15671157836914, -18.423152923583984, -17.689592361450195, -16.95603370666504, -16.22247314453125, -15.488914489746094, -14.755354881286621, -14.021795272827148, -13.288236618041992, -12.55467700958252, -11.821117401123047, -11.08755874633789, -10.353998184204102, -9.620439529418945, -8.886879920959473, -8.1533203125, -7.419760704040527, -6.686201095581055, -5.952641487121582, -5.219082355499268, -4.485522747039795, -3.7519631385803223, -3.018404006958008, -2.284844398498535, -1.5512828826904297, -0.8177233934402466, -0.08416390419006348, 0.6493954658508301, 1.3829550743103027, 2.1165146827697754, 2.85007381439209, 3.5836334228515625, 4.317193031311035, 5.050752639770508, 5.7843122482299805, 6.517871379852295, 7.251430988311768, 7.98499059677124, 8.718549728393555, 9.452109336853027, 10.1856689453125, 10.919228553771973, 11.652788162231445, 12.386346817016602, 13.11990737915039, 13.853466033935547, 14.58702564239502, 15.320585250854492, 16.05414581298828, 16.787704467773438, 17.521265029907227, 18.254823684692383, 18.988384246826172, 19.721942901611328, 20.455501556396484, 21.189062118530273, 21.92262077331543]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 14.0, 19.0, 19.0, 14.0, 28.0, 17.0, 27.0, 29.0, 51.0, 36.0, 36.0, 40.0, 49.0, 51.0, 50.0, 41.0, 50.0, 33.0, 36.0, 36.0, 40.0, 24.0, 36.0, 32.0, 18.0, 17.0, 23.0, 16.0, 18.0, 5.0, 13.0, 15.0, 7.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.810589790344238, -8.527017593383789, -8.243444442749023, -7.959872245788574, -7.676299571990967, -7.392726898193359, -7.10915470123291, -6.825582027435303, -6.542009353637695, -6.258436679840088, -5.9748640060424805, -5.691291809082031, -5.407719135284424, -5.124146461486816, -4.840574264526367, -4.55700159072876, -4.273428916931152, -3.989856243133545, -3.7062838077545166, -3.4227113723754883, -3.139138698577881, -2.8555660247802734, -2.571993589401245, -2.288421154022217, -2.0048484802246094, -1.7212759256362915, -1.4377033710479736, -1.1541308164596558, -0.8705582618713379, -0.58698570728302, -0.30341315269470215, -0.019840598106384277, 0.2637319564819336, 0.5473045110702515, 0.8308770656585693, 1.1144496202468872, 1.398022174835205, 1.681594729423523, 1.9651672840118408, 2.248739719390869, 2.5323123931884766, 2.815885066986084, 3.0994575023651123, 3.3830299377441406, 3.666602611541748, 3.9501752853393555, 4.233747482299805, 4.517320156097412, 4.8008928298950195, 5.084465503692627, 5.368038177490234, 5.651610374450684, 5.935183048248291, 6.218755722045898, 6.502327919006348, 6.785900592803955, 7.0694732666015625, 7.35304594039917, 7.636618614196777, 7.920190811157227, 8.203763961791992, 8.487336158752441, 8.77090835571289, 9.054481506347656, 9.338053703308105]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 15.0, 18.0, 26.0, 37.0, 56.0, 76.0, 95.0, 140.0, 246.0, 385.0, 582.0, 976.0, 1832.0, 3084.0, 5583.0, 10401.0, 20757.0, 42792.0, 93038.0, 215440.0, 529385.0, 1138360.0, 1166090.0, 551700.0, 224289.0, 95870.0, 44702.0, 22163.0, 11593.0, 6191.0, 3370.0, 1922.0, 1154.0, 723.0, 433.0, 243.0, 178.0, 99.0, 75.0, 45.0, 32.0, 29.0, 18.0, 15.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.578125, -17.998046875, -17.41796875, -16.837890625, -16.2578125, -15.677734375, -15.09765625, -14.517578125, -13.9375, -13.357421875, -12.77734375, -12.197265625, -11.6171875, -11.037109375, -10.45703125, -9.876953125, -9.296875, -8.716796875, -8.13671875, -7.556640625, -6.9765625, -6.396484375, -5.81640625, -5.236328125, -4.65625, -4.076171875, -3.49609375, -2.916015625, -2.3359375, -1.755859375, -1.17578125, -0.595703125, -0.015625, 0.564453125, 1.14453125, 1.724609375, 2.3046875, 2.884765625, 3.46484375, 4.044921875, 4.625, 5.205078125, 5.78515625, 6.365234375, 6.9453125, 7.525390625, 8.10546875, 8.685546875, 9.265625, 9.845703125, 10.42578125, 11.005859375, 11.5859375, 12.166015625, 12.74609375, 13.326171875, 13.90625, 14.486328125, 15.06640625, 15.646484375, 16.2265625, 16.806640625, 17.38671875, 17.966796875, 18.546875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 14.0, 16.0, 19.0, 18.0, 12.0, 26.0, 39.0, 28.0, 23.0, 37.0, 37.0, 32.0, 38.0, 34.0, 42.0, 41.0, 57.0, 43.0, 51.0, 48.0, 35.0, 33.0, 27.0, 35.0, 35.0, 31.0, 18.0, 16.0, 17.0, 10.0, 10.0, 12.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1015625, -6.87933349609375, -6.6571044921875, -6.43487548828125, -6.212646484375, -5.99041748046875, -5.7681884765625, -5.54595947265625, -5.32373046875, -5.10150146484375, -4.8792724609375, -4.65704345703125, -4.434814453125, -4.21258544921875, -3.9903564453125, -3.76812744140625, -3.5458984375, -3.32366943359375, -3.1014404296875, -2.87921142578125, -2.656982421875, -2.43475341796875, -2.2125244140625, -1.99029541015625, -1.76806640625, -1.54583740234375, -1.3236083984375, -1.10137939453125, -0.879150390625, -0.65692138671875, -0.4346923828125, -0.21246337890625, 0.009765625, 0.23199462890625, 0.4542236328125, 0.67645263671875, 0.898681640625, 1.12091064453125, 1.3431396484375, 1.56536865234375, 1.78759765625, 2.00982666015625, 2.2320556640625, 2.45428466796875, 2.676513671875, 2.89874267578125, 3.1209716796875, 3.34320068359375, 3.5654296875, 3.78765869140625, 4.0098876953125, 4.23211669921875, 4.454345703125, 4.67657470703125, 4.8988037109375, 5.12103271484375, 5.34326171875, 5.56549072265625, 5.7877197265625, 6.00994873046875, 6.232177734375, 6.45440673828125, 6.6766357421875, 6.89886474609375, 7.12109375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 13.0, 21.0, 42.0, 65.0, 91.0, 146.0, 236.0, 333.0, 566.0, 902.0, 1471.0, 2358.0, 3987.0, 6940.0, 11424.0, 20366.0, 36080.0, 65018.0, 120805.0, 226193.0, 421760.0, 721622.0, 920162.0, 718435.0, 420285.0, 224840.0, 119826.0, 64875.0, 36088.0, 20102.0, 11835.0, 6865.0, 4089.0, 2491.0, 1479.0, 880.0, 606.0, 368.0, 222.0, 132.0, 88.0, 57.0, 41.0, 26.0, 12.0, 14.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-16.40625, -15.9306640625, -15.455078125, -14.9794921875, -14.50390625, -14.0283203125, -13.552734375, -13.0771484375, -12.6015625, -12.1259765625, -11.650390625, -11.1748046875, -10.69921875, -10.2236328125, -9.748046875, -9.2724609375, -8.796875, -8.3212890625, -7.845703125, -7.3701171875, -6.89453125, -6.4189453125, -5.943359375, -5.4677734375, -4.9921875, -4.5166015625, -4.041015625, -3.5654296875, -3.08984375, -2.6142578125, -2.138671875, -1.6630859375, -1.1875, -0.7119140625, -0.236328125, 0.2392578125, 0.71484375, 1.1904296875, 1.666015625, 2.1416015625, 2.6171875, 3.0927734375, 3.568359375, 4.0439453125, 4.51953125, 4.9951171875, 5.470703125, 5.9462890625, 6.421875, 6.8974609375, 7.373046875, 7.8486328125, 8.32421875, 8.7998046875, 9.275390625, 9.7509765625, 10.2265625, 10.7021484375, 11.177734375, 11.6533203125, 12.12890625, 12.6044921875, 13.080078125, 13.5556640625, 14.03125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 6.0, 10.0, 7.0, 10.0, 15.0, 25.0, 18.0, 38.0, 45.0, 65.0, 92.0, 119.0, 166.0, 174.0, 234.0, 269.0, 287.0, 311.0, 293.0, 301.0, 281.0, 259.0, 232.0, 178.0, 133.0, 111.0, 74.0, 86.0, 66.0, 36.0, 32.0, 30.0, 15.0, 13.0, 13.0, 8.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.74609375, -5.5792236328125, -5.412353515625, -5.2454833984375, -5.07861328125, -4.9117431640625, -4.744873046875, -4.5780029296875, -4.4111328125, -4.2442626953125, -4.077392578125, -3.9105224609375, -3.74365234375, -3.5767822265625, -3.409912109375, -3.2430419921875, -3.076171875, -2.9093017578125, -2.742431640625, -2.5755615234375, -2.40869140625, -2.2418212890625, -2.074951171875, -1.9080810546875, -1.7412109375, -1.5743408203125, -1.407470703125, -1.2406005859375, -1.07373046875, -0.9068603515625, -0.739990234375, -0.5731201171875, -0.40625, -0.2393798828125, -0.072509765625, 0.0943603515625, 0.26123046875, 0.4281005859375, 0.594970703125, 0.7618408203125, 0.9287109375, 1.0955810546875, 1.262451171875, 1.4293212890625, 1.59619140625, 1.7630615234375, 1.929931640625, 2.0968017578125, 2.263671875, 2.4305419921875, 2.597412109375, 2.7642822265625, 2.93115234375, 3.0980224609375, 3.264892578125, 3.4317626953125, 3.5986328125, 3.7655029296875, 3.932373046875, 4.0992431640625, 4.26611328125, 4.4329833984375, 4.599853515625, 4.7667236328125, 4.93359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 8.0, 6.0, 12.0, 14.0, 33.0, 33.0, 22.0, 41.0, 54.0, 54.0, 68.0, 71.0, 61.0, 77.0, 73.0, 56.0, 53.0, 42.0, 35.0, 32.0, 32.0, 15.0, 20.0, 10.0, 4.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.09366798400879, -18.480443954467773, -17.867218017578125, -17.25399398803711, -16.64076805114746, -16.027544021606445, -15.414319038391113, -14.801094055175781, -14.18786907196045, -13.574644088745117, -12.961419105529785, -12.348194122314453, -11.734970092773438, -11.121744155883789, -10.508520126342773, -9.895295143127441, -9.28207015991211, -8.668845176696777, -8.055620193481445, -7.4423956871032715, -6.8291707038879395, -6.215945720672607, -5.602721214294434, -4.989496231079102, -4.3762712478637695, -3.7630462646484375, -3.1498215198516846, -2.5365967750549316, -1.9233717918395996, -1.3101468086242676, -0.6969220638275146, -0.08369731903076172, 0.5295276641845703, 1.1427525281906128, 1.7559773921966553, 2.369202136993408, 2.9824271202087402, 3.5956521034240723, 4.208876609802246, 4.822101593017578, 5.43532657623291, 6.048551559448242, 6.661776542663574, 7.275001049041748, 7.88822603225708, 8.50145149230957, 9.114675521850586, 9.727900505065918, 10.34112548828125, 10.954350471496582, 11.567575454711914, 12.180800437927246, 12.794025421142578, 13.407249450683594, 14.020474433898926, 14.633699417114258, 15.24692440032959, 15.860149383544922, 16.473373413085938, 17.086599349975586, 17.6998233795166, 18.31304931640625, 18.926273345947266, 19.53949737548828, 20.15272331237793]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 7.0, 3.0, 5.0, 9.0, 13.0, 13.0, 14.0, 11.0, 22.0, 30.0, 32.0, 19.0, 33.0, 37.0, 35.0, 44.0, 45.0, 39.0, 45.0, 45.0, 59.0, 56.0, 41.0, 36.0, 37.0, 42.0, 24.0, 24.0, 24.0, 17.0, 19.0, 28.0, 18.0, 10.0, 14.0, 5.0, 11.0, 9.0, 5.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.348005294799805, -8.07004165649414, -7.792078018188477, -7.5141143798828125, -7.236151218414307, -6.958187580108643, -6.6802239418029785, -6.4022603034973145, -6.124297142028809, -5.8463335037231445, -5.5683698654174805, -5.290406227111816, -5.0124430656433105, -4.7344794273376465, -4.456515789031982, -4.178552150726318, -3.9005885124206543, -3.6226248741149902, -3.3446614742279053, -3.066697835922241, -2.7887344360351562, -2.510770797729492, -2.232807159423828, -1.9548436403274536, -1.676880121231079, -1.3989166021347046, -1.12095308303833, -0.842989444732666, -0.5650259256362915, -0.287062406539917, -0.00909876823425293, 0.2688647508621216, 0.5468282699584961, 0.8247917890548706, 1.1027553081512451, 1.3807189464569092, 1.6586824655532837, 1.9366459846496582, 2.2146096229553223, 2.4925732612609863, 2.7705366611480713, 3.0485002994537354, 3.3264636993408203, 3.6044273376464844, 3.8823909759521484, 4.1603546142578125, 4.438318252563477, 4.716281414031982, 4.9942450523376465, 5.2722086906433105, 5.550172328948975, 5.8281354904174805, 6.1060991287231445, 6.384062767028809, 6.662026405334473, 6.939990043640137, 7.217953681945801, 7.495917320251465, 7.773880958557129, 8.051844596862793, 8.329808235168457, 8.607770919799805, 8.885734558105469, 9.163698196411133, 9.441661834716797]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 9.0, 11.0, 22.0, 28.0, 54.0, 79.0, 132.0, 206.0, 329.0, 567.0, 920.0, 1618.0, 3055.0, 5831.0, 11472.0, 22080.0, 42717.0, 80288.0, 136228.0, 192485.0, 199576.0, 152880.0, 93059.0, 50670.0, 25750.0, 13353.0, 6939.0, 3566.0, 1928.0, 1112.0, 625.0, 332.0, 210.0, 137.0, 92.0, 53.0, 35.0, 25.0, 16.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0], "bins": [-9.296875, -9.0162353515625, -8.735595703125, -8.4549560546875, -8.17431640625, -7.8936767578125, -7.613037109375, -7.3323974609375, -7.0517578125, -6.7711181640625, -6.490478515625, -6.2098388671875, -5.92919921875, -5.6485595703125, -5.367919921875, -5.0872802734375, -4.806640625, -4.5260009765625, -4.245361328125, -3.9647216796875, -3.68408203125, -3.4034423828125, -3.122802734375, -2.8421630859375, -2.5615234375, -2.2808837890625, -2.000244140625, -1.7196044921875, -1.43896484375, -1.1583251953125, -0.877685546875, -0.5970458984375, -0.31640625, -0.0357666015625, 0.244873046875, 0.5255126953125, 0.80615234375, 1.0867919921875, 1.367431640625, 1.6480712890625, 1.9287109375, 2.2093505859375, 2.489990234375, 2.7706298828125, 3.05126953125, 3.3319091796875, 3.612548828125, 3.8931884765625, 4.173828125, 4.4544677734375, 4.735107421875, 5.0157470703125, 5.29638671875, 5.5770263671875, 5.857666015625, 6.1383056640625, 6.4189453125, 6.6995849609375, 6.980224609375, 7.2608642578125, 7.54150390625, 7.8221435546875, 8.102783203125, 8.3834228515625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 13.0, 15.0, 11.0, 24.0, 19.0, 27.0, 25.0, 33.0, 27.0, 33.0, 32.0, 48.0, 34.0, 37.0, 54.0, 36.0, 50.0, 49.0, 40.0, 34.0, 36.0, 40.0, 32.0, 29.0, 27.0, 26.0, 20.0, 14.0, 17.0, 24.0, 5.0, 14.0, 18.0, 6.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1484375, -7.850830078125, -7.55322265625, -7.255615234375, -6.9580078125, -6.660400390625, -6.36279296875, -6.065185546875, -5.767578125, -5.469970703125, -5.17236328125, -4.874755859375, -4.5771484375, -4.279541015625, -3.98193359375, -3.684326171875, -3.38671875, -3.089111328125, -2.79150390625, -2.493896484375, -2.1962890625, -1.898681640625, -1.60107421875, -1.303466796875, -1.005859375, -0.708251953125, -0.41064453125, -0.113037109375, 0.1845703125, 0.482177734375, 0.77978515625, 1.077392578125, 1.375, 1.672607421875, 1.97021484375, 2.267822265625, 2.5654296875, 2.863037109375, 3.16064453125, 3.458251953125, 3.755859375, 4.053466796875, 4.35107421875, 4.648681640625, 4.9462890625, 5.243896484375, 5.54150390625, 5.839111328125, 6.13671875, 6.434326171875, 6.73193359375, 7.029541015625, 7.3271484375, 7.624755859375, 7.92236328125, 8.219970703125, 8.517578125, 8.815185546875, 9.11279296875, 9.410400390625, 9.7080078125, 10.005615234375, 10.30322265625, 10.600830078125, 10.8984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 14.0, 23.0, 32.0, 47.0, 100.0, 118.0, 187.0, 311.0, 587.0, 953.0, 1695.0, 3265.0, 6600.0, 13247.0, 28096.0, 60577.0, 127494.0, 228609.0, 258409.0, 164087.0, 80825.0, 38001.0, 17462.0, 8398.0, 4197.0, 2226.0, 1193.0, 718.0, 413.0, 259.0, 140.0, 90.0, 56.0, 43.0, 19.0, 18.0, 9.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.88720703125, -10.5009765625, -10.11474609375, -9.728515625, -9.34228515625, -8.9560546875, -8.56982421875, -8.18359375, -7.79736328125, -7.4111328125, -7.02490234375, -6.638671875, -6.25244140625, -5.8662109375, -5.47998046875, -5.09375, -4.70751953125, -4.3212890625, -3.93505859375, -3.548828125, -3.16259765625, -2.7763671875, -2.39013671875, -2.00390625, -1.61767578125, -1.2314453125, -0.84521484375, -0.458984375, -0.07275390625, 0.3134765625, 0.69970703125, 1.0859375, 1.47216796875, 1.8583984375, 2.24462890625, 2.630859375, 3.01708984375, 3.4033203125, 3.78955078125, 4.17578125, 4.56201171875, 4.9482421875, 5.33447265625, 5.720703125, 6.10693359375, 6.4931640625, 6.87939453125, 7.265625, 7.65185546875, 8.0380859375, 8.42431640625, 8.810546875, 9.19677734375, 9.5830078125, 9.96923828125, 10.35546875, 10.74169921875, 11.1279296875, 11.51416015625, 11.900390625, 12.28662109375, 12.6728515625, 13.05908203125, 13.4453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 4.0, 8.0, 17.0, 12.0, 7.0, 14.0, 22.0, 13.0, 21.0, 18.0, 17.0, 33.0, 33.0, 30.0, 28.0, 40.0, 35.0, 32.0, 32.0, 31.0, 38.0, 45.0, 42.0, 39.0, 40.0, 44.0, 39.0, 27.0, 32.0, 30.0, 23.0, 26.0, 16.0, 21.0, 16.0, 16.0, 15.0, 13.0, 4.0, 5.0, 4.0, 0.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-5.390625, -5.22869873046875, -5.0667724609375, -4.90484619140625, -4.742919921875, -4.58099365234375, -4.4190673828125, -4.25714111328125, -4.09521484375, -3.93328857421875, -3.7713623046875, -3.60943603515625, -3.447509765625, -3.28558349609375, -3.1236572265625, -2.96173095703125, -2.7998046875, -2.63787841796875, -2.4759521484375, -2.31402587890625, -2.152099609375, -1.99017333984375, -1.8282470703125, -1.66632080078125, -1.50439453125, -1.34246826171875, -1.1805419921875, -1.01861572265625, -0.856689453125, -0.69476318359375, -0.5328369140625, -0.37091064453125, -0.208984375, -0.04705810546875, 0.1148681640625, 0.27679443359375, 0.438720703125, 0.60064697265625, 0.7625732421875, 0.92449951171875, 1.08642578125, 1.24835205078125, 1.4102783203125, 1.57220458984375, 1.734130859375, 1.89605712890625, 2.0579833984375, 2.21990966796875, 2.3818359375, 2.54376220703125, 2.7056884765625, 2.86761474609375, 3.029541015625, 3.19146728515625, 3.3533935546875, 3.51531982421875, 3.67724609375, 3.83917236328125, 4.0010986328125, 4.16302490234375, 4.324951171875, 4.48687744140625, 4.6488037109375, 4.81072998046875, 4.97265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 9.0, 15.0, 10.0, 21.0, 28.0, 41.0, 58.0, 72.0, 104.0, 178.0, 251.0, 452.0, 666.0, 1256.0, 2184.0, 4515.0, 9895.0, 23368.0, 60254.0, 159746.0, 335123.0, 267527.0, 109246.0, 41607.0, 16828.0, 7162.0, 3492.0, 1843.0, 991.0, 556.0, 320.0, 231.0, 154.0, 103.0, 59.0, 44.0, 47.0, 26.0, 18.0, 8.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.6328125, -8.36962890625, -8.1064453125, -7.84326171875, -7.580078125, -7.31689453125, -7.0537109375, -6.79052734375, -6.52734375, -6.26416015625, -6.0009765625, -5.73779296875, -5.474609375, -5.21142578125, -4.9482421875, -4.68505859375, -4.421875, -4.15869140625, -3.8955078125, -3.63232421875, -3.369140625, -3.10595703125, -2.8427734375, -2.57958984375, -2.31640625, -2.05322265625, -1.7900390625, -1.52685546875, -1.263671875, -1.00048828125, -0.7373046875, -0.47412109375, -0.2109375, 0.05224609375, 0.3154296875, 0.57861328125, 0.841796875, 1.10498046875, 1.3681640625, 1.63134765625, 1.89453125, 2.15771484375, 2.4208984375, 2.68408203125, 2.947265625, 3.21044921875, 3.4736328125, 3.73681640625, 4.0, 4.26318359375, 4.5263671875, 4.78955078125, 5.052734375, 5.31591796875, 5.5791015625, 5.84228515625, 6.10546875, 6.36865234375, 6.6318359375, 6.89501953125, 7.158203125, 7.42138671875, 7.6845703125, 7.94775390625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 7.0, 4.0, 7.0, 14.0, 25.0, 29.0, 25.0, 39.0, 50.0, 47.0, 72.0, 91.0, 79.0, 90.0, 83.0, 56.0, 53.0, 48.0, 42.0, 38.0, 24.0, 25.0, 13.0, 6.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331878662109375, -0.000321120023727417, -0.000310361385345459, -0.000299602746963501, -0.00028884410858154297, -0.00027808547019958496, -0.00026732683181762695, -0.00025656819343566895, -0.00024580955505371094, -0.00023505091667175293, -0.00022429227828979492, -0.00021353363990783691, -0.0002027750015258789, -0.0001920163631439209, -0.0001812577247619629, -0.00017049908638000488, -0.00015974044799804688, -0.00014898180961608887, -0.00013822317123413086, -0.00012746453285217285, -0.00011670589447021484, -0.00010594725608825684, -9.518861770629883e-05, -8.442997932434082e-05, -7.367134094238281e-05, -6.29127025604248e-05, -5.21540641784668e-05, -4.139542579650879e-05, -3.063678741455078e-05, -1.9878149032592773e-05, -9.119510650634766e-06, 1.6391277313232422e-06, 1.239776611328125e-05, 2.3156404495239258e-05, 3.3915042877197266e-05, 4.4673681259155273e-05, 5.543231964111328e-05, 6.619095802307129e-05, 7.69495964050293e-05, 8.77082347869873e-05, 9.846687316894531e-05, 0.00010922551155090332, 0.00011998414993286133, 0.00013074278831481934, 0.00014150142669677734, 0.00015226006507873535, 0.00016301870346069336, 0.00017377734184265137, 0.00018453598022460938, 0.00019529461860656738, 0.0002060532569885254, 0.0002168118953704834, 0.0002275705337524414, 0.00023832917213439941, 0.0002490878105163574, 0.00025984644889831543, 0.00027060508728027344, 0.00028136372566223145, 0.00029212236404418945, 0.00030288100242614746, 0.00031363964080810547, 0.0003243982791900635, 0.0003351569175720215, 0.0003459155559539795, 0.0003566741943359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 9.0, 12.0, 16.0, 25.0, 32.0, 54.0, 88.0, 130.0, 192.0, 279.0, 508.0, 790.0, 1422.0, 2519.0, 4805.0, 9615.0, 20909.0, 47211.0, 104500.0, 202442.0, 264023.0, 199587.0, 102411.0, 46173.0, 20671.0, 9493.0, 4655.0, 2431.0, 1387.0, 798.0, 509.0, 313.0, 177.0, 122.0, 72.0, 58.0, 51.0, 21.0, 12.0, 14.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.43243408203125, -6.2281494140625, -6.02386474609375, -5.819580078125, -5.61529541015625, -5.4110107421875, -5.20672607421875, -5.00244140625, -4.79815673828125, -4.5938720703125, -4.38958740234375, -4.185302734375, -3.98101806640625, -3.7767333984375, -3.57244873046875, -3.3681640625, -3.16387939453125, -2.9595947265625, -2.75531005859375, -2.551025390625, -2.34674072265625, -2.1424560546875, -1.93817138671875, -1.73388671875, -1.52960205078125, -1.3253173828125, -1.12103271484375, -0.916748046875, -0.71246337890625, -0.5081787109375, -0.30389404296875, -0.099609375, 0.10467529296875, 0.3089599609375, 0.51324462890625, 0.717529296875, 0.92181396484375, 1.1260986328125, 1.33038330078125, 1.53466796875, 1.73895263671875, 1.9432373046875, 2.14752197265625, 2.351806640625, 2.55609130859375, 2.7603759765625, 2.96466064453125, 3.1689453125, 3.37322998046875, 3.5775146484375, 3.78179931640625, 3.986083984375, 4.19036865234375, 4.3946533203125, 4.59893798828125, 4.80322265625, 5.00750732421875, 5.2117919921875, 5.41607666015625, 5.620361328125, 5.82464599609375, 6.0289306640625, 6.23321533203125, 6.4375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 8.0, 6.0, 9.0, 8.0, 26.0, 31.0, 40.0, 37.0, 46.0, 53.0, 51.0, 53.0, 62.0, 64.0, 83.0, 57.0, 71.0, 49.0, 49.0, 32.0, 35.0, 33.0, 18.0, 23.0, 8.0, 12.0, 11.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.339019775390625, -1.29034423828125, -1.241668701171875, -1.1929931640625, -1.144317626953125, -1.09564208984375, -1.046966552734375, -0.998291015625, -0.949615478515625, -0.90093994140625, -0.852264404296875, -0.8035888671875, -0.754913330078125, -0.70623779296875, -0.657562255859375, -0.60888671875, -0.560211181640625, -0.51153564453125, -0.462860107421875, -0.4141845703125, -0.365509033203125, -0.31683349609375, -0.268157958984375, -0.219482421875, -0.170806884765625, -0.12213134765625, -0.073455810546875, -0.0247802734375, 0.023895263671875, 0.07257080078125, 0.121246337890625, 0.169921875, 0.218597412109375, 0.26727294921875, 0.315948486328125, 0.3646240234375, 0.413299560546875, 0.46197509765625, 0.510650634765625, 0.559326171875, 0.608001708984375, 0.65667724609375, 0.705352783203125, 0.7540283203125, 0.802703857421875, 0.85137939453125, 0.900054931640625, 0.94873046875, 0.997406005859375, 1.04608154296875, 1.094757080078125, 1.1434326171875, 1.192108154296875, 1.24078369140625, 1.289459228515625, 1.338134765625, 1.386810302734375, 1.43548583984375, 1.484161376953125, 1.5328369140625, 1.581512451171875, 1.63018798828125, 1.678863525390625, 1.7275390625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 5.0, 8.0, 9.0, 20.0, 24.0, 30.0, 32.0, 27.0, 43.0, 55.0, 54.0, 54.0, 64.0, 71.0, 65.0, 72.0, 54.0, 49.0, 37.0, 35.0, 25.0, 32.0, 20.0, 18.0, 15.0, 9.0, 11.0, 9.0, 3.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.752038955688477, -17.176942825317383, -16.601844787597656, -16.026748657226562, -15.451651573181152, -14.876554489135742, -14.301458358764648, -13.726361274719238, -13.151264190673828, -12.576167106628418, -12.001070022583008, -11.425973892211914, -10.850876808166504, -10.275779724121094, -9.70068359375, -9.12558650970459, -8.55048942565918, -7.9753923416137695, -7.400295734405518, -6.825199127197266, -6.2501020431518555, -5.675004959106445, -5.099908351898193, -4.524811744689941, -3.9497146606445312, -3.3746178150177, -2.799520969390869, -2.224424123764038, -1.649327278137207, -1.074230432510376, -0.4991335868835449, 0.07596302032470703, 0.6510601043701172, 1.2261569499969482, 1.8012537956237793, 2.3763506412506104, 2.9514474868774414, 3.5265443325042725, 4.1016411781311035, 4.6767377853393555, 5.251834869384766, 5.826931953430176, 6.402028560638428, 6.97712516784668, 7.55222225189209, 8.1273193359375, 8.702415466308594, 9.277512550354004, 9.852609634399414, 10.427706718444824, 11.002803802490234, 11.577899932861328, 12.152997016906738, 12.728094100952148, 13.303190231323242, 13.878287315368652, 14.453384399414062, 15.028481483459473, 15.603578567504883, 16.178674697875977, 16.753772735595703, 17.328868865966797, 17.90396499633789, 18.479061126708984, 19.05415916442871]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 4.0, 11.0, 13.0, 15.0, 14.0, 16.0, 24.0, 31.0, 31.0, 25.0, 33.0, 43.0, 40.0, 48.0, 30.0, 63.0, 52.0, 48.0, 50.0, 50.0, 34.0, 40.0, 46.0, 28.0, 18.0, 23.0, 25.0, 25.0, 20.0, 15.0, 14.0, 9.0, 12.0, 9.0, 8.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.358636856079102, -8.073909759521484, -7.789182186126709, -7.504454612731934, -7.219727516174316, -6.934999942779541, -6.650272369384766, -6.365545272827148, -6.080817699432373, -5.796090126037598, -5.5113630294799805, -5.226635456085205, -4.94190788269043, -4.6571807861328125, -4.372453212738037, -4.087725639343262, -3.8029985427856445, -3.5182712078094482, -3.233543872833252, -2.9488162994384766, -2.6640889644622803, -2.379361629486084, -2.0946340560913086, -1.8099067211151123, -1.525179386138916, -1.2404520511627197, -0.9557245969772339, -0.6709972023963928, -0.38626980781555176, -0.10154247283935547, 0.18318498134613037, 0.4679124355316162, 0.7526388168334961, 1.0373661518096924, 1.3220936059951782, 1.606821060180664, 1.8915483951568604, 2.1762757301330566, 2.461003303527832, 2.7457306385040283, 3.0304579734802246, 3.315185308456421, 3.599912643432617, 3.8846402168273926, 4.169367790222168, 4.454094886779785, 4.7388224601745605, 5.023550033569336, 5.308277130126953, 5.5930047035217285, 5.877731800079346, 6.162459373474121, 6.447186470031738, 6.731914043426514, 7.016641616821289, 7.301368713378906, 7.586096286773682, 7.870823860168457, 8.155550956726074, 8.440278053283691, 8.725006103515625, 9.009733200073242, 9.29446029663086, 9.579188346862793, 9.86391544342041]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 9.0, 10.0, 18.0, 46.0, 72.0, 104.0, 147.0, 250.0, 407.0, 675.0, 1110.0, 1880.0, 2968.0, 5178.0, 8590.0, 14277.0, 24333.0, 39856.0, 63910.0, 97137.0, 133156.0, 157221.0, 151091.0, 121782.0, 85174.0, 54654.0, 33784.0, 20256.0, 12248.0, 7147.0, 4426.0, 2543.0, 1499.0, 979.0, 597.0, 375.0, 246.0, 134.0, 110.0, 54.0, 35.0, 31.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.5880126953125, -9.230712890625, -8.8734130859375, -8.51611328125, -8.1588134765625, -7.801513671875, -7.4442138671875, -7.0869140625, -6.7296142578125, -6.372314453125, -6.0150146484375, -5.65771484375, -5.3004150390625, -4.943115234375, -4.5858154296875, -4.228515625, -3.8712158203125, -3.513916015625, -3.1566162109375, -2.79931640625, -2.4420166015625, -2.084716796875, -1.7274169921875, -1.3701171875, -1.0128173828125, -0.655517578125, -0.2982177734375, 0.05908203125, 0.4163818359375, 0.773681640625, 1.1309814453125, 1.48828125, 1.8455810546875, 2.202880859375, 2.5601806640625, 2.91748046875, 3.2747802734375, 3.632080078125, 3.9893798828125, 4.3466796875, 4.7039794921875, 5.061279296875, 5.4185791015625, 5.77587890625, 6.1331787109375, 6.490478515625, 6.8477783203125, 7.205078125, 7.5623779296875, 7.919677734375, 8.2769775390625, 8.63427734375, 8.9915771484375, 9.348876953125, 9.7061767578125, 10.0634765625, 10.4207763671875, 10.778076171875, 11.1353759765625, 11.49267578125, 11.8499755859375, 12.207275390625, 12.5645751953125, 12.921875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 5.0, 7.0, 9.0, 10.0, 20.0, 8.0, 13.0, 11.0, 16.0, 23.0, 29.0, 33.0, 24.0, 29.0, 44.0, 42.0, 25.0, 50.0, 46.0, 38.0, 50.0, 51.0, 50.0, 41.0, 36.0, 29.0, 28.0, 32.0, 38.0, 24.0, 26.0, 18.0, 16.0, 13.0, 10.0, 12.0, 7.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.7265625, -9.42431640625, -9.1220703125, -8.81982421875, -8.517578125, -8.21533203125, -7.9130859375, -7.61083984375, -7.30859375, -7.00634765625, -6.7041015625, -6.40185546875, -6.099609375, -5.79736328125, -5.4951171875, -5.19287109375, -4.890625, -4.58837890625, -4.2861328125, -3.98388671875, -3.681640625, -3.37939453125, -3.0771484375, -2.77490234375, -2.47265625, -2.17041015625, -1.8681640625, -1.56591796875, -1.263671875, -0.96142578125, -0.6591796875, -0.35693359375, -0.0546875, 0.24755859375, 0.5498046875, 0.85205078125, 1.154296875, 1.45654296875, 1.7587890625, 2.06103515625, 2.36328125, 2.66552734375, 2.9677734375, 3.27001953125, 3.572265625, 3.87451171875, 4.1767578125, 4.47900390625, 4.78125, 5.08349609375, 5.3857421875, 5.68798828125, 5.990234375, 6.29248046875, 6.5947265625, 6.89697265625, 7.19921875, 7.50146484375, 7.8037109375, 8.10595703125, 8.408203125, 8.71044921875, 9.0126953125, 9.31494140625, 9.6171875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 15.0, 15.0, 24.0, 45.0, 80.0, 104.0, 160.0, 265.0, 366.0, 588.0, 911.0, 1521.0, 2493.0, 3915.0, 6168.0, 10112.0, 16608.0, 26311.0, 40850.0, 62254.0, 89542.0, 117350.0, 136074.0, 137422.0, 119894.0, 93086.0, 65860.0, 43190.0, 27601.0, 17217.0, 10762.0, 6602.0, 4207.0, 2543.0, 1591.0, 1021.0, 626.0, 400.0, 258.0, 187.0, 105.0, 70.0, 43.0, 36.0, 20.0, 11.0, 10.0, 11.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1422119140625, -9.815673828125, -9.4891357421875, -9.16259765625, -8.8360595703125, -8.509521484375, -8.1829833984375, -7.8564453125, -7.5299072265625, -7.203369140625, -6.8768310546875, -6.55029296875, -6.2237548828125, -5.897216796875, -5.5706787109375, -5.244140625, -4.9176025390625, -4.591064453125, -4.2645263671875, -3.93798828125, -3.6114501953125, -3.284912109375, -2.9583740234375, -2.6318359375, -2.3052978515625, -1.978759765625, -1.6522216796875, -1.32568359375, -0.9991455078125, -0.672607421875, -0.3460693359375, -0.01953125, 0.3070068359375, 0.633544921875, 0.9600830078125, 1.28662109375, 1.6131591796875, 1.939697265625, 2.2662353515625, 2.5927734375, 2.9193115234375, 3.245849609375, 3.5723876953125, 3.89892578125, 4.2254638671875, 4.552001953125, 4.8785400390625, 5.205078125, 5.5316162109375, 5.858154296875, 6.1846923828125, 6.51123046875, 6.8377685546875, 7.164306640625, 7.4908447265625, 7.8173828125, 8.1439208984375, 8.470458984375, 8.7969970703125, 9.12353515625, 9.4500732421875, 9.776611328125, 10.1031494140625, 10.4296875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 7.0, 10.0, 14.0, 10.0, 8.0, 17.0, 28.0, 24.0, 37.0, 40.0, 36.0, 39.0, 36.0, 35.0, 43.0, 44.0, 36.0, 49.0, 50.0, 50.0, 38.0, 43.0, 28.0, 30.0, 30.0, 32.0, 25.0, 14.0, 22.0, 20.0, 14.0, 13.0, 9.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.35546875, -5.1781005859375, -5.000732421875, -4.8233642578125, -4.64599609375, -4.4686279296875, -4.291259765625, -4.1138916015625, -3.9365234375, -3.7591552734375, -3.581787109375, -3.4044189453125, -3.22705078125, -3.0496826171875, -2.872314453125, -2.6949462890625, -2.517578125, -2.3402099609375, -2.162841796875, -1.9854736328125, -1.80810546875, -1.6307373046875, -1.453369140625, -1.2760009765625, -1.0986328125, -0.9212646484375, -0.743896484375, -0.5665283203125, -0.38916015625, -0.2117919921875, -0.034423828125, 0.1429443359375, 0.3203125, 0.4976806640625, 0.675048828125, 0.8524169921875, 1.02978515625, 1.2071533203125, 1.384521484375, 1.5618896484375, 1.7392578125, 1.9166259765625, 2.093994140625, 2.2713623046875, 2.44873046875, 2.6260986328125, 2.803466796875, 2.9808349609375, 3.158203125, 3.3355712890625, 3.512939453125, 3.6903076171875, 3.86767578125, 4.0450439453125, 4.222412109375, 4.3997802734375, 4.5771484375, 4.7545166015625, 4.931884765625, 5.1092529296875, 5.28662109375, 5.4639892578125, 5.641357421875, 5.8187255859375, 5.99609375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 14.0, 10.0, 16.0, 21.0, 26.0, 48.0, 80.0, 103.0, 150.0, 225.0, 360.0, 504.0, 778.0, 1300.0, 2085.0, 3508.0, 6243.0, 10815.0, 20394.0, 37239.0, 66385.0, 112221.0, 165778.0, 192223.0, 165537.0, 112497.0, 66268.0, 37090.0, 20220.0, 11113.0, 6165.0, 3539.0, 2070.0, 1246.0, 775.0, 512.0, 315.0, 208.0, 147.0, 94.0, 63.0, 47.0, 27.0, 22.0, 23.0, 15.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-6.23046875, -6.04986572265625, -5.8692626953125, -5.68865966796875, -5.508056640625, -5.32745361328125, -5.1468505859375, -4.96624755859375, -4.78564453125, -4.60504150390625, -4.4244384765625, -4.24383544921875, -4.063232421875, -3.88262939453125, -3.7020263671875, -3.52142333984375, -3.3408203125, -3.16021728515625, -2.9796142578125, -2.79901123046875, -2.618408203125, -2.43780517578125, -2.2572021484375, -2.07659912109375, -1.89599609375, -1.71539306640625, -1.5347900390625, -1.35418701171875, -1.173583984375, -0.99298095703125, -0.8123779296875, -0.63177490234375, -0.451171875, -0.27056884765625, -0.0899658203125, 0.09063720703125, 0.271240234375, 0.45184326171875, 0.6324462890625, 0.81304931640625, 0.99365234375, 1.17425537109375, 1.3548583984375, 1.53546142578125, 1.716064453125, 1.89666748046875, 2.0772705078125, 2.25787353515625, 2.4384765625, 2.61907958984375, 2.7996826171875, 2.98028564453125, 3.160888671875, 3.34149169921875, 3.5220947265625, 3.70269775390625, 3.88330078125, 4.06390380859375, 4.2445068359375, 4.42510986328125, 4.605712890625, 4.78631591796875, 4.9669189453125, 5.14752197265625, 5.328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 9.0, 8.0, 4.0, 8.0, 10.0, 19.0, 14.0, 25.0, 44.0, 42.0, 49.0, 56.0, 67.0, 65.0, 88.0, 70.0, 62.0, 59.0, 57.0, 48.0, 43.0, 42.0, 20.0, 24.0, 18.0, 18.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006918907165527344, -0.0006720125675201416, -0.0006521344184875488, -0.0006322562694549561, -0.0006123781204223633, -0.0005924999713897705, -0.0005726218223571777, -0.000552743673324585, -0.0005328655242919922, -0.0005129873752593994, -0.0004931092262268066, -0.00047323107719421387, -0.0004533529281616211, -0.0004334747791290283, -0.00041359663009643555, -0.0003937184810638428, -0.00037384033203125, -0.0003539621829986572, -0.00033408403396606445, -0.0003142058849334717, -0.0002943277359008789, -0.00027444958686828613, -0.00025457143783569336, -0.00023469328880310059, -0.0002148151397705078, -0.00019493699073791504, -0.00017505884170532227, -0.0001551806926727295, -0.00013530254364013672, -0.00011542439460754395, -9.554624557495117e-05, -7.56680965423584e-05, -5.5789947509765625e-05, -3.591179847717285e-05, -1.6033649444580078e-05, 3.844499588012695e-06, 2.372264862060547e-05, 4.360079765319824e-05, 6.347894668579102e-05, 8.335709571838379e-05, 0.00010323524475097656, 0.00012311339378356934, 0.0001429915428161621, 0.00016286969184875488, 0.00018274784088134766, 0.00020262598991394043, 0.0002225041389465332, 0.00024238228797912598, 0.00026226043701171875, 0.0002821385860443115, 0.0003020167350769043, 0.00032189488410949707, 0.00034177303314208984, 0.0003616511821746826, 0.0003815293312072754, 0.00040140748023986816, 0.00042128562927246094, 0.0004411637783050537, 0.0004610419273376465, 0.00048092007637023926, 0.000500798225402832, 0.0005206763744354248, 0.0005405545234680176, 0.0005604326725006104, 0.0005803108215332031]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 8.0, 18.0, 20.0, 29.0, 41.0, 83.0, 130.0, 142.0, 245.0, 341.0, 620.0, 939.0, 1552.0, 2508.0, 4238.0, 7322.0, 12581.0, 22236.0, 39696.0, 69184.0, 113847.0, 164196.0, 186134.0, 159360.0, 108949.0, 66204.0, 37799.0, 21000.0, 11887.0, 6825.0, 4002.0, 2391.0, 1454.0, 918.0, 565.0, 374.0, 230.0, 155.0, 106.0, 79.0, 39.0, 24.0, 23.0, 14.0, 15.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.625, -5.45684814453125, -5.2886962890625, -5.12054443359375, -4.952392578125, -4.78424072265625, -4.6160888671875, -4.44793701171875, -4.27978515625, -4.11163330078125, -3.9434814453125, -3.77532958984375, -3.607177734375, -3.43902587890625, -3.2708740234375, -3.10272216796875, -2.9345703125, -2.76641845703125, -2.5982666015625, -2.43011474609375, -2.261962890625, -2.09381103515625, -1.9256591796875, -1.75750732421875, -1.58935546875, -1.42120361328125, -1.2530517578125, -1.08489990234375, -0.916748046875, -0.74859619140625, -0.5804443359375, -0.41229248046875, -0.244140625, -0.07598876953125, 0.0921630859375, 0.26031494140625, 0.428466796875, 0.59661865234375, 0.7647705078125, 0.93292236328125, 1.10107421875, 1.26922607421875, 1.4373779296875, 1.60552978515625, 1.773681640625, 1.94183349609375, 2.1099853515625, 2.27813720703125, 2.4462890625, 2.61444091796875, 2.7825927734375, 2.95074462890625, 3.118896484375, 3.28704833984375, 3.4552001953125, 3.62335205078125, 3.79150390625, 3.95965576171875, 4.1278076171875, 4.29595947265625, 4.464111328125, 4.63226318359375, 4.8004150390625, 4.96856689453125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 13.0, 7.0, 13.0, 13.0, 17.0, 22.0, 27.0, 25.0, 31.0, 37.0, 42.0, 55.0, 64.0, 45.0, 73.0, 64.0, 64.0, 48.0, 55.0, 41.0, 40.0, 30.0, 48.0, 26.0, 15.0, 17.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.374725341796875, -1.32659912109375, -1.278472900390625, -1.2303466796875, -1.182220458984375, -1.13409423828125, -1.085968017578125, -1.037841796875, -0.989715576171875, -0.94158935546875, -0.893463134765625, -0.8453369140625, -0.797210693359375, -0.74908447265625, -0.700958251953125, -0.65283203125, -0.604705810546875, -0.55657958984375, -0.508453369140625, -0.4603271484375, -0.412200927734375, -0.36407470703125, -0.315948486328125, -0.267822265625, -0.219696044921875, -0.17156982421875, -0.123443603515625, -0.0753173828125, -0.027191162109375, 0.02093505859375, 0.069061279296875, 0.1171875, 0.165313720703125, 0.21343994140625, 0.261566162109375, 0.3096923828125, 0.357818603515625, 0.40594482421875, 0.454071044921875, 0.502197265625, 0.550323486328125, 0.59844970703125, 0.646575927734375, 0.6947021484375, 0.742828369140625, 0.79095458984375, 0.839080810546875, 0.88720703125, 0.935333251953125, 0.98345947265625, 1.031585693359375, 1.0797119140625, 1.127838134765625, 1.17596435546875, 1.224090576171875, 1.272216796875, 1.320343017578125, 1.36846923828125, 1.416595458984375, 1.4647216796875, 1.512847900390625, 1.56097412109375, 1.609100341796875, 1.6572265625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 12.0, 12.0, 23.0, 25.0, 28.0, 26.0, 48.0, 44.0, 53.0, 57.0, 75.0, 63.0, 72.0, 77.0, 64.0, 60.0, 40.0, 32.0, 26.0, 27.0, 26.0, 14.0, 12.0, 11.0, 8.0, 14.0, 1.0, 3.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.33849334716797, -17.729873657226562, -17.121252059936523, -16.512632369995117, -15.904010772705078, -15.295391082763672, -14.68677043914795, -14.078149795532227, -13.469529151916504, -12.860908508300781, -12.252287864685059, -11.643667221069336, -11.03504753112793, -10.42642593383789, -9.817806243896484, -9.209185600280762, -8.600564956665039, -7.991944313049316, -7.383323669433594, -6.774703502655029, -6.166082859039307, -5.557462215423584, -4.9488420486450195, -4.340221405029297, -3.731600761413574, -3.1229801177978516, -2.514359712600708, -1.905739188194275, -1.2971186637878418, -0.6884980201721191, -0.07987761497497559, 0.528742790222168, 1.1373653411865234, 1.7459858655929565, 2.3546063899993896, 2.963226795196533, 3.571847438812256, 4.1804680824279785, 4.789088249206543, 5.397708892822266, 6.006329536437988, 6.614950180053711, 7.223570823669434, 7.832190990447998, 8.440811157226562, 9.049432754516602, 9.658052444458008, 10.26667308807373, 10.875293731689453, 11.483914375305176, 12.092535018920898, 12.701155662536621, 13.309776306152344, 13.91839599609375, 14.527016639709473, 15.135637283325195, 15.744257926940918, 16.35287857055664, 16.961498260498047, 17.570119857788086, 18.178739547729492, 18.78736114501953, 19.395980834960938, 20.004600524902344, 20.613222122192383]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 13.0, 12.0, 16.0, 13.0, 18.0, 28.0, 29.0, 23.0, 36.0, 31.0, 41.0, 51.0, 40.0, 52.0, 43.0, 54.0, 36.0, 45.0, 43.0, 50.0, 41.0, 36.0, 23.0, 22.0, 22.0, 20.0, 25.0, 18.0, 21.0, 11.0, 14.0, 7.0, 13.0, 10.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.433783531188965, -8.144537925720215, -7.855292797088623, -7.566047668457031, -7.276802062988281, -6.987556457519531, -6.6983113288879395, -6.409066200256348, -6.119820594787598, -5.830574989318848, -5.541329860687256, -5.252084732055664, -4.962839126586914, -4.673593521118164, -4.384348392486572, -4.0951032638549805, -3.8058576583862305, -3.5166122913360596, -3.2273669242858887, -2.9381215572357178, -2.648876190185547, -2.359630823135376, -2.070385456085205, -1.7811400890350342, -1.4918947219848633, -1.2026493549346924, -0.9134039878845215, -0.6241586208343506, -0.3349132537841797, -0.04566788673400879, 0.2435774803161621, 0.532822847366333, 0.8220691680908203, 1.1113145351409912, 1.400559902191162, 1.689805269241333, 1.979050636291504, 2.268296003341675, 2.5575413703918457, 2.8467867374420166, 3.1360321044921875, 3.4252774715423584, 3.7145228385925293, 4.003767967224121, 4.293013572692871, 4.582259178161621, 4.871504306793213, 5.160749435424805, 5.449995040893555, 5.739240646362305, 6.0284857749938965, 6.317730903625488, 6.606976509094238, 6.896222114562988, 7.18546724319458, 7.474712371826172, 7.763957977294922, 8.053203582763672, 8.342449188232422, 8.631693840026855, 8.920939445495605, 9.210185050964355, 9.499429702758789, 9.788675308227539, 10.077920913696289]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 18.0, 19.0, 27.0, 49.0, 96.0, 138.0, 215.0, 333.0, 599.0, 1103.0, 2050.0, 4011.0, 8126.0, 17486.0, 39255.0, 95415.0, 249939.0, 696532.0, 1447838.0, 1024094.0, 368907.0, 135293.0, 54827.0, 24062.0, 11402.0, 5603.0, 2924.0, 1630.0, 882.0, 535.0, 291.0, 188.0, 117.0, 84.0, 58.0, 43.0, 29.0, 19.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.536376953125, -16.85400390625, -16.171630859375, -15.4892578125, -14.806884765625, -14.12451171875, -13.442138671875, -12.759765625, -12.077392578125, -11.39501953125, -10.712646484375, -10.0302734375, -9.347900390625, -8.66552734375, -7.983154296875, -7.30078125, -6.618408203125, -5.93603515625, -5.253662109375, -4.5712890625, -3.888916015625, -3.20654296875, -2.524169921875, -1.841796875, -1.159423828125, -0.47705078125, 0.205322265625, 0.8876953125, 1.570068359375, 2.25244140625, 2.934814453125, 3.6171875, 4.299560546875, 4.98193359375, 5.664306640625, 6.3466796875, 7.029052734375, 7.71142578125, 8.393798828125, 9.076171875, 9.758544921875, 10.44091796875, 11.123291015625, 11.8056640625, 12.488037109375, 13.17041015625, 13.852783203125, 14.53515625, 15.217529296875, 15.89990234375, 16.582275390625, 17.2646484375, 17.947021484375, 18.62939453125, 19.311767578125, 19.994140625, 20.676513671875, 21.35888671875, 22.041259765625, 22.7236328125, 23.406005859375, 24.08837890625, 24.770751953125, 25.453125]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 12.0, 12.0, 5.0, 10.0, 15.0, 21.0, 23.0, 30.0, 37.0, 36.0, 41.0, 46.0, 54.0, 43.0, 52.0, 37.0, 38.0, 53.0, 45.0, 56.0, 39.0, 38.0, 35.0, 29.0, 29.0, 26.0, 27.0, 18.0, 11.0, 20.0, 9.0, 6.0, 15.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.52386474609375, -6.2781982421875, -6.03253173828125, -5.786865234375, -5.54119873046875, -5.2955322265625, -5.04986572265625, -4.80419921875, -4.55853271484375, -4.3128662109375, -4.06719970703125, -3.821533203125, -3.57586669921875, -3.3302001953125, -3.08453369140625, -2.8388671875, -2.59320068359375, -2.3475341796875, -2.10186767578125, -1.856201171875, -1.61053466796875, -1.3648681640625, -1.11920166015625, -0.87353515625, -0.62786865234375, -0.3822021484375, -0.13653564453125, 0.109130859375, 0.35479736328125, 0.6004638671875, 0.84613037109375, 1.091796875, 1.33746337890625, 1.5831298828125, 1.82879638671875, 2.074462890625, 2.32012939453125, 2.5657958984375, 2.81146240234375, 3.05712890625, 3.30279541015625, 3.5484619140625, 3.79412841796875, 4.039794921875, 4.28546142578125, 4.5311279296875, 4.77679443359375, 5.0224609375, 5.26812744140625, 5.5137939453125, 5.75946044921875, 6.005126953125, 6.25079345703125, 6.4964599609375, 6.74212646484375, 6.98779296875, 7.23345947265625, 7.4791259765625, 7.72479248046875, 7.970458984375, 8.21612548828125, 8.4617919921875, 8.70745849609375, 8.953125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 7.0, 14.0, 24.0, 32.0, 46.0, 56.0, 93.0, 161.0, 252.0, 447.0, 723.0, 1250.0, 2294.0, 4227.0, 8081.0, 15567.0, 32151.0, 66691.0, 144174.0, 317426.0, 678610.0, 1111245.0, 928393.0, 473193.0, 216063.0, 98877.0, 46489.0, 22643.0, 11554.0, 6057.0, 3197.0, 1752.0, 998.0, 576.0, 338.0, 221.0, 132.0, 72.0, 53.0, 35.0, 16.0, 17.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.859375, -20.241455078125, -19.62353515625, -19.005615234375, -18.3876953125, -17.769775390625, -17.15185546875, -16.533935546875, -15.916015625, -15.298095703125, -14.68017578125, -14.062255859375, -13.4443359375, -12.826416015625, -12.20849609375, -11.590576171875, -10.97265625, -10.354736328125, -9.73681640625, -9.118896484375, -8.5009765625, -7.883056640625, -7.26513671875, -6.647216796875, -6.029296875, -5.411376953125, -4.79345703125, -4.175537109375, -3.5576171875, -2.939697265625, -2.32177734375, -1.703857421875, -1.0859375, -0.468017578125, 0.14990234375, 0.767822265625, 1.3857421875, 2.003662109375, 2.62158203125, 3.239501953125, 3.857421875, 4.475341796875, 5.09326171875, 5.711181640625, 6.3291015625, 6.947021484375, 7.56494140625, 8.182861328125, 8.80078125, 9.418701171875, 10.03662109375, 10.654541015625, 11.2724609375, 11.890380859375, 12.50830078125, 13.126220703125, 13.744140625, 14.362060546875, 14.97998046875, 15.597900390625, 16.2158203125, 16.833740234375, 17.45166015625, 18.069580078125, 18.6875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 7.0, 12.0, 15.0, 28.0, 36.0, 60.0, 64.0, 94.0, 132.0, 179.0, 239.0, 300.0, 323.0, 384.0, 397.0, 315.0, 327.0, 276.0, 215.0, 174.0, 144.0, 97.0, 78.0, 48.0, 33.0, 34.0, 20.0, 10.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1171875, -7.91162109375, -7.7060546875, -7.50048828125, -7.294921875, -7.08935546875, -6.8837890625, -6.67822265625, -6.47265625, -6.26708984375, -6.0615234375, -5.85595703125, -5.650390625, -5.44482421875, -5.2392578125, -5.03369140625, -4.828125, -4.62255859375, -4.4169921875, -4.21142578125, -4.005859375, -3.80029296875, -3.5947265625, -3.38916015625, -3.18359375, -2.97802734375, -2.7724609375, -2.56689453125, -2.361328125, -2.15576171875, -1.9501953125, -1.74462890625, -1.5390625, -1.33349609375, -1.1279296875, -0.92236328125, -0.716796875, -0.51123046875, -0.3056640625, -0.10009765625, 0.10546875, 0.31103515625, 0.5166015625, 0.72216796875, 0.927734375, 1.13330078125, 1.3388671875, 1.54443359375, 1.75, 1.95556640625, 2.1611328125, 2.36669921875, 2.572265625, 2.77783203125, 2.9833984375, 3.18896484375, 3.39453125, 3.60009765625, 3.8056640625, 4.01123046875, 4.216796875, 4.42236328125, 4.6279296875, 4.83349609375, 5.0390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 10.0, 14.0, 18.0, 21.0, 26.0, 28.0, 48.0, 52.0, 48.0, 75.0, 81.0, 68.0, 88.0, 65.0, 61.0, 58.0, 49.0, 33.0, 40.0, 20.0, 15.0, 17.0, 7.0, 12.0, 8.0, 7.0, 4.0, 0.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.16599464416504, -20.458349227905273, -19.750701904296875, -19.04305648803711, -18.335411071777344, -17.627765655517578, -16.92011833190918, -16.212472915649414, -15.504826545715332, -14.79718017578125, -14.089534759521484, -13.381888389587402, -12.67424201965332, -11.966596603393555, -11.258950233459473, -10.55130386352539, -9.843658447265625, -9.136012077331543, -8.428366661071777, -7.720720291137695, -7.0130743980407715, -6.305428504943848, -5.597782135009766, -4.890136241912842, -4.182490348815918, -3.474844455718994, -2.767198324203491, -2.0595521926879883, -1.3519062995910645, -0.6442604064941406, 0.0633859634399414, 0.7710318565368652, 1.4786758422851562, 2.18632173538208, 2.893967866897583, 3.601613998413086, 4.30925989151001, 5.016905784606934, 5.724552154541016, 6.4321980476379395, 7.139843940734863, 7.847489833831787, 8.555135726928711, 9.262782096862793, 9.970428466796875, 10.67807388305664, 11.385720252990723, 12.093366622924805, 12.80101203918457, 13.508658409118652, 14.216303825378418, 14.9239501953125, 15.631595611572266, 16.33924102783203, 17.04688835144043, 17.754533767700195, 18.462181091308594, 19.16982650756836, 19.877473831176758, 20.585119247436523, 21.29276466369629, 22.000411987304688, 22.708057403564453, 23.41570281982422, 24.123348236083984]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 7.0, 9.0, 14.0, 22.0, 23.0, 17.0, 28.0, 32.0, 31.0, 37.0, 26.0, 48.0, 37.0, 35.0, 46.0, 32.0, 46.0, 44.0, 46.0, 45.0, 49.0, 35.0, 35.0, 31.0, 35.0, 24.0, 22.0, 28.0, 18.0, 16.0, 9.0, 15.0, 3.0, 9.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.962663173675537, -7.675048351287842, -7.387433052062988, -7.099818229675293, -6.812203407287598, -6.524588584899902, -6.236973285675049, -5.9493584632873535, -5.6617431640625, -5.374128341674805, -5.086513042449951, -4.798898220062256, -4.5112833976745605, -4.223668098449707, -3.9360532760620117, -3.6484384536743164, -3.360823631286621, -3.0732085704803467, -2.7855937480926514, -2.497978687286377, -2.2103638648986816, -1.9227488040924072, -1.6351337432861328, -1.3475189208984375, -1.059903860092163, -0.7722889184951782, -0.4846739172935486, -0.19705891609191895, 0.09055602550506592, 0.3781709671020508, 0.6657860279083252, 0.9534008502960205, 1.2410163879394531, 1.528631329536438, 1.8162462711334229, 2.1038613319396973, 2.3914761543273926, 2.679091215133667, 2.9667062759399414, 3.2543210983276367, 3.541936159133911, 3.8295512199401855, 4.117166042327881, 4.404781341552734, 4.69239616394043, 4.980010986328125, 5.26762580871582, 5.555240631103516, 5.842855930328369, 6.1304707527160645, 6.418086051940918, 6.705700874328613, 6.993315696716309, 7.280930519104004, 7.568545818328857, 7.856160640716553, 8.143775939941406, 8.431390762329102, 8.719005584716797, 9.006620407104492, 9.294236183166504, 9.5818510055542, 9.869465827941895, 10.15708065032959, 10.444695472717285]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 6.0, 10.0, 18.0, 24.0, 38.0, 35.0, 51.0, 76.0, 101.0, 145.0, 205.0, 267.0, 391.0, 601.0, 868.0, 1552.0, 2615.0, 4570.0, 8702.0, 17252.0, 37218.0, 81199.0, 164321.0, 251651.0, 227007.0, 130291.0, 61070.0, 28257.0, 13407.0, 6895.0, 3723.0, 2100.0, 1288.0, 840.0, 546.0, 380.0, 225.0, 181.0, 121.0, 78.0, 66.0, 44.0, 39.0, 18.0, 13.0, 14.0, 7.0, 4.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0], "bins": [-14.578125, -14.1470947265625, -13.716064453125, -13.2850341796875, -12.85400390625, -12.4229736328125, -11.991943359375, -11.5609130859375, -11.1298828125, -10.6988525390625, -10.267822265625, -9.8367919921875, -9.40576171875, -8.9747314453125, -8.543701171875, -8.1126708984375, -7.681640625, -7.2506103515625, -6.819580078125, -6.3885498046875, -5.95751953125, -5.5264892578125, -5.095458984375, -4.6644287109375, -4.2333984375, -3.8023681640625, -3.371337890625, -2.9403076171875, -2.50927734375, -2.0782470703125, -1.647216796875, -1.2161865234375, -0.78515625, -0.3541259765625, 0.076904296875, 0.5079345703125, 0.93896484375, 1.3699951171875, 1.801025390625, 2.2320556640625, 2.6630859375, 3.0941162109375, 3.525146484375, 3.9561767578125, 4.38720703125, 4.8182373046875, 5.249267578125, 5.6802978515625, 6.111328125, 6.5423583984375, 6.973388671875, 7.4044189453125, 7.83544921875, 8.2664794921875, 8.697509765625, 9.1285400390625, 9.5595703125, 9.9906005859375, 10.421630859375, 10.8526611328125, 11.28369140625, 11.7147216796875, 12.145751953125, 12.5767822265625, 13.0078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 7.0, 3.0, 5.0, 8.0, 10.0, 11.0, 20.0, 19.0, 17.0, 16.0, 25.0, 25.0, 24.0, 33.0, 26.0, 35.0, 34.0, 37.0, 36.0, 37.0, 35.0, 37.0, 42.0, 40.0, 47.0, 44.0, 30.0, 34.0, 32.0, 29.0, 24.0, 27.0, 20.0, 12.0, 19.0, 15.0, 11.0, 11.0, 8.0, 7.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.2655029296875, -7.991943359375, -7.7183837890625, -7.44482421875, -7.1712646484375, -6.897705078125, -6.6241455078125, -6.3505859375, -6.0770263671875, -5.803466796875, -5.5299072265625, -5.25634765625, -4.9827880859375, -4.709228515625, -4.4356689453125, -4.162109375, -3.8885498046875, -3.614990234375, -3.3414306640625, -3.06787109375, -2.7943115234375, -2.520751953125, -2.2471923828125, -1.9736328125, -1.7000732421875, -1.426513671875, -1.1529541015625, -0.87939453125, -0.6058349609375, -0.332275390625, -0.0587158203125, 0.21484375, 0.4884033203125, 0.761962890625, 1.0355224609375, 1.30908203125, 1.5826416015625, 1.856201171875, 2.1297607421875, 2.4033203125, 2.6768798828125, 2.950439453125, 3.2239990234375, 3.49755859375, 3.7711181640625, 4.044677734375, 4.3182373046875, 4.591796875, 4.8653564453125, 5.138916015625, 5.4124755859375, 5.68603515625, 5.9595947265625, 6.233154296875, 6.5067138671875, 6.7802734375, 7.0538330078125, 7.327392578125, 7.6009521484375, 7.87451171875, 8.1480712890625, 8.421630859375, 8.6951904296875, 8.96875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 9.0, 18.0, 17.0, 23.0, 39.0, 31.0, 56.0, 79.0, 106.0, 172.0, 209.0, 298.0, 419.0, 690.0, 1065.0, 1839.0, 3412.0, 7570.0, 19542.0, 59221.0, 191086.0, 404617.0, 238431.0, 76038.0, 24595.0, 9176.0, 4168.0, 2101.0, 1271.0, 717.0, 472.0, 312.0, 215.0, 139.0, 110.0, 67.0, 55.0, 48.0, 35.0, 27.0, 12.0, 7.0, 9.0, 9.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.84375, -20.1396484375, -19.435546875, -18.7314453125, -18.02734375, -17.3232421875, -16.619140625, -15.9150390625, -15.2109375, -14.5068359375, -13.802734375, -13.0986328125, -12.39453125, -11.6904296875, -10.986328125, -10.2822265625, -9.578125, -8.8740234375, -8.169921875, -7.4658203125, -6.76171875, -6.0576171875, -5.353515625, -4.6494140625, -3.9453125, -3.2412109375, -2.537109375, -1.8330078125, -1.12890625, -0.4248046875, 0.279296875, 0.9833984375, 1.6875, 2.3916015625, 3.095703125, 3.7998046875, 4.50390625, 5.2080078125, 5.912109375, 6.6162109375, 7.3203125, 8.0244140625, 8.728515625, 9.4326171875, 10.13671875, 10.8408203125, 11.544921875, 12.2490234375, 12.953125, 13.6572265625, 14.361328125, 15.0654296875, 15.76953125, 16.4736328125, 17.177734375, 17.8818359375, 18.5859375, 19.2900390625, 19.994140625, 20.6982421875, 21.40234375, 22.1064453125, 22.810546875, 23.5146484375, 24.21875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 11.0, 15.0, 13.0, 12.0, 25.0, 24.0, 29.0, 37.0, 37.0, 41.0, 42.0, 43.0, 38.0, 36.0, 47.0, 47.0, 39.0, 42.0, 40.0, 49.0, 48.0, 25.0, 31.0, 25.0, 28.0, 23.0, 16.0, 16.0, 16.0, 16.0, 15.0, 12.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5859375, -5.40032958984375, -5.2147216796875, -5.02911376953125, -4.843505859375, -4.65789794921875, -4.4722900390625, -4.28668212890625, -4.10107421875, -3.91546630859375, -3.7298583984375, -3.54425048828125, -3.358642578125, -3.17303466796875, -2.9874267578125, -2.80181884765625, -2.6162109375, -2.43060302734375, -2.2449951171875, -2.05938720703125, -1.873779296875, -1.68817138671875, -1.5025634765625, -1.31695556640625, -1.13134765625, -0.94573974609375, -0.7601318359375, -0.57452392578125, -0.388916015625, -0.20330810546875, -0.0177001953125, 0.16790771484375, 0.353515625, 0.53912353515625, 0.7247314453125, 0.91033935546875, 1.095947265625, 1.28155517578125, 1.4671630859375, 1.65277099609375, 1.83837890625, 2.02398681640625, 2.2095947265625, 2.39520263671875, 2.580810546875, 2.76641845703125, 2.9520263671875, 3.13763427734375, 3.3232421875, 3.50885009765625, 3.6944580078125, 3.88006591796875, 4.065673828125, 4.25128173828125, 4.4368896484375, 4.62249755859375, 4.80810546875, 4.99371337890625, 5.1793212890625, 5.36492919921875, 5.550537109375, 5.73614501953125, 5.9217529296875, 6.10736083984375, 6.29296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 2.0, 7.0, 7.0, 22.0, 18.0, 20.0, 38.0, 45.0, 70.0, 83.0, 120.0, 166.0, 227.0, 266.0, 397.0, 549.0, 797.0, 1115.0, 1570.0, 2308.0, 3639.0, 6298.0, 13909.0, 48610.0, 243899.0, 528143.0, 139653.0, 30719.0, 10421.0, 5185.0, 3069.0, 2059.0, 1429.0, 1043.0, 730.0, 536.0, 362.0, 301.0, 189.0, 140.0, 111.0, 81.0, 68.0, 38.0, 29.0, 23.0, 13.0, 11.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0], "bins": [-17.140625, -16.655517578125, -16.17041015625, -15.685302734375, -15.2001953125, -14.715087890625, -14.22998046875, -13.744873046875, -13.259765625, -12.774658203125, -12.28955078125, -11.804443359375, -11.3193359375, -10.834228515625, -10.34912109375, -9.864013671875, -9.37890625, -8.893798828125, -8.40869140625, -7.923583984375, -7.4384765625, -6.953369140625, -6.46826171875, -5.983154296875, -5.498046875, -5.012939453125, -4.52783203125, -4.042724609375, -3.5576171875, -3.072509765625, -2.58740234375, -2.102294921875, -1.6171875, -1.132080078125, -0.64697265625, -0.161865234375, 0.3232421875, 0.808349609375, 1.29345703125, 1.778564453125, 2.263671875, 2.748779296875, 3.23388671875, 3.718994140625, 4.2041015625, 4.689208984375, 5.17431640625, 5.659423828125, 6.14453125, 6.629638671875, 7.11474609375, 7.599853515625, 8.0849609375, 8.570068359375, 9.05517578125, 9.540283203125, 10.025390625, 10.510498046875, 10.99560546875, 11.480712890625, 11.9658203125, 12.450927734375, 12.93603515625, 13.421142578125, 13.90625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 15.0, 33.0, 49.0, 119.0, 195.0, 243.0, 162.0, 78.0, 41.0, 18.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00164794921875, -0.0016115084290504456, -0.0015750676393508911, -0.0015386268496513367, -0.0015021860599517822, -0.0014657452702522278, -0.0014293044805526733, -0.001392863690853119, -0.0013564229011535645, -0.00131998211145401, -0.0012835413217544556, -0.0012471005320549011, -0.0012106597423553467, -0.0011742189526557922, -0.0011377781629562378, -0.0011013373732566833, -0.001064896583557129, -0.0010284557938575745, -0.00099201500415802, -0.0009555742144584656, -0.0009191334247589111, -0.0008826926350593567, -0.0008462518453598022, -0.0008098110556602478, -0.0007733702659606934, -0.0007369294762611389, -0.0007004886865615845, -0.00066404789686203, -0.0006276071071624756, -0.0005911663174629211, -0.0005547255277633667, -0.0005182847380638123, -0.0004818439483642578, -0.00044540315866470337, -0.0004089623689651489, -0.0003725215792655945, -0.00033608078956604004, -0.0002996399998664856, -0.00026319921016693115, -0.0002267584204673767, -0.00019031763076782227, -0.00015387684106826782, -0.00011743605136871338, -8.099526166915894e-05, -4.455447196960449e-05, -8.113682270050049e-06, 2.8327107429504395e-05, 6.476789712905884e-05, 0.00010120868682861328, 0.00013764947652816772, 0.00017409026622772217, 0.0002105310559272766, 0.00024697184562683105, 0.0002834126353263855, 0.00031985342502593994, 0.0003562942147254944, 0.00039273500442504883, 0.00042917579412460327, 0.0004656165838241577, 0.0005020573735237122, 0.0005384981632232666, 0.000574938952922821, 0.0006113797426223755, 0.0006478205323219299, 0.0006842613220214844]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 11.0, 9.0, 22.0, 19.0, 41.0, 46.0, 66.0, 96.0, 126.0, 164.0, 177.0, 284.0, 353.0, 448.0, 617.0, 867.0, 1123.0, 1411.0, 1849.0, 2648.0, 3688.0, 6422.0, 19218.0, 112551.0, 505271.0, 313304.0, 49546.0, 11120.0, 4871.0, 3067.0, 2219.0, 1654.0, 1254.0, 974.0, 734.0, 550.0, 427.0, 344.0, 272.0, 174.0, 143.0, 81.0, 79.0, 58.0, 34.0, 30.0, 24.0, 16.0, 14.0, 10.0, 6.0, 10.0, 3.0, 2.0, 0.0, 1.0, 5.0], "bins": [-16.171875, -15.6630859375, -15.154296875, -14.6455078125, -14.13671875, -13.6279296875, -13.119140625, -12.6103515625, -12.1015625, -11.5927734375, -11.083984375, -10.5751953125, -10.06640625, -9.5576171875, -9.048828125, -8.5400390625, -8.03125, -7.5224609375, -7.013671875, -6.5048828125, -5.99609375, -5.4873046875, -4.978515625, -4.4697265625, -3.9609375, -3.4521484375, -2.943359375, -2.4345703125, -1.92578125, -1.4169921875, -0.908203125, -0.3994140625, 0.109375, 0.6181640625, 1.126953125, 1.6357421875, 2.14453125, 2.6533203125, 3.162109375, 3.6708984375, 4.1796875, 4.6884765625, 5.197265625, 5.7060546875, 6.21484375, 6.7236328125, 7.232421875, 7.7412109375, 8.25, 8.7587890625, 9.267578125, 9.7763671875, 10.28515625, 10.7939453125, 11.302734375, 11.8115234375, 12.3203125, 12.8291015625, 13.337890625, 13.8466796875, 14.35546875, 14.8642578125, 15.373046875, 15.8818359375, 16.390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 10.0, 23.0, 55.0, 97.0, 144.0, 189.0, 195.0, 120.0, 71.0, 31.0, 19.0, 9.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.57171630859375, -3.4324951171875, -3.29327392578125, -3.154052734375, -3.01483154296875, -2.8756103515625, -2.73638916015625, -2.59716796875, -2.45794677734375, -2.3187255859375, -2.17950439453125, -2.040283203125, -1.90106201171875, -1.7618408203125, -1.62261962890625, -1.4833984375, -1.34417724609375, -1.2049560546875, -1.06573486328125, -0.926513671875, -0.78729248046875, -0.6480712890625, -0.50885009765625, -0.36962890625, -0.23040771484375, -0.0911865234375, 0.04803466796875, 0.187255859375, 0.32647705078125, 0.4656982421875, 0.60491943359375, 0.744140625, 0.88336181640625, 1.0225830078125, 1.16180419921875, 1.301025390625, 1.44024658203125, 1.5794677734375, 1.71868896484375, 1.85791015625, 1.99713134765625, 2.1363525390625, 2.27557373046875, 2.414794921875, 2.55401611328125, 2.6932373046875, 2.83245849609375, 2.9716796875, 3.11090087890625, 3.2501220703125, 3.38934326171875, 3.528564453125, 3.66778564453125, 3.8070068359375, 3.94622802734375, 4.08544921875, 4.22467041015625, 4.3638916015625, 4.50311279296875, 4.642333984375, 4.78155517578125, 4.9207763671875, 5.05999755859375, 5.19921875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 3.0, 15.0, 19.0, 18.0, 23.0, 22.0, 38.0, 30.0, 47.0, 70.0, 69.0, 72.0, 73.0, 86.0, 66.0, 59.0, 63.0, 52.0, 32.0, 26.0, 21.0, 18.0, 15.0, 14.0, 4.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.578258514404297, -19.88836097717285, -19.198463439941406, -18.50856590270996, -17.818668365478516, -17.12877082824707, -16.438873291015625, -15.74897575378418, -15.059078216552734, -14.369180679321289, -13.679283142089844, -12.989385604858398, -12.299488067626953, -11.609590530395508, -10.919692993164062, -10.229795455932617, -9.539897918701172, -8.850000381469727, -8.160102844238281, -7.470205307006836, -6.780307769775391, -6.090410232543945, -5.4005126953125, -4.710615158081055, -4.020717620849609, -3.330820083618164, -2.6409225463867188, -1.9510250091552734, -1.2611274719238281, -0.5712299346923828, 0.1186676025390625, 0.8085651397705078, 1.4984607696533203, 2.1883583068847656, 2.878255844116211, 3.5681533813476562, 4.258050918579102, 4.947948455810547, 5.637845993041992, 6.3277435302734375, 7.017641067504883, 7.707538604736328, 8.397436141967773, 9.087333679199219, 9.777231216430664, 10.46712875366211, 11.157026290893555, 11.846923828125, 12.536821365356445, 13.22671890258789, 13.916616439819336, 14.606513977050781, 15.296411514282227, 15.986309051513672, 16.676206588745117, 17.366104125976562, 18.056001663208008, 18.745899200439453, 19.4357967376709, 20.125694274902344, 20.81559181213379, 21.505489349365234, 22.19538688659668, 22.885284423828125, 23.57518196105957]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 5.0, 10.0, 17.0, 11.0, 22.0, 31.0, 19.0, 37.0, 31.0, 33.0, 26.0, 43.0, 43.0, 41.0, 47.0, 41.0, 40.0, 52.0, 44.0, 35.0, 52.0, 40.0, 33.0, 31.0, 31.0, 28.0, 25.0, 21.0, 15.0, 18.0, 12.0, 5.0, 12.0, 8.0, 5.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.086185455322266, -7.793124675750732, -7.500064373016357, -7.207003593444824, -6.913943290710449, -6.620882511138916, -6.327821731567383, -6.034761428833008, -5.741701126098633, -5.4486403465271, -5.155580043792725, -4.862519264221191, -4.569458961486816, -4.276398181915283, -3.983337640762329, -3.690277099609375, -3.397216320037842, -3.1041557788848877, -2.8110952377319336, -2.5180344581604004, -2.2249741554260254, -1.9319134950637817, -1.638852834701538, -1.345792293548584, -1.0527317523956299, -0.7596712112426758, -0.4666106104850769, -0.17355000972747803, 0.11951053142547607, 0.4125710725784302, 0.7056317329406738, 0.9986922740936279, 1.291752815246582, 1.5848133563995361, 1.8778738975524902, 2.1709346771240234, 2.4639949798583984, 2.7570557594299316, 3.0501163005828857, 3.34317684173584, 3.636237382888794, 3.929297924041748, 4.222358703613281, 4.515419006347656, 4.8084797859191895, 5.1015400886535645, 5.394600868225098, 5.687661170959473, 5.980721950531006, 6.273782730102539, 6.566843032836914, 6.859903812408447, 7.152964115142822, 7.4460248947143555, 7.7390851974487305, 8.032146453857422, 8.325206756591797, 8.618267059326172, 8.911328315734863, 9.204388618469238, 9.497448921203613, 9.790509223937988, 10.08357048034668, 10.376630783081055, 10.66969108581543]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 18.0, 8.0, 28.0, 34.0, 58.0, 79.0, 133.0, 186.0, 339.0, 510.0, 825.0, 1373.0, 2397.0, 4175.0, 7255.0, 13002.0, 23031.0, 40163.0, 68985.0, 108627.0, 149823.0, 172127.0, 157698.0, 117596.0, 75396.0, 44996.0, 25755.0, 14300.0, 8271.0, 4616.0, 2678.0, 1574.0, 942.0, 565.0, 328.0, 245.0, 142.0, 106.0, 62.0, 28.0, 24.0, 12.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6171875, -13.199462890625, -12.78173828125, -12.364013671875, -11.9462890625, -11.528564453125, -11.11083984375, -10.693115234375, -10.275390625, -9.857666015625, -9.43994140625, -9.022216796875, -8.6044921875, -8.186767578125, -7.76904296875, -7.351318359375, -6.93359375, -6.515869140625, -6.09814453125, -5.680419921875, -5.2626953125, -4.844970703125, -4.42724609375, -4.009521484375, -3.591796875, -3.174072265625, -2.75634765625, -2.338623046875, -1.9208984375, -1.503173828125, -1.08544921875, -0.667724609375, -0.25, 0.167724609375, 0.58544921875, 1.003173828125, 1.4208984375, 1.838623046875, 2.25634765625, 2.674072265625, 3.091796875, 3.509521484375, 3.92724609375, 4.344970703125, 4.7626953125, 5.180419921875, 5.59814453125, 6.015869140625, 6.43359375, 6.851318359375, 7.26904296875, 7.686767578125, 8.1044921875, 8.522216796875, 8.93994140625, 9.357666015625, 9.775390625, 10.193115234375, 10.61083984375, 11.028564453125, 11.4462890625, 11.864013671875, 12.28173828125, 12.699462890625, 13.1171875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 17.0, 11.0, 19.0, 15.0, 19.0, 20.0, 35.0, 25.0, 27.0, 38.0, 37.0, 43.0, 52.0, 52.0, 55.0, 45.0, 46.0, 43.0, 50.0, 50.0, 37.0, 34.0, 36.0, 28.0, 17.0, 27.0, 9.0, 23.0, 12.0, 24.0, 11.0, 6.0, 8.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.5906982421875, -9.243896484375, -8.8970947265625, -8.55029296875, -8.2034912109375, -7.856689453125, -7.5098876953125, -7.1630859375, -6.8162841796875, -6.469482421875, -6.1226806640625, -5.77587890625, -5.4290771484375, -5.082275390625, -4.7354736328125, -4.388671875, -4.0418701171875, -3.695068359375, -3.3482666015625, -3.00146484375, -2.6546630859375, -2.307861328125, -1.9610595703125, -1.6142578125, -1.2674560546875, -0.920654296875, -0.5738525390625, -0.22705078125, 0.1197509765625, 0.466552734375, 0.8133544921875, 1.16015625, 1.5069580078125, 1.853759765625, 2.2005615234375, 2.54736328125, 2.8941650390625, 3.240966796875, 3.5877685546875, 3.9345703125, 4.2813720703125, 4.628173828125, 4.9749755859375, 5.32177734375, 5.6685791015625, 6.015380859375, 6.3621826171875, 6.708984375, 7.0557861328125, 7.402587890625, 7.7493896484375, 8.09619140625, 8.4429931640625, 8.789794921875, 9.1365966796875, 9.4833984375, 9.8302001953125, 10.177001953125, 10.5238037109375, 10.87060546875, 11.2174072265625, 11.564208984375, 11.9110107421875, 12.2578125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 10.0, 7.0, 23.0, 28.0, 38.0, 53.0, 97.0, 121.0, 192.0, 340.0, 584.0, 956.0, 1619.0, 2750.0, 4834.0, 8322.0, 14699.0, 25574.0, 43380.0, 71347.0, 108012.0, 144377.0, 162831.0, 150217.0, 115359.0, 77824.0, 48045.0, 28700.0, 16232.0, 9292.0, 5325.0, 3064.0, 1690.0, 1004.0, 605.0, 380.0, 221.0, 129.0, 98.0, 56.0, 33.0, 28.0, 19.0, 13.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-14.53125, -14.1112060546875, -13.691162109375, -13.2711181640625, -12.85107421875, -12.4310302734375, -12.010986328125, -11.5909423828125, -11.1708984375, -10.7508544921875, -10.330810546875, -9.9107666015625, -9.49072265625, -9.0706787109375, -8.650634765625, -8.2305908203125, -7.810546875, -7.3905029296875, -6.970458984375, -6.5504150390625, -6.13037109375, -5.7103271484375, -5.290283203125, -4.8702392578125, -4.4501953125, -4.0301513671875, -3.610107421875, -3.1900634765625, -2.77001953125, -2.3499755859375, -1.929931640625, -1.5098876953125, -1.08984375, -0.6697998046875, -0.249755859375, 0.1702880859375, 0.59033203125, 1.0103759765625, 1.430419921875, 1.8504638671875, 2.2705078125, 2.6905517578125, 3.110595703125, 3.5306396484375, 3.95068359375, 4.3707275390625, 4.790771484375, 5.2108154296875, 5.630859375, 6.0509033203125, 6.470947265625, 6.8909912109375, 7.31103515625, 7.7310791015625, 8.151123046875, 8.5711669921875, 8.9912109375, 9.4112548828125, 9.831298828125, 10.2513427734375, 10.67138671875, 11.0914306640625, 11.511474609375, 11.9315185546875, 12.3515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 15.0, 9.0, 9.0, 11.0, 14.0, 12.0, 15.0, 24.0, 25.0, 36.0, 20.0, 19.0, 32.0, 29.0, 29.0, 39.0, 37.0, 39.0, 35.0, 35.0, 46.0, 37.0, 50.0, 40.0, 27.0, 35.0, 34.0, 29.0, 33.0, 25.0, 20.0, 14.0, 16.0, 22.0, 16.0, 11.0, 11.0, 11.0, 4.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2890625, -5.10894775390625, -4.9288330078125, -4.74871826171875, -4.568603515625, -4.38848876953125, -4.2083740234375, -4.02825927734375, -3.84814453125, -3.66802978515625, -3.4879150390625, -3.30780029296875, -3.127685546875, -2.94757080078125, -2.7674560546875, -2.58734130859375, -2.4072265625, -2.22711181640625, -2.0469970703125, -1.86688232421875, -1.686767578125, -1.50665283203125, -1.3265380859375, -1.14642333984375, -0.96630859375, -0.78619384765625, -0.6060791015625, -0.42596435546875, -0.245849609375, -0.06573486328125, 0.1143798828125, 0.29449462890625, 0.474609375, 0.65472412109375, 0.8348388671875, 1.01495361328125, 1.195068359375, 1.37518310546875, 1.5552978515625, 1.73541259765625, 1.91552734375, 2.09564208984375, 2.2757568359375, 2.45587158203125, 2.635986328125, 2.81610107421875, 2.9962158203125, 3.17633056640625, 3.3564453125, 3.53656005859375, 3.7166748046875, 3.89678955078125, 4.076904296875, 4.25701904296875, 4.4371337890625, 4.61724853515625, 4.79736328125, 4.97747802734375, 5.1575927734375, 5.33770751953125, 5.517822265625, 5.69793701171875, 5.8780517578125, 6.05816650390625, 6.23828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 8.0, 8.0, 14.0, 19.0, 17.0, 48.0, 48.0, 72.0, 146.0, 194.0, 276.0, 416.0, 607.0, 1026.0, 1534.0, 2422.0, 4004.0, 6872.0, 12709.0, 23837.0, 49500.0, 101850.0, 188921.0, 245067.0, 194109.0, 106702.0, 51856.0, 25261.0, 12975.0, 7019.0, 4059.0, 2438.0, 1545.0, 935.0, 680.0, 455.0, 269.0, 195.0, 148.0, 87.0, 65.0, 54.0, 28.0, 24.0, 10.0, 13.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.3741455078125, -8.099853515625, -7.8255615234375, -7.55126953125, -7.2769775390625, -7.002685546875, -6.7283935546875, -6.4541015625, -6.1798095703125, -5.905517578125, -5.6312255859375, -5.35693359375, -5.0826416015625, -4.808349609375, -4.5340576171875, -4.259765625, -3.9854736328125, -3.711181640625, -3.4368896484375, -3.16259765625, -2.8883056640625, -2.614013671875, -2.3397216796875, -2.0654296875, -1.7911376953125, -1.516845703125, -1.2425537109375, -0.96826171875, -0.6939697265625, -0.419677734375, -0.1453857421875, 0.12890625, 0.4031982421875, 0.677490234375, 0.9517822265625, 1.22607421875, 1.5003662109375, 1.774658203125, 2.0489501953125, 2.3232421875, 2.5975341796875, 2.871826171875, 3.1461181640625, 3.42041015625, 3.6947021484375, 3.968994140625, 4.2432861328125, 4.517578125, 4.7918701171875, 5.066162109375, 5.3404541015625, 5.61474609375, 5.8890380859375, 6.163330078125, 6.4376220703125, 6.7119140625, 6.9862060546875, 7.260498046875, 7.5347900390625, 7.80908203125, 8.0833740234375, 8.357666015625, 8.6319580078125, 8.90625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 9.0, 6.0, 12.0, 16.0, 12.0, 34.0, 31.0, 38.0, 64.0, 77.0, 80.0, 73.0, 84.0, 99.0, 77.0, 65.0, 52.0, 47.0, 35.0, 19.0, 17.0, 16.0, 5.0, 5.0, 10.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008287429809570312, -0.0007984191179275513, -0.0007680952548980713, -0.0007377713918685913, -0.0007074475288391113, -0.0006771236658096313, -0.0006467998027801514, -0.0006164759397506714, -0.0005861520767211914, -0.0005558282136917114, -0.0005255043506622314, -0.0004951804876327515, -0.0004648566246032715, -0.0004345327615737915, -0.0004042088985443115, -0.00037388503551483154, -0.00034356117248535156, -0.0003132373094558716, -0.0002829134464263916, -0.0002525895833969116, -0.00022226572036743164, -0.00019194185733795166, -0.00016161799430847168, -0.0001312941312789917, -0.00010097026824951172, -7.064640522003174e-05, -4.032254219055176e-05, -9.998679161071777e-06, 2.0325183868408203e-05, 5.0649046897888184e-05, 8.097290992736816e-05, 0.00011129677295684814, 0.00014162063598632812, 0.0001719444990158081, 0.00020226836204528809, 0.00023259222507476807, 0.00026291608810424805, 0.00029323995113372803, 0.000323563814163208, 0.000353887677192688, 0.00038421154022216797, 0.00041453540325164795, 0.00044485926628112793, 0.0004751831293106079, 0.0005055069923400879, 0.0005358308553695679, 0.0005661547183990479, 0.0005964785814285278, 0.0006268024444580078, 0.0006571263074874878, 0.0006874501705169678, 0.0007177740335464478, 0.0007480978965759277, 0.0007784217596054077, 0.0008087456226348877, 0.0008390694856643677, 0.0008693933486938477, 0.0008997172117233276, 0.0009300410747528076, 0.0009603649377822876, 0.0009906888008117676, 0.0010210126638412476, 0.0010513365268707275, 0.0010816603899002075, 0.0011119842529296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 13.0, 10.0, 22.0, 34.0, 43.0, 64.0, 98.0, 144.0, 217.0, 327.0, 496.0, 691.0, 1053.0, 1561.0, 2398.0, 3625.0, 5863.0, 9362.0, 15890.0, 26395.0, 45224.0, 76144.0, 120523.0, 164908.0, 178663.0, 146301.0, 98728.0, 59872.0, 35353.0, 20957.0, 12422.0, 7598.0, 4688.0, 3029.0, 1918.0, 1243.0, 866.0, 582.0, 403.0, 270.0, 182.0, 92.0, 98.0, 51.0, 48.0, 27.0, 16.0, 22.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.9049072265625, -5.716064453125, -5.5272216796875, -5.33837890625, -5.1495361328125, -4.960693359375, -4.7718505859375, -4.5830078125, -4.3941650390625, -4.205322265625, -4.0164794921875, -3.82763671875, -3.6387939453125, -3.449951171875, -3.2611083984375, -3.072265625, -2.8834228515625, -2.694580078125, -2.5057373046875, -2.31689453125, -2.1280517578125, -1.939208984375, -1.7503662109375, -1.5615234375, -1.3726806640625, -1.183837890625, -0.9949951171875, -0.80615234375, -0.6173095703125, -0.428466796875, -0.2396240234375, -0.05078125, 0.1380615234375, 0.326904296875, 0.5157470703125, 0.70458984375, 0.8934326171875, 1.082275390625, 1.2711181640625, 1.4599609375, 1.6488037109375, 1.837646484375, 2.0264892578125, 2.21533203125, 2.4041748046875, 2.593017578125, 2.7818603515625, 2.970703125, 3.1595458984375, 3.348388671875, 3.5372314453125, 3.72607421875, 3.9149169921875, 4.103759765625, 4.2926025390625, 4.4814453125, 4.6702880859375, 4.859130859375, 5.0479736328125, 5.23681640625, 5.4256591796875, 5.614501953125, 5.8033447265625, 5.9921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 6.0, 6.0, 4.0, 11.0, 9.0, 15.0, 17.0, 22.0, 19.0, 23.0, 30.0, 42.0, 49.0, 44.0, 43.0, 69.0, 65.0, 67.0, 70.0, 54.0, 48.0, 57.0, 30.0, 22.0, 33.0, 31.0, 31.0, 19.0, 14.0, 13.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.103515625, -2.042724609375, -1.98193359375, -1.921142578125, -1.8603515625, -1.799560546875, -1.73876953125, -1.677978515625, -1.6171875, -1.556396484375, -1.49560546875, -1.434814453125, -1.3740234375, -1.313232421875, -1.25244140625, -1.191650390625, -1.130859375, -1.070068359375, -1.00927734375, -0.948486328125, -0.8876953125, -0.826904296875, -0.76611328125, -0.705322265625, -0.64453125, -0.583740234375, -0.52294921875, -0.462158203125, -0.4013671875, -0.340576171875, -0.27978515625, -0.218994140625, -0.158203125, -0.097412109375, -0.03662109375, 0.024169921875, 0.0849609375, 0.145751953125, 0.20654296875, 0.267333984375, 0.328125, 0.388916015625, 0.44970703125, 0.510498046875, 0.5712890625, 0.632080078125, 0.69287109375, 0.753662109375, 0.814453125, 0.875244140625, 0.93603515625, 0.996826171875, 1.0576171875, 1.118408203125, 1.17919921875, 1.239990234375, 1.30078125, 1.361572265625, 1.42236328125, 1.483154296875, 1.5439453125, 1.604736328125, 1.66552734375, 1.726318359375, 1.787109375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 12.0, 10.0, 14.0, 18.0, 17.0, 20.0, 23.0, 30.0, 42.0, 48.0, 65.0, 65.0, 73.0, 62.0, 80.0, 78.0, 65.0, 54.0, 39.0, 38.0, 22.0, 25.0, 21.0, 14.0, 13.0, 14.0, 6.0, 11.0, 1.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.22071647644043, -18.55204963684082, -17.883380889892578, -17.21471405029297, -16.54604721069336, -15.877379417419434, -15.208711624145508, -14.540044784545898, -13.871376991271973, -13.202709197998047, -12.534042358398438, -11.865374565124512, -11.196706771850586, -10.528039932250977, -9.85937213897705, -9.190704345703125, -8.522037506103516, -7.853370189666748, -7.1847028732299805, -6.516035079956055, -5.847367763519287, -5.1787004470825195, -4.510032653808594, -3.841365337371826, -3.1726980209350586, -2.504030704498291, -1.8353631496429443, -1.1666955947875977, -0.4980282783508301, 0.1706390380859375, 0.8393068313598633, 1.5079741477966309, 2.1766414642333984, 2.845308780670166, 3.5139763355255127, 4.182643890380859, 4.851311206817627, 5.5199785232543945, 6.18864631652832, 6.857313632965088, 7.5259809494018555, 8.194648742675781, 8.86331558227539, 9.531983375549316, 10.200651168823242, 10.869318008422852, 11.537985801696777, 12.206653594970703, 12.875320434570312, 13.543988227844238, 14.212655067443848, 14.881322860717773, 15.549989700317383, 16.218658447265625, 16.887325286865234, 17.555992126464844, 18.224658966064453, 18.893325805664062, 19.561994552612305, 20.230661392211914, 20.899328231811523, 21.567996978759766, 22.236663818359375, 22.905330657958984, 23.573999404907227]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 11.0, 10.0, 10.0, 11.0, 5.0, 22.0, 15.0, 14.0, 20.0, 15.0, 28.0, 28.0, 31.0, 23.0, 43.0, 36.0, 20.0, 40.0, 38.0, 32.0, 37.0, 51.0, 37.0, 36.0, 27.0, 31.0, 36.0, 38.0, 31.0, 34.0, 20.0, 19.0, 23.0, 24.0, 9.0, 18.0, 17.0, 2.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.744450569152832, -7.483931541442871, -7.22341251373291, -6.962893962860107, -6.7023749351501465, -6.4418559074401855, -6.181337356567383, -5.920818328857422, -5.660299301147461, -5.3997802734375, -5.139261245727539, -4.878742694854736, -4.618223667144775, -4.3577046394348145, -4.097186088562012, -3.836667060852051, -3.57614803314209, -3.315629005432129, -3.055110216140747, -2.7945914268493652, -2.5340723991394043, -2.2735533714294434, -2.0130345821380615, -1.7525156736373901, -1.4919967651367188, -1.2314778566360474, -0.970958948135376, -0.7104400396347046, -0.4499211311340332, -0.18940222263336182, 0.07111668586730957, 0.33163559436798096, 0.5921535491943359, 0.8526724576950073, 1.1131913661956787, 1.37371027469635, 1.6342291831970215, 1.8947480916976929, 2.1552670001983643, 2.415785789489746, 2.676304817199707, 2.936823844909668, 3.19734263420105, 3.4578614234924316, 3.7183804512023926, 3.9788994789123535, 4.239418029785156, 4.499937057495117, 4.760456085205078, 5.020975112915039, 5.281494140625, 5.542012691497803, 5.802531719207764, 6.063050746917725, 6.323569297790527, 6.584088325500488, 6.844607353210449, 7.10512638092041, 7.365645408630371, 7.626163959503174, 7.886682987213135, 8.147201538085938, 8.407720565795898, 8.66823959350586, 8.92875862121582]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 8.0, 27.0, 34.0, 60.0, 96.0, 154.0, 237.0, 307.0, 541.0, 903.0, 1395.0, 2593.0, 4367.0, 7605.0, 14153.0, 27345.0, 54478.0, 114518.0, 254984.0, 585474.0, 1133987.0, 1063404.0, 510661.0, 217767.0, 97877.0, 47018.0, 23839.0, 12736.0, 7205.0, 4109.0, 2406.0, 1399.0, 887.0, 548.0, 373.0, 245.0, 171.0, 97.0, 85.0, 42.0, 40.0, 20.0, 21.0, 15.0, 13.0, 6.0, 13.0, 8.0, 3.0, 4.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.7421875, -13.1676025390625, -12.593017578125, -12.0184326171875, -11.44384765625, -10.8692626953125, -10.294677734375, -9.7200927734375, -9.1455078125, -8.5709228515625, -7.996337890625, -7.4217529296875, -6.84716796875, -6.2725830078125, -5.697998046875, -5.1234130859375, -4.548828125, -3.9742431640625, -3.399658203125, -2.8250732421875, -2.25048828125, -1.6759033203125, -1.101318359375, -0.5267333984375, 0.0478515625, 0.6224365234375, 1.197021484375, 1.7716064453125, 2.34619140625, 2.9207763671875, 3.495361328125, 4.0699462890625, 4.64453125, 5.2191162109375, 5.793701171875, 6.3682861328125, 6.94287109375, 7.5174560546875, 8.092041015625, 8.6666259765625, 9.2412109375, 9.8157958984375, 10.390380859375, 10.9649658203125, 11.53955078125, 12.1141357421875, 12.688720703125, 13.2633056640625, 13.837890625, 14.4124755859375, 14.987060546875, 15.5616455078125, 16.13623046875, 16.7108154296875, 17.285400390625, 17.8599853515625, 18.4345703125, 19.0091552734375, 19.583740234375, 20.1583251953125, 20.73291015625, 21.3074951171875, 21.882080078125, 22.4566650390625, 23.03125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 10.0, 12.0, 16.0, 14.0, 15.0, 24.0, 21.0, 18.0, 18.0, 37.0, 42.0, 33.0, 38.0, 50.0, 49.0, 39.0, 47.0, 48.0, 43.0, 45.0, 56.0, 47.0, 37.0, 36.0, 34.0, 19.0, 23.0, 17.0, 22.0, 20.0, 8.0, 14.0, 9.0, 9.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.2803955078125, -7.021728515625, -6.7630615234375, -6.50439453125, -6.2457275390625, -5.987060546875, -5.7283935546875, -5.4697265625, -5.2110595703125, -4.952392578125, -4.6937255859375, -4.43505859375, -4.1763916015625, -3.917724609375, -3.6590576171875, -3.400390625, -3.1417236328125, -2.883056640625, -2.6243896484375, -2.36572265625, -2.1070556640625, -1.848388671875, -1.5897216796875, -1.3310546875, -1.0723876953125, -0.813720703125, -0.5550537109375, -0.29638671875, -0.0377197265625, 0.220947265625, 0.4796142578125, 0.73828125, 0.9969482421875, 1.255615234375, 1.5142822265625, 1.77294921875, 2.0316162109375, 2.290283203125, 2.5489501953125, 2.8076171875, 3.0662841796875, 3.324951171875, 3.5836181640625, 3.84228515625, 4.1009521484375, 4.359619140625, 4.6182861328125, 4.876953125, 5.1356201171875, 5.394287109375, 5.6529541015625, 5.91162109375, 6.1702880859375, 6.428955078125, 6.6876220703125, 6.9462890625, 7.2049560546875, 7.463623046875, 7.7222900390625, 7.98095703125, 8.2396240234375, 8.498291015625, 8.7569580078125, 9.015625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 1.0, 9.0, 21.0, 27.0, 32.0, 46.0, 65.0, 103.0, 171.0, 225.0, 370.0, 614.0, 973.0, 1569.0, 2681.0, 4457.0, 7570.0, 13582.0, 24706.0, 46361.0, 88545.0, 173028.0, 334746.0, 623080.0, 942603.0, 856483.0, 510840.0, 267856.0, 137360.0, 70748.0, 37817.0, 20372.0, 11242.0, 6387.0, 3732.0, 2171.0, 1378.0, 837.0, 530.0, 334.0, 213.0, 134.0, 74.0, 58.0, 46.0, 23.0, 17.0, 15.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0], "bins": [-18.328125, -17.786376953125, -17.24462890625, -16.702880859375, -16.1611328125, -15.619384765625, -15.07763671875, -14.535888671875, -13.994140625, -13.452392578125, -12.91064453125, -12.368896484375, -11.8271484375, -11.285400390625, -10.74365234375, -10.201904296875, -9.66015625, -9.118408203125, -8.57666015625, -8.034912109375, -7.4931640625, -6.951416015625, -6.40966796875, -5.867919921875, -5.326171875, -4.784423828125, -4.24267578125, -3.700927734375, -3.1591796875, -2.617431640625, -2.07568359375, -1.533935546875, -0.9921875, -0.450439453125, 0.09130859375, 0.633056640625, 1.1748046875, 1.716552734375, 2.25830078125, 2.800048828125, 3.341796875, 3.883544921875, 4.42529296875, 4.967041015625, 5.5087890625, 6.050537109375, 6.59228515625, 7.134033203125, 7.67578125, 8.217529296875, 8.75927734375, 9.301025390625, 9.8427734375, 10.384521484375, 10.92626953125, 11.468017578125, 12.009765625, 12.551513671875, 13.09326171875, 13.635009765625, 14.1767578125, 14.718505859375, 15.26025390625, 15.802001953125, 16.34375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 15.0, 20.0, 18.0, 24.0, 37.0, 39.0, 39.0, 73.0, 78.0, 106.0, 97.0, 111.0, 152.0, 201.0, 188.0, 234.0, 253.0, 268.0, 247.0, 258.0, 220.0, 240.0, 205.0, 183.0, 144.0, 115.0, 108.0, 84.0, 73.0, 48.0, 42.0, 18.0, 26.0, 26.0, 14.0, 12.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.49609375, -4.3480224609375, -4.199951171875, -4.0518798828125, -3.90380859375, -3.7557373046875, -3.607666015625, -3.4595947265625, -3.3115234375, -3.1634521484375, -3.015380859375, -2.8673095703125, -2.71923828125, -2.5711669921875, -2.423095703125, -2.2750244140625, -2.126953125, -1.9788818359375, -1.830810546875, -1.6827392578125, -1.53466796875, -1.3865966796875, -1.238525390625, -1.0904541015625, -0.9423828125, -0.7943115234375, -0.646240234375, -0.4981689453125, -0.35009765625, -0.2020263671875, -0.053955078125, 0.0941162109375, 0.2421875, 0.3902587890625, 0.538330078125, 0.6864013671875, 0.83447265625, 0.9825439453125, 1.130615234375, 1.2786865234375, 1.4267578125, 1.5748291015625, 1.722900390625, 1.8709716796875, 2.01904296875, 2.1671142578125, 2.315185546875, 2.4632568359375, 2.611328125, 2.7593994140625, 2.907470703125, 3.0555419921875, 3.20361328125, 3.3516845703125, 3.499755859375, 3.6478271484375, 3.7958984375, 3.9439697265625, 4.092041015625, 4.2401123046875, 4.38818359375, 4.5362548828125, 4.684326171875, 4.8323974609375, 4.98046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 8.0, 4.0, 13.0, 11.0, 12.0, 15.0, 16.0, 27.0, 32.0, 37.0, 39.0, 51.0, 72.0, 71.0, 61.0, 86.0, 68.0, 62.0, 58.0, 49.0, 37.0, 28.0, 26.0, 23.0, 20.0, 12.0, 9.0, 12.0, 8.0, 6.0, 3.0, 1.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71157455444336, -19.039499282836914, -18.36742401123047, -17.695348739624023, -17.023273468017578, -16.351198196411133, -15.679121971130371, -15.007046699523926, -14.33497142791748, -13.662896156311035, -12.99082088470459, -12.318744659423828, -11.646669387817383, -10.974594116210938, -10.302518844604492, -9.630443572998047, -8.958368301391602, -8.286293029785156, -7.614217758178711, -6.942142009735107, -6.270066738128662, -5.597991466522217, -4.925915718078613, -4.253840446472168, -3.5817651748657227, -2.9096899032592773, -2.237614393234253, -1.5655388832092285, -0.8934636116027832, -0.2213883399963379, 0.4506874084472656, 1.122762680053711, 1.794839859008789, 2.4669151306152344, 3.138990640640259, 3.811066150665283, 4.4831414222717285, 5.155216693878174, 5.827292442321777, 6.499367713928223, 7.171442985534668, 7.843518257141113, 8.515593528747559, 9.18766975402832, 9.859745025634766, 10.531820297241211, 11.203895568847656, 11.875970840454102, 12.548046112060547, 13.220121383666992, 13.892196655273438, 14.564271926879883, 15.236347198486328, 15.908422470092773, 16.58049774169922, 17.252574920654297, 17.92464828491211, 18.596723556518555, 19.268798828125, 19.940874099731445, 20.61294937133789, 21.285024642944336, 21.95709991455078, 22.62917709350586, 23.301252365112305]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 14.0, 19.0, 18.0, 16.0, 19.0, 28.0, 29.0, 21.0, 40.0, 41.0, 31.0, 43.0, 42.0, 44.0, 41.0, 58.0, 54.0, 42.0, 35.0, 33.0, 37.0, 39.0, 27.0, 29.0, 30.0, 24.0, 19.0, 22.0, 16.0, 13.0, 9.0, 11.0, 5.0, 6.0, 7.0, 0.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.642413139343262, -9.33700942993164, -9.03160572052002, -8.726202011108398, -8.420797348022461, -8.11539363861084, -7.809989929199219, -7.504586219787598, -7.199182510375977, -6.8937788009643555, -6.588375091552734, -6.282970905303955, -5.977567195892334, -5.672163486480713, -5.366759300231934, -5.0613555908203125, -4.755951881408691, -4.45054817199707, -4.145144462585449, -3.83974027633667, -3.534336566925049, -3.2289328575134277, -2.9235289096832275, -2.6181249618530273, -2.3127212524414062, -2.007317543029785, -1.701913595199585, -1.3965097665786743, -1.0911059379577637, -0.785702109336853, -0.4802982807159424, -0.1748943328857422, 0.1305093765258789, 0.43591320514678955, 0.7413170337677002, 1.0467208623886108, 1.3521246910095215, 1.6575285196304321, 1.9629323482513428, 2.268336296081543, 2.573740005493164, 2.879143714904785, 3.1845476627349854, 3.4899516105651855, 3.7953553199768066, 4.100759029388428, 4.406163215637207, 4.711566925048828, 5.016970634460449, 5.32237434387207, 5.627778053283691, 5.933182239532471, 6.238585948944092, 6.543989658355713, 6.849393844604492, 7.154797554016113, 7.460201263427734, 7.7656049728393555, 8.071008682250977, 8.376412391662598, 8.681816101074219, 8.987220764160156, 9.292624473571777, 9.598028182983398, 9.90343189239502]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 9.0, 11.0, 7.0, 9.0, 23.0, 37.0, 42.0, 60.0, 81.0, 144.0, 210.0, 299.0, 461.0, 822.0, 1302.0, 2210.0, 4300.0, 8350.0, 17642.0, 38591.0, 84483.0, 168683.0, 250725.0, 224094.0, 129689.0, 61331.0, 27650.0, 12988.0, 6362.0, 3262.0, 1849.0, 1035.0, 590.0, 389.0, 265.0, 170.0, 127.0, 85.0, 44.0, 41.0, 25.0, 22.0, 10.0, 11.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.546875, -12.139404296875, -11.73193359375, -11.324462890625, -10.9169921875, -10.509521484375, -10.10205078125, -9.694580078125, -9.287109375, -8.879638671875, -8.47216796875, -8.064697265625, -7.6572265625, -7.249755859375, -6.84228515625, -6.434814453125, -6.02734375, -5.619873046875, -5.21240234375, -4.804931640625, -4.3974609375, -3.989990234375, -3.58251953125, -3.175048828125, -2.767578125, -2.360107421875, -1.95263671875, -1.545166015625, -1.1376953125, -0.730224609375, -0.32275390625, 0.084716796875, 0.4921875, 0.899658203125, 1.30712890625, 1.714599609375, 2.1220703125, 2.529541015625, 2.93701171875, 3.344482421875, 3.751953125, 4.159423828125, 4.56689453125, 4.974365234375, 5.3818359375, 5.789306640625, 6.19677734375, 6.604248046875, 7.01171875, 7.419189453125, 7.82666015625, 8.234130859375, 8.6416015625, 9.049072265625, 9.45654296875, 9.864013671875, 10.271484375, 10.678955078125, 11.08642578125, 11.493896484375, 11.9013671875, 12.308837890625, 12.71630859375, 13.123779296875, 13.53125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 9.0, 5.0, 4.0, 12.0, 10.0, 15.0, 17.0, 16.0, 18.0, 27.0, 30.0, 23.0, 32.0, 37.0, 47.0, 49.0, 40.0, 40.0, 52.0, 49.0, 46.0, 51.0, 43.0, 41.0, 46.0, 31.0, 21.0, 26.0, 26.0, 25.0, 18.0, 14.0, 18.0, 19.0, 12.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.94677734375, -9.5966796875, -9.24658203125, -8.896484375, -8.54638671875, -8.1962890625, -7.84619140625, -7.49609375, -7.14599609375, -6.7958984375, -6.44580078125, -6.095703125, -5.74560546875, -5.3955078125, -5.04541015625, -4.6953125, -4.34521484375, -3.9951171875, -3.64501953125, -3.294921875, -2.94482421875, -2.5947265625, -2.24462890625, -1.89453125, -1.54443359375, -1.1943359375, -0.84423828125, -0.494140625, -0.14404296875, 0.2060546875, 0.55615234375, 0.90625, 1.25634765625, 1.6064453125, 1.95654296875, 2.306640625, 2.65673828125, 3.0068359375, 3.35693359375, 3.70703125, 4.05712890625, 4.4072265625, 4.75732421875, 5.107421875, 5.45751953125, 5.8076171875, 6.15771484375, 6.5078125, 6.85791015625, 7.2080078125, 7.55810546875, 7.908203125, 8.25830078125, 8.6083984375, 8.95849609375, 9.30859375, 9.65869140625, 10.0087890625, 10.35888671875, 10.708984375, 11.05908203125, 11.4091796875, 11.75927734375, 12.109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 11.0, 12.0, 23.0, 33.0, 41.0, 49.0, 100.0, 150.0, 231.0, 334.0, 468.0, 781.0, 1279.0, 2125.0, 3800.0, 6989.0, 13311.0, 26638.0, 55028.0, 113970.0, 213836.0, 262710.0, 173486.0, 87292.0, 41804.0, 20388.0, 10171.0, 5562.0, 3166.0, 1749.0, 1071.0, 661.0, 420.0, 263.0, 194.0, 122.0, 85.0, 60.0, 37.0, 34.0, 20.0, 11.0, 15.0, 9.0, 4.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1015625, -13.67822265625, -13.2548828125, -12.83154296875, -12.408203125, -11.98486328125, -11.5615234375, -11.13818359375, -10.71484375, -10.29150390625, -9.8681640625, -9.44482421875, -9.021484375, -8.59814453125, -8.1748046875, -7.75146484375, -7.328125, -6.90478515625, -6.4814453125, -6.05810546875, -5.634765625, -5.21142578125, -4.7880859375, -4.36474609375, -3.94140625, -3.51806640625, -3.0947265625, -2.67138671875, -2.248046875, -1.82470703125, -1.4013671875, -0.97802734375, -0.5546875, -0.13134765625, 0.2919921875, 0.71533203125, 1.138671875, 1.56201171875, 1.9853515625, 2.40869140625, 2.83203125, 3.25537109375, 3.6787109375, 4.10205078125, 4.525390625, 4.94873046875, 5.3720703125, 5.79541015625, 6.21875, 6.64208984375, 7.0654296875, 7.48876953125, 7.912109375, 8.33544921875, 8.7587890625, 9.18212890625, 9.60546875, 10.02880859375, 10.4521484375, 10.87548828125, 11.298828125, 11.72216796875, 12.1455078125, 12.56884765625, 12.9921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 9.0, 14.0, 15.0, 10.0, 27.0, 24.0, 19.0, 28.0, 47.0, 50.0, 50.0, 40.0, 51.0, 53.0, 55.0, 54.0, 47.0, 39.0, 53.0, 38.0, 40.0, 47.0, 25.0, 28.0, 33.0, 19.0, 13.0, 7.0, 7.0, 12.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01171875, -5.78448486328125, -5.5572509765625, -5.33001708984375, -5.102783203125, -4.87554931640625, -4.6483154296875, -4.42108154296875, -4.19384765625, -3.96661376953125, -3.7393798828125, -3.51214599609375, -3.284912109375, -3.05767822265625, -2.8304443359375, -2.60321044921875, -2.3759765625, -2.14874267578125, -1.9215087890625, -1.69427490234375, -1.467041015625, -1.23980712890625, -1.0125732421875, -0.78533935546875, -0.55810546875, -0.33087158203125, -0.1036376953125, 0.12359619140625, 0.350830078125, 0.57806396484375, 0.8052978515625, 1.03253173828125, 1.259765625, 1.48699951171875, 1.7142333984375, 1.94146728515625, 2.168701171875, 2.39593505859375, 2.6231689453125, 2.85040283203125, 3.07763671875, 3.30487060546875, 3.5321044921875, 3.75933837890625, 3.986572265625, 4.21380615234375, 4.4410400390625, 4.66827392578125, 4.8955078125, 5.12274169921875, 5.3499755859375, 5.57720947265625, 5.804443359375, 6.03167724609375, 6.2589111328125, 6.48614501953125, 6.71337890625, 6.94061279296875, 7.1678466796875, 7.39508056640625, 7.622314453125, 7.84954833984375, 8.0767822265625, 8.30401611328125, 8.53125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 13.0, 26.0, 14.0, 26.0, 32.0, 51.0, 71.0, 99.0, 145.0, 245.0, 352.0, 564.0, 920.0, 1430.0, 2515.0, 4468.0, 8459.0, 17344.0, 37362.0, 85058.0, 189990.0, 305712.0, 212550.0, 97515.0, 42626.0, 19561.0, 9549.0, 4982.0, 2627.0, 1593.0, 917.0, 591.0, 359.0, 269.0, 167.0, 88.0, 71.0, 58.0, 31.0, 27.0, 16.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.68359375, -7.44775390625, -7.2119140625, -6.97607421875, -6.740234375, -6.50439453125, -6.2685546875, -6.03271484375, -5.796875, -5.56103515625, -5.3251953125, -5.08935546875, -4.853515625, -4.61767578125, -4.3818359375, -4.14599609375, -3.91015625, -3.67431640625, -3.4384765625, -3.20263671875, -2.966796875, -2.73095703125, -2.4951171875, -2.25927734375, -2.0234375, -1.78759765625, -1.5517578125, -1.31591796875, -1.080078125, -0.84423828125, -0.6083984375, -0.37255859375, -0.13671875, 0.09912109375, 0.3349609375, 0.57080078125, 0.806640625, 1.04248046875, 1.2783203125, 1.51416015625, 1.75, 1.98583984375, 2.2216796875, 2.45751953125, 2.693359375, 2.92919921875, 3.1650390625, 3.40087890625, 3.63671875, 3.87255859375, 4.1083984375, 4.34423828125, 4.580078125, 4.81591796875, 5.0517578125, 5.28759765625, 5.5234375, 5.75927734375, 5.9951171875, 6.23095703125, 6.466796875, 6.70263671875, 6.9384765625, 7.17431640625, 7.41015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 9.0, 9.0, 11.0, 11.0, 17.0, 18.0, 26.0, 35.0, 55.0, 51.0, 67.0, 80.0, 60.0, 73.0, 84.0, 72.0, 67.0, 48.0, 54.0, 40.0, 23.0, 18.0, 15.0, 11.0, 7.0, 4.0, 5.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000423431396484375, -0.0004111379384994507, -0.00039884448051452637, -0.00038655102252960205, -0.00037425756454467773, -0.0003619641065597534, -0.0003496706485748291, -0.0003373771905899048, -0.00032508373260498047, -0.00031279027462005615, -0.00030049681663513184, -0.0002882033586502075, -0.0002759099006652832, -0.0002636164426803589, -0.00025132298469543457, -0.00023902952671051025, -0.00022673606872558594, -0.00021444261074066162, -0.0002021491527557373, -0.000189855694770813, -0.00017756223678588867, -0.00016526877880096436, -0.00015297532081604004, -0.00014068186283111572, -0.0001283884048461914, -0.00011609494686126709, -0.00010380148887634277, -9.150803089141846e-05, -7.921457290649414e-05, -6.692111492156982e-05, -5.462765693664551e-05, -4.233419895172119e-05, -3.0040740966796875e-05, -1.774728298187256e-05, -5.453824996948242e-06, 6.839632987976074e-06, 1.913309097290039e-05, 3.142654895782471e-05, 4.3720006942749023e-05, 5.601346492767334e-05, 6.830692291259766e-05, 8.060038089752197e-05, 9.289383888244629e-05, 0.0001051872968673706, 0.00011748075485229492, 0.00012977421283721924, 0.00014206767082214355, 0.00015436112880706787, 0.0001666545867919922, 0.0001789480447769165, 0.00019124150276184082, 0.00020353496074676514, 0.00021582841873168945, 0.00022812187671661377, 0.00024041533470153809, 0.0002527087926864624, 0.0002650022506713867, 0.00027729570865631104, 0.00028958916664123535, 0.00030188262462615967, 0.000314176082611084, 0.0003264695405960083, 0.0003387629985809326, 0.00035105645656585693, 0.00036334991455078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 8.0, 5.0, 9.0, 16.0, 22.0, 31.0, 39.0, 67.0, 62.0, 128.0, 189.0, 277.0, 483.0, 730.0, 1246.0, 2268.0, 4791.0, 10893.0, 29134.0, 83362.0, 212005.0, 327488.0, 227316.0, 92763.0, 32154.0, 11986.0, 5106.0, 2472.0, 1313.0, 780.0, 496.0, 339.0, 164.0, 130.0, 88.0, 63.0, 26.0, 24.0, 23.0, 14.0, 19.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.47265625, -8.1953125, -7.91796875, -7.640625, -7.36328125, -7.0859375, -6.80859375, -6.53125, -6.25390625, -5.9765625, -5.69921875, -5.421875, -5.14453125, -4.8671875, -4.58984375, -4.3125, -4.03515625, -3.7578125, -3.48046875, -3.203125, -2.92578125, -2.6484375, -2.37109375, -2.09375, -1.81640625, -1.5390625, -1.26171875, -0.984375, -0.70703125, -0.4296875, -0.15234375, 0.125, 0.40234375, 0.6796875, 0.95703125, 1.234375, 1.51171875, 1.7890625, 2.06640625, 2.34375, 2.62109375, 2.8984375, 3.17578125, 3.453125, 3.73046875, 4.0078125, 4.28515625, 4.5625, 4.83984375, 5.1171875, 5.39453125, 5.671875, 5.94921875, 6.2265625, 6.50390625, 6.78125, 7.05859375, 7.3359375, 7.61328125, 7.890625, 8.16796875, 8.4453125, 8.72265625, 9.0]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 4.0, 4.0, 9.0, 17.0, 15.0, 45.0, 35.0, 26.0, 54.0, 63.0, 70.0, 79.0, 92.0, 90.0, 67.0, 70.0, 58.0, 46.0, 31.0, 21.0, 31.0, 14.0, 11.0, 6.0, 6.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6171875, -1.56268310546875, -1.5081787109375, -1.45367431640625, -1.399169921875, -1.34466552734375, -1.2901611328125, -1.23565673828125, -1.18115234375, -1.12664794921875, -1.0721435546875, -1.01763916015625, -0.963134765625, -0.90863037109375, -0.8541259765625, -0.79962158203125, -0.7451171875, -0.69061279296875, -0.6361083984375, -0.58160400390625, -0.527099609375, -0.47259521484375, -0.4180908203125, -0.36358642578125, -0.30908203125, -0.25457763671875, -0.2000732421875, -0.14556884765625, -0.091064453125, -0.03656005859375, 0.0179443359375, 0.07244873046875, 0.126953125, 0.18145751953125, 0.2359619140625, 0.29046630859375, 0.344970703125, 0.39947509765625, 0.4539794921875, 0.50848388671875, 0.56298828125, 0.61749267578125, 0.6719970703125, 0.72650146484375, 0.781005859375, 0.83551025390625, 0.8900146484375, 0.94451904296875, 0.9990234375, 1.05352783203125, 1.1080322265625, 1.16253662109375, 1.217041015625, 1.27154541015625, 1.3260498046875, 1.38055419921875, 1.43505859375, 1.48956298828125, 1.5440673828125, 1.59857177734375, 1.653076171875, 1.70758056640625, 1.7620849609375, 1.81658935546875, 1.87109375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 9.0, 5.0, 11.0, 19.0, 16.0, 31.0, 23.0, 25.0, 43.0, 51.0, 54.0, 74.0, 73.0, 89.0, 65.0, 69.0, 52.0, 58.0, 47.0, 25.0, 32.0, 20.0, 29.0, 7.0, 15.0, 14.0, 5.0, 3.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.77476692199707, -19.087709426879883, -18.400651931762695, -17.71359634399414, -17.026538848876953, -16.339481353759766, -15.652423858642578, -14.96536636352539, -14.27830982208252, -13.591252326965332, -12.904195785522461, -12.217138290405273, -11.530080795288086, -10.843024253845215, -10.155966758728027, -9.468910217285156, -8.781852722167969, -8.094795227050781, -7.40773868560791, -6.720681190490723, -6.033624172210693, -5.346567153930664, -4.659509658813477, -3.9724526405334473, -3.285395622253418, -2.5983386039733887, -1.9112813472747803, -1.2242240905761719, -0.5371670722961426, 0.14988994598388672, 0.8369474411010742, 1.5240044593811035, 2.2110595703125, 2.8981165885925293, 3.5851738452911377, 4.272231101989746, 4.959288120269775, 5.646345138549805, 6.333402633666992, 7.0204596519470215, 7.707516670227051, 8.394574165344238, 9.08163070678711, 9.768688201904297, 10.455745697021484, 11.142802238464355, 11.829859733581543, 12.516916275024414, 13.203973770141602, 13.891031265258789, 14.57808780670166, 15.265145301818848, 15.952201843261719, 16.639259338378906, 17.326316833496094, 18.01337432861328, 18.70043182373047, 19.387489318847656, 20.074546813964844, 20.76160430908203, 21.448659896850586, 22.135717391967773, 22.82277488708496, 23.50983238220215, 24.196887969970703]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 2.0, 6.0, 3.0, 12.0, 12.0, 19.0, 15.0, 18.0, 17.0, 22.0, 27.0, 30.0, 35.0, 38.0, 37.0, 34.0, 45.0, 44.0, 47.0, 54.0, 53.0, 47.0, 41.0, 28.0, 34.0, 33.0, 35.0, 29.0, 30.0, 30.0, 15.0, 25.0, 13.0, 17.0, 11.0, 6.0, 11.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.260191917419434, -8.958500862121582, -8.65680980682373, -8.355118751525879, -8.053426742553711, -7.751736164093018, -7.450044631958008, -7.148353576660156, -6.846662521362305, -6.544971466064453, -6.243280410766602, -5.941588878631592, -5.63989782333374, -5.338206768035889, -5.036515235900879, -4.734824180603027, -4.433133125305176, -4.131442070007324, -3.8297507762908936, -3.528059482574463, -3.2263684272766113, -2.9246773719787598, -2.622986078262329, -2.3212947845458984, -2.019603729248047, -1.7179125547409058, -1.4162213802337646, -1.1145302057266235, -0.8128390312194824, -0.5111478567123413, -0.2094566822052002, 0.09223461151123047, 0.39392662048339844, 0.6956177949905396, 0.9973089694976807, 1.2990001440048218, 1.600691318511963, 1.902382493019104, 2.204073667526245, 2.505764961242676, 2.8074560165405273, 3.109147071838379, 3.4108383655548096, 3.7125296592712402, 4.014220714569092, 4.315911769866943, 4.617603302001953, 4.919294357299805, 5.220985412597656, 5.522676467895508, 5.824367523193359, 6.126059055328369, 6.427750110626221, 6.729441165924072, 7.031132698059082, 7.332823753356934, 7.634514808654785, 7.936205863952637, 8.237896919250488, 8.53958797454834, 8.841279983520508, 9.14297103881836, 9.444662094116211, 9.746353149414062, 10.048044204711914]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 12.0, 29.0, 37.0, 66.0, 124.0, 198.0, 328.0, 601.0, 1189.0, 2226.0, 4381.0, 8619.0, 17752.0, 35645.0, 71264.0, 129424.0, 195040.0, 213724.0, 165721.0, 99137.0, 51979.0, 25428.0, 12583.0, 6075.0, 3207.0, 1677.0, 880.0, 487.0, 274.0, 173.0, 98.0, 48.0, 35.0, 23.0, 14.0, 8.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.765625, -16.150634765625, -15.53564453125, -14.920654296875, -14.3056640625, -13.690673828125, -13.07568359375, -12.460693359375, -11.845703125, -11.230712890625, -10.61572265625, -10.000732421875, -9.3857421875, -8.770751953125, -8.15576171875, -7.540771484375, -6.92578125, -6.310791015625, -5.69580078125, -5.080810546875, -4.4658203125, -3.850830078125, -3.23583984375, -2.620849609375, -2.005859375, -1.390869140625, -0.77587890625, -0.160888671875, 0.4541015625, 1.069091796875, 1.68408203125, 2.299072265625, 2.9140625, 3.529052734375, 4.14404296875, 4.759033203125, 5.3740234375, 5.989013671875, 6.60400390625, 7.218994140625, 7.833984375, 8.448974609375, 9.06396484375, 9.678955078125, 10.2939453125, 10.908935546875, 11.52392578125, 12.138916015625, 12.75390625, 13.368896484375, 13.98388671875, 14.598876953125, 15.2138671875, 15.828857421875, 16.44384765625, 17.058837890625, 17.673828125, 18.288818359375, 18.90380859375, 19.518798828125, 20.1337890625, 20.748779296875, 21.36376953125, 21.978759765625, 22.59375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 3.0, 9.0, 9.0, 13.0, 14.0, 15.0, 18.0, 22.0, 22.0, 21.0, 25.0, 32.0, 33.0, 35.0, 37.0, 41.0, 38.0, 34.0, 41.0, 44.0, 39.0, 48.0, 38.0, 41.0, 21.0, 38.0, 40.0, 26.0, 26.0, 25.0, 22.0, 22.0, 12.0, 9.0, 18.0, 10.0, 10.0, 7.0, 9.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-10.34375, -10.0341796875, -9.724609375, -9.4150390625, -9.10546875, -8.7958984375, -8.486328125, -8.1767578125, -7.8671875, -7.5576171875, -7.248046875, -6.9384765625, -6.62890625, -6.3193359375, -6.009765625, -5.7001953125, -5.390625, -5.0810546875, -4.771484375, -4.4619140625, -4.15234375, -3.8427734375, -3.533203125, -3.2236328125, -2.9140625, -2.6044921875, -2.294921875, -1.9853515625, -1.67578125, -1.3662109375, -1.056640625, -0.7470703125, -0.4375, -0.1279296875, 0.181640625, 0.4912109375, 0.80078125, 1.1103515625, 1.419921875, 1.7294921875, 2.0390625, 2.3486328125, 2.658203125, 2.9677734375, 3.27734375, 3.5869140625, 3.896484375, 4.2060546875, 4.515625, 4.8251953125, 5.134765625, 5.4443359375, 5.75390625, 6.0634765625, 6.373046875, 6.6826171875, 6.9921875, 7.3017578125, 7.611328125, 7.9208984375, 8.23046875, 8.5400390625, 8.849609375, 9.1591796875, 9.46875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 14.0, 18.0, 36.0, 44.0, 70.0, 125.0, 169.0, 247.0, 361.0, 601.0, 889.0, 1309.0, 2035.0, 3097.0, 4656.0, 7360.0, 11432.0, 17372.0, 26151.0, 38887.0, 56408.0, 77272.0, 99693.0, 118358.0, 125136.0, 117054.0, 98301.0, 75418.0, 54502.0, 37540.0, 25676.0, 16774.0, 11025.0, 7130.0, 4587.0, 3062.0, 1974.0, 1294.0, 833.0, 567.0, 361.0, 248.0, 163.0, 95.0, 68.0, 50.0, 27.0, 24.0, 15.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.359375, -11.9786376953125, -11.597900390625, -11.2171630859375, -10.83642578125, -10.4556884765625, -10.074951171875, -9.6942138671875, -9.3134765625, -8.9327392578125, -8.552001953125, -8.1712646484375, -7.79052734375, -7.4097900390625, -7.029052734375, -6.6483154296875, -6.267578125, -5.8868408203125, -5.506103515625, -5.1253662109375, -4.74462890625, -4.3638916015625, -3.983154296875, -3.6024169921875, -3.2216796875, -2.8409423828125, -2.460205078125, -2.0794677734375, -1.69873046875, -1.3179931640625, -0.937255859375, -0.5565185546875, -0.17578125, 0.2049560546875, 0.585693359375, 0.9664306640625, 1.34716796875, 1.7279052734375, 2.108642578125, 2.4893798828125, 2.8701171875, 3.2508544921875, 3.631591796875, 4.0123291015625, 4.39306640625, 4.7738037109375, 5.154541015625, 5.5352783203125, 5.916015625, 6.2967529296875, 6.677490234375, 7.0582275390625, 7.43896484375, 7.8197021484375, 8.200439453125, 8.5811767578125, 8.9619140625, 9.3426513671875, 9.723388671875, 10.1041259765625, 10.48486328125, 10.8656005859375, 11.246337890625, 11.6270751953125, 12.0078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 11.0, 10.0, 11.0, 12.0, 19.0, 13.0, 11.0, 13.0, 25.0, 23.0, 28.0, 25.0, 37.0, 27.0, 41.0, 45.0, 43.0, 43.0, 43.0, 43.0, 31.0, 45.0, 51.0, 31.0, 42.0, 30.0, 32.0, 37.0, 34.0, 17.0, 20.0, 18.0, 16.0, 12.0, 14.0, 10.0, 9.0, 2.0, 7.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4453125, -6.244140625, -6.04296875, -5.841796875, -5.640625, -5.439453125, -5.23828125, -5.037109375, -4.8359375, -4.634765625, -4.43359375, -4.232421875, -4.03125, -3.830078125, -3.62890625, -3.427734375, -3.2265625, -3.025390625, -2.82421875, -2.623046875, -2.421875, -2.220703125, -2.01953125, -1.818359375, -1.6171875, -1.416015625, -1.21484375, -1.013671875, -0.8125, -0.611328125, -0.41015625, -0.208984375, -0.0078125, 0.193359375, 0.39453125, 0.595703125, 0.796875, 0.998046875, 1.19921875, 1.400390625, 1.6015625, 1.802734375, 2.00390625, 2.205078125, 2.40625, 2.607421875, 2.80859375, 3.009765625, 3.2109375, 3.412109375, 3.61328125, 3.814453125, 4.015625, 4.216796875, 4.41796875, 4.619140625, 4.8203125, 5.021484375, 5.22265625, 5.423828125, 5.625, 5.826171875, 6.02734375, 6.228515625, 6.4296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 18.0, 22.0, 31.0, 30.0, 49.0, 65.0, 87.0, 147.0, 222.0, 366.0, 548.0, 885.0, 1530.0, 2667.0, 4613.0, 8132.0, 15203.0, 29253.0, 57656.0, 110582.0, 186015.0, 227365.0, 180950.0, 106214.0, 54970.0, 27779.0, 14420.0, 7801.0, 4525.0, 2487.0, 1518.0, 871.0, 536.0, 335.0, 206.0, 157.0, 101.0, 56.0, 47.0, 36.0, 30.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3729248046875, -11.011474609375, -10.6500244140625, -10.28857421875, -9.9271240234375, -9.565673828125, -9.2042236328125, -8.8427734375, -8.4813232421875, -8.119873046875, -7.7584228515625, -7.39697265625, -7.0355224609375, -6.674072265625, -6.3126220703125, -5.951171875, -5.5897216796875, -5.228271484375, -4.8668212890625, -4.50537109375, -4.1439208984375, -3.782470703125, -3.4210205078125, -3.0595703125, -2.6981201171875, -2.336669921875, -1.9752197265625, -1.61376953125, -1.2523193359375, -0.890869140625, -0.5294189453125, -0.16796875, 0.1934814453125, 0.554931640625, 0.9163818359375, 1.27783203125, 1.6392822265625, 2.000732421875, 2.3621826171875, 2.7236328125, 3.0850830078125, 3.446533203125, 3.8079833984375, 4.16943359375, 4.5308837890625, 4.892333984375, 5.2537841796875, 5.615234375, 5.9766845703125, 6.338134765625, 6.6995849609375, 7.06103515625, 7.4224853515625, 7.783935546875, 8.1453857421875, 8.5068359375, 8.8682861328125, 9.229736328125, 9.5911865234375, 9.95263671875, 10.3140869140625, 10.675537109375, 11.0369873046875, 11.3984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 15.0, 9.0, 6.0, 12.0, 11.0, 29.0, 30.0, 35.0, 60.0, 42.0, 57.0, 69.0, 75.0, 65.0, 75.0, 74.0, 45.0, 56.0, 40.0, 37.0, 33.0, 21.0, 20.0, 11.0, 10.0, 16.0, 8.0, 7.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011281967163085938, -0.0010912269353866577, -0.0010542571544647217, -0.0010172873735427856, -0.0009803175926208496, -0.0009433478116989136, -0.0009063780307769775, -0.0008694082498550415, -0.0008324384689331055, -0.0007954686880111694, -0.0007584989070892334, -0.0007215291261672974, -0.0006845593452453613, -0.0006475895643234253, -0.0006106197834014893, -0.0005736500024795532, -0.0005366802215576172, -0.0004997104406356812, -0.0004627406597137451, -0.0004257708787918091, -0.00038880109786987305, -0.000351831316947937, -0.000314861536026001, -0.00027789175510406494, -0.0002409219741821289, -0.00020395219326019287, -0.00016698241233825684, -0.0001300126314163208, -9.304285049438477e-05, -5.607306957244873e-05, -1.9103288650512695e-05, 1.786649227142334e-05, 5.4836273193359375e-05, 9.180605411529541e-05, 0.00012877583503723145, 0.00016574561595916748, 0.00020271539688110352, 0.00023968517780303955, 0.0002766549587249756, 0.0003136247396469116, 0.00035059452056884766, 0.0003875643014907837, 0.0004245340824127197, 0.00046150386333465576, 0.0004984736442565918, 0.0005354434251785278, 0.0005724132061004639, 0.0006093829870223999, 0.0006463527679443359, 0.000683322548866272, 0.000720292329788208, 0.000757262110710144, 0.0007942318916320801, 0.0008312016725540161, 0.0008681714534759521, 0.0009051412343978882, 0.0009421110153198242, 0.0009790807962417603, 0.0010160505771636963, 0.0010530203580856323, 0.0010899901390075684, 0.0011269599199295044, 0.0011639297008514404, 0.0012008994817733765, 0.0012378692626953125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 20.0, 23.0, 32.0, 50.0, 56.0, 83.0, 116.0, 199.0, 311.0, 458.0, 716.0, 1145.0, 1884.0, 3169.0, 5289.0, 9035.0, 15929.0, 28232.0, 49698.0, 84454.0, 131496.0, 172771.0, 177100.0, 141466.0, 93614.0, 55985.0, 31840.0, 18341.0, 10076.0, 5875.0, 3441.0, 2090.0, 1288.0, 780.0, 484.0, 314.0, 218.0, 126.0, 101.0, 72.0, 60.0, 28.0, 24.0, 15.0, 15.0, 7.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.015625, -7.7579345703125, -7.500244140625, -7.2425537109375, -6.98486328125, -6.7271728515625, -6.469482421875, -6.2117919921875, -5.9541015625, -5.6964111328125, -5.438720703125, -5.1810302734375, -4.92333984375, -4.6656494140625, -4.407958984375, -4.1502685546875, -3.892578125, -3.6348876953125, -3.377197265625, -3.1195068359375, -2.86181640625, -2.6041259765625, -2.346435546875, -2.0887451171875, -1.8310546875, -1.5733642578125, -1.315673828125, -1.0579833984375, -0.80029296875, -0.5426025390625, -0.284912109375, -0.0272216796875, 0.23046875, 0.4881591796875, 0.745849609375, 1.0035400390625, 1.26123046875, 1.5189208984375, 1.776611328125, 2.0343017578125, 2.2919921875, 2.5496826171875, 2.807373046875, 3.0650634765625, 3.32275390625, 3.5804443359375, 3.838134765625, 4.0958251953125, 4.353515625, 4.6112060546875, 4.868896484375, 5.1265869140625, 5.38427734375, 5.6419677734375, 5.899658203125, 6.1573486328125, 6.4150390625, 6.6727294921875, 6.930419921875, 7.1881103515625, 7.44580078125, 7.7034912109375, 7.961181640625, 8.2188720703125, 8.4765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 5.0, 9.0, 5.0, 12.0, 14.0, 13.0, 14.0, 22.0, 21.0, 39.0, 37.0, 43.0, 42.0, 49.0, 52.0, 60.0, 47.0, 54.0, 61.0, 61.0, 45.0, 35.0, 41.0, 41.0, 33.0, 34.0, 27.0, 17.0, 18.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.42578125, -2.35546875, -2.28515625, -2.21484375, -2.14453125, -2.07421875, -2.00390625, -1.93359375, -1.86328125, -1.79296875, -1.72265625, -1.65234375, -1.58203125, -1.51171875, -1.44140625, -1.37109375, -1.30078125, -1.23046875, -1.16015625, -1.08984375, -1.01953125, -0.94921875, -0.87890625, -0.80859375, -0.73828125, -0.66796875, -0.59765625, -0.52734375, -0.45703125, -0.38671875, -0.31640625, -0.24609375, -0.17578125, -0.10546875, -0.03515625, 0.03515625, 0.10546875, 0.17578125, 0.24609375, 0.31640625, 0.38671875, 0.45703125, 0.52734375, 0.59765625, 0.66796875, 0.73828125, 0.80859375, 0.87890625, 0.94921875, 1.01953125, 1.08984375, 1.16015625, 1.23046875, 1.30078125, 1.37109375, 1.44140625, 1.51171875, 1.58203125, 1.65234375, 1.72265625, 1.79296875, 1.86328125, 1.93359375, 2.00390625, 2.07421875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 15.0, 18.0, 15.0, 30.0, 38.0, 35.0, 59.0, 64.0, 58.0, 77.0, 69.0, 75.0, 76.0, 68.0, 53.0, 43.0, 35.0, 29.0, 22.0, 20.0, 13.0, 15.0, 5.0, 9.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27089500427246, -18.551015853881836, -17.83113670349121, -17.11125946044922, -16.391380310058594, -15.671501159667969, -14.951622009277344, -14.231742858886719, -13.51186466217041, -12.791985511779785, -12.072107315063477, -11.352228164672852, -10.632349014282227, -9.912470817565918, -9.192591667175293, -8.472713470458984, -7.752834320068359, -7.032955646514893, -6.313076972961426, -5.593197822570801, -4.873319149017334, -4.153440475463867, -3.433561325073242, -2.7136826515197754, -1.9938039779663086, -1.2739251852035522, -0.5540463924407959, 0.16583251953125, 0.8857111930847168, 1.6055898666381836, 2.3254690170288086, 3.0453476905822754, 3.765228271484375, 4.485106945037842, 5.204985618591309, 5.924864768981934, 6.6447434425354, 7.364622116088867, 8.084501266479492, 8.804380416870117, 9.524258613586426, 10.24413776397705, 10.96401596069336, 11.683895111083984, 12.40377426147461, 13.123652458190918, 13.843531608581543, 14.563409805297852, 15.283288955688477, 16.0031681060791, 16.723047256469727, 17.44292449951172, 18.162803649902344, 18.88268280029297, 19.602561950683594, 20.32244110107422, 21.042320251464844, 21.76219940185547, 22.482078552246094, 23.20195770263672, 23.92183494567871, 24.641714096069336, 25.36159324645996, 26.081472396850586, 26.801349639892578]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 4.0, 9.0, 8.0, 12.0, 17.0, 15.0, 23.0, 24.0, 24.0, 31.0, 21.0, 36.0, 42.0, 45.0, 32.0, 42.0, 43.0, 47.0, 44.0, 40.0, 45.0, 35.0, 39.0, 38.0, 29.0, 24.0, 35.0, 19.0, 23.0, 22.0, 15.0, 23.0, 11.0, 16.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.428163528442383, -9.131139755249023, -8.834115982055664, -8.537092208862305, -8.240068435668945, -7.943045139312744, -7.646021366119385, -7.348998069763184, -7.051974296569824, -6.754950523376465, -6.4579267501831055, -6.160902976989746, -5.863879680633545, -5.5668559074401855, -5.269832134246826, -4.972808837890625, -4.675784587860107, -4.378760814666748, -4.081737041473389, -3.7847135066986084, -3.487689971923828, -3.1906661987304688, -2.8936424255371094, -2.596618890762329, -2.2995951175689697, -2.0025713443756104, -1.70554780960083, -1.4085240364074707, -1.1115003824234009, -0.814476728439331, -0.5174529552459717, -0.2204294204711914, 0.07659435272216797, 0.3736180365085602, 0.6706417202949524, 0.967665433883667, 1.2646890878677368, 1.5617127418518066, 1.858736515045166, 2.1557600498199463, 2.4527838230133057, 2.749807596206665, 3.0468311309814453, 3.3438549041748047, 3.640878677368164, 3.9379022121429443, 4.234926223754883, 4.531949520111084, 4.828973293304443, 5.125997066497803, 5.423020839691162, 5.720044136047363, 6.017067909240723, 6.314091682434082, 6.611115455627441, 6.908139228820801, 7.20516300201416, 7.5021867752075195, 7.799210548400879, 8.096234321594238, 8.393258094787598, 8.69028091430664, 8.9873046875, 9.28432846069336, 9.581352233886719]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 12.0, 12.0, 19.0, 48.0, 62.0, 92.0, 142.0, 250.0, 468.0, 812.0, 1442.0, 2578.0, 4815.0, 9495.0, 19446.0, 40661.0, 91648.0, 218491.0, 562537.0, 1221540.0, 1159082.0, 507554.0, 197779.0, 82172.0, 36799.0, 17538.0, 8674.0, 4359.0, 2430.0, 1369.0, 748.0, 477.0, 274.0, 150.0, 85.0, 62.0, 37.0, 21.0, 22.0, 22.0, 18.0, 9.0, 14.0, 9.0, 5.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6328125, -14.9515380859375, -14.270263671875, -13.5889892578125, -12.90771484375, -12.2264404296875, -11.545166015625, -10.8638916015625, -10.1826171875, -9.5013427734375, -8.820068359375, -8.1387939453125, -7.45751953125, -6.7762451171875, -6.094970703125, -5.4136962890625, -4.732421875, -4.0511474609375, -3.369873046875, -2.6885986328125, -2.00732421875, -1.3260498046875, -0.644775390625, 0.0364990234375, 0.7177734375, 1.3990478515625, 2.080322265625, 2.7615966796875, 3.44287109375, 4.1241455078125, 4.805419921875, 5.4866943359375, 6.16796875, 6.8492431640625, 7.530517578125, 8.2117919921875, 8.89306640625, 9.5743408203125, 10.255615234375, 10.9368896484375, 11.6181640625, 12.2994384765625, 12.980712890625, 13.6619873046875, 14.34326171875, 15.0245361328125, 15.705810546875, 16.3870849609375, 17.068359375, 17.7496337890625, 18.430908203125, 19.1121826171875, 19.79345703125, 20.4747314453125, 21.156005859375, 21.8372802734375, 22.5185546875, 23.1998291015625, 23.881103515625, 24.5623779296875, 25.24365234375, 25.9249267578125, 26.606201171875, 27.2874755859375, 27.96875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 7.0, 12.0, 13.0, 12.0, 21.0, 24.0, 23.0, 27.0, 40.0, 29.0, 35.0, 36.0, 41.0, 62.0, 57.0, 47.0, 50.0, 39.0, 46.0, 35.0, 49.0, 40.0, 45.0, 29.0, 23.0, 18.0, 23.0, 14.0, 13.0, 14.0, 14.0, 7.0, 8.0, 8.0, 7.0, 9.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.174560546875, -7.90380859375, -7.633056640625, -7.3623046875, -7.091552734375, -6.82080078125, -6.550048828125, -6.279296875, -6.008544921875, -5.73779296875, -5.467041015625, -5.1962890625, -4.925537109375, -4.65478515625, -4.384033203125, -4.11328125, -3.842529296875, -3.57177734375, -3.301025390625, -3.0302734375, -2.759521484375, -2.48876953125, -2.218017578125, -1.947265625, -1.676513671875, -1.40576171875, -1.135009765625, -0.8642578125, -0.593505859375, -0.32275390625, -0.052001953125, 0.21875, 0.489501953125, 0.76025390625, 1.031005859375, 1.3017578125, 1.572509765625, 1.84326171875, 2.114013671875, 2.384765625, 2.655517578125, 2.92626953125, 3.197021484375, 3.4677734375, 3.738525390625, 4.00927734375, 4.280029296875, 4.55078125, 4.821533203125, 5.09228515625, 5.363037109375, 5.6337890625, 5.904541015625, 6.17529296875, 6.446044921875, 6.716796875, 6.987548828125, 7.25830078125, 7.529052734375, 7.7998046875, 8.070556640625, 8.34130859375, 8.612060546875, 8.8828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 17.0, 18.0, 28.0, 37.0, 66.0, 98.0, 142.0, 239.0, 341.0, 509.0, 852.0, 1360.0, 2239.0, 3479.0, 5997.0, 10244.0, 17611.0, 32275.0, 60352.0, 113445.0, 215016.0, 405964.0, 701669.0, 922602.0, 745870.0, 442421.0, 238656.0, 124413.0, 65861.0, 35293.0, 19535.0, 11051.0, 6508.0, 3704.0, 2295.0, 1378.0, 938.0, 590.0, 395.0, 273.0, 166.0, 115.0, 73.0, 46.0, 27.0, 23.0, 13.0, 11.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.75, -17.205078125, -16.66015625, -16.115234375, -15.5703125, -15.025390625, -14.48046875, -13.935546875, -13.390625, -12.845703125, -12.30078125, -11.755859375, -11.2109375, -10.666015625, -10.12109375, -9.576171875, -9.03125, -8.486328125, -7.94140625, -7.396484375, -6.8515625, -6.306640625, -5.76171875, -5.216796875, -4.671875, -4.126953125, -3.58203125, -3.037109375, -2.4921875, -1.947265625, -1.40234375, -0.857421875, -0.3125, 0.232421875, 0.77734375, 1.322265625, 1.8671875, 2.412109375, 2.95703125, 3.501953125, 4.046875, 4.591796875, 5.13671875, 5.681640625, 6.2265625, 6.771484375, 7.31640625, 7.861328125, 8.40625, 8.951171875, 9.49609375, 10.041015625, 10.5859375, 11.130859375, 11.67578125, 12.220703125, 12.765625, 13.310546875, 13.85546875, 14.400390625, 14.9453125, 15.490234375, 16.03515625, 16.580078125, 17.125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 11.0, 19.0, 16.0, 23.0, 35.0, 52.0, 59.0, 56.0, 99.0, 135.0, 125.0, 173.0, 239.0, 285.0, 303.0, 324.0, 273.0, 286.0, 281.0, 251.0, 210.0, 184.0, 131.0, 126.0, 80.0, 68.0, 48.0, 42.0, 27.0, 29.0, 20.0, 11.0, 11.0, 12.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.1473388671875, -5.962646484375, -5.7779541015625, -5.59326171875, -5.4085693359375, -5.223876953125, -5.0391845703125, -4.8544921875, -4.6697998046875, -4.485107421875, -4.3004150390625, -4.11572265625, -3.9310302734375, -3.746337890625, -3.5616455078125, -3.376953125, -3.1922607421875, -3.007568359375, -2.8228759765625, -2.63818359375, -2.4534912109375, -2.268798828125, -2.0841064453125, -1.8994140625, -1.7147216796875, -1.530029296875, -1.3453369140625, -1.16064453125, -0.9759521484375, -0.791259765625, -0.6065673828125, -0.421875, -0.2371826171875, -0.052490234375, 0.1322021484375, 0.31689453125, 0.5015869140625, 0.686279296875, 0.8709716796875, 1.0556640625, 1.2403564453125, 1.425048828125, 1.6097412109375, 1.79443359375, 1.9791259765625, 2.163818359375, 2.3485107421875, 2.533203125, 2.7178955078125, 2.902587890625, 3.0872802734375, 3.27197265625, 3.4566650390625, 3.641357421875, 3.8260498046875, 4.0107421875, 4.1954345703125, 4.380126953125, 4.5648193359375, 4.74951171875, 4.9342041015625, 5.118896484375, 5.3035888671875, 5.48828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 8.0, 5.0, 9.0, 13.0, 17.0, 14.0, 19.0, 28.0, 27.0, 41.0, 49.0, 48.0, 63.0, 56.0, 68.0, 82.0, 60.0, 52.0, 67.0, 47.0, 38.0, 36.0, 35.0, 19.0, 21.0, 17.0, 13.0, 5.0, 9.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.768938064575195, -20.087682723999023, -19.406429290771484, -18.725173950195312, -18.04391860961914, -17.36266326904297, -16.68140983581543, -16.000154495239258, -15.318899154663086, -14.63764476776123, -13.956389427185059, -13.275135040283203, -12.593879699707031, -11.912625312805176, -11.23137092590332, -10.550115585327148, -9.868861198425293, -9.187606811523438, -8.506351470947266, -7.82509708404541, -7.143841743469238, -6.462587356567383, -5.781332492828369, -5.1000776290893555, -4.418822765350342, -3.737567901611328, -3.0563130378723145, -2.37505841255188, -1.6938035488128662, -1.0125486850738525, -0.33129405975341797, 0.3499608039855957, 1.0312156677246094, 1.712470531463623, 2.3937253952026367, 3.0749800205230713, 3.756234884262085, 4.4374895095825195, 5.118744373321533, 5.799999237060547, 6.4812541007995605, 7.162508964538574, 7.843763828277588, 8.525018692016602, 9.206273078918457, 9.887528419494629, 10.568782806396484, 11.250038146972656, 11.931292533874512, 12.612546920776367, 13.293802261352539, 13.975056648254395, 14.656311988830566, 15.337566375732422, 16.018821716308594, 16.700077056884766, 17.381330490112305, 18.062585830688477, 18.743839263916016, 19.425094604492188, 20.10634994506836, 20.78760528564453, 21.46885871887207, 22.150114059448242, 22.831369400024414]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 8.0, 3.0, 4.0, 11.0, 10.0, 6.0, 13.0, 13.0, 15.0, 14.0, 27.0, 21.0, 20.0, 28.0, 23.0, 31.0, 39.0, 35.0, 41.0, 25.0, 48.0, 41.0, 41.0, 42.0, 34.0, 37.0, 40.0, 29.0, 34.0, 27.0, 27.0, 27.0, 19.0, 35.0, 18.0, 15.0, 16.0, 17.0, 14.0, 10.0, 14.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9055757522583, -8.616514205932617, -8.327452659606934, -8.03839111328125, -7.749330043792725, -7.460268497467041, -7.171207427978516, -6.882145881652832, -6.593084335327148, -6.304022789001465, -6.014961242675781, -5.725900173187256, -5.436838626861572, -5.147777080535889, -4.858716011047363, -4.56965446472168, -4.280592918395996, -3.9915313720703125, -3.702470064163208, -3.4134087562561035, -3.12434720993042, -2.8352856636047363, -2.546224355697632, -2.2571630477905273, -1.9681015014648438, -1.6790400743484497, -1.3899786472320557, -1.1009172201156616, -0.8118557929992676, -0.5227943658828735, -0.2337329387664795, 0.055328369140625, 0.3443889617919922, 0.6334503889083862, 0.9225118160247803, 1.2115732431411743, 1.5006346702575684, 1.7896960973739624, 2.0787575244903564, 2.367818832397461, 2.6568803787231445, 2.945941925048828, 3.2350032329559326, 3.524064540863037, 3.8131260871887207, 4.102187633514404, 4.39124870300293, 4.680310249328613, 4.969371795654297, 5.2584333419799805, 5.547494888305664, 5.8365559577941895, 6.125617504119873, 6.414679050445557, 6.703740119934082, 6.992801666259766, 7.281863212585449, 7.570924758911133, 7.859986305236816, 8.1490478515625, 8.438108444213867, 8.72716999053955, 9.016231536865234, 9.305293083190918, 9.594354629516602]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 20.0, 35.0, 43.0, 69.0, 89.0, 128.0, 183.0, 255.0, 385.0, 543.0, 759.0, 1159.0, 1733.0, 2870.0, 4818.0, 8386.0, 15661.0, 29984.0, 58548.0, 107101.0, 172408.0, 210186.0, 180176.0, 115927.0, 63809.0, 32901.0, 17255.0, 9319.0, 5015.0, 3064.0, 1860.0, 1196.0, 803.0, 568.0, 346.0, 287.0, 179.0, 146.0, 98.0, 70.0, 45.0, 27.0, 21.0, 11.0, 14.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.1868896484375, -9.803466796875, -9.4200439453125, -9.03662109375, -8.6531982421875, -8.269775390625, -7.8863525390625, -7.5029296875, -7.1195068359375, -6.736083984375, -6.3526611328125, -5.96923828125, -5.5858154296875, -5.202392578125, -4.8189697265625, -4.435546875, -4.0521240234375, -3.668701171875, -3.2852783203125, -2.90185546875, -2.5184326171875, -2.135009765625, -1.7515869140625, -1.3681640625, -0.9847412109375, -0.601318359375, -0.2178955078125, 0.16552734375, 0.5489501953125, 0.932373046875, 1.3157958984375, 1.69921875, 2.0826416015625, 2.466064453125, 2.8494873046875, 3.23291015625, 3.6163330078125, 3.999755859375, 4.3831787109375, 4.7666015625, 5.1500244140625, 5.533447265625, 5.9168701171875, 6.30029296875, 6.6837158203125, 7.067138671875, 7.4505615234375, 7.833984375, 8.2174072265625, 8.600830078125, 8.9842529296875, 9.36767578125, 9.7510986328125, 10.134521484375, 10.5179443359375, 10.9013671875, 11.2847900390625, 11.668212890625, 12.0516357421875, 12.43505859375, 12.8184814453125, 13.201904296875, 13.5853271484375, 13.96875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 17.0, 16.0, 8.0, 17.0, 18.0, 20.0, 24.0, 36.0, 34.0, 34.0, 48.0, 44.0, 41.0, 50.0, 35.0, 46.0, 41.0, 43.0, 37.0, 44.0, 32.0, 35.0, 30.0, 34.0, 24.0, 32.0, 26.0, 14.0, 21.0, 15.0, 10.0, 8.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7578125, -10.3970947265625, -10.036376953125, -9.6756591796875, -9.31494140625, -8.9542236328125, -8.593505859375, -8.2327880859375, -7.8720703125, -7.5113525390625, -7.150634765625, -6.7899169921875, -6.42919921875, -6.0684814453125, -5.707763671875, -5.3470458984375, -4.986328125, -4.6256103515625, -4.264892578125, -3.9041748046875, -3.54345703125, -3.1827392578125, -2.822021484375, -2.4613037109375, -2.1005859375, -1.7398681640625, -1.379150390625, -1.0184326171875, -0.65771484375, -0.2969970703125, 0.063720703125, 0.4244384765625, 0.78515625, 1.1458740234375, 1.506591796875, 1.8673095703125, 2.22802734375, 2.5887451171875, 2.949462890625, 3.3101806640625, 3.6708984375, 4.0316162109375, 4.392333984375, 4.7530517578125, 5.11376953125, 5.4744873046875, 5.835205078125, 6.1959228515625, 6.556640625, 6.9173583984375, 7.278076171875, 7.6387939453125, 7.99951171875, 8.3602294921875, 8.720947265625, 9.0816650390625, 9.4423828125, 9.8031005859375, 10.163818359375, 10.5245361328125, 10.88525390625, 11.2459716796875, 11.606689453125, 11.9674072265625, 12.328125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 14.0, 12.0, 12.0, 14.0, 28.0, 37.0, 47.0, 53.0, 62.0, 101.0, 135.0, 182.0, 234.0, 339.0, 513.0, 963.0, 1924.0, 5046.0, 16143.0, 64834.0, 286758.0, 475723.0, 146123.0, 33000.0, 9274.0, 3259.0, 1488.0, 718.0, 386.0, 303.0, 222.0, 149.0, 112.0, 100.0, 58.0, 49.0, 41.0, 25.0, 11.0, 26.0, 4.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.205322265625, -27.20751953125, -26.209716796875, -25.2119140625, -24.214111328125, -23.21630859375, -22.218505859375, -21.220703125, -20.222900390625, -19.22509765625, -18.227294921875, -17.2294921875, -16.231689453125, -15.23388671875, -14.236083984375, -13.23828125, -12.240478515625, -11.24267578125, -10.244873046875, -9.2470703125, -8.249267578125, -7.25146484375, -6.253662109375, -5.255859375, -4.258056640625, -3.26025390625, -2.262451171875, -1.2646484375, -0.266845703125, 0.73095703125, 1.728759765625, 2.7265625, 3.724365234375, 4.72216796875, 5.719970703125, 6.7177734375, 7.715576171875, 8.71337890625, 9.711181640625, 10.708984375, 11.706787109375, 12.70458984375, 13.702392578125, 14.7001953125, 15.697998046875, 16.69580078125, 17.693603515625, 18.69140625, 19.689208984375, 20.68701171875, 21.684814453125, 22.6826171875, 23.680419921875, 24.67822265625, 25.676025390625, 26.673828125, 27.671630859375, 28.66943359375, 29.667236328125, 30.6650390625, 31.662841796875, 32.66064453125, 33.658447265625, 34.65625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 13.0, 8.0, 15.0, 18.0, 20.0, 28.0, 22.0, 24.0, 25.0, 27.0, 30.0, 46.0, 32.0, 39.0, 40.0, 39.0, 48.0, 45.0, 49.0, 36.0, 29.0, 40.0, 24.0, 41.0, 26.0, 28.0, 23.0, 22.0, 19.0, 18.0, 13.0, 12.0, 14.0, 13.0, 8.0, 14.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.492919921875, -5.30224609375, -5.111572265625, -4.9208984375, -4.730224609375, -4.53955078125, -4.348876953125, -4.158203125, -3.967529296875, -3.77685546875, -3.586181640625, -3.3955078125, -3.204833984375, -3.01416015625, -2.823486328125, -2.6328125, -2.442138671875, -2.25146484375, -2.060791015625, -1.8701171875, -1.679443359375, -1.48876953125, -1.298095703125, -1.107421875, -0.916748046875, -0.72607421875, -0.535400390625, -0.3447265625, -0.154052734375, 0.03662109375, 0.227294921875, 0.41796875, 0.608642578125, 0.79931640625, 0.989990234375, 1.1806640625, 1.371337890625, 1.56201171875, 1.752685546875, 1.943359375, 2.134033203125, 2.32470703125, 2.515380859375, 2.7060546875, 2.896728515625, 3.08740234375, 3.278076171875, 3.46875, 3.659423828125, 3.85009765625, 4.040771484375, 4.2314453125, 4.422119140625, 4.61279296875, 4.803466796875, 4.994140625, 5.184814453125, 5.37548828125, 5.566162109375, 5.7568359375, 5.947509765625, 6.13818359375, 6.328857421875, 6.51953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 18.0, 17.0, 23.0, 45.0, 55.0, 86.0, 119.0, 162.0, 226.0, 320.0, 458.0, 730.0, 1018.0, 1481.0, 2234.0, 3656.0, 6863.0, 19218.0, 81617.0, 399956.0, 408475.0, 84306.0, 19959.0, 7002.0, 3571.0, 2224.0, 1458.0, 1026.0, 686.0, 469.0, 315.0, 240.0, 155.0, 103.0, 76.0, 56.0, 46.0, 29.0, 12.0, 13.0, 14.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-20.09375, -19.519775390625, -18.94580078125, -18.371826171875, -17.7978515625, -17.223876953125, -16.64990234375, -16.075927734375, -15.501953125, -14.927978515625, -14.35400390625, -13.780029296875, -13.2060546875, -12.632080078125, -12.05810546875, -11.484130859375, -10.91015625, -10.336181640625, -9.76220703125, -9.188232421875, -8.6142578125, -8.040283203125, -7.46630859375, -6.892333984375, -6.318359375, -5.744384765625, -5.17041015625, -4.596435546875, -4.0224609375, -3.448486328125, -2.87451171875, -2.300537109375, -1.7265625, -1.152587890625, -0.57861328125, -0.004638671875, 0.5693359375, 1.143310546875, 1.71728515625, 2.291259765625, 2.865234375, 3.439208984375, 4.01318359375, 4.587158203125, 5.1611328125, 5.735107421875, 6.30908203125, 6.883056640625, 7.45703125, 8.031005859375, 8.60498046875, 9.178955078125, 9.7529296875, 10.326904296875, 10.90087890625, 11.474853515625, 12.048828125, 12.622802734375, 13.19677734375, 13.770751953125, 14.3447265625, 14.918701171875, 15.49267578125, 16.066650390625, 16.640625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 14.0, 14.0, 10.0, 22.0, 55.0, 78.0, 120.0, 151.0, 142.0, 136.0, 97.0, 64.0, 38.0, 22.0, 10.0, 9.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011377334594726562, -0.0011100620031356812, -0.001082390546798706, -0.001054719090461731, -0.0010270476341247559, -0.0009993761777877808, -0.0009717047214508057, -0.0009440332651138306, -0.0009163618087768555, -0.0008886903524398804, -0.0008610188961029053, -0.0008333474397659302, -0.0008056759834289551, -0.00077800452709198, -0.0007503330707550049, -0.0007226616144180298, -0.0006949901580810547, -0.0006673187017440796, -0.0006396472454071045, -0.0006119757890701294, -0.0005843043327331543, -0.0005566328763961792, -0.0005289614200592041, -0.000501289963722229, -0.0004736185073852539, -0.0004459470510482788, -0.0004182755947113037, -0.0003906041383743286, -0.0003629326820373535, -0.0003352612257003784, -0.0003075897693634033, -0.0002799183130264282, -0.0002522468566894531, -0.00022457540035247803, -0.00019690394401550293, -0.00016923248767852783, -0.00014156103134155273, -0.00011388957500457764, -8.621811866760254e-05, -5.854666233062744e-05, -3.0875205993652344e-05, -3.203749656677246e-06, 2.446770668029785e-05, 5.213916301727295e-05, 7.981061935424805e-05, 0.00010748207569122314, 0.00013515353202819824, 0.00016282498836517334, 0.00019049644470214844, 0.00021816790103912354, 0.00024583935737609863, 0.00027351081371307373, 0.00030118227005004883, 0.0003288537263870239, 0.000356525182723999, 0.0003841966390609741, 0.0004118680953979492, 0.0004395395517349243, 0.0004672110080718994, 0.0004948824644088745, 0.0005225539207458496, 0.0005502253770828247, 0.0005778968334197998, 0.0006055682897567749, 0.00063323974609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 9.0, 21.0, 16.0, 21.0, 35.0, 55.0, 64.0, 100.0, 166.0, 196.0, 274.0, 363.0, 514.0, 721.0, 951.0, 1327.0, 1801.0, 2541.0, 3843.0, 7418.0, 24394.0, 125070.0, 452066.0, 326521.0, 68192.0, 14916.0, 5541.0, 3286.0, 2219.0, 1556.0, 1219.0, 858.0, 617.0, 445.0, 323.0, 254.0, 156.0, 133.0, 103.0, 74.0, 41.0, 43.0, 28.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.140625, -15.599365234375, -15.05810546875, -14.516845703125, -13.9755859375, -13.434326171875, -12.89306640625, -12.351806640625, -11.810546875, -11.269287109375, -10.72802734375, -10.186767578125, -9.6455078125, -9.104248046875, -8.56298828125, -8.021728515625, -7.48046875, -6.939208984375, -6.39794921875, -5.856689453125, -5.3154296875, -4.774169921875, -4.23291015625, -3.691650390625, -3.150390625, -2.609130859375, -2.06787109375, -1.526611328125, -0.9853515625, -0.444091796875, 0.09716796875, 0.638427734375, 1.1796875, 1.720947265625, 2.26220703125, 2.803466796875, 3.3447265625, 3.885986328125, 4.42724609375, 4.968505859375, 5.509765625, 6.051025390625, 6.59228515625, 7.133544921875, 7.6748046875, 8.216064453125, 8.75732421875, 9.298583984375, 9.83984375, 10.381103515625, 10.92236328125, 11.463623046875, 12.0048828125, 12.546142578125, 13.08740234375, 13.628662109375, 14.169921875, 14.711181640625, 15.25244140625, 15.793701171875, 16.3349609375, 16.876220703125, 17.41748046875, 17.958740234375, 18.5]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 22.0, 30.0, 47.0, 101.0, 127.0, 134.0, 151.0, 126.0, 89.0, 51.0, 37.0, 20.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.44140625, -4.314208984375, -4.18701171875, -4.059814453125, -3.9326171875, -3.805419921875, -3.67822265625, -3.551025390625, -3.423828125, -3.296630859375, -3.16943359375, -3.042236328125, -2.9150390625, -2.787841796875, -2.66064453125, -2.533447265625, -2.40625, -2.279052734375, -2.15185546875, -2.024658203125, -1.8974609375, -1.770263671875, -1.64306640625, -1.515869140625, -1.388671875, -1.261474609375, -1.13427734375, -1.007080078125, -0.8798828125, -0.752685546875, -0.62548828125, -0.498291015625, -0.37109375, -0.243896484375, -0.11669921875, 0.010498046875, 0.1376953125, 0.264892578125, 0.39208984375, 0.519287109375, 0.646484375, 0.773681640625, 0.90087890625, 1.028076171875, 1.1552734375, 1.282470703125, 1.40966796875, 1.536865234375, 1.6640625, 1.791259765625, 1.91845703125, 2.045654296875, 2.1728515625, 2.300048828125, 2.42724609375, 2.554443359375, 2.681640625, 2.808837890625, 2.93603515625, 3.063232421875, 3.1904296875, 3.317626953125, 3.44482421875, 3.572021484375, 3.69921875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 19.0, 14.0, 24.0, 28.0, 24.0, 41.0, 33.0, 47.0, 63.0, 63.0, 66.0, 82.0, 65.0, 59.0, 43.0, 51.0, 43.0, 35.0, 25.0, 32.0, 24.0, 11.0, 11.0, 15.0, 11.0, 3.0, 8.0, 9.0, 0.0, 7.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.522510528564453, -16.86768341064453, -16.212858200073242, -15.558032035827637, -14.903205871582031, -14.248379707336426, -13.59355354309082, -12.938727378845215, -12.28390121459961, -11.629075050354004, -10.974248886108398, -10.319422721862793, -9.664596557617188, -9.009770393371582, -8.354944229125977, -7.700118064880371, -7.045291900634766, -6.39046573638916, -5.735639572143555, -5.080813407897949, -4.425987243652344, -3.7711610794067383, -3.116334915161133, -2.4615087509155273, -1.8066825866699219, -1.1518564224243164, -0.49703025817871094, 0.15779590606689453, 0.8126220703125, 1.4674482345581055, 2.122274398803711, 2.7771005630493164, 3.4319286346435547, 4.08675479888916, 4.741580963134766, 5.396407127380371, 6.051233291625977, 6.706059455871582, 7.3608856201171875, 8.015711784362793, 8.670537948608398, 9.325364112854004, 9.98019027709961, 10.635016441345215, 11.28984260559082, 11.944668769836426, 12.599494934082031, 13.254321098327637, 13.909147262573242, 14.563973426818848, 15.218799591064453, 15.873625755310059, 16.528451919555664, 17.183277130126953, 17.838104248046875, 18.492931365966797, 19.147756576538086, 19.802581787109375, 20.457408905029297, 21.11223602294922, 21.767061233520508, 22.421886444091797, 23.07671356201172, 23.73154067993164, 24.38636589050293]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 12.0, 8.0, 7.0, 19.0, 12.0, 12.0, 18.0, 23.0, 18.0, 23.0, 23.0, 31.0, 26.0, 32.0, 37.0, 39.0, 33.0, 44.0, 45.0, 34.0, 38.0, 48.0, 34.0, 35.0, 40.0, 29.0, 36.0, 27.0, 22.0, 25.0, 14.0, 26.0, 15.0, 15.0, 17.0, 14.0, 22.0, 8.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.298133850097656, -8.011815071105957, -7.725496292114258, -7.439177513122559, -7.152858734130859, -6.86653995513916, -6.580220699310303, -6.2939019203186035, -6.007583141326904, -5.721264362335205, -5.434945583343506, -5.148626804351807, -4.862307548522949, -4.57598876953125, -4.289669990539551, -4.003351211547852, -3.7170324325561523, -3.430713653564453, -3.144394874572754, -2.8580758571624756, -2.5717570781707764, -2.285438299179077, -1.9991194009780884, -1.7128005027770996, -1.4264817237854004, -1.1401629447937012, -0.8538440465927124, -0.5675252079963684, -0.2812063694000244, 0.005112409591674805, 0.2914313077926636, 0.5777502059936523, 0.8640689849853516, 1.1503877639770508, 1.4367066621780396, 1.7230255603790283, 2.0093443393707275, 2.2956631183624268, 2.581982135772705, 2.8683009147644043, 3.1546196937561035, 3.4409384727478027, 3.727257251739502, 4.013576030731201, 4.299895286560059, 4.586214065551758, 4.872532844543457, 5.158851623535156, 5.4451704025268555, 5.731489181518555, 6.017807960510254, 6.304126739501953, 6.590445518493652, 6.876764297485352, 7.163083553314209, 7.449402332305908, 7.735721111297607, 8.022040367126465, 8.308359146118164, 8.594677925109863, 8.880996704101562, 9.167315483093262, 9.453634262084961, 9.73995304107666, 10.02627182006836]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 5.0, 5.0, 6.0, 8.0, 11.0, 21.0, 28.0, 50.0, 97.0, 179.0, 314.0, 478.0, 1031.0, 2023.0, 4468.0, 9856.0, 22085.0, 49816.0, 106576.0, 191657.0, 243619.0, 200656.0, 115732.0, 55214.0, 24283.0, 10727.0, 4857.0, 2348.0, 1082.0, 572.0, 347.0, 167.0, 91.0, 51.0, 35.0, 18.0, 16.0, 14.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.76123046875, -21.9912109375, -21.22119140625, -20.451171875, -19.68115234375, -18.9111328125, -18.14111328125, -17.37109375, -16.60107421875, -15.8310546875, -15.06103515625, -14.291015625, -13.52099609375, -12.7509765625, -11.98095703125, -11.2109375, -10.44091796875, -9.6708984375, -8.90087890625, -8.130859375, -7.36083984375, -6.5908203125, -5.82080078125, -5.05078125, -4.28076171875, -3.5107421875, -2.74072265625, -1.970703125, -1.20068359375, -0.4306640625, 0.33935546875, 1.109375, 1.87939453125, 2.6494140625, 3.41943359375, 4.189453125, 4.95947265625, 5.7294921875, 6.49951171875, 7.26953125, 8.03955078125, 8.8095703125, 9.57958984375, 10.349609375, 11.11962890625, 11.8896484375, 12.65966796875, 13.4296875, 14.19970703125, 14.9697265625, 15.73974609375, 16.509765625, 17.27978515625, 18.0498046875, 18.81982421875, 19.58984375, 20.35986328125, 21.1298828125, 21.89990234375, 22.669921875, 23.43994140625, 24.2099609375, 24.97998046875, 25.75]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 16.0, 13.0, 25.0, 25.0, 15.0, 18.0, 37.0, 25.0, 37.0, 47.0, 44.0, 59.0, 56.0, 54.0, 58.0, 49.0, 53.0, 50.0, 31.0, 34.0, 31.0, 37.0, 34.0, 24.0, 24.0, 17.0, 24.0, 10.0, 9.0, 7.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.5062255859375, -9.098388671875, -8.6905517578125, -8.28271484375, -7.8748779296875, -7.467041015625, -7.0592041015625, -6.6513671875, -6.2435302734375, -5.835693359375, -5.4278564453125, -5.02001953125, -4.6121826171875, -4.204345703125, -3.7965087890625, -3.388671875, -2.9808349609375, -2.572998046875, -2.1651611328125, -1.75732421875, -1.3494873046875, -0.941650390625, -0.5338134765625, -0.1259765625, 0.2818603515625, 0.689697265625, 1.0975341796875, 1.50537109375, 1.9132080078125, 2.321044921875, 2.7288818359375, 3.13671875, 3.5445556640625, 3.952392578125, 4.3602294921875, 4.76806640625, 5.1759033203125, 5.583740234375, 5.9915771484375, 6.3994140625, 6.8072509765625, 7.215087890625, 7.6229248046875, 8.03076171875, 8.4385986328125, 8.846435546875, 9.2542724609375, 9.662109375, 10.0699462890625, 10.477783203125, 10.8856201171875, 11.29345703125, 11.7012939453125, 12.109130859375, 12.5169677734375, 12.9248046875, 13.3326416015625, 13.740478515625, 14.1483154296875, 14.55615234375, 14.9639892578125, 15.371826171875, 15.7796630859375, 16.1875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 9.0, 4.0, 22.0, 21.0, 29.0, 32.0, 52.0, 96.0, 137.0, 216.0, 302.0, 526.0, 731.0, 1140.0, 1783.0, 2701.0, 4409.0, 6682.0, 10563.0, 16257.0, 25016.0, 37983.0, 55527.0, 76937.0, 99498.0, 118346.0, 126291.0, 118813.0, 100309.0, 77414.0, 56051.0, 38819.0, 25400.0, 16689.0, 10635.0, 6780.0, 4314.0, 2770.0, 1868.0, 1176.0, 715.0, 472.0, 345.0, 214.0, 151.0, 105.0, 75.0, 41.0, 27.0, 23.0, 11.0, 9.0, 8.0, 7.0, 6.0, 1.0, 0.0, 5.0], "bins": [-13.0078125, -12.6077880859375, -12.207763671875, -11.8077392578125, -11.40771484375, -11.0076904296875, -10.607666015625, -10.2076416015625, -9.8076171875, -9.4075927734375, -9.007568359375, -8.6075439453125, -8.20751953125, -7.8074951171875, -7.407470703125, -7.0074462890625, -6.607421875, -6.2073974609375, -5.807373046875, -5.4073486328125, -5.00732421875, -4.6072998046875, -4.207275390625, -3.8072509765625, -3.4072265625, -3.0072021484375, -2.607177734375, -2.2071533203125, -1.80712890625, -1.4071044921875, -1.007080078125, -0.6070556640625, -0.20703125, 0.1929931640625, 0.593017578125, 0.9930419921875, 1.39306640625, 1.7930908203125, 2.193115234375, 2.5931396484375, 2.9931640625, 3.3931884765625, 3.793212890625, 4.1932373046875, 4.59326171875, 4.9932861328125, 5.393310546875, 5.7933349609375, 6.193359375, 6.5933837890625, 6.993408203125, 7.3934326171875, 7.79345703125, 8.1934814453125, 8.593505859375, 8.9935302734375, 9.3935546875, 9.7935791015625, 10.193603515625, 10.5936279296875, 10.99365234375, 11.3936767578125, 11.793701171875, 12.1937255859375, 12.59375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 5.0, 8.0, 2.0, 8.0, 12.0, 14.0, 17.0, 9.0, 19.0, 19.0, 27.0, 21.0, 35.0, 29.0, 28.0, 29.0, 39.0, 43.0, 54.0, 42.0, 40.0, 42.0, 34.0, 38.0, 45.0, 45.0, 40.0, 31.0, 22.0, 29.0, 29.0, 29.0, 18.0, 21.0, 16.0, 9.0, 7.0, 7.0, 6.0, 6.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.2720947265625, -6.071533203125, -5.8709716796875, -5.67041015625, -5.4698486328125, -5.269287109375, -5.0687255859375, -4.8681640625, -4.6676025390625, -4.467041015625, -4.2664794921875, -4.06591796875, -3.8653564453125, -3.664794921875, -3.4642333984375, -3.263671875, -3.0631103515625, -2.862548828125, -2.6619873046875, -2.46142578125, -2.2608642578125, -2.060302734375, -1.8597412109375, -1.6591796875, -1.4586181640625, -1.258056640625, -1.0574951171875, -0.85693359375, -0.6563720703125, -0.455810546875, -0.2552490234375, -0.0546875, 0.1458740234375, 0.346435546875, 0.5469970703125, 0.74755859375, 0.9481201171875, 1.148681640625, 1.3492431640625, 1.5498046875, 1.7503662109375, 1.950927734375, 2.1514892578125, 2.35205078125, 2.5526123046875, 2.753173828125, 2.9537353515625, 3.154296875, 3.3548583984375, 3.555419921875, 3.7559814453125, 3.95654296875, 4.1571044921875, 4.357666015625, 4.5582275390625, 4.7587890625, 4.9593505859375, 5.159912109375, 5.3604736328125, 5.56103515625, 5.7615966796875, 5.962158203125, 6.1627197265625, 6.36328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 12.0, 21.0, 17.0, 17.0, 30.0, 58.0, 63.0, 121.0, 163.0, 248.0, 339.0, 449.0, 642.0, 964.0, 1292.0, 1971.0, 2881.0, 4419.0, 6555.0, 10464.0, 16818.0, 28832.0, 51259.0, 93271.0, 163058.0, 218812.0, 184976.0, 111549.0, 60731.0, 33922.0, 19858.0, 12051.0, 7425.0, 4889.0, 3290.0, 2127.0, 1514.0, 1062.0, 734.0, 501.0, 343.0, 257.0, 177.0, 120.0, 78.0, 60.0, 29.0, 31.0, 25.0, 8.0, 10.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0], "bins": [-10.828125, -10.4859619140625, -10.143798828125, -9.8016357421875, -9.45947265625, -9.1173095703125, -8.775146484375, -8.4329833984375, -8.0908203125, -7.7486572265625, -7.406494140625, -7.0643310546875, -6.72216796875, -6.3800048828125, -6.037841796875, -5.6956787109375, -5.353515625, -5.0113525390625, -4.669189453125, -4.3270263671875, -3.98486328125, -3.6427001953125, -3.300537109375, -2.9583740234375, -2.6162109375, -2.2740478515625, -1.931884765625, -1.5897216796875, -1.24755859375, -0.9053955078125, -0.563232421875, -0.2210693359375, 0.12109375, 0.4632568359375, 0.805419921875, 1.1475830078125, 1.48974609375, 1.8319091796875, 2.174072265625, 2.5162353515625, 2.8583984375, 3.2005615234375, 3.542724609375, 3.8848876953125, 4.22705078125, 4.5692138671875, 4.911376953125, 5.2535400390625, 5.595703125, 5.9378662109375, 6.280029296875, 6.6221923828125, 6.96435546875, 7.3065185546875, 7.648681640625, 7.9908447265625, 8.3330078125, 8.6751708984375, 9.017333984375, 9.3594970703125, 9.70166015625, 10.0438232421875, 10.385986328125, 10.7281494140625, 11.0703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 6.0, 7.0, 11.0, 8.0, 12.0, 22.0, 14.0, 29.0, 28.0, 57.0, 50.0, 56.0, 57.0, 71.0, 77.0, 100.0, 73.0, 55.0, 44.0, 44.0, 27.0, 22.0, 17.0, 24.0, 15.0, 8.0, 13.0, 10.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00109100341796875, -0.0010495781898498535, -0.001008152961730957, -0.0009667277336120605, -0.0009253025054931641, -0.0008838772773742676, -0.0008424520492553711, -0.0008010268211364746, -0.0007596015930175781, -0.0007181763648986816, -0.0006767511367797852, -0.0006353259086608887, -0.0005939006805419922, -0.0005524754524230957, -0.0005110502243041992, -0.00046962499618530273, -0.00042819976806640625, -0.00038677453994750977, -0.0003453493118286133, -0.0003039240837097168, -0.0002624988555908203, -0.00022107362747192383, -0.00017964839935302734, -0.00013822317123413086, -9.679794311523438e-05, -5.537271499633789e-05, -1.3947486877441406e-05, 2.7477741241455078e-05, 6.890296936035156e-05, 0.00011032819747924805, 0.00015175342559814453, 0.00019317865371704102, 0.0002346038818359375, 0.000276029109954834, 0.00031745433807373047, 0.00035887956619262695, 0.00040030479431152344, 0.0004417300224304199, 0.0004831552505493164, 0.0005245804786682129, 0.0005660057067871094, 0.0006074309349060059, 0.0006488561630249023, 0.0006902813911437988, 0.0007317066192626953, 0.0007731318473815918, 0.0008145570755004883, 0.0008559823036193848, 0.0008974075317382812, 0.0009388327598571777, 0.0009802579879760742, 0.0010216832160949707, 0.0010631084442138672, 0.0011045336723327637, 0.0011459589004516602, 0.0011873841285705566, 0.0012288093566894531, 0.0012702345848083496, 0.001311659812927246, 0.0013530850410461426, 0.001394510269165039, 0.0014359354972839355, 0.001477360725402832, 0.0015187859535217285, 0.001560211181640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 10.0, 16.0, 5.0, 29.0, 39.0, 52.0, 86.0, 112.0, 176.0, 278.0, 392.0, 575.0, 912.0, 1446.0, 2186.0, 3577.0, 5569.0, 9457.0, 16076.0, 28420.0, 51911.0, 95075.0, 160080.0, 210813.0, 187389.0, 119923.0, 66760.0, 36362.0, 20359.0, 11595.0, 6928.0, 4250.0, 2686.0, 1730.0, 1117.0, 745.0, 489.0, 306.0, 205.0, 148.0, 87.0, 55.0, 41.0, 37.0, 15.0, 16.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.2734375, -8.971435546875, -8.66943359375, -8.367431640625, -8.0654296875, -7.763427734375, -7.46142578125, -7.159423828125, -6.857421875, -6.555419921875, -6.25341796875, -5.951416015625, -5.6494140625, -5.347412109375, -5.04541015625, -4.743408203125, -4.44140625, -4.139404296875, -3.83740234375, -3.535400390625, -3.2333984375, -2.931396484375, -2.62939453125, -2.327392578125, -2.025390625, -1.723388671875, -1.42138671875, -1.119384765625, -0.8173828125, -0.515380859375, -0.21337890625, 0.088623046875, 0.390625, 0.692626953125, 0.99462890625, 1.296630859375, 1.5986328125, 1.900634765625, 2.20263671875, 2.504638671875, 2.806640625, 3.108642578125, 3.41064453125, 3.712646484375, 4.0146484375, 4.316650390625, 4.61865234375, 4.920654296875, 5.22265625, 5.524658203125, 5.82666015625, 6.128662109375, 6.4306640625, 6.732666015625, 7.03466796875, 7.336669921875, 7.638671875, 7.940673828125, 8.24267578125, 8.544677734375, 8.8466796875, 9.148681640625, 9.45068359375, 9.752685546875, 10.0546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 10.0, 10.0, 16.0, 13.0, 22.0, 25.0, 25.0, 36.0, 45.0, 60.0, 73.0, 70.0, 77.0, 84.0, 72.0, 68.0, 46.0, 53.0, 35.0, 26.0, 24.0, 25.0, 11.0, 9.0, 9.0, 13.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.20703125, -3.10699462890625, -3.0069580078125, -2.90692138671875, -2.806884765625, -2.70684814453125, -2.6068115234375, -2.50677490234375, -2.40673828125, -2.30670166015625, -2.2066650390625, -2.10662841796875, -2.006591796875, -1.90655517578125, -1.8065185546875, -1.70648193359375, -1.6064453125, -1.50640869140625, -1.4063720703125, -1.30633544921875, -1.206298828125, -1.10626220703125, -1.0062255859375, -0.90618896484375, -0.80615234375, -0.70611572265625, -0.6060791015625, -0.50604248046875, -0.406005859375, -0.30596923828125, -0.2059326171875, -0.10589599609375, -0.005859375, 0.09417724609375, 0.1942138671875, 0.29425048828125, 0.394287109375, 0.49432373046875, 0.5943603515625, 0.69439697265625, 0.79443359375, 0.89447021484375, 0.9945068359375, 1.09454345703125, 1.194580078125, 1.29461669921875, 1.3946533203125, 1.49468994140625, 1.5947265625, 1.69476318359375, 1.7947998046875, 1.89483642578125, 1.994873046875, 2.09490966796875, 2.1949462890625, 2.29498291015625, 2.39501953125, 2.49505615234375, 2.5950927734375, 2.69512939453125, 2.795166015625, 2.89520263671875, 2.9952392578125, 3.09527587890625, 3.1953125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 5.0, 12.0, 17.0, 16.0, 20.0, 22.0, 27.0, 35.0, 48.0, 41.0, 58.0, 56.0, 64.0, 77.0, 77.0, 58.0, 48.0, 51.0, 45.0, 44.0, 31.0, 30.0, 23.0, 18.0, 12.0, 7.0, 8.0, 6.0, 9.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.015472412109375, -20.329940795898438, -19.644407272338867, -18.958873748779297, -18.27334213256836, -17.587810516357422, -16.90227699279785, -16.21674346923828, -15.531211853027344, -14.84567928314209, -14.160146713256836, -13.474614143371582, -12.789081573486328, -12.103549003601074, -11.41801643371582, -10.732483863830566, -10.046951293945312, -9.361418724060059, -8.675886154174805, -7.990353584289551, -7.304821014404297, -6.619288444519043, -5.933755874633789, -5.248223304748535, -4.562690734863281, -3.8771581649780273, -3.1916255950927734, -2.5060930252075195, -1.8205604553222656, -1.1350278854370117, -0.4494953155517578, 0.2360372543334961, 0.92156982421875, 1.607102394104004, 2.292634963989258, 2.9781675338745117, 3.6637001037597656, 4.3492326736450195, 5.034765243530273, 5.720297813415527, 6.405830383300781, 7.091362953186035, 7.776895523071289, 8.462428092956543, 9.147960662841797, 9.83349323272705, 10.519025802612305, 11.204558372497559, 11.890090942382812, 12.575623512268066, 13.26115608215332, 13.946688652038574, 14.632221221923828, 15.317753791809082, 16.003286361694336, 16.688819885253906, 17.374351501464844, 18.05988311767578, 18.74541664123535, 19.430950164794922, 20.11648178100586, 20.802013397216797, 21.487546920776367, 22.173080444335938, 22.858612060546875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 11.0, 17.0, 21.0, 23.0, 18.0, 30.0, 30.0, 17.0, 25.0, 37.0, 39.0, 41.0, 33.0, 36.0, 43.0, 37.0, 41.0, 36.0, 44.0, 40.0, 34.0, 26.0, 34.0, 31.0, 24.0, 25.0, 25.0, 18.0, 16.0, 14.0, 15.0, 13.0, 17.0, 5.0, 8.0, 7.0, 3.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-10.551229476928711, -10.25379467010498, -9.956360816955566, -9.658926010131836, -9.361491203308105, -9.064057350158691, -8.766622543334961, -8.469188690185547, -8.171753883361816, -7.874319553375244, -7.576884746551514, -7.279450416564941, -6.982016086578369, -6.684581756591797, -6.387146949768066, -6.089712619781494, -5.792277812957764, -5.494843482971191, -5.197408676147461, -4.899974346160889, -4.602540016174316, -4.305105209350586, -4.007670879364014, -3.7102365493774414, -3.41280198097229, -3.1153674125671387, -2.8179330825805664, -2.520498514175415, -2.2230639457702637, -1.9256296157836914, -1.62819504737854, -1.3307607173919678, -1.0333261489868164, -0.7358916997909546, -0.438457190990448, -0.1410226821899414, 0.1564117670059204, 0.4538462162017822, 0.7512807846069336, 1.0487151145935059, 1.3461496829986572, 1.643584132194519, 1.9410185813903809, 2.2384531497955322, 2.5358877182006836, 2.833322048187256, 3.1307566165924072, 3.4281909465789795, 3.725625514984131, 4.023059844970703, 4.320494651794434, 4.617928981781006, 4.915363311767578, 5.212798118591309, 5.510232448577881, 5.807666778564453, 6.105101585388184, 6.402535915374756, 6.699970722198486, 6.997405052185059, 7.294839382171631, 7.592273712158203, 7.889708518981934, 8.187143325805664, 8.484577178955078]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 10.0, 15.0, 22.0, 31.0, 47.0, 60.0, 84.0, 137.0, 221.0, 340.0, 558.0, 964.0, 1584.0, 3008.0, 5452.0, 10598.0, 22913.0, 50169.0, 118510.0, 298956.0, 761194.0, 1316778.0, 942052.0, 390717.0, 152590.0, 62293.0, 27534.0, 12859.0, 6501.0, 3307.0, 1939.0, 1072.0, 631.0, 393.0, 250.0, 140.0, 126.0, 60.0, 50.0, 31.0, 22.0, 17.0, 13.0, 10.0, 3.0, 3.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-19.90625, -19.18603515625, -18.4658203125, -17.74560546875, -17.025390625, -16.30517578125, -15.5849609375, -14.86474609375, -14.14453125, -13.42431640625, -12.7041015625, -11.98388671875, -11.263671875, -10.54345703125, -9.8232421875, -9.10302734375, -8.3828125, -7.66259765625, -6.9423828125, -6.22216796875, -5.501953125, -4.78173828125, -4.0615234375, -3.34130859375, -2.62109375, -1.90087890625, -1.1806640625, -0.46044921875, 0.259765625, 0.97998046875, 1.7001953125, 2.42041015625, 3.140625, 3.86083984375, 4.5810546875, 5.30126953125, 6.021484375, 6.74169921875, 7.4619140625, 8.18212890625, 8.90234375, 9.62255859375, 10.3427734375, 11.06298828125, 11.783203125, 12.50341796875, 13.2236328125, 13.94384765625, 14.6640625, 15.38427734375, 16.1044921875, 16.82470703125, 17.544921875, 18.26513671875, 18.9853515625, 19.70556640625, 20.42578125, 21.14599609375, 21.8662109375, 22.58642578125, 23.306640625, 24.02685546875, 24.7470703125, 25.46728515625, 26.1875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 8.0, 6.0, 5.0, 11.0, 12.0, 26.0, 16.0, 30.0, 29.0, 37.0, 38.0, 41.0, 55.0, 56.0, 49.0, 54.0, 58.0, 58.0, 63.0, 61.0, 43.0, 34.0, 44.0, 34.0, 25.0, 22.0, 31.0, 18.0, 10.0, 9.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.399169921875, -9.04052734375, -8.681884765625, -8.3232421875, -7.964599609375, -7.60595703125, -7.247314453125, -6.888671875, -6.530029296875, -6.17138671875, -5.812744140625, -5.4541015625, -5.095458984375, -4.73681640625, -4.378173828125, -4.01953125, -3.660888671875, -3.30224609375, -2.943603515625, -2.5849609375, -2.226318359375, -1.86767578125, -1.509033203125, -1.150390625, -0.791748046875, -0.43310546875, -0.074462890625, 0.2841796875, 0.642822265625, 1.00146484375, 1.360107421875, 1.71875, 2.077392578125, 2.43603515625, 2.794677734375, 3.1533203125, 3.511962890625, 3.87060546875, 4.229248046875, 4.587890625, 4.946533203125, 5.30517578125, 5.663818359375, 6.0224609375, 6.381103515625, 6.73974609375, 7.098388671875, 7.45703125, 7.815673828125, 8.17431640625, 8.532958984375, 8.8916015625, 9.250244140625, 9.60888671875, 9.967529296875, 10.326171875, 10.684814453125, 11.04345703125, 11.402099609375, 11.7607421875, 12.119384765625, 12.47802734375, 12.836669921875, 13.1953125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 11.0, 20.0, 21.0, 36.0, 79.0, 98.0, 160.0, 259.0, 435.0, 809.0, 1465.0, 2569.0, 4827.0, 9538.0, 19315.0, 42011.0, 93380.0, 215331.0, 485968.0, 952529.0, 1123965.0, 678551.0, 311800.0, 136639.0, 59593.0, 27360.0, 13170.0, 6606.0, 3385.0, 1905.0, 948.0, 639.0, 321.0, 204.0, 128.0, 77.0, 49.0, 33.0, 25.0, 8.0, 6.0, 6.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.625, -25.869140625, -25.11328125, -24.357421875, -23.6015625, -22.845703125, -22.08984375, -21.333984375, -20.578125, -19.822265625, -19.06640625, -18.310546875, -17.5546875, -16.798828125, -16.04296875, -15.287109375, -14.53125, -13.775390625, -13.01953125, -12.263671875, -11.5078125, -10.751953125, -9.99609375, -9.240234375, -8.484375, -7.728515625, -6.97265625, -6.216796875, -5.4609375, -4.705078125, -3.94921875, -3.193359375, -2.4375, -1.681640625, -0.92578125, -0.169921875, 0.5859375, 1.341796875, 2.09765625, 2.853515625, 3.609375, 4.365234375, 5.12109375, 5.876953125, 6.6328125, 7.388671875, 8.14453125, 8.900390625, 9.65625, 10.412109375, 11.16796875, 11.923828125, 12.6796875, 13.435546875, 14.19140625, 14.947265625, 15.703125, 16.458984375, 17.21484375, 17.970703125, 18.7265625, 19.482421875, 20.23828125, 20.994140625, 21.75]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 14.0, 20.0, 15.0, 28.0, 39.0, 60.0, 70.0, 112.0, 146.0, 182.0, 246.0, 273.0, 278.0, 326.0, 312.0, 364.0, 308.0, 283.0, 212.0, 180.0, 159.0, 121.0, 80.0, 58.0, 49.0, 48.0, 25.0, 10.0, 12.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.38525390625, -8.1611328125, -7.93701171875, -7.712890625, -7.48876953125, -7.2646484375, -7.04052734375, -6.81640625, -6.59228515625, -6.3681640625, -6.14404296875, -5.919921875, -5.69580078125, -5.4716796875, -5.24755859375, -5.0234375, -4.79931640625, -4.5751953125, -4.35107421875, -4.126953125, -3.90283203125, -3.6787109375, -3.45458984375, -3.23046875, -3.00634765625, -2.7822265625, -2.55810546875, -2.333984375, -2.10986328125, -1.8857421875, -1.66162109375, -1.4375, -1.21337890625, -0.9892578125, -0.76513671875, -0.541015625, -0.31689453125, -0.0927734375, 0.13134765625, 0.35546875, 0.57958984375, 0.8037109375, 1.02783203125, 1.251953125, 1.47607421875, 1.7001953125, 1.92431640625, 2.1484375, 2.37255859375, 2.5966796875, 2.82080078125, 3.044921875, 3.26904296875, 3.4931640625, 3.71728515625, 3.94140625, 4.16552734375, 4.3896484375, 4.61376953125, 4.837890625, 5.06201171875, 5.2861328125, 5.51025390625, 5.734375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 14.0, 13.0, 14.0, 18.0, 29.0, 38.0, 46.0, 52.0, 75.0, 66.0, 73.0, 90.0, 73.0, 77.0, 63.0, 62.0, 33.0, 45.0, 23.0, 22.0, 16.0, 16.0, 6.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.674388885498047, -23.811080932617188, -22.947772979736328, -22.08446502685547, -21.22115707397461, -20.35784912109375, -19.494543075561523, -18.631235122680664, -17.767927169799805, -16.904619216918945, -16.041311264038086, -15.178004264831543, -14.314696311950684, -13.451388359069824, -12.588081359863281, -11.724773406982422, -10.861465454101562, -9.998157501220703, -9.134849548339844, -8.2715425491333, -7.408234596252441, -6.544926643371582, -5.681619167327881, -4.81831169128418, -3.9550037384033203, -3.09169602394104, -2.2283883094787598, -1.3650805950164795, -0.5017728805541992, 0.36153507232666016, 1.2248425483703613, 2.0881500244140625, 2.951457977294922, 3.814765691757202, 4.678073406219482, 5.541380882263184, 6.404688835144043, 7.267996788024902, 8.131303787231445, 8.994611740112305, 9.857919692993164, 10.721227645874023, 11.584535598754883, 12.447842597961426, 13.311150550842285, 14.174458503723145, 15.037765502929688, 15.901073455810547, 16.764381408691406, 17.627689361572266, 18.490997314453125, 19.354305267333984, 20.217613220214844, 21.080921173095703, 21.94422721862793, 22.80753517150879, 23.67084312438965, 24.534151077270508, 25.397459030151367, 26.260766983032227, 27.124073028564453, 27.987380981445312, 28.850688934326172, 29.71399688720703, 30.57730484008789]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 6.0, 3.0, 8.0, 5.0, 12.0, 5.0, 8.0, 14.0, 22.0, 18.0, 12.0, 11.0, 30.0, 30.0, 30.0, 29.0, 33.0, 31.0, 36.0, 40.0, 40.0, 43.0, 43.0, 37.0, 41.0, 40.0, 33.0, 33.0, 38.0, 18.0, 37.0, 22.0, 22.0, 22.0, 21.0, 18.0, 17.0, 12.0, 11.0, 15.0, 15.0, 7.0, 10.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.755313873291016, -10.445636749267578, -10.13595962524414, -9.826282501220703, -9.516605377197266, -9.206928253173828, -8.89725112915039, -8.587574005126953, -8.277896881103516, -7.968219757080078, -7.658542633056641, -7.348865509033203, -7.039188385009766, -6.729511260986328, -6.419834613800049, -6.110157489776611, -5.800480842590332, -5.4908037185668945, -5.181126594543457, -4.8714494705200195, -4.561772346496582, -4.2520952224731445, -3.9424185752868652, -3.6327414512634277, -3.3230643272399902, -3.0133872032165527, -2.7037100791931152, -2.394033193588257, -2.0843560695648193, -1.7746789455413818, -1.4650019407272339, -1.155324935913086, -0.8456487655639648, -0.5359717011451721, -0.2262946367263794, 0.08338242769241333, 0.39305949211120605, 0.7027366161346436, 1.0124136209487915, 1.3220906257629395, 1.631767749786377, 1.9414448738098145, 2.251121997833252, 2.5607988834381104, 2.870476007461548, 3.1801531314849854, 3.4898300170898438, 3.7995071411132812, 4.109184265136719, 4.418861389160156, 4.728538513183594, 5.038215637207031, 5.347892761230469, 5.657569885253906, 5.9672465324401855, 6.276923656463623, 6.5866007804870605, 6.896277904510498, 7.2059550285339355, 7.515632152557373, 7.825308799743652, 8.13498592376709, 8.444663047790527, 8.754340171813965, 9.064017295837402]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 9.0, 6.0, 8.0, 9.0, 11.0, 18.0, 27.0, 47.0, 70.0, 88.0, 118.0, 247.0, 319.0, 512.0, 858.0, 1682.0, 2787.0, 5615.0, 11143.0, 23089.0, 48031.0, 96707.0, 170518.0, 228127.0, 201876.0, 127258.0, 65861.0, 31815.0, 15205.0, 7600.0, 3853.0, 2070.0, 1155.0, 673.0, 388.0, 230.0, 154.0, 101.0, 81.0, 49.0, 46.0, 36.0, 18.0, 17.0, 10.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7265625, -12.312255859375, -11.89794921875, -11.483642578125, -11.0693359375, -10.655029296875, -10.24072265625, -9.826416015625, -9.412109375, -8.997802734375, -8.58349609375, -8.169189453125, -7.7548828125, -7.340576171875, -6.92626953125, -6.511962890625, -6.09765625, -5.683349609375, -5.26904296875, -4.854736328125, -4.4404296875, -4.026123046875, -3.61181640625, -3.197509765625, -2.783203125, -2.368896484375, -1.95458984375, -1.540283203125, -1.1259765625, -0.711669921875, -0.29736328125, 0.116943359375, 0.53125, 0.945556640625, 1.35986328125, 1.774169921875, 2.1884765625, 2.602783203125, 3.01708984375, 3.431396484375, 3.845703125, 4.260009765625, 4.67431640625, 5.088623046875, 5.5029296875, 5.917236328125, 6.33154296875, 6.745849609375, 7.16015625, 7.574462890625, 7.98876953125, 8.403076171875, 8.8173828125, 9.231689453125, 9.64599609375, 10.060302734375, 10.474609375, 10.888916015625, 11.30322265625, 11.717529296875, 12.1318359375, 12.546142578125, 12.96044921875, 13.374755859375, 13.7890625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 10.0, 8.0, 12.0, 10.0, 21.0, 16.0, 13.0, 22.0, 26.0, 37.0, 29.0, 35.0, 41.0, 37.0, 38.0, 32.0, 50.0, 52.0, 48.0, 48.0, 37.0, 41.0, 43.0, 42.0, 30.0, 31.0, 21.0, 21.0, 23.0, 23.0, 18.0, 17.0, 15.0, 9.0, 4.0, 8.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.796875, -12.4193115234375, -12.041748046875, -11.6641845703125, -11.28662109375, -10.9090576171875, -10.531494140625, -10.1539306640625, -9.7763671875, -9.3988037109375, -9.021240234375, -8.6436767578125, -8.26611328125, -7.8885498046875, -7.510986328125, -7.1334228515625, -6.755859375, -6.3782958984375, -6.000732421875, -5.6231689453125, -5.24560546875, -4.8680419921875, -4.490478515625, -4.1129150390625, -3.7353515625, -3.3577880859375, -2.980224609375, -2.6026611328125, -2.22509765625, -1.8475341796875, -1.469970703125, -1.0924072265625, -0.71484375, -0.3372802734375, 0.040283203125, 0.4178466796875, 0.79541015625, 1.1729736328125, 1.550537109375, 1.9281005859375, 2.3056640625, 2.6832275390625, 3.060791015625, 3.4383544921875, 3.81591796875, 4.1934814453125, 4.571044921875, 4.9486083984375, 5.326171875, 5.7037353515625, 6.081298828125, 6.4588623046875, 6.83642578125, 7.2139892578125, 7.591552734375, 7.9691162109375, 8.3466796875, 8.7242431640625, 9.101806640625, 9.4793701171875, 9.85693359375, 10.2344970703125, 10.612060546875, 10.9896240234375, 11.3671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 10.0, 14.0, 11.0, 16.0, 27.0, 45.0, 75.0, 119.0, 224.0, 342.0, 631.0, 1079.0, 1912.0, 3746.0, 7298.0, 15415.0, 33274.0, 72425.0, 150772.0, 256561.0, 243005.0, 137768.0, 65079.0, 30360.0, 13942.0, 6786.0, 3515.0, 1741.0, 970.0, 544.0, 312.0, 201.0, 132.0, 66.0, 41.0, 37.0, 23.0, 12.0, 8.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.359375, -15.862548828125, -15.36572265625, -14.868896484375, -14.3720703125, -13.875244140625, -13.37841796875, -12.881591796875, -12.384765625, -11.887939453125, -11.39111328125, -10.894287109375, -10.3974609375, -9.900634765625, -9.40380859375, -8.906982421875, -8.41015625, -7.913330078125, -7.41650390625, -6.919677734375, -6.4228515625, -5.926025390625, -5.42919921875, -4.932373046875, -4.435546875, -3.938720703125, -3.44189453125, -2.945068359375, -2.4482421875, -1.951416015625, -1.45458984375, -0.957763671875, -0.4609375, 0.035888671875, 0.53271484375, 1.029541015625, 1.5263671875, 2.023193359375, 2.52001953125, 3.016845703125, 3.513671875, 4.010498046875, 4.50732421875, 5.004150390625, 5.5009765625, 5.997802734375, 6.49462890625, 6.991455078125, 7.48828125, 7.985107421875, 8.48193359375, 8.978759765625, 9.4755859375, 9.972412109375, 10.46923828125, 10.966064453125, 11.462890625, 11.959716796875, 12.45654296875, 12.953369140625, 13.4501953125, 13.947021484375, 14.44384765625, 14.940673828125, 15.4375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 19.0, 8.0, 13.0, 13.0, 14.0, 19.0, 15.0, 28.0, 28.0, 20.0, 30.0, 39.0, 34.0, 41.0, 41.0, 38.0, 38.0, 35.0, 44.0, 39.0, 44.0, 41.0, 33.0, 36.0, 35.0, 35.0, 27.0, 23.0, 19.0, 21.0, 15.0, 19.0, 13.0, 18.0, 11.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6953125, -5.4979248046875, -5.300537109375, -5.1031494140625, -4.90576171875, -4.7083740234375, -4.510986328125, -4.3135986328125, -4.1162109375, -3.9188232421875, -3.721435546875, -3.5240478515625, -3.32666015625, -3.1292724609375, -2.931884765625, -2.7344970703125, -2.537109375, -2.3397216796875, -2.142333984375, -1.9449462890625, -1.74755859375, -1.5501708984375, -1.352783203125, -1.1553955078125, -0.9580078125, -0.7606201171875, -0.563232421875, -0.3658447265625, -0.16845703125, 0.0289306640625, 0.226318359375, 0.4237060546875, 0.62109375, 0.8184814453125, 1.015869140625, 1.2132568359375, 1.41064453125, 1.6080322265625, 1.805419921875, 2.0028076171875, 2.2001953125, 2.3975830078125, 2.594970703125, 2.7923583984375, 2.98974609375, 3.1871337890625, 3.384521484375, 3.5819091796875, 3.779296875, 3.9766845703125, 4.174072265625, 4.3714599609375, 4.56884765625, 4.7662353515625, 4.963623046875, 5.1610107421875, 5.3583984375, 5.5557861328125, 5.753173828125, 5.9505615234375, 6.14794921875, 6.3453369140625, 6.542724609375, 6.7401123046875, 6.9375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 13.0, 18.0, 27.0, 41.0, 61.0, 91.0, 121.0, 193.0, 263.0, 369.0, 596.0, 832.0, 1158.0, 1761.0, 2609.0, 3890.0, 5881.0, 9023.0, 13436.0, 20784.0, 32354.0, 50246.0, 77524.0, 115310.0, 155103.0, 164577.0, 131786.0, 90966.0, 59402.0, 38364.0, 24656.0, 15910.0, 10437.0, 6907.0, 4517.0, 3028.0, 2004.0, 1347.0, 938.0, 627.0, 411.0, 283.0, 205.0, 148.0, 95.0, 83.0, 59.0, 31.0, 14.0, 16.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-4.796875, -4.64788818359375, -4.4989013671875, -4.34991455078125, -4.200927734375, -4.05194091796875, -3.9029541015625, -3.75396728515625, -3.60498046875, -3.45599365234375, -3.3070068359375, -3.15802001953125, -3.009033203125, -2.86004638671875, -2.7110595703125, -2.56207275390625, -2.4130859375, -2.26409912109375, -2.1151123046875, -1.96612548828125, -1.817138671875, -1.66815185546875, -1.5191650390625, -1.37017822265625, -1.22119140625, -1.07220458984375, -0.9232177734375, -0.77423095703125, -0.625244140625, -0.47625732421875, -0.3272705078125, -0.17828369140625, -0.029296875, 0.11968994140625, 0.2686767578125, 0.41766357421875, 0.566650390625, 0.71563720703125, 0.8646240234375, 1.01361083984375, 1.16259765625, 1.31158447265625, 1.4605712890625, 1.60955810546875, 1.758544921875, 1.90753173828125, 2.0565185546875, 2.20550537109375, 2.3544921875, 2.50347900390625, 2.6524658203125, 2.80145263671875, 2.950439453125, 3.09942626953125, 3.2484130859375, 3.39739990234375, 3.54638671875, 3.69537353515625, 3.8443603515625, 3.99334716796875, 4.142333984375, 4.29132080078125, 4.4403076171875, 4.58929443359375, 4.73828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 10.0, 10.0, 9.0, 20.0, 26.0, 24.0, 28.0, 24.0, 42.0, 52.0, 61.0, 65.0, 57.0, 62.0, 51.0, 55.0, 71.0, 52.0, 53.0, 41.0, 39.0, 23.0, 19.0, 17.0, 14.0, 16.0, 9.0, 9.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00033473968505859375, -0.00032487884163856506, -0.0003150179982185364, -0.0003051571547985077, -0.000295296311378479, -0.0002854354679584503, -0.00027557462453842163, -0.00026571378111839294, -0.00025585293769836426, -0.00024599209427833557, -0.00023613125085830688, -0.0002262704074382782, -0.0002164095640182495, -0.00020654872059822083, -0.00019668787717819214, -0.00018682703375816345, -0.00017696619033813477, -0.00016710534691810608, -0.0001572445034980774, -0.0001473836600780487, -0.00013752281665802002, -0.00012766197323799133, -0.00011780112981796265, -0.00010794028639793396, -9.807944297790527e-05, -8.821859955787659e-05, -7.83577561378479e-05, -6.849691271781921e-05, -5.863606929779053e-05, -4.877522587776184e-05, -3.8914382457733154e-05, -2.9053539037704468e-05, -1.919269561767578e-05, -9.331852197647095e-06, 5.289912223815918e-07, 1.0389834642410278e-05, 2.0250678062438965e-05, 3.011152148246765e-05, 3.997236490249634e-05, 4.9833208322525024e-05, 5.969405174255371e-05, 6.95548951625824e-05, 7.941573858261108e-05, 8.927658200263977e-05, 9.913742542266846e-05, 0.00010899826884269714, 0.00011885911226272583, 0.00012871995568275452, 0.0001385807991027832, 0.0001484416425228119, 0.00015830248594284058, 0.00016816332936286926, 0.00017802417278289795, 0.00018788501620292664, 0.00019774585962295532, 0.000207606703042984, 0.0002174675464630127, 0.00022732838988304138, 0.00023718923330307007, 0.00024705007672309875, 0.00025691092014312744, 0.00026677176356315613, 0.0002766326069831848, 0.0002864934504032135, 0.0002963542938232422]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 26.0, 37.0, 48.0, 70.0, 94.0, 124.0, 228.0, 321.0, 447.0, 752.0, 1101.0, 1756.0, 2736.0, 4284.0, 6593.0, 10535.0, 16142.0, 25430.0, 38980.0, 59299.0, 85086.0, 114902.0, 135758.0, 138299.0, 121389.0, 93390.0, 66255.0, 44093.0, 28831.0, 18630.0, 11784.0, 7607.0, 4683.0, 3090.0, 1965.0, 1259.0, 878.0, 517.0, 351.0, 287.0, 157.0, 103.0, 78.0, 50.0, 31.0, 27.0, 15.0, 10.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.4296875, -4.2918701171875, -4.154052734375, -4.0162353515625, -3.87841796875, -3.7406005859375, -3.602783203125, -3.4649658203125, -3.3271484375, -3.1893310546875, -3.051513671875, -2.9136962890625, -2.77587890625, -2.6380615234375, -2.500244140625, -2.3624267578125, -2.224609375, -2.0867919921875, -1.948974609375, -1.8111572265625, -1.67333984375, -1.5355224609375, -1.397705078125, -1.2598876953125, -1.1220703125, -0.9842529296875, -0.846435546875, -0.7086181640625, -0.57080078125, -0.4329833984375, -0.295166015625, -0.1573486328125, -0.01953125, 0.1182861328125, 0.256103515625, 0.3939208984375, 0.53173828125, 0.6695556640625, 0.807373046875, 0.9451904296875, 1.0830078125, 1.2208251953125, 1.358642578125, 1.4964599609375, 1.63427734375, 1.7720947265625, 1.909912109375, 2.0477294921875, 2.185546875, 2.3233642578125, 2.461181640625, 2.5989990234375, 2.73681640625, 2.8746337890625, 3.012451171875, 3.1502685546875, 3.2880859375, 3.4259033203125, 3.563720703125, 3.7015380859375, 3.83935546875, 3.9771728515625, 4.114990234375, 4.2528076171875, 4.390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 7.0, 10.0, 6.0, 12.0, 22.0, 22.0, 22.0, 29.0, 36.0, 32.0, 35.0, 49.0, 41.0, 50.0, 43.0, 59.0, 59.0, 53.0, 61.0, 51.0, 29.0, 43.0, 40.0, 33.0, 33.0, 19.0, 18.0, 17.0, 13.0, 6.0, 11.0, 8.0, 11.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.5604705810546875, -1.511566162109375, -1.4626617431640625, -1.41375732421875, -1.3648529052734375, -1.315948486328125, -1.2670440673828125, -1.2181396484375, -1.1692352294921875, -1.120330810546875, -1.0714263916015625, -1.02252197265625, -0.9736175537109375, -0.924713134765625, -0.8758087158203125, -0.826904296875, -0.7779998779296875, -0.729095458984375, -0.6801910400390625, -0.63128662109375, -0.5823822021484375, -0.533477783203125, -0.4845733642578125, -0.4356689453125, -0.3867645263671875, -0.337860107421875, -0.2889556884765625, -0.24005126953125, -0.1911468505859375, -0.142242431640625, -0.0933380126953125, -0.04443359375, 0.0044708251953125, 0.053375244140625, 0.1022796630859375, 0.15118408203125, 0.2000885009765625, 0.248992919921875, 0.2978973388671875, 0.3468017578125, 0.3957061767578125, 0.444610595703125, 0.4935150146484375, 0.54241943359375, 0.5913238525390625, 0.640228271484375, 0.6891326904296875, 0.738037109375, 0.7869415283203125, 0.835845947265625, 0.8847503662109375, 0.93365478515625, 0.9825592041015625, 1.031463623046875, 1.0803680419921875, 1.1292724609375, 1.1781768798828125, 1.227081298828125, 1.2759857177734375, 1.32489013671875, 1.3737945556640625, 1.422698974609375, 1.4716033935546875, 1.5205078125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 17.0, 14.0, 11.0, 14.0, 26.0, 35.0, 38.0, 57.0, 68.0, 66.0, 85.0, 80.0, 68.0, 74.0, 76.0, 61.0, 42.0, 36.0, 27.0, 29.0, 14.0, 20.0, 9.0, 6.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.879331588745117, -22.02912139892578, -21.178913116455078, -20.328702926635742, -19.478492736816406, -18.628284454345703, -17.778074264526367, -16.92786407470703, -16.077655792236328, -15.227446556091309, -14.377236366271973, -13.527027130126953, -12.676817893981934, -11.826608657836914, -10.976398468017578, -10.126189231872559, -9.275979042053223, -8.425769805908203, -7.575560092926025, -6.725350379943848, -5.875141143798828, -5.02493143081665, -4.174721717834473, -3.324512481689453, -2.4743027687072754, -1.6240932941436768, -0.7738837003707886, 0.07632589340209961, 0.9265353679656982, 1.7767448425292969, 2.6269545555114746, 3.477163791656494, 4.327373504638672, 5.17758321762085, 6.027792453765869, 6.878002166748047, 7.728211402893066, 8.578420639038086, 9.428630828857422, 10.278840065002441, 11.129049301147461, 11.97925853729248, 12.829468727111816, 13.679677963256836, 14.529887199401855, 15.380096435546875, 16.23030662536621, 17.080516815185547, 17.93072509765625, 18.780935287475586, 19.63114356994629, 20.481353759765625, 21.33156394958496, 22.181772232055664, 23.031982421875, 23.882190704345703, 24.732402801513672, 25.582612991333008, 26.43282127380371, 27.283031463623047, 28.133241653442383, 28.983449935913086, 29.833660125732422, 30.683868408203125, 31.53407859802246]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 2.0, 8.0, 7.0, 3.0, 7.0, 10.0, 12.0, 16.0, 22.0, 15.0, 10.0, 24.0, 21.0, 26.0, 29.0, 33.0, 40.0, 33.0, 33.0, 39.0, 42.0, 37.0, 38.0, 37.0, 47.0, 36.0, 36.0, 32.0, 24.0, 27.0, 31.0, 22.0, 24.0, 24.0, 18.0, 18.0, 18.0, 10.0, 20.0, 8.0, 15.0, 10.0, 5.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-10.28503704071045, -9.988395690917969, -9.691754341125488, -9.395112991333008, -9.098471641540527, -8.801830291748047, -8.505188941955566, -8.208547592163086, -7.911906719207764, -7.615265369415283, -7.318624019622803, -7.021982669830322, -6.725341796875, -6.4287004470825195, -6.132059097290039, -5.835417747497559, -5.538776397705078, -5.242135047912598, -4.945493698120117, -4.648852348327637, -4.352210998535156, -4.055569648742676, -3.7589287757873535, -3.462287425994873, -3.1656460762023926, -2.869004726409912, -2.5723633766174316, -2.2757222652435303, -1.9790809154510498, -1.6824395656585693, -1.3857983350753784, -1.0891571044921875, -0.7925148010253906, -0.49587351083755493, -0.19923222064971924, 0.09740906953811646, 0.39405035972595215, 0.6906917095184326, 0.9873329401016235, 1.2839741706848145, 1.580615520477295, 1.8772568702697754, 2.173898220062256, 2.4705393314361572, 2.7671806812286377, 3.063822031021118, 3.3604631423950195, 3.6571044921875, 3.9537458419799805, 4.250387191772461, 4.547028541564941, 4.843669891357422, 5.140311241149902, 5.436952590942383, 5.733593463897705, 6.0302348136901855, 6.326876163482666, 6.6235175132751465, 6.920158863067627, 7.216800212860107, 7.51344108581543, 7.81008243560791, 8.10672378540039, 8.403365135192871, 8.700006484985352]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 9.0, 15.0, 12.0, 26.0, 34.0, 33.0, 41.0, 81.0, 131.0, 166.0, 236.0, 348.0, 525.0, 904.0, 1701.0, 3280.0, 6861.0, 15148.0, 34465.0, 75735.0, 150797.0, 231406.0, 232204.0, 152055.0, 77147.0, 35027.0, 15627.0, 6860.0, 3429.0, 1682.0, 932.0, 539.0, 354.0, 221.0, 158.0, 105.0, 68.0, 43.0, 36.0, 31.0, 19.0, 11.0, 17.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-24.234375, -23.477294921875, -22.72021484375, -21.963134765625, -21.2060546875, -20.448974609375, -19.69189453125, -18.934814453125, -18.177734375, -17.420654296875, -16.66357421875, -15.906494140625, -15.1494140625, -14.392333984375, -13.63525390625, -12.878173828125, -12.12109375, -11.364013671875, -10.60693359375, -9.849853515625, -9.0927734375, -8.335693359375, -7.57861328125, -6.821533203125, -6.064453125, -5.307373046875, -4.55029296875, -3.793212890625, -3.0361328125, -2.279052734375, -1.52197265625, -0.764892578125, -0.0078125, 0.749267578125, 1.50634765625, 2.263427734375, 3.0205078125, 3.777587890625, 4.53466796875, 5.291748046875, 6.048828125, 6.805908203125, 7.56298828125, 8.320068359375, 9.0771484375, 9.834228515625, 10.59130859375, 11.348388671875, 12.10546875, 12.862548828125, 13.61962890625, 14.376708984375, 15.1337890625, 15.890869140625, 16.64794921875, 17.405029296875, 18.162109375, 18.919189453125, 19.67626953125, 20.433349609375, 21.1904296875, 21.947509765625, 22.70458984375, 23.461669921875, 24.21875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 11.0, 6.0, 9.0, 17.0, 16.0, 27.0, 30.0, 22.0, 29.0, 45.0, 34.0, 44.0, 45.0, 35.0, 41.0, 36.0, 43.0, 49.0, 42.0, 39.0, 40.0, 39.0, 26.0, 28.0, 31.0, 18.0, 28.0, 21.0, 20.0, 20.0, 13.0, 17.0, 13.0, 8.0, 7.0, 12.0, 3.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.296875, -11.950927734375, -11.60498046875, -11.259033203125, -10.9130859375, -10.567138671875, -10.22119140625, -9.875244140625, -9.529296875, -9.183349609375, -8.83740234375, -8.491455078125, -8.1455078125, -7.799560546875, -7.45361328125, -7.107666015625, -6.76171875, -6.415771484375, -6.06982421875, -5.723876953125, -5.3779296875, -5.031982421875, -4.68603515625, -4.340087890625, -3.994140625, -3.648193359375, -3.30224609375, -2.956298828125, -2.6103515625, -2.264404296875, -1.91845703125, -1.572509765625, -1.2265625, -0.880615234375, -0.53466796875, -0.188720703125, 0.1572265625, 0.503173828125, 0.84912109375, 1.195068359375, 1.541015625, 1.886962890625, 2.23291015625, 2.578857421875, 2.9248046875, 3.270751953125, 3.61669921875, 3.962646484375, 4.30859375, 4.654541015625, 5.00048828125, 5.346435546875, 5.6923828125, 6.038330078125, 6.38427734375, 6.730224609375, 7.076171875, 7.422119140625, 7.76806640625, 8.114013671875, 8.4599609375, 8.805908203125, 9.15185546875, 9.497802734375, 9.84375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 11.0, 10.0, 20.0, 38.0, 57.0, 77.0, 126.0, 165.0, 234.0, 432.0, 598.0, 958.0, 1528.0, 2402.0, 3898.0, 6609.0, 10872.0, 18862.0, 31501.0, 50961.0, 79491.0, 114062.0, 143272.0, 154409.0, 137340.0, 104526.0, 71617.0, 45212.0, 27703.0, 16384.0, 9840.0, 5827.0, 3590.0, 2107.0, 1364.0, 831.0, 533.0, 358.0, 261.0, 163.0, 88.0, 73.0, 53.0, 29.0, 17.0, 18.0, 10.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.9825439453125, -14.519775390625, -14.0570068359375, -13.59423828125, -13.1314697265625, -12.668701171875, -12.2059326171875, -11.7431640625, -11.2803955078125, -10.817626953125, -10.3548583984375, -9.89208984375, -9.4293212890625, -8.966552734375, -8.5037841796875, -8.041015625, -7.5782470703125, -7.115478515625, -6.6527099609375, -6.18994140625, -5.7271728515625, -5.264404296875, -4.8016357421875, -4.3388671875, -3.8760986328125, -3.413330078125, -2.9505615234375, -2.48779296875, -2.0250244140625, -1.562255859375, -1.0994873046875, -0.63671875, -0.1739501953125, 0.288818359375, 0.7515869140625, 1.21435546875, 1.6771240234375, 2.139892578125, 2.6026611328125, 3.0654296875, 3.5281982421875, 3.990966796875, 4.4537353515625, 4.91650390625, 5.3792724609375, 5.842041015625, 6.3048095703125, 6.767578125, 7.2303466796875, 7.693115234375, 8.1558837890625, 8.61865234375, 9.0814208984375, 9.544189453125, 10.0069580078125, 10.4697265625, 10.9324951171875, 11.395263671875, 11.8580322265625, 12.32080078125, 12.7835693359375, 13.246337890625, 13.7091064453125, 14.171875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 7.0, 15.0, 11.0, 4.0, 15.0, 17.0, 18.0, 22.0, 25.0, 26.0, 18.0, 40.0, 31.0, 30.0, 30.0, 31.0, 32.0, 44.0, 41.0, 33.0, 29.0, 53.0, 35.0, 40.0, 27.0, 39.0, 43.0, 33.0, 33.0, 23.0, 27.0, 24.0, 19.0, 7.0, 12.0, 11.0, 7.0, 6.0, 13.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.41015625, -6.21337890625, -6.0166015625, -5.81982421875, -5.623046875, -5.42626953125, -5.2294921875, -5.03271484375, -4.8359375, -4.63916015625, -4.4423828125, -4.24560546875, -4.048828125, -3.85205078125, -3.6552734375, -3.45849609375, -3.26171875, -3.06494140625, -2.8681640625, -2.67138671875, -2.474609375, -2.27783203125, -2.0810546875, -1.88427734375, -1.6875, -1.49072265625, -1.2939453125, -1.09716796875, -0.900390625, -0.70361328125, -0.5068359375, -0.31005859375, -0.11328125, 0.08349609375, 0.2802734375, 0.47705078125, 0.673828125, 0.87060546875, 1.0673828125, 1.26416015625, 1.4609375, 1.65771484375, 1.8544921875, 2.05126953125, 2.248046875, 2.44482421875, 2.6416015625, 2.83837890625, 3.03515625, 3.23193359375, 3.4287109375, 3.62548828125, 3.822265625, 4.01904296875, 4.2158203125, 4.41259765625, 4.609375, 4.80615234375, 5.0029296875, 5.19970703125, 5.396484375, 5.59326171875, 5.7900390625, 5.98681640625, 6.18359375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 20.0, 28.0, 34.0, 35.0, 67.0, 91.0, 141.0, 166.0, 235.0, 313.0, 482.0, 715.0, 1040.0, 1544.0, 2416.0, 3725.0, 6363.0, 11653.0, 22204.0, 43493.0, 89521.0, 177935.0, 260854.0, 206159.0, 107882.0, 52146.0, 25618.0, 13772.0, 7535.0, 4327.0, 2605.0, 1677.0, 1171.0, 743.0, 523.0, 365.0, 310.0, 189.0, 148.0, 94.0, 57.0, 44.0, 25.0, 20.0, 14.0, 17.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8551025390625, -11.468017578125, -11.0809326171875, -10.69384765625, -10.3067626953125, -9.919677734375, -9.5325927734375, -9.1455078125, -8.7584228515625, -8.371337890625, -7.9842529296875, -7.59716796875, -7.2100830078125, -6.822998046875, -6.4359130859375, -6.048828125, -5.6617431640625, -5.274658203125, -4.8875732421875, -4.50048828125, -4.1134033203125, -3.726318359375, -3.3392333984375, -2.9521484375, -2.5650634765625, -2.177978515625, -1.7908935546875, -1.40380859375, -1.0167236328125, -0.629638671875, -0.2425537109375, 0.14453125, 0.5316162109375, 0.918701171875, 1.3057861328125, 1.69287109375, 2.0799560546875, 2.467041015625, 2.8541259765625, 3.2412109375, 3.6282958984375, 4.015380859375, 4.4024658203125, 4.78955078125, 5.1766357421875, 5.563720703125, 5.9508056640625, 6.337890625, 6.7249755859375, 7.112060546875, 7.4991455078125, 7.88623046875, 8.2733154296875, 8.660400390625, 9.0474853515625, 9.4345703125, 9.8216552734375, 10.208740234375, 10.5958251953125, 10.98291015625, 11.3699951171875, 11.757080078125, 12.1441650390625, 12.53125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 16.0, 14.0, 18.0, 22.0, 44.0, 32.0, 79.0, 83.0, 116.0, 128.0, 93.0, 89.0, 78.0, 38.0, 37.0, 17.0, 19.0, 13.0, 6.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017423629760742188, -0.001691579818725586, -0.0016407966613769531, -0.0015900135040283203, -0.0015392303466796875, -0.0014884471893310547, -0.0014376640319824219, -0.001386880874633789, -0.0013360977172851562, -0.0012853145599365234, -0.0012345314025878906, -0.0011837482452392578, -0.001132965087890625, -0.0010821819305419922, -0.0010313987731933594, -0.0009806156158447266, -0.0009298324584960938, -0.0008790493011474609, -0.0008282661437988281, -0.0007774829864501953, -0.0007266998291015625, -0.0006759166717529297, -0.0006251335144042969, -0.0005743503570556641, -0.0005235671997070312, -0.00047278404235839844, -0.0004220008850097656, -0.0003712177276611328, -0.0003204345703125, -0.0002696514129638672, -0.00021886825561523438, -0.00016808509826660156, -0.00011730194091796875, -6.651878356933594e-05, -1.5735626220703125e-05, 3.504753112792969e-05, 8.58306884765625e-05, 0.0001366138458251953, 0.00018739700317382812, 0.00023818016052246094, 0.00028896331787109375, 0.00033974647521972656, 0.0003905296325683594, 0.0004413127899169922, 0.000492095947265625, 0.0005428791046142578, 0.0005936622619628906, 0.0006444454193115234, 0.0006952285766601562, 0.0007460117340087891, 0.0007967948913574219, 0.0008475780487060547, 0.0008983612060546875, 0.0009491443634033203, 0.0009999275207519531, 0.001050710678100586, 0.0011014938354492188, 0.0011522769927978516, 0.0012030601501464844, 0.0012538433074951172, 0.00130462646484375, 0.0013554096221923828, 0.0014061927795410156, 0.0014569759368896484, 0.0015077590942382812]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 11.0, 1.0, 7.0, 12.0, 14.0, 34.0, 60.0, 48.0, 72.0, 116.0, 166.0, 235.0, 304.0, 442.0, 660.0, 972.0, 1549.0, 2572.0, 4522.0, 8827.0, 19355.0, 45028.0, 111724.0, 243822.0, 301712.0, 174452.0, 72739.0, 30012.0, 13330.0, 6479.0, 3387.0, 1984.0, 1280.0, 832.0, 528.0, 352.0, 247.0, 195.0, 131.0, 102.0, 66.0, 50.0, 38.0, 31.0, 19.0, 14.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-15.2578125, -14.8125, -14.3671875, -13.921875, -13.4765625, -13.03125, -12.5859375, -12.140625, -11.6953125, -11.25, -10.8046875, -10.359375, -9.9140625, -9.46875, -9.0234375, -8.578125, -8.1328125, -7.6875, -7.2421875, -6.796875, -6.3515625, -5.90625, -5.4609375, -5.015625, -4.5703125, -4.125, -3.6796875, -3.234375, -2.7890625, -2.34375, -1.8984375, -1.453125, -1.0078125, -0.5625, -0.1171875, 0.328125, 0.7734375, 1.21875, 1.6640625, 2.109375, 2.5546875, 3.0, 3.4453125, 3.890625, 4.3359375, 4.78125, 5.2265625, 5.671875, 6.1171875, 6.5625, 7.0078125, 7.453125, 7.8984375, 8.34375, 8.7890625, 9.234375, 9.6796875, 10.125, 10.5703125, 11.015625, 11.4609375, 11.90625, 12.3515625, 12.796875, 13.2421875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 9.0, 13.0, 6.0, 15.0, 17.0, 19.0, 24.0, 36.0, 39.0, 52.0, 48.0, 58.0, 61.0, 59.0, 57.0, 74.0, 60.0, 56.0, 57.0, 41.0, 33.0, 32.0, 21.0, 14.0, 16.0, 11.0, 10.0, 8.0, 7.0, 8.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.125, -3.034820556640625, -2.94464111328125, -2.854461669921875, -2.7642822265625, -2.674102783203125, -2.58392333984375, -2.493743896484375, -2.403564453125, -2.313385009765625, -2.22320556640625, -2.133026123046875, -2.0428466796875, -1.952667236328125, -1.86248779296875, -1.772308349609375, -1.68212890625, -1.591949462890625, -1.50177001953125, -1.411590576171875, -1.3214111328125, -1.231231689453125, -1.14105224609375, -1.050872802734375, -0.960693359375, -0.870513916015625, -0.78033447265625, -0.690155029296875, -0.5999755859375, -0.509796142578125, -0.41961669921875, -0.329437255859375, -0.2392578125, -0.149078369140625, -0.05889892578125, 0.031280517578125, 0.1214599609375, 0.211639404296875, 0.30181884765625, 0.391998291015625, 0.482177734375, 0.572357177734375, 0.66253662109375, 0.752716064453125, 0.8428955078125, 0.933074951171875, 1.02325439453125, 1.113433837890625, 1.20361328125, 1.293792724609375, 1.38397216796875, 1.474151611328125, 1.5643310546875, 1.654510498046875, 1.74468994140625, 1.834869384765625, 1.925048828125, 2.015228271484375, 2.10540771484375, 2.195587158203125, 2.2857666015625, 2.375946044921875, 2.46612548828125, 2.556304931640625, 2.646484375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 9.0, 5.0, 11.0, 15.0, 10.0, 15.0, 26.0, 32.0, 36.0, 40.0, 36.0, 49.0, 49.0, 66.0, 61.0, 60.0, 80.0, 77.0, 49.0, 42.0, 37.0, 41.0, 27.0, 26.0, 23.0, 25.0, 18.0, 11.0, 6.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.293867111206055, -18.58577537536621, -17.877683639526367, -17.169593811035156, -16.461502075195312, -15.753410339355469, -15.045318603515625, -14.337226867675781, -13.629136085510254, -12.92104434967041, -12.212953567504883, -11.504861831665039, -10.796770095825195, -10.088679313659668, -9.380587577819824, -8.672496795654297, -7.964405059814453, -7.256313800811768, -6.548222541809082, -5.840130805969238, -5.132039546966553, -4.423948287963867, -3.7158565521240234, -3.007765293121338, -2.2996740341186523, -1.5915826559066772, -0.8834912776947021, -0.1753997802734375, 0.532691478729248, 1.2407827377319336, 1.9488744735717773, 2.656965732574463, 3.3650550842285156, 4.073146343231201, 4.781237602233887, 5.4893293380737305, 6.197420597076416, 6.905511856079102, 7.613603591918945, 8.321695327758789, 9.029786109924316, 9.73787784576416, 10.445968627929688, 11.154060363769531, 11.862152099609375, 12.570242881774902, 13.278334617614746, 13.986425399780273, 14.694517135620117, 15.402608871459961, 16.110700607299805, 16.818790435791016, 17.52688217163086, 18.234973907470703, 18.943065643310547, 19.65115737915039, 20.359249114990234, 21.067340850830078, 21.775432586669922, 22.483524322509766, 23.191614151000977, 23.89970588684082, 24.607797622680664, 25.315889358520508, 26.02397918701172]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 10.0, 5.0, 4.0, 14.0, 10.0, 15.0, 24.0, 22.0, 24.0, 27.0, 19.0, 40.0, 33.0, 36.0, 33.0, 46.0, 37.0, 46.0, 28.0, 35.0, 56.0, 53.0, 43.0, 42.0, 36.0, 31.0, 29.0, 21.0, 26.0, 22.0, 26.0, 14.0, 19.0, 13.0, 9.0, 7.0, 4.0, 8.0, 5.0, 4.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.718064308166504, -9.37883186340332, -9.03959846496582, -8.700366020202637, -8.361133575439453, -8.02190113067627, -7.682668209075928, -7.343435287475586, -7.004202842712402, -6.664970397949219, -6.325737476348877, -5.986504554748535, -5.647272109985352, -5.308039665222168, -4.968806743621826, -4.629573822021484, -4.290341377258301, -3.951108694076538, -3.6118760108947754, -3.2726433277130127, -2.93341064453125, -2.5941779613494873, -2.2549452781677246, -1.915712594985962, -1.5764799118041992, -1.2372472286224365, -0.8980145454406738, -0.5587818622589111, -0.21954917907714844, 0.11968350410461426, 0.45891618728637695, 0.7981488704681396, 1.1373815536499023, 1.476614236831665, 1.8158469200134277, 2.1550796031951904, 2.494312286376953, 2.833544969558716, 3.1727776527404785, 3.512010335922241, 3.851243019104004, 4.1904754638671875, 4.529708385467529, 4.868941307067871, 5.208173751831055, 5.547406196594238, 5.88663911819458, 6.225872039794922, 6.5651044845581055, 6.904336929321289, 7.243569850921631, 7.582802772521973, 7.922035217285156, 8.26126766204834, 8.600500106811523, 8.939733505249023, 9.278965950012207, 9.61819839477539, 9.95743179321289, 10.296664237976074, 10.635896682739258, 10.975129127502441, 11.314361572265625, 11.653594970703125, 11.992827415466309]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 9.0, 10.0, 16.0, 24.0, 27.0, 33.0, 51.0, 66.0, 112.0, 146.0, 217.0, 344.0, 482.0, 836.0, 1163.0, 1852.0, 3073.0, 5224.0, 8874.0, 16601.0, 31389.0, 62480.0, 130923.0, 286982.0, 622053.0, 1053119.0, 970843.0, 528769.0, 242456.0, 110747.0, 53930.0, 27261.0, 14248.0, 8149.0, 4549.0, 2568.0, 1665.0, 1001.0, 665.0, 426.0, 264.0, 215.0, 122.0, 83.0, 70.0, 34.0, 36.0, 24.0, 18.0, 16.0, 9.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.02880859375, -18.3701171875, -17.71142578125, -17.052734375, -16.39404296875, -15.7353515625, -15.07666015625, -14.41796875, -13.75927734375, -13.1005859375, -12.44189453125, -11.783203125, -11.12451171875, -10.4658203125, -9.80712890625, -9.1484375, -8.48974609375, -7.8310546875, -7.17236328125, -6.513671875, -5.85498046875, -5.1962890625, -4.53759765625, -3.87890625, -3.22021484375, -2.5615234375, -1.90283203125, -1.244140625, -0.58544921875, 0.0732421875, 0.73193359375, 1.390625, 2.04931640625, 2.7080078125, 3.36669921875, 4.025390625, 4.68408203125, 5.3427734375, 6.00146484375, 6.66015625, 7.31884765625, 7.9775390625, 8.63623046875, 9.294921875, 9.95361328125, 10.6123046875, 11.27099609375, 11.9296875, 12.58837890625, 13.2470703125, 13.90576171875, 14.564453125, 15.22314453125, 15.8818359375, 16.54052734375, 17.19921875, 17.85791015625, 18.5166015625, 19.17529296875, 19.833984375, 20.49267578125, 21.1513671875, 21.81005859375, 22.46875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 12.0, 10.0, 15.0, 17.0, 21.0, 27.0, 31.0, 32.0, 30.0, 33.0, 38.0, 39.0, 48.0, 50.0, 48.0, 53.0, 49.0, 49.0, 39.0, 38.0, 50.0, 33.0, 29.0, 26.0, 32.0, 22.0, 15.0, 9.0, 14.0, 12.0, 10.0, 14.0, 6.0, 7.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0272216796875, -8.718505859375, -8.4097900390625, -8.10107421875, -7.7923583984375, -7.483642578125, -7.1749267578125, -6.8662109375, -6.5574951171875, -6.248779296875, -5.9400634765625, -5.63134765625, -5.3226318359375, -5.013916015625, -4.7052001953125, -4.396484375, -4.0877685546875, -3.779052734375, -3.4703369140625, -3.16162109375, -2.8529052734375, -2.544189453125, -2.2354736328125, -1.9267578125, -1.6180419921875, -1.309326171875, -1.0006103515625, -0.69189453125, -0.3831787109375, -0.074462890625, 0.2342529296875, 0.54296875, 0.8516845703125, 1.160400390625, 1.4691162109375, 1.77783203125, 2.0865478515625, 2.395263671875, 2.7039794921875, 3.0126953125, 3.3214111328125, 3.630126953125, 3.9388427734375, 4.24755859375, 4.5562744140625, 4.864990234375, 5.1737060546875, 5.482421875, 5.7911376953125, 6.099853515625, 6.4085693359375, 6.71728515625, 7.0260009765625, 7.334716796875, 7.6434326171875, 7.9521484375, 8.2608642578125, 8.569580078125, 8.8782958984375, 9.18701171875, 9.4957275390625, 9.804443359375, 10.1131591796875, 10.421875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 6.0, 9.0, 12.0, 6.0, 19.0, 21.0, 40.0, 60.0, 60.0, 90.0, 146.0, 221.0, 348.0, 536.0, 879.0, 1406.0, 2259.0, 3802.0, 6575.0, 11286.0, 19651.0, 34508.0, 62868.0, 114539.0, 212807.0, 382621.0, 634483.0, 841551.0, 752811.0, 490491.0, 277905.0, 152857.0, 83064.0, 45143.0, 25451.0, 14633.0, 8431.0, 4835.0, 2924.0, 1811.0, 1130.0, 678.0, 449.0, 303.0, 192.0, 119.0, 95.0, 44.0, 38.0, 22.0, 12.0, 13.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.25, -18.643310546875, -18.03662109375, -17.429931640625, -16.8232421875, -16.216552734375, -15.60986328125, -15.003173828125, -14.396484375, -13.789794921875, -13.18310546875, -12.576416015625, -11.9697265625, -11.363037109375, -10.75634765625, -10.149658203125, -9.54296875, -8.936279296875, -8.32958984375, -7.722900390625, -7.1162109375, -6.509521484375, -5.90283203125, -5.296142578125, -4.689453125, -4.082763671875, -3.47607421875, -2.869384765625, -2.2626953125, -1.656005859375, -1.04931640625, -0.442626953125, 0.1640625, 0.770751953125, 1.37744140625, 1.984130859375, 2.5908203125, 3.197509765625, 3.80419921875, 4.410888671875, 5.017578125, 5.624267578125, 6.23095703125, 6.837646484375, 7.4443359375, 8.051025390625, 8.65771484375, 9.264404296875, 9.87109375, 10.477783203125, 11.08447265625, 11.691162109375, 12.2978515625, 12.904541015625, 13.51123046875, 14.117919921875, 14.724609375, 15.331298828125, 15.93798828125, 16.544677734375, 17.1513671875, 17.758056640625, 18.36474609375, 18.971435546875, 19.578125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 13.0, 13.0, 30.0, 22.0, 38.0, 32.0, 52.0, 84.0, 91.0, 119.0, 143.0, 188.0, 235.0, 248.0, 301.0, 269.0, 302.0, 320.0, 264.0, 262.0, 228.0, 177.0, 122.0, 112.0, 116.0, 67.0, 69.0, 30.0, 27.0, 26.0, 21.0, 9.0, 10.0, 8.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.0078125, -7.7862548828125, -7.564697265625, -7.3431396484375, -7.12158203125, -6.9000244140625, -6.678466796875, -6.4569091796875, -6.2353515625, -6.0137939453125, -5.792236328125, -5.5706787109375, -5.34912109375, -5.1275634765625, -4.906005859375, -4.6844482421875, -4.462890625, -4.2413330078125, -4.019775390625, -3.7982177734375, -3.57666015625, -3.3551025390625, -3.133544921875, -2.9119873046875, -2.6904296875, -2.4688720703125, -2.247314453125, -2.0257568359375, -1.80419921875, -1.5826416015625, -1.361083984375, -1.1395263671875, -0.91796875, -0.6964111328125, -0.474853515625, -0.2532958984375, -0.03173828125, 0.1898193359375, 0.411376953125, 0.6329345703125, 0.8544921875, 1.0760498046875, 1.297607421875, 1.5191650390625, 1.74072265625, 1.9622802734375, 2.183837890625, 2.4053955078125, 2.626953125, 2.8485107421875, 3.070068359375, 3.2916259765625, 3.51318359375, 3.7347412109375, 3.956298828125, 4.1778564453125, 4.3994140625, 4.6209716796875, 4.842529296875, 5.0640869140625, 5.28564453125, 5.5072021484375, 5.728759765625, 5.9503173828125, 6.171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 9.0, 19.0, 14.0, 17.0, 20.0, 28.0, 18.0, 40.0, 44.0, 51.0, 55.0, 43.0, 46.0, 55.0, 47.0, 56.0, 52.0, 52.0, 48.0, 44.0, 41.0, 24.0, 21.0, 21.0, 25.0, 16.0, 13.0, 8.0, 6.0, 9.0, 4.0, 11.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.998210906982422, -16.371292114257812, -15.744372367858887, -15.117452621459961, -14.490533828735352, -13.863615036010742, -13.236695289611816, -12.60977554321289, -11.982856750488281, -11.355937957763672, -10.729018211364746, -10.10209846496582, -9.475179672241211, -8.848260879516602, -8.221341133117676, -7.594421863555908, -6.967502593994141, -6.340583324432373, -5.7136640548706055, -5.086744785308838, -4.45982551574707, -3.8329062461853027, -3.205986976623535, -2.5790677070617676, -1.9521484375, -1.3252291679382324, -0.6983098983764648, -0.07139062881469727, 0.5555286407470703, 1.182447910308838, 1.8093671798706055, 2.436286449432373, 3.063203811645508, 3.6901230812072754, 4.317042350769043, 4.9439616203308105, 5.570880889892578, 6.197800159454346, 6.824719429016113, 7.451638698577881, 8.078557968139648, 8.705476760864258, 9.332396507263184, 9.95931625366211, 10.586235046386719, 11.213153839111328, 11.840073585510254, 12.46699333190918, 13.093912124633789, 13.720830917358398, 14.347750663757324, 14.97467041015625, 15.60158920288086, 16.22850799560547, 16.855426788330078, 17.48234748840332, 18.10926628112793, 18.73618507385254, 19.36310577392578, 19.99002456665039, 20.616943359375, 21.24386215209961, 21.87078094482422, 22.49770164489746, 23.12462043762207]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 11.0, 12.0, 11.0, 20.0, 13.0, 16.0, 24.0, 25.0, 20.0, 33.0, 33.0, 46.0, 42.0, 34.0, 42.0, 35.0, 48.0, 45.0, 41.0, 38.0, 36.0, 34.0, 37.0, 38.0, 32.0, 35.0, 24.0, 27.0, 26.0, 17.0, 15.0, 12.0, 15.0, 7.0, 11.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6232271194458, -12.234650611877441, -11.846074104309082, -11.457497596740723, -11.06892204284668, -10.68034553527832, -10.291769027709961, -9.903192520141602, -9.514616012573242, -9.126039505004883, -8.737462997436523, -8.348886489868164, -7.960310459136963, -7.5717339515686035, -7.183157920837402, -6.794581413269043, -6.406004905700684, -6.017428398132324, -5.628851890563965, -5.240275859832764, -4.851699352264404, -4.463122844696045, -4.074546813964844, -3.6859703063964844, -3.297393798828125, -2.9088172912597656, -2.5202410221099854, -2.131664752960205, -1.7430882453918457, -1.3545118570327759, -0.965935468673706, -0.5773591995239258, -0.1887836456298828, 0.199792742729187, 0.5883691310882568, 0.9769455194473267, 1.3655219078063965, 1.7540982961654663, 2.142674684524536, 2.5312509536743164, 2.919827461242676, 3.308403968811035, 3.6969802379608154, 4.085556507110596, 4.474133014678955, 4.8627095222473145, 5.251285552978516, 5.639862060546875, 6.028438568115234, 6.417015075683594, 6.805591583251953, 7.194167613983154, 7.582744121551514, 7.971320629119873, 8.359896659851074, 8.748473167419434, 9.137049674987793, 9.525626182556152, 9.914202690124512, 10.302779197692871, 10.691354751586914, 11.079931259155273, 11.468507766723633, 11.857084274291992, 12.245660781860352]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 8.0, 18.0, 44.0, 44.0, 67.0, 84.0, 148.0, 202.0, 306.0, 535.0, 818.0, 1342.0, 2163.0, 3814.0, 6910.0, 13635.0, 30306.0, 76403.0, 188641.0, 310426.0, 234222.0, 101651.0, 40063.0, 17178.0, 8418.0, 4409.0, 2652.0, 1519.0, 870.0, 528.0, 372.0, 237.0, 145.0, 119.0, 66.0, 38.0, 41.0, 27.0, 15.0, 20.0, 5.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.515625, -21.729736328125, -20.94384765625, -20.157958984375, -19.3720703125, -18.586181640625, -17.80029296875, -17.014404296875, -16.228515625, -15.442626953125, -14.65673828125, -13.870849609375, -13.0849609375, -12.299072265625, -11.51318359375, -10.727294921875, -9.94140625, -9.155517578125, -8.36962890625, -7.583740234375, -6.7978515625, -6.011962890625, -5.22607421875, -4.440185546875, -3.654296875, -2.868408203125, -2.08251953125, -1.296630859375, -0.5107421875, 0.275146484375, 1.06103515625, 1.846923828125, 2.6328125, 3.418701171875, 4.20458984375, 4.990478515625, 5.7763671875, 6.562255859375, 7.34814453125, 8.134033203125, 8.919921875, 9.705810546875, 10.49169921875, 11.277587890625, 12.0634765625, 12.849365234375, 13.63525390625, 14.421142578125, 15.20703125, 15.992919921875, 16.77880859375, 17.564697265625, 18.3505859375, 19.136474609375, 19.92236328125, 20.708251953125, 21.494140625, 22.280029296875, 23.06591796875, 23.851806640625, 24.6376953125, 25.423583984375, 26.20947265625, 26.995361328125, 27.78125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 4.0, 13.0, 19.0, 13.0, 21.0, 16.0, 24.0, 23.0, 32.0, 37.0, 33.0, 38.0, 41.0, 44.0, 40.0, 41.0, 32.0, 43.0, 44.0, 42.0, 36.0, 41.0, 39.0, 32.0, 27.0, 25.0, 26.0, 26.0, 23.0, 16.0, 15.0, 10.0, 10.0, 12.0, 11.0, 6.0, 5.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-14.453125, -14.03759765625, -13.6220703125, -13.20654296875, -12.791015625, -12.37548828125, -11.9599609375, -11.54443359375, -11.12890625, -10.71337890625, -10.2978515625, -9.88232421875, -9.466796875, -9.05126953125, -8.6357421875, -8.22021484375, -7.8046875, -7.38916015625, -6.9736328125, -6.55810546875, -6.142578125, -5.72705078125, -5.3115234375, -4.89599609375, -4.48046875, -4.06494140625, -3.6494140625, -3.23388671875, -2.818359375, -2.40283203125, -1.9873046875, -1.57177734375, -1.15625, -0.74072265625, -0.3251953125, 0.09033203125, 0.505859375, 0.92138671875, 1.3369140625, 1.75244140625, 2.16796875, 2.58349609375, 2.9990234375, 3.41455078125, 3.830078125, 4.24560546875, 4.6611328125, 5.07666015625, 5.4921875, 5.90771484375, 6.3232421875, 6.73876953125, 7.154296875, 7.56982421875, 7.9853515625, 8.40087890625, 8.81640625, 9.23193359375, 9.6474609375, 10.06298828125, 10.478515625, 10.89404296875, 11.3095703125, 11.72509765625, 12.140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 9.0, 7.0, 16.0, 18.0, 27.0, 32.0, 54.0, 59.0, 93.0, 116.0, 157.0, 226.0, 333.0, 422.0, 630.0, 928.0, 1436.0, 2473.0, 4365.0, 8644.0, 20467.0, 61866.0, 232867.0, 451484.0, 178812.0, 48238.0, 16795.0, 7581.0, 3820.0, 2255.0, 1423.0, 868.0, 590.0, 416.0, 284.0, 218.0, 125.0, 91.0, 88.0, 50.0, 49.0, 39.0, 24.0, 15.0, 12.0, 7.0, 3.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.40625, -36.21484375, -35.0234375, -33.83203125, -32.640625, -31.44921875, -30.2578125, -29.06640625, -27.875, -26.68359375, -25.4921875, -24.30078125, -23.109375, -21.91796875, -20.7265625, -19.53515625, -18.34375, -17.15234375, -15.9609375, -14.76953125, -13.578125, -12.38671875, -11.1953125, -10.00390625, -8.8125, -7.62109375, -6.4296875, -5.23828125, -4.046875, -2.85546875, -1.6640625, -0.47265625, 0.71875, 1.91015625, 3.1015625, 4.29296875, 5.484375, 6.67578125, 7.8671875, 9.05859375, 10.25, 11.44140625, 12.6328125, 13.82421875, 15.015625, 16.20703125, 17.3984375, 18.58984375, 19.78125, 20.97265625, 22.1640625, 23.35546875, 24.546875, 25.73828125, 26.9296875, 28.12109375, 29.3125, 30.50390625, 31.6953125, 32.88671875, 34.078125, 35.26953125, 36.4609375, 37.65234375, 38.84375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 6.0, 14.0, 12.0, 16.0, 19.0, 19.0, 20.0, 23.0, 35.0, 26.0, 26.0, 40.0, 28.0, 38.0, 38.0, 45.0, 35.0, 47.0, 27.0, 44.0, 41.0, 38.0, 35.0, 35.0, 36.0, 30.0, 31.0, 25.0, 21.0, 17.0, 17.0, 15.0, 8.0, 14.0, 8.0, 5.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-7.62890625, -7.397216796875, -7.16552734375, -6.933837890625, -6.7021484375, -6.470458984375, -6.23876953125, -6.007080078125, -5.775390625, -5.543701171875, -5.31201171875, -5.080322265625, -4.8486328125, -4.616943359375, -4.38525390625, -4.153564453125, -3.921875, -3.690185546875, -3.45849609375, -3.226806640625, -2.9951171875, -2.763427734375, -2.53173828125, -2.300048828125, -2.068359375, -1.836669921875, -1.60498046875, -1.373291015625, -1.1416015625, -0.909912109375, -0.67822265625, -0.446533203125, -0.21484375, 0.016845703125, 0.24853515625, 0.480224609375, 0.7119140625, 0.943603515625, 1.17529296875, 1.406982421875, 1.638671875, 1.870361328125, 2.10205078125, 2.333740234375, 2.5654296875, 2.797119140625, 3.02880859375, 3.260498046875, 3.4921875, 3.723876953125, 3.95556640625, 4.187255859375, 4.4189453125, 4.650634765625, 4.88232421875, 5.114013671875, 5.345703125, 5.577392578125, 5.80908203125, 6.040771484375, 6.2724609375, 6.504150390625, 6.73583984375, 6.967529296875, 7.19921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 12.0, 10.0, 14.0, 21.0, 34.0, 51.0, 59.0, 84.0, 126.0, 180.0, 292.0, 399.0, 584.0, 853.0, 1227.0, 1850.0, 2689.0, 4400.0, 7232.0, 13801.0, 31358.0, 92852.0, 299693.0, 377313.0, 131713.0, 41387.0, 16993.0, 8624.0, 5015.0, 3120.0, 2081.0, 1416.0, 952.0, 625.0, 476.0, 321.0, 209.0, 147.0, 114.0, 81.0, 47.0, 31.0, 20.0, 8.0, 16.0, 10.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.0, -16.487060546875, -15.97412109375, -15.461181640625, -14.9482421875, -14.435302734375, -13.92236328125, -13.409423828125, -12.896484375, -12.383544921875, -11.87060546875, -11.357666015625, -10.8447265625, -10.331787109375, -9.81884765625, -9.305908203125, -8.79296875, -8.280029296875, -7.76708984375, -7.254150390625, -6.7412109375, -6.228271484375, -5.71533203125, -5.202392578125, -4.689453125, -4.176513671875, -3.66357421875, -3.150634765625, -2.6376953125, -2.124755859375, -1.61181640625, -1.098876953125, -0.5859375, -0.072998046875, 0.43994140625, 0.952880859375, 1.4658203125, 1.978759765625, 2.49169921875, 3.004638671875, 3.517578125, 4.030517578125, 4.54345703125, 5.056396484375, 5.5693359375, 6.082275390625, 6.59521484375, 7.108154296875, 7.62109375, 8.134033203125, 8.64697265625, 9.159912109375, 9.6728515625, 10.185791015625, 10.69873046875, 11.211669921875, 11.724609375, 12.237548828125, 12.75048828125, 13.263427734375, 13.7763671875, 14.289306640625, 14.80224609375, 15.315185546875, 15.828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 3.0, 2.0, 12.0, 13.0, 18.0, 26.0, 55.0, 76.0, 122.0, 143.0, 142.0, 120.0, 82.0, 55.0, 30.0, 19.0, 16.0, 9.0, 12.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008711814880371094, -0.0008402243256568909, -0.0008092671632766724, -0.0007783100008964539, -0.0007473528385162354, -0.0007163956761360168, -0.0006854385137557983, -0.0006544813513755798, -0.0006235241889953613, -0.0005925670266151428, -0.0005616098642349243, -0.0005306527018547058, -0.0004996955394744873, -0.0004687383770942688, -0.0004377812147140503, -0.0004068240523338318, -0.0003758668899536133, -0.0003449097275733948, -0.00031395256519317627, -0.00028299540281295776, -0.00025203824043273926, -0.00022108107805252075, -0.00019012391567230225, -0.00015916675329208374, -0.00012820959091186523, -9.725242853164673e-05, -6.629526615142822e-05, -3.533810377120972e-05, -4.380941390991211e-06, 2.6576220989227295e-05, 5.75333833694458e-05, 8.84905457496643e-05, 0.00011944770812988281, 0.00015040487051010132, 0.00018136203289031982, 0.00021231919527053833, 0.00024327635765075684, 0.00027423352003097534, 0.00030519068241119385, 0.00033614784479141235, 0.00036710500717163086, 0.00039806216955184937, 0.00042901933193206787, 0.0004599764943122864, 0.0004909336566925049, 0.0005218908190727234, 0.0005528479814529419, 0.0005838051438331604, 0.0006147623062133789, 0.0006457194685935974, 0.0006766766309738159, 0.0007076337933540344, 0.0007385909557342529, 0.0007695481181144714, 0.0008005052804946899, 0.0008314624428749084, 0.000862419605255127, 0.0008933767676353455, 0.000924333930015564, 0.0009552910923957825, 0.000986248254776001, 0.0010172054171562195, 0.001048162579536438, 0.0010791197419166565, 0.001110076904296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 15.0, 31.0, 29.0, 60.0, 97.0, 90.0, 135.0, 179.0, 266.0, 326.0, 498.0, 676.0, 1000.0, 1314.0, 1765.0, 2334.0, 3454.0, 4993.0, 7652.0, 13254.0, 29506.0, 85327.0, 242484.0, 351801.0, 184129.0, 60911.0, 22694.0, 11171.0, 6525.0, 4509.0, 3119.0, 2280.0, 1541.0, 1168.0, 889.0, 676.0, 458.0, 349.0, 230.0, 159.0, 121.0, 86.0, 64.0, 52.0, 37.0, 18.0, 16.0, 9.0, 10.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-15.1171875, -14.635009765625, -14.15283203125, -13.670654296875, -13.1884765625, -12.706298828125, -12.22412109375, -11.741943359375, -11.259765625, -10.777587890625, -10.29541015625, -9.813232421875, -9.3310546875, -8.848876953125, -8.36669921875, -7.884521484375, -7.40234375, -6.920166015625, -6.43798828125, -5.955810546875, -5.4736328125, -4.991455078125, -4.50927734375, -4.027099609375, -3.544921875, -3.062744140625, -2.58056640625, -2.098388671875, -1.6162109375, -1.134033203125, -0.65185546875, -0.169677734375, 0.3125, 0.794677734375, 1.27685546875, 1.759033203125, 2.2412109375, 2.723388671875, 3.20556640625, 3.687744140625, 4.169921875, 4.652099609375, 5.13427734375, 5.616455078125, 6.0986328125, 6.580810546875, 7.06298828125, 7.545166015625, 8.02734375, 8.509521484375, 8.99169921875, 9.473876953125, 9.9560546875, 10.438232421875, 10.92041015625, 11.402587890625, 11.884765625, 12.366943359375, 12.84912109375, 13.331298828125, 13.8134765625, 14.295654296875, 14.77783203125, 15.260009765625, 15.7421875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 10.0, 18.0, 20.0, 33.0, 61.0, 108.0, 126.0, 135.0, 143.0, 120.0, 60.0, 44.0, 22.0, 17.0, 9.0, 10.0, 3.0, 4.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.8157958984375, -4.635498046875, -4.4552001953125, -4.27490234375, -4.0946044921875, -3.914306640625, -3.7340087890625, -3.5537109375, -3.3734130859375, -3.193115234375, -3.0128173828125, -2.83251953125, -2.6522216796875, -2.471923828125, -2.2916259765625, -2.111328125, -1.9310302734375, -1.750732421875, -1.5704345703125, -1.39013671875, -1.2098388671875, -1.029541015625, -0.8492431640625, -0.6689453125, -0.4886474609375, -0.308349609375, -0.1280517578125, 0.05224609375, 0.2325439453125, 0.412841796875, 0.5931396484375, 0.7734375, 0.9537353515625, 1.134033203125, 1.3143310546875, 1.49462890625, 1.6749267578125, 1.855224609375, 2.0355224609375, 2.2158203125, 2.3961181640625, 2.576416015625, 2.7567138671875, 2.93701171875, 3.1173095703125, 3.297607421875, 3.4779052734375, 3.658203125, 3.8385009765625, 4.018798828125, 4.1990966796875, 4.37939453125, 4.5596923828125, 4.739990234375, 4.9202880859375, 5.1005859375, 5.2808837890625, 5.461181640625, 5.6414794921875, 5.82177734375, 6.0020751953125, 6.182373046875, 6.3626708984375, 6.54296875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 2.0, 13.0, 11.0, 12.0, 16.0, 18.0, 15.0, 24.0, 23.0, 35.0, 39.0, 46.0, 58.0, 59.0, 54.0, 64.0, 48.0, 69.0, 62.0, 57.0, 43.0, 45.0, 29.0, 27.0, 40.0, 22.0, 17.0, 3.0, 8.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.16149139404297, -19.467941284179688, -18.774391174316406, -18.080839157104492, -17.38728904724121, -16.69373893737793, -16.000186920166016, -15.306636810302734, -14.613086700439453, -13.919536590576172, -13.225985527038574, -12.532434463500977, -11.838884353637695, -11.145334243774414, -10.451783180236816, -9.758232116699219, -9.064682006835938, -8.371131896972656, -7.677580833435059, -6.984030246734619, -6.29047966003418, -5.59692907333374, -4.903378486633301, -4.209827899932861, -3.516277313232422, -2.8227267265319824, -2.129176139831543, -1.4356255531311035, -0.7420749664306641, -0.04852437973022461, 0.6450262069702148, 1.3385767936706543, 2.0321273803710938, 2.725677967071533, 3.4192285537719727, 4.112779140472412, 4.806329727172852, 5.499880313873291, 6.1934309005737305, 6.88698148727417, 7.580532073974609, 8.27408218383789, 8.967633247375488, 9.661184310913086, 10.354734420776367, 11.048284530639648, 11.741835594177246, 12.435386657714844, 13.128936767578125, 13.822486877441406, 14.516037940979004, 15.209589004516602, 15.903139114379883, 16.596689224243164, 17.290241241455078, 17.98379135131836, 18.67734146118164, 19.370891571044922, 20.064441680908203, 20.757993698120117, 21.4515438079834, 22.14509391784668, 22.838645935058594, 23.532196044921875, 24.225746154785156]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 6.0, 5.0, 8.0, 13.0, 9.0, 12.0, 12.0, 15.0, 22.0, 24.0, 19.0, 33.0, 27.0, 32.0, 38.0, 46.0, 34.0, 41.0, 42.0, 37.0, 39.0, 32.0, 47.0, 34.0, 38.0, 34.0, 43.0, 37.0, 30.0, 25.0, 28.0, 17.0, 26.0, 12.0, 17.0, 13.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.440733909606934, -12.069839477539062, -11.698945045471191, -11.32805061340332, -10.957157135009766, -10.586262702941895, -10.215368270874023, -9.844473838806152, -9.473579406738281, -9.10268497467041, -8.731790542602539, -8.360896110534668, -7.990002155303955, -7.619107723236084, -7.248213768005371, -6.8773193359375, -6.506424903869629, -6.135530471801758, -5.764636039733887, -5.393742084503174, -5.022847652435303, -4.651953220367432, -4.281059265136719, -3.9101648330688477, -3.5392704010009766, -3.1683759689331055, -2.7974817752838135, -2.4265875816345215, -2.0556931495666504, -1.6847988367080688, -1.3139045238494873, -0.9430103302001953, -0.5721149444580078, -0.20122063159942627, 0.16967368125915527, 0.5405679941177368, 0.9114623069763184, 1.2823566198349, 1.6532509326934814, 2.0241451263427734, 2.3950395584106445, 2.7659339904785156, 3.1368281841278076, 3.5077223777770996, 3.8786168098449707, 4.249511241912842, 4.620405197143555, 4.991299629211426, 5.362194061279297, 5.733088493347168, 6.103982925415039, 6.474876880645752, 6.845771312713623, 7.216665744781494, 7.587559700012207, 7.958454132080078, 8.32934856414795, 8.70024299621582, 9.071137428283691, 9.442031860351562, 9.812925338745117, 10.183819770812988, 10.55471420288086, 10.92560863494873, 11.296503067016602]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 12.0, 20.0, 22.0, 24.0, 52.0, 70.0, 119.0, 172.0, 288.0, 394.0, 654.0, 998.0, 1620.0, 2649.0, 4147.0, 6606.0, 10747.0, 16956.0, 26570.0, 40557.0, 61366.0, 85718.0, 112100.0, 130219.0, 133303.0, 119228.0, 94835.0, 68534.0, 46980.0, 30792.0, 19592.0, 12397.0, 7808.0, 4811.0, 3105.0, 1956.0, 1155.0, 717.0, 449.0, 265.0, 174.0, 123.0, 88.0, 45.0, 38.0, 26.0, 16.0, 9.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-12.296875, -11.91455078125, -11.5322265625, -11.14990234375, -10.767578125, -10.38525390625, -10.0029296875, -9.62060546875, -9.23828125, -8.85595703125, -8.4736328125, -8.09130859375, -7.708984375, -7.32666015625, -6.9443359375, -6.56201171875, -6.1796875, -5.79736328125, -5.4150390625, -5.03271484375, -4.650390625, -4.26806640625, -3.8857421875, -3.50341796875, -3.12109375, -2.73876953125, -2.3564453125, -1.97412109375, -1.591796875, -1.20947265625, -0.8271484375, -0.44482421875, -0.0625, 0.31982421875, 0.7021484375, 1.08447265625, 1.466796875, 1.84912109375, 2.2314453125, 2.61376953125, 2.99609375, 3.37841796875, 3.7607421875, 4.14306640625, 4.525390625, 4.90771484375, 5.2900390625, 5.67236328125, 6.0546875, 6.43701171875, 6.8193359375, 7.20166015625, 7.583984375, 7.96630859375, 8.3486328125, 8.73095703125, 9.11328125, 9.49560546875, 9.8779296875, 10.26025390625, 10.642578125, 11.02490234375, 11.4072265625, 11.78955078125, 12.171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 6.0, 10.0, 14.0, 14.0, 14.0, 27.0, 19.0, 28.0, 26.0, 29.0, 41.0, 30.0, 32.0, 39.0, 35.0, 51.0, 46.0, 53.0, 40.0, 42.0, 37.0, 41.0, 44.0, 37.0, 38.0, 33.0, 14.0, 23.0, 15.0, 24.0, 16.0, 12.0, 19.0, 1.0, 4.0, 9.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.5404052734375, -12.127685546875, -11.7149658203125, -11.30224609375, -10.8895263671875, -10.476806640625, -10.0640869140625, -9.6513671875, -9.2386474609375, -8.825927734375, -8.4132080078125, -8.00048828125, -7.5877685546875, -7.175048828125, -6.7623291015625, -6.349609375, -5.9368896484375, -5.524169921875, -5.1114501953125, -4.69873046875, -4.2860107421875, -3.873291015625, -3.4605712890625, -3.0478515625, -2.6351318359375, -2.222412109375, -1.8096923828125, -1.39697265625, -0.9842529296875, -0.571533203125, -0.1588134765625, 0.25390625, 0.6666259765625, 1.079345703125, 1.4920654296875, 1.90478515625, 2.3175048828125, 2.730224609375, 3.1429443359375, 3.5556640625, 3.9683837890625, 4.381103515625, 4.7938232421875, 5.20654296875, 5.6192626953125, 6.031982421875, 6.4447021484375, 6.857421875, 7.2701416015625, 7.682861328125, 8.0955810546875, 8.50830078125, 8.9210205078125, 9.333740234375, 9.7464599609375, 10.1591796875, 10.5718994140625, 10.984619140625, 11.3973388671875, 11.81005859375, 12.2227783203125, 12.635498046875, 13.0482177734375, 13.4609375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 12.0, 11.0, 17.0, 36.0, 45.0, 78.0, 96.0, 136.0, 222.0, 303.0, 490.0, 722.0, 1178.0, 1883.0, 2842.0, 4403.0, 7068.0, 10501.0, 16721.0, 26065.0, 38732.0, 57043.0, 79537.0, 101494.0, 120792.0, 127239.0, 118298.0, 99168.0, 75310.0, 53637.0, 36821.0, 23955.0, 15437.0, 10225.0, 6396.0, 4224.0, 2662.0, 1617.0, 1108.0, 700.0, 489.0, 259.0, 190.0, 134.0, 85.0, 60.0, 40.0, 20.0, 16.0, 10.0, 12.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.984375, -10.634765625, -10.28515625, -9.935546875, -9.5859375, -9.236328125, -8.88671875, -8.537109375, -8.1875, -7.837890625, -7.48828125, -7.138671875, -6.7890625, -6.439453125, -6.08984375, -5.740234375, -5.390625, -5.041015625, -4.69140625, -4.341796875, -3.9921875, -3.642578125, -3.29296875, -2.943359375, -2.59375, -2.244140625, -1.89453125, -1.544921875, -1.1953125, -0.845703125, -0.49609375, -0.146484375, 0.203125, 0.552734375, 0.90234375, 1.251953125, 1.6015625, 1.951171875, 2.30078125, 2.650390625, 3.0, 3.349609375, 3.69921875, 4.048828125, 4.3984375, 4.748046875, 5.09765625, 5.447265625, 5.796875, 6.146484375, 6.49609375, 6.845703125, 7.1953125, 7.544921875, 7.89453125, 8.244140625, 8.59375, 8.943359375, 9.29296875, 9.642578125, 9.9921875, 10.341796875, 10.69140625, 11.041015625, 11.390625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 5.0, 7.0, 5.0, 11.0, 13.0, 21.0, 15.0, 22.0, 26.0, 37.0, 33.0, 24.0, 37.0, 46.0, 38.0, 46.0, 32.0, 30.0, 37.0, 32.0, 49.0, 29.0, 41.0, 30.0, 31.0, 32.0, 42.0, 24.0, 29.0, 26.0, 20.0, 17.0, 13.0, 8.0, 20.0, 11.0, 7.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.4921875, -7.26995849609375, -7.0477294921875, -6.82550048828125, -6.603271484375, -6.38104248046875, -6.1588134765625, -5.93658447265625, -5.71435546875, -5.49212646484375, -5.2698974609375, -5.04766845703125, -4.825439453125, -4.60321044921875, -4.3809814453125, -4.15875244140625, -3.9365234375, -3.71429443359375, -3.4920654296875, -3.26983642578125, -3.047607421875, -2.82537841796875, -2.6031494140625, -2.38092041015625, -2.15869140625, -1.93646240234375, -1.7142333984375, -1.49200439453125, -1.269775390625, -1.04754638671875, -0.8253173828125, -0.60308837890625, -0.380859375, -0.15863037109375, 0.0635986328125, 0.28582763671875, 0.508056640625, 0.73028564453125, 0.9525146484375, 1.17474365234375, 1.39697265625, 1.61920166015625, 1.8414306640625, 2.06365966796875, 2.285888671875, 2.50811767578125, 2.7303466796875, 2.95257568359375, 3.1748046875, 3.39703369140625, 3.6192626953125, 3.84149169921875, 4.063720703125, 4.28594970703125, 4.5081787109375, 4.73040771484375, 4.95263671875, 5.17486572265625, 5.3970947265625, 5.61932373046875, 5.841552734375, 6.06378173828125, 6.2860107421875, 6.50823974609375, 6.73046875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 9.0, 12.0, 10.0, 17.0, 31.0, 38.0, 78.0, 97.0, 139.0, 224.0, 294.0, 411.0, 683.0, 1012.0, 1532.0, 2437.0, 3805.0, 6075.0, 9750.0, 15544.0, 25139.0, 39473.0, 60272.0, 88270.0, 117255.0, 139236.0, 141343.0, 122371.0, 92680.0, 64914.0, 42664.0, 27100.0, 16959.0, 10397.0, 6417.0, 4220.0, 2743.0, 1734.0, 1074.0, 687.0, 445.0, 327.0, 201.0, 133.0, 104.0, 63.0, 41.0, 25.0, 13.0, 17.0, 10.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0], "bins": [-6.19921875, -6.0118408203125, -5.824462890625, -5.6370849609375, -5.44970703125, -5.2623291015625, -5.074951171875, -4.8875732421875, -4.7001953125, -4.5128173828125, -4.325439453125, -4.1380615234375, -3.95068359375, -3.7633056640625, -3.575927734375, -3.3885498046875, -3.201171875, -3.0137939453125, -2.826416015625, -2.6390380859375, -2.45166015625, -2.2642822265625, -2.076904296875, -1.8895263671875, -1.7021484375, -1.5147705078125, -1.327392578125, -1.1400146484375, -0.95263671875, -0.7652587890625, -0.577880859375, -0.3905029296875, -0.203125, -0.0157470703125, 0.171630859375, 0.3590087890625, 0.54638671875, 0.7337646484375, 0.921142578125, 1.1085205078125, 1.2958984375, 1.4832763671875, 1.670654296875, 1.8580322265625, 2.04541015625, 2.2327880859375, 2.420166015625, 2.6075439453125, 2.794921875, 2.9822998046875, 3.169677734375, 3.3570556640625, 3.54443359375, 3.7318115234375, 3.919189453125, 4.1065673828125, 4.2939453125, 4.4813232421875, 4.668701171875, 4.8560791015625, 5.04345703125, 5.2308349609375, 5.418212890625, 5.6055908203125, 5.79296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 3.0, 14.0, 10.0, 15.0, 19.0, 15.0, 30.0, 35.0, 44.0, 49.0, 58.0, 62.0, 71.0, 82.0, 76.0, 77.0, 57.0, 48.0, 42.0, 36.0, 40.0, 26.0, 21.0, 15.0, 15.0, 9.0, 8.0, 6.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008788108825683594, -0.0008503124117851257, -0.0008218139410018921, -0.0007933154702186584, -0.0007648169994354248, -0.0007363185286521912, -0.0007078200578689575, -0.0006793215870857239, -0.0006508231163024902, -0.0006223246455192566, -0.000593826174736023, -0.0005653277039527893, -0.0005368292331695557, -0.000508330762386322, -0.0004798322916030884, -0.00045133382081985474, -0.0004228353500366211, -0.00039433687925338745, -0.0003658384084701538, -0.00033733993768692017, -0.0003088414669036865, -0.0002803429961204529, -0.00025184452533721924, -0.0002233460545539856, -0.00019484758377075195, -0.0001663491129875183, -0.00013785064220428467, -0.00010935217142105103, -8.085370063781738e-05, -5.235522985458374e-05, -2.3856759071350098e-05, 4.641711711883545e-06, 3.314018249511719e-05, 6.163865327835083e-05, 9.013712406158447e-05, 0.00011863559484481812, 0.00014713406562805176, 0.0001756325364112854, 0.00020413100719451904, 0.00023262947797775269, 0.00026112794876098633, 0.00028962641954421997, 0.0003181248903274536, 0.00034662336111068726, 0.0003751218318939209, 0.00040362030267715454, 0.0004321187734603882, 0.0004606172442436218, 0.0004891157150268555, 0.0005176141858100891, 0.0005461126565933228, 0.0005746111273765564, 0.00060310959815979, 0.0006316080689430237, 0.0006601065397262573, 0.000688605010509491, 0.0007171034812927246, 0.0007456019520759583, 0.0007741004228591919, 0.0008025988936424255, 0.0008310973644256592, 0.0008595958352088928, 0.0008880943059921265, 0.0009165927767753601, 0.0009450912475585938]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 11.0, 18.0, 26.0, 27.0, 52.0, 70.0, 112.0, 194.0, 313.0, 452.0, 713.0, 1133.0, 1801.0, 2911.0, 5053.0, 7676.0, 13016.0, 20967.0, 33646.0, 52131.0, 77653.0, 106268.0, 131775.0, 141052.0, 130608.0, 105571.0, 77126.0, 51866.0, 32834.0, 20423.0, 12657.0, 7724.0, 4749.0, 2900.0, 1864.0, 1172.0, 705.0, 472.0, 302.0, 194.0, 131.0, 73.0, 49.0, 25.0, 9.0, 13.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.5625, -6.3721923828125, -6.181884765625, -5.9915771484375, -5.80126953125, -5.6109619140625, -5.420654296875, -5.2303466796875, -5.0400390625, -4.8497314453125, -4.659423828125, -4.4691162109375, -4.27880859375, -4.0885009765625, -3.898193359375, -3.7078857421875, -3.517578125, -3.3272705078125, -3.136962890625, -2.9466552734375, -2.75634765625, -2.5660400390625, -2.375732421875, -2.1854248046875, -1.9951171875, -1.8048095703125, -1.614501953125, -1.4241943359375, -1.23388671875, -1.0435791015625, -0.853271484375, -0.6629638671875, -0.47265625, -0.2823486328125, -0.092041015625, 0.0982666015625, 0.28857421875, 0.4788818359375, 0.669189453125, 0.8594970703125, 1.0498046875, 1.2401123046875, 1.430419921875, 1.6207275390625, 1.81103515625, 2.0013427734375, 2.191650390625, 2.3819580078125, 2.572265625, 2.7625732421875, 2.952880859375, 3.1431884765625, 3.33349609375, 3.5238037109375, 3.714111328125, 3.9044189453125, 4.0947265625, 4.2850341796875, 4.475341796875, 4.6656494140625, 4.85595703125, 5.0462646484375, 5.236572265625, 5.4268798828125, 5.6171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 11.0, 11.0, 12.0, 7.0, 16.0, 14.0, 15.0, 16.0, 18.0, 27.0, 22.0, 38.0, 30.0, 39.0, 33.0, 54.0, 35.0, 44.0, 41.0, 44.0, 39.0, 50.0, 52.0, 36.0, 29.0, 30.0, 25.0, 29.0, 35.0, 23.0, 12.0, 19.0, 16.0, 16.0, 10.0, 8.0, 7.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.5979766845703125, -1.546539306640625, -1.4951019287109375, -1.44366455078125, -1.3922271728515625, -1.340789794921875, -1.2893524169921875, -1.2379150390625, -1.1864776611328125, -1.135040283203125, -1.0836029052734375, -1.03216552734375, -0.9807281494140625, -0.929290771484375, -0.8778533935546875, -0.826416015625, -0.7749786376953125, -0.723541259765625, -0.6721038818359375, -0.62066650390625, -0.5692291259765625, -0.517791748046875, -0.4663543701171875, -0.4149169921875, -0.3634796142578125, -0.312042236328125, -0.2606048583984375, -0.20916748046875, -0.1577301025390625, -0.106292724609375, -0.0548553466796875, -0.00341796875, 0.0480194091796875, 0.099456787109375, 0.1508941650390625, 0.20233154296875, 0.2537689208984375, 0.305206298828125, 0.3566436767578125, 0.4080810546875, 0.4595184326171875, 0.510955810546875, 0.5623931884765625, 0.61383056640625, 0.6652679443359375, 0.716705322265625, 0.7681427001953125, 0.819580078125, 0.8710174560546875, 0.922454833984375, 0.9738922119140625, 1.02532958984375, 1.0767669677734375, 1.128204345703125, 1.1796417236328125, 1.2310791015625, 1.2825164794921875, 1.333953857421875, 1.3853912353515625, 1.43682861328125, 1.4882659912109375, 1.539703369140625, 1.5911407470703125, 1.642578125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 12.0, 10.0, 15.0, 13.0, 16.0, 26.0, 21.0, 34.0, 31.0, 48.0, 46.0, 57.0, 50.0, 60.0, 52.0, 60.0, 56.0, 59.0, 39.0, 40.0, 39.0, 44.0, 28.0, 21.0, 22.0, 16.0, 16.0, 12.0, 11.0, 4.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.861387252807617, -18.211864471435547, -17.562341690063477, -16.912818908691406, -16.263296127319336, -15.613773345947266, -14.964249610900879, -14.314726829528809, -13.665204048156738, -13.015681266784668, -12.366158485412598, -11.716635704040527, -11.06711196899414, -10.41758918762207, -9.76806640625, -9.11854362487793, -8.46902084350586, -7.819498062133789, -7.169975280761719, -6.52045202255249, -5.87092924118042, -5.22140645980835, -4.571883201599121, -3.922360420227051, -3.2728376388549805, -2.62331485748291, -1.9737918376922607, -1.3242689371109009, -0.674746036529541, -0.025223255157470703, 0.6242997646331787, 1.2738227844238281, 1.9233474731445312, 2.5728702545166016, 3.222393274307251, 3.8719162940979004, 4.521439075469971, 5.170961856842041, 5.8204851150512695, 6.47000789642334, 7.11953067779541, 7.7690534591674805, 8.41857624053955, 9.068099021911621, 9.717622756958008, 10.367145538330078, 11.016668319702148, 11.666191101074219, 12.315713882446289, 12.96523666381836, 13.61475944519043, 14.2642822265625, 14.91380500793457, 15.56332778930664, 16.21285057067871, 16.86237335205078, 17.511898040771484, 18.161420822143555, 18.810943603515625, 19.460466384887695, 20.109989166259766, 20.759511947631836, 21.409034729003906, 22.05855941772461, 22.708080291748047]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 10.0, 7.0, 5.0, 6.0, 3.0, 12.0, 9.0, 4.0, 10.0, 19.0, 17.0, 16.0, 27.0, 23.0, 22.0, 24.0, 27.0, 33.0, 37.0, 39.0, 33.0, 39.0, 44.0, 40.0, 33.0, 40.0, 29.0, 31.0, 37.0, 37.0, 27.0, 36.0, 37.0, 26.0, 29.0, 18.0, 17.0, 18.0, 12.0, 5.0, 14.0, 17.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.427643775939941, -10.08294677734375, -9.738249778747559, -9.393552780151367, -9.048856735229492, -8.7041597366333, -8.35946273803711, -8.014765739440918, -7.670069217681885, -7.325372219085693, -6.98067569732666, -6.635978698730469, -6.291281700134277, -5.946585178375244, -5.601888179779053, -5.2571916580200195, -4.912494659423828, -4.567797660827637, -4.2231011390686035, -3.878404140472412, -3.5337073802948, -3.1890106201171875, -2.844313621520996, -2.499616861343384, -2.1549201011657715, -1.8102233409881592, -1.4655264616012573, -1.1208295822143555, -0.7761328220367432, -0.43143606185913086, -0.08673906326293945, 0.25795769691467285, 0.6026544570922852, 0.9473512768745422, 1.2920480966567993, 1.6367449760437012, 1.9814417362213135, 2.326138496398926, 2.670835494995117, 3.0155322551727295, 3.360229015350342, 3.704925775527954, 4.049622535705566, 4.394319534301758, 4.739016532897949, 5.083713054656982, 5.428410053253174, 5.773106575012207, 6.117803573608398, 6.46250057220459, 6.807197093963623, 7.1518940925598145, 7.496590614318848, 7.841287612915039, 8.18598461151123, 8.530681610107422, 8.875377655029297, 9.220074653625488, 9.56477165222168, 9.909467697143555, 10.254164695739746, 10.598861694335938, 10.943558692932129, 11.28825569152832, 11.632952690124512]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 8.0, 17.0, 22.0, 29.0, 54.0, 72.0, 138.0, 171.0, 280.0, 478.0, 658.0, 1117.0, 1729.0, 2736.0, 4569.0, 7500.0, 13447.0, 25143.0, 49314.0, 101181.0, 219686.0, 475639.0, 882281.0, 1043729.0, 701520.0, 346834.0, 159304.0, 74740.0, 37003.0, 19018.0, 10308.0, 5939.0, 3506.0, 2097.0, 1371.0, 869.0, 555.0, 377.0, 249.0, 164.0, 118.0, 95.0, 64.0, 47.0, 28.0, 22.0, 20.0, 11.0, 7.0, 2.0, 1.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.935791015625, -19.23095703125, -18.526123046875, -17.8212890625, -17.116455078125, -16.41162109375, -15.706787109375, -15.001953125, -14.297119140625, -13.59228515625, -12.887451171875, -12.1826171875, -11.477783203125, -10.77294921875, -10.068115234375, -9.36328125, -8.658447265625, -7.95361328125, -7.248779296875, -6.5439453125, -5.839111328125, -5.13427734375, -4.429443359375, -3.724609375, -3.019775390625, -2.31494140625, -1.610107421875, -0.9052734375, -0.200439453125, 0.50439453125, 1.209228515625, 1.9140625, 2.618896484375, 3.32373046875, 4.028564453125, 4.7333984375, 5.438232421875, 6.14306640625, 6.847900390625, 7.552734375, 8.257568359375, 8.96240234375, 9.667236328125, 10.3720703125, 11.076904296875, 11.78173828125, 12.486572265625, 13.19140625, 13.896240234375, 14.60107421875, 15.305908203125, 16.0107421875, 16.715576171875, 17.42041015625, 18.125244140625, 18.830078125, 19.534912109375, 20.23974609375, 20.944580078125, 21.6494140625, 22.354248046875, 23.05908203125, 23.763916015625, 24.46875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 10.0, 8.0, 8.0, 11.0, 12.0, 11.0, 14.0, 28.0, 20.0, 23.0, 25.0, 28.0, 30.0, 31.0, 43.0, 29.0, 37.0, 44.0, 49.0, 49.0, 35.0, 34.0, 38.0, 44.0, 42.0, 45.0, 25.0, 31.0, 36.0, 23.0, 22.0, 15.0, 18.0, 16.0, 12.0, 13.0, 8.0, 6.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.359375, -9.0513916015625, -8.743408203125, -8.4354248046875, -8.12744140625, -7.8194580078125, -7.511474609375, -7.2034912109375, -6.8955078125, -6.5875244140625, -6.279541015625, -5.9715576171875, -5.66357421875, -5.3555908203125, -5.047607421875, -4.7396240234375, -4.431640625, -4.1236572265625, -3.815673828125, -3.5076904296875, -3.19970703125, -2.8917236328125, -2.583740234375, -2.2757568359375, -1.9677734375, -1.6597900390625, -1.351806640625, -1.0438232421875, -0.73583984375, -0.4278564453125, -0.119873046875, 0.1881103515625, 0.49609375, 0.8040771484375, 1.112060546875, 1.4200439453125, 1.72802734375, 2.0360107421875, 2.343994140625, 2.6519775390625, 2.9599609375, 3.2679443359375, 3.575927734375, 3.8839111328125, 4.19189453125, 4.4998779296875, 4.807861328125, 5.1158447265625, 5.423828125, 5.7318115234375, 6.039794921875, 6.3477783203125, 6.65576171875, 6.9637451171875, 7.271728515625, 7.5797119140625, 7.8876953125, 8.1956787109375, 8.503662109375, 8.8116455078125, 9.11962890625, 9.4276123046875, 9.735595703125, 10.0435791015625, 10.3515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 12.0, 17.0, 21.0, 48.0, 45.0, 61.0, 109.0, 150.0, 251.0, 354.0, 563.0, 898.0, 1407.0, 2147.0, 3647.0, 6040.0, 9870.0, 16943.0, 29287.0, 51554.0, 92424.0, 166679.0, 297522.0, 501227.0, 728089.0, 790793.0, 611937.0, 382971.0, 218117.0, 121613.0, 67545.0, 37791.0, 21606.0, 12694.0, 7507.0, 4521.0, 2772.0, 1826.0, 1176.0, 660.0, 459.0, 307.0, 184.0, 144.0, 95.0, 68.0, 44.0, 25.0, 26.0, 18.0, 13.0, 3.0, 5.0, 1.0, 2.0, 2.0], "bins": [-21.09375, -20.458984375, -19.82421875, -19.189453125, -18.5546875, -17.919921875, -17.28515625, -16.650390625, -16.015625, -15.380859375, -14.74609375, -14.111328125, -13.4765625, -12.841796875, -12.20703125, -11.572265625, -10.9375, -10.302734375, -9.66796875, -9.033203125, -8.3984375, -7.763671875, -7.12890625, -6.494140625, -5.859375, -5.224609375, -4.58984375, -3.955078125, -3.3203125, -2.685546875, -2.05078125, -1.416015625, -0.78125, -0.146484375, 0.48828125, 1.123046875, 1.7578125, 2.392578125, 3.02734375, 3.662109375, 4.296875, 4.931640625, 5.56640625, 6.201171875, 6.8359375, 7.470703125, 8.10546875, 8.740234375, 9.375, 10.009765625, 10.64453125, 11.279296875, 11.9140625, 12.548828125, 13.18359375, 13.818359375, 14.453125, 15.087890625, 15.72265625, 16.357421875, 16.9921875, 17.626953125, 18.26171875, 18.896484375, 19.53125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 11.0, 19.0, 21.0, 29.0, 37.0, 39.0, 66.0, 75.0, 97.0, 119.0, 163.0, 215.0, 242.0, 275.0, 314.0, 314.0, 311.0, 309.0, 278.0, 243.0, 184.0, 175.0, 124.0, 106.0, 88.0, 62.0, 38.0, 32.0, 20.0, 10.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.3125, -9.05865478515625, -8.8048095703125, -8.55096435546875, -8.297119140625, -8.04327392578125, -7.7894287109375, -7.53558349609375, -7.28173828125, -7.02789306640625, -6.7740478515625, -6.52020263671875, -6.266357421875, -6.01251220703125, -5.7586669921875, -5.50482177734375, -5.2509765625, -4.99713134765625, -4.7432861328125, -4.48944091796875, -4.235595703125, -3.98175048828125, -3.7279052734375, -3.47406005859375, -3.22021484375, -2.96636962890625, -2.7125244140625, -2.45867919921875, -2.204833984375, -1.95098876953125, -1.6971435546875, -1.44329833984375, -1.189453125, -0.93560791015625, -0.6817626953125, -0.42791748046875, -0.174072265625, 0.07977294921875, 0.3336181640625, 0.58746337890625, 0.84130859375, 1.09515380859375, 1.3489990234375, 1.60284423828125, 1.856689453125, 2.11053466796875, 2.3643798828125, 2.61822509765625, 2.8720703125, 3.12591552734375, 3.3797607421875, 3.63360595703125, 3.887451171875, 4.14129638671875, 4.3951416015625, 4.64898681640625, 4.90283203125, 5.15667724609375, 5.4105224609375, 5.66436767578125, 5.918212890625, 6.17205810546875, 6.4259033203125, 6.67974853515625, 6.93359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 6.0, 14.0, 13.0, 18.0, 29.0, 24.0, 33.0, 31.0, 48.0, 54.0, 64.0, 49.0, 80.0, 69.0, 72.0, 69.0, 61.0, 52.0, 39.0, 36.0, 29.0, 15.0, 15.0, 13.0, 6.0, 10.0, 7.0, 12.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.033483505249023, -23.233503341674805, -22.433523178100586, -21.633543014526367, -20.83356285095215, -20.03358268737793, -19.233600616455078, -18.43362045288086, -17.63364028930664, -16.833660125732422, -16.033679962158203, -15.233699798583984, -14.433719635009766, -13.633739471435547, -12.833758354187012, -12.033778190612793, -11.23379898071289, -10.433818817138672, -9.633838653564453, -8.833858489990234, -8.033878326416016, -7.233897686004639, -6.433917045593262, -5.633936882019043, -4.833956718444824, -4.0339765548706055, -3.2339961528778076, -2.4340157508850098, -1.634035587310791, -0.8340554237365723, -0.03407478332519531, 0.7659053802490234, 1.5658836364746094, 2.365863800048828, 3.165844202041626, 3.965824604034424, 4.765804767608643, 5.565784931182861, 6.365765571594238, 7.165745735168457, 7.965725898742676, 8.765706062316895, 9.565686225891113, 10.365667343139648, 11.165647506713867, 11.965627670288086, 12.765607833862305, 13.565587997436523, 14.365568161010742, 15.165548324584961, 15.96552848815918, 16.7655086517334, 17.565488815307617, 18.365468978881836, 19.165451049804688, 19.965431213378906, 20.765411376953125, 21.565391540527344, 22.365371704101562, 23.16535186767578, 23.96533203125, 24.76531219482422, 25.565292358398438, 26.365272521972656, 27.165252685546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 10.0, 8.0, 9.0, 15.0, 20.0, 22.0, 26.0, 25.0, 24.0, 30.0, 27.0, 31.0, 36.0, 37.0, 39.0, 45.0, 47.0, 50.0, 41.0, 48.0, 37.0, 32.0, 35.0, 39.0, 40.0, 32.0, 30.0, 28.0, 13.0, 19.0, 19.0, 19.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.314404487609863, -13.856593132019043, -13.398782730102539, -12.940971374511719, -12.483160018920898, -12.025349617004395, -11.567538261413574, -11.10972785949707, -10.65191650390625, -10.19410514831543, -9.736294746398926, -9.278483390808105, -8.820672988891602, -8.362861633300781, -7.905050277709961, -7.447239398956299, -6.989428520202637, -6.531617641448975, -6.0738067626953125, -5.615995407104492, -5.15818452835083, -4.700373649597168, -4.242562294006348, -3.7847514152526855, -3.3269405364990234, -2.8691296577453613, -2.41131854057312, -1.9535075426101685, -1.4956965446472168, -1.0378856658935547, -0.5800745487213135, -0.12226343154907227, 0.33554840087890625, 0.7933593988418579, 1.2511703968048096, 1.7089813947677612, 2.166792392730713, 2.624603271484375, 3.082414388656616, 3.5402255058288574, 3.9980363845825195, 4.455847263336182, 4.913658142089844, 5.371469497680664, 5.829280376434326, 6.287091255187988, 6.744902610778809, 7.202713489532471, 7.660524368286133, 8.118335723876953, 8.576146125793457, 9.033957481384277, 9.491767883300781, 9.949579238891602, 10.407390594482422, 10.865201950073242, 11.323012351989746, 11.780823707580566, 12.23863410949707, 12.69644546508789, 13.154256820678711, 13.612067222595215, 14.069878578186035, 14.527688980102539, 14.98550033569336]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 17.0, 12.0, 24.0, 33.0, 59.0, 71.0, 119.0, 187.0, 269.0, 383.0, 587.0, 929.0, 1441.0, 2291.0, 3521.0, 5814.0, 9684.0, 15611.0, 26221.0, 42874.0, 68183.0, 102067.0, 138034.0, 158214.0, 148092.0, 114778.0, 79270.0, 50507.0, 30747.0, 18664.0, 11373.0, 6786.0, 4245.0, 2665.0, 1654.0, 1062.0, 649.0, 444.0, 327.0, 212.0, 131.0, 93.0, 53.0, 46.0, 42.0, 17.0, 14.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.25, -10.894775390625, -10.53955078125, -10.184326171875, -9.8291015625, -9.473876953125, -9.11865234375, -8.763427734375, -8.408203125, -8.052978515625, -7.69775390625, -7.342529296875, -6.9873046875, -6.632080078125, -6.27685546875, -5.921630859375, -5.56640625, -5.211181640625, -4.85595703125, -4.500732421875, -4.1455078125, -3.790283203125, -3.43505859375, -3.079833984375, -2.724609375, -2.369384765625, -2.01416015625, -1.658935546875, -1.3037109375, -0.948486328125, -0.59326171875, -0.238037109375, 0.1171875, 0.472412109375, 0.82763671875, 1.182861328125, 1.5380859375, 1.893310546875, 2.24853515625, 2.603759765625, 2.958984375, 3.314208984375, 3.66943359375, 4.024658203125, 4.3798828125, 4.735107421875, 5.09033203125, 5.445556640625, 5.80078125, 6.156005859375, 6.51123046875, 6.866455078125, 7.2216796875, 7.576904296875, 7.93212890625, 8.287353515625, 8.642578125, 8.997802734375, 9.35302734375, 9.708251953125, 10.0634765625, 10.418701171875, 10.77392578125, 11.129150390625, 11.484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 7.0, 9.0, 4.0, 10.0, 19.0, 14.0, 14.0, 26.0, 24.0, 26.0, 35.0, 32.0, 45.0, 34.0, 36.0, 35.0, 52.0, 40.0, 51.0, 44.0, 44.0, 34.0, 34.0, 40.0, 32.0, 31.0, 30.0, 32.0, 29.0, 19.0, 24.0, 14.0, 13.0, 12.0, 10.0, 12.0, 5.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.75, -15.252197265625, -14.75439453125, -14.256591796875, -13.7587890625, -13.260986328125, -12.76318359375, -12.265380859375, -11.767578125, -11.269775390625, -10.77197265625, -10.274169921875, -9.7763671875, -9.278564453125, -8.78076171875, -8.282958984375, -7.78515625, -7.287353515625, -6.78955078125, -6.291748046875, -5.7939453125, -5.296142578125, -4.79833984375, -4.300537109375, -3.802734375, -3.304931640625, -2.80712890625, -2.309326171875, -1.8115234375, -1.313720703125, -0.81591796875, -0.318115234375, 0.1796875, 0.677490234375, 1.17529296875, 1.673095703125, 2.1708984375, 2.668701171875, 3.16650390625, 3.664306640625, 4.162109375, 4.659912109375, 5.15771484375, 5.655517578125, 6.1533203125, 6.651123046875, 7.14892578125, 7.646728515625, 8.14453125, 8.642333984375, 9.14013671875, 9.637939453125, 10.1357421875, 10.633544921875, 11.13134765625, 11.629150390625, 12.126953125, 12.624755859375, 13.12255859375, 13.620361328125, 14.1181640625, 14.615966796875, 15.11376953125, 15.611572265625, 16.109375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 15.0, 13.0, 25.0, 38.0, 55.0, 105.0, 151.0, 265.0, 424.0, 735.0, 1323.0, 2383.0, 4437.0, 9008.0, 18910.0, 41919.0, 95740.0, 200285.0, 288946.0, 203566.0, 97799.0, 43096.0, 19712.0, 9283.0, 4698.0, 2367.0, 1321.0, 751.0, 478.0, 256.0, 159.0, 105.0, 55.0, 37.0, 26.0, 27.0, 12.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.734375, -22.03515625, -21.3359375, -20.63671875, -19.9375, -19.23828125, -18.5390625, -17.83984375, -17.140625, -16.44140625, -15.7421875, -15.04296875, -14.34375, -13.64453125, -12.9453125, -12.24609375, -11.546875, -10.84765625, -10.1484375, -9.44921875, -8.75, -8.05078125, -7.3515625, -6.65234375, -5.953125, -5.25390625, -4.5546875, -3.85546875, -3.15625, -2.45703125, -1.7578125, -1.05859375, -0.359375, 0.33984375, 1.0390625, 1.73828125, 2.4375, 3.13671875, 3.8359375, 4.53515625, 5.234375, 5.93359375, 6.6328125, 7.33203125, 8.03125, 8.73046875, 9.4296875, 10.12890625, 10.828125, 11.52734375, 12.2265625, 12.92578125, 13.625, 14.32421875, 15.0234375, 15.72265625, 16.421875, 17.12109375, 17.8203125, 18.51953125, 19.21875, 19.91796875, 20.6171875, 21.31640625, 22.015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 6.0, 17.0, 14.0, 19.0, 18.0, 19.0, 24.0, 21.0, 23.0, 29.0, 36.0, 35.0, 48.0, 36.0, 42.0, 36.0, 38.0, 38.0, 39.0, 42.0, 43.0, 37.0, 41.0, 36.0, 30.0, 29.0, 22.0, 20.0, 14.0, 18.0, 21.0, 22.0, 8.0, 12.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.63134765625, -6.3564453125, -6.08154296875, -5.806640625, -5.53173828125, -5.2568359375, -4.98193359375, -4.70703125, -4.43212890625, -4.1572265625, -3.88232421875, -3.607421875, -3.33251953125, -3.0576171875, -2.78271484375, -2.5078125, -2.23291015625, -1.9580078125, -1.68310546875, -1.408203125, -1.13330078125, -0.8583984375, -0.58349609375, -0.30859375, -0.03369140625, 0.2412109375, 0.51611328125, 0.791015625, 1.06591796875, 1.3408203125, 1.61572265625, 1.890625, 2.16552734375, 2.4404296875, 2.71533203125, 2.990234375, 3.26513671875, 3.5400390625, 3.81494140625, 4.08984375, 4.36474609375, 4.6396484375, 4.91455078125, 5.189453125, 5.46435546875, 5.7392578125, 6.01416015625, 6.2890625, 6.56396484375, 6.8388671875, 7.11376953125, 7.388671875, 7.66357421875, 7.9384765625, 8.21337890625, 8.48828125, 8.76318359375, 9.0380859375, 9.31298828125, 9.587890625, 9.86279296875, 10.1376953125, 10.41259765625, 10.6875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 11.0, 20.0, 17.0, 26.0, 46.0, 57.0, 81.0, 94.0, 179.0, 249.0, 412.0, 590.0, 969.0, 1542.0, 2621.0, 4288.0, 7244.0, 12904.0, 23481.0, 43300.0, 80662.0, 145764.0, 222260.0, 210114.0, 131359.0, 72307.0, 38517.0, 20865.0, 11636.0, 6619.0, 3966.0, 2421.0, 1444.0, 831.0, 525.0, 366.0, 263.0, 155.0, 123.0, 63.0, 54.0, 23.0, 25.0, 14.0, 9.0, 13.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.890625, -9.6072998046875, -9.323974609375, -9.0406494140625, -8.75732421875, -8.4739990234375, -8.190673828125, -7.9073486328125, -7.6240234375, -7.3406982421875, -7.057373046875, -6.7740478515625, -6.49072265625, -6.2073974609375, -5.924072265625, -5.6407470703125, -5.357421875, -5.0740966796875, -4.790771484375, -4.5074462890625, -4.22412109375, -3.9407958984375, -3.657470703125, -3.3741455078125, -3.0908203125, -2.8074951171875, -2.524169921875, -2.2408447265625, -1.95751953125, -1.6741943359375, -1.390869140625, -1.1075439453125, -0.82421875, -0.5408935546875, -0.257568359375, 0.0257568359375, 0.30908203125, 0.5924072265625, 0.875732421875, 1.1590576171875, 1.4423828125, 1.7257080078125, 2.009033203125, 2.2923583984375, 2.57568359375, 2.8590087890625, 3.142333984375, 3.4256591796875, 3.708984375, 3.9923095703125, 4.275634765625, 4.5589599609375, 4.84228515625, 5.1256103515625, 5.408935546875, 5.6922607421875, 5.9755859375, 6.2589111328125, 6.542236328125, 6.8255615234375, 7.10888671875, 7.3922119140625, 7.675537109375, 7.9588623046875, 8.2421875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 12.0, 28.0, 31.0, 43.0, 54.0, 73.0, 69.0, 91.0, 73.0, 108.0, 74.0, 82.0, 53.0, 43.0, 34.0, 34.0, 17.0, 10.0, 11.0, 7.0, 8.0, 5.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006556510925292969, -0.0006361603736877441, -0.0006166696548461914, -0.0005971789360046387, -0.0005776882171630859, -0.0005581974983215332, -0.0005387067794799805, -0.0005192160606384277, -0.000499725341796875, -0.00048023462295532227, -0.00046074390411376953, -0.0004412531852722168, -0.00042176246643066406, -0.00040227174758911133, -0.0003827810287475586, -0.00036329030990600586, -0.0003437995910644531, -0.0003243088722229004, -0.00030481815338134766, -0.0002853274345397949, -0.0002658367156982422, -0.00024634599685668945, -0.00022685527801513672, -0.00020736455917358398, -0.00018787384033203125, -0.00016838312149047852, -0.00014889240264892578, -0.00012940168380737305, -0.00010991096496582031, -9.042024612426758e-05, -7.092952728271484e-05, -5.143880844116211e-05, -3.1948089599609375e-05, -1.245737075805664e-05, 7.033348083496094e-06, 2.6524066925048828e-05, 4.601478576660156e-05, 6.55055046081543e-05, 8.499622344970703e-05, 0.00010448694229125977, 0.0001239776611328125, 0.00014346837997436523, 0.00016295909881591797, 0.0001824498176574707, 0.00020194053649902344, 0.00022143125534057617, 0.0002409219741821289, 0.00026041269302368164, 0.0002799034118652344, 0.0002993941307067871, 0.00031888484954833984, 0.0003383755683898926, 0.0003578662872314453, 0.00037735700607299805, 0.0003968477249145508, 0.0004163384437561035, 0.00043582916259765625, 0.000455319881439209, 0.0004748106002807617, 0.0004943013191223145, 0.0005137920379638672, 0.0005332827568054199, 0.0005527734756469727, 0.0005722641944885254, 0.0005917549133300781]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 11.0, 15.0, 25.0, 28.0, 44.0, 67.0, 99.0, 141.0, 240.0, 279.0, 519.0, 747.0, 1142.0, 1747.0, 2606.0, 4151.0, 6194.0, 9608.0, 14765.0, 22736.0, 35416.0, 52876.0, 77548.0, 106870.0, 131283.0, 140603.0, 127000.0, 100057.0, 71941.0, 48654.0, 32040.0, 20709.0, 13321.0, 8531.0, 5666.0, 3667.0, 2419.0, 1620.0, 1103.0, 667.0, 488.0, 279.0, 230.0, 140.0, 87.0, 75.0, 37.0, 20.0, 9.0, 11.0, 14.0, 2.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0], "bins": [-6.33203125, -6.13031005859375, -5.9285888671875, -5.72686767578125, -5.525146484375, -5.32342529296875, -5.1217041015625, -4.91998291015625, -4.71826171875, -4.51654052734375, -4.3148193359375, -4.11309814453125, -3.911376953125, -3.70965576171875, -3.5079345703125, -3.30621337890625, -3.1044921875, -2.90277099609375, -2.7010498046875, -2.49932861328125, -2.297607421875, -2.09588623046875, -1.8941650390625, -1.69244384765625, -1.49072265625, -1.28900146484375, -1.0872802734375, -0.88555908203125, -0.683837890625, -0.48211669921875, -0.2803955078125, -0.07867431640625, 0.123046875, 0.32476806640625, 0.5264892578125, 0.72821044921875, 0.929931640625, 1.13165283203125, 1.3333740234375, 1.53509521484375, 1.73681640625, 1.93853759765625, 2.1402587890625, 2.34197998046875, 2.543701171875, 2.74542236328125, 2.9471435546875, 3.14886474609375, 3.3505859375, 3.55230712890625, 3.7540283203125, 3.95574951171875, 4.157470703125, 4.35919189453125, 4.5609130859375, 4.76263427734375, 4.96435546875, 5.16607666015625, 5.3677978515625, 5.56951904296875, 5.771240234375, 5.97296142578125, 6.1746826171875, 6.37640380859375, 6.578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 10.0, 5.0, 5.0, 8.0, 10.0, 7.0, 13.0, 10.0, 22.0, 15.0, 20.0, 19.0, 21.0, 28.0, 37.0, 39.0, 39.0, 45.0, 43.0, 45.0, 37.0, 53.0, 55.0, 47.0, 41.0, 40.0, 36.0, 33.0, 37.0, 26.0, 24.0, 19.0, 19.0, 19.0, 17.0, 12.0, 10.0, 3.0, 7.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.8759765625, -1.8157958984375, -1.755615234375, -1.6954345703125, -1.63525390625, -1.5750732421875, -1.514892578125, -1.4547119140625, -1.39453125, -1.3343505859375, -1.274169921875, -1.2139892578125, -1.15380859375, -1.0936279296875, -1.033447265625, -0.9732666015625, -0.9130859375, -0.8529052734375, -0.792724609375, -0.7325439453125, -0.67236328125, -0.6121826171875, -0.552001953125, -0.4918212890625, -0.431640625, -0.3714599609375, -0.311279296875, -0.2510986328125, -0.19091796875, -0.1307373046875, -0.070556640625, -0.0103759765625, 0.0498046875, 0.1099853515625, 0.170166015625, 0.2303466796875, 0.29052734375, 0.3507080078125, 0.410888671875, 0.4710693359375, 0.53125, 0.5914306640625, 0.651611328125, 0.7117919921875, 0.77197265625, 0.8321533203125, 0.892333984375, 0.9525146484375, 1.0126953125, 1.0728759765625, 1.133056640625, 1.1932373046875, 1.25341796875, 1.3135986328125, 1.373779296875, 1.4339599609375, 1.494140625, 1.5543212890625, 1.614501953125, 1.6746826171875, 1.73486328125, 1.7950439453125, 1.855224609375, 1.9154052734375, 1.9755859375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 12.0, 22.0, 22.0, 24.0, 29.0, 27.0, 35.0, 37.0, 58.0, 65.0, 53.0, 77.0, 76.0, 69.0, 66.0, 58.0, 43.0, 43.0, 37.0, 25.0, 20.0, 16.0, 10.0, 6.0, 7.0, 9.0, 13.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.444873809814453, -22.66288185119629, -21.880887985229492, -21.098896026611328, -20.31690216064453, -19.534910202026367, -18.752918243408203, -17.970924377441406, -17.188932418823242, -16.406940460205078, -15.624946594238281, -14.842954635620117, -14.060961723327637, -13.278968811035156, -12.496976852416992, -11.714983940124512, -10.932991027832031, -10.15099811553955, -9.36900520324707, -8.587013244628906, -7.805020332336426, -7.023027420043945, -6.241034984588623, -5.459042549133301, -4.67704963684082, -3.895056962966919, -3.1130642890930176, -2.331071615219116, -1.5490789413452148, -0.7670862674713135, 0.01490640640258789, 0.7968988418579102, 1.5788917541503906, 2.360884428024292, 3.1428771018981934, 3.9248697757720947, 4.706862449645996, 5.488855361938477, 6.270847797393799, 7.052840232849121, 7.834833145141602, 8.616826057434082, 9.398818969726562, 10.180810928344727, 10.962803840637207, 11.744796752929688, 12.526788711547852, 13.308781623840332, 14.090774536132812, 14.872767448425293, 15.654760360717773, 16.436752319335938, 17.218746185302734, 18.0007381439209, 18.782730102539062, 19.56472396850586, 20.346715927124023, 21.128707885742188, 21.910701751708984, 22.69269371032715, 23.474685668945312, 24.25667953491211, 25.038671493530273, 25.820663452148438, 26.602657318115234]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 5.0, 7.0, 6.0, 12.0, 18.0, 12.0, 16.0, 27.0, 26.0, 27.0, 20.0, 23.0, 26.0, 35.0, 33.0, 47.0, 35.0, 39.0, 56.0, 41.0, 48.0, 39.0, 43.0, 33.0, 32.0, 37.0, 39.0, 28.0, 32.0, 24.0, 23.0, 19.0, 15.0, 17.0, 5.0, 13.0, 6.0, 6.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.84384536743164, -13.400592803955078, -12.957340240478516, -12.514087677001953, -12.07083511352539, -11.627582550048828, -11.184329986572266, -10.741076469421387, -10.297823905944824, -9.854571342468262, -9.4113187789917, -8.968066215515137, -8.524813652038574, -8.081560134887695, -7.638308048248291, -7.19505500793457, -6.751802921295166, -6.3085503578186035, -5.865297794342041, -5.42204475402832, -4.978792190551758, -4.535539627075195, -4.092287063598633, -3.649034261703491, -3.2057816982269287, -2.762529134750366, -2.3192763328552246, -1.876023769378662, -1.43277108669281, -0.989518404006958, -0.5462658405303955, -0.1030130386352539, 0.3402395248413086, 0.7834922075271606, 1.2267448902130127, 1.6699974536895752, 2.113250255584717, 2.5565028190612793, 2.999755382537842, 3.4430081844329834, 3.886260747909546, 4.3295135498046875, 4.77276611328125, 5.2160186767578125, 5.659271240234375, 6.1025238037109375, 6.5457763671875, 6.989029407501221, 7.432281970977783, 7.875534534454346, 8.318787574768066, 8.762040138244629, 9.205292701721191, 9.648545265197754, 10.091797828674316, 10.535050392150879, 10.978302955627441, 11.421555519104004, 11.864808082580566, 12.308060646057129, 12.751313209533691, 13.19456672668457, 13.637819290161133, 14.081071853637695, 14.524324417114258]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 14.0, 16.0, 26.0, 31.0, 59.0, 67.0, 127.0, 176.0, 309.0, 445.0, 717.0, 1136.0, 1675.0, 2701.0, 4162.0, 6395.0, 9588.0, 14736.0, 22470.0, 32949.0, 47720.0, 65845.0, 86206.0, 104971.0, 117713.0, 117800.0, 107628.0, 88046.0, 66700.0, 48415.0, 33718.0, 22594.0, 15037.0, 9936.0, 6496.0, 4184.0, 2790.0, 1756.0, 1146.0, 732.0, 459.0, 311.0, 189.0, 145.0, 80.0, 47.0, 30.0, 19.0, 23.0, 6.0, 8.0, 5.0, 5.0, 1.0, 2.0, 5.0], "bins": [-12.15625, -11.7882080078125, -11.420166015625, -11.0521240234375, -10.68408203125, -10.3160400390625, -9.947998046875, -9.5799560546875, -9.2119140625, -8.8438720703125, -8.475830078125, -8.1077880859375, -7.73974609375, -7.3717041015625, -7.003662109375, -6.6356201171875, -6.267578125, -5.8995361328125, -5.531494140625, -5.1634521484375, -4.79541015625, -4.4273681640625, -4.059326171875, -3.6912841796875, -3.3232421875, -2.9552001953125, -2.587158203125, -2.2191162109375, -1.85107421875, -1.4830322265625, -1.114990234375, -0.7469482421875, -0.37890625, -0.0108642578125, 0.357177734375, 0.7252197265625, 1.09326171875, 1.4613037109375, 1.829345703125, 2.1973876953125, 2.5654296875, 2.9334716796875, 3.301513671875, 3.6695556640625, 4.03759765625, 4.4056396484375, 4.773681640625, 5.1417236328125, 5.509765625, 5.8778076171875, 6.245849609375, 6.6138916015625, 6.98193359375, 7.3499755859375, 7.718017578125, 8.0860595703125, 8.4541015625, 8.8221435546875, 9.190185546875, 9.5582275390625, 9.92626953125, 10.2943115234375, 10.662353515625, 11.0303955078125, 11.3984375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 16.0, 24.0, 18.0, 19.0, 23.0, 19.0, 33.0, 25.0, 34.0, 36.0, 34.0, 39.0, 38.0, 47.0, 47.0, 46.0, 53.0, 38.0, 39.0, 43.0, 34.0, 27.0, 36.0, 26.0, 22.0, 17.0, 23.0, 15.0, 16.0, 17.0, 9.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5234375, -15.05126953125, -14.5791015625, -14.10693359375, -13.634765625, -13.16259765625, -12.6904296875, -12.21826171875, -11.74609375, -11.27392578125, -10.8017578125, -10.32958984375, -9.857421875, -9.38525390625, -8.9130859375, -8.44091796875, -7.96875, -7.49658203125, -7.0244140625, -6.55224609375, -6.080078125, -5.60791015625, -5.1357421875, -4.66357421875, -4.19140625, -3.71923828125, -3.2470703125, -2.77490234375, -2.302734375, -1.83056640625, -1.3583984375, -0.88623046875, -0.4140625, 0.05810546875, 0.5302734375, 1.00244140625, 1.474609375, 1.94677734375, 2.4189453125, 2.89111328125, 3.36328125, 3.83544921875, 4.3076171875, 4.77978515625, 5.251953125, 5.72412109375, 6.1962890625, 6.66845703125, 7.140625, 7.61279296875, 8.0849609375, 8.55712890625, 9.029296875, 9.50146484375, 9.9736328125, 10.44580078125, 10.91796875, 11.39013671875, 11.8623046875, 12.33447265625, 12.806640625, 13.27880859375, 13.7509765625, 14.22314453125, 14.6953125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 19.0, 22.0, 35.0, 61.0, 81.0, 124.0, 198.0, 300.0, 494.0, 703.0, 1114.0, 1685.0, 2505.0, 3761.0, 5699.0, 8317.0, 12193.0, 17883.0, 25515.0, 35981.0, 49046.0, 64995.0, 80572.0, 95684.0, 104528.0, 105260.0, 97678.0, 84531.0, 68415.0, 52534.0, 39218.0, 28306.0, 19448.0, 13628.0, 9284.0, 6439.0, 4226.0, 2773.0, 1820.0, 1221.0, 785.0, 505.0, 339.0, 243.0, 136.0, 90.0, 67.0, 30.0, 20.0, 22.0, 12.0, 7.0, 3.0, 0.0, 3.0], "bins": [-11.15625, -10.829345703125, -10.50244140625, -10.175537109375, -9.8486328125, -9.521728515625, -9.19482421875, -8.867919921875, -8.541015625, -8.214111328125, -7.88720703125, -7.560302734375, -7.2333984375, -6.906494140625, -6.57958984375, -6.252685546875, -5.92578125, -5.598876953125, -5.27197265625, -4.945068359375, -4.6181640625, -4.291259765625, -3.96435546875, -3.637451171875, -3.310546875, -2.983642578125, -2.65673828125, -2.329833984375, -2.0029296875, -1.676025390625, -1.34912109375, -1.022216796875, -0.6953125, -0.368408203125, -0.04150390625, 0.285400390625, 0.6123046875, 0.939208984375, 1.26611328125, 1.593017578125, 1.919921875, 2.246826171875, 2.57373046875, 2.900634765625, 3.2275390625, 3.554443359375, 3.88134765625, 4.208251953125, 4.53515625, 4.862060546875, 5.18896484375, 5.515869140625, 5.8427734375, 6.169677734375, 6.49658203125, 6.823486328125, 7.150390625, 7.477294921875, 7.80419921875, 8.131103515625, 8.4580078125, 8.784912109375, 9.11181640625, 9.438720703125, 9.765625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 4.0, 7.0, 14.0, 6.0, 9.0, 8.0, 11.0, 8.0, 7.0, 22.0, 19.0, 31.0, 26.0, 41.0, 44.0, 30.0, 27.0, 47.0, 33.0, 39.0, 43.0, 44.0, 50.0, 39.0, 42.0, 44.0, 35.0, 27.0, 27.0, 29.0, 27.0, 24.0, 14.0, 27.0, 12.0, 17.0, 14.0, 6.0, 8.0, 6.0, 6.0, 3.0, 5.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.4036865234375, -8.135498046875, -7.8673095703125, -7.59912109375, -7.3309326171875, -7.062744140625, -6.7945556640625, -6.5263671875, -6.2581787109375, -5.989990234375, -5.7218017578125, -5.45361328125, -5.1854248046875, -4.917236328125, -4.6490478515625, -4.380859375, -4.1126708984375, -3.844482421875, -3.5762939453125, -3.30810546875, -3.0399169921875, -2.771728515625, -2.5035400390625, -2.2353515625, -1.9671630859375, -1.698974609375, -1.4307861328125, -1.16259765625, -0.8944091796875, -0.626220703125, -0.3580322265625, -0.08984375, 0.1783447265625, 0.446533203125, 0.7147216796875, 0.98291015625, 1.2510986328125, 1.519287109375, 1.7874755859375, 2.0556640625, 2.3238525390625, 2.592041015625, 2.8602294921875, 3.12841796875, 3.3966064453125, 3.664794921875, 3.9329833984375, 4.201171875, 4.4693603515625, 4.737548828125, 5.0057373046875, 5.27392578125, 5.5421142578125, 5.810302734375, 6.0784912109375, 6.3466796875, 6.6148681640625, 6.883056640625, 7.1512451171875, 7.41943359375, 7.6876220703125, 7.955810546875, 8.2239990234375, 8.4921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 11.0, 15.0, 22.0, 30.0, 53.0, 82.0, 126.0, 179.0, 314.0, 441.0, 688.0, 1129.0, 1835.0, 2945.0, 4536.0, 7319.0, 12100.0, 19082.0, 29466.0, 44700.0, 65070.0, 89578.0, 113554.0, 129324.0, 129194.0, 113988.0, 90598.0, 65726.0, 45113.0, 29640.0, 19273.0, 12210.0, 7489.0, 4840.0, 2832.0, 1884.0, 1137.0, 779.0, 407.0, 285.0, 205.0, 121.0, 76.0, 65.0, 29.0, 18.0, 19.0, 15.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-5.53125, -5.36370849609375, -5.1961669921875, -5.02862548828125, -4.861083984375, -4.69354248046875, -4.5260009765625, -4.35845947265625, -4.19091796875, -4.02337646484375, -3.8558349609375, -3.68829345703125, -3.520751953125, -3.35321044921875, -3.1856689453125, -3.01812744140625, -2.8505859375, -2.68304443359375, -2.5155029296875, -2.34796142578125, -2.180419921875, -2.01287841796875, -1.8453369140625, -1.67779541015625, -1.51025390625, -1.34271240234375, -1.1751708984375, -1.00762939453125, -0.840087890625, -0.67254638671875, -0.5050048828125, -0.33746337890625, -0.169921875, -0.00238037109375, 0.1651611328125, 0.33270263671875, 0.500244140625, 0.66778564453125, 0.8353271484375, 1.00286865234375, 1.17041015625, 1.33795166015625, 1.5054931640625, 1.67303466796875, 1.840576171875, 2.00811767578125, 2.1756591796875, 2.34320068359375, 2.5107421875, 2.67828369140625, 2.8458251953125, 3.01336669921875, 3.180908203125, 3.34844970703125, 3.5159912109375, 3.68353271484375, 3.85107421875, 4.01861572265625, 4.1861572265625, 4.35369873046875, 4.521240234375, 4.68878173828125, 4.8563232421875, 5.02386474609375, 5.19140625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 6.0, 2.0, 9.0, 16.0, 15.0, 18.0, 29.0, 21.0, 38.0, 38.0, 37.0, 50.0, 58.0, 71.0, 53.0, 60.0, 60.0, 42.0, 60.0, 50.0, 47.0, 34.0, 28.0, 24.0, 29.0, 21.0, 19.0, 17.0, 10.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006580352783203125, -0.0006364732980728149, -0.0006149113178253174, -0.0005933493375778198, -0.0005717873573303223, -0.0005502253770828247, -0.0005286633968353271, -0.0005071014165878296, -0.00048553943634033203, -0.00046397745609283447, -0.0004424154758453369, -0.00042085349559783936, -0.0003992915153503418, -0.00037772953510284424, -0.0003561675548553467, -0.0003346055746078491, -0.00031304359436035156, -0.000291481614112854, -0.00026991963386535645, -0.0002483576536178589, -0.00022679567337036133, -0.00020523369312286377, -0.0001836717128753662, -0.00016210973262786865, -0.0001405477523803711, -0.00011898577213287354, -9.742379188537598e-05, -7.586181163787842e-05, -5.429983139038086e-05, -3.27378511428833e-05, -1.1175870895385742e-05, 1.0386109352111816e-05, 3.1948089599609375e-05, 5.3510069847106934e-05, 7.507205009460449e-05, 9.663403034210205e-05, 0.00011819601058959961, 0.00013975799083709717, 0.00016131997108459473, 0.00018288195133209229, 0.00020444393157958984, 0.0002260059118270874, 0.00024756789207458496, 0.0002691298723220825, 0.0002906918525695801, 0.00031225383281707764, 0.0003338158130645752, 0.00035537779331207275, 0.0003769397735595703, 0.00039850175380706787, 0.00042006373405456543, 0.000441625714302063, 0.00046318769454956055, 0.0004847496747970581, 0.0005063116550445557, 0.0005278736352920532, 0.0005494356155395508, 0.0005709975957870483, 0.0005925595760345459, 0.0006141215562820435, 0.000635683536529541, 0.0006572455167770386, 0.0006788074970245361, 0.0007003694772720337, 0.0007219314575195312]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 19.0, 23.0, 45.0, 55.0, 97.0, 148.0, 214.0, 332.0, 515.0, 714.0, 1118.0, 1682.0, 2484.0, 3790.0, 5733.0, 8552.0, 12787.0, 18554.0, 27741.0, 39744.0, 55165.0, 73760.0, 92397.0, 107478.0, 114636.0, 110094.0, 96329.0, 77932.0, 59380.0, 43470.0, 30150.0, 20857.0, 14030.0, 9417.0, 6390.0, 4235.0, 2751.0, 1888.0, 1270.0, 905.0, 550.0, 366.0, 258.0, 183.0, 91.0, 91.0, 46.0, 18.0, 23.0, 12.0, 9.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.42108154296875, -4.2718505859375, -4.12261962890625, -3.973388671875, -3.82415771484375, -3.6749267578125, -3.52569580078125, -3.37646484375, -3.22723388671875, -3.0780029296875, -2.92877197265625, -2.779541015625, -2.63031005859375, -2.4810791015625, -2.33184814453125, -2.1826171875, -2.03338623046875, -1.8841552734375, -1.73492431640625, -1.585693359375, -1.43646240234375, -1.2872314453125, -1.13800048828125, -0.98876953125, -0.83953857421875, -0.6903076171875, -0.54107666015625, -0.391845703125, -0.24261474609375, -0.0933837890625, 0.05584716796875, 0.205078125, 0.35430908203125, 0.5035400390625, 0.65277099609375, 0.802001953125, 0.95123291015625, 1.1004638671875, 1.24969482421875, 1.39892578125, 1.54815673828125, 1.6973876953125, 1.84661865234375, 1.995849609375, 2.14508056640625, 2.2943115234375, 2.44354248046875, 2.5927734375, 2.74200439453125, 2.8912353515625, 3.04046630859375, 3.189697265625, 3.33892822265625, 3.4881591796875, 3.63739013671875, 3.78662109375, 3.93585205078125, 4.0850830078125, 4.23431396484375, 4.383544921875, 4.53277587890625, 4.6820068359375, 4.83123779296875, 4.98046875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 7.0, 8.0, 8.0, 7.0, 12.0, 11.0, 17.0, 19.0, 22.0, 21.0, 34.0, 29.0, 39.0, 26.0, 42.0, 39.0, 41.0, 38.0, 39.0, 56.0, 49.0, 48.0, 38.0, 32.0, 32.0, 31.0, 42.0, 38.0, 32.0, 22.0, 16.0, 16.0, 12.0, 13.0, 12.0, 13.0, 5.0, 5.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9201507568359375, -1.860809326171875, -1.8014678955078125, -1.74212646484375, -1.6827850341796875, -1.623443603515625, -1.5641021728515625, -1.5047607421875, -1.4454193115234375, -1.386077880859375, -1.3267364501953125, -1.26739501953125, -1.2080535888671875, -1.148712158203125, -1.0893707275390625, -1.030029296875, -0.9706878662109375, -0.911346435546875, -0.8520050048828125, -0.79266357421875, -0.7333221435546875, -0.673980712890625, -0.6146392822265625, -0.5552978515625, -0.4959564208984375, -0.436614990234375, -0.3772735595703125, -0.31793212890625, -0.2585906982421875, -0.199249267578125, -0.1399078369140625, -0.08056640625, -0.0212249755859375, 0.038116455078125, 0.0974578857421875, 0.15679931640625, 0.2161407470703125, 0.275482177734375, 0.3348236083984375, 0.3941650390625, 0.4535064697265625, 0.512847900390625, 0.5721893310546875, 0.63153076171875, 0.6908721923828125, 0.750213623046875, 0.8095550537109375, 0.868896484375, 0.9282379150390625, 0.987579345703125, 1.0469207763671875, 1.10626220703125, 1.1656036376953125, 1.224945068359375, 1.2842864990234375, 1.3436279296875, 1.4029693603515625, 1.462310791015625, 1.5216522216796875, 1.58099365234375, 1.6403350830078125, 1.699676513671875, 1.7590179443359375, 1.818359375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 5.0, 15.0, 5.0, 13.0, 11.0, 23.0, 28.0, 31.0, 46.0, 49.0, 51.0, 60.0, 54.0, 61.0, 77.0, 66.0, 69.0, 58.0, 49.0, 42.0, 34.0, 16.0, 26.0, 16.0, 18.0, 11.0, 8.0, 7.0, 11.0, 3.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.74799919128418, -22.989160537719727, -22.230321884155273, -21.471485137939453, -20.712646484375, -19.953807830810547, -19.194969177246094, -18.43613052368164, -17.677291870117188, -16.918453216552734, -16.15961456298828, -15.400776863098145, -14.641939163208008, -13.883100509643555, -13.124261856079102, -12.365423202514648, -11.606586456298828, -10.847747802734375, -10.088910102844238, -9.330071449279785, -8.571233749389648, -7.812395095825195, -7.053556442260742, -6.294718265533447, -5.535880088806152, -4.777041912078857, -4.0182037353515625, -3.2593650817871094, -2.5005269050598145, -1.7416887283325195, -0.9828500747680664, -0.22401189804077148, 0.5348281860351562, 1.2936664819717407, 2.052504777908325, 2.811343193054199, 3.570181369781494, 4.329019546508789, 5.087858200073242, 5.846696376800537, 6.605534553527832, 7.364372730255127, 8.123210906982422, 8.882049560546875, 9.640888214111328, 10.399725914001465, 11.158564567565918, 11.917402267456055, 12.676240921020508, 13.435079574584961, 14.193917274475098, 14.95275592803955, 15.711593627929688, 16.47043228149414, 17.229270935058594, 17.988109588623047, 18.7469482421875, 19.505786895751953, 20.264625549316406, 21.02346420288086, 21.78230094909668, 22.541139602661133, 23.299978256225586, 24.05881690979004, 24.81765365600586]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 6.0, 4.0, 9.0, 10.0, 13.0, 19.0, 16.0, 24.0, 26.0, 26.0, 35.0, 37.0, 44.0, 44.0, 45.0, 43.0, 42.0, 49.0, 47.0, 41.0, 48.0, 47.0, 37.0, 35.0, 40.0, 31.0, 37.0, 26.0, 20.0, 18.0, 11.0, 13.0, 18.0, 6.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.983983993530273, -15.481595993041992, -14.979207992553711, -14.47681999206543, -13.974432945251465, -13.472044944763184, -12.969656944274902, -12.467268943786621, -11.964881896972656, -11.462493896484375, -10.960105895996094, -10.457717895507812, -9.955330848693848, -9.452942848205566, -8.950554847717285, -8.448166847229004, -7.945778846740723, -7.443390846252441, -6.941003322601318, -6.438615322113037, -5.936227798461914, -5.433839797973633, -4.931451797485352, -4.42906379699707, -3.9266762733459473, -3.424288511276245, -2.921900749206543, -2.4195127487182617, -1.9171249866485596, -1.4147372245788574, -0.9123492240905762, -0.409961462020874, 0.09242630004882812, 0.594814121723175, 1.097201943397522, 1.5995898246765137, 2.101977586746216, 2.604365348815918, 3.106753349304199, 3.6091411113739014, 4.1115288734436035, 4.613916873931885, 5.116304397583008, 5.618692398071289, 6.12108039855957, 6.623467922210693, 7.125855922698975, 7.628243446350098, 8.130631446838379, 8.63301944732666, 9.135407447814941, 9.637794494628906, 10.140182495117188, 10.642570495605469, 11.14495849609375, 11.647346496582031, 12.149734497070312, 12.652122497558594, 13.154510498046875, 13.656898498535156, 14.159285545349121, 14.661673545837402, 15.164061546325684, 15.666449546813965, 16.16883659362793]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 23.0, 21.0, 31.0, 41.0, 68.0, 111.0, 183.0, 263.0, 344.0, 580.0, 876.0, 1367.0, 2113.0, 3431.0, 5850.0, 10023.0, 17868.0, 32856.0, 63297.0, 125981.0, 258339.0, 508127.0, 845495.0, 945040.0, 663911.0, 355428.0, 173634.0, 84422.0, 42582.0, 22138.0, 12071.0, 6912.0, 4017.0, 2460.0, 1584.0, 982.0, 616.0, 385.0, 285.0, 176.0, 136.0, 77.0, 44.0, 32.0, 21.0, 16.0, 8.0, 11.0, 3.0, 2.0, 2.0], "bins": [-26.890625, -26.148193359375, -25.40576171875, -24.663330078125, -23.9208984375, -23.178466796875, -22.43603515625, -21.693603515625, -20.951171875, -20.208740234375, -19.46630859375, -18.723876953125, -17.9814453125, -17.239013671875, -16.49658203125, -15.754150390625, -15.01171875, -14.269287109375, -13.52685546875, -12.784423828125, -12.0419921875, -11.299560546875, -10.55712890625, -9.814697265625, -9.072265625, -8.329833984375, -7.58740234375, -6.844970703125, -6.1025390625, -5.360107421875, -4.61767578125, -3.875244140625, -3.1328125, -2.390380859375, -1.64794921875, -0.905517578125, -0.1630859375, 0.579345703125, 1.32177734375, 2.064208984375, 2.806640625, 3.549072265625, 4.29150390625, 5.033935546875, 5.7763671875, 6.518798828125, 7.26123046875, 8.003662109375, 8.74609375, 9.488525390625, 10.23095703125, 10.973388671875, 11.7158203125, 12.458251953125, 13.20068359375, 13.943115234375, 14.685546875, 15.427978515625, 16.17041015625, 16.912841796875, 17.6552734375, 18.397705078125, 19.14013671875, 19.882568359375, 20.625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 8.0, 2.0, 3.0, 16.0, 16.0, 14.0, 21.0, 19.0, 27.0, 30.0, 33.0, 43.0, 46.0, 44.0, 45.0, 46.0, 57.0, 37.0, 43.0, 57.0, 60.0, 42.0, 47.0, 42.0, 40.0, 41.0, 24.0, 18.0, 18.0, 16.0, 7.0, 14.0, 7.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.79248046875, -13.3271484375, -12.86181640625, -12.396484375, -11.93115234375, -11.4658203125, -11.00048828125, -10.53515625, -10.06982421875, -9.6044921875, -9.13916015625, -8.673828125, -8.20849609375, -7.7431640625, -7.27783203125, -6.8125, -6.34716796875, -5.8818359375, -5.41650390625, -4.951171875, -4.48583984375, -4.0205078125, -3.55517578125, -3.08984375, -2.62451171875, -2.1591796875, -1.69384765625, -1.228515625, -0.76318359375, -0.2978515625, 0.16748046875, 0.6328125, 1.09814453125, 1.5634765625, 2.02880859375, 2.494140625, 2.95947265625, 3.4248046875, 3.89013671875, 4.35546875, 4.82080078125, 5.2861328125, 5.75146484375, 6.216796875, 6.68212890625, 7.1474609375, 7.61279296875, 8.078125, 8.54345703125, 9.0087890625, 9.47412109375, 9.939453125, 10.40478515625, 10.8701171875, 11.33544921875, 11.80078125, 12.26611328125, 12.7314453125, 13.19677734375, 13.662109375, 14.12744140625, 14.5927734375, 15.05810546875, 15.5234375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 16.0, 25.0, 27.0, 59.0, 61.0, 110.0, 176.0, 279.0, 414.0, 567.0, 941.0, 1552.0, 2330.0, 3890.0, 6632.0, 11408.0, 19723.0, 35033.0, 64320.0, 119541.0, 221537.0, 399993.0, 647676.0, 826738.0, 734623.0, 484396.0, 277344.0, 150579.0, 80938.0, 44293.0, 24632.0, 13834.0, 8090.0, 4760.0, 2843.0, 1714.0, 1092.0, 758.0, 457.0, 324.0, 182.0, 140.0, 83.0, 48.0, 34.0, 23.0, 17.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0], "bins": [-27.453125, -26.66162109375, -25.8701171875, -25.07861328125, -24.287109375, -23.49560546875, -22.7041015625, -21.91259765625, -21.12109375, -20.32958984375, -19.5380859375, -18.74658203125, -17.955078125, -17.16357421875, -16.3720703125, -15.58056640625, -14.7890625, -13.99755859375, -13.2060546875, -12.41455078125, -11.623046875, -10.83154296875, -10.0400390625, -9.24853515625, -8.45703125, -7.66552734375, -6.8740234375, -6.08251953125, -5.291015625, -4.49951171875, -3.7080078125, -2.91650390625, -2.125, -1.33349609375, -0.5419921875, 0.24951171875, 1.041015625, 1.83251953125, 2.6240234375, 3.41552734375, 4.20703125, 4.99853515625, 5.7900390625, 6.58154296875, 7.373046875, 8.16455078125, 8.9560546875, 9.74755859375, 10.5390625, 11.33056640625, 12.1220703125, 12.91357421875, 13.705078125, 14.49658203125, 15.2880859375, 16.07958984375, 16.87109375, 17.66259765625, 18.4541015625, 19.24560546875, 20.037109375, 20.82861328125, 21.6201171875, 22.41162109375, 23.203125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 0.0, 6.0, 5.0, 17.0, 15.0, 22.0, 18.0, 38.0, 51.0, 73.0, 80.0, 134.0, 164.0, 197.0, 262.0, 299.0, 317.0, 346.0, 344.0, 335.0, 275.0, 254.0, 208.0, 147.0, 130.0, 100.0, 68.0, 59.0, 26.0, 25.0, 13.0, 16.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.4296875, -12.10009765625, -11.7705078125, -11.44091796875, -11.111328125, -10.78173828125, -10.4521484375, -10.12255859375, -9.79296875, -9.46337890625, -9.1337890625, -8.80419921875, -8.474609375, -8.14501953125, -7.8154296875, -7.48583984375, -7.15625, -6.82666015625, -6.4970703125, -6.16748046875, -5.837890625, -5.50830078125, -5.1787109375, -4.84912109375, -4.51953125, -4.18994140625, -3.8603515625, -3.53076171875, -3.201171875, -2.87158203125, -2.5419921875, -2.21240234375, -1.8828125, -1.55322265625, -1.2236328125, -0.89404296875, -0.564453125, -0.23486328125, 0.0947265625, 0.42431640625, 0.75390625, 1.08349609375, 1.4130859375, 1.74267578125, 2.072265625, 2.40185546875, 2.7314453125, 3.06103515625, 3.390625, 3.72021484375, 4.0498046875, 4.37939453125, 4.708984375, 5.03857421875, 5.3681640625, 5.69775390625, 6.02734375, 6.35693359375, 6.6865234375, 7.01611328125, 7.345703125, 7.67529296875, 8.0048828125, 8.33447265625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 3.0, 8.0, 20.0, 8.0, 15.0, 27.0, 24.0, 25.0, 36.0, 35.0, 52.0, 58.0, 59.0, 58.0, 64.0, 50.0, 69.0, 55.0, 45.0, 55.0, 51.0, 38.0, 27.0, 25.0, 16.0, 13.0, 9.0, 12.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.259218215942383, -20.40230941772461, -19.545400619506836, -18.688491821289062, -17.83158302307129, -16.974674224853516, -16.117765426635742, -15.260856628417969, -14.403947830200195, -13.547039031982422, -12.690130233764648, -11.833221435546875, -10.976312637329102, -10.119403839111328, -9.262495040893555, -8.405586242675781, -7.548677444458008, -6.691768646240234, -5.834859848022461, -4.9779510498046875, -4.121042251586914, -3.2641334533691406, -2.407224655151367, -1.5503158569335938, -0.6934070587158203, 0.16350173950195312, 1.0204105377197266, 1.8773193359375, 2.7342281341552734, 3.591136932373047, 4.44804573059082, 5.304954528808594, 6.161865234375, 7.018774032592773, 7.875682830810547, 8.73259162902832, 9.589500427246094, 10.446409225463867, 11.30331802368164, 12.160226821899414, 13.017135620117188, 13.874044418334961, 14.730953216552734, 15.587862014770508, 16.44477081298828, 17.301679611206055, 18.158588409423828, 19.0154972076416, 19.872406005859375, 20.72931480407715, 21.586223602294922, 22.443132400512695, 23.30004119873047, 24.156949996948242, 25.013858795166016, 25.87076759338379, 26.727676391601562, 27.584585189819336, 28.44149398803711, 29.298402786254883, 30.155311584472656, 31.01222038269043, 31.869129180908203, 32.726036071777344, 33.58294677734375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 5.0, 14.0, 11.0, 12.0, 19.0, 15.0, 26.0, 24.0, 35.0, 32.0, 26.0, 37.0, 43.0, 51.0, 40.0, 42.0, 43.0, 44.0, 45.0, 42.0, 33.0, 33.0, 42.0, 23.0, 16.0, 23.0, 31.0, 24.0, 26.0, 20.0, 23.0, 23.0, 13.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.862382888793945, -16.340221405029297, -15.818058967590332, -15.295896530151367, -14.773735046386719, -14.25157356262207, -13.729411125183105, -13.20724868774414, -12.685087203979492, -12.162925720214844, -11.640763282775879, -11.118600845336914, -10.596439361572266, -10.074277877807617, -9.552115440368652, -9.029953002929688, -8.507791519165039, -7.985629558563232, -7.463467597961426, -6.941305637359619, -6.4191436767578125, -5.896981716156006, -5.374819755554199, -4.852657794952393, -4.330495834350586, -3.8083338737487793, -3.2861719131469727, -2.764009952545166, -2.2418479919433594, -1.7196860313415527, -1.197524070739746, -0.6753621101379395, -0.1532001495361328, 0.36896181106567383, 0.8911237716674805, 1.413285732269287, 1.9354476928710938, 2.4576096534729004, 2.979771614074707, 3.5019335746765137, 4.02409553527832, 4.546257495880127, 5.068419456481934, 5.59058141708374, 6.112743377685547, 6.6349053382873535, 7.15706729888916, 7.679229259490967, 8.201391220092773, 8.723552703857422, 9.245715141296387, 9.767877578735352, 10.2900390625, 10.812200546264648, 11.334362983703613, 11.856525421142578, 12.378686904907227, 12.900848388671875, 13.42301082611084, 13.945173263549805, 14.467334747314453, 14.989496231079102, 15.511658668518066, 16.03382110595703, 16.55598258972168]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 17.0, 27.0, 34.0, 70.0, 90.0, 143.0, 204.0, 286.0, 495.0, 766.0, 1129.0, 1651.0, 2731.0, 4353.0, 6848.0, 10828.0, 17083.0, 26636.0, 40408.0, 59362.0, 82861.0, 108603.0, 127139.0, 132023.0, 119024.0, 95661.0, 70375.0, 48608.0, 32795.0, 21211.0, 13530.0, 8719.0, 5390.0, 3440.0, 2140.0, 1367.0, 912.0, 503.0, 373.0, 243.0, 139.0, 109.0, 66.0, 55.0, 35.0, 17.0, 15.0, 9.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.859375, -10.5225830078125, -10.185791015625, -9.8489990234375, -9.51220703125, -9.1754150390625, -8.838623046875, -8.5018310546875, -8.1650390625, -7.8282470703125, -7.491455078125, -7.1546630859375, -6.81787109375, -6.4810791015625, -6.144287109375, -5.8074951171875, -5.470703125, -5.1339111328125, -4.797119140625, -4.4603271484375, -4.12353515625, -3.7867431640625, -3.449951171875, -3.1131591796875, -2.7763671875, -2.4395751953125, -2.102783203125, -1.7659912109375, -1.42919921875, -1.0924072265625, -0.755615234375, -0.4188232421875, -0.08203125, 0.2547607421875, 0.591552734375, 0.9283447265625, 1.26513671875, 1.6019287109375, 1.938720703125, 2.2755126953125, 2.6123046875, 2.9490966796875, 3.285888671875, 3.6226806640625, 3.95947265625, 4.2962646484375, 4.633056640625, 4.9698486328125, 5.306640625, 5.6434326171875, 5.980224609375, 6.3170166015625, 6.65380859375, 6.9906005859375, 7.327392578125, 7.6641845703125, 8.0009765625, 8.3377685546875, 8.674560546875, 9.0113525390625, 9.34814453125, 9.6849365234375, 10.021728515625, 10.3585205078125, 10.6953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 15.0, 19.0, 14.0, 25.0, 25.0, 30.0, 33.0, 47.0, 35.0, 40.0, 47.0, 57.0, 42.0, 41.0, 51.0, 53.0, 51.0, 41.0, 31.0, 34.0, 38.0, 31.0, 24.0, 23.0, 23.0, 12.0, 17.0, 25.0, 14.0, 13.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.90625, -21.2646484375, -20.623046875, -19.9814453125, -19.33984375, -18.6982421875, -18.056640625, -17.4150390625, -16.7734375, -16.1318359375, -15.490234375, -14.8486328125, -14.20703125, -13.5654296875, -12.923828125, -12.2822265625, -11.640625, -10.9990234375, -10.357421875, -9.7158203125, -9.07421875, -8.4326171875, -7.791015625, -7.1494140625, -6.5078125, -5.8662109375, -5.224609375, -4.5830078125, -3.94140625, -3.2998046875, -2.658203125, -2.0166015625, -1.375, -0.7333984375, -0.091796875, 0.5498046875, 1.19140625, 1.8330078125, 2.474609375, 3.1162109375, 3.7578125, 4.3994140625, 5.041015625, 5.6826171875, 6.32421875, 6.9658203125, 7.607421875, 8.2490234375, 8.890625, 9.5322265625, 10.173828125, 10.8154296875, 11.45703125, 12.0986328125, 12.740234375, 13.3818359375, 14.0234375, 14.6650390625, 15.306640625, 15.9482421875, 16.58984375, 17.2314453125, 17.873046875, 18.5146484375, 19.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 11.0, 8.0, 11.0, 27.0, 30.0, 33.0, 67.0, 102.0, 125.0, 183.0, 359.0, 508.0, 838.0, 1309.0, 2201.0, 3696.0, 6457.0, 11832.0, 21036.0, 40246.0, 74590.0, 133764.0, 203508.0, 213516.0, 148264.0, 85358.0, 45419.0, 23958.0, 13077.0, 7462.0, 4083.0, 2455.0, 1484.0, 885.0, 594.0, 352.0, 223.0, 140.0, 127.0, 69.0, 50.0, 26.0, 20.0, 17.0, 13.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.359375, -18.75634765625, -18.1533203125, -17.55029296875, -16.947265625, -16.34423828125, -15.7412109375, -15.13818359375, -14.53515625, -13.93212890625, -13.3291015625, -12.72607421875, -12.123046875, -11.52001953125, -10.9169921875, -10.31396484375, -9.7109375, -9.10791015625, -8.5048828125, -7.90185546875, -7.298828125, -6.69580078125, -6.0927734375, -5.48974609375, -4.88671875, -4.28369140625, -3.6806640625, -3.07763671875, -2.474609375, -1.87158203125, -1.2685546875, -0.66552734375, -0.0625, 0.54052734375, 1.1435546875, 1.74658203125, 2.349609375, 2.95263671875, 3.5556640625, 4.15869140625, 4.76171875, 5.36474609375, 5.9677734375, 6.57080078125, 7.173828125, 7.77685546875, 8.3798828125, 8.98291015625, 9.5859375, 10.18896484375, 10.7919921875, 11.39501953125, 11.998046875, 12.60107421875, 13.2041015625, 13.80712890625, 14.41015625, 15.01318359375, 15.6162109375, 16.21923828125, 16.822265625, 17.42529296875, 18.0283203125, 18.63134765625, 19.234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 11.0, 8.0, 12.0, 12.0, 12.0, 16.0, 19.0, 18.0, 26.0, 37.0, 26.0, 36.0, 37.0, 32.0, 32.0, 38.0, 44.0, 46.0, 36.0, 35.0, 37.0, 43.0, 41.0, 31.0, 33.0, 30.0, 27.0, 25.0, 37.0, 26.0, 25.0, 16.0, 15.0, 16.0, 9.0, 12.0, 15.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-10.5, -10.195068359375, -9.89013671875, -9.585205078125, -9.2802734375, -8.975341796875, -8.67041015625, -8.365478515625, -8.060546875, -7.755615234375, -7.45068359375, -7.145751953125, -6.8408203125, -6.535888671875, -6.23095703125, -5.926025390625, -5.62109375, -5.316162109375, -5.01123046875, -4.706298828125, -4.4013671875, -4.096435546875, -3.79150390625, -3.486572265625, -3.181640625, -2.876708984375, -2.57177734375, -2.266845703125, -1.9619140625, -1.656982421875, -1.35205078125, -1.047119140625, -0.7421875, -0.437255859375, -0.13232421875, 0.172607421875, 0.4775390625, 0.782470703125, 1.08740234375, 1.392333984375, 1.697265625, 2.002197265625, 2.30712890625, 2.612060546875, 2.9169921875, 3.221923828125, 3.52685546875, 3.831787109375, 4.13671875, 4.441650390625, 4.74658203125, 5.051513671875, 5.3564453125, 5.661376953125, 5.96630859375, 6.271240234375, 6.576171875, 6.881103515625, 7.18603515625, 7.490966796875, 7.7958984375, 8.100830078125, 8.40576171875, 8.710693359375, 9.015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 17.0, 22.0, 30.0, 51.0, 79.0, 98.0, 159.0, 268.0, 439.0, 648.0, 1021.0, 1663.0, 2650.0, 4393.0, 7453.0, 13238.0, 23613.0, 43280.0, 78814.0, 140225.0, 210374.0, 208467.0, 137406.0, 77168.0, 42326.0, 22696.0, 13029.0, 7406.0, 4418.0, 2582.0, 1605.0, 994.0, 643.0, 419.0, 280.0, 189.0, 135.0, 74.0, 55.0, 41.0, 22.0, 19.0, 20.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0, -10.66650390625, -10.3330078125, -9.99951171875, -9.666015625, -9.33251953125, -8.9990234375, -8.66552734375, -8.33203125, -7.99853515625, -7.6650390625, -7.33154296875, -6.998046875, -6.66455078125, -6.3310546875, -5.99755859375, -5.6640625, -5.33056640625, -4.9970703125, -4.66357421875, -4.330078125, -3.99658203125, -3.6630859375, -3.32958984375, -2.99609375, -2.66259765625, -2.3291015625, -1.99560546875, -1.662109375, -1.32861328125, -0.9951171875, -0.66162109375, -0.328125, 0.00537109375, 0.3388671875, 0.67236328125, 1.005859375, 1.33935546875, 1.6728515625, 2.00634765625, 2.33984375, 2.67333984375, 3.0068359375, 3.34033203125, 3.673828125, 4.00732421875, 4.3408203125, 4.67431640625, 5.0078125, 5.34130859375, 5.6748046875, 6.00830078125, 6.341796875, 6.67529296875, 7.0087890625, 7.34228515625, 7.67578125, 8.00927734375, 8.3427734375, 8.67626953125, 9.009765625, 9.34326171875, 9.6767578125, 10.01025390625, 10.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 10.0, 7.0, 11.0, 14.0, 12.0, 18.0, 17.0, 24.0, 29.0, 32.0, 45.0, 37.0, 62.0, 56.0, 55.0, 56.0, 52.0, 57.0, 35.0, 56.0, 43.0, 34.0, 38.0, 40.0, 32.0, 27.0, 18.0, 18.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004820823669433594, -0.00046910718083381653, -0.0004561319947242737, -0.00044315680861473083, -0.000430181622505188, -0.00041720643639564514, -0.0004042312502861023, -0.00039125606417655945, -0.0003782808780670166, -0.00036530569195747375, -0.0003523305058479309, -0.00033935531973838806, -0.0003263801336288452, -0.00031340494751930237, -0.0003004297614097595, -0.0002874545753002167, -0.00027447938919067383, -0.000261504203081131, -0.00024852901697158813, -0.0002355538308620453, -0.00022257864475250244, -0.0002096034586429596, -0.00019662827253341675, -0.0001836530864238739, -0.00017067790031433105, -0.0001577027142047882, -0.00014472752809524536, -0.00013175234198570251, -0.00011877715587615967, -0.00010580196976661682, -9.282678365707397e-05, -7.985159754753113e-05, -6.687641143798828e-05, -5.3901225328445435e-05, -4.092603921890259e-05, -2.795085310935974e-05, -1.4975666999816895e-05, -2.000480890274048e-06, 1.0974705219268799e-05, 2.3949891328811646e-05, 3.692507743835449e-05, 4.990026354789734e-05, 6.287544965744019e-05, 7.585063576698303e-05, 8.882582187652588e-05, 0.00010180100798606873, 0.00011477619409561157, 0.00012775138020515442, 0.00014072656631469727, 0.0001537017524242401, 0.00016667693853378296, 0.0001796521246433258, 0.00019262731075286865, 0.0002056024968624115, 0.00021857768297195435, 0.0002315528690814972, 0.00024452805519104004, 0.0002575032413005829, 0.00027047842741012573, 0.0002834536135196686, 0.0002964287996292114, 0.00030940398573875427, 0.0003223791718482971, 0.00033535435795783997, 0.0003483295440673828]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 13.0, 26.0, 25.0, 45.0, 81.0, 111.0, 191.0, 231.0, 362.0, 568.0, 844.0, 1279.0, 1934.0, 3078.0, 4364.0, 6812.0, 10313.0, 15740.0, 25034.0, 37716.0, 56820.0, 82909.0, 112185.0, 135559.0, 140732.0, 122699.0, 94344.0, 65945.0, 44368.0, 29538.0, 18731.0, 12305.0, 8075.0, 5330.0, 3426.0, 2254.0, 1516.0, 1065.0, 684.0, 432.0, 282.0, 194.0, 129.0, 91.0, 61.0, 41.0, 29.0, 14.0, 13.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.3125, -8.0543212890625, -7.796142578125, -7.5379638671875, -7.27978515625, -7.0216064453125, -6.763427734375, -6.5052490234375, -6.2470703125, -5.9888916015625, -5.730712890625, -5.4725341796875, -5.21435546875, -4.9561767578125, -4.697998046875, -4.4398193359375, -4.181640625, -3.9234619140625, -3.665283203125, -3.4071044921875, -3.14892578125, -2.8907470703125, -2.632568359375, -2.3743896484375, -2.1162109375, -1.8580322265625, -1.599853515625, -1.3416748046875, -1.08349609375, -0.8253173828125, -0.567138671875, -0.3089599609375, -0.05078125, 0.2073974609375, 0.465576171875, 0.7237548828125, 0.98193359375, 1.2401123046875, 1.498291015625, 1.7564697265625, 2.0146484375, 2.2728271484375, 2.531005859375, 2.7891845703125, 3.04736328125, 3.3055419921875, 3.563720703125, 3.8218994140625, 4.080078125, 4.3382568359375, 4.596435546875, 4.8546142578125, 5.11279296875, 5.3709716796875, 5.629150390625, 5.8873291015625, 6.1455078125, 6.4036865234375, 6.661865234375, 6.9200439453125, 7.17822265625, 7.4364013671875, 7.694580078125, 7.9527587890625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 10.0, 9.0, 8.0, 12.0, 12.0, 17.0, 19.0, 19.0, 30.0, 21.0, 40.0, 43.0, 38.0, 36.0, 52.0, 54.0, 38.0, 49.0, 49.0, 47.0, 46.0, 48.0, 35.0, 37.0, 35.0, 24.0, 27.0, 23.0, 16.0, 23.0, 13.0, 10.0, 6.0, 10.0, 2.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.595703125, -2.512664794921875, -2.42962646484375, -2.346588134765625, -2.2635498046875, -2.180511474609375, -2.09747314453125, -2.014434814453125, -1.931396484375, -1.848358154296875, -1.76531982421875, -1.682281494140625, -1.5992431640625, -1.516204833984375, -1.43316650390625, -1.350128173828125, -1.26708984375, -1.184051513671875, -1.10101318359375, -1.017974853515625, -0.9349365234375, -0.851898193359375, -0.76885986328125, -0.685821533203125, -0.602783203125, -0.519744873046875, -0.43670654296875, -0.353668212890625, -0.2706298828125, -0.187591552734375, -0.10455322265625, -0.021514892578125, 0.0615234375, 0.144561767578125, 0.22760009765625, 0.310638427734375, 0.3936767578125, 0.476715087890625, 0.55975341796875, 0.642791748046875, 0.725830078125, 0.808868408203125, 0.89190673828125, 0.974945068359375, 1.0579833984375, 1.141021728515625, 1.22406005859375, 1.307098388671875, 1.39013671875, 1.473175048828125, 1.55621337890625, 1.639251708984375, 1.7222900390625, 1.805328369140625, 1.88836669921875, 1.971405029296875, 2.054443359375, 2.137481689453125, 2.22052001953125, 2.303558349609375, 2.3865966796875, 2.469635009765625, 2.55267333984375, 2.635711669921875, 2.71875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 4.0, 8.0, 11.0, 12.0, 20.0, 26.0, 28.0, 28.0, 34.0, 57.0, 63.0, 52.0, 76.0, 61.0, 62.0, 70.0, 64.0, 54.0, 60.0, 43.0, 30.0, 36.0, 21.0, 18.0, 14.0, 10.0, 10.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.695209503173828, -23.747371673583984, -22.79953384399414, -21.851696014404297, -20.903858184814453, -19.95602035522461, -19.008182525634766, -18.060344696044922, -17.112506866455078, -16.164669036865234, -15.21683120727539, -14.268993377685547, -13.321155548095703, -12.37331771850586, -11.425479888916016, -10.477642059326172, -9.529803276062012, -8.581965446472168, -7.634127616882324, -6.6862897872924805, -5.738451957702637, -4.790613651275635, -3.842775821685791, -2.8949379920959473, -1.9471001625061035, -0.999262273311615, -0.051424384117126465, 0.8964135646820068, 1.8442513942718506, 2.7920894622802734, 3.739927291870117, 4.687765121459961, 5.635602951049805, 6.583440780639648, 7.531278610229492, 8.479116439819336, 9.42695426940918, 10.374792098999023, 11.322629928588867, 12.270467758178711, 13.218305587768555, 14.166143417358398, 15.113981246948242, 16.061819076538086, 17.00965690612793, 17.957494735717773, 18.905332565307617, 19.85317039489746, 20.801010131835938, 21.74884796142578, 22.696685791015625, 23.64452362060547, 24.592361450195312, 25.540199279785156, 26.488037109375, 27.435874938964844, 28.383712768554688, 29.33155059814453, 30.279388427734375, 31.22722625732422, 32.17506408691406, 33.122901916503906, 34.07073974609375, 35.018577575683594, 35.96641540527344]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 9.0, 13.0, 11.0, 15.0, 11.0, 21.0, 19.0, 21.0, 31.0, 31.0, 32.0, 33.0, 50.0, 34.0, 43.0, 39.0, 51.0, 41.0, 49.0, 42.0, 39.0, 28.0, 34.0, 33.0, 21.0, 21.0, 20.0, 24.0, 27.0, 23.0, 23.0, 23.0, 14.0, 15.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.635669708251953, -16.127405166625977, -15.619141578674316, -15.11087703704834, -14.60261344909668, -14.094348907470703, -13.586084365844727, -13.07781982421875, -12.56955623626709, -12.061291694641113, -11.553028106689453, -11.044763565063477, -10.5364990234375, -10.02823543548584, -9.519970893859863, -9.011707305908203, -8.503442764282227, -7.995178699493408, -7.48691463470459, -6.978650093078613, -6.470386028289795, -5.962121963500977, -5.453857421875, -4.945593357086182, -4.437329292297363, -3.929065227508545, -3.4208009243011475, -2.91253662109375, -2.4042725563049316, -1.8960084915161133, -1.3877441883087158, -0.8794798851013184, -0.3712167739868164, 0.1370474100112915, 0.6453115940093994, 1.1535757780075073, 1.6618399620056152, 2.1701040267944336, 2.678368330001831, 3.1866326332092285, 3.694896697998047, 4.203160762786865, 4.711424827575684, 5.21968936920166, 5.7279534339904785, 6.236217498779297, 6.744482040405273, 7.252746105194092, 7.76101016998291, 8.269274711608887, 8.777538299560547, 9.285802841186523, 9.7940673828125, 10.30233097076416, 10.810595512390137, 11.318859100341797, 11.827123641967773, 12.33538818359375, 12.84365177154541, 13.351916313171387, 13.860179901123047, 14.368444442749023, 14.876708984375, 15.384973526000977, 15.893237113952637]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 18.0, 27.0, 49.0, 85.0, 153.0, 199.0, 286.0, 430.0, 715.0, 1148.0, 1829.0, 3014.0, 4797.0, 7595.0, 11806.0, 18695.0, 28795.0, 43623.0, 63515.0, 86814.0, 111006.0, 126479.0, 128356.0, 114977.0, 92019.0, 67648.0, 47218.0, 31150.0, 20398.0, 13234.0, 8295.0, 5219.0, 3223.0, 2176.0, 1289.0, 832.0, 506.0, 327.0, 195.0, 147.0, 97.0, 56.0, 28.0, 21.0, 19.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-15.5234375, -15.0682373046875, -14.613037109375, -14.1578369140625, -13.70263671875, -13.2474365234375, -12.792236328125, -12.3370361328125, -11.8818359375, -11.4266357421875, -10.971435546875, -10.5162353515625, -10.06103515625, -9.6058349609375, -9.150634765625, -8.6954345703125, -8.240234375, -7.7850341796875, -7.329833984375, -6.8746337890625, -6.41943359375, -5.9642333984375, -5.509033203125, -5.0538330078125, -4.5986328125, -4.1434326171875, -3.688232421875, -3.2330322265625, -2.77783203125, -2.3226318359375, -1.867431640625, -1.4122314453125, -0.95703125, -0.5018310546875, -0.046630859375, 0.4085693359375, 0.86376953125, 1.3189697265625, 1.774169921875, 2.2293701171875, 2.6845703125, 3.1397705078125, 3.594970703125, 4.0501708984375, 4.50537109375, 4.9605712890625, 5.415771484375, 5.8709716796875, 6.326171875, 6.7813720703125, 7.236572265625, 7.6917724609375, 8.14697265625, 8.6021728515625, 9.057373046875, 9.5125732421875, 9.9677734375, 10.4229736328125, 10.878173828125, 11.3333740234375, 11.78857421875, 12.2437744140625, 12.698974609375, 13.1541748046875, 13.609375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 13.0, 8.0, 13.0, 15.0, 18.0, 23.0, 20.0, 29.0, 49.0, 38.0, 29.0, 47.0, 47.0, 51.0, 43.0, 40.0, 47.0, 39.0, 41.0, 34.0, 34.0, 48.0, 29.0, 36.0, 28.0, 30.0, 23.0, 22.0, 14.0, 14.0, 9.0, 8.0, 10.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.0625, -17.471435546875, -16.88037109375, -16.289306640625, -15.6982421875, -15.107177734375, -14.51611328125, -13.925048828125, -13.333984375, -12.742919921875, -12.15185546875, -11.560791015625, -10.9697265625, -10.378662109375, -9.78759765625, -9.196533203125, -8.60546875, -8.014404296875, -7.42333984375, -6.832275390625, -6.2412109375, -5.650146484375, -5.05908203125, -4.468017578125, -3.876953125, -3.285888671875, -2.69482421875, -2.103759765625, -1.5126953125, -0.921630859375, -0.33056640625, 0.260498046875, 0.8515625, 1.442626953125, 2.03369140625, 2.624755859375, 3.2158203125, 3.806884765625, 4.39794921875, 4.989013671875, 5.580078125, 6.171142578125, 6.76220703125, 7.353271484375, 7.9443359375, 8.535400390625, 9.12646484375, 9.717529296875, 10.30859375, 10.899658203125, 11.49072265625, 12.081787109375, 12.6728515625, 13.263916015625, 13.85498046875, 14.446044921875, 15.037109375, 15.628173828125, 16.21923828125, 16.810302734375, 17.4013671875, 17.992431640625, 18.58349609375, 19.174560546875, 19.765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 17.0, 13.0, 28.0, 54.0, 85.0, 134.0, 182.0, 303.0, 454.0, 668.0, 1161.0, 1775.0, 2617.0, 4319.0, 6726.0, 10388.0, 16219.0, 24589.0, 37115.0, 53781.0, 74780.0, 96389.0, 114943.0, 124073.0, 118559.0, 101358.0, 79891.0, 58806.0, 40870.0, 27500.0, 18329.0, 11803.0, 7417.0, 4834.0, 3027.0, 1919.0, 1193.0, 818.0, 514.0, 336.0, 210.0, 130.0, 75.0, 59.0, 31.0, 25.0, 14.0, 7.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.6328125, -14.184326171875, -13.73583984375, -13.287353515625, -12.8388671875, -12.390380859375, -11.94189453125, -11.493408203125, -11.044921875, -10.596435546875, -10.14794921875, -9.699462890625, -9.2509765625, -8.802490234375, -8.35400390625, -7.905517578125, -7.45703125, -7.008544921875, -6.56005859375, -6.111572265625, -5.6630859375, -5.214599609375, -4.76611328125, -4.317626953125, -3.869140625, -3.420654296875, -2.97216796875, -2.523681640625, -2.0751953125, -1.626708984375, -1.17822265625, -0.729736328125, -0.28125, 0.167236328125, 0.61572265625, 1.064208984375, 1.5126953125, 1.961181640625, 2.40966796875, 2.858154296875, 3.306640625, 3.755126953125, 4.20361328125, 4.652099609375, 5.1005859375, 5.549072265625, 5.99755859375, 6.446044921875, 6.89453125, 7.343017578125, 7.79150390625, 8.239990234375, 8.6884765625, 9.136962890625, 9.58544921875, 10.033935546875, 10.482421875, 10.930908203125, 11.37939453125, 11.827880859375, 12.2763671875, 12.724853515625, 13.17333984375, 13.621826171875, 14.0703125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 9.0, 2.0, 6.0, 6.0, 5.0, 4.0, 9.0, 12.0, 23.0, 24.0, 22.0, 23.0, 32.0, 21.0, 35.0, 32.0, 36.0, 34.0, 49.0, 49.0, 37.0, 46.0, 50.0, 29.0, 38.0, 37.0, 31.0, 16.0, 38.0, 34.0, 34.0, 28.0, 22.0, 22.0, 24.0, 16.0, 19.0, 11.0, 8.0, 5.0, 6.0, 8.0, 2.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.7822265625, -8.431640625, -8.0810546875, -7.73046875, -7.3798828125, -7.029296875, -6.6787109375, -6.328125, -5.9775390625, -5.626953125, -5.2763671875, -4.92578125, -4.5751953125, -4.224609375, -3.8740234375, -3.5234375, -3.1728515625, -2.822265625, -2.4716796875, -2.12109375, -1.7705078125, -1.419921875, -1.0693359375, -0.71875, -0.3681640625, -0.017578125, 0.3330078125, 0.68359375, 1.0341796875, 1.384765625, 1.7353515625, 2.0859375, 2.4365234375, 2.787109375, 3.1376953125, 3.48828125, 3.8388671875, 4.189453125, 4.5400390625, 4.890625, 5.2412109375, 5.591796875, 5.9423828125, 6.29296875, 6.6435546875, 6.994140625, 7.3447265625, 7.6953125, 8.0458984375, 8.396484375, 8.7470703125, 9.09765625, 9.4482421875, 9.798828125, 10.1494140625, 10.5, 10.8505859375, 11.201171875, 11.5517578125, 11.90234375, 12.2529296875, 12.603515625, 12.9541015625, 13.3046875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 6.0, 12.0, 10.0, 21.0, 24.0, 49.0, 59.0, 76.0, 129.0, 196.0, 277.0, 397.0, 710.0, 1136.0, 1761.0, 3056.0, 5278.0, 9286.0, 17232.0, 32105.0, 59815.0, 103925.0, 158256.0, 192492.0, 174621.0, 123906.0, 73664.0, 40363.0, 21854.0, 11657.0, 6584.0, 3730.0, 2178.0, 1342.0, 809.0, 518.0, 328.0, 230.0, 135.0, 105.0, 71.0, 44.0, 33.0, 23.0, 19.0, 13.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0], "bins": [-12.21875, -11.8763427734375, -11.533935546875, -11.1915283203125, -10.84912109375, -10.5067138671875, -10.164306640625, -9.8218994140625, -9.4794921875, -9.1370849609375, -8.794677734375, -8.4522705078125, -8.10986328125, -7.7674560546875, -7.425048828125, -7.0826416015625, -6.740234375, -6.3978271484375, -6.055419921875, -5.7130126953125, -5.37060546875, -5.0281982421875, -4.685791015625, -4.3433837890625, -4.0009765625, -3.6585693359375, -3.316162109375, -2.9737548828125, -2.63134765625, -2.2889404296875, -1.946533203125, -1.6041259765625, -1.26171875, -0.9193115234375, -0.576904296875, -0.2344970703125, 0.10791015625, 0.4503173828125, 0.792724609375, 1.1351318359375, 1.4775390625, 1.8199462890625, 2.162353515625, 2.5047607421875, 2.84716796875, 3.1895751953125, 3.531982421875, 3.8743896484375, 4.216796875, 4.5592041015625, 4.901611328125, 5.2440185546875, 5.58642578125, 5.9288330078125, 6.271240234375, 6.6136474609375, 6.9560546875, 7.2984619140625, 7.640869140625, 7.9832763671875, 8.32568359375, 8.6680908203125, 9.010498046875, 9.3529052734375, 9.6953125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 2.0, 4.0, 9.0, 5.0, 5.0, 13.0, 6.0, 13.0, 18.0, 23.0, 15.0, 22.0, 36.0, 23.0, 32.0, 36.0, 48.0, 54.0, 50.0, 43.0, 40.0, 47.0, 47.0, 43.0, 45.0, 34.0, 35.0, 34.0, 27.0, 32.0, 27.0, 23.0, 17.0, 15.0, 10.0, 11.0, 7.0, 6.0, 9.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007491111755371094, -0.0007250681519508362, -0.000701025128364563, -0.0006769821047782898, -0.0006529390811920166, -0.0006288960576057434, -0.0006048530340194702, -0.000580810010433197, -0.0005567669868469238, -0.0005327239632606506, -0.0005086809396743774, -0.00048463791608810425, -0.00046059489250183105, -0.00043655186891555786, -0.00041250884532928467, -0.0003884658217430115, -0.0003644227981567383, -0.0003403797745704651, -0.0003163367509841919, -0.0002922937273979187, -0.0002682507038116455, -0.0002442076802253723, -0.00022016465663909912, -0.00019612163305282593, -0.00017207860946655273, -0.00014803558588027954, -0.00012399256229400635, -9.994953870773315e-05, -7.590651512145996e-05, -5.186349153518677e-05, -2.7820467948913574e-05, -3.777444362640381e-06, 2.0265579223632812e-05, 4.4308602809906006e-05, 6.83516263961792e-05, 9.239464998245239e-05, 0.00011643767356872559, 0.00014048069715499878, 0.00016452372074127197, 0.00018856674432754517, 0.00021260976791381836, 0.00023665279150009155, 0.00026069581508636475, 0.00028473883867263794, 0.00030878186225891113, 0.0003328248858451843, 0.0003568679094314575, 0.0003809109330177307, 0.0004049539566040039, 0.0004289969801902771, 0.0004530400037765503, 0.0004770830273628235, 0.0005011260509490967, 0.0005251690745353699, 0.0005492120981216431, 0.0005732551217079163, 0.0005972981452941895, 0.0006213411688804626, 0.0006453841924667358, 0.000669427216053009, 0.0006934702396392822, 0.0007175132632255554, 0.0007415562868118286, 0.0007655993103981018, 0.000789642333984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 21.0, 28.0, 28.0, 39.0, 70.0, 120.0, 146.0, 269.0, 422.0, 737.0, 1266.0, 2592.0, 5940.0, 15599.0, 43730.0, 122001.0, 261405.0, 306287.0, 177899.0, 69271.0, 24065.0, 8879.0, 3637.0, 1714.0, 924.0, 509.0, 319.0, 206.0, 137.0, 82.0, 56.0, 40.0, 26.0, 25.0, 16.0, 8.0, 9.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.38916015625, -16.7939453125, -16.19873046875, -15.603515625, -15.00830078125, -14.4130859375, -13.81787109375, -13.22265625, -12.62744140625, -12.0322265625, -11.43701171875, -10.841796875, -10.24658203125, -9.6513671875, -9.05615234375, -8.4609375, -7.86572265625, -7.2705078125, -6.67529296875, -6.080078125, -5.48486328125, -4.8896484375, -4.29443359375, -3.69921875, -3.10400390625, -2.5087890625, -1.91357421875, -1.318359375, -0.72314453125, -0.1279296875, 0.46728515625, 1.0625, 1.65771484375, 2.2529296875, 2.84814453125, 3.443359375, 4.03857421875, 4.6337890625, 5.22900390625, 5.82421875, 6.41943359375, 7.0146484375, 7.60986328125, 8.205078125, 8.80029296875, 9.3955078125, 9.99072265625, 10.5859375, 11.18115234375, 11.7763671875, 12.37158203125, 12.966796875, 13.56201171875, 14.1572265625, 14.75244140625, 15.34765625, 15.94287109375, 16.5380859375, 17.13330078125, 17.728515625, 18.32373046875, 18.9189453125, 19.51416015625, 20.109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 19.0, 15.0, 31.0, 27.0, 39.0, 43.0, 60.0, 59.0, 50.0, 68.0, 72.0, 62.0, 69.0, 45.0, 56.0, 49.0, 28.0, 26.0, 35.0, 28.0, 22.0, 16.0, 12.0, 6.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.78173828125, -3.6572265625, -3.53271484375, -3.408203125, -3.28369140625, -3.1591796875, -3.03466796875, -2.91015625, -2.78564453125, -2.6611328125, -2.53662109375, -2.412109375, -2.28759765625, -2.1630859375, -2.03857421875, -1.9140625, -1.78955078125, -1.6650390625, -1.54052734375, -1.416015625, -1.29150390625, -1.1669921875, -1.04248046875, -0.91796875, -0.79345703125, -0.6689453125, -0.54443359375, -0.419921875, -0.29541015625, -0.1708984375, -0.04638671875, 0.078125, 0.20263671875, 0.3271484375, 0.45166015625, 0.576171875, 0.70068359375, 0.8251953125, 0.94970703125, 1.07421875, 1.19873046875, 1.3232421875, 1.44775390625, 1.572265625, 1.69677734375, 1.8212890625, 1.94580078125, 2.0703125, 2.19482421875, 2.3193359375, 2.44384765625, 2.568359375, 2.69287109375, 2.8173828125, 2.94189453125, 3.06640625, 3.19091796875, 3.3154296875, 3.43994140625, 3.564453125, 3.68896484375, 3.8134765625, 3.93798828125, 4.0625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 7.0, 16.0, 9.0, 11.0, 20.0, 22.0, 32.0, 38.0, 40.0, 51.0, 61.0, 70.0, 69.0, 62.0, 66.0, 67.0, 50.0, 51.0, 61.0, 36.0, 33.0, 33.0, 20.0, 16.0, 10.0, 14.0, 7.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.203081130981445, -23.262569427490234, -22.322057723999023, -21.381546020507812, -20.4410343170166, -19.50052261352539, -18.560012817382812, -17.61949920654297, -16.67898941040039, -15.73847770690918, -14.797966003417969, -13.857454299926758, -12.916942596435547, -11.976430892944336, -11.035920143127441, -10.09540843963623, -9.154895782470703, -8.214384078979492, -7.273872375488281, -6.3333611488342285, -5.392849445343018, -4.452337741851807, -3.511826515197754, -2.571314811706543, -1.630803108215332, -0.6902915239334106, 0.25022006034851074, 1.1907315254211426, 2.1312432289123535, 3.0717549324035645, 4.012266159057617, 4.952777862548828, 5.893291473388672, 6.833803176879883, 7.774314880371094, 8.714826583862305, 9.655338287353516, 10.595849990844727, 11.536360740661621, 12.476872444152832, 13.417384147644043, 14.357895851135254, 15.298407554626465, 16.23891830444336, 17.17943000793457, 18.11994171142578, 19.060453414916992, 20.000965118408203, 20.941476821899414, 21.881988525390625, 22.822500228881836, 23.763011932373047, 24.703523635864258, 25.64403533935547, 26.584545135498047, 27.52505874633789, 28.46556854248047, 29.40608024597168, 30.34659194946289, 31.2871036529541, 32.22761535644531, 33.16812515258789, 34.108638763427734, 35.04914855957031, 35.989662170410156]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 8.0, 5.0, 11.0, 10.0, 14.0, 9.0, 19.0, 18.0, 21.0, 23.0, 28.0, 32.0, 26.0, 38.0, 42.0, 36.0, 40.0, 42.0, 42.0, 40.0, 38.0, 40.0, 43.0, 49.0, 33.0, 33.0, 38.0, 27.0, 18.0, 28.0, 22.0, 18.0, 13.0, 18.0, 8.0, 9.0, 7.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-17.0711669921875, -16.55986213684082, -16.048559188842773, -15.53725528717041, -15.025951385498047, -14.514646530151367, -14.003342628479004, -13.49203872680664, -12.980734825134277, -12.469430923461914, -11.95812702178955, -11.446823120117188, -10.935518264770508, -10.424215316772461, -9.912910461425781, -9.401606559753418, -8.890302658081055, -8.378998756408691, -7.867694854736328, -7.356390476226807, -6.845086574554443, -6.33378267288208, -5.822478294372559, -5.311174392700195, -4.799870491027832, -4.288566589355469, -3.7772624492645264, -3.265958309173584, -2.7546544075012207, -2.2433505058288574, -1.732046365737915, -1.2207422256469727, -0.7094402313232422, -0.19813621044158936, 0.3131678104400635, 0.8244718313217163, 1.3357758522033691, 1.8470797538757324, 2.358383893966675, 2.869688034057617, 3.3809919357299805, 3.8922958374023438, 4.403599739074707, 4.9149041175842285, 5.426208019256592, 5.937511920928955, 6.448816299438477, 6.96012020111084, 7.471424102783203, 7.982728004455566, 8.49403190612793, 9.005335807800293, 9.516639709472656, 10.027944564819336, 10.5392484664917, 11.050552368164062, 11.561856269836426, 12.073160171508789, 12.584464073181152, 13.095767974853516, 13.607072830200195, 14.118375778198242, 14.629680633544922, 15.140984535217285, 15.652288436889648]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 8.0, 9.0, 7.0, 11.0, 31.0, 44.0, 53.0, 97.0, 140.0, 212.0, 348.0, 537.0, 927.0, 1606.0, 2640.0, 4635.0, 8550.0, 15619.0, 30449.0, 61422.0, 128583.0, 274104.0, 549928.0, 893863.0, 950438.0, 637087.0, 327392.0, 153976.0, 73643.0, 36199.0, 18462.0, 9972.0, 5561.0, 3082.0, 1791.0, 1074.0, 648.0, 387.0, 254.0, 165.0, 123.0, 71.0, 44.0, 31.0, 21.0, 14.0, 12.0, 3.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.90625, -28.97509765625, -28.0439453125, -27.11279296875, -26.181640625, -25.25048828125, -24.3193359375, -23.38818359375, -22.45703125, -21.52587890625, -20.5947265625, -19.66357421875, -18.732421875, -17.80126953125, -16.8701171875, -15.93896484375, -15.0078125, -14.07666015625, -13.1455078125, -12.21435546875, -11.283203125, -10.35205078125, -9.4208984375, -8.48974609375, -7.55859375, -6.62744140625, -5.6962890625, -4.76513671875, -3.833984375, -2.90283203125, -1.9716796875, -1.04052734375, -0.109375, 0.82177734375, 1.7529296875, 2.68408203125, 3.615234375, 4.54638671875, 5.4775390625, 6.40869140625, 7.33984375, 8.27099609375, 9.2021484375, 10.13330078125, 11.064453125, 11.99560546875, 12.9267578125, 13.85791015625, 14.7890625, 15.72021484375, 16.6513671875, 17.58251953125, 18.513671875, 19.44482421875, 20.3759765625, 21.30712890625, 22.23828125, 23.16943359375, 24.1005859375, 25.03173828125, 25.962890625, 26.89404296875, 27.8251953125, 28.75634765625, 29.6875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 10.0, 12.0, 11.0, 20.0, 10.0, 22.0, 23.0, 27.0, 32.0, 30.0, 35.0, 33.0, 43.0, 44.0, 42.0, 51.0, 38.0, 48.0, 45.0, 43.0, 55.0, 43.0, 30.0, 30.0, 30.0, 26.0, 22.0, 21.0, 23.0, 17.0, 8.0, 15.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-18.03125, -17.537353515625, -17.04345703125, -16.549560546875, -16.0556640625, -15.561767578125, -15.06787109375, -14.573974609375, -14.080078125, -13.586181640625, -13.09228515625, -12.598388671875, -12.1044921875, -11.610595703125, -11.11669921875, -10.622802734375, -10.12890625, -9.635009765625, -9.14111328125, -8.647216796875, -8.1533203125, -7.659423828125, -7.16552734375, -6.671630859375, -6.177734375, -5.683837890625, -5.18994140625, -4.696044921875, -4.2021484375, -3.708251953125, -3.21435546875, -2.720458984375, -2.2265625, -1.732666015625, -1.23876953125, -0.744873046875, -0.2509765625, 0.242919921875, 0.73681640625, 1.230712890625, 1.724609375, 2.218505859375, 2.71240234375, 3.206298828125, 3.7001953125, 4.194091796875, 4.68798828125, 5.181884765625, 5.67578125, 6.169677734375, 6.66357421875, 7.157470703125, 7.6513671875, 8.145263671875, 8.63916015625, 9.133056640625, 9.626953125, 10.120849609375, 10.61474609375, 11.108642578125, 11.6025390625, 12.096435546875, 12.59033203125, 13.084228515625, 13.578125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 4.0, 10.0, 22.0, 38.0, 51.0, 87.0, 117.0, 192.0, 373.0, 578.0, 1061.0, 1982.0, 3758.0, 7386.0, 14883.0, 29579.0, 60667.0, 125907.0, 255598.0, 491933.0, 803007.0, 925365.0, 690466.0, 392592.0, 198412.0, 96609.0, 46935.0, 22980.0, 11403.0, 5664.0, 3023.0, 1580.0, 873.0, 450.0, 251.0, 170.0, 97.0, 67.0, 42.0, 27.0, 13.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5625, -35.43115234375, -34.2998046875, -33.16845703125, -32.037109375, -30.90576171875, -29.7744140625, -28.64306640625, -27.51171875, -26.38037109375, -25.2490234375, -24.11767578125, -22.986328125, -21.85498046875, -20.7236328125, -19.59228515625, -18.4609375, -17.32958984375, -16.1982421875, -15.06689453125, -13.935546875, -12.80419921875, -11.6728515625, -10.54150390625, -9.41015625, -8.27880859375, -7.1474609375, -6.01611328125, -4.884765625, -3.75341796875, -2.6220703125, -1.49072265625, -0.359375, 0.77197265625, 1.9033203125, 3.03466796875, 4.166015625, 5.29736328125, 6.4287109375, 7.56005859375, 8.69140625, 9.82275390625, 10.9541015625, 12.08544921875, 13.216796875, 14.34814453125, 15.4794921875, 16.61083984375, 17.7421875, 18.87353515625, 20.0048828125, 21.13623046875, 22.267578125, 23.39892578125, 24.5302734375, 25.66162109375, 26.79296875, 27.92431640625, 29.0556640625, 30.18701171875, 31.318359375, 32.44970703125, 33.5810546875, 34.71240234375, 35.84375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 28.0, 25.0, 42.0, 51.0, 50.0, 74.0, 100.0, 120.0, 155.0, 186.0, 237.0, 238.0, 272.0, 304.0, 293.0, 310.0, 266.0, 249.0, 243.0, 179.0, 146.0, 118.0, 96.0, 63.0, 57.0, 42.0, 22.0, 22.0, 23.0, 7.0, 5.0, 8.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.33837890625, -10.9736328125, -10.60888671875, -10.244140625, -9.87939453125, -9.5146484375, -9.14990234375, -8.78515625, -8.42041015625, -8.0556640625, -7.69091796875, -7.326171875, -6.96142578125, -6.5966796875, -6.23193359375, -5.8671875, -5.50244140625, -5.1376953125, -4.77294921875, -4.408203125, -4.04345703125, -3.6787109375, -3.31396484375, -2.94921875, -2.58447265625, -2.2197265625, -1.85498046875, -1.490234375, -1.12548828125, -0.7607421875, -0.39599609375, -0.03125, 0.33349609375, 0.6982421875, 1.06298828125, 1.427734375, 1.79248046875, 2.1572265625, 2.52197265625, 2.88671875, 3.25146484375, 3.6162109375, 3.98095703125, 4.345703125, 4.71044921875, 5.0751953125, 5.43994140625, 5.8046875, 6.16943359375, 6.5341796875, 6.89892578125, 7.263671875, 7.62841796875, 7.9931640625, 8.35791015625, 8.72265625, 9.08740234375, 9.4521484375, 9.81689453125, 10.181640625, 10.54638671875, 10.9111328125, 11.27587890625, 11.640625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 13.0, 6.0, 18.0, 20.0, 27.0, 25.0, 27.0, 38.0, 47.0, 46.0, 38.0, 48.0, 55.0, 61.0, 56.0, 49.0, 60.0, 56.0, 38.0, 33.0, 37.0, 26.0, 28.0, 16.0, 14.0, 9.0, 12.0, 20.0, 6.0, 8.0, 5.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.080623626708984, -26.166078567504883, -25.25153350830078, -24.33698844909668, -23.422443389892578, -22.507898330688477, -21.593353271484375, -20.67880630493164, -19.764263153076172, -18.84971809387207, -17.93517303466797, -17.020627975463867, -16.106082916259766, -15.191537857055664, -14.276991844177246, -13.362446784973145, -12.447900772094727, -11.533355712890625, -10.618810653686523, -9.704265594482422, -8.78972053527832, -7.8751749992370605, -6.960629463195801, -6.046084403991699, -5.131539344787598, -4.216994285583496, -3.3024489879608154, -2.3879036903381348, -1.4733586311340332, -0.5588135719299316, 0.3557319641113281, 1.2702770233154297, 2.1848201751708984, 3.099365234375, 4.013910293579102, 4.928455829620361, 5.843000888824463, 6.7575459480285645, 7.672091484069824, 8.586636543273926, 9.501181602478027, 10.415726661682129, 11.33027172088623, 12.244817733764648, 13.15936279296875, 14.073907852172852, 14.988452911376953, 15.902997970581055, 16.817543029785156, 17.732088088989258, 18.64663314819336, 19.56117820739746, 20.475723266601562, 21.390268325805664, 22.304813385009766, 23.2193603515625, 24.13390350341797, 25.04844856262207, 25.962993621826172, 26.877538681030273, 27.792083740234375, 28.706628799438477, 29.621173858642578, 30.535720825195312, 31.450265884399414]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 10.0, 18.0, 15.0, 20.0, 15.0, 25.0, 32.0, 32.0, 25.0, 28.0, 30.0, 52.0, 45.0, 40.0, 57.0, 48.0, 39.0, 42.0, 40.0, 36.0, 40.0, 31.0, 32.0, 29.0, 34.0, 32.0, 19.0, 20.0, 11.0, 15.0, 10.0, 13.0, 7.0, 7.0, 3.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.500263214111328, -21.853761672973633, -21.207260131835938, -20.560758590698242, -19.914257049560547, -19.26775360107422, -18.621253967285156, -17.974750518798828, -17.328248977661133, -16.681747436523438, -16.035245895385742, -15.388744354248047, -14.742241859436035, -14.09574031829834, -13.449238777160645, -12.802736282348633, -12.156235694885254, -11.509734153747559, -10.863232612609863, -10.216730117797852, -9.570228576660156, -8.923727035522461, -8.277225494384766, -7.630723476409912, -6.984221935272217, -6.3377203941345215, -5.691218376159668, -5.044716835021973, -4.398215293884277, -3.751713275909424, -3.1052117347717285, -2.458709716796875, -1.8122081756591797, -1.1657063961029053, -0.5192047357559204, 0.12729692459106445, 0.7737987041473389, 1.4203004837036133, 2.0668020248413086, 2.713304042816162, 3.3598055839538574, 4.006307125091553, 4.652809143066406, 5.299310684204102, 5.945812225341797, 6.59231424331665, 7.238815784454346, 7.885317802429199, 8.531819343566895, 9.17832088470459, 9.824822425842285, 10.471324920654297, 11.117826461791992, 11.764328002929688, 12.410829544067383, 13.057331085205078, 13.703832626342773, 14.350334167480469, 14.996835708618164, 15.64333724975586, 16.289838790893555, 16.93634033203125, 17.582843780517578, 18.229345321655273, 18.87584686279297]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 15.0, 13.0, 23.0, 34.0, 59.0, 77.0, 124.0, 182.0, 273.0, 487.0, 762.0, 1263.0, 1941.0, 3361.0, 5564.0, 9288.0, 15048.0, 25128.0, 41087.0, 64799.0, 95254.0, 128589.0, 150086.0, 146116.0, 120975.0, 87661.0, 57174.0, 36576.0, 22419.0, 13740.0, 8113.0, 4797.0, 2929.0, 1733.0, 1088.0, 641.0, 387.0, 272.0, 156.0, 105.0, 60.0, 62.0, 32.0, 24.0, 14.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4375, -14.9375, -14.4375, -13.9375, -13.4375, -12.9375, -12.4375, -11.9375, -11.4375, -10.9375, -10.4375, -9.9375, -9.4375, -8.9375, -8.4375, -7.9375, -7.4375, -6.9375, -6.4375, -5.9375, -5.4375, -4.9375, -4.4375, -3.9375, -3.4375, -2.9375, -2.4375, -1.9375, -1.4375, -0.9375, -0.4375, 0.0625, 0.5625, 1.0625, 1.5625, 2.0625, 2.5625, 3.0625, 3.5625, 4.0625, 4.5625, 5.0625, 5.5625, 6.0625, 6.5625, 7.0625, 7.5625, 8.0625, 8.5625, 9.0625, 9.5625, 10.0625, 10.5625, 11.0625, 11.5625, 12.0625, 12.5625, 13.0625, 13.5625, 14.0625, 14.5625, 15.0625, 15.5625, 16.0625, 16.5625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 2.0, 8.0, 7.0, 13.0, 11.0, 15.0, 28.0, 31.0, 20.0, 32.0, 22.0, 35.0, 40.0, 50.0, 55.0, 44.0, 54.0, 52.0, 53.0, 44.0, 45.0, 51.0, 44.0, 34.0, 32.0, 30.0, 28.0, 20.0, 14.0, 13.0, 15.0, 9.0, 8.0, 9.0, 9.0, 5.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5, -25.705810546875, -24.91162109375, -24.117431640625, -23.3232421875, -22.529052734375, -21.73486328125, -20.940673828125, -20.146484375, -19.352294921875, -18.55810546875, -17.763916015625, -16.9697265625, -16.175537109375, -15.38134765625, -14.587158203125, -13.79296875, -12.998779296875, -12.20458984375, -11.410400390625, -10.6162109375, -9.822021484375, -9.02783203125, -8.233642578125, -7.439453125, -6.645263671875, -5.85107421875, -5.056884765625, -4.2626953125, -3.468505859375, -2.67431640625, -1.880126953125, -1.0859375, -0.291748046875, 0.50244140625, 1.296630859375, 2.0908203125, 2.885009765625, 3.67919921875, 4.473388671875, 5.267578125, 6.061767578125, 6.85595703125, 7.650146484375, 8.4443359375, 9.238525390625, 10.03271484375, 10.826904296875, 11.62109375, 12.415283203125, 13.20947265625, 14.003662109375, 14.7978515625, 15.592041015625, 16.38623046875, 17.180419921875, 17.974609375, 18.768798828125, 19.56298828125, 20.357177734375, 21.1513671875, 21.945556640625, 22.73974609375, 23.533935546875, 24.328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 9.0, 15.0, 22.0, 28.0, 53.0, 47.0, 70.0, 99.0, 161.0, 246.0, 447.0, 677.0, 1131.0, 1933.0, 3272.0, 5892.0, 11204.0, 21913.0, 44281.0, 89082.0, 165483.0, 241287.0, 210223.0, 122755.0, 63017.0, 30997.0, 15545.0, 7959.0, 4331.0, 2493.0, 1419.0, 851.0, 538.0, 360.0, 208.0, 146.0, 94.0, 66.0, 42.0, 23.0, 21.0, 23.0, 14.0, 10.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-27.21875, -26.361328125, -25.50390625, -24.646484375, -23.7890625, -22.931640625, -22.07421875, -21.216796875, -20.359375, -19.501953125, -18.64453125, -17.787109375, -16.9296875, -16.072265625, -15.21484375, -14.357421875, -13.5, -12.642578125, -11.78515625, -10.927734375, -10.0703125, -9.212890625, -8.35546875, -7.498046875, -6.640625, -5.783203125, -4.92578125, -4.068359375, -3.2109375, -2.353515625, -1.49609375, -0.638671875, 0.21875, 1.076171875, 1.93359375, 2.791015625, 3.6484375, 4.505859375, 5.36328125, 6.220703125, 7.078125, 7.935546875, 8.79296875, 9.650390625, 10.5078125, 11.365234375, 12.22265625, 13.080078125, 13.9375, 14.794921875, 15.65234375, 16.509765625, 17.3671875, 18.224609375, 19.08203125, 19.939453125, 20.796875, 21.654296875, 22.51171875, 23.369140625, 24.2265625, 25.083984375, 25.94140625, 26.798828125, 27.65625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 7.0, 4.0, 8.0, 4.0, 13.0, 10.0, 12.0, 13.0, 20.0, 14.0, 18.0, 24.0, 25.0, 22.0, 26.0, 39.0, 32.0, 26.0, 42.0, 33.0, 44.0, 49.0, 36.0, 43.0, 39.0, 34.0, 36.0, 40.0, 34.0, 33.0, 27.0, 24.0, 20.0, 20.0, 21.0, 13.0, 15.0, 18.0, 11.0, 7.0, 9.0, 12.0, 11.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.6953125, -11.3287353515625, -10.962158203125, -10.5955810546875, -10.22900390625, -9.8624267578125, -9.495849609375, -9.1292724609375, -8.7626953125, -8.3961181640625, -8.029541015625, -7.6629638671875, -7.29638671875, -6.9298095703125, -6.563232421875, -6.1966552734375, -5.830078125, -5.4635009765625, -5.096923828125, -4.7303466796875, -4.36376953125, -3.9971923828125, -3.630615234375, -3.2640380859375, -2.8974609375, -2.5308837890625, -2.164306640625, -1.7977294921875, -1.43115234375, -1.0645751953125, -0.697998046875, -0.3314208984375, 0.03515625, 0.4017333984375, 0.768310546875, 1.1348876953125, 1.50146484375, 1.8680419921875, 2.234619140625, 2.6011962890625, 2.9677734375, 3.3343505859375, 3.700927734375, 4.0675048828125, 4.43408203125, 4.8006591796875, 5.167236328125, 5.5338134765625, 5.900390625, 6.2669677734375, 6.633544921875, 7.0001220703125, 7.36669921875, 7.7332763671875, 8.099853515625, 8.4664306640625, 8.8330078125, 9.1995849609375, 9.566162109375, 9.9327392578125, 10.29931640625, 10.6658935546875, 11.032470703125, 11.3990478515625, 11.765625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 16.0, 19.0, 40.0, 56.0, 60.0, 110.0, 149.0, 206.0, 307.0, 438.0, 639.0, 993.0, 1509.0, 2303.0, 3631.0, 5509.0, 9055.0, 15051.0, 25021.0, 42697.0, 72637.0, 119276.0, 175729.0, 193388.0, 147759.0, 93262.0, 55786.0, 32657.0, 18930.0, 11430.0, 7014.0, 4479.0, 2794.0, 1780.0, 1247.0, 790.0, 535.0, 379.0, 263.0, 184.0, 115.0, 82.0, 70.0, 44.0, 19.0, 24.0, 14.0, 14.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0], "bins": [-13.7109375, -13.298583984375, -12.88623046875, -12.473876953125, -12.0615234375, -11.649169921875, -11.23681640625, -10.824462890625, -10.412109375, -9.999755859375, -9.58740234375, -9.175048828125, -8.7626953125, -8.350341796875, -7.93798828125, -7.525634765625, -7.11328125, -6.700927734375, -6.28857421875, -5.876220703125, -5.4638671875, -5.051513671875, -4.63916015625, -4.226806640625, -3.814453125, -3.402099609375, -2.98974609375, -2.577392578125, -2.1650390625, -1.752685546875, -1.34033203125, -0.927978515625, -0.515625, -0.103271484375, 0.30908203125, 0.721435546875, 1.1337890625, 1.546142578125, 1.95849609375, 2.370849609375, 2.783203125, 3.195556640625, 3.60791015625, 4.020263671875, 4.4326171875, 4.844970703125, 5.25732421875, 5.669677734375, 6.08203125, 6.494384765625, 6.90673828125, 7.319091796875, 7.7314453125, 8.143798828125, 8.55615234375, 8.968505859375, 9.380859375, 9.793212890625, 10.20556640625, 10.617919921875, 11.0302734375, 11.442626953125, 11.85498046875, 12.267333984375, 12.6796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 0.0, 10.0, 8.0, 12.0, 6.0, 8.0, 18.0, 18.0, 20.0, 38.0, 24.0, 32.0, 45.0, 36.0, 40.0, 27.0, 43.0, 49.0, 59.0, 52.0, 38.0, 51.0, 47.0, 37.0, 42.0, 28.0, 31.0, 32.0, 20.0, 22.0, 13.0, 20.0, 5.0, 4.0, 7.0, 14.0, 9.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004608631134033203, -0.00044594332575798035, -0.0004310235381126404, -0.0004161037504673004, -0.00040118396282196045, -0.0003862641751766205, -0.0003713443875312805, -0.00035642459988594055, -0.0003415048122406006, -0.0003265850245952606, -0.00031166523694992065, -0.0002967454493045807, -0.0002818256616592407, -0.00026690587401390076, -0.0002519860863685608, -0.00023706629872322083, -0.00022214651107788086, -0.0002072267234325409, -0.00019230693578720093, -0.00017738714814186096, -0.000162467360496521, -0.00014754757285118103, -0.00013262778520584106, -0.0001177079975605011, -0.00010278820991516113, -8.786842226982117e-05, -7.29486346244812e-05, -5.8028846979141235e-05, -4.310905933380127e-05, -2.8189271688461304e-05, -1.3269484043121338e-05, 1.650303602218628e-06, 1.6570091247558594e-05, 3.148987889289856e-05, 4.6409666538238525e-05, 6.132945418357849e-05, 7.624924182891846e-05, 9.116902947425842e-05, 0.00010608881711959839, 0.00012100860476493835, 0.00013592839241027832, 0.00015084818005561829, 0.00016576796770095825, 0.00018068775534629822, 0.00019560754299163818, 0.00021052733063697815, 0.00022544711828231812, 0.00024036690592765808, 0.00025528669357299805, 0.000270206481218338, 0.000285126268863678, 0.00030004605650901794, 0.0003149658441543579, 0.0003298856317996979, 0.00034480541944503784, 0.0003597252070903778, 0.0003746449947357178, 0.00038956478238105774, 0.0004044845700263977, 0.00041940435767173767, 0.00043432414531707764, 0.0004492439329624176, 0.00046416372060775757, 0.00047908350825309753, 0.0004940032958984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 22.0, 17.0, 39.0, 60.0, 73.0, 122.0, 167.0, 281.0, 407.0, 646.0, 967.0, 1549.0, 2317.0, 3609.0, 5952.0, 9654.0, 15679.0, 25219.0, 41017.0, 64428.0, 96241.0, 130339.0, 152058.0, 147127.0, 118588.0, 84410.0, 55458.0, 34641.0, 21764.0, 13241.0, 8290.0, 5194.0, 3175.0, 2062.0, 1260.0, 840.0, 544.0, 355.0, 254.0, 151.0, 102.0, 66.0, 42.0, 32.0, 21.0, 18.0, 11.0, 8.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.1796875, -12.765625, -12.3515625, -11.9375, -11.5234375, -11.109375, -10.6953125, -10.28125, -9.8671875, -9.453125, -9.0390625, -8.625, -8.2109375, -7.796875, -7.3828125, -6.96875, -6.5546875, -6.140625, -5.7265625, -5.3125, -4.8984375, -4.484375, -4.0703125, -3.65625, -3.2421875, -2.828125, -2.4140625, -2.0, -1.5859375, -1.171875, -0.7578125, -0.34375, 0.0703125, 0.484375, 0.8984375, 1.3125, 1.7265625, 2.140625, 2.5546875, 2.96875, 3.3828125, 3.796875, 4.2109375, 4.625, 5.0390625, 5.453125, 5.8671875, 6.28125, 6.6953125, 7.109375, 7.5234375, 7.9375, 8.3515625, 8.765625, 9.1796875, 9.59375, 10.0078125, 10.421875, 10.8359375, 11.25, 11.6640625, 12.078125, 12.4921875, 12.90625, 13.3203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 15.0, 28.0, 23.0, 34.0, 35.0, 35.0, 54.0, 51.0, 67.0, 52.0, 52.0, 65.0, 48.0, 51.0, 64.0, 30.0, 37.0, 32.0, 33.0, 29.0, 16.0, 20.0, 13.0, 14.0, 14.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.96875, -4.82220458984375, -4.6756591796875, -4.52911376953125, -4.382568359375, -4.23602294921875, -4.0894775390625, -3.94293212890625, -3.79638671875, -3.64984130859375, -3.5032958984375, -3.35675048828125, -3.210205078125, -3.06365966796875, -2.9171142578125, -2.77056884765625, -2.6240234375, -2.47747802734375, -2.3309326171875, -2.18438720703125, -2.037841796875, -1.89129638671875, -1.7447509765625, -1.59820556640625, -1.45166015625, -1.30511474609375, -1.1585693359375, -1.01202392578125, -0.865478515625, -0.71893310546875, -0.5723876953125, -0.42584228515625, -0.279296875, -0.13275146484375, 0.0137939453125, 0.16033935546875, 0.306884765625, 0.45343017578125, 0.5999755859375, 0.74652099609375, 0.89306640625, 1.03961181640625, 1.1861572265625, 1.33270263671875, 1.479248046875, 1.62579345703125, 1.7723388671875, 1.91888427734375, 2.0654296875, 2.21197509765625, 2.3585205078125, 2.50506591796875, 2.651611328125, 2.79815673828125, 2.9447021484375, 3.09124755859375, 3.23779296875, 3.38433837890625, 3.5308837890625, 3.67742919921875, 3.823974609375, 3.97052001953125, 4.1170654296875, 4.26361083984375, 4.41015625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 9.0, 7.0, 12.0, 10.0, 15.0, 12.0, 23.0, 24.0, 28.0, 35.0, 31.0, 55.0, 52.0, 48.0, 40.0, 44.0, 61.0, 56.0, 50.0, 57.0, 55.0, 30.0, 40.0, 33.0, 28.0, 16.0, 16.0, 21.0, 13.0, 14.0, 14.0, 7.0, 8.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.911890029907227, -25.99489402770996, -25.077896118164062, -24.160900115966797, -23.24390411376953, -22.326908111572266, -21.409912109375, -20.4929141998291, -19.575918197631836, -18.65892219543457, -17.741924285888672, -16.824928283691406, -15.90793228149414, -14.990936279296875, -14.073939323425293, -13.156942367553711, -12.239946365356445, -11.32295036315918, -10.405953407287598, -9.488956451416016, -8.57196044921875, -7.654963970184326, -6.737967491149902, -5.8209710121154785, -4.903974533081055, -3.986978054046631, -3.069981575012207, -2.152985095977783, -1.2359886169433594, -0.31899213790893555, 0.5980043411254883, 1.515000820159912, 2.431997299194336, 3.3489937782287598, 4.265990257263184, 5.182986736297607, 6.099983215332031, 7.016979694366455, 7.933976173400879, 8.850973129272461, 9.767969131469727, 10.684965133666992, 11.601962089538574, 12.518959045410156, 13.435955047607422, 14.352951049804688, 15.26994800567627, 16.18694496154785, 17.103940963745117, 18.020936965942383, 18.93793487548828, 19.854930877685547, 20.771926879882812, 21.688922882080078, 22.605918884277344, 23.522916793823242, 24.439912796020508, 25.356908798217773, 26.273906707763672, 27.190902709960938, 28.107898712158203, 29.02489471435547, 29.941890716552734, 30.858888626098633, 31.7758846282959]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 3.0, 3.0, 8.0, 3.0, 16.0, 13.0, 9.0, 12.0, 21.0, 24.0, 25.0, 37.0, 30.0, 32.0, 32.0, 36.0, 42.0, 46.0, 44.0, 47.0, 45.0, 37.0, 38.0, 38.0, 44.0, 35.0, 34.0, 33.0, 32.0, 28.0, 25.0, 21.0, 18.0, 19.0, 12.0, 11.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.62870216369629, -21.98770523071289, -21.34670639038086, -20.70570945739746, -20.064712524414062, -19.42371368408203, -18.782716751098633, -18.141719818115234, -17.500720977783203, -16.859724044799805, -16.218725204467773, -15.577728271484375, -14.936731338500977, -14.295733451843262, -13.654735565185547, -13.013738632202148, -12.37274169921875, -11.731743812561035, -11.090746879577637, -10.449748992919922, -9.808752059936523, -9.167754173278809, -8.526756286621094, -7.885758876800537, -7.2447614669799805, -6.603764057159424, -5.962766647338867, -5.321768760681152, -4.680771350860596, -4.039773941040039, -3.3987762928009033, -2.7577786445617676, -2.116781234741211, -1.4757837057113647, -0.8347861766815186, -0.19378864765167236, 0.44720888137817383, 1.0882062911987305, 1.7292039394378662, 2.370201587677002, 3.0111989974975586, 3.6521964073181152, 4.293193817138672, 4.934191703796387, 5.575189113616943, 6.2161865234375, 6.857184410095215, 7.4981818199157715, 8.139179229736328, 8.780177116394043, 9.421174049377441, 10.062171936035156, 10.703168869018555, 11.34416675567627, 11.985164642333984, 12.626161575317383, 13.267159461975098, 13.908157348632812, 14.549154281616211, 15.190152168273926, 15.83115005493164, 16.47214698791504, 17.113143920898438, 17.75414276123047, 18.395139694213867]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 9.0, 17.0, 23.0, 25.0, 37.0, 60.0, 72.0, 116.0, 149.0, 295.0, 411.0, 655.0, 1029.0, 1525.0, 2357.0, 3675.0, 5678.0, 8490.0, 13218.0, 20352.0, 30561.0, 44547.0, 63298.0, 85558.0, 105655.0, 120881.0, 121861.0, 111085.0, 90417.0, 68678.0, 49218.0, 33461.0, 22466.0, 14869.0, 9735.0, 6374.0, 4036.0, 2761.0, 1669.0, 1139.0, 721.0, 473.0, 321.0, 204.0, 134.0, 81.0, 59.0, 33.0, 25.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-16.296875, -15.804931640625, -15.31298828125, -14.821044921875, -14.3291015625, -13.837158203125, -13.34521484375, -12.853271484375, -12.361328125, -11.869384765625, -11.37744140625, -10.885498046875, -10.3935546875, -9.901611328125, -9.40966796875, -8.917724609375, -8.42578125, -7.933837890625, -7.44189453125, -6.949951171875, -6.4580078125, -5.966064453125, -5.47412109375, -4.982177734375, -4.490234375, -3.998291015625, -3.50634765625, -3.014404296875, -2.5224609375, -2.030517578125, -1.53857421875, -1.046630859375, -0.5546875, -0.062744140625, 0.42919921875, 0.921142578125, 1.4130859375, 1.905029296875, 2.39697265625, 2.888916015625, 3.380859375, 3.872802734375, 4.36474609375, 4.856689453125, 5.3486328125, 5.840576171875, 6.33251953125, 6.824462890625, 7.31640625, 7.808349609375, 8.30029296875, 8.792236328125, 9.2841796875, 9.776123046875, 10.26806640625, 10.760009765625, 11.251953125, 11.743896484375, 12.23583984375, 12.727783203125, 13.2197265625, 13.711669921875, 14.20361328125, 14.695556640625, 15.1875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 6.0, 10.0, 7.0, 14.0, 11.0, 20.0, 23.0, 31.0, 36.0, 28.0, 37.0, 40.0, 42.0, 47.0, 58.0, 47.0, 50.0, 60.0, 49.0, 42.0, 35.0, 38.0, 29.0, 36.0, 30.0, 26.0, 23.0, 11.0, 19.0, 15.0, 13.0, 9.0, 7.0, 9.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.34375, -20.591064453125, -19.83837890625, -19.085693359375, -18.3330078125, -17.580322265625, -16.82763671875, -16.074951171875, -15.322265625, -14.569580078125, -13.81689453125, -13.064208984375, -12.3115234375, -11.558837890625, -10.80615234375, -10.053466796875, -9.30078125, -8.548095703125, -7.79541015625, -7.042724609375, -6.2900390625, -5.537353515625, -4.78466796875, -4.031982421875, -3.279296875, -2.526611328125, -1.77392578125, -1.021240234375, -0.2685546875, 0.484130859375, 1.23681640625, 1.989501953125, 2.7421875, 3.494873046875, 4.24755859375, 5.000244140625, 5.7529296875, 6.505615234375, 7.25830078125, 8.010986328125, 8.763671875, 9.516357421875, 10.26904296875, 11.021728515625, 11.7744140625, 12.527099609375, 13.27978515625, 14.032470703125, 14.78515625, 15.537841796875, 16.29052734375, 17.043212890625, 17.7958984375, 18.548583984375, 19.30126953125, 20.053955078125, 20.806640625, 21.559326171875, 22.31201171875, 23.064697265625, 23.8173828125, 24.570068359375, 25.32275390625, 26.075439453125, 26.828125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 9.0, 13.0, 8.0, 26.0, 34.0, 49.0, 91.0, 146.0, 232.0, 331.0, 561.0, 995.0, 1712.0, 2935.0, 4738.0, 7697.0, 12620.0, 20362.0, 32117.0, 49470.0, 72639.0, 98912.0, 121853.0, 134723.0, 129206.0, 109725.0, 83667.0, 59351.0, 39579.0, 25039.0, 15588.0, 9508.0, 5809.0, 3483.0, 2087.0, 1280.0, 770.0, 474.0, 268.0, 179.0, 115.0, 49.0, 31.0, 31.0, 23.0, 13.0, 5.0, 5.0, 5.0, 6.0, 0.0, 1.0], "bins": [-22.125, -21.505615234375, -20.88623046875, -20.266845703125, -19.6474609375, -19.028076171875, -18.40869140625, -17.789306640625, -17.169921875, -16.550537109375, -15.93115234375, -15.311767578125, -14.6923828125, -14.072998046875, -13.45361328125, -12.834228515625, -12.21484375, -11.595458984375, -10.97607421875, -10.356689453125, -9.7373046875, -9.117919921875, -8.49853515625, -7.879150390625, -7.259765625, -6.640380859375, -6.02099609375, -5.401611328125, -4.7822265625, -4.162841796875, -3.54345703125, -2.924072265625, -2.3046875, -1.685302734375, -1.06591796875, -0.446533203125, 0.1728515625, 0.792236328125, 1.41162109375, 2.031005859375, 2.650390625, 3.269775390625, 3.88916015625, 4.508544921875, 5.1279296875, 5.747314453125, 6.36669921875, 6.986083984375, 7.60546875, 8.224853515625, 8.84423828125, 9.463623046875, 10.0830078125, 10.702392578125, 11.32177734375, 11.941162109375, 12.560546875, 13.179931640625, 13.79931640625, 14.418701171875, 15.0380859375, 15.657470703125, 16.27685546875, 16.896240234375, 17.515625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 16.0, 8.0, 11.0, 19.0, 18.0, 20.0, 20.0, 27.0, 30.0, 34.0, 33.0, 38.0, 35.0, 38.0, 43.0, 41.0, 41.0, 38.0, 35.0, 32.0, 46.0, 37.0, 25.0, 40.0, 38.0, 44.0, 21.0, 21.0, 17.0, 18.0, 17.0, 18.0, 13.0, 13.0, 9.0, 13.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-14.7421875, -14.2867431640625, -13.831298828125, -13.3758544921875, -12.92041015625, -12.4649658203125, -12.009521484375, -11.5540771484375, -11.0986328125, -10.6431884765625, -10.187744140625, -9.7322998046875, -9.27685546875, -8.8214111328125, -8.365966796875, -7.9105224609375, -7.455078125, -6.9996337890625, -6.544189453125, -6.0887451171875, -5.63330078125, -5.1778564453125, -4.722412109375, -4.2669677734375, -3.8115234375, -3.3560791015625, -2.900634765625, -2.4451904296875, -1.98974609375, -1.5343017578125, -1.078857421875, -0.6234130859375, -0.16796875, 0.2874755859375, 0.742919921875, 1.1983642578125, 1.65380859375, 2.1092529296875, 2.564697265625, 3.0201416015625, 3.4755859375, 3.9310302734375, 4.386474609375, 4.8419189453125, 5.29736328125, 5.7528076171875, 6.208251953125, 6.6636962890625, 7.119140625, 7.5745849609375, 8.030029296875, 8.4854736328125, 8.94091796875, 9.3963623046875, 9.851806640625, 10.3072509765625, 10.7626953125, 11.2181396484375, 11.673583984375, 12.1290283203125, 12.58447265625, 13.0399169921875, 13.495361328125, 13.9508056640625, 14.40625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 12.0, 11.0, 17.0, 24.0, 32.0, 51.0, 87.0, 121.0, 189.0, 323.0, 585.0, 932.0, 1593.0, 2826.0, 5643.0, 12174.0, 28910.0, 74286.0, 180980.0, 301271.0, 246349.0, 112992.0, 44623.0, 17607.0, 7921.0, 3991.0, 2026.0, 1061.0, 717.0, 446.0, 258.0, 157.0, 111.0, 65.0, 44.0, 40.0, 19.0, 26.0, 9.0, 9.0, 1.0, 5.0, 1.0, 4.0, 1.0, 2.0], "bins": [-28.40625, -27.6533203125, -26.900390625, -26.1474609375, -25.39453125, -24.6416015625, -23.888671875, -23.1357421875, -22.3828125, -21.6298828125, -20.876953125, -20.1240234375, -19.37109375, -18.6181640625, -17.865234375, -17.1123046875, -16.359375, -15.6064453125, -14.853515625, -14.1005859375, -13.34765625, -12.5947265625, -11.841796875, -11.0888671875, -10.3359375, -9.5830078125, -8.830078125, -8.0771484375, -7.32421875, -6.5712890625, -5.818359375, -5.0654296875, -4.3125, -3.5595703125, -2.806640625, -2.0537109375, -1.30078125, -0.5478515625, 0.205078125, 0.9580078125, 1.7109375, 2.4638671875, 3.216796875, 3.9697265625, 4.72265625, 5.4755859375, 6.228515625, 6.9814453125, 7.734375, 8.4873046875, 9.240234375, 9.9931640625, 10.74609375, 11.4990234375, 12.251953125, 13.0048828125, 13.7578125, 14.5107421875, 15.263671875, 16.0166015625, 16.76953125, 17.5224609375, 18.275390625, 19.0283203125, 19.78125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 6.0, 1.0, 12.0, 10.0, 18.0, 21.0, 29.0, 37.0, 54.0, 77.0, 84.0, 79.0, 98.0, 74.0, 76.0, 64.0, 62.0, 44.0, 28.0, 34.0, 27.0, 13.0, 13.0, 10.0, 4.0, 3.0, 9.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015993118286132812, -0.0015435665845870972, -0.001487821340560913, -0.001432076096534729, -0.001376330852508545, -0.0013205856084823608, -0.0012648403644561768, -0.0012090951204299927, -0.0011533498764038086, -0.0010976046323776245, -0.0010418593883514404, -0.0009861141443252563, -0.0009303689002990723, -0.0008746236562728882, -0.0008188784122467041, -0.00076313316822052, -0.0007073879241943359, -0.0006516426801681519, -0.0005958974361419678, -0.0005401521921157837, -0.0004844069480895996, -0.00042866170406341553, -0.00037291646003723145, -0.00031717121601104736, -0.0002614259719848633, -0.0002056807279586792, -0.00014993548393249512, -9.419023990631104e-05, -3.844499588012695e-05, 1.730024814605713e-05, 7.304549217224121e-05, 0.0001287907361984253, 0.00018453598022460938, 0.00024028122425079346, 0.00029602646827697754, 0.0003517717123031616, 0.0004075169563293457, 0.0004632622003555298, 0.0005190074443817139, 0.000574752688407898, 0.000630497932434082, 0.0006862431764602661, 0.0007419884204864502, 0.0007977336645126343, 0.0008534789085388184, 0.0009092241525650024, 0.0009649693965911865, 0.0010207146406173706, 0.0010764598846435547, 0.0011322051286697388, 0.0011879503726959229, 0.001243695616722107, 0.001299440860748291, 0.001355186104774475, 0.0014109313488006592, 0.0014666765928268433, 0.0015224218368530273, 0.0015781670808792114, 0.0016339123249053955, 0.0016896575689315796, 0.0017454028129577637, 0.0018011480569839478, 0.0018568933010101318, 0.001912638545036316, 0.0019683837890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 14.0, 16.0, 18.0, 31.0, 46.0, 73.0, 91.0, 133.0, 182.0, 210.0, 306.0, 487.0, 637.0, 1005.0, 1532.0, 2451.0, 3919.0, 6651.0, 11370.0, 20602.0, 38271.0, 70800.0, 122983.0, 179367.0, 198224.0, 160730.0, 100995.0, 56560.0, 30463.0, 16360.0, 9231.0, 5365.0, 3235.0, 2036.0, 1282.0, 869.0, 621.0, 395.0, 304.0, 196.0, 143.0, 101.0, 83.0, 47.0, 33.0, 27.0, 17.0, 11.0, 5.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-16.0, -15.489013671875, -14.97802734375, -14.467041015625, -13.9560546875, -13.445068359375, -12.93408203125, -12.423095703125, -11.912109375, -11.401123046875, -10.89013671875, -10.379150390625, -9.8681640625, -9.357177734375, -8.84619140625, -8.335205078125, -7.82421875, -7.313232421875, -6.80224609375, -6.291259765625, -5.7802734375, -5.269287109375, -4.75830078125, -4.247314453125, -3.736328125, -3.225341796875, -2.71435546875, -2.203369140625, -1.6923828125, -1.181396484375, -0.67041015625, -0.159423828125, 0.3515625, 0.862548828125, 1.37353515625, 1.884521484375, 2.3955078125, 2.906494140625, 3.41748046875, 3.928466796875, 4.439453125, 4.950439453125, 5.46142578125, 5.972412109375, 6.4833984375, 6.994384765625, 7.50537109375, 8.016357421875, 8.52734375, 9.038330078125, 9.54931640625, 10.060302734375, 10.5712890625, 11.082275390625, 11.59326171875, 12.104248046875, 12.615234375, 13.126220703125, 13.63720703125, 14.148193359375, 14.6591796875, 15.170166015625, 15.68115234375, 16.192138671875, 16.703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 11.0, 8.0, 11.0, 9.0, 18.0, 18.0, 19.0, 24.0, 29.0, 25.0, 37.0, 40.0, 51.0, 49.0, 47.0, 58.0, 68.0, 46.0, 68.0, 55.0, 57.0, 28.0, 48.0, 21.0, 17.0, 28.0, 16.0, 12.0, 15.0, 4.0, 10.0, 5.0, 10.0, 3.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.71484375, -5.55792236328125, -5.4010009765625, -5.24407958984375, -5.087158203125, -4.93023681640625, -4.7733154296875, -4.61639404296875, -4.45947265625, -4.30255126953125, -4.1456298828125, -3.98870849609375, -3.831787109375, -3.67486572265625, -3.5179443359375, -3.36102294921875, -3.2041015625, -3.04718017578125, -2.8902587890625, -2.73333740234375, -2.576416015625, -2.41949462890625, -2.2625732421875, -2.10565185546875, -1.94873046875, -1.79180908203125, -1.6348876953125, -1.47796630859375, -1.321044921875, -1.16412353515625, -1.0072021484375, -0.85028076171875, -0.693359375, -0.53643798828125, -0.3795166015625, -0.22259521484375, -0.065673828125, 0.09124755859375, 0.2481689453125, 0.40509033203125, 0.56201171875, 0.71893310546875, 0.8758544921875, 1.03277587890625, 1.189697265625, 1.34661865234375, 1.5035400390625, 1.66046142578125, 1.8173828125, 1.97430419921875, 2.1312255859375, 2.28814697265625, 2.445068359375, 2.60198974609375, 2.7589111328125, 2.91583251953125, 3.07275390625, 3.22967529296875, 3.3865966796875, 3.54351806640625, 3.700439453125, 3.85736083984375, 4.0142822265625, 4.17120361328125, 4.328125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 11.0, 8.0, 9.0, 8.0, 12.0, 18.0, 25.0, 26.0, 31.0, 37.0, 36.0, 36.0, 48.0, 49.0, 61.0, 59.0, 65.0, 61.0, 56.0, 52.0, 59.0, 41.0, 25.0, 18.0, 22.0, 20.0, 25.0, 17.0, 13.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.86786460876465, -30.837194442749023, -29.8065242767334, -28.775854110717773, -27.745182037353516, -26.71451187133789, -25.683841705322266, -24.65317153930664, -23.622501373291016, -22.59183120727539, -21.561161041259766, -20.53049087524414, -19.499820709228516, -18.46915054321289, -17.438478469848633, -16.407808303833008, -15.377138137817383, -14.346467971801758, -13.315797805786133, -12.285126686096191, -11.254456520080566, -10.223786354064941, -9.193115234375, -8.162445068359375, -7.13177490234375, -6.101104736328125, -5.070434093475342, -4.039763450622559, -3.0090932846069336, -1.9784231185913086, -0.9477524757385254, 0.08291816711425781, 1.11358642578125, 2.144256830215454, 3.174927234649658, 4.205597877502441, 5.236268043518066, 6.266938209533691, 7.297608852386475, 8.328279495239258, 9.358949661254883, 10.389619827270508, 11.420289993286133, 12.450961112976074, 13.4816312789917, 14.512301445007324, 15.542972564697266, 16.57364273071289, 17.604312896728516, 18.63498306274414, 19.665653228759766, 20.69632339477539, 21.726993560791016, 22.75766372680664, 23.7883358001709, 24.819005966186523, 25.84967613220215, 26.880346298217773, 27.9110164642334, 28.941686630249023, 29.97235870361328, 31.003028869628906, 32.03369903564453, 33.064369201660156, 34.09503936767578]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 8.0, 12.0, 7.0, 9.0, 13.0, 19.0, 19.0, 18.0, 20.0, 24.0, 24.0, 22.0, 29.0, 28.0, 41.0, 33.0, 36.0, 43.0, 35.0, 41.0, 33.0, 43.0, 35.0, 34.0, 26.0, 45.0, 31.0, 30.0, 21.0, 28.0, 18.0, 14.0, 23.0, 18.0, 18.0, 15.0, 10.0, 11.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.195226669311523, -17.602327346801758, -17.009428024291992, -16.416528701782227, -15.823630332946777, -15.230731010437012, -14.637832641601562, -14.044933319091797, -13.452033996582031, -12.859134674072266, -12.2662353515625, -11.67333698272705, -11.080437660217285, -10.48753833770752, -9.89463996887207, -9.301740646362305, -8.708841323852539, -8.115942001342773, -7.523043155670166, -6.930144309997559, -6.337244987487793, -5.744345664978027, -5.15144681930542, -4.5585479736328125, -3.965648651123047, -3.3727495670318604, -2.779850482940674, -2.1869513988494873, -1.5940523147583008, -1.0011532306671143, -0.40825414657592773, 0.1846446990966797, 0.7775421142578125, 1.370441198348999, 1.9633402824401855, 2.556239366531372, 3.1491384506225586, 3.742037534713745, 4.334936618804932, 4.927835464477539, 5.520734786987305, 6.11363410949707, 6.706532955169678, 7.299431800842285, 7.892331123352051, 8.485230445861816, 9.078128814697266, 9.671028137207031, 10.263927459716797, 10.856826782226562, 11.449726104736328, 12.042624473571777, 12.635523796081543, 13.228423118591309, 13.821321487426758, 14.414220809936523, 15.007120132446289, 15.600019454956055, 16.19291877746582, 16.785818099975586, 17.37871551513672, 17.971614837646484, 18.56451416015625, 19.157413482666016, 19.75031280517578]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 15.0, 14.0, 24.0, 36.0, 72.0, 120.0, 212.0, 327.0, 619.0, 1020.0, 1913.0, 3403.0, 6571.0, 12677.0, 25033.0, 51337.0, 106052.0, 221711.0, 443756.0, 768107.0, 952362.0, 752088.0, 429892.0, 213219.0, 102074.0, 49184.0, 24282.0, 12371.0, 6616.0, 3675.0, 2118.0, 1237.0, 760.0, 446.0, 336.0, 208.0, 116.0, 86.0, 63.0, 35.0, 30.0, 17.0, 16.0, 14.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.15625, -32.03125, -30.90625, -29.78125, -28.65625, -27.53125, -26.40625, -25.28125, -24.15625, -23.03125, -21.90625, -20.78125, -19.65625, -18.53125, -17.40625, -16.28125, -15.15625, -14.03125, -12.90625, -11.78125, -10.65625, -9.53125, -8.40625, -7.28125, -6.15625, -5.03125, -3.90625, -2.78125, -1.65625, -0.53125, 0.59375, 1.71875, 2.84375, 3.96875, 5.09375, 6.21875, 7.34375, 8.46875, 9.59375, 10.71875, 11.84375, 12.96875, 14.09375, 15.21875, 16.34375, 17.46875, 18.59375, 19.71875, 20.84375, 21.96875, 23.09375, 24.21875, 25.34375, 26.46875, 27.59375, 28.71875, 29.84375, 30.96875, 32.09375, 33.21875, 34.34375, 35.46875, 36.59375, 37.71875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 5.0, 9.0, 9.0, 4.0, 10.0, 11.0, 14.0, 26.0, 22.0, 18.0, 34.0, 26.0, 42.0, 27.0, 35.0, 43.0, 38.0, 41.0, 45.0, 43.0, 44.0, 42.0, 44.0, 32.0, 47.0, 33.0, 36.0, 25.0, 30.0, 28.0, 19.0, 17.0, 16.0, 18.0, 7.0, 20.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.203125, -16.57861328125, -15.9541015625, -15.32958984375, -14.705078125, -14.08056640625, -13.4560546875, -12.83154296875, -12.20703125, -11.58251953125, -10.9580078125, -10.33349609375, -9.708984375, -9.08447265625, -8.4599609375, -7.83544921875, -7.2109375, -6.58642578125, -5.9619140625, -5.33740234375, -4.712890625, -4.08837890625, -3.4638671875, -2.83935546875, -2.21484375, -1.59033203125, -0.9658203125, -0.34130859375, 0.283203125, 0.90771484375, 1.5322265625, 2.15673828125, 2.78125, 3.40576171875, 4.0302734375, 4.65478515625, 5.279296875, 5.90380859375, 6.5283203125, 7.15283203125, 7.77734375, 8.40185546875, 9.0263671875, 9.65087890625, 10.275390625, 10.89990234375, 11.5244140625, 12.14892578125, 12.7734375, 13.39794921875, 14.0224609375, 14.64697265625, 15.271484375, 15.89599609375, 16.5205078125, 17.14501953125, 17.76953125, 18.39404296875, 19.0185546875, 19.64306640625, 20.267578125, 20.89208984375, 21.5166015625, 22.14111328125, 22.765625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 13.0, 22.0, 37.0, 56.0, 87.0, 139.0, 248.0, 415.0, 716.0, 1306.0, 2202.0, 3941.0, 7495.0, 14466.0, 27980.0, 55203.0, 109322.0, 215476.0, 406620.0, 673930.0, 864530.0, 761815.0, 494214.0, 270312.0, 139035.0, 70454.0, 35428.0, 18101.0, 9477.0, 4997.0, 2705.0, 1512.0, 808.0, 501.0, 257.0, 164.0, 125.0, 44.0, 51.0, 24.0, 19.0, 10.0, 8.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-40.65625, -39.2861328125, -37.916015625, -36.5458984375, -35.17578125, -33.8056640625, -32.435546875, -31.0654296875, -29.6953125, -28.3251953125, -26.955078125, -25.5849609375, -24.21484375, -22.8447265625, -21.474609375, -20.1044921875, -18.734375, -17.3642578125, -15.994140625, -14.6240234375, -13.25390625, -11.8837890625, -10.513671875, -9.1435546875, -7.7734375, -6.4033203125, -5.033203125, -3.6630859375, -2.29296875, -0.9228515625, 0.447265625, 1.8173828125, 3.1875, 4.5576171875, 5.927734375, 7.2978515625, 8.66796875, 10.0380859375, 11.408203125, 12.7783203125, 14.1484375, 15.5185546875, 16.888671875, 18.2587890625, 19.62890625, 20.9990234375, 22.369140625, 23.7392578125, 25.109375, 26.4794921875, 27.849609375, 29.2197265625, 30.58984375, 31.9599609375, 33.330078125, 34.7001953125, 36.0703125, 37.4404296875, 38.810546875, 40.1806640625, 41.55078125, 42.9208984375, 44.291015625, 45.6611328125, 47.03125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 5.0, 15.0, 20.0, 19.0, 31.0, 49.0, 70.0, 85.0, 98.0, 110.0, 142.0, 193.0, 209.0, 243.0, 278.0, 295.0, 309.0, 240.0, 253.0, 263.0, 211.0, 203.0, 177.0, 129.0, 99.0, 92.0, 55.0, 52.0, 35.0, 19.0, 14.0, 9.0, 11.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.7841796875, -12.333984375, -11.8837890625, -11.43359375, -10.9833984375, -10.533203125, -10.0830078125, -9.6328125, -9.1826171875, -8.732421875, -8.2822265625, -7.83203125, -7.3818359375, -6.931640625, -6.4814453125, -6.03125, -5.5810546875, -5.130859375, -4.6806640625, -4.23046875, -3.7802734375, -3.330078125, -2.8798828125, -2.4296875, -1.9794921875, -1.529296875, -1.0791015625, -0.62890625, -0.1787109375, 0.271484375, 0.7216796875, 1.171875, 1.6220703125, 2.072265625, 2.5224609375, 2.97265625, 3.4228515625, 3.873046875, 4.3232421875, 4.7734375, 5.2236328125, 5.673828125, 6.1240234375, 6.57421875, 7.0244140625, 7.474609375, 7.9248046875, 8.375, 8.8251953125, 9.275390625, 9.7255859375, 10.17578125, 10.6259765625, 11.076171875, 11.5263671875, 11.9765625, 12.4267578125, 12.876953125, 13.3271484375, 13.77734375, 14.2275390625, 14.677734375, 15.1279296875, 15.578125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 6.0, 11.0, 9.0, 7.0, 8.0, 12.0, 14.0, 22.0, 23.0, 39.0, 33.0, 39.0, 48.0, 52.0, 54.0, 59.0, 51.0, 61.0, 57.0, 50.0, 45.0, 50.0, 37.0, 41.0, 28.0, 24.0, 27.0, 16.0, 15.0, 15.0, 8.0, 8.0, 10.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.26799011230469, -38.92879867553711, -37.58960723876953, -36.25041580200195, -34.911224365234375, -33.5720329284668, -32.23284149169922, -30.893648147583008, -29.55445671081543, -28.21526527404785, -26.876073837280273, -25.536880493164062, -24.197689056396484, -22.858497619628906, -21.519306182861328, -20.18011474609375, -18.840923309326172, -17.501731872558594, -16.162540435791016, -14.823348045349121, -13.484156608581543, -12.144965171813965, -10.80577278137207, -9.466581344604492, -8.127389907836914, -6.788198471069336, -5.4490065574646, -4.109814643859863, -2.770623207092285, -1.431431770324707, -0.0922393798828125, 1.2469520568847656, 2.5861473083496094, 3.9253389835357666, 5.264530658721924, 6.60372257232666, 7.942914009094238, 9.282105445861816, 10.621297836303711, 11.960489273071289, 13.299680709838867, 14.638872146606445, 15.978063583374023, 17.317256927490234, 18.656448364257812, 19.99563980102539, 21.33483123779297, 22.674022674560547, 24.013214111328125, 25.352405548095703, 26.69159698486328, 28.03078842163086, 29.369979858398438, 30.709171295166016, 32.048362731933594, 33.38755798339844, 34.72674560546875, 36.06593704223633, 37.405128479003906, 38.744319915771484, 40.08351135253906, 41.42270278930664, 42.76189422607422, 44.10108947753906, 45.44028091430664]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 8.0, 11.0, 12.0, 11.0, 10.0, 11.0, 13.0, 19.0, 22.0, 20.0, 32.0, 29.0, 25.0, 34.0, 30.0, 43.0, 37.0, 44.0, 30.0, 42.0, 49.0, 37.0, 47.0, 42.0, 32.0, 33.0, 38.0, 35.0, 21.0, 30.0, 15.0, 25.0, 17.0, 16.0, 15.0, 9.0, 10.0, 8.0, 3.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.071855545043945, -23.28384017944336, -22.495824813842773, -21.707809448242188, -20.919795989990234, -20.13178062438965, -19.343765258789062, -18.555749893188477, -17.76773452758789, -16.979719161987305, -16.19170379638672, -15.40368938446045, -14.61567497253418, -13.827659606933594, -13.039644241333008, -12.251628875732422, -11.463615417480469, -10.675600051879883, -9.887585639953613, -9.099570274353027, -8.311555862426758, -7.523540496826172, -6.735525131225586, -5.947510242462158, -5.1594953536987305, -4.371480464935303, -3.583465337753296, -2.795450210571289, -2.0074353218078613, -1.2194204330444336, -0.43140506744384766, 0.3566098213195801, 1.1446247100830078, 1.932639718055725, 2.7206547260284424, 3.508669853210449, 4.296684741973877, 5.084699630737305, 5.872714996337891, 6.660729885101318, 7.448744773864746, 8.236760139465332, 9.024774551391602, 9.812789916992188, 10.600805282592773, 11.388819694519043, 12.176835060119629, 12.964849472045898, 13.752864837646484, 14.54088020324707, 15.32889461517334, 16.11690902709961, 16.904924392700195, 17.69293975830078, 18.480955123901367, 19.268970489501953, 20.056983947753906, 20.844999313354492, 21.633014678955078, 22.42102813720703, 23.209043502807617, 23.997058868408203, 24.78507423400879, 25.573089599609375, 26.36110496520996]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 25.0, 35.0, 52.0, 79.0, 125.0, 227.0, 359.0, 534.0, 880.0, 1439.0, 2376.0, 4033.0, 6682.0, 11290.0, 18888.0, 31628.0, 51661.0, 79990.0, 114212.0, 144557.0, 154445.0, 137468.0, 104078.0, 70747.0, 44858.0, 27375.0, 15999.0, 9703.0, 5937.0, 3390.0, 2083.0, 1340.0, 749.0, 491.0, 293.0, 182.0, 118.0, 64.0, 56.0, 33.0, 19.0, 15.0, 13.0, 11.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.09228515625, -18.4189453125, -17.74560546875, -17.072265625, -16.39892578125, -15.7255859375, -15.05224609375, -14.37890625, -13.70556640625, -13.0322265625, -12.35888671875, -11.685546875, -11.01220703125, -10.3388671875, -9.66552734375, -8.9921875, -8.31884765625, -7.6455078125, -6.97216796875, -6.298828125, -5.62548828125, -4.9521484375, -4.27880859375, -3.60546875, -2.93212890625, -2.2587890625, -1.58544921875, -0.912109375, -0.23876953125, 0.4345703125, 1.10791015625, 1.78125, 2.45458984375, 3.1279296875, 3.80126953125, 4.474609375, 5.14794921875, 5.8212890625, 6.49462890625, 7.16796875, 7.84130859375, 8.5146484375, 9.18798828125, 9.861328125, 10.53466796875, 11.2080078125, 11.88134765625, 12.5546875, 13.22802734375, 13.9013671875, 14.57470703125, 15.248046875, 15.92138671875, 16.5947265625, 17.26806640625, 17.94140625, 18.61474609375, 19.2880859375, 19.96142578125, 20.634765625, 21.30810546875, 21.9814453125, 22.65478515625, 23.328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 3.0, 6.0, 13.0, 11.0, 14.0, 15.0, 22.0, 22.0, 15.0, 32.0, 41.0, 29.0, 34.0, 35.0, 39.0, 40.0, 34.0, 44.0, 42.0, 40.0, 45.0, 34.0, 41.0, 41.0, 28.0, 35.0, 23.0, 37.0, 18.0, 22.0, 19.0, 18.0, 19.0, 17.0, 11.0, 7.0, 6.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-28.265625, -27.398193359375, -26.53076171875, -25.663330078125, -24.7958984375, -23.928466796875, -23.06103515625, -22.193603515625, -21.326171875, -20.458740234375, -19.59130859375, -18.723876953125, -17.8564453125, -16.989013671875, -16.12158203125, -15.254150390625, -14.38671875, -13.519287109375, -12.65185546875, -11.784423828125, -10.9169921875, -10.049560546875, -9.18212890625, -8.314697265625, -7.447265625, -6.579833984375, -5.71240234375, -4.844970703125, -3.9775390625, -3.110107421875, -2.24267578125, -1.375244140625, -0.5078125, 0.359619140625, 1.22705078125, 2.094482421875, 2.9619140625, 3.829345703125, 4.69677734375, 5.564208984375, 6.431640625, 7.299072265625, 8.16650390625, 9.033935546875, 9.9013671875, 10.768798828125, 11.63623046875, 12.503662109375, 13.37109375, 14.238525390625, 15.10595703125, 15.973388671875, 16.8408203125, 17.708251953125, 18.57568359375, 19.443115234375, 20.310546875, 21.177978515625, 22.04541015625, 22.912841796875, 23.7802734375, 24.647705078125, 25.51513671875, 26.382568359375, 27.25]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 15.0, 35.0, 33.0, 54.0, 81.0, 123.0, 181.0, 274.0, 428.0, 658.0, 1081.0, 1672.0, 2774.0, 4861.0, 8562.0, 15882.0, 30241.0, 58614.0, 110490.0, 186474.0, 229798.0, 177056.0, 102331.0, 54406.0, 27931.0, 14834.0, 8158.0, 4529.0, 2571.0, 1550.0, 979.0, 642.0, 401.0, 257.0, 164.0, 115.0, 76.0, 66.0, 54.0, 33.0, 15.0, 12.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.794921875, -30.71484375, -29.634765625, -28.5546875, -27.474609375, -26.39453125, -25.314453125, -24.234375, -23.154296875, -22.07421875, -20.994140625, -19.9140625, -18.833984375, -17.75390625, -16.673828125, -15.59375, -14.513671875, -13.43359375, -12.353515625, -11.2734375, -10.193359375, -9.11328125, -8.033203125, -6.953125, -5.873046875, -4.79296875, -3.712890625, -2.6328125, -1.552734375, -0.47265625, 0.607421875, 1.6875, 2.767578125, 3.84765625, 4.927734375, 6.0078125, 7.087890625, 8.16796875, 9.248046875, 10.328125, 11.408203125, 12.48828125, 13.568359375, 14.6484375, 15.728515625, 16.80859375, 17.888671875, 18.96875, 20.048828125, 21.12890625, 22.208984375, 23.2890625, 24.369140625, 25.44921875, 26.529296875, 27.609375, 28.689453125, 29.76953125, 30.849609375, 31.9296875, 33.009765625, 34.08984375, 35.169921875, 36.25]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 10.0, 9.0, 11.0, 15.0, 13.0, 14.0, 16.0, 24.0, 23.0, 16.0, 27.0, 28.0, 39.0, 31.0, 41.0, 29.0, 48.0, 48.0, 49.0, 47.0, 41.0, 51.0, 31.0, 42.0, 39.0, 37.0, 28.0, 26.0, 15.0, 19.0, 32.0, 11.0, 13.0, 13.0, 14.0, 7.0, 7.0, 9.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.929931640625, -16.39111328125, -15.852294921875, -15.3134765625, -14.774658203125, -14.23583984375, -13.697021484375, -13.158203125, -12.619384765625, -12.08056640625, -11.541748046875, -11.0029296875, -10.464111328125, -9.92529296875, -9.386474609375, -8.84765625, -8.308837890625, -7.77001953125, -7.231201171875, -6.6923828125, -6.153564453125, -5.61474609375, -5.075927734375, -4.537109375, -3.998291015625, -3.45947265625, -2.920654296875, -2.3818359375, -1.843017578125, -1.30419921875, -0.765380859375, -0.2265625, 0.312255859375, 0.85107421875, 1.389892578125, 1.9287109375, 2.467529296875, 3.00634765625, 3.545166015625, 4.083984375, 4.622802734375, 5.16162109375, 5.700439453125, 6.2392578125, 6.778076171875, 7.31689453125, 7.855712890625, 8.39453125, 8.933349609375, 9.47216796875, 10.010986328125, 10.5498046875, 11.088623046875, 11.62744140625, 12.166259765625, 12.705078125, 13.243896484375, 13.78271484375, 14.321533203125, 14.8603515625, 15.399169921875, 15.93798828125, 16.476806640625, 17.015625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 8.0, 11.0, 10.0, 13.0, 28.0, 46.0, 67.0, 91.0, 146.0, 195.0, 375.0, 573.0, 935.0, 1529.0, 2706.0, 4745.0, 8600.0, 16291.0, 32633.0, 65234.0, 127644.0, 218743.0, 242848.0, 157330.0, 81963.0, 40701.0, 20393.0, 10815.0, 5775.0, 3324.0, 1873.0, 1093.0, 642.0, 413.0, 273.0, 169.0, 110.0, 64.0, 54.0, 32.0, 18.0, 15.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.566650390625, -19.83642578125, -19.106201171875, -18.3759765625, -17.645751953125, -16.91552734375, -16.185302734375, -15.455078125, -14.724853515625, -13.99462890625, -13.264404296875, -12.5341796875, -11.803955078125, -11.07373046875, -10.343505859375, -9.61328125, -8.883056640625, -8.15283203125, -7.422607421875, -6.6923828125, -5.962158203125, -5.23193359375, -4.501708984375, -3.771484375, -3.041259765625, -2.31103515625, -1.580810546875, -0.8505859375, -0.120361328125, 0.60986328125, 1.340087890625, 2.0703125, 2.800537109375, 3.53076171875, 4.260986328125, 4.9912109375, 5.721435546875, 6.45166015625, 7.181884765625, 7.912109375, 8.642333984375, 9.37255859375, 10.102783203125, 10.8330078125, 11.563232421875, 12.29345703125, 13.023681640625, 13.75390625, 14.484130859375, 15.21435546875, 15.944580078125, 16.6748046875, 17.405029296875, 18.13525390625, 18.865478515625, 19.595703125, 20.325927734375, 21.05615234375, 21.786376953125, 22.5166015625, 23.246826171875, 23.97705078125, 24.707275390625, 25.4375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 12.0, 11.0, 18.0, 12.0, 22.0, 18.0, 29.0, 27.0, 43.0, 45.0, 47.0, 52.0, 66.0, 69.0, 65.0, 59.0, 60.0, 56.0, 48.0, 47.0, 28.0, 33.0, 24.0, 27.0, 15.0, 7.0, 9.0, 8.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000919342041015625, -0.0008916258811950684, -0.0008639097213745117, -0.0008361935615539551, -0.0008084774017333984, -0.0007807612419128418, -0.0007530450820922852, -0.0007253289222717285, -0.0006976127624511719, -0.0006698966026306152, -0.0006421804428100586, -0.000614464282989502, -0.0005867481231689453, -0.0005590319633483887, -0.000531315803527832, -0.0005035996437072754, -0.00047588348388671875, -0.0004481673240661621, -0.00042045116424560547, -0.00039273500442504883, -0.0003650188446044922, -0.00033730268478393555, -0.0003095865249633789, -0.00028187036514282227, -0.0002541542053222656, -0.00022643804550170898, -0.00019872188568115234, -0.0001710057258605957, -0.00014328956604003906, -0.00011557340621948242, -8.785724639892578e-05, -6.014108657836914e-05, -3.24249267578125e-05, -4.708766937255859e-06, 2.300739288330078e-05, 5.072355270385742e-05, 7.843971252441406e-05, 0.0001061558723449707, 0.00013387203216552734, 0.00016158819198608398, 0.00018930435180664062, 0.00021702051162719727, 0.0002447366714477539, 0.00027245283126831055, 0.0003001689910888672, 0.00032788515090942383, 0.00035560131072998047, 0.0003833174705505371, 0.00041103363037109375, 0.0004387497901916504, 0.00046646595001220703, 0.0004941821098327637, 0.0005218982696533203, 0.000549614429473877, 0.0005773305892944336, 0.0006050467491149902, 0.0006327629089355469, 0.0006604790687561035, 0.0006881952285766602, 0.0007159113883972168, 0.0007436275482177734, 0.0007713437080383301, 0.0007990598678588867, 0.0008267760276794434, 0.0008544921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 8.0, 3.0, 9.0, 15.0, 13.0, 25.0, 40.0, 54.0, 71.0, 104.0, 145.0, 208.0, 268.0, 500.0, 751.0, 1223.0, 2105.0, 3688.0, 6581.0, 12563.0, 24403.0, 46640.0, 88175.0, 149480.0, 205669.0, 198857.0, 138578.0, 79202.0, 41827.0, 21578.0, 11246.0, 6073.0, 3257.0, 1875.0, 1145.0, 744.0, 486.0, 308.0, 162.0, 139.0, 94.0, 60.0, 40.0, 47.0, 27.0, 24.0, 10.0, 12.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.609375, -24.781005859375, -23.95263671875, -23.124267578125, -22.2958984375, -21.467529296875, -20.63916015625, -19.810791015625, -18.982421875, -18.154052734375, -17.32568359375, -16.497314453125, -15.6689453125, -14.840576171875, -14.01220703125, -13.183837890625, -12.35546875, -11.527099609375, -10.69873046875, -9.870361328125, -9.0419921875, -8.213623046875, -7.38525390625, -6.556884765625, -5.728515625, -4.900146484375, -4.07177734375, -3.243408203125, -2.4150390625, -1.586669921875, -0.75830078125, 0.070068359375, 0.8984375, 1.726806640625, 2.55517578125, 3.383544921875, 4.2119140625, 5.040283203125, 5.86865234375, 6.697021484375, 7.525390625, 8.353759765625, 9.18212890625, 10.010498046875, 10.8388671875, 11.667236328125, 12.49560546875, 13.323974609375, 14.15234375, 14.980712890625, 15.80908203125, 16.637451171875, 17.4658203125, 18.294189453125, 19.12255859375, 19.950927734375, 20.779296875, 21.607666015625, 22.43603515625, 23.264404296875, 24.0927734375, 24.921142578125, 25.74951171875, 26.577880859375, 27.40625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 17.0, 12.0, 18.0, 21.0, 30.0, 44.0, 21.0, 37.0, 44.0, 50.0, 53.0, 41.0, 56.0, 53.0, 58.0, 62.0, 63.0, 57.0, 37.0, 32.0, 24.0, 31.0, 19.0, 15.0, 13.0, 14.0, 7.0, 9.0, 10.0, 4.0, 3.0, 2.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.390625, -7.19158935546875, -6.9925537109375, -6.79351806640625, -6.594482421875, -6.39544677734375, -6.1964111328125, -5.99737548828125, -5.79833984375, -5.59930419921875, -5.4002685546875, -5.20123291015625, -5.002197265625, -4.80316162109375, -4.6041259765625, -4.40509033203125, -4.2060546875, -4.00701904296875, -3.8079833984375, -3.60894775390625, -3.409912109375, -3.21087646484375, -3.0118408203125, -2.81280517578125, -2.61376953125, -2.41473388671875, -2.2156982421875, -2.01666259765625, -1.817626953125, -1.61859130859375, -1.4195556640625, -1.22052001953125, -1.021484375, -0.82244873046875, -0.6234130859375, -0.42437744140625, -0.225341796875, -0.02630615234375, 0.1727294921875, 0.37176513671875, 0.57080078125, 0.76983642578125, 0.9688720703125, 1.16790771484375, 1.366943359375, 1.56597900390625, 1.7650146484375, 1.96405029296875, 2.1630859375, 2.36212158203125, 2.5611572265625, 2.76019287109375, 2.959228515625, 3.15826416015625, 3.3572998046875, 3.55633544921875, 3.75537109375, 3.95440673828125, 4.1534423828125, 4.35247802734375, 4.551513671875, 4.75054931640625, 4.9495849609375, 5.14862060546875, 5.34765625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 8.0, 7.0, 9.0, 11.0, 10.0, 13.0, 18.0, 29.0, 30.0, 26.0, 39.0, 51.0, 45.0, 61.0, 44.0, 60.0, 61.0, 57.0, 47.0, 48.0, 51.0, 43.0, 44.0, 32.0, 28.0, 25.0, 17.0, 17.0, 13.0, 8.0, 12.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21493148803711, -39.865421295166016, -38.515907287597656, -37.16639709472656, -35.81688690185547, -34.467376708984375, -33.11786651611328, -31.768352508544922, -30.418842315673828, -29.069332122802734, -27.719820022583008, -26.37030792236328, -25.020797729492188, -23.671287536621094, -22.321775436401367, -20.97226333618164, -19.622753143310547, -18.273242950439453, -16.923730850219727, -15.574219703674316, -14.224708557128906, -12.875197410583496, -11.525686264038086, -10.176175117492676, -8.826663970947266, -7.4771528244018555, -6.127641677856445, -4.778130531311035, -3.428619384765625, -2.079108238220215, -0.7295970916748047, 0.6199140548706055, 1.9694252014160156, 3.318936347961426, 4.668447494506836, 6.017958641052246, 7.367469787597656, 8.716980934143066, 10.066492080688477, 11.416003227233887, 12.765514373779297, 14.115025520324707, 15.464536666870117, 16.814048767089844, 18.163558959960938, 19.51306915283203, 20.862581253051758, 22.212093353271484, 23.561603546142578, 24.911113739013672, 26.2606258392334, 27.610137939453125, 28.95964813232422, 30.309158325195312, 31.65867042541504, 33.008182525634766, 34.35769271850586, 35.70720291137695, 37.05671691894531, 38.406227111816406, 39.7557373046875, 41.105247497558594, 42.45475769042969, 43.80427169799805, 45.15378189086914]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 7.0, 17.0, 9.0, 13.0, 8.0, 15.0, 18.0, 20.0, 25.0, 20.0, 29.0, 27.0, 33.0, 33.0, 34.0, 38.0, 44.0, 40.0, 32.0, 49.0, 48.0, 45.0, 47.0, 38.0, 32.0, 22.0, 44.0, 23.0, 25.0, 20.0, 17.0, 23.0, 13.0, 19.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.21017074584961, -24.417564392089844, -23.624958038330078, -22.832353591918945, -22.03974723815918, -21.247140884399414, -20.45453643798828, -19.661930084228516, -18.86932373046875, -18.076717376708984, -17.28411102294922, -16.491506576538086, -15.69890022277832, -14.906293869018555, -14.113688468933105, -13.321083068847656, -12.52847671508789, -11.735870361328125, -10.943264961242676, -10.150659561157227, -9.358053207397461, -8.565446853637695, -7.772841453552246, -6.980235576629639, -6.187629699707031, -5.395023822784424, -4.602417945861816, -3.809812068939209, -3.0172061920166016, -2.224600315093994, -1.4319944381713867, -0.6393885612487793, 0.1532154083251953, 0.9458212852478027, 1.7384271621704102, 2.5310330390930176, 3.323638916015625, 4.116244792938232, 4.90885066986084, 5.701456546783447, 6.494062423706055, 7.286668300628662, 8.07927417755127, 8.871879577636719, 9.664485931396484, 10.45709228515625, 11.2496976852417, 12.042303085327148, 12.834909439086914, 13.62751579284668, 14.420121192932129, 15.212726593017578, 16.005332946777344, 16.79793930053711, 17.590545654296875, 18.383150100708008, 19.175756454467773, 19.96836280822754, 20.760967254638672, 21.553573608398438, 22.346179962158203, 23.13878631591797, 23.931392669677734, 24.723997116088867, 25.516603469848633]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 16.0, 13.0, 23.0, 43.0, 52.0, 89.0, 136.0, 229.0, 320.0, 545.0, 808.0, 1269.0, 2064.0, 3129.0, 5350.0, 8854.0, 14758.0, 24836.0, 39970.0, 63968.0, 94843.0, 128732.0, 149965.0, 147091.0, 122194.0, 88413.0, 58215.0, 36580.0, 21975.0, 13349.0, 7909.0, 4832.0, 2998.0, 1826.0, 1162.0, 742.0, 445.0, 279.0, 187.0, 117.0, 81.0, 44.0, 33.0, 23.0, 16.0, 8.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.25, -24.405517578125, -23.56103515625, -22.716552734375, -21.8720703125, -21.027587890625, -20.18310546875, -19.338623046875, -18.494140625, -17.649658203125, -16.80517578125, -15.960693359375, -15.1162109375, -14.271728515625, -13.42724609375, -12.582763671875, -11.73828125, -10.893798828125, -10.04931640625, -9.204833984375, -8.3603515625, -7.515869140625, -6.67138671875, -5.826904296875, -4.982421875, -4.137939453125, -3.29345703125, -2.448974609375, -1.6044921875, -0.760009765625, 0.08447265625, 0.928955078125, 1.7734375, 2.617919921875, 3.46240234375, 4.306884765625, 5.1513671875, 5.995849609375, 6.84033203125, 7.684814453125, 8.529296875, 9.373779296875, 10.21826171875, 11.062744140625, 11.9072265625, 12.751708984375, 13.59619140625, 14.440673828125, 15.28515625, 16.129638671875, 16.97412109375, 17.818603515625, 18.6630859375, 19.507568359375, 20.35205078125, 21.196533203125, 22.041015625, 22.885498046875, 23.72998046875, 24.574462890625, 25.4189453125, 26.263427734375, 27.10791015625, 27.952392578125, 28.796875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 11.0, 9.0, 15.0, 20.0, 22.0, 19.0, 12.0, 20.0, 16.0, 44.0, 30.0, 46.0, 33.0, 49.0, 51.0, 57.0, 65.0, 55.0, 42.0, 53.0, 46.0, 43.0, 34.0, 41.0, 31.0, 19.0, 24.0, 13.0, 18.0, 15.0, 11.0, 10.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.169189453125, -28.13525390625, -27.101318359375, -26.0673828125, -25.033447265625, -23.99951171875, -22.965576171875, -21.931640625, -20.897705078125, -19.86376953125, -18.829833984375, -17.7958984375, -16.761962890625, -15.72802734375, -14.694091796875, -13.66015625, -12.626220703125, -11.59228515625, -10.558349609375, -9.5244140625, -8.490478515625, -7.45654296875, -6.422607421875, -5.388671875, -4.354736328125, -3.32080078125, -2.286865234375, -1.2529296875, -0.218994140625, 0.81494140625, 1.848876953125, 2.8828125, 3.916748046875, 4.95068359375, 5.984619140625, 7.0185546875, 8.052490234375, 9.08642578125, 10.120361328125, 11.154296875, 12.188232421875, 13.22216796875, 14.256103515625, 15.2900390625, 16.323974609375, 17.35791015625, 18.391845703125, 19.42578125, 20.459716796875, 21.49365234375, 22.527587890625, 23.5615234375, 24.595458984375, 25.62939453125, 26.663330078125, 27.697265625, 28.731201171875, 29.76513671875, 30.799072265625, 31.8330078125, 32.866943359375, 33.90087890625, 34.934814453125, 35.96875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 3.0, 6.0, 6.0, 13.0, 18.0, 33.0, 33.0, 52.0, 72.0, 91.0, 167.0, 219.0, 323.0, 453.0, 710.0, 1186.0, 1961.0, 3251.0, 5777.0, 11110.0, 21896.0, 45688.0, 93532.0, 166494.0, 224217.0, 205476.0, 130613.0, 67702.0, 32429.0, 15839.0, 8157.0, 4205.0, 2551.0, 1484.0, 925.0, 619.0, 390.0, 249.0, 180.0, 112.0, 91.0, 82.0, 43.0, 24.0, 21.0, 19.0, 10.0, 3.0, 9.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.40625, -44.89794921875, -43.3896484375, -41.88134765625, -40.373046875, -38.86474609375, -37.3564453125, -35.84814453125, -34.33984375, -32.83154296875, -31.3232421875, -29.81494140625, -28.306640625, -26.79833984375, -25.2900390625, -23.78173828125, -22.2734375, -20.76513671875, -19.2568359375, -17.74853515625, -16.240234375, -14.73193359375, -13.2236328125, -11.71533203125, -10.20703125, -8.69873046875, -7.1904296875, -5.68212890625, -4.173828125, -2.66552734375, -1.1572265625, 0.35107421875, 1.859375, 3.36767578125, 4.8759765625, 6.38427734375, 7.892578125, 9.40087890625, 10.9091796875, 12.41748046875, 13.92578125, 15.43408203125, 16.9423828125, 18.45068359375, 19.958984375, 21.46728515625, 22.9755859375, 24.48388671875, 25.9921875, 27.50048828125, 29.0087890625, 30.51708984375, 32.025390625, 33.53369140625, 35.0419921875, 36.55029296875, 38.05859375, 39.56689453125, 41.0751953125, 42.58349609375, 44.091796875, 45.60009765625, 47.1083984375, 48.61669921875, 50.125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 5.0, 11.0, 8.0, 10.0, 12.0, 10.0, 23.0, 11.0, 21.0, 35.0, 25.0, 28.0, 39.0, 34.0, 35.0, 46.0, 38.0, 42.0, 45.0, 38.0, 35.0, 31.0, 46.0, 43.0, 38.0, 29.0, 24.0, 41.0, 31.0, 23.0, 21.0, 19.0, 22.0, 16.0, 14.0, 7.0, 9.0, 10.0, 2.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.015625, -20.408203125, -19.80078125, -19.193359375, -18.5859375, -17.978515625, -17.37109375, -16.763671875, -16.15625, -15.548828125, -14.94140625, -14.333984375, -13.7265625, -13.119140625, -12.51171875, -11.904296875, -11.296875, -10.689453125, -10.08203125, -9.474609375, -8.8671875, -8.259765625, -7.65234375, -7.044921875, -6.4375, -5.830078125, -5.22265625, -4.615234375, -4.0078125, -3.400390625, -2.79296875, -2.185546875, -1.578125, -0.970703125, -0.36328125, 0.244140625, 0.8515625, 1.458984375, 2.06640625, 2.673828125, 3.28125, 3.888671875, 4.49609375, 5.103515625, 5.7109375, 6.318359375, 6.92578125, 7.533203125, 8.140625, 8.748046875, 9.35546875, 9.962890625, 10.5703125, 11.177734375, 11.78515625, 12.392578125, 13.0, 13.607421875, 14.21484375, 14.822265625, 15.4296875, 16.037109375, 16.64453125, 17.251953125, 17.859375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 11.0, 16.0, 10.0, 21.0, 39.0, 55.0, 67.0, 95.0, 149.0, 180.0, 260.0, 336.0, 540.0, 869.0, 1378.0, 2185.0, 3661.0, 6296.0, 11546.0, 20937.0, 39877.0, 74570.0, 133868.0, 199478.0, 209265.0, 151496.0, 88069.0, 46782.0, 24714.0, 13176.0, 7542.0, 4186.0, 2471.0, 1505.0, 965.0, 587.0, 379.0, 265.0, 209.0, 153.0, 95.0, 74.0, 57.0, 36.0, 31.0, 20.0, 13.0, 13.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.4375, -25.662841796875, -24.88818359375, -24.113525390625, -23.3388671875, -22.564208984375, -21.78955078125, -21.014892578125, -20.240234375, -19.465576171875, -18.69091796875, -17.916259765625, -17.1416015625, -16.366943359375, -15.59228515625, -14.817626953125, -14.04296875, -13.268310546875, -12.49365234375, -11.718994140625, -10.9443359375, -10.169677734375, -9.39501953125, -8.620361328125, -7.845703125, -7.071044921875, -6.29638671875, -5.521728515625, -4.7470703125, -3.972412109375, -3.19775390625, -2.423095703125, -1.6484375, -0.873779296875, -0.09912109375, 0.675537109375, 1.4501953125, 2.224853515625, 2.99951171875, 3.774169921875, 4.548828125, 5.323486328125, 6.09814453125, 6.872802734375, 7.6474609375, 8.422119140625, 9.19677734375, 9.971435546875, 10.74609375, 11.520751953125, 12.29541015625, 13.070068359375, 13.8447265625, 14.619384765625, 15.39404296875, 16.168701171875, 16.943359375, 17.718017578125, 18.49267578125, 19.267333984375, 20.0419921875, 20.816650390625, 21.59130859375, 22.365966796875, 23.140625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 7.0, 8.0, 11.0, 11.0, 20.0, 29.0, 44.0, 67.0, 81.0, 95.0, 125.0, 119.0, 95.0, 81.0, 69.0, 47.0, 27.0, 21.0, 12.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032787322998046875, -0.0031517446041107178, -0.003024756908416748, -0.0028977692127227783, -0.0027707815170288086, -0.002643793821334839, -0.002516806125640869, -0.0023898184299468994, -0.0022628307342529297, -0.00213584303855896, -0.0020088553428649902, -0.0018818676471710205, -0.0017548799514770508, -0.001627892255783081, -0.0015009045600891113, -0.0013739168643951416, -0.0012469291687011719, -0.0011199414730072021, -0.0009929537773132324, -0.0008659660816192627, -0.000738978385925293, -0.0006119906902313232, -0.0004850029945373535, -0.0003580152988433838, -0.00023102760314941406, -0.00010403990745544434, 2.294778823852539e-05, 0.00014993548393249512, 0.00027692317962646484, 0.00040391087532043457, 0.0005308985710144043, 0.000657886266708374, 0.0007848739624023438, 0.0009118616580963135, 0.0010388493537902832, 0.001165837049484253, 0.0012928247451782227, 0.0014198124408721924, 0.0015468001365661621, 0.0016737878322601318, 0.0018007755279541016, 0.0019277632236480713, 0.002054750919342041, 0.0021817386150360107, 0.0023087263107299805, 0.00243571400642395, 0.00256270170211792, 0.0026896893978118896, 0.0028166770935058594, 0.002943664789199829, 0.003070652484893799, 0.0031976401805877686, 0.0033246278762817383, 0.003451615571975708, 0.0035786032676696777, 0.0037055909633636475, 0.003832578659057617, 0.003959566354751587, 0.004086554050445557, 0.004213541746139526, 0.004340529441833496, 0.004467517137527466, 0.0045945048332214355, 0.004721492528915405, 0.004848480224609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 15.0, 16.0, 24.0, 47.0, 53.0, 80.0, 115.0, 178.0, 276.0, 424.0, 601.0, 951.0, 1412.0, 2361.0, 3652.0, 6230.0, 10685.0, 19082.0, 34887.0, 65306.0, 116803.0, 181193.0, 207424.0, 166589.0, 103035.0, 56502.0, 30140.0, 16533.0, 9468.0, 5475.0, 3268.0, 2042.0, 1250.0, 795.0, 534.0, 334.0, 237.0, 153.0, 113.0, 79.0, 54.0, 33.0, 31.0, 23.0, 9.0, 14.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-24.53125, -23.74951171875, -22.9677734375, -22.18603515625, -21.404296875, -20.62255859375, -19.8408203125, -19.05908203125, -18.27734375, -17.49560546875, -16.7138671875, -15.93212890625, -15.150390625, -14.36865234375, -13.5869140625, -12.80517578125, -12.0234375, -11.24169921875, -10.4599609375, -9.67822265625, -8.896484375, -8.11474609375, -7.3330078125, -6.55126953125, -5.76953125, -4.98779296875, -4.2060546875, -3.42431640625, -2.642578125, -1.86083984375, -1.0791015625, -0.29736328125, 0.484375, 1.26611328125, 2.0478515625, 2.82958984375, 3.611328125, 4.39306640625, 5.1748046875, 5.95654296875, 6.73828125, 7.52001953125, 8.3017578125, 9.08349609375, 9.865234375, 10.64697265625, 11.4287109375, 12.21044921875, 12.9921875, 13.77392578125, 14.5556640625, 15.33740234375, 16.119140625, 16.90087890625, 17.6826171875, 18.46435546875, 19.24609375, 20.02783203125, 20.8095703125, 21.59130859375, 22.373046875, 23.15478515625, 23.9365234375, 24.71826171875, 25.5]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 7.0, 16.0, 12.0, 20.0, 31.0, 30.0, 38.0, 44.0, 67.0, 65.0, 63.0, 93.0, 68.0, 74.0, 75.0, 65.0, 51.0, 26.0, 24.0, 22.0, 27.0, 10.0, 12.0, 8.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.9005126953125, -7.629150390625, -7.3577880859375, -7.08642578125, -6.8150634765625, -6.543701171875, -6.2723388671875, -6.0009765625, -5.7296142578125, -5.458251953125, -5.1868896484375, -4.91552734375, -4.6441650390625, -4.372802734375, -4.1014404296875, -3.830078125, -3.5587158203125, -3.287353515625, -3.0159912109375, -2.74462890625, -2.4732666015625, -2.201904296875, -1.9305419921875, -1.6591796875, -1.3878173828125, -1.116455078125, -0.8450927734375, -0.57373046875, -0.3023681640625, -0.031005859375, 0.2403564453125, 0.51171875, 0.7830810546875, 1.054443359375, 1.3258056640625, 1.59716796875, 1.8685302734375, 2.139892578125, 2.4112548828125, 2.6826171875, 2.9539794921875, 3.225341796875, 3.4967041015625, 3.76806640625, 4.0394287109375, 4.310791015625, 4.5821533203125, 4.853515625, 5.1248779296875, 5.396240234375, 5.6676025390625, 5.93896484375, 6.2103271484375, 6.481689453125, 6.7530517578125, 7.0244140625, 7.2957763671875, 7.567138671875, 7.8385009765625, 8.10986328125, 8.3812255859375, 8.652587890625, 8.9239501953125, 9.1953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 12.0, 8.0, 11.0, 12.0, 17.0, 26.0, 20.0, 20.0, 46.0, 37.0, 41.0, 50.0, 45.0, 45.0, 48.0, 38.0, 48.0, 47.0, 50.0, 43.0, 48.0, 41.0, 28.0, 37.0, 29.0, 19.0, 22.0, 21.0, 17.0, 10.0, 11.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.419578552246094, -34.14214324951172, -32.864707946777344, -31.58727264404297, -30.309837341308594, -29.03240203857422, -27.754966735839844, -26.47753143310547, -25.200096130371094, -23.92266082763672, -22.645225524902344, -21.36779022216797, -20.090354919433594, -18.81291961669922, -17.535484313964844, -16.25804901123047, -14.980615615844727, -13.703180313110352, -12.425745010375977, -11.148309707641602, -9.870874404907227, -8.593439102172852, -7.316004753112793, -6.038569450378418, -4.761134147644043, -3.483698844909668, -2.206263780593872, -0.9288287162780762, 0.34860658645629883, 1.6260418891906738, 2.9034767150878906, 4.180912017822266, 5.458347320556641, 6.735782623291016, 8.01321792602539, 9.290653228759766, 10.56808853149414, 11.845523834228516, 13.122958183288574, 14.40039348602295, 15.677828788757324, 16.955263137817383, 18.232698440551758, 19.510133743286133, 20.787569046020508, 22.065004348754883, 23.342439651489258, 24.619874954223633, 25.897310256958008, 27.174745559692383, 28.452180862426758, 29.729616165161133, 31.007051467895508, 32.28448486328125, 33.561920166015625, 34.83935546875, 36.116790771484375, 37.39422607421875, 38.671661376953125, 39.9490966796875, 41.226531982421875, 42.50396728515625, 43.781402587890625, 45.058837890625, 46.336273193359375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 6.0, 7.0, 12.0, 11.0, 13.0, 6.0, 28.0, 8.0, 24.0, 29.0, 24.0, 25.0, 33.0, 42.0, 38.0, 45.0, 35.0, 43.0, 49.0, 45.0, 52.0, 43.0, 31.0, 37.0, 34.0, 38.0, 29.0, 29.0, 30.0, 16.0, 29.0, 17.0, 14.0, 12.0, 15.0, 5.0, 5.0, 13.0, 12.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.991695404052734, -33.017005920410156, -32.042320251464844, -31.0676326751709, -30.092945098876953, -29.118255615234375, -28.14356803894043, -27.168880462646484, -26.19419288635254, -25.219505310058594, -24.24481773376465, -23.270130157470703, -22.295440673828125, -21.320755004882812, -20.346065521240234, -19.37137794494629, -18.396690368652344, -17.4220027923584, -16.447315216064453, -15.472626686096191, -14.497939109802246, -13.5232515335083, -12.548563003540039, -11.573875427246094, -10.599187850952148, -9.624500274658203, -8.649812698364258, -7.675124168395996, -6.700436592102051, -5.7257490158081055, -4.751060962677002, -3.7763729095458984, -2.801685333251953, -1.8269975185394287, -0.8523097038269043, 0.12237811088562012, 1.0970659255981445, 2.07175350189209, 3.0464415550231934, 4.021129608154297, 4.995817184448242, 5.9705047607421875, 6.945192813873291, 7.9198808670043945, 8.89456844329834, 9.869256019592285, 10.843944549560547, 11.818632125854492, 12.793319702148438, 13.768007278442383, 14.742694854736328, 15.71738338470459, 16.69207000732422, 17.666759490966797, 18.641447067260742, 19.616134643554688, 20.590822219848633, 21.565509796142578, 22.540197372436523, 23.51488494873047, 24.489574432373047, 25.46426010131836, 26.438949584960938, 27.413637161254883, 28.388324737548828]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 16.0, 14.0, 26.0, 50.0, 71.0, 116.0, 205.0, 337.0, 550.0, 1012.0, 1772.0, 3163.0, 5632.0, 10130.0, 18898.0, 35827.0, 69036.0, 135464.0, 268491.0, 501172.0, 789335.0, 886923.0, 670110.0, 385608.0, 198975.0, 100430.0, 51500.0, 26948.0, 14265.0, 7760.0, 4379.0, 2432.0, 1421.0, 811.0, 505.0, 297.0, 206.0, 129.0, 82.0, 73.0, 38.0, 18.0, 15.0, 14.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-43.53125, -42.1396484375, -40.748046875, -39.3564453125, -37.96484375, -36.5732421875, -35.181640625, -33.7900390625, -32.3984375, -31.0068359375, -29.615234375, -28.2236328125, -26.83203125, -25.4404296875, -24.048828125, -22.6572265625, -21.265625, -19.8740234375, -18.482421875, -17.0908203125, -15.69921875, -14.3076171875, -12.916015625, -11.5244140625, -10.1328125, -8.7412109375, -7.349609375, -5.9580078125, -4.56640625, -3.1748046875, -1.783203125, -0.3916015625, 1.0, 2.3916015625, 3.783203125, 5.1748046875, 6.56640625, 7.9580078125, 9.349609375, 10.7412109375, 12.1328125, 13.5244140625, 14.916015625, 16.3076171875, 17.69921875, 19.0908203125, 20.482421875, 21.8740234375, 23.265625, 24.6572265625, 26.048828125, 27.4404296875, 28.83203125, 30.2236328125, 31.615234375, 33.0068359375, 34.3984375, 35.7900390625, 37.181640625, 38.5732421875, 39.96484375, 41.3564453125, 42.748046875, 44.1396484375, 45.53125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 9.0, 5.0, 20.0, 14.0, 12.0, 14.0, 20.0, 17.0, 24.0, 22.0, 32.0, 36.0, 30.0, 42.0, 31.0, 39.0, 37.0, 42.0, 46.0, 46.0, 45.0, 42.0, 33.0, 36.0, 39.0, 41.0, 33.0, 32.0, 17.0, 22.0, 13.0, 12.0, 21.0, 15.0, 10.0, 8.0, 10.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.6875, -28.724609375, -27.76171875, -26.798828125, -25.8359375, -24.873046875, -23.91015625, -22.947265625, -21.984375, -21.021484375, -20.05859375, -19.095703125, -18.1328125, -17.169921875, -16.20703125, -15.244140625, -14.28125, -13.318359375, -12.35546875, -11.392578125, -10.4296875, -9.466796875, -8.50390625, -7.541015625, -6.578125, -5.615234375, -4.65234375, -3.689453125, -2.7265625, -1.763671875, -0.80078125, 0.162109375, 1.125, 2.087890625, 3.05078125, 4.013671875, 4.9765625, 5.939453125, 6.90234375, 7.865234375, 8.828125, 9.791015625, 10.75390625, 11.716796875, 12.6796875, 13.642578125, 14.60546875, 15.568359375, 16.53125, 17.494140625, 18.45703125, 19.419921875, 20.3828125, 21.345703125, 22.30859375, 23.271484375, 24.234375, 25.197265625, 26.16015625, 27.123046875, 28.0859375, 29.048828125, 30.01171875, 30.974609375, 31.9375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 7.0, 10.0, 11.0, 17.0, 29.0, 50.0, 58.0, 108.0, 136.0, 244.0, 362.0, 610.0, 965.0, 1613.0, 2535.0, 4119.0, 6812.0, 11763.0, 19568.0, 34178.0, 58718.0, 102402.0, 177157.0, 301787.0, 483858.0, 677016.0, 737788.0, 599140.0, 399391.0, 241594.0, 139803.0, 80501.0, 46005.0, 26826.0, 15665.0, 9264.0, 5455.0, 3309.0, 2007.0, 1260.0, 792.0, 501.0, 292.0, 223.0, 122.0, 91.0, 47.0, 32.0, 18.0, 19.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.71435546875, -46.0849609375, -44.45556640625, -42.826171875, -41.19677734375, -39.5673828125, -37.93798828125, -36.30859375, -34.67919921875, -33.0498046875, -31.42041015625, -29.791015625, -28.16162109375, -26.5322265625, -24.90283203125, -23.2734375, -21.64404296875, -20.0146484375, -18.38525390625, -16.755859375, -15.12646484375, -13.4970703125, -11.86767578125, -10.23828125, -8.60888671875, -6.9794921875, -5.35009765625, -3.720703125, -2.09130859375, -0.4619140625, 1.16748046875, 2.796875, 4.42626953125, 6.0556640625, 7.68505859375, 9.314453125, 10.94384765625, 12.5732421875, 14.20263671875, 15.83203125, 17.46142578125, 19.0908203125, 20.72021484375, 22.349609375, 23.97900390625, 25.6083984375, 27.23779296875, 28.8671875, 30.49658203125, 32.1259765625, 33.75537109375, 35.384765625, 37.01416015625, 38.6435546875, 40.27294921875, 41.90234375, 43.53173828125, 45.1611328125, 46.79052734375, 48.419921875, 50.04931640625, 51.6787109375, 53.30810546875, 54.9375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 13.0, 17.0, 31.0, 35.0, 29.0, 49.0, 56.0, 82.0, 90.0, 121.0, 160.0, 169.0, 203.0, 218.0, 257.0, 274.0, 258.0, 272.0, 233.0, 270.0, 239.0, 196.0, 158.0, 116.0, 94.0, 91.0, 65.0, 60.0, 51.0, 31.0, 32.0, 22.0, 15.0, 12.0, 10.0, 6.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.17333984375, -18.5498046875, -17.92626953125, -17.302734375, -16.67919921875, -16.0556640625, -15.43212890625, -14.80859375, -14.18505859375, -13.5615234375, -12.93798828125, -12.314453125, -11.69091796875, -11.0673828125, -10.44384765625, -9.8203125, -9.19677734375, -8.5732421875, -7.94970703125, -7.326171875, -6.70263671875, -6.0791015625, -5.45556640625, -4.83203125, -4.20849609375, -3.5849609375, -2.96142578125, -2.337890625, -1.71435546875, -1.0908203125, -0.46728515625, 0.15625, 0.77978515625, 1.4033203125, 2.02685546875, 2.650390625, 3.27392578125, 3.8974609375, 4.52099609375, 5.14453125, 5.76806640625, 6.3916015625, 7.01513671875, 7.638671875, 8.26220703125, 8.8857421875, 9.50927734375, 10.1328125, 10.75634765625, 11.3798828125, 12.00341796875, 12.626953125, 13.25048828125, 13.8740234375, 14.49755859375, 15.12109375, 15.74462890625, 16.3681640625, 16.99169921875, 17.615234375, 18.23876953125, 18.8623046875, 19.48583984375, 20.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 6.0, 15.0, 11.0, 14.0, 15.0, 30.0, 29.0, 34.0, 30.0, 40.0, 42.0, 49.0, 44.0, 41.0, 54.0, 58.0, 46.0, 55.0, 54.0, 45.0, 43.0, 21.0, 38.0, 27.0, 23.0, 23.0, 23.0, 16.0, 6.0, 11.0, 10.0, 12.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.776466369628906, -52.83802032470703, -50.89957046508789, -48.961124420166016, -47.022674560546875, -45.084228515625, -43.145782470703125, -41.207332611083984, -39.268882751464844, -37.33043670654297, -35.39198684692383, -33.45354080200195, -31.515090942382812, -29.576644897460938, -27.63819694519043, -25.699748992919922, -23.761302947998047, -21.82285499572754, -19.88440704345703, -17.945960998535156, -16.007511138916016, -14.069064140319824, -12.130617141723633, -10.192169189453125, -8.253721237182617, -6.315273284912109, -4.37682580947876, -2.43837833404541, -0.49993038177490234, 1.4385175704956055, 3.376964569091797, 5.315412521362305, 7.2538604736328125, 9.19230842590332, 11.130756378173828, 13.06920337677002, 15.007651329040527, 16.94609832763672, 18.884546279907227, 20.822994232177734, 22.761442184448242, 24.69989013671875, 26.638338088989258, 28.576786041259766, 30.51523208618164, 32.45368194580078, 34.392127990722656, 36.33057403564453, 38.26902389526367, 40.20746994018555, 42.14591979980469, 44.08436584472656, 46.0228157043457, 47.96126174926758, 49.89971160888672, 51.838157653808594, 53.77660369873047, 55.715049743652344, 57.653499603271484, 59.59194564819336, 61.5303955078125, 63.468841552734375, 65.40728759765625, 67.34573364257812, 69.28418731689453]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 12.0, 6.0, 9.0, 9.0, 10.0, 18.0, 20.0, 21.0, 26.0, 22.0, 30.0, 29.0, 38.0, 31.0, 42.0, 34.0, 41.0, 48.0, 37.0, 41.0, 32.0, 34.0, 37.0, 31.0, 37.0, 45.0, 29.0, 35.0, 26.0, 23.0, 22.0, 12.0, 15.0, 13.0, 12.0, 13.0, 12.0, 14.0, 4.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.55194854736328, -44.18765640258789, -42.8233642578125, -41.459068298339844, -40.09477615356445, -38.73048400878906, -37.36619186401367, -36.00189971923828, -34.637603759765625, -33.273311614990234, -31.90901756286621, -30.54472541809082, -29.180431365966797, -27.816139221191406, -26.451847076416016, -25.087554931640625, -23.723262786865234, -22.358970642089844, -20.99467658996582, -19.63038444519043, -18.266090393066406, -16.901798248291016, -15.537506103515625, -14.173213005065918, -12.808919906616211, -11.444626808166504, -10.080333709716797, -8.716041564941406, -7.351748466491699, -5.987455368041992, -4.623163223266602, -3.2588701248168945, -1.8945770263671875, -0.5302841663360596, 0.8340086936950684, 2.198301315307617, 3.562594413757324, 4.926887512207031, 6.291179656982422, 7.655472755432129, 9.019765853881836, 10.384058952331543, 11.74835205078125, 13.11264419555664, 14.476937294006348, 15.841230392456055, 17.205522537231445, 18.56981658935547, 19.93410873413086, 21.29840087890625, 22.662694931030273, 24.026987075805664, 25.391281127929688, 26.755573272705078, 28.11986541748047, 29.48415756225586, 30.848451614379883, 32.212745666503906, 33.5770378112793, 34.94132995605469, 36.30562210083008, 37.66991424560547, 39.034210205078125, 40.398502349853516, 41.762794494628906]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 12.0, 18.0, 34.0, 40.0, 57.0, 98.0, 132.0, 228.0, 314.0, 426.0, 689.0, 1040.0, 1622.0, 2529.0, 3679.0, 5609.0, 8628.0, 13261.0, 20639.0, 32014.0, 47661.0, 70233.0, 97913.0, 123687.0, 137379.0, 130417.0, 107484.0, 80126.0, 55740.0, 37235.0, 24151.0, 15835.0, 10360.0, 6558.0, 4394.0, 2851.0, 1958.0, 1177.0, 774.0, 559.0, 334.0, 182.0, 166.0, 104.0, 71.0, 65.0, 24.0, 19.0, 14.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-25.25, -24.453125, -23.65625, -22.859375, -22.0625, -21.265625, -20.46875, -19.671875, -18.875, -18.078125, -17.28125, -16.484375, -15.6875, -14.890625, -14.09375, -13.296875, -12.5, -11.703125, -10.90625, -10.109375, -9.3125, -8.515625, -7.71875, -6.921875, -6.125, -5.328125, -4.53125, -3.734375, -2.9375, -2.140625, -1.34375, -0.546875, 0.25, 1.046875, 1.84375, 2.640625, 3.4375, 4.234375, 5.03125, 5.828125, 6.625, 7.421875, 8.21875, 9.015625, 9.8125, 10.609375, 11.40625, 12.203125, 13.0, 13.796875, 14.59375, 15.390625, 16.1875, 16.984375, 17.78125, 18.578125, 19.375, 20.171875, 20.96875, 21.765625, 22.5625, 23.359375, 24.15625, 24.953125, 25.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 9.0, 14.0, 9.0, 12.0, 25.0, 22.0, 21.0, 28.0, 30.0, 34.0, 47.0, 28.0, 39.0, 38.0, 36.0, 54.0, 40.0, 45.0, 32.0, 33.0, 47.0, 39.0, 41.0, 39.0, 34.0, 30.0, 26.0, 23.0, 12.0, 13.0, 10.0, 15.0, 14.0, 9.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.53125, -46.95654296875, -45.3818359375, -43.80712890625, -42.232421875, -40.65771484375, -39.0830078125, -37.50830078125, -35.93359375, -34.35888671875, -32.7841796875, -31.20947265625, -29.634765625, -28.06005859375, -26.4853515625, -24.91064453125, -23.3359375, -21.76123046875, -20.1865234375, -18.61181640625, -17.037109375, -15.46240234375, -13.8876953125, -12.31298828125, -10.73828125, -9.16357421875, -7.5888671875, -6.01416015625, -4.439453125, -2.86474609375, -1.2900390625, 0.28466796875, 1.859375, 3.43408203125, 5.0087890625, 6.58349609375, 8.158203125, 9.73291015625, 11.3076171875, 12.88232421875, 14.45703125, 16.03173828125, 17.6064453125, 19.18115234375, 20.755859375, 22.33056640625, 23.9052734375, 25.47998046875, 27.0546875, 28.62939453125, 30.2041015625, 31.77880859375, 33.353515625, 34.92822265625, 36.5029296875, 38.07763671875, 39.65234375, 41.22705078125, 42.8017578125, 44.37646484375, 45.951171875, 47.52587890625, 49.1005859375, 50.67529296875, 52.25]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 16.0, 14.0, 36.0, 56.0, 69.0, 93.0, 177.0, 264.0, 466.0, 659.0, 1133.0, 1787.0, 2996.0, 5131.0, 9326.0, 16460.0, 29720.0, 54483.0, 97210.0, 158343.0, 207225.0, 184016.0, 121621.0, 69980.0, 38395.0, 21172.0, 11760.0, 6390.0, 3687.0, 2291.0, 1339.0, 798.0, 485.0, 344.0, 202.0, 132.0, 85.0, 60.0, 46.0, 23.0, 28.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.21875, -36.8876953125, -35.556640625, -34.2255859375, -32.89453125, -31.5634765625, -30.232421875, -28.9013671875, -27.5703125, -26.2392578125, -24.908203125, -23.5771484375, -22.24609375, -20.9150390625, -19.583984375, -18.2529296875, -16.921875, -15.5908203125, -14.259765625, -12.9287109375, -11.59765625, -10.2666015625, -8.935546875, -7.6044921875, -6.2734375, -4.9423828125, -3.611328125, -2.2802734375, -0.94921875, 0.3818359375, 1.712890625, 3.0439453125, 4.375, 5.7060546875, 7.037109375, 8.3681640625, 9.69921875, 11.0302734375, 12.361328125, 13.6923828125, 15.0234375, 16.3544921875, 17.685546875, 19.0166015625, 20.34765625, 21.6787109375, 23.009765625, 24.3408203125, 25.671875, 27.0029296875, 28.333984375, 29.6650390625, 30.99609375, 32.3271484375, 33.658203125, 34.9892578125, 36.3203125, 37.6513671875, 38.982421875, 40.3134765625, 41.64453125, 42.9755859375, 44.306640625, 45.6376953125, 46.96875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 4.0, 7.0, 12.0, 11.0, 19.0, 20.0, 19.0, 35.0, 25.0, 24.0, 33.0, 32.0, 38.0, 32.0, 58.0, 57.0, 47.0, 42.0, 36.0, 36.0, 32.0, 39.0, 33.0, 40.0, 35.0, 35.0, 33.0, 27.0, 24.0, 19.0, 21.0, 15.0, 7.0, 9.0, 5.0, 11.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.3125, -24.433349609375, -23.55419921875, -22.675048828125, -21.7958984375, -20.916748046875, -20.03759765625, -19.158447265625, -18.279296875, -17.400146484375, -16.52099609375, -15.641845703125, -14.7626953125, -13.883544921875, -13.00439453125, -12.125244140625, -11.24609375, -10.366943359375, -9.48779296875, -8.608642578125, -7.7294921875, -6.850341796875, -5.97119140625, -5.092041015625, -4.212890625, -3.333740234375, -2.45458984375, -1.575439453125, -0.6962890625, 0.182861328125, 1.06201171875, 1.941162109375, 2.8203125, 3.699462890625, 4.57861328125, 5.457763671875, 6.3369140625, 7.216064453125, 8.09521484375, 8.974365234375, 9.853515625, 10.732666015625, 11.61181640625, 12.490966796875, 13.3701171875, 14.249267578125, 15.12841796875, 16.007568359375, 16.88671875, 17.765869140625, 18.64501953125, 19.524169921875, 20.4033203125, 21.282470703125, 22.16162109375, 23.040771484375, 23.919921875, 24.799072265625, 25.67822265625, 26.557373046875, 27.4365234375, 28.315673828125, 29.19482421875, 30.073974609375, 30.953125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 15.0, 16.0, 19.0, 39.0, 43.0, 72.0, 113.0, 189.0, 291.0, 444.0, 794.0, 1286.0, 2282.0, 3925.0, 7162.0, 12988.0, 24749.0, 47365.0, 88257.0, 157779.0, 225541.0, 203013.0, 126129.0, 68411.0, 35478.0, 18732.0, 10119.0, 5668.0, 3097.0, 1721.0, 1076.0, 630.0, 387.0, 254.0, 150.0, 107.0, 60.0, 40.0, 39.0, 21.0, 19.0, 9.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.578125, -20.8017578125, -20.025390625, -19.2490234375, -18.47265625, -17.6962890625, -16.919921875, -16.1435546875, -15.3671875, -14.5908203125, -13.814453125, -13.0380859375, -12.26171875, -11.4853515625, -10.708984375, -9.9326171875, -9.15625, -8.3798828125, -7.603515625, -6.8271484375, -6.05078125, -5.2744140625, -4.498046875, -3.7216796875, -2.9453125, -2.1689453125, -1.392578125, -0.6162109375, 0.16015625, 0.9365234375, 1.712890625, 2.4892578125, 3.265625, 4.0419921875, 4.818359375, 5.5947265625, 6.37109375, 7.1474609375, 7.923828125, 8.7001953125, 9.4765625, 10.2529296875, 11.029296875, 11.8056640625, 12.58203125, 13.3583984375, 14.134765625, 14.9111328125, 15.6875, 16.4638671875, 17.240234375, 18.0166015625, 18.79296875, 19.5693359375, 20.345703125, 21.1220703125, 21.8984375, 22.6748046875, 23.451171875, 24.2275390625, 25.00390625, 25.7802734375, 26.556640625, 27.3330078125, 28.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 6.0, 5.0, 8.0, 14.0, 13.0, 18.0, 22.0, 23.0, 33.0, 33.0, 28.0, 51.0, 39.0, 39.0, 53.0, 52.0, 43.0, 48.0, 50.0, 46.0, 46.0, 40.0, 30.0, 29.0, 29.0, 27.0, 32.0, 16.0, 12.0, 18.0, 13.0, 15.0, 16.0, 12.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008177757263183594, -0.0007904618978500366, -0.0007631480693817139, -0.0007358342409133911, -0.0007085204124450684, -0.0006812065839767456, -0.0006538927555084229, -0.0006265789270401001, -0.0005992650985717773, -0.0005719512701034546, -0.0005446374416351318, -0.0005173236131668091, -0.0004900097846984863, -0.0004626959562301636, -0.0004353821277618408, -0.00040806829929351807, -0.0003807544708251953, -0.00035344064235687256, -0.0003261268138885498, -0.00029881298542022705, -0.0002714991569519043, -0.00024418532848358154, -0.0002168715000152588, -0.00018955767154693604, -0.00016224384307861328, -0.00013493001461029053, -0.00010761618614196777, -8.030235767364502e-05, -5.2988529205322266e-05, -2.5674700736999512e-05, 1.6391277313232422e-06, 2.8952956199645996e-05, 5.626678466796875e-05, 8.35806131362915e-05, 0.00011089444160461426, 0.000138208270072937, 0.00016552209854125977, 0.00019283592700958252, 0.00022014975547790527, 0.00024746358394622803, 0.0002747774124145508, 0.00030209124088287354, 0.0003294050693511963, 0.00035671889781951904, 0.0003840327262878418, 0.00041134655475616455, 0.0004386603832244873, 0.00046597421169281006, 0.0004932880401611328, 0.0005206018686294556, 0.0005479156970977783, 0.0005752295255661011, 0.0006025433540344238, 0.0006298571825027466, 0.0006571710109710693, 0.0006844848394393921, 0.0007117986679077148, 0.0007391124963760376, 0.0007664263248443604, 0.0007937401533126831, 0.0008210539817810059, 0.0008483678102493286, 0.0008756816387176514, 0.0009029954671859741, 0.0009303092956542969]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 14.0, 15.0, 22.0, 29.0, 41.0, 75.0, 85.0, 159.0, 224.0, 280.0, 500.0, 732.0, 1141.0, 1849.0, 2863.0, 4708.0, 8049.0, 14632.0, 26361.0, 48814.0, 86490.0, 139372.0, 188151.0, 186947.0, 139789.0, 86278.0, 48794.0, 26455.0, 14807.0, 8248.0, 4646.0, 2837.0, 1817.0, 1141.0, 742.0, 443.0, 306.0, 197.0, 165.0, 109.0, 56.0, 51.0, 36.0, 30.0, 16.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.5625, -22.75, -21.9375, -21.125, -20.3125, -19.5, -18.6875, -17.875, -17.0625, -16.25, -15.4375, -14.625, -13.8125, -13.0, -12.1875, -11.375, -10.5625, -9.75, -8.9375, -8.125, -7.3125, -6.5, -5.6875, -4.875, -4.0625, -3.25, -2.4375, -1.625, -0.8125, 0.0, 0.8125, 1.625, 2.4375, 3.25, 4.0625, 4.875, 5.6875, 6.5, 7.3125, 8.125, 8.9375, 9.75, 10.5625, 11.375, 12.1875, 13.0, 13.8125, 14.625, 15.4375, 16.25, 17.0625, 17.875, 18.6875, 19.5, 20.3125, 21.125, 21.9375, 22.75, 23.5625, 24.375, 25.1875, 26.0, 26.8125, 27.625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 4.0, 7.0, 9.0, 7.0, 15.0, 17.0, 14.0, 15.0, 18.0, 25.0, 33.0, 33.0, 27.0, 41.0, 39.0, 50.0, 59.0, 52.0, 46.0, 39.0, 56.0, 57.0, 48.0, 43.0, 40.0, 31.0, 27.0, 19.0, 17.0, 17.0, 18.0, 11.0, 9.0, 13.0, 5.0, 10.0, 2.0, 6.0, 3.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-7.03125, -6.82421875, -6.6171875, -6.41015625, -6.203125, -5.99609375, -5.7890625, -5.58203125, -5.375, -5.16796875, -4.9609375, -4.75390625, -4.546875, -4.33984375, -4.1328125, -3.92578125, -3.71875, -3.51171875, -3.3046875, -3.09765625, -2.890625, -2.68359375, -2.4765625, -2.26953125, -2.0625, -1.85546875, -1.6484375, -1.44140625, -1.234375, -1.02734375, -0.8203125, -0.61328125, -0.40625, -0.19921875, 0.0078125, 0.21484375, 0.421875, 0.62890625, 0.8359375, 1.04296875, 1.25, 1.45703125, 1.6640625, 1.87109375, 2.078125, 2.28515625, 2.4921875, 2.69921875, 2.90625, 3.11328125, 3.3203125, 3.52734375, 3.734375, 3.94140625, 4.1484375, 4.35546875, 4.5625, 4.76953125, 4.9765625, 5.18359375, 5.390625, 5.59765625, 5.8046875, 6.01171875, 6.21875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 21.0, 26.0, 34.0, 36.0, 34.0, 35.0, 41.0, 52.0, 39.0, 48.0, 53.0, 45.0, 43.0, 56.0, 43.0, 47.0, 39.0, 30.0, 36.0, 23.0, 22.0, 21.0, 20.0, 15.0, 13.0, 12.0, 15.0, 4.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.782806396484375, -50.89947509765625, -49.016143798828125, -47.132808685302734, -45.24947738647461, -43.366146087646484, -41.482810974121094, -39.59947967529297, -37.716148376464844, -35.83281707763672, -33.949485778808594, -32.0661506652832, -30.182819366455078, -28.299488067626953, -26.416154861450195, -24.532821655273438, -22.649490356445312, -20.766159057617188, -18.88282585144043, -16.999492645263672, -15.116161346435547, -13.232829093933105, -11.349496841430664, -9.466164588928223, -7.582832336425781, -5.69950008392334, -3.8161678314208984, -1.932835578918457, -0.049503326416015625, 1.8338289260864258, 3.717161178588867, 5.600493431091309, 7.48382568359375, 9.367157936096191, 11.250490188598633, 13.133822441101074, 15.017154693603516, 16.90048599243164, 18.7838191986084, 20.667152404785156, 22.55048370361328, 24.433815002441406, 26.317148208618164, 28.200481414794922, 30.083812713623047, 31.967144012451172, 33.85047912597656, 35.73381042480469, 37.61714172363281, 39.50047302246094, 41.38380432128906, 43.26713943481445, 45.15047073364258, 47.0338020324707, 48.917137145996094, 50.80046844482422, 52.683799743652344, 54.56713104248047, 56.450462341308594, 58.333797454833984, 60.21712875366211, 62.100460052490234, 63.983795166015625, 65.86712646484375, 67.75045776367188]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 5.0, 10.0, 11.0, 15.0, 16.0, 20.0, 26.0, 21.0, 30.0, 39.0, 29.0, 31.0, 37.0, 38.0, 40.0, 50.0, 44.0, 31.0, 35.0, 44.0, 29.0, 30.0, 41.0, 42.0, 29.0, 42.0, 27.0, 24.0, 19.0, 16.0, 14.0, 13.0, 10.0, 11.0, 16.0, 9.0, 11.0, 3.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.820247650146484, -45.43103790283203, -44.04182815551758, -42.652618408203125, -41.263404846191406, -39.87419509887695, -38.4849853515625, -37.09577560424805, -35.706565856933594, -34.31735610961914, -32.92814636230469, -31.5389347076416, -30.149723052978516, -28.760513305664062, -27.37130355834961, -25.982093811035156, -24.592880249023438, -23.203670501708984, -21.8144588470459, -20.425249099731445, -19.03603744506836, -17.646827697753906, -16.257617950439453, -14.868407249450684, -13.479196548461914, -12.089985847473145, -10.700775146484375, -9.311565399169922, -7.922354698181152, -6.533143997192383, -5.14393424987793, -3.75472354888916, -2.3655128479003906, -0.9763023853302002, 0.41290807723999023, 1.8021183013916016, 3.191329002380371, 4.580539703369141, 5.969749450683594, 7.358960151672363, 8.748170852661133, 10.137381553649902, 11.526592254638672, 12.915802001953125, 14.305012702941895, 15.694223403930664, 17.083433151245117, 18.472644805908203, 19.861854553222656, 21.25106430053711, 22.640275955200195, 24.02948570251465, 25.418697357177734, 26.807907104492188, 28.19711685180664, 29.586326599121094, 30.97553825378418, 32.364749908447266, 33.75395965576172, 35.14316940307617, 36.532379150390625, 37.921592712402344, 39.31079864501953, 40.70001220703125, 42.0892219543457]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 12.0, 14.0, 31.0, 41.0, 64.0, 82.0, 111.0, 198.0, 290.0, 374.0, 592.0, 904.0, 1304.0, 2012.0, 2858.0, 4231.0, 6128.0, 9091.0, 13072.0, 19207.0, 27290.0, 38282.0, 52715.0, 69469.0, 87459.0, 102190.0, 109943.0, 107545.0, 96194.0, 79966.0, 62387.0, 46283.0, 33480.0, 23427.0, 16195.0, 11346.0, 7540.0, 5143.0, 3526.0, 2375.0, 1669.0, 1137.0, 797.0, 499.0, 327.0, 254.0, 170.0, 122.0, 66.0, 59.0, 25.0, 20.0, 12.0, 6.0, 8.0, 5.0, 1.0, 2.0], "bins": [-28.015625, -27.1611328125, -26.306640625, -25.4521484375, -24.59765625, -23.7431640625, -22.888671875, -22.0341796875, -21.1796875, -20.3251953125, -19.470703125, -18.6162109375, -17.76171875, -16.9072265625, -16.052734375, -15.1982421875, -14.34375, -13.4892578125, -12.634765625, -11.7802734375, -10.92578125, -10.0712890625, -9.216796875, -8.3623046875, -7.5078125, -6.6533203125, -5.798828125, -4.9443359375, -4.08984375, -3.2353515625, -2.380859375, -1.5263671875, -0.671875, 0.1826171875, 1.037109375, 1.8916015625, 2.74609375, 3.6005859375, 4.455078125, 5.3095703125, 6.1640625, 7.0185546875, 7.873046875, 8.7275390625, 9.58203125, 10.4365234375, 11.291015625, 12.1455078125, 13.0, 13.8544921875, 14.708984375, 15.5634765625, 16.41796875, 17.2724609375, 18.126953125, 18.9814453125, 19.8359375, 20.6904296875, 21.544921875, 22.3994140625, 23.25390625, 24.1083984375, 24.962890625, 25.8173828125, 26.671875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 5.0, 8.0, 11.0, 6.0, 7.0, 5.0, 17.0, 15.0, 19.0, 27.0, 30.0, 23.0, 32.0, 31.0, 35.0, 42.0, 34.0, 37.0, 39.0, 38.0, 42.0, 44.0, 30.0, 37.0, 34.0, 29.0, 34.0, 44.0, 44.0, 22.0, 28.0, 19.0, 22.0, 18.0, 14.0, 15.0, 6.0, 5.0, 11.0, 9.0, 4.0, 6.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.28125, -39.89208984375, -38.5029296875, -37.11376953125, -35.724609375, -34.33544921875, -32.9462890625, -31.55712890625, -30.16796875, -28.77880859375, -27.3896484375, -26.00048828125, -24.611328125, -23.22216796875, -21.8330078125, -20.44384765625, -19.0546875, -17.66552734375, -16.2763671875, -14.88720703125, -13.498046875, -12.10888671875, -10.7197265625, -9.33056640625, -7.94140625, -6.55224609375, -5.1630859375, -3.77392578125, -2.384765625, -0.99560546875, 0.3935546875, 1.78271484375, 3.171875, 4.56103515625, 5.9501953125, 7.33935546875, 8.728515625, 10.11767578125, 11.5068359375, 12.89599609375, 14.28515625, 15.67431640625, 17.0634765625, 18.45263671875, 19.841796875, 21.23095703125, 22.6201171875, 24.00927734375, 25.3984375, 26.78759765625, 28.1767578125, 29.56591796875, 30.955078125, 32.34423828125, 33.7333984375, 35.12255859375, 36.51171875, 37.90087890625, 39.2900390625, 40.67919921875, 42.068359375, 43.45751953125, 44.8466796875, 46.23583984375, 47.625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 6.0, 19.0, 27.0, 38.0, 62.0, 84.0, 113.0, 172.0, 287.0, 383.0, 620.0, 867.0, 1356.0, 2183.0, 3352.0, 5436.0, 8888.0, 14929.0, 25966.0, 45965.0, 82188.0, 138235.0, 193126.0, 192920.0, 138013.0, 82274.0, 46152.0, 26217.0, 14816.0, 8722.0, 5509.0, 3420.0, 2090.0, 1365.0, 909.0, 601.0, 407.0, 288.0, 156.0, 117.0, 86.0, 62.0, 36.0, 32.0, 23.0, 13.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.5625, -72.232421875, -69.90234375, -67.572265625, -65.2421875, -62.912109375, -60.58203125, -58.251953125, -55.921875, -53.591796875, -51.26171875, -48.931640625, -46.6015625, -44.271484375, -41.94140625, -39.611328125, -37.28125, -34.951171875, -32.62109375, -30.291015625, -27.9609375, -25.630859375, -23.30078125, -20.970703125, -18.640625, -16.310546875, -13.98046875, -11.650390625, -9.3203125, -6.990234375, -4.66015625, -2.330078125, 0.0, 2.330078125, 4.66015625, 6.990234375, 9.3203125, 11.650390625, 13.98046875, 16.310546875, 18.640625, 20.970703125, 23.30078125, 25.630859375, 27.9609375, 30.291015625, 32.62109375, 34.951171875, 37.28125, 39.611328125, 41.94140625, 44.271484375, 46.6015625, 48.931640625, 51.26171875, 53.591796875, 55.921875, 58.251953125, 60.58203125, 62.912109375, 65.2421875, 67.572265625, 69.90234375, 72.232421875, 74.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 13.0, 14.0, 14.0, 15.0, 20.0, 21.0, 15.0, 32.0, 28.0, 31.0, 34.0, 39.0, 46.0, 32.0, 45.0, 54.0, 58.0, 36.0, 34.0, 40.0, 50.0, 51.0, 31.0, 25.0, 29.0, 24.0, 20.0, 31.0, 16.0, 12.0, 11.0, 12.0, 16.0, 11.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.8125, -34.59326171875, -33.3740234375, -32.15478515625, -30.935546875, -29.71630859375, -28.4970703125, -27.27783203125, -26.05859375, -24.83935546875, -23.6201171875, -22.40087890625, -21.181640625, -19.96240234375, -18.7431640625, -17.52392578125, -16.3046875, -15.08544921875, -13.8662109375, -12.64697265625, -11.427734375, -10.20849609375, -8.9892578125, -7.77001953125, -6.55078125, -5.33154296875, -4.1123046875, -2.89306640625, -1.673828125, -0.45458984375, 0.7646484375, 1.98388671875, 3.203125, 4.42236328125, 5.6416015625, 6.86083984375, 8.080078125, 9.29931640625, 10.5185546875, 11.73779296875, 12.95703125, 14.17626953125, 15.3955078125, 16.61474609375, 17.833984375, 19.05322265625, 20.2724609375, 21.49169921875, 22.7109375, 23.93017578125, 25.1494140625, 26.36865234375, 27.587890625, 28.80712890625, 30.0263671875, 31.24560546875, 32.46484375, 33.68408203125, 34.9033203125, 36.12255859375, 37.341796875, 38.56103515625, 39.7802734375, 40.99951171875, 42.21875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 16.0, 12.0, 17.0, 37.0, 42.0, 68.0, 118.0, 171.0, 285.0, 563.0, 875.0, 1615.0, 2933.0, 5321.0, 9907.0, 19371.0, 38934.0, 79463.0, 151829.0, 226254.0, 220710.0, 141216.0, 74297.0, 36163.0, 18177.0, 9163.0, 4863.0, 2606.0, 1448.0, 801.0, 484.0, 284.0, 176.0, 85.0, 68.0, 56.0, 34.0, 23.0, 17.0, 6.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-52.15625, -50.61962890625, -49.0830078125, -47.54638671875, -46.009765625, -44.47314453125, -42.9365234375, -41.39990234375, -39.86328125, -38.32666015625, -36.7900390625, -35.25341796875, -33.716796875, -32.18017578125, -30.6435546875, -29.10693359375, -27.5703125, -26.03369140625, -24.4970703125, -22.96044921875, -21.423828125, -19.88720703125, -18.3505859375, -16.81396484375, -15.27734375, -13.74072265625, -12.2041015625, -10.66748046875, -9.130859375, -7.59423828125, -6.0576171875, -4.52099609375, -2.984375, -1.44775390625, 0.0888671875, 1.62548828125, 3.162109375, 4.69873046875, 6.2353515625, 7.77197265625, 9.30859375, 10.84521484375, 12.3818359375, 13.91845703125, 15.455078125, 16.99169921875, 18.5283203125, 20.06494140625, 21.6015625, 23.13818359375, 24.6748046875, 26.21142578125, 27.748046875, 29.28466796875, 30.8212890625, 32.35791015625, 33.89453125, 35.43115234375, 36.9677734375, 38.50439453125, 40.041015625, 41.57763671875, 43.1142578125, 44.65087890625, 46.1875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 4.0, 11.0, 8.0, 10.0, 14.0, 6.0, 20.0, 33.0, 40.0, 48.0, 69.0, 75.0, 77.0, 76.0, 106.0, 82.0, 81.0, 58.0, 44.0, 28.0, 34.0, 15.0, 23.0, 6.0, 12.0, 3.0, 3.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005977630615234375, -0.00580209493637085, -0.005626559257507324, -0.005451023578643799, -0.0052754878997802734, -0.005099952220916748, -0.004924416542053223, -0.004748880863189697, -0.004573345184326172, -0.0043978095054626465, -0.004222273826599121, -0.004046738147735596, -0.0038712024688720703, -0.003695666790008545, -0.0035201311111450195, -0.003344595432281494, -0.0031690597534179688, -0.0029935240745544434, -0.002817988395690918, -0.0026424527168273926, -0.002466917037963867, -0.002291381359100342, -0.0021158456802368164, -0.001940310001373291, -0.0017647743225097656, -0.0015892386436462402, -0.0014137029647827148, -0.0012381672859191895, -0.001062631607055664, -0.0008870959281921387, -0.0007115602493286133, -0.0005360245704650879, -0.0003604888916015625, -0.0001849532127380371, -9.417533874511719e-06, 0.00016611814498901367, 0.00034165382385253906, 0.0005171895027160645, 0.0006927251815795898, 0.0008682608604431152, 0.0010437965393066406, 0.001219332218170166, 0.0013948678970336914, 0.0015704035758972168, 0.0017459392547607422, 0.0019214749336242676, 0.002097010612487793, 0.0022725462913513184, 0.0024480819702148438, 0.002623617649078369, 0.0027991533279418945, 0.00297468900680542, 0.0031502246856689453, 0.0033257603645324707, 0.003501296043395996, 0.0036768317222595215, 0.003852367401123047, 0.004027903079986572, 0.004203438758850098, 0.004378974437713623, 0.0045545101165771484, 0.004730045795440674, 0.004905581474304199, 0.005081117153167725, 0.00525665283203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 19.0, 22.0, 43.0, 49.0, 68.0, 105.0, 134.0, 222.0, 299.0, 457.0, 695.0, 966.0, 1394.0, 2072.0, 3061.0, 4621.0, 6828.0, 10779.0, 16496.0, 25635.0, 40094.0, 61495.0, 91021.0, 124157.0, 147225.0, 144287.0, 119075.0, 85025.0, 56928.0, 36932.0, 23699.0, 15457.0, 9870.0, 6257.0, 4237.0, 2757.0, 1950.0, 1310.0, 888.0, 587.0, 397.0, 289.0, 207.0, 129.0, 99.0, 70.0, 33.0, 29.0, 24.0, 22.0, 12.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0], "bins": [-26.75, -25.884521484375, -25.01904296875, -24.153564453125, -23.2880859375, -22.422607421875, -21.55712890625, -20.691650390625, -19.826171875, -18.960693359375, -18.09521484375, -17.229736328125, -16.3642578125, -15.498779296875, -14.63330078125, -13.767822265625, -12.90234375, -12.036865234375, -11.17138671875, -10.305908203125, -9.4404296875, -8.574951171875, -7.70947265625, -6.843994140625, -5.978515625, -5.113037109375, -4.24755859375, -3.382080078125, -2.5166015625, -1.651123046875, -0.78564453125, 0.079833984375, 0.9453125, 1.810791015625, 2.67626953125, 3.541748046875, 4.4072265625, 5.272705078125, 6.13818359375, 7.003662109375, 7.869140625, 8.734619140625, 9.60009765625, 10.465576171875, 11.3310546875, 12.196533203125, 13.06201171875, 13.927490234375, 14.79296875, 15.658447265625, 16.52392578125, 17.389404296875, 18.2548828125, 19.120361328125, 19.98583984375, 20.851318359375, 21.716796875, 22.582275390625, 23.44775390625, 24.313232421875, 25.1787109375, 26.044189453125, 26.90966796875, 27.775146484375, 28.640625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 11.0, 16.0, 17.0, 21.0, 20.0, 30.0, 25.0, 38.0, 31.0, 41.0, 44.0, 55.0, 49.0, 52.0, 39.0, 54.0, 51.0, 46.0, 52.0, 43.0, 49.0, 30.0, 27.0, 22.0, 17.0, 11.0, 15.0, 13.0, 8.0, 7.0, 9.0, 4.0, 4.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.0859375, -9.784423828125, -9.48291015625, -9.181396484375, -8.8798828125, -8.578369140625, -8.27685546875, -7.975341796875, -7.673828125, -7.372314453125, -7.07080078125, -6.769287109375, -6.4677734375, -6.166259765625, -5.86474609375, -5.563232421875, -5.26171875, -4.960205078125, -4.65869140625, -4.357177734375, -4.0556640625, -3.754150390625, -3.45263671875, -3.151123046875, -2.849609375, -2.548095703125, -2.24658203125, -1.945068359375, -1.6435546875, -1.342041015625, -1.04052734375, -0.739013671875, -0.4375, -0.135986328125, 0.16552734375, 0.467041015625, 0.7685546875, 1.070068359375, 1.37158203125, 1.673095703125, 1.974609375, 2.276123046875, 2.57763671875, 2.879150390625, 3.1806640625, 3.482177734375, 3.78369140625, 4.085205078125, 4.38671875, 4.688232421875, 4.98974609375, 5.291259765625, 5.5927734375, 5.894287109375, 6.19580078125, 6.497314453125, 6.798828125, 7.100341796875, 7.40185546875, 7.703369140625, 8.0048828125, 8.306396484375, 8.60791015625, 8.909423828125, 9.2109375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 8.0, 10.0, 17.0, 29.0, 16.0, 27.0, 41.0, 26.0, 35.0, 40.0, 41.0, 45.0, 51.0, 49.0, 48.0, 47.0, 43.0, 38.0, 52.0, 39.0, 35.0, 31.0, 39.0, 32.0, 17.0, 26.0, 19.0, 17.0, 8.0, 9.0, 8.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.01078796386719, -66.85242462158203, -64.69405364990234, -62.53569030761719, -60.37732696533203, -58.21895980834961, -56.06059265136719, -53.90222930908203, -51.74386215209961, -49.58549499511719, -47.42713165283203, -45.26876449584961, -43.11039733886719, -40.95203399658203, -38.79366683959961, -36.63529968261719, -34.47693634033203, -32.31856918334961, -30.160205841064453, -28.00183868408203, -25.843473434448242, -23.685108184814453, -21.52674102783203, -19.368375778198242, -17.210010528564453, -15.051645278930664, -12.893279075622559, -10.734912872314453, -8.576547622680664, -6.418182373046875, -4.2598161697387695, -2.101449966430664, 0.05690765380859375, 2.215273380279541, 4.373639106750488, 6.5320048332214355, 8.690370559692383, 10.848735809326172, 13.007102012634277, 15.165468215942383, 17.323833465576172, 19.48219871520996, 21.64056396484375, 23.798931121826172, 25.95729637145996, 28.11566162109375, 30.274028778076172, 32.432395935058594, 34.59075927734375, 36.74912643432617, 38.90748977661133, 41.06585693359375, 43.224220275878906, 45.38258743286133, 47.54095458984375, 49.699317932128906, 51.85768508911133, 54.01605224609375, 56.174415588378906, 58.33278274536133, 60.49114990234375, 62.649513244628906, 64.80787658691406, 66.96624755859375, 69.1246109008789]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 11.0, 8.0, 18.0, 15.0, 12.0, 20.0, 24.0, 30.0, 28.0, 43.0, 32.0, 35.0, 37.0, 29.0, 39.0, 38.0, 47.0, 46.0, 40.0, 45.0, 39.0, 35.0, 33.0, 30.0, 35.0, 19.0, 23.0, 25.0, 27.0, 26.0, 17.0, 9.0, 13.0, 12.0, 6.0, 8.0, 8.0, 1.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.76392364501953, -62.54938888549805, -60.3348503112793, -58.12031555175781, -55.90577697753906, -53.69124221801758, -51.476707458496094, -49.262168884277344, -47.04763412475586, -44.833099365234375, -42.618560791015625, -40.40402603149414, -38.189491271972656, -35.974952697753906, -33.76041793823242, -31.545881271362305, -29.331344604492188, -27.11680793762207, -24.902271270751953, -22.68773651123047, -20.47319984436035, -18.258663177490234, -16.04412841796875, -13.829591751098633, -11.615055084228516, -9.400518417358398, -7.185982704162598, -4.971446514129639, -2.7569103240966797, -0.5423736572265625, 1.6721620559692383, 3.886697769165039, 6.101234436035156, 8.315771102905273, 10.530306816101074, 12.744842529296875, 14.959379196166992, 17.17391586303711, 19.388450622558594, 21.60298728942871, 23.817523956298828, 26.032060623168945, 28.246597290039062, 30.461132049560547, 32.67566680908203, 34.89020538330078, 37.104740142822266, 39.31927490234375, 41.5338134765625, 43.748348236083984, 45.962886810302734, 48.17742156982422, 50.39196014404297, 52.60649490356445, 54.82102966308594, 57.03556823730469, 59.25010299682617, 61.464637756347656, 63.679176330566406, 65.89371490478516, 68.10824584960938, 70.32278442382812, 72.53732299804688, 74.7518539428711, 76.96639251708984]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 11.0, 11.0, 19.0, 25.0, 28.0, 40.0, 51.0, 74.0, 68.0, 133.0, 126.0, 171.0, 232.0, 293.0, 414.0, 537.0, 730.0, 940.0, 1402.0, 2411.0, 4144.0, 8885.0, 491303.0, 4284.0, 2432.0, 1420.0, 1011.0, 752.0, 568.0, 430.0, 311.0, 241.0, 183.0, 112.0, 118.0, 93.0, 54.0, 44.0, 33.0, 34.0, 21.0, 21.0, 13.0, 11.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-737.7885131835938, -713.224609375, -688.6607055664062, -664.0968017578125, -639.5328369140625, -614.9689331054688, -590.405029296875, -565.8411254882812, -541.2772216796875, -516.7133178710938, -492.1494140625, -467.5854797363281, -443.0215759277344, -418.4576721191406, -393.89373779296875, -369.329833984375, -344.76593017578125, -320.2020263671875, -295.63812255859375, -271.0741882324219, -246.51028442382812, -221.94638061523438, -197.38246154785156, -172.81854248046875, -148.254638671875, -123.69072723388672, -99.12681579589844, -74.56290435791016, -49.998992919921875, -25.435081481933594, -0.8711700439453125, 23.6927490234375, 48.25665283203125, 72.82056427001953, 97.38447570800781, 121.9483871459961, 146.51229858398438, 171.07620239257812, 195.64012145996094, 220.20404052734375, 244.7679443359375, 269.33184814453125, 293.895751953125, 318.4596862792969, 343.0235900878906, 367.5874938964844, 392.15142822265625, 416.71533203125, 441.27923583984375, 465.8431396484375, 490.40704345703125, 514.970947265625, 539.534912109375, 564.0988159179688, 588.6627197265625, 613.2266235351562, 637.79052734375, 662.3544311523438, 686.9183349609375, 711.4822387695312, 736.046142578125, 760.610107421875, 785.1740112304688, 809.7379150390625, 834.3018188476562]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 3.0, 9.0, 10.0, 14.0, 21.0, 10.0, 21.0, 25.0, 29.0, 27.0, 45.0, 32.0, 30.0, 42.0, 28.0, 39.0, 48.0, 41.0, 1070.0, 36.0, 43.0, 45.0, 31.0, 32.0, 31.0, 33.0, 23.0, 22.0, 31.0, 23.0, 19.0, 22.0, 9.0, 10.0, 11.0, 11.0, 9.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2068.56884765625, -1997.9425048828125, -1927.316162109375, -1856.6898193359375, -1786.0634765625, -1715.43701171875, -1644.8106689453125, -1574.184326171875, -1503.5579833984375, -1432.931640625, -1362.3052978515625, -1291.678955078125, -1221.052490234375, -1150.42626953125, -1079.7998046875, -1009.1734619140625, -938.547119140625, -867.9207763671875, -797.29443359375, -726.6680297851562, -656.0416870117188, -585.4153442382812, -514.7889404296875, -444.16259765625, -373.5362548828125, -302.909912109375, -232.28353881835938, -161.6571807861328, -91.03082275390625, -20.40447998046875, 50.221893310546875, 120.8482666015625, 191.474853515625, 262.1011962890625, 332.7275695800781, 403.35394287109375, 473.98028564453125, 544.6066284179688, 615.2330322265625, 685.859375, 756.4857177734375, 827.112060546875, 897.7384033203125, 968.3648071289062, 1038.9912109375, 1109.617431640625, 1180.243896484375, 1250.8702392578125, 1321.49658203125, 1392.1229248046875, 1462.749267578125, 1533.3756103515625, 1604.001953125, 1674.62841796875, 1745.2547607421875, 1815.881103515625, 1886.5074462890625, 1957.1337890625, 2027.7601318359375, 2098.386474609375, 2169.012939453125, 2239.63916015625, 2310.265625, 2380.89208984375, 2451.518310546875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 4.0, 5.0, 7.0, 4.0, 11.0, 9.0, 13.0, 13.0, 11.0, 30.0, 35.0, 27.0, 37.0, 62.0, 74.0, 118.0, 154.0, 212.0, 311.0, 437.0, 569.0, 740.0, 925.0, 1237.0, 1614.0, 2117.0, 2660.0, 4093.0, 7531.0, 64020.0, 31128602.0, 15112.0, 9158.0, 7984.0, 3354.0, 1239.0, 732.0, 400.0, 227.0, 178.0, 123.0, 127.0, 86.0, 50.0, 30.0, 13.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2639.215087890625, -2579.439697265625, -2519.664306640625, -2459.88916015625, -2400.11376953125, -2340.33837890625, -2280.56298828125, -2220.78759765625, -2161.01220703125, -2101.23681640625, -2041.4615478515625, -1981.6861572265625, -1921.9107666015625, -1862.135498046875, -1802.360107421875, -1742.584716796875, -1682.8094482421875, -1623.0340576171875, -1563.2587890625, -1503.4833984375, -1443.7080078125, -1383.9326171875, -1324.1573486328125, -1264.3819580078125, -1204.606689453125, -1144.831298828125, -1085.0560302734375, -1025.2806396484375, -965.5052490234375, -905.7299194335938, -845.95458984375, -786.17919921875, -726.4039306640625, -666.6286010742188, -606.8532104492188, -547.077880859375, -487.3025207519531, -427.52716064453125, -367.7518310546875, -307.9764709472656, -248.20111083984375, -188.42575073242188, -128.65040588378906, -68.87506103515625, -9.099700927734375, 50.6756591796875, 110.45098876953125, 170.22634887695312, 230.001708984375, 289.7770690917969, 349.55242919921875, 409.3277587890625, 469.1031188964844, 528.8784790039062, 588.65380859375, 648.42919921875, 708.2045288085938, 767.9798583984375, 827.7552490234375, 887.5305786132812, 947.305908203125, 1007.081298828125, 1066.856689453125, 1126.6319580078125, 1186.4073486328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 18.0, 20.0, 31.0, 34.0, 55.0, 95.0, 109.0, 173.0, 278.0, 396.0, 573.0, 834.0, 1389.0, 2150.0, 3548.0, 5633.0, 9535.0, 16273.0, 28471.0, 50647.0, 92299.0, 175690.0, 351865.0, 773437.0, 1821933.0, 1611281.0, 678234.0, 313769.0, 159150.0, 83891.0, 45874.0, 25861.0, 14927.0, 8935.0, 5198.0, 3242.0, 1960.0, 1257.0, 809.0, 540.0, 337.0, 196.0, 157.0, 117.0, 71.0, 41.0, 32.0, 25.0, 13.0, 6.0, 6.0, 10.0, 1.0, 2.0, 1.0, 1.0], "bins": [-199.375, -193.318359375, -187.26171875, -181.205078125, -175.1484375, -169.091796875, -163.03515625, -156.978515625, -150.921875, -144.865234375, -138.80859375, -132.751953125, -126.6953125, -120.638671875, -114.58203125, -108.525390625, -102.46875, -96.412109375, -90.35546875, -84.298828125, -78.2421875, -72.185546875, -66.12890625, -60.072265625, -54.015625, -47.958984375, -41.90234375, -35.845703125, -29.7890625, -23.732421875, -17.67578125, -11.619140625, -5.5625, 0.494140625, 6.55078125, 12.607421875, 18.6640625, 24.720703125, 30.77734375, 36.833984375, 42.890625, 48.947265625, 55.00390625, 61.060546875, 67.1171875, 73.173828125, 79.23046875, 85.287109375, 91.34375, 97.400390625, 103.45703125, 109.513671875, 115.5703125, 121.626953125, 127.68359375, 133.740234375, 139.796875, 145.853515625, 151.91015625, 157.966796875, 164.0234375, 170.080078125, 176.13671875, 182.193359375, 188.25]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 1.0, 5.0, 9.0, 15.0, 14.0, 13.0, 17.0, 22.0, 28.0, 22.0, 44.0, 54.0, 54.0, 78.0, 83.0, 131.0, 136.0, 180.0, 214.0, 169.0, 157.0, 109.0, 92.0, 77.0, 57.0, 50.0, 37.0, 18.0, 31.0, 25.0, 15.0, 9.0, 10.0, 10.0, 5.0, 13.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-82.5625, -80.03515625, -77.5078125, -74.98046875, -72.453125, -69.92578125, -67.3984375, -64.87109375, -62.34375, -59.81640625, -57.2890625, -54.76171875, -52.234375, -49.70703125, -47.1796875, -44.65234375, -42.125, -39.59765625, -37.0703125, -34.54296875, -32.015625, -29.48828125, -26.9609375, -24.43359375, -21.90625, -19.37890625, -16.8515625, -14.32421875, -11.796875, -9.26953125, -6.7421875, -4.21484375, -1.6875, 0.83984375, 3.3671875, 5.89453125, 8.421875, 10.94921875, 13.4765625, 16.00390625, 18.53125, 21.05859375, 23.5859375, 26.11328125, 28.640625, 31.16796875, 33.6953125, 36.22265625, 38.75, 41.27734375, 43.8046875, 46.33203125, 48.859375, 51.38671875, 53.9140625, 56.44140625, 58.96875, 61.49609375, 64.0234375, 66.55078125, 69.078125, 71.60546875, 74.1328125, 76.66015625, 79.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 17.0, 14.0, 22.0, 22.0, 28.0, 56.0, 91.0, 121.0, 179.0, 253.0, 348.0, 529.0, 783.0, 1270.0, 1888.0, 3057.0, 5135.0, 8548.0, 14640.0, 24624.0, 42670.0, 76094.0, 135727.0, 244195.0, 458225.0, 985853.0, 1969935.0, 1167544.0, 522490.0, 272559.0, 152026.0, 85714.0, 48255.0, 27702.0, 16098.0, 9451.0, 5497.0, 3511.0, 2064.0, 1428.0, 911.0, 585.0, 394.0, 292.0, 178.0, 123.0, 87.0, 55.0, 36.0, 36.0, 30.0, 22.0, 8.0, 5.0, 5.0, 8.0, 2.0, 3.0], "bins": [-98.625, -95.599609375, -92.57421875, -89.548828125, -86.5234375, -83.498046875, -80.47265625, -77.447265625, -74.421875, -71.396484375, -68.37109375, -65.345703125, -62.3203125, -59.294921875, -56.26953125, -53.244140625, -50.21875, -47.193359375, -44.16796875, -41.142578125, -38.1171875, -35.091796875, -32.06640625, -29.041015625, -26.015625, -22.990234375, -19.96484375, -16.939453125, -13.9140625, -10.888671875, -7.86328125, -4.837890625, -1.8125, 1.212890625, 4.23828125, 7.263671875, 10.2890625, 13.314453125, 16.33984375, 19.365234375, 22.390625, 25.416015625, 28.44140625, 31.466796875, 34.4921875, 37.517578125, 40.54296875, 43.568359375, 46.59375, 49.619140625, 52.64453125, 55.669921875, 58.6953125, 61.720703125, 64.74609375, 67.771484375, 70.796875, 73.822265625, 76.84765625, 79.873046875, 82.8984375, 85.923828125, 88.94921875, 91.974609375, 95.0]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 11.0, 15.0, 12.0, 11.0, 22.0, 28.0, 38.0, 61.0, 73.0, 100.0, 150.0, 189.0, 273.0, 279.0, 229.0, 157.0, 90.0, 56.0, 45.0, 30.0, 37.0, 24.0, 18.0, 14.0, 7.0, 12.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-157.375, -153.2744140625, -149.173828125, -145.0732421875, -140.97265625, -136.8720703125, -132.771484375, -128.6708984375, -124.5703125, -120.4697265625, -116.369140625, -112.2685546875, -108.16796875, -104.0673828125, -99.966796875, -95.8662109375, -91.765625, -87.6650390625, -83.564453125, -79.4638671875, -75.36328125, -71.2626953125, -67.162109375, -63.0615234375, -58.9609375, -54.8603515625, -50.759765625, -46.6591796875, -42.55859375, -38.4580078125, -34.357421875, -30.2568359375, -26.15625, -22.0556640625, -17.955078125, -13.8544921875, -9.75390625, -5.6533203125, -1.552734375, 2.5478515625, 6.6484375, 10.7490234375, 14.849609375, 18.9501953125, 23.05078125, 27.1513671875, 31.251953125, 35.3525390625, 39.453125, 43.5537109375, 47.654296875, 51.7548828125, 55.85546875, 59.9560546875, 64.056640625, 68.1572265625, 72.2578125, 76.3583984375, 80.458984375, 84.5595703125, 88.66015625, 92.7607421875, 96.861328125, 100.9619140625, 105.0625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 26.0, 26.0, 35.0, 61.0, 79.0, 120.0, 217.0, 348.0, 555.0, 890.0, 1468.0, 2680.0, 5104.0, 9861.0, 20252.0, 43308.0, 109605.0, 5442987.0, 491098.0, 89461.0, 36893.0, 17436.0, 8740.0, 4535.0, 2354.0, 1261.0, 772.0, 439.0, 293.0, 193.0, 124.0, 85.0, 38.0, 24.0, 13.0, 13.0, 9.0, 7.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-239.125, -229.119140625, -219.11328125, -209.107421875, -199.1015625, -189.095703125, -179.08984375, -169.083984375, -159.078125, -149.072265625, -139.06640625, -129.060546875, -119.0546875, -109.048828125, -99.04296875, -89.037109375, -79.03125, -69.025390625, -59.01953125, -49.013671875, -39.0078125, -29.001953125, -18.99609375, -8.990234375, 1.015625, 11.021484375, 21.02734375, 31.033203125, 41.0390625, 51.044921875, 61.05078125, 71.056640625, 81.0625, 91.068359375, 101.07421875, 111.080078125, 121.0859375, 131.091796875, 141.09765625, 151.103515625, 161.109375, 171.115234375, 181.12109375, 191.126953125, 201.1328125, 211.138671875, 221.14453125, 231.150390625, 241.15625, 251.162109375, 261.16796875, 271.173828125, 281.1796875, 291.185546875, 301.19140625, 311.197265625, 321.203125, 331.208984375, 341.21484375, 351.220703125, 361.2265625, 371.232421875, 381.23828125, 391.244140625, 401.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 9.0, 18.0, 27.0, 35.0, 23.0, 42.0, 42.0, 42.0, 63.0, 71.0, 135.0, 235.0, 329.0, 260.0, 147.0, 87.0, 68.0, 56.0, 33.0, 36.0, 46.0, 29.0, 19.0, 19.0, 25.0, 13.0, 12.0, 9.0, 7.0, 7.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-152.5, -147.5546875, -142.609375, -137.6640625, -132.71875, -127.7734375, -122.828125, -117.8828125, -112.9375, -107.9921875, -103.046875, -98.1015625, -93.15625, -88.2109375, -83.265625, -78.3203125, -73.375, -68.4296875, -63.484375, -58.5390625, -53.59375, -48.6484375, -43.703125, -38.7578125, -33.8125, -28.8671875, -23.921875, -18.9765625, -14.03125, -9.0859375, -4.140625, 0.8046875, 5.75, 10.6953125, 15.640625, 20.5859375, 25.53125, 30.4765625, 35.421875, 40.3671875, 45.3125, 50.2578125, 55.203125, 60.1484375, 65.09375, 70.0390625, 74.984375, 79.9296875, 84.875, 89.8203125, 94.765625, 99.7109375, 104.65625, 109.6015625, 114.546875, 119.4921875, 124.4375, 129.3828125, 134.328125, 139.2734375, 144.21875, 149.1640625, 154.109375, 159.0546875, 164.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 7.0, 12.0, 15.0, 22.0, 30.0, 51.0, 45.0, 71.0, 105.0, 177.0, 142.0, 79.0, 56.0, 32.0, 41.0, 26.0, 19.0, 10.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-8581.712890625, -8398.4638671875, -8215.2138671875, -8031.96484375, -7848.71533203125, -7665.4658203125, -7482.216796875, -7298.96728515625, -7115.7177734375, -6932.46826171875, -6749.21875, -6565.9697265625, -6382.72021484375, -6199.470703125, -6016.2216796875, -5832.97216796875, -5649.72265625, -5466.47314453125, -5283.2236328125, -5099.974609375, -4916.72509765625, -4733.4755859375, -4550.2265625, -4366.97705078125, -4183.7275390625, -4000.47802734375, -3817.228759765625, -3633.9794921875, -3450.72998046875, -3267.48046875, -3084.231201171875, -2900.98193359375, -2717.732421875, -2534.48291015625, -2351.233642578125, -2167.984375, -1984.73486328125, -1801.4854736328125, -1618.236083984375, -1434.9866943359375, -1251.7373046875, -1068.4879150390625, -885.238525390625, -701.9891357421875, -518.73974609375, -335.4903564453125, -152.240966796875, 31.0084228515625, 214.2578125, 397.5072021484375, 580.756591796875, 764.0059814453125, 947.25537109375, 1130.5047607421875, 1313.754150390625, 1497.0035400390625, 1680.2529296875, 1863.5023193359375, 2046.751708984375, 2230.0009765625, 2413.25048828125, 2596.5, 2779.749267578125, 2962.99853515625, 3146.248046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 3.0, 4.0, 7.0, 12.0, 12.0, 19.0, 8.0, 21.0, 18.0, 14.0, 18.0, 25.0, 21.0, 23.0, 47.0, 70.0, 117.0, 149.0, 85.0, 45.0, 44.0, 31.0, 35.0, 19.0, 24.0, 16.0, 19.0, 12.0, 8.0, 9.0, 6.0, 13.0, 8.0, 6.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4715.66064453125, -4569.54931640625, -4423.4375, -4277.326171875, -4131.21484375, -3985.10302734375, -3838.99169921875, -3692.880126953125, -3546.7685546875, -3400.656982421875, -3254.54541015625, -3108.43408203125, -2962.322509765625, -2816.2109375, -2670.099609375, -2523.988037109375, -2377.87646484375, -2231.764892578125, -2085.6533203125, -1939.5419921875, -1793.430419921875, -1647.31884765625, -1501.2073974609375, -1355.095947265625, -1208.984375, -1062.872802734375, -916.7613525390625, -770.6498413085938, -624.538330078125, -478.42681884765625, -332.3153076171875, -186.20379638671875, -40.091796875, 106.01971435546875, 252.1312255859375, 398.24273681640625, 544.354248046875, 690.4657592773438, 836.5772705078125, 982.6887817382812, 1128.80029296875, 1274.911865234375, 1421.0233154296875, 1567.134765625, 1713.246337890625, 1859.35791015625, 2005.4693603515625, 2151.580810546875, 2297.6923828125, 2443.803955078125, 2589.91552734375, 2736.02685546875, 2882.138427734375, 3028.25, 3174.361328125, 3320.472900390625, 3466.58447265625, 3612.696044921875, 3758.8076171875, 3904.9189453125, 4051.030517578125, 4197.14208984375, 4343.25341796875, 4489.365234375, 4635.4765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 7.0, 12.0, 26.0, 14.0, 30.0, 46.0, 59.0, 64.0, 81.0, 151.0, 204.0, 268.0, 395.0, 476.0, 745.0, 1093.0, 1601.0, 2294.0, 3450.0, 5307.0, 8338.0, 13599.0, 23310.0, 44932.0, 106009.0, 375449.0, 2779088.0, 575042.0, 140608.0, 52859.0, 25093.0, 13445.0, 7697.0, 4513.0, 2911.0, 1859.0, 1200.0, 707.0, 433.0, 314.0, 200.0, 135.0, 80.0, 55.0, 32.0, 17.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-42.71875, -41.5185546875, -40.318359375, -39.1181640625, -37.91796875, -36.7177734375, -35.517578125, -34.3173828125, -33.1171875, -31.9169921875, -30.716796875, -29.5166015625, -28.31640625, -27.1162109375, -25.916015625, -24.7158203125, -23.515625, -22.3154296875, -21.115234375, -19.9150390625, -18.71484375, -17.5146484375, -16.314453125, -15.1142578125, -13.9140625, -12.7138671875, -11.513671875, -10.3134765625, -9.11328125, -7.9130859375, -6.712890625, -5.5126953125, -4.3125, -3.1123046875, -1.912109375, -0.7119140625, 0.48828125, 1.6884765625, 2.888671875, 4.0888671875, 5.2890625, 6.4892578125, 7.689453125, 8.8896484375, 10.08984375, 11.2900390625, 12.490234375, 13.6904296875, 14.890625, 16.0908203125, 17.291015625, 18.4912109375, 19.69140625, 20.8916015625, 22.091796875, 23.2919921875, 24.4921875, 25.6923828125, 26.892578125, 28.0927734375, 29.29296875, 30.4931640625, 31.693359375, 32.8935546875, 34.09375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 2.0, 12.0, 3.0, 4.0, 13.0, 9.0, 14.0, 23.0, 24.0, 42.0, 41.0, 59.0, 93.0, 125.0, 134.0, 82.0, 78.0, 62.0, 40.0, 30.0, 19.0, 18.0, 12.0, 12.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.703125, -4.575531005859375, -4.44793701171875, -4.320343017578125, -4.1927490234375, -4.065155029296875, -3.93756103515625, -3.809967041015625, -3.682373046875, -3.554779052734375, -3.42718505859375, -3.299591064453125, -3.1719970703125, -3.044403076171875, -2.91680908203125, -2.789215087890625, -2.66162109375, -2.534027099609375, -2.40643310546875, -2.278839111328125, -2.1512451171875, -2.023651123046875, -1.89605712890625, -1.768463134765625, -1.640869140625, -1.513275146484375, -1.38568115234375, -1.258087158203125, -1.1304931640625, -1.002899169921875, -0.87530517578125, -0.747711181640625, -0.6201171875, -0.492523193359375, -0.36492919921875, -0.237335205078125, -0.1097412109375, 0.017852783203125, 0.14544677734375, 0.273040771484375, 0.400634765625, 0.528228759765625, 0.65582275390625, 0.783416748046875, 0.9110107421875, 1.038604736328125, 1.16619873046875, 1.293792724609375, 1.42138671875, 1.548980712890625, 1.67657470703125, 1.804168701171875, 1.9317626953125, 2.059356689453125, 2.18695068359375, 2.314544677734375, 2.442138671875, 2.569732666015625, 2.69732666015625, 2.824920654296875, 2.9525146484375, 3.080108642578125, 3.20770263671875, 3.335296630859375, 3.462890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 6.0, 8.0, 9.0, 37.0, 32.0, 44.0, 53.0, 112.0, 113.0, 187.0, 230.0, 375.0, 549.0, 887.0, 1491.0, 2552.0, 4864.0, 9771.0, 21848.0, 53910.0, 147571.0, 458985.0, 1856567.0, 1129297.0, 322730.0, 107213.0, 40508.0, 16963.0, 7803.0, 3891.0, 2129.0, 1177.0, 808.0, 467.0, 306.0, 217.0, 153.0, 126.0, 91.0, 57.0, 50.0, 27.0, 16.0, 14.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.84375, -36.53173828125, -35.2197265625, -33.90771484375, -32.595703125, -31.28369140625, -29.9716796875, -28.65966796875, -27.34765625, -26.03564453125, -24.7236328125, -23.41162109375, -22.099609375, -20.78759765625, -19.4755859375, -18.16357421875, -16.8515625, -15.53955078125, -14.2275390625, -12.91552734375, -11.603515625, -10.29150390625, -8.9794921875, -7.66748046875, -6.35546875, -5.04345703125, -3.7314453125, -2.41943359375, -1.107421875, 0.20458984375, 1.5166015625, 2.82861328125, 4.140625, 5.45263671875, 6.7646484375, 8.07666015625, 9.388671875, 10.70068359375, 12.0126953125, 13.32470703125, 14.63671875, 15.94873046875, 17.2607421875, 18.57275390625, 19.884765625, 21.19677734375, 22.5087890625, 23.82080078125, 25.1328125, 26.44482421875, 27.7568359375, 29.06884765625, 30.380859375, 31.69287109375, 33.0048828125, 34.31689453125, 35.62890625, 36.94091796875, 38.2529296875, 39.56494140625, 40.876953125, 42.18896484375, 43.5009765625, 44.81298828125, 46.125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 12.0, 17.0, 14.0, 18.0, 12.0, 30.0, 28.0, 32.0, 43.0, 67.0, 66.0, 90.0, 115.0, 145.0, 168.0, 237.0, 266.0, 407.0, 543.0, 343.0, 266.0, 229.0, 183.0, 145.0, 115.0, 87.0, 85.0, 64.0, 48.0, 55.0, 34.0, 27.0, 17.0, 12.0, 12.0, 9.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.59375, -14.2027587890625, -13.811767578125, -13.4207763671875, -13.02978515625, -12.6387939453125, -12.247802734375, -11.8568115234375, -11.4658203125, -11.0748291015625, -10.683837890625, -10.2928466796875, -9.90185546875, -9.5108642578125, -9.119873046875, -8.7288818359375, -8.337890625, -7.9468994140625, -7.555908203125, -7.1649169921875, -6.77392578125, -6.3829345703125, -5.991943359375, -5.6009521484375, -5.2099609375, -4.8189697265625, -4.427978515625, -4.0369873046875, -3.64599609375, -3.2550048828125, -2.864013671875, -2.4730224609375, -2.08203125, -1.6910400390625, -1.300048828125, -0.9090576171875, -0.51806640625, -0.1270751953125, 0.263916015625, 0.6549072265625, 1.0458984375, 1.4368896484375, 1.827880859375, 2.2188720703125, 2.60986328125, 3.0008544921875, 3.391845703125, 3.7828369140625, 4.173828125, 4.5648193359375, 4.955810546875, 5.3468017578125, 5.73779296875, 6.1287841796875, 6.519775390625, 6.9107666015625, 7.3017578125, 7.6927490234375, 8.083740234375, 8.4747314453125, 8.86572265625, 9.2567138671875, 9.647705078125, 10.0386962890625, 10.4296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 8.0, 12.0, 27.0, 61.0, 108.0, 163.0, 184.0, 184.0, 121.0, 54.0, 33.0, 16.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-214.38536071777344, -205.2847442626953, -196.18414306640625, -187.08352661132812, -177.98291015625, -168.88229370117188, -159.78167724609375, -150.6810760498047, -141.58045959472656, -132.47984313964844, -123.37923431396484, -114.27862548828125, -105.17800903320312, -96.077392578125, -86.9767837524414, -77.87617492675781, -68.77555847167969, -59.67494583129883, -50.57433319091797, -41.47372055053711, -32.37310791015625, -23.27249526977539, -14.171882629394531, -5.071269989013672, 4.0293426513671875, 13.129955291748047, 22.230567932128906, 31.331180572509766, 40.431793212890625, 49.532405853271484, 58.633018493652344, 67.73362731933594, 76.83425903320312, 85.93487548828125, 95.03548431396484, 104.13609313964844, 113.23670959472656, 122.33732604980469, 131.43792724609375, 140.53854370117188, 149.63916015625, 158.73977661132812, 167.84039306640625, 176.9409942626953, 186.04161071777344, 195.14222717285156, 204.24282836914062, 213.34344482421875, 222.44406127929688, 231.544677734375, 240.64529418945312, 249.7458953857422, 258.84649658203125, 267.9471130371094, 277.0477294921875, 286.1483459472656, 295.24896240234375, 304.3495788574219, 313.4501953125, 322.5508117675781, 331.65142822265625, 340.75201416015625, 349.8526306152344, 358.9532470703125, 368.0538635253906]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 13.0, 11.0, 17.0, 17.0, 28.0, 30.0, 51.0, 56.0, 63.0, 61.0, 58.0, 67.0, 78.0, 66.0, 58.0, 49.0, 43.0, 32.0, 47.0, 42.0, 23.0, 23.0, 19.0, 10.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-166.04632568359375, -161.99449157714844, -157.9426727294922, -153.89083862304688, -149.83900451660156, -145.7871856689453, -141.7353515625, -137.6835174560547, -133.63169860839844, -129.57986450195312, -125.52803802490234, -121.47621154785156, -117.42438507080078, -113.37255859375, -109.32072448730469, -105.2688980102539, -101.2170639038086, -97.16523742675781, -93.1134033203125, -89.06157684326172, -85.00975036621094, -80.95791625976562, -76.90608978271484, -72.85426330566406, -68.80242919921875, -64.75060272216797, -60.69877243041992, -56.646942138671875, -52.595115661621094, -48.54328536987305, -44.491455078125, -40.43962860107422, -36.38780975341797, -32.33597946166992, -28.28415298461914, -24.232322692871094, -20.18049430847168, -16.128665924072266, -12.076835632324219, -8.025007247924805, -3.9731788635253906, 0.07864999771118164, 4.130478858947754, 8.182308197021484, 12.234136581420898, 16.285964965820312, 20.33779525756836, 24.389623641967773, 28.441452026367188, 32.493282318115234, 36.545108795166016, 40.59693908691406, 44.648765563964844, 48.70059585571289, 52.75242614746094, 56.80425262451172, 60.856082916259766, 64.90791320800781, 68.9597396850586, 73.01156616210938, 77.06340026855469, 81.11522674560547, 85.16705322265625, 89.21888732910156, 93.27071380615234]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 9.0, 20.0, 26.0, 30.0, 52.0, 56.0, 97.0, 128.0, 187.0, 332.0, 521.0, 887.0, 1623.0, 3110.0, 6346.0, 14290.0, 37738.0, 128521.0, 508949.0, 244197.0, 61756.0, 21614.0, 8815.0, 4263.0, 2144.0, 1179.0, 602.0, 363.0, 227.0, 149.0, 94.0, 68.0, 39.0, 26.0, 27.0, 6.0, 7.0, 8.0, 14.0, 2.0, 6.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.171875, -29.156494140625, -28.14111328125, -27.125732421875, -26.1103515625, -25.094970703125, -24.07958984375, -23.064208984375, -22.048828125, -21.033447265625, -20.01806640625, -19.002685546875, -17.9873046875, -16.971923828125, -15.95654296875, -14.941162109375, -13.92578125, -12.910400390625, -11.89501953125, -10.879638671875, -9.8642578125, -8.848876953125, -7.83349609375, -6.818115234375, -5.802734375, -4.787353515625, -3.77197265625, -2.756591796875, -1.7412109375, -0.725830078125, 0.28955078125, 1.304931640625, 2.3203125, 3.335693359375, 4.35107421875, 5.366455078125, 6.3818359375, 7.397216796875, 8.41259765625, 9.427978515625, 10.443359375, 11.458740234375, 12.47412109375, 13.489501953125, 14.5048828125, 15.520263671875, 16.53564453125, 17.551025390625, 18.56640625, 19.581787109375, 20.59716796875, 21.612548828125, 22.6279296875, 23.643310546875, 24.65869140625, 25.674072265625, 26.689453125, 27.704833984375, 28.72021484375, 29.735595703125, 30.7509765625, 31.766357421875, 32.78173828125, 33.797119140625, 34.8125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 14.0, 20.0, 22.0, 14.0, 30.0, 56.0, 60.0, 69.0, 73.0, 81.0, 95.0, 70.0, 73.0, 60.0, 54.0, 39.0, 45.0, 22.0, 24.0, 15.0, 9.0, 7.0, 3.0, 2.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.521270751953125, -6.35504150390625, -6.188812255859375, -6.0225830078125, -5.856353759765625, -5.69012451171875, -5.523895263671875, -5.357666015625, -5.191436767578125, -5.02520751953125, -4.858978271484375, -4.6927490234375, -4.526519775390625, -4.36029052734375, -4.194061279296875, -4.02783203125, -3.861602783203125, -3.69537353515625, -3.529144287109375, -3.3629150390625, -3.196685791015625, -3.03045654296875, -2.864227294921875, -2.697998046875, -2.531768798828125, -2.36553955078125, -2.199310302734375, -2.0330810546875, -1.866851806640625, -1.70062255859375, -1.534393310546875, -1.3681640625, -1.201934814453125, -1.03570556640625, -0.869476318359375, -0.7032470703125, -0.537017822265625, -0.37078857421875, -0.204559326171875, -0.038330078125, 0.127899169921875, 0.29412841796875, 0.460357666015625, 0.6265869140625, 0.792816162109375, 0.95904541015625, 1.125274658203125, 1.29150390625, 1.457733154296875, 1.62396240234375, 1.790191650390625, 1.9564208984375, 2.122650146484375, 2.28887939453125, 2.455108642578125, 2.621337890625, 2.787567138671875, 2.95379638671875, 3.120025634765625, 3.2862548828125, 3.452484130859375, 3.61871337890625, 3.784942626953125, 3.951171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 13.0, 23.0, 16.0, 24.0, 28.0, 66.0, 74.0, 101.0, 167.0, 239.0, 320.0, 458.0, 668.0, 1048.0, 1637.0, 2550.0, 4313.0, 7460.0, 13358.0, 27019.0, 59782.0, 160152.0, 389516.0, 225741.0, 79581.0, 34456.0, 16812.0, 8995.0, 5077.0, 3102.0, 1940.0, 1238.0, 790.0, 513.0, 359.0, 263.0, 175.0, 142.0, 102.0, 61.0, 48.0, 35.0, 22.0, 24.0, 11.0, 6.0, 11.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.59375, -17.9873046875, -17.380859375, -16.7744140625, -16.16796875, -15.5615234375, -14.955078125, -14.3486328125, -13.7421875, -13.1357421875, -12.529296875, -11.9228515625, -11.31640625, -10.7099609375, -10.103515625, -9.4970703125, -8.890625, -8.2841796875, -7.677734375, -7.0712890625, -6.46484375, -5.8583984375, -5.251953125, -4.6455078125, -4.0390625, -3.4326171875, -2.826171875, -2.2197265625, -1.61328125, -1.0068359375, -0.400390625, 0.2060546875, 0.8125, 1.4189453125, 2.025390625, 2.6318359375, 3.23828125, 3.8447265625, 4.451171875, 5.0576171875, 5.6640625, 6.2705078125, 6.876953125, 7.4833984375, 8.08984375, 8.6962890625, 9.302734375, 9.9091796875, 10.515625, 11.1220703125, 11.728515625, 12.3349609375, 12.94140625, 13.5478515625, 14.154296875, 14.7607421875, 15.3671875, 15.9736328125, 16.580078125, 17.1865234375, 17.79296875, 18.3994140625, 19.005859375, 19.6123046875, 20.21875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 2.0, 8.0, 11.0, 17.0, 11.0, 8.0, 9.0, 15.0, 18.0, 18.0, 23.0, 29.0, 37.0, 43.0, 43.0, 41.0, 41.0, 40.0, 38.0, 38.0, 45.0, 38.0, 30.0, 35.0, 42.0, 33.0, 29.0, 33.0, 29.0, 22.0, 23.0, 16.0, 20.0, 13.0, 19.0, 11.0, 16.0, 9.0, 11.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.6494140625, -18.017578125, -17.3857421875, -16.75390625, -16.1220703125, -15.490234375, -14.8583984375, -14.2265625, -13.5947265625, -12.962890625, -12.3310546875, -11.69921875, -11.0673828125, -10.435546875, -9.8037109375, -9.171875, -8.5400390625, -7.908203125, -7.2763671875, -6.64453125, -6.0126953125, -5.380859375, -4.7490234375, -4.1171875, -3.4853515625, -2.853515625, -2.2216796875, -1.58984375, -0.9580078125, -0.326171875, 0.3056640625, 0.9375, 1.5693359375, 2.201171875, 2.8330078125, 3.46484375, 4.0966796875, 4.728515625, 5.3603515625, 5.9921875, 6.6240234375, 7.255859375, 7.8876953125, 8.51953125, 9.1513671875, 9.783203125, 10.4150390625, 11.046875, 11.6787109375, 12.310546875, 12.9423828125, 13.57421875, 14.2060546875, 14.837890625, 15.4697265625, 16.1015625, 16.7333984375, 17.365234375, 17.9970703125, 18.62890625, 19.2607421875, 19.892578125, 20.5244140625, 21.15625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 5.0, 3.0, 14.0, 10.0, 15.0, 39.0, 37.0, 48.0, 94.0, 161.0, 224.0, 406.0, 777.0, 1673.0, 3737.0, 9575.0, 30202.0, 135528.0, 534336.0, 256426.0, 50755.0, 14511.0, 5301.0, 2272.0, 1074.0, 554.0, 301.0, 185.0, 108.0, 71.0, 26.0, 24.0, 17.0, 10.0, 13.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.890625, -19.262939453125, -18.63525390625, -18.007568359375, -17.3798828125, -16.752197265625, -16.12451171875, -15.496826171875, -14.869140625, -14.241455078125, -13.61376953125, -12.986083984375, -12.3583984375, -11.730712890625, -11.10302734375, -10.475341796875, -9.84765625, -9.219970703125, -8.59228515625, -7.964599609375, -7.3369140625, -6.709228515625, -6.08154296875, -5.453857421875, -4.826171875, -4.198486328125, -3.57080078125, -2.943115234375, -2.3154296875, -1.687744140625, -1.06005859375, -0.432373046875, 0.1953125, 0.822998046875, 1.45068359375, 2.078369140625, 2.7060546875, 3.333740234375, 3.96142578125, 4.589111328125, 5.216796875, 5.844482421875, 6.47216796875, 7.099853515625, 7.7275390625, 8.355224609375, 8.98291015625, 9.610595703125, 10.23828125, 10.865966796875, 11.49365234375, 12.121337890625, 12.7490234375, 13.376708984375, 14.00439453125, 14.632080078125, 15.259765625, 15.887451171875, 16.51513671875, 17.142822265625, 17.7705078125, 18.398193359375, 19.02587890625, 19.653564453125, 20.28125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 10.0, 9.0, 13.0, 18.0, 24.0, 27.0, 32.0, 37.0, 47.0, 45.0, 56.0, 64.0, 58.0, 63.0, 69.0, 61.0, 59.0, 54.0, 40.0, 40.0, 26.0, 21.0, 23.0, 21.0, 17.0, 11.0, 2.0, 8.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0005445480346679688, -0.00052623450756073, -0.0005079209804534912, -0.0004896074533462524, -0.00047129392623901367, -0.0004529803991317749, -0.00043466687202453613, -0.00041635334491729736, -0.0003980398178100586, -0.0003797262907028198, -0.00036141276359558105, -0.0003430992364883423, -0.0003247857093811035, -0.00030647218227386475, -0.000288158655166626, -0.0002698451280593872, -0.00025153160095214844, -0.00023321807384490967, -0.0002149045467376709, -0.00019659101963043213, -0.00017827749252319336, -0.0001599639654159546, -0.00014165043830871582, -0.00012333691120147705, -0.00010502338409423828, -8.670985698699951e-05, -6.839632987976074e-05, -5.008280277252197e-05, -3.17692756652832e-05, -1.3455748558044434e-05, 4.857778549194336e-06, 2.3171305656433105e-05, 4.1484832763671875e-05, 5.9798359870910645e-05, 7.811188697814941e-05, 9.642541408538818e-05, 0.00011473894119262695, 0.00013305246829986572, 0.0001513659954071045, 0.00016967952251434326, 0.00018799304962158203, 0.0002063065767288208, 0.00022462010383605957, 0.00024293363094329834, 0.0002612471580505371, 0.0002795606851577759, 0.00029787421226501465, 0.0003161877393722534, 0.0003345012664794922, 0.00035281479358673096, 0.0003711283206939697, 0.0003894418478012085, 0.00040775537490844727, 0.00042606890201568604, 0.0004443824291229248, 0.0004626959562301636, 0.00048100948333740234, 0.0004993230104446411, 0.0005176365375518799, 0.0005359500646591187, 0.0005542635917663574, 0.0005725771188735962, 0.000590890645980835, 0.0006092041730880737, 0.0006275177001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 10.0, 13.0, 30.0, 36.0, 91.0, 177.0, 345.0, 803.0, 1680.0, 4594.0, 13809.0, 54738.0, 298340.0, 525958.0, 112286.0, 23695.0, 7155.0, 2590.0, 1089.0, 523.0, 270.0, 127.0, 84.0, 33.0, 21.0, 14.0, 10.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0], "bins": [-31.015625, -30.314208984375, -29.61279296875, -28.911376953125, -28.2099609375, -27.508544921875, -26.80712890625, -26.105712890625, -25.404296875, -24.702880859375, -24.00146484375, -23.300048828125, -22.5986328125, -21.897216796875, -21.19580078125, -20.494384765625, -19.79296875, -19.091552734375, -18.39013671875, -17.688720703125, -16.9873046875, -16.285888671875, -15.58447265625, -14.883056640625, -14.181640625, -13.480224609375, -12.77880859375, -12.077392578125, -11.3759765625, -10.674560546875, -9.97314453125, -9.271728515625, -8.5703125, -7.868896484375, -7.16748046875, -6.466064453125, -5.7646484375, -5.063232421875, -4.36181640625, -3.660400390625, -2.958984375, -2.257568359375, -1.55615234375, -0.854736328125, -0.1533203125, 0.548095703125, 1.24951171875, 1.950927734375, 2.65234375, 3.353759765625, 4.05517578125, 4.756591796875, 5.4580078125, 6.159423828125, 6.86083984375, 7.562255859375, 8.263671875, 8.965087890625, 9.66650390625, 10.367919921875, 11.0693359375, 11.770751953125, 12.47216796875, 13.173583984375, 13.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 6.0, 11.0, 15.0, 18.0, 25.0, 23.0, 24.0, 32.0, 36.0, 37.0, 45.0, 52.0, 52.0, 50.0, 72.0, 46.0, 62.0, 59.0, 42.0, 31.0, 44.0, 36.0, 22.0, 21.0, 22.0, 20.0, 14.0, 13.0, 9.0, 7.0, 9.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6484375, -8.39825439453125, -8.1480712890625, -7.89788818359375, -7.647705078125, -7.39752197265625, -7.1473388671875, -6.89715576171875, -6.64697265625, -6.39678955078125, -6.1466064453125, -5.89642333984375, -5.646240234375, -5.39605712890625, -5.1458740234375, -4.89569091796875, -4.6455078125, -4.39532470703125, -4.1451416015625, -3.89495849609375, -3.644775390625, -3.39459228515625, -3.1444091796875, -2.89422607421875, -2.64404296875, -2.39385986328125, -2.1436767578125, -1.89349365234375, -1.643310546875, -1.39312744140625, -1.1429443359375, -0.89276123046875, -0.642578125, -0.39239501953125, -0.1422119140625, 0.10797119140625, 0.358154296875, 0.60833740234375, 0.8585205078125, 1.10870361328125, 1.35888671875, 1.60906982421875, 1.8592529296875, 2.10943603515625, 2.359619140625, 2.60980224609375, 2.8599853515625, 3.11016845703125, 3.3603515625, 3.61053466796875, 3.8607177734375, 4.11090087890625, 4.361083984375, 4.61126708984375, 4.8614501953125, 5.11163330078125, 5.36181640625, 5.61199951171875, 5.8621826171875, 6.11236572265625, 6.362548828125, 6.61273193359375, 6.8629150390625, 7.11309814453125, 7.36328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 4.0, 5.0, 8.0, 11.0, 17.0, 26.0, 36.0, 94.0, 197.0, 215.0, 191.0, 85.0, 46.0, 24.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.68634033203125, -279.2657470703125, -269.84515380859375, -260.4245300292969, -251.00393676757812, -241.58334350585938, -232.16273498535156, -222.74212646484375, -213.321533203125, -203.90093994140625, -194.48033142089844, -185.05972290039062, -175.63912963867188, -166.21853637695312, -156.7979278564453, -147.3773193359375, -137.95672607421875, -128.5361328125, -119.11552429199219, -109.6949234008789, -100.27432250976562, -90.85372161865234, -81.43312072753906, -72.01251983642578, -62.5919189453125, -53.17131805419922, -43.75071716308594, -34.330116271972656, -24.909515380859375, -15.488914489746094, -6.0683135986328125, 3.3522872924804688, 12.772918701171875, 22.193519592285156, 31.614120483398438, 41.03472137451172, 50.455322265625, 59.87592315673828, 69.29652404785156, 78.71712493896484, 88.13772583007812, 97.5583267211914, 106.97892761230469, 116.39952850341797, 125.82012939453125, 135.24072265625, 144.6613311767578, 154.08193969726562, 163.50253295898438, 172.92312622070312, 182.34373474121094, 191.76434326171875, 201.1849365234375, 210.60552978515625, 220.02613830566406, 229.44674682617188, 238.86734008789062, 248.28793334960938, 257.70855712890625, 267.129150390625, 276.54974365234375, 285.9703369140625, 295.39093017578125, 304.8115539550781, 314.2321472167969]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 12.0, 12.0, 29.0, 61.0, 88.0, 131.0, 188.0, 139.0, 113.0, 64.0, 40.0, 22.0, 17.0, 6.0, 7.0, 7.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-279.038818359375, -266.829345703125, -254.61988830566406, -242.41043090820312, -230.20095825195312, -217.99148559570312, -205.7820281982422, -193.57257080078125, -181.36309814453125, -169.15362548828125, -156.9441680908203, -144.73471069335938, -132.52523803710938, -120.3157730102539, -108.10630798339844, -95.89684295654297, -83.6873779296875, -71.47791290283203, -59.26844787597656, -47.058982849121094, -34.849517822265625, -22.640052795410156, -10.430587768554688, 1.7788772583007812, 13.98834228515625, 26.19780731201172, 38.40727233886719, 50.616737365722656, 62.826202392578125, 75.0356674194336, 87.24513244628906, 99.45459747314453, 111.6640625, 123.87352752685547, 136.08299255371094, 148.29244995117188, 160.50192260742188, 172.71139526367188, 184.9208526611328, 197.13031005859375, 209.33978271484375, 221.54925537109375, 233.7587127685547, 245.96817016601562, 258.1776428222656, 270.3871154785156, 282.5965576171875, 294.8060302734375, 307.0155029296875, 319.2249755859375, 331.4344482421875, 343.6438903808594, 355.8533630371094, 368.0628356933594, 380.27227783203125, 392.48175048828125, 404.69122314453125, 416.90069580078125, 429.11016845703125, 441.3196105957031, 453.5290832519531, 465.7385559082031, 477.947998046875, 490.157470703125, 502.366943359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 15.0, 17.0, 21.0, 18.0, 55.0, 62.0, 110.0, 208.0, 378.0, 621.0, 1238.0, 2439.0, 5633.0, 14450.0, 48726.0, 295348.0, 3568143.0, 195194.0, 38937.0, 12427.0, 5016.0, 2356.0, 1126.0, 619.0, 405.0, 229.0, 152.0, 94.0, 62.0, 49.0, 28.0, 19.0, 24.0, 16.0, 14.0, 4.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-92.1875, -89.15625, -86.125, -83.09375, -80.0625, -77.03125, -74.0, -70.96875, -67.9375, -64.90625, -61.875, -58.84375, -55.8125, -52.78125, -49.75, -46.71875, -43.6875, -40.65625, -37.625, -34.59375, -31.5625, -28.53125, -25.5, -22.46875, -19.4375, -16.40625, -13.375, -10.34375, -7.3125, -4.28125, -1.25, 1.78125, 4.8125, 7.84375, 10.875, 13.90625, 16.9375, 19.96875, 23.0, 26.03125, 29.0625, 32.09375, 35.125, 38.15625, 41.1875, 44.21875, 47.25, 50.28125, 53.3125, 56.34375, 59.375, 62.40625, 65.4375, 68.46875, 71.5, 74.53125, 77.5625, 80.59375, 83.625, 86.65625, 89.6875, 92.71875, 95.75, 98.78125, 101.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 6.0, 15.0, 14.0, 19.0, 21.0, 30.0, 48.0, 71.0, 77.0, 86.0, 88.0, 71.0, 94.0, 77.0, 61.0, 50.0, 40.0, 34.0, 20.0, 19.0, 4.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.96875, -5.77081298828125, -5.5728759765625, -5.37493896484375, -5.177001953125, -4.97906494140625, -4.7811279296875, -4.58319091796875, -4.38525390625, -4.18731689453125, -3.9893798828125, -3.79144287109375, -3.593505859375, -3.39556884765625, -3.1976318359375, -2.99969482421875, -2.8017578125, -2.60382080078125, -2.4058837890625, -2.20794677734375, -2.010009765625, -1.81207275390625, -1.6141357421875, -1.41619873046875, -1.21826171875, -1.02032470703125, -0.8223876953125, -0.62445068359375, -0.426513671875, -0.22857666015625, -0.0306396484375, 0.16729736328125, 0.365234375, 0.56317138671875, 0.7611083984375, 0.95904541015625, 1.156982421875, 1.35491943359375, 1.5528564453125, 1.75079345703125, 1.94873046875, 2.14666748046875, 2.3446044921875, 2.54254150390625, 2.740478515625, 2.93841552734375, 3.1363525390625, 3.33428955078125, 3.5322265625, 3.73016357421875, 3.9281005859375, 4.12603759765625, 4.323974609375, 4.52191162109375, 4.7198486328125, 4.91778564453125, 5.11572265625, 5.31365966796875, 5.5115966796875, 5.70953369140625, 5.907470703125, 6.10540771484375, 6.3033447265625, 6.50128173828125, 6.69921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 8.0, 13.0, 15.0, 26.0, 41.0, 40.0, 58.0, 84.0, 123.0, 172.0, 260.0, 379.0, 613.0, 877.0, 1471.0, 2372.0, 4150.0, 7323.0, 13225.0, 26512.0, 55798.0, 131504.0, 384781.0, 2517491.0, 699401.0, 194664.0, 77385.0, 35555.0, 17452.0, 9329.0, 5139.0, 2973.0, 1786.0, 1107.0, 708.0, 427.0, 300.0, 214.0, 136.0, 115.0, 73.0, 50.0, 37.0, 26.0, 16.0, 11.0, 11.0, 8.0, 2.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0], "bins": [-52.1875, -50.591796875, -48.99609375, -47.400390625, -45.8046875, -44.208984375, -42.61328125, -41.017578125, -39.421875, -37.826171875, -36.23046875, -34.634765625, -33.0390625, -31.443359375, -29.84765625, -28.251953125, -26.65625, -25.060546875, -23.46484375, -21.869140625, -20.2734375, -18.677734375, -17.08203125, -15.486328125, -13.890625, -12.294921875, -10.69921875, -9.103515625, -7.5078125, -5.912109375, -4.31640625, -2.720703125, -1.125, 0.470703125, 2.06640625, 3.662109375, 5.2578125, 6.853515625, 8.44921875, 10.044921875, 11.640625, 13.236328125, 14.83203125, 16.427734375, 18.0234375, 19.619140625, 21.21484375, 22.810546875, 24.40625, 26.001953125, 27.59765625, 29.193359375, 30.7890625, 32.384765625, 33.98046875, 35.576171875, 37.171875, 38.767578125, 40.36328125, 41.958984375, 43.5546875, 45.150390625, 46.74609375, 48.341796875, 49.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 9.0, 22.0, 23.0, 24.0, 29.0, 49.0, 61.0, 84.0, 82.0, 133.0, 182.0, 289.0, 551.0, 1281.0, 407.0, 216.0, 161.0, 106.0, 70.0, 66.0, 40.0, 33.0, 25.0, 19.0, 10.0, 10.0, 13.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 6.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1490478515625, -8.813720703125, -8.4783935546875, -8.14306640625, -7.8077392578125, -7.472412109375, -7.1370849609375, -6.8017578125, -6.4664306640625, -6.131103515625, -5.7957763671875, -5.46044921875, -5.1251220703125, -4.789794921875, -4.4544677734375, -4.119140625, -3.7838134765625, -3.448486328125, -3.1131591796875, -2.77783203125, -2.4425048828125, -2.107177734375, -1.7718505859375, -1.4365234375, -1.1011962890625, -0.765869140625, -0.4305419921875, -0.09521484375, 0.2401123046875, 0.575439453125, 0.9107666015625, 1.24609375, 1.5814208984375, 1.916748046875, 2.2520751953125, 2.58740234375, 2.9227294921875, 3.258056640625, 3.5933837890625, 3.9287109375, 4.2640380859375, 4.599365234375, 4.9346923828125, 5.27001953125, 5.6053466796875, 5.940673828125, 6.2760009765625, 6.611328125, 6.9466552734375, 7.281982421875, 7.6173095703125, 7.95263671875, 8.2879638671875, 8.623291015625, 8.9586181640625, 9.2939453125, 9.6292724609375, 9.964599609375, 10.2999267578125, 10.63525390625, 10.9705810546875, 11.305908203125, 11.6412353515625, 11.9765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 16.0, 9.0, 21.0, 45.0, 70.0, 117.0, 183.0, 184.0, 135.0, 104.0, 52.0, 36.0, 17.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.76976013183594, -143.60548400878906, -139.44122314453125, -135.27694702148438, -131.11268615722656, -126.94841766357422, -122.78414916992188, -118.619873046875, -114.45561218261719, -110.29134368896484, -106.1270751953125, -101.96280670166016, -97.79853820800781, -93.63426971435547, -89.47000122070312, -85.30572509765625, -81.1414566040039, -76.97718811035156, -72.81291961669922, -68.64865112304688, -64.48438262939453, -60.32011413574219, -56.15584182739258, -51.991573333740234, -47.82730484008789, -43.66303634643555, -39.4987678527832, -35.334495544433594, -31.170228958129883, -27.00596046447754, -22.841690063476562, -18.67742156982422, -14.513153076171875, -10.348884582519531, -6.184615135192871, -2.020345687866211, 2.143922805786133, 6.308191299438477, 10.472461700439453, 14.636730194091797, 18.80099868774414, 22.965267181396484, 27.129535675048828, 31.293806076049805, 35.45807647705078, 39.622344970703125, 43.78661346435547, 47.95088195800781, 52.115150451660156, 56.2794189453125, 60.443687438964844, 64.60795593261719, 68.77222442626953, 72.93649291992188, 77.10076904296875, 81.26502990722656, 85.42930603027344, 89.59357452392578, 93.75784301757812, 97.92211151123047, 102.08638000488281, 106.25064849853516, 110.4149169921875, 114.57919311523438, 118.74345397949219]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 17.0, 16.0, 17.0, 26.0, 31.0, 34.0, 47.0, 49.0, 67.0, 54.0, 77.0, 74.0, 78.0, 78.0, 59.0, 45.0, 46.0, 41.0, 28.0, 28.0, 15.0, 17.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.56741333007812, -62.397796630859375, -60.228179931640625, -58.05856704711914, -55.88895034790039, -53.71933364868164, -51.549720764160156, -49.380104064941406, -47.210487365722656, -45.040870666503906, -42.871253967285156, -40.70164108276367, -38.53202438354492, -36.36240768432617, -34.19279479980469, -32.02317810058594, -29.853561401367188, -27.683944702148438, -25.51432991027832, -23.344715118408203, -21.175098419189453, -19.005481719970703, -16.835866928100586, -14.666251182556152, -12.496635437011719, -10.327019691467285, -8.157403945922852, -5.987788200378418, -3.8181724548339844, -1.6485567092895508, 0.5210590362548828, 2.6906747817993164, 4.86029052734375, 7.029906272888184, 9.199522018432617, 11.36913776397705, 13.538753509521484, 15.708369255065918, 17.87798500061035, 20.04759979248047, 22.21721649169922, 24.38683319091797, 26.556447982788086, 28.726062774658203, 30.895679473876953, 33.0652961730957, 35.23490905761719, 37.40452575683594, 39.57414245605469, 41.74375915527344, 43.91337585449219, 46.08298873901367, 48.25260543823242, 50.42222213745117, 52.591835021972656, 54.761451721191406, 56.931068420410156, 59.100685119628906, 61.270301818847656, 63.43991470336914, 65.60952758789062, 67.77914428710938, 69.94876098632812, 72.11837768554688, 74.28799438476562]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 11.0, 9.0, 13.0, 18.0, 26.0, 30.0, 38.0, 65.0, 112.0, 129.0, 210.0, 337.0, 510.0, 737.0, 1320.0, 2262.0, 4081.0, 7763.0, 15312.0, 34157.0, 88838.0, 294557.0, 389424.0, 123975.0, 44444.0, 19061.0, 9352.0, 4948.0, 2720.0, 1541.0, 882.0, 585.0, 337.0, 238.0, 160.0, 106.0, 78.0, 42.0, 31.0, 27.0, 16.0, 17.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-46.25, -44.93408203125, -43.6181640625, -42.30224609375, -40.986328125, -39.67041015625, -38.3544921875, -37.03857421875, -35.72265625, -34.40673828125, -33.0908203125, -31.77490234375, -30.458984375, -29.14306640625, -27.8271484375, -26.51123046875, -25.1953125, -23.87939453125, -22.5634765625, -21.24755859375, -19.931640625, -18.61572265625, -17.2998046875, -15.98388671875, -14.66796875, -13.35205078125, -12.0361328125, -10.72021484375, -9.404296875, -8.08837890625, -6.7724609375, -5.45654296875, -4.140625, -2.82470703125, -1.5087890625, -0.19287109375, 1.123046875, 2.43896484375, 3.7548828125, 5.07080078125, 6.38671875, 7.70263671875, 9.0185546875, 10.33447265625, 11.650390625, 12.96630859375, 14.2822265625, 15.59814453125, 16.9140625, 18.22998046875, 19.5458984375, 20.86181640625, 22.177734375, 23.49365234375, 24.8095703125, 26.12548828125, 27.44140625, 28.75732421875, 30.0732421875, 31.38916015625, 32.705078125, 34.02099609375, 35.3369140625, 36.65283203125, 37.96875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 16.0, 13.0, 21.0, 28.0, 32.0, 31.0, 34.0, 39.0, 58.0, 53.0, 53.0, 51.0, 62.0, 46.0, 53.0, 52.0, 48.0, 46.0, 43.0, 24.0, 26.0, 13.0, 15.0, 18.0, 22.0, 10.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.18487548828125, -3.0494384765625, -2.91400146484375, -2.778564453125, -2.64312744140625, -2.5076904296875, -2.37225341796875, -2.23681640625, -2.10137939453125, -1.9659423828125, -1.83050537109375, -1.695068359375, -1.55963134765625, -1.4241943359375, -1.28875732421875, -1.1533203125, -1.01788330078125, -0.8824462890625, -0.74700927734375, -0.611572265625, -0.47613525390625, -0.3406982421875, -0.20526123046875, -0.06982421875, 0.06561279296875, 0.2010498046875, 0.33648681640625, 0.471923828125, 0.60736083984375, 0.7427978515625, 0.87823486328125, 1.013671875, 1.14910888671875, 1.2845458984375, 1.41998291015625, 1.555419921875, 1.69085693359375, 1.8262939453125, 1.96173095703125, 2.09716796875, 2.23260498046875, 2.3680419921875, 2.50347900390625, 2.638916015625, 2.77435302734375, 2.9097900390625, 3.04522705078125, 3.1806640625, 3.31610107421875, 3.4515380859375, 3.58697509765625, 3.722412109375, 3.85784912109375, 3.9932861328125, 4.12872314453125, 4.26416015625, 4.39959716796875, 4.5350341796875, 4.67047119140625, 4.805908203125, 4.94134521484375, 5.0767822265625, 5.21221923828125, 5.34765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 11.0, 15.0, 13.0, 12.0, 34.0, 64.0, 95.0, 169.0, 252.0, 422.0, 702.0, 1296.0, 2318.0, 4736.0, 10787.0, 30130.0, 119837.0, 538181.0, 257745.0, 51965.0, 16193.0, 6687.0, 3114.0, 1611.0, 893.0, 447.0, 301.0, 191.0, 110.0, 75.0, 49.0, 36.0, 30.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.09375, -55.5390625, -53.984375, -52.4296875, -50.875, -49.3203125, -47.765625, -46.2109375, -44.65625, -43.1015625, -41.546875, -39.9921875, -38.4375, -36.8828125, -35.328125, -33.7734375, -32.21875, -30.6640625, -29.109375, -27.5546875, -26.0, -24.4453125, -22.890625, -21.3359375, -19.78125, -18.2265625, -16.671875, -15.1171875, -13.5625, -12.0078125, -10.453125, -8.8984375, -7.34375, -5.7890625, -4.234375, -2.6796875, -1.125, 0.4296875, 1.984375, 3.5390625, 5.09375, 6.6484375, 8.203125, 9.7578125, 11.3125, 12.8671875, 14.421875, 15.9765625, 17.53125, 19.0859375, 20.640625, 22.1953125, 23.75, 25.3046875, 26.859375, 28.4140625, 29.96875, 31.5234375, 33.078125, 34.6328125, 36.1875, 37.7421875, 39.296875, 40.8515625, 42.40625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 4.0, 13.0, 10.0, 25.0, 25.0, 28.0, 29.0, 38.0, 45.0, 45.0, 47.0, 55.0, 67.0, 67.0, 45.0, 52.0, 56.0, 49.0, 54.0, 37.0, 37.0, 24.0, 23.0, 24.0, 18.0, 9.0, 14.0, 5.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-27.546875, -26.780517578125, -26.01416015625, -25.247802734375, -24.4814453125, -23.715087890625, -22.94873046875, -22.182373046875, -21.416015625, -20.649658203125, -19.88330078125, -19.116943359375, -18.3505859375, -17.584228515625, -16.81787109375, -16.051513671875, -15.28515625, -14.518798828125, -13.75244140625, -12.986083984375, -12.2197265625, -11.453369140625, -10.68701171875, -9.920654296875, -9.154296875, -8.387939453125, -7.62158203125, -6.855224609375, -6.0888671875, -5.322509765625, -4.55615234375, -3.789794921875, -3.0234375, -2.257080078125, -1.49072265625, -0.724365234375, 0.0419921875, 0.808349609375, 1.57470703125, 2.341064453125, 3.107421875, 3.873779296875, 4.64013671875, 5.406494140625, 6.1728515625, 6.939208984375, 7.70556640625, 8.471923828125, 9.23828125, 10.004638671875, 10.77099609375, 11.537353515625, 12.3037109375, 13.070068359375, 13.83642578125, 14.602783203125, 15.369140625, 16.135498046875, 16.90185546875, 17.668212890625, 18.4345703125, 19.200927734375, 19.96728515625, 20.733642578125, 21.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 12.0, 16.0, 30.0, 39.0, 51.0, 86.0, 143.0, 234.0, 347.0, 689.0, 1214.0, 2421.0, 5014.0, 11318.0, 27354.0, 73868.0, 205429.0, 368866.0, 219371.0, 79557.0, 29517.0, 11961.0, 5357.0, 2623.0, 1280.0, 675.0, 403.0, 226.0, 136.0, 85.0, 86.0, 37.0, 26.0, 22.0, 15.0, 6.0, 9.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.71875, -27.88720703125, -27.0556640625, -26.22412109375, -25.392578125, -24.56103515625, -23.7294921875, -22.89794921875, -22.06640625, -21.23486328125, -20.4033203125, -19.57177734375, -18.740234375, -17.90869140625, -17.0771484375, -16.24560546875, -15.4140625, -14.58251953125, -13.7509765625, -12.91943359375, -12.087890625, -11.25634765625, -10.4248046875, -9.59326171875, -8.76171875, -7.93017578125, -7.0986328125, -6.26708984375, -5.435546875, -4.60400390625, -3.7724609375, -2.94091796875, -2.109375, -1.27783203125, -0.4462890625, 0.38525390625, 1.216796875, 2.04833984375, 2.8798828125, 3.71142578125, 4.54296875, 5.37451171875, 6.2060546875, 7.03759765625, 7.869140625, 8.70068359375, 9.5322265625, 10.36376953125, 11.1953125, 12.02685546875, 12.8583984375, 13.68994140625, 14.521484375, 15.35302734375, 16.1845703125, 17.01611328125, 17.84765625, 18.67919921875, 19.5107421875, 20.34228515625, 21.173828125, 22.00537109375, 22.8369140625, 23.66845703125, 24.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 0.0, 5.0, 4.0, 4.0, 5.0, 9.0, 18.0, 27.0, 62.0, 94.0, 139.0, 167.0, 197.0, 101.0, 75.0, 31.0, 11.0, 8.0, 6.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0028076171875, -0.0027156472206115723, -0.0026236772537231445, -0.002531707286834717, -0.002439737319946289, -0.0023477673530578613, -0.0022557973861694336, -0.002163827419281006, -0.002071857452392578, -0.0019798874855041504, -0.0018879175186157227, -0.001795947551727295, -0.0017039775848388672, -0.0016120076179504395, -0.0015200376510620117, -0.001428067684173584, -0.0013360977172851562, -0.0012441277503967285, -0.0011521577835083008, -0.001060187816619873, -0.0009682178497314453, -0.0008762478828430176, -0.0007842779159545898, -0.0006923079490661621, -0.0006003379821777344, -0.0005083680152893066, -0.0004163980484008789, -0.00032442808151245117, -0.00023245811462402344, -0.0001404881477355957, -4.851818084716797e-05, 4.3451786041259766e-05, 0.0001354217529296875, 0.00022739171981811523, 0.00031936168670654297, 0.0004113316535949707, 0.0005033016204833984, 0.0005952715873718262, 0.0006872415542602539, 0.0007792115211486816, 0.0008711814880371094, 0.0009631514549255371, 0.0010551214218139648, 0.0011470913887023926, 0.0012390613555908203, 0.001331031322479248, 0.0014230012893676758, 0.0015149712562561035, 0.0016069412231445312, 0.001698911190032959, 0.0017908811569213867, 0.0018828511238098145, 0.001974821090698242, 0.00206679105758667, 0.0021587610244750977, 0.0022507309913635254, 0.002342700958251953, 0.002434670925140381, 0.0025266408920288086, 0.0026186108589172363, 0.002710580825805664, 0.002802550792694092, 0.0028945207595825195, 0.0029864907264709473, 0.003078460693359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 6.0, 5.0, 11.0, 20.0, 29.0, 62.0, 132.0, 215.0, 475.0, 1170.0, 2880.0, 7611.0, 25205.0, 99677.0, 385549.0, 387426.0, 100677.0, 24881.0, 7545.0, 2783.0, 1108.0, 500.0, 276.0, 129.0, 78.0, 36.0, 19.0, 14.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-49.125, -47.865478515625, -46.60595703125, -45.346435546875, -44.0869140625, -42.827392578125, -41.56787109375, -40.308349609375, -39.048828125, -37.789306640625, -36.52978515625, -35.270263671875, -34.0107421875, -32.751220703125, -31.49169921875, -30.232177734375, -28.97265625, -27.713134765625, -26.45361328125, -25.194091796875, -23.9345703125, -22.675048828125, -21.41552734375, -20.156005859375, -18.896484375, -17.636962890625, -16.37744140625, -15.117919921875, -13.8583984375, -12.598876953125, -11.33935546875, -10.079833984375, -8.8203125, -7.560791015625, -6.30126953125, -5.041748046875, -3.7822265625, -2.522705078125, -1.26318359375, -0.003662109375, 1.255859375, 2.515380859375, 3.77490234375, 5.034423828125, 6.2939453125, 7.553466796875, 8.81298828125, 10.072509765625, 11.33203125, 12.591552734375, 13.85107421875, 15.110595703125, 16.3701171875, 17.629638671875, 18.88916015625, 20.148681640625, 21.408203125, 22.667724609375, 23.92724609375, 25.186767578125, 26.4462890625, 27.705810546875, 28.96533203125, 30.224853515625, 31.484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 7.0, 7.0, 17.0, 14.0, 17.0, 29.0, 25.0, 33.0, 48.0, 64.0, 63.0, 61.0, 63.0, 62.0, 84.0, 69.0, 59.0, 60.0, 35.0, 39.0, 25.0, 29.0, 21.0, 9.0, 4.0, 9.0, 13.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.177978515625, -10.69970703125, -10.221435546875, -9.7431640625, -9.264892578125, -8.78662109375, -8.308349609375, -7.830078125, -7.351806640625, -6.87353515625, -6.395263671875, -5.9169921875, -5.438720703125, -4.96044921875, -4.482177734375, -4.00390625, -3.525634765625, -3.04736328125, -2.569091796875, -2.0908203125, -1.612548828125, -1.13427734375, -0.656005859375, -0.177734375, 0.300537109375, 0.77880859375, 1.257080078125, 1.7353515625, 2.213623046875, 2.69189453125, 3.170166015625, 3.6484375, 4.126708984375, 4.60498046875, 5.083251953125, 5.5615234375, 6.039794921875, 6.51806640625, 6.996337890625, 7.474609375, 7.952880859375, 8.43115234375, 8.909423828125, 9.3876953125, 9.865966796875, 10.34423828125, 10.822509765625, 11.30078125, 11.779052734375, 12.25732421875, 12.735595703125, 13.2138671875, 13.692138671875, 14.17041015625, 14.648681640625, 15.126953125, 15.605224609375, 16.08349609375, 16.561767578125, 17.0400390625, 17.518310546875, 17.99658203125, 18.474853515625, 18.953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 11.0, 7.0, 12.0, 18.0, 31.0, 77.0, 118.0, 150.0, 165.0, 146.0, 103.0, 71.0, 50.0, 21.0, 9.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.26101684570312, -167.6498260498047, -158.03863525390625, -148.42745971679688, -138.81626892089844, -129.205078125, -119.59388732910156, -109.98270416259766, -100.37151336669922, -90.76032257080078, -81.14913940429688, -71.53794860839844, -61.926761627197266, -52.315574645996094, -42.704383850097656, -33.09320068359375, -23.482009887695312, -13.870821952819824, -4.259634017944336, 5.351554870605469, 14.96274185180664, 24.573928833007812, 34.18511962890625, 43.796302795410156, 53.407493591308594, 63.018680572509766, 72.62986755371094, 82.24105834960938, 91.85224914550781, 101.46343231201172, 111.07462310791016, 120.68580627441406, 130.2969970703125, 139.90818786621094, 149.51937866210938, 159.13055419921875, 168.7417449951172, 178.35293579101562, 187.96412658691406, 197.5753173828125, 207.18649291992188, 216.7976837158203, 226.40887451171875, 236.02005004882812, 245.63124084472656, 255.242431640625, 264.8536376953125, 274.4648132324219, 284.07598876953125, 293.6871643066406, 303.2983703613281, 312.9095458984375, 322.520751953125, 332.1319274902344, 341.74310302734375, 351.35430908203125, 360.96551513671875, 370.5766906738281, 380.1878967285156, 389.799072265625, 399.4102783203125, 409.0214538574219, 418.63262939453125, 428.24383544921875, 437.8550109863281]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 3.0, 9.0, 9.0, 12.0, 11.0, 17.0, 21.0, 29.0, 35.0, 35.0, 51.0, 53.0, 58.0, 70.0, 52.0, 60.0, 52.0, 64.0, 45.0, 46.0, 45.0, 38.0, 35.0, 33.0, 23.0, 19.0, 14.0, 9.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-159.87094116210938, -154.9088897705078, -149.94683837890625, -144.98477172851562, -140.02272033691406, -135.0606689453125, -130.09861755371094, -125.13656616210938, -120.17450714111328, -115.21245574951172, -110.25039672851562, -105.28834533691406, -100.3262939453125, -95.3642349243164, -90.40218353271484, -85.44012451171875, -80.47807312011719, -75.51602172851562, -70.55396270751953, -65.59191131591797, -60.62985610961914, -55.66780090332031, -50.70574951171875, -45.74369430541992, -40.781639099121094, -35.819583892822266, -30.85753059387207, -25.895477294921875, -20.933422088623047, -15.971366882324219, -11.009313583374023, -6.047260284423828, -1.085205078125, 3.8768491744995117, 8.838903427124023, 13.800957679748535, 18.763011932373047, 23.725067138671875, 28.68712043762207, 33.649173736572266, 38.611228942871094, 43.57328414916992, 48.53533935546875, 53.49739074707031, 58.45944595336914, 63.42150115966797, 68.38355255126953, 73.34561157226562, 78.30766296386719, 83.26971435546875, 88.23177337646484, 93.1938247680664, 98.1558837890625, 103.11793518066406, 108.07998657226562, 113.04203796386719, 118.00409698486328, 122.96614837646484, 127.92820739746094, 132.8902587890625, 137.85231018066406, 142.81436157226562, 147.77642822265625, 152.7384796142578, 157.70053100585938]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 10.0, 20.0, 36.0, 47.0, 77.0, 123.0, 199.0, 352.0, 581.0, 1109.0, 2012.0, 3887.0, 8059.0, 18143.0, 47206.0, 182247.0, 3342556.0, 456421.0, 79857.0, 27346.0, 11726.0, 5552.0, 2849.0, 1561.0, 855.0, 497.0, 329.0, 198.0, 102.0, 96.0, 65.0, 38.0, 33.0, 20.0, 13.0, 15.0, 5.0, 4.0, 6.0, 8.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-90.8125, -87.2822265625, -83.751953125, -80.2216796875, -76.69140625, -73.1611328125, -69.630859375, -66.1005859375, -62.5703125, -59.0400390625, -55.509765625, -51.9794921875, -48.44921875, -44.9189453125, -41.388671875, -37.8583984375, -34.328125, -30.7978515625, -27.267578125, -23.7373046875, -20.20703125, -16.6767578125, -13.146484375, -9.6162109375, -6.0859375, -2.5556640625, 0.974609375, 4.5048828125, 8.03515625, 11.5654296875, 15.095703125, 18.6259765625, 22.15625, 25.6865234375, 29.216796875, 32.7470703125, 36.27734375, 39.8076171875, 43.337890625, 46.8681640625, 50.3984375, 53.9287109375, 57.458984375, 60.9892578125, 64.51953125, 68.0498046875, 71.580078125, 75.1103515625, 78.640625, 82.1708984375, 85.701171875, 89.2314453125, 92.76171875, 96.2919921875, 99.822265625, 103.3525390625, 106.8828125, 110.4130859375, 113.943359375, 117.4736328125, 121.00390625, 124.5341796875, 128.064453125, 131.5947265625, 135.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 20.0, 25.0, 33.0, 50.0, 48.0, 53.0, 61.0, 66.0, 72.0, 61.0, 83.0, 57.0, 60.0, 64.0, 48.0, 25.0, 21.0, 30.0, 18.0, 14.0, 15.0, 7.0, 10.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.35711669921875, -4.1712646484375, -3.98541259765625, -3.799560546875, -3.61370849609375, -3.4278564453125, -3.24200439453125, -3.05615234375, -2.87030029296875, -2.6844482421875, -2.49859619140625, -2.312744140625, -2.12689208984375, -1.9410400390625, -1.75518798828125, -1.5693359375, -1.38348388671875, -1.1976318359375, -1.01177978515625, -0.825927734375, -0.64007568359375, -0.4542236328125, -0.26837158203125, -0.08251953125, 0.10333251953125, 0.2891845703125, 0.47503662109375, 0.660888671875, 0.84674072265625, 1.0325927734375, 1.21844482421875, 1.404296875, 1.59014892578125, 1.7760009765625, 1.96185302734375, 2.147705078125, 2.33355712890625, 2.5194091796875, 2.70526123046875, 2.89111328125, 3.07696533203125, 3.2628173828125, 3.44866943359375, 3.634521484375, 3.82037353515625, 4.0062255859375, 4.19207763671875, 4.3779296875, 4.56378173828125, 4.7496337890625, 4.93548583984375, 5.121337890625, 5.30718994140625, 5.4930419921875, 5.67889404296875, 5.86474609375, 6.05059814453125, 6.2364501953125, 6.42230224609375, 6.608154296875, 6.79400634765625, 6.9798583984375, 7.16571044921875, 7.3515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 9.0, 5.0, 14.0, 15.0, 21.0, 23.0, 29.0, 42.0, 62.0, 96.0, 194.0, 368.0, 907.0, 2926.0, 13667.0, 107921.0, 3468250.0, 550047.0, 40180.0, 6636.0, 1637.0, 536.0, 242.0, 117.0, 95.0, 61.0, 39.0, 21.0, 18.0, 16.0, 19.0, 5.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-210.625, -203.306640625, -195.98828125, -188.669921875, -181.3515625, -174.033203125, -166.71484375, -159.396484375, -152.078125, -144.759765625, -137.44140625, -130.123046875, -122.8046875, -115.486328125, -108.16796875, -100.849609375, -93.53125, -86.212890625, -78.89453125, -71.576171875, -64.2578125, -56.939453125, -49.62109375, -42.302734375, -34.984375, -27.666015625, -20.34765625, -13.029296875, -5.7109375, 1.607421875, 8.92578125, 16.244140625, 23.5625, 30.880859375, 38.19921875, 45.517578125, 52.8359375, 60.154296875, 67.47265625, 74.791015625, 82.109375, 89.427734375, 96.74609375, 104.064453125, 111.3828125, 118.701171875, 126.01953125, 133.337890625, 140.65625, 147.974609375, 155.29296875, 162.611328125, 169.9296875, 177.248046875, 184.56640625, 191.884765625, 199.203125, 206.521484375, 213.83984375, 221.158203125, 228.4765625, 235.794921875, 243.11328125, 250.431640625, 257.75]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 6.0, 7.0, 6.0, 15.0, 23.0, 23.0, 33.0, 50.0, 51.0, 78.0, 94.0, 143.0, 237.0, 398.0, 1306.0, 596.0, 296.0, 187.0, 116.0, 95.0, 65.0, 51.0, 38.0, 27.0, 20.0, 16.0, 10.0, 13.0, 8.0, 12.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.1153564453125, -16.636962890625, -16.1585693359375, -15.68017578125, -15.2017822265625, -14.723388671875, -14.2449951171875, -13.7666015625, -13.2882080078125, -12.809814453125, -12.3314208984375, -11.85302734375, -11.3746337890625, -10.896240234375, -10.4178466796875, -9.939453125, -9.4610595703125, -8.982666015625, -8.5042724609375, -8.02587890625, -7.5474853515625, -7.069091796875, -6.5906982421875, -6.1123046875, -5.6339111328125, -5.155517578125, -4.6771240234375, -4.19873046875, -3.7203369140625, -3.241943359375, -2.7635498046875, -2.28515625, -1.8067626953125, -1.328369140625, -0.8499755859375, -0.37158203125, 0.1068115234375, 0.585205078125, 1.0635986328125, 1.5419921875, 2.0203857421875, 2.498779296875, 2.9771728515625, 3.45556640625, 3.9339599609375, 4.412353515625, 4.8907470703125, 5.369140625, 5.8475341796875, 6.325927734375, 6.8043212890625, 7.28271484375, 7.7611083984375, 8.239501953125, 8.7178955078125, 9.1962890625, 9.6746826171875, 10.153076171875, 10.6314697265625, 11.10986328125, 11.5882568359375, 12.066650390625, 12.5450439453125, 13.0234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 5.0, 9.0, 10.0, 20.0, 38.0, 52.0, 76.0, 101.0, 115.0, 146.0, 102.0, 112.0, 61.0, 55.0, 38.0, 26.0, 14.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.0250701904297, -195.2325897216797, -190.4401092529297, -185.64764404296875, -180.85516357421875, -176.06268310546875, -171.27020263671875, -166.47772216796875, -161.6852569580078, -156.8927764892578, -152.1002960205078, -147.30783081054688, -142.51535034179688, -137.72286987304688, -132.93038940429688, -128.13790893554688, -123.3454360961914, -118.5529556274414, -113.76048278808594, -108.96800231933594, -104.17552947998047, -99.38304901123047, -94.590576171875, -89.798095703125, -85.005615234375, -80.213134765625, -75.42066192626953, -70.62818145751953, -65.83570861816406, -61.04322814941406, -56.25075149536133, -51.458274841308594, -46.665809631347656, -41.87333297729492, -37.08085632324219, -32.28837585449219, -27.495901107788086, -22.70342445373535, -17.910945892333984, -13.11846923828125, -8.325992584228516, -3.533515453338623, 1.2589616775512695, 6.05143928527832, 10.843915939331055, 15.636392593383789, 20.428871154785156, 25.22134780883789, 30.013824462890625, 34.80630111694336, 39.598777770996094, 44.391258239746094, 49.18373107910156, 53.97621154785156, 58.7686882019043, 63.56116485595703, 68.3536376953125, 73.1461181640625, 77.93859100341797, 82.73107147216797, 87.52354431152344, 92.31602478027344, 97.10850524902344, 101.9009780883789, 106.6934585571289]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 17.0, 15.0, 15.0, 12.0, 19.0, 35.0, 25.0, 36.0, 31.0, 34.0, 36.0, 43.0, 47.0, 52.0, 38.0, 37.0, 51.0, 42.0, 39.0, 50.0, 44.0, 35.0, 29.0, 30.0, 38.0, 22.0, 17.0, 8.0, 9.0, 11.0, 10.0, 9.0, 14.0, 7.0, 7.0, 3.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.94207000732422, -68.9043960571289, -66.8667221069336, -64.82904052734375, -62.79136657714844, -60.753692626953125, -58.71601867675781, -56.678340911865234, -54.640663146972656, -52.602989196777344, -50.565311431884766, -48.52763748168945, -46.489959716796875, -44.45228576660156, -42.41461181640625, -40.37693405151367, -38.33926010131836, -36.30158615112305, -34.26390838623047, -32.226234436035156, -30.188556671142578, -28.150882720947266, -26.11320686340332, -24.075531005859375, -22.03785514831543, -20.000179290771484, -17.96250343322754, -15.92482852935791, -13.887152671813965, -11.84947681427002, -9.81180191040039, -7.774126052856445, -5.7364501953125, -3.698774576187134, -1.6610989570617676, 0.37657642364501953, 2.414252281188965, 4.45192813873291, 6.489603042602539, 8.527278900146484, 10.56495475769043, 12.602630615234375, 14.64030647277832, 16.677982330322266, 18.715656280517578, 20.753334045410156, 22.79100799560547, 24.828683853149414, 26.86635971069336, 28.904035568237305, 30.94171142578125, 32.97938537597656, 35.01706314086914, 37.05473709106445, 39.09241485595703, 41.130088806152344, 43.167762756347656, 45.20543670654297, 47.24311447143555, 49.28078842163086, 51.31846618652344, 53.35614013671875, 55.39381408691406, 57.43149185180664, 59.46916961669922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 10.0, 8.0, 8.0, 7.0, 14.0, 21.0, 37.0, 60.0, 73.0, 121.0, 125.0, 242.0, 326.0, 507.0, 749.0, 1133.0, 1744.0, 2723.0, 4102.0, 6512.0, 10437.0, 16182.0, 26064.0, 41075.0, 64266.0, 97296.0, 137524.0, 165767.0, 151517.0, 111916.0, 75525.0, 48805.0, 30911.0, 19095.0, 12086.0, 7444.0, 4882.0, 3132.0, 1997.0, 1361.0, 873.0, 572.0, 446.0, 265.0, 178.0, 138.0, 89.0, 85.0, 36.0, 21.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-30.765625, -29.762939453125, -28.76025390625, -27.757568359375, -26.7548828125, -25.752197265625, -24.74951171875, -23.746826171875, -22.744140625, -21.741455078125, -20.73876953125, -19.736083984375, -18.7333984375, -17.730712890625, -16.72802734375, -15.725341796875, -14.72265625, -13.719970703125, -12.71728515625, -11.714599609375, -10.7119140625, -9.709228515625, -8.70654296875, -7.703857421875, -6.701171875, -5.698486328125, -4.69580078125, -3.693115234375, -2.6904296875, -1.687744140625, -0.68505859375, 0.317626953125, 1.3203125, 2.322998046875, 3.32568359375, 4.328369140625, 5.3310546875, 6.333740234375, 7.33642578125, 8.339111328125, 9.341796875, 10.344482421875, 11.34716796875, 12.349853515625, 13.3525390625, 14.355224609375, 15.35791015625, 16.360595703125, 17.36328125, 18.365966796875, 19.36865234375, 20.371337890625, 21.3740234375, 22.376708984375, 23.37939453125, 24.382080078125, 25.384765625, 26.387451171875, 27.39013671875, 28.392822265625, 29.3955078125, 30.398193359375, 31.40087890625, 32.403564453125, 33.40625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 6.0, 9.0, 14.0, 7.0, 17.0, 12.0, 15.0, 12.0, 24.0, 28.0, 37.0, 36.0, 37.0, 44.0, 47.0, 39.0, 48.0, 53.0, 47.0, 41.0, 43.0, 42.0, 41.0, 56.0, 41.0, 22.0, 21.0, 30.0, 23.0, 18.0, 19.0, 13.0, 10.0, 5.0, 5.0, 12.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.30078125, -4.15350341796875, -4.0062255859375, -3.85894775390625, -3.711669921875, -3.56439208984375, -3.4171142578125, -3.26983642578125, -3.12255859375, -2.97528076171875, -2.8280029296875, -2.68072509765625, -2.533447265625, -2.38616943359375, -2.2388916015625, -2.09161376953125, -1.9443359375, -1.79705810546875, -1.6497802734375, -1.50250244140625, -1.355224609375, -1.20794677734375, -1.0606689453125, -0.91339111328125, -0.76611328125, -0.61883544921875, -0.4715576171875, -0.32427978515625, -0.177001953125, -0.02972412109375, 0.1175537109375, 0.26483154296875, 0.412109375, 0.55938720703125, 0.7066650390625, 0.85394287109375, 1.001220703125, 1.14849853515625, 1.2957763671875, 1.44305419921875, 1.59033203125, 1.73760986328125, 1.8848876953125, 2.03216552734375, 2.179443359375, 2.32672119140625, 2.4739990234375, 2.62127685546875, 2.7685546875, 2.91583251953125, 3.0631103515625, 3.21038818359375, 3.357666015625, 3.50494384765625, 3.6522216796875, 3.79949951171875, 3.94677734375, 4.09405517578125, 4.2413330078125, 4.38861083984375, 4.535888671875, 4.68316650390625, 4.8304443359375, 4.97772216796875, 5.125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 16.0, 21.0, 33.0, 37.0, 46.0, 87.0, 116.0, 193.0, 273.0, 409.0, 685.0, 1219.0, 2376.0, 4774.0, 11107.0, 27280.0, 71923.0, 181802.0, 336640.0, 242497.0, 101013.0, 38078.0, 14857.0, 6323.0, 2931.0, 1506.0, 836.0, 498.0, 321.0, 217.0, 161.0, 83.0, 56.0, 48.0, 27.0, 21.0, 13.0, 9.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -76.279296875, -73.87109375, -71.462890625, -69.0546875, -66.646484375, -64.23828125, -61.830078125, -59.421875, -57.013671875, -54.60546875, -52.197265625, -49.7890625, -47.380859375, -44.97265625, -42.564453125, -40.15625, -37.748046875, -35.33984375, -32.931640625, -30.5234375, -28.115234375, -25.70703125, -23.298828125, -20.890625, -18.482421875, -16.07421875, -13.666015625, -11.2578125, -8.849609375, -6.44140625, -4.033203125, -1.625, 0.783203125, 3.19140625, 5.599609375, 8.0078125, 10.416015625, 12.82421875, 15.232421875, 17.640625, 20.048828125, 22.45703125, 24.865234375, 27.2734375, 29.681640625, 32.08984375, 34.498046875, 36.90625, 39.314453125, 41.72265625, 44.130859375, 46.5390625, 48.947265625, 51.35546875, 53.763671875, 56.171875, 58.580078125, 60.98828125, 63.396484375, 65.8046875, 68.212890625, 70.62109375, 73.029296875, 75.4375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 11.0, 10.0, 12.0, 25.0, 17.0, 22.0, 22.0, 31.0, 32.0, 35.0, 43.0, 49.0, 34.0, 30.0, 48.0, 53.0, 54.0, 48.0, 44.0, 40.0, 31.0, 38.0, 33.0, 33.0, 23.0, 26.0, 23.0, 18.0, 15.0, 12.0, 6.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.21875, -32.14990234375, -31.0810546875, -30.01220703125, -28.943359375, -27.87451171875, -26.8056640625, -25.73681640625, -24.66796875, -23.59912109375, -22.5302734375, -21.46142578125, -20.392578125, -19.32373046875, -18.2548828125, -17.18603515625, -16.1171875, -15.04833984375, -13.9794921875, -12.91064453125, -11.841796875, -10.77294921875, -9.7041015625, -8.63525390625, -7.56640625, -6.49755859375, -5.4287109375, -4.35986328125, -3.291015625, -2.22216796875, -1.1533203125, -0.08447265625, 0.984375, 2.05322265625, 3.1220703125, 4.19091796875, 5.259765625, 6.32861328125, 7.3974609375, 8.46630859375, 9.53515625, 10.60400390625, 11.6728515625, 12.74169921875, 13.810546875, 14.87939453125, 15.9482421875, 17.01708984375, 18.0859375, 19.15478515625, 20.2236328125, 21.29248046875, 22.361328125, 23.43017578125, 24.4990234375, 25.56787109375, 26.63671875, 27.70556640625, 28.7744140625, 29.84326171875, 30.912109375, 31.98095703125, 33.0498046875, 34.11865234375, 35.1875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 8.0, 9.0, 18.0, 23.0, 41.0, 64.0, 90.0, 162.0, 306.0, 598.0, 1132.0, 2551.0, 5989.0, 16365.0, 51166.0, 174203.0, 389398.0, 275591.0, 88247.0, 26425.0, 9109.0, 3530.0, 1636.0, 856.0, 429.0, 227.0, 135.0, 84.0, 59.0, 21.0, 24.0, 16.0, 11.0, 13.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -51.84912109375, -50.1044921875, -48.35986328125, -46.615234375, -44.87060546875, -43.1259765625, -41.38134765625, -39.63671875, -37.89208984375, -36.1474609375, -34.40283203125, -32.658203125, -30.91357421875, -29.1689453125, -27.42431640625, -25.6796875, -23.93505859375, -22.1904296875, -20.44580078125, -18.701171875, -16.95654296875, -15.2119140625, -13.46728515625, -11.72265625, -9.97802734375, -8.2333984375, -6.48876953125, -4.744140625, -2.99951171875, -1.2548828125, 0.48974609375, 2.234375, 3.97900390625, 5.7236328125, 7.46826171875, 9.212890625, 10.95751953125, 12.7021484375, 14.44677734375, 16.19140625, 17.93603515625, 19.6806640625, 21.42529296875, 23.169921875, 24.91455078125, 26.6591796875, 28.40380859375, 30.1484375, 31.89306640625, 33.6376953125, 35.38232421875, 37.126953125, 38.87158203125, 40.6162109375, 42.36083984375, 44.10546875, 45.85009765625, 47.5947265625, 49.33935546875, 51.083984375, 52.82861328125, 54.5732421875, 56.31787109375, 58.0625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 8.0, 13.0, 21.0, 16.0, 38.0, 30.0, 42.0, 55.0, 56.0, 73.0, 94.0, 88.0, 82.0, 72.0, 63.0, 35.0, 34.0, 39.0, 23.0, 18.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006748199462890625, -0.006529808044433594, -0.0063114166259765625, -0.006093025207519531, -0.0058746337890625, -0.005656242370605469, -0.0054378509521484375, -0.005219459533691406, -0.005001068115234375, -0.004782676696777344, -0.0045642852783203125, -0.004345893859863281, -0.00412750244140625, -0.003909111022949219, -0.0036907196044921875, -0.0034723281860351562, -0.003253936767578125, -0.0030355453491210938, -0.0028171539306640625, -0.0025987625122070312, -0.00238037109375, -0.0021619796752929688, -0.0019435882568359375, -0.0017251968383789062, -0.001506805419921875, -0.0012884140014648438, -0.0010700225830078125, -0.0008516311645507812, -0.00063323974609375, -0.00041484832763671875, -0.0001964569091796875, 2.193450927734375e-05, 0.000240325927734375, 0.00045871734619140625, 0.0006771087646484375, 0.0008955001831054688, 0.0011138916015625, 0.0013322830200195312, 0.0015506744384765625, 0.0017690658569335938, 0.001987457275390625, 0.0022058486938476562, 0.0024242401123046875, 0.0026426315307617188, 0.00286102294921875, 0.0030794143676757812, 0.0032978057861328125, 0.0035161972045898438, 0.003734588623046875, 0.003952980041503906, 0.0041713714599609375, 0.004389762878417969, 0.004608154296875, 0.004826545715332031, 0.0050449371337890625, 0.005263328552246094, 0.005481719970703125, 0.005700111389160156, 0.0059185028076171875, 0.006136894226074219, 0.00635528564453125, 0.006573677062988281, 0.0067920684814453125, 0.007010459899902344, 0.007228851318359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 12.0, 2.0, 20.0, 30.0, 38.0, 69.0, 159.0, 272.0, 550.0, 1392.0, 4003.0, 17021.0, 131228.0, 643140.0, 217183.0, 25020.0, 5258.0, 1725.0, 700.0, 338.0, 155.0, 85.0, 45.0, 31.0, 24.0, 14.0, 9.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.625, -90.56640625, -87.5078125, -84.44921875, -81.390625, -78.33203125, -75.2734375, -72.21484375, -69.15625, -66.09765625, -63.0390625, -59.98046875, -56.921875, -53.86328125, -50.8046875, -47.74609375, -44.6875, -41.62890625, -38.5703125, -35.51171875, -32.453125, -29.39453125, -26.3359375, -23.27734375, -20.21875, -17.16015625, -14.1015625, -11.04296875, -7.984375, -4.92578125, -1.8671875, 1.19140625, 4.25, 7.30859375, 10.3671875, 13.42578125, 16.484375, 19.54296875, 22.6015625, 25.66015625, 28.71875, 31.77734375, 34.8359375, 37.89453125, 40.953125, 44.01171875, 47.0703125, 50.12890625, 53.1875, 56.24609375, 59.3046875, 62.36328125, 65.421875, 68.48046875, 71.5390625, 74.59765625, 77.65625, 80.71484375, 83.7734375, 86.83203125, 89.890625, 92.94921875, 96.0078125, 99.06640625, 102.125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 19.0, 36.0, 46.0, 34.0, 68.0, 79.0, 98.0, 131.0, 97.0, 89.0, 76.0, 56.0, 58.0, 21.0, 26.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.141357421875, -23.92333984375, -22.705322265625, -21.4873046875, -20.269287109375, -19.05126953125, -17.833251953125, -16.615234375, -15.397216796875, -14.17919921875, -12.961181640625, -11.7431640625, -10.525146484375, -9.30712890625, -8.089111328125, -6.87109375, -5.653076171875, -4.43505859375, -3.217041015625, -1.9990234375, -0.781005859375, 0.43701171875, 1.655029296875, 2.873046875, 4.091064453125, 5.30908203125, 6.527099609375, 7.7451171875, 8.963134765625, 10.18115234375, 11.399169921875, 12.6171875, 13.835205078125, 15.05322265625, 16.271240234375, 17.4892578125, 18.707275390625, 19.92529296875, 21.143310546875, 22.361328125, 23.579345703125, 24.79736328125, 26.015380859375, 27.2333984375, 28.451416015625, 29.66943359375, 30.887451171875, 32.10546875, 33.323486328125, 34.54150390625, 35.759521484375, 36.9775390625, 38.195556640625, 39.41357421875, 40.631591796875, 41.849609375, 43.067626953125, 44.28564453125, 45.503662109375, 46.7216796875, 47.939697265625, 49.15771484375, 50.375732421875, 51.59375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 10.0, 17.0, 35.0, 104.0, 213.0, 250.0, 198.0, 100.0, 39.0, 21.0, 6.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-660.50146484375, -626.5277099609375, -592.553955078125, -558.5802001953125, -524.6065063476562, -490.63275146484375, -456.65899658203125, -422.68524169921875, -388.7115173339844, -354.7377624511719, -320.7640380859375, -286.790283203125, -252.81654357910156, -218.84280395507812, -184.86904907226562, -150.8953094482422, -116.92156982421875, -82.94783020019531, -48.974082946777344, -15.000335693359375, 18.973403930664062, 52.9471435546875, 86.9208984375, 120.89463806152344, 154.86837768554688, 188.8421173095703, 222.81585693359375, 256.78961181640625, 290.76336669921875, 324.7370910644531, 358.7108459472656, 392.6845703125, 426.6583251953125, 460.632080078125, 494.6058044433594, 528.57958984375, 562.5532836914062, 596.5270385742188, 630.5007934570312, 664.4745483398438, 698.4482421875, 732.4219970703125, 766.395751953125, 800.3695068359375, 834.3432006835938, 868.3169555664062, 902.2907104492188, 936.2644653320312, 970.2382202148438, 1004.2119750976562, 1038.1856689453125, 1072.159423828125, 1106.1331787109375, 1140.10693359375, 1174.0806884765625, 1208.054443359375, 1242.0281982421875, 1276.001953125, 1309.9757080078125, 1343.949462890625, 1377.9232177734375, 1411.89697265625, 1445.87060546875, 1479.8443603515625, 1513.818115234375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 13.0, 7.0, 12.0, 24.0, 15.0, 28.0, 36.0, 50.0, 51.0, 59.0, 70.0, 67.0, 65.0, 79.0, 76.0, 71.0, 44.0, 43.0, 40.0, 31.0, 22.0, 21.0, 23.0, 13.0, 5.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.781982421875, -314.1104431152344, -301.4389343261719, -288.76739501953125, -276.0958557128906, -263.42431640625, -250.7528076171875, -238.08126831054688, -225.4097442626953, -212.73822021484375, -200.06668090820312, -187.39515686035156, -174.7236328125, -162.05209350585938, -149.3805694580078, -136.70904541015625, -124.03750610351562, -111.36597442626953, -98.69444274902344, -86.02291870117188, -73.35138702392578, -60.67985534667969, -48.008331298828125, -35.33679962158203, -22.665267944335938, -9.993738174438477, 2.6777915954589844, 15.349319458007812, 28.020851135253906, 40.6923828125, 53.36390686035156, 66.03543853759766, 78.70697021484375, 91.37850189208984, 104.05003356933594, 116.7215576171875, 129.39309692382812, 142.0646209716797, 154.73614501953125, 167.40768432617188, 180.07920837402344, 192.750732421875, 205.42227172851562, 218.0937957763672, 230.76531982421875, 243.43685913085938, 256.1083984375, 268.7799072265625, 281.4514465332031, 294.12298583984375, 306.79449462890625, 319.4660339355469, 332.1375732421875, 344.80908203125, 357.4806213378906, 370.15216064453125, 382.82366943359375, 395.4952087402344, 408.1667175292969, 420.8382568359375, 433.5097961425781, 446.18133544921875, 458.85284423828125, 471.5243835449219, 484.1959228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 6.0, 3.0, 2.0, 11.0, 30.0, 31.0, 41.0, 71.0, 123.0, 334.0, 775.0, 2853.0, 15629.0, 195355.0, 3883129.0, 84709.0, 8657.0, 1557.0, 484.0, 188.0, 102.0, 69.0, 42.0, 25.0, 19.0, 10.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-403.0, -390.546875, -378.09375, -365.640625, -353.1875, -340.734375, -328.28125, -315.828125, -303.375, -290.921875, -278.46875, -266.015625, -253.5625, -241.109375, -228.65625, -216.203125, -203.75, -191.296875, -178.84375, -166.390625, -153.9375, -141.484375, -129.03125, -116.578125, -104.125, -91.671875, -79.21875, -66.765625, -54.3125, -41.859375, -29.40625, -16.953125, -4.5, 7.953125, 20.40625, 32.859375, 45.3125, 57.765625, 70.21875, 82.671875, 95.125, 107.578125, 120.03125, 132.484375, 144.9375, 157.390625, 169.84375, 182.296875, 194.75, 207.203125, 219.65625, 232.109375, 244.5625, 257.015625, 269.46875, 281.921875, 294.375, 306.828125, 319.28125, 331.734375, 344.1875, 356.640625, 369.09375, 381.546875, 394.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 2.0, 8.0, 13.0, 25.0, 26.0, 29.0, 26.0, 50.0, 40.0, 53.0, 65.0, 59.0, 77.0, 78.0, 72.0, 84.0, 59.0, 52.0, 26.0, 36.0, 34.0, 24.0, 14.0, 13.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.703125, -10.36767578125, -10.0322265625, -9.69677734375, -9.361328125, -9.02587890625, -8.6904296875, -8.35498046875, -8.01953125, -7.68408203125, -7.3486328125, -7.01318359375, -6.677734375, -6.34228515625, -6.0068359375, -5.67138671875, -5.3359375, -5.00048828125, -4.6650390625, -4.32958984375, -3.994140625, -3.65869140625, -3.3232421875, -2.98779296875, -2.65234375, -2.31689453125, -1.9814453125, -1.64599609375, -1.310546875, -0.97509765625, -0.6396484375, -0.30419921875, 0.03125, 0.36669921875, 0.7021484375, 1.03759765625, 1.373046875, 1.70849609375, 2.0439453125, 2.37939453125, 2.71484375, 3.05029296875, 3.3857421875, 3.72119140625, 4.056640625, 4.39208984375, 4.7275390625, 5.06298828125, 5.3984375, 5.73388671875, 6.0693359375, 6.40478515625, 6.740234375, 7.07568359375, 7.4111328125, 7.74658203125, 8.08203125, 8.41748046875, 8.7529296875, 9.08837890625, 9.423828125, 9.75927734375, 10.0947265625, 10.43017578125, 10.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 8.0, 6.0, 16.0, 18.0, 19.0, 29.0, 28.0, 71.0, 108.0, 241.0, 688.0, 2519.0, 11104.0, 66845.0, 844334.0, 3128244.0, 117032.0, 17486.0, 3794.0, 998.0, 334.0, 147.0, 77.0, 45.0, 28.0, 21.0, 16.0, 11.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.5, -256.38671875, -247.2734375, -238.16015625, -229.046875, -219.93359375, -210.8203125, -201.70703125, -192.59375, -183.48046875, -174.3671875, -165.25390625, -156.140625, -147.02734375, -137.9140625, -128.80078125, -119.6875, -110.57421875, -101.4609375, -92.34765625, -83.234375, -74.12109375, -65.0078125, -55.89453125, -46.78125, -37.66796875, -28.5546875, -19.44140625, -10.328125, -1.21484375, 7.8984375, 17.01171875, 26.125, 35.23828125, 44.3515625, 53.46484375, 62.578125, 71.69140625, 80.8046875, 89.91796875, 99.03125, 108.14453125, 117.2578125, 126.37109375, 135.484375, 144.59765625, 153.7109375, 162.82421875, 171.9375, 181.05078125, 190.1640625, 199.27734375, 208.390625, 217.50390625, 226.6171875, 235.73046875, 244.84375, 253.95703125, 263.0703125, 272.18359375, 281.296875, 290.41015625, 299.5234375, 308.63671875, 317.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 8.0, 14.0, 7.0, 13.0, 19.0, 31.0, 38.0, 46.0, 62.0, 65.0, 114.0, 161.0, 286.0, 615.0, 1377.0, 405.0, 238.0, 165.0, 95.0, 81.0, 49.0, 29.0, 31.0, 32.0, 18.0, 17.0, 17.0, 7.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-35.25, -34.30517578125, -33.3603515625, -32.41552734375, -31.470703125, -30.52587890625, -29.5810546875, -28.63623046875, -27.69140625, -26.74658203125, -25.8017578125, -24.85693359375, -23.912109375, -22.96728515625, -22.0224609375, -21.07763671875, -20.1328125, -19.18798828125, -18.2431640625, -17.29833984375, -16.353515625, -15.40869140625, -14.4638671875, -13.51904296875, -12.57421875, -11.62939453125, -10.6845703125, -9.73974609375, -8.794921875, -7.85009765625, -6.9052734375, -5.96044921875, -5.015625, -4.07080078125, -3.1259765625, -2.18115234375, -1.236328125, -0.29150390625, 0.6533203125, 1.59814453125, 2.54296875, 3.48779296875, 4.4326171875, 5.37744140625, 6.322265625, 7.26708984375, 8.2119140625, 9.15673828125, 10.1015625, 11.04638671875, 11.9912109375, 12.93603515625, 13.880859375, 14.82568359375, 15.7705078125, 16.71533203125, 17.66015625, 18.60498046875, 19.5498046875, 20.49462890625, 21.439453125, 22.38427734375, 23.3291015625, 24.27392578125, 25.21875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 12.0, 35.0, 32.0, 72.0, 127.0, 171.0, 172.0, 144.0, 106.0, 51.0, 31.0, 21.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.3853759765625, -251.46664428710938, -239.54791259765625, -227.62918090820312, -215.71044921875, -203.79171752929688, -191.87298583984375, -179.95425415039062, -168.0355224609375, -156.11679077148438, -144.19805908203125, -132.27932739257812, -120.360595703125, -108.44186401367188, -96.52313232421875, -84.60440063476562, -72.6856689453125, -60.766937255859375, -48.84820556640625, -36.929473876953125, -25.0107421875, -13.092010498046875, -1.17327880859375, 10.745452880859375, 22.6641845703125, 34.582916259765625, 46.50164794921875, 58.420379638671875, 70.339111328125, 82.25784301757812, 94.17657470703125, 106.09530639648438, 118.0140380859375, 129.93276977539062, 141.85150146484375, 153.77023315429688, 165.68896484375, 177.60769653320312, 189.52642822265625, 201.44515991210938, 213.3638916015625, 225.28262329101562, 237.20135498046875, 249.12008666992188, 261.038818359375, 272.9575500488281, 284.87628173828125, 296.7950134277344, 308.7137451171875, 320.6324768066406, 332.55120849609375, 344.4699401855469, 356.388671875, 368.3074035644531, 380.22613525390625, 392.1448669433594, 404.0635986328125, 415.9823303222656, 427.90106201171875, 439.8197937011719, 451.738525390625, 463.6572570800781, 475.57598876953125, 487.4947204589844, 499.4134521484375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 0.0, 5.0, 10.0, 5.0, 9.0, 4.0, 17.0, 14.0, 9.0, 12.0, 14.0, 22.0, 22.0, 27.0, 31.0, 23.0, 34.0, 36.0, 33.0, 42.0, 44.0, 40.0, 39.0, 46.0, 49.0, 40.0, 33.0, 48.0, 33.0, 26.0, 19.0, 22.0, 23.0, 26.0, 22.0, 17.0, 18.0, 9.0, 17.0, 9.0, 9.0, 8.0, 4.0, 9.0, 5.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-131.38462829589844, -127.5765609741211, -123.76848602294922, -119.96041870117188, -116.15234375, -112.34427642822266, -108.53620910644531, -104.72813415527344, -100.92005920410156, -97.11199188232422, -93.30391693115234, -89.495849609375, -85.68777465820312, -81.87970733642578, -78.07164001464844, -74.26356506347656, -70.45549774169922, -66.64743041992188, -62.83935546875, -59.031288146972656, -55.22321319580078, -51.41514587402344, -47.60707473754883, -43.79900360107422, -39.99093246459961, -36.182861328125, -32.37479019165039, -28.566720962524414, -24.758649826049805, -20.950578689575195, -17.14250946044922, -13.33443832397461, -9.5263671875, -5.718296527862549, -1.9102258682250977, 1.8978443145751953, 5.705915451049805, 9.513986587524414, 13.32205581665039, 17.130126953125, 20.93819808959961, 24.74626922607422, 28.554340362548828, 32.36241149902344, 36.17047882080078, 39.978553771972656, 43.78662109375, 47.59469223022461, 51.40276336669922, 55.21083450317383, 59.01890563964844, 62.82697296142578, 66.63504791259766, 70.443115234375, 74.25119018554688, 78.05925750732422, 81.86732482910156, 85.6753921508789, 89.48346710205078, 93.29153442382812, 97.099609375, 100.90767669677734, 104.71574401855469, 108.52381896972656, 112.33189392089844]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 12.0, 13.0, 16.0, 22.0, 38.0, 46.0, 72.0, 114.0, 183.0, 277.0, 435.0, 750.0, 1193.0, 2356.0, 5194.0, 12774.0, 34988.0, 95807.0, 235310.0, 348744.0, 190333.0, 73998.0, 26785.0, 10112.0, 4205.0, 1957.0, 1076.0, 611.0, 374.0, 236.0, 148.0, 123.0, 83.0, 49.0, 40.0, 20.0, 13.0, 13.0, 10.0, 4.0, 8.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-92.0, -89.2431640625, -86.486328125, -83.7294921875, -80.97265625, -78.2158203125, -75.458984375, -72.7021484375, -69.9453125, -67.1884765625, -64.431640625, -61.6748046875, -58.91796875, -56.1611328125, -53.404296875, -50.6474609375, -47.890625, -45.1337890625, -42.376953125, -39.6201171875, -36.86328125, -34.1064453125, -31.349609375, -28.5927734375, -25.8359375, -23.0791015625, -20.322265625, -17.5654296875, -14.80859375, -12.0517578125, -9.294921875, -6.5380859375, -3.78125, -1.0244140625, 1.732421875, 4.4892578125, 7.24609375, 10.0029296875, 12.759765625, 15.5166015625, 18.2734375, 21.0302734375, 23.787109375, 26.5439453125, 29.30078125, 32.0576171875, 34.814453125, 37.5712890625, 40.328125, 43.0849609375, 45.841796875, 48.5986328125, 51.35546875, 54.1123046875, 56.869140625, 59.6259765625, 62.3828125, 65.1396484375, 67.896484375, 70.6533203125, 73.41015625, 76.1669921875, 78.923828125, 81.6806640625, 84.4375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 6.0, 12.0, 20.0, 33.0, 35.0, 48.0, 60.0, 59.0, 72.0, 68.0, 69.0, 76.0, 66.0, 59.0, 64.0, 63.0, 50.0, 35.0, 21.0, 25.0, 10.0, 13.0, 13.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.3125, -12.897705078125, -12.48291015625, -12.068115234375, -11.6533203125, -11.238525390625, -10.82373046875, -10.408935546875, -9.994140625, -9.579345703125, -9.16455078125, -8.749755859375, -8.3349609375, -7.920166015625, -7.50537109375, -7.090576171875, -6.67578125, -6.260986328125, -5.84619140625, -5.431396484375, -5.0166015625, -4.601806640625, -4.18701171875, -3.772216796875, -3.357421875, -2.942626953125, -2.52783203125, -2.113037109375, -1.6982421875, -1.283447265625, -0.86865234375, -0.453857421875, -0.0390625, 0.375732421875, 0.79052734375, 1.205322265625, 1.6201171875, 2.034912109375, 2.44970703125, 2.864501953125, 3.279296875, 3.694091796875, 4.10888671875, 4.523681640625, 4.9384765625, 5.353271484375, 5.76806640625, 6.182861328125, 6.59765625, 7.012451171875, 7.42724609375, 7.842041015625, 8.2568359375, 8.671630859375, 9.08642578125, 9.501220703125, 9.916015625, 10.330810546875, 10.74560546875, 11.160400390625, 11.5751953125, 11.989990234375, 12.40478515625, 12.819580078125, 13.234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 10.0, 9.0, 14.0, 21.0, 28.0, 36.0, 59.0, 77.0, 131.0, 203.0, 284.0, 457.0, 796.0, 1291.0, 2594.0, 5555.0, 13778.0, 40010.0, 128445.0, 364726.0, 325798.0, 108152.0, 34084.0, 11928.0, 4642.0, 2244.0, 1215.0, 696.0, 455.0, 260.0, 160.0, 120.0, 84.0, 44.0, 38.0, 30.0, 25.0, 12.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.6875, -107.326171875, -103.96484375, -100.603515625, -97.2421875, -93.880859375, -90.51953125, -87.158203125, -83.796875, -80.435546875, -77.07421875, -73.712890625, -70.3515625, -66.990234375, -63.62890625, -60.267578125, -56.90625, -53.544921875, -50.18359375, -46.822265625, -43.4609375, -40.099609375, -36.73828125, -33.376953125, -30.015625, -26.654296875, -23.29296875, -19.931640625, -16.5703125, -13.208984375, -9.84765625, -6.486328125, -3.125, 0.236328125, 3.59765625, 6.958984375, 10.3203125, 13.681640625, 17.04296875, 20.404296875, 23.765625, 27.126953125, 30.48828125, 33.849609375, 37.2109375, 40.572265625, 43.93359375, 47.294921875, 50.65625, 54.017578125, 57.37890625, 60.740234375, 64.1015625, 67.462890625, 70.82421875, 74.185546875, 77.546875, 80.908203125, 84.26953125, 87.630859375, 90.9921875, 94.353515625, 97.71484375, 101.076171875, 104.4375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 9.0, 12.0, 15.0, 25.0, 31.0, 31.0, 42.0, 46.0, 56.0, 69.0, 60.0, 62.0, 56.0, 80.0, 76.0, 55.0, 40.0, 43.0, 43.0, 31.0, 23.0, 18.0, 12.0, 8.0, 13.0, 7.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.5625, -68.2412109375, -65.919921875, -63.5986328125, -61.27734375, -58.9560546875, -56.634765625, -54.3134765625, -51.9921875, -49.6708984375, -47.349609375, -45.0283203125, -42.70703125, -40.3857421875, -38.064453125, -35.7431640625, -33.421875, -31.1005859375, -28.779296875, -26.4580078125, -24.13671875, -21.8154296875, -19.494140625, -17.1728515625, -14.8515625, -12.5302734375, -10.208984375, -7.8876953125, -5.56640625, -3.2451171875, -0.923828125, 1.3974609375, 3.71875, 6.0400390625, 8.361328125, 10.6826171875, 13.00390625, 15.3251953125, 17.646484375, 19.9677734375, 22.2890625, 24.6103515625, 26.931640625, 29.2529296875, 31.57421875, 33.8955078125, 36.216796875, 38.5380859375, 40.859375, 43.1806640625, 45.501953125, 47.8232421875, 50.14453125, 52.4658203125, 54.787109375, 57.1083984375, 59.4296875, 61.7509765625, 64.072265625, 66.3935546875, 68.71484375, 71.0361328125, 73.357421875, 75.6787109375, 78.0]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 8.0, 14.0, 11.0, 22.0, 31.0, 38.0, 58.0, 99.0, 118.0, 235.0, 405.0, 817.0, 1786.0, 4739.0, 14709.0, 59008.0, 266596.0, 477273.0, 169412.0, 36898.0, 10028.0, 3339.0, 1326.0, 683.0, 369.0, 194.0, 127.0, 78.0, 42.0, 32.0, 20.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.375, -43.65234375, -41.9296875, -40.20703125, -38.484375, -36.76171875, -35.0390625, -33.31640625, -31.59375, -29.87109375, -28.1484375, -26.42578125, -24.703125, -22.98046875, -21.2578125, -19.53515625, -17.8125, -16.08984375, -14.3671875, -12.64453125, -10.921875, -9.19921875, -7.4765625, -5.75390625, -4.03125, -2.30859375, -0.5859375, 1.13671875, 2.859375, 4.58203125, 6.3046875, 8.02734375, 9.75, 11.47265625, 13.1953125, 14.91796875, 16.640625, 18.36328125, 20.0859375, 21.80859375, 23.53125, 25.25390625, 26.9765625, 28.69921875, 30.421875, 32.14453125, 33.8671875, 35.58984375, 37.3125, 39.03515625, 40.7578125, 42.48046875, 44.203125, 45.92578125, 47.6484375, 49.37109375, 51.09375, 52.81640625, 54.5390625, 56.26171875, 57.984375, 59.70703125, 61.4296875, 63.15234375, 64.875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 13.0, 15.0, 22.0, 23.0, 21.0, 38.0, 48.0, 74.0, 64.0, 105.0, 100.0, 90.0, 84.0, 64.0, 41.0, 32.0, 32.0, 25.0, 19.0, 16.0, 14.0, 11.0, 12.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00801849365234375, -0.007793307304382324, -0.0075681209564208984, -0.007342934608459473, -0.007117748260498047, -0.006892561912536621, -0.006667375564575195, -0.0064421892166137695, -0.006217002868652344, -0.005991816520690918, -0.005766630172729492, -0.005541443824768066, -0.005316257476806641, -0.005091071128845215, -0.004865884780883789, -0.004640698432922363, -0.0044155120849609375, -0.004190325736999512, -0.003965139389038086, -0.00373995304107666, -0.0035147666931152344, -0.0032895803451538086, -0.003064393997192383, -0.002839207649230957, -0.0026140213012695312, -0.0023888349533081055, -0.0021636486053466797, -0.001938462257385254, -0.0017132759094238281, -0.0014880895614624023, -0.0012629032135009766, -0.0010377168655395508, -0.000812530517578125, -0.0005873441696166992, -0.00036215782165527344, -0.00013697147369384766, 8.821487426757812e-05, 0.0003134012222290039, 0.0005385875701904297, 0.0007637739181518555, 0.0009889602661132812, 0.001214146614074707, 0.0014393329620361328, 0.0016645193099975586, 0.0018897056579589844, 0.00211489200592041, 0.002340078353881836, 0.0025652647018432617, 0.0027904510498046875, 0.0030156373977661133, 0.003240823745727539, 0.003466010093688965, 0.0036911964416503906, 0.003916382789611816, 0.004141569137573242, 0.004366755485534668, 0.004591941833496094, 0.0048171281814575195, 0.005042314529418945, 0.005267500877380371, 0.005492687225341797, 0.005717873573303223, 0.0059430599212646484, 0.006168246269226074, 0.0063934326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 16.0, 12.0, 16.0, 25.0, 37.0, 39.0, 91.0, 130.0, 189.0, 306.0, 521.0, 930.0, 1814.0, 3896.0, 9715.0, 28770.0, 106251.0, 359589.0, 373067.0, 114101.0, 30543.0, 10177.0, 3995.0, 1884.0, 965.0, 545.0, 336.0, 196.0, 123.0, 82.0, 52.0, 34.0, 29.0, 21.0, 7.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.90625, -52.3671875, -50.828125, -49.2890625, -47.75, -46.2109375, -44.671875, -43.1328125, -41.59375, -40.0546875, -38.515625, -36.9765625, -35.4375, -33.8984375, -32.359375, -30.8203125, -29.28125, -27.7421875, -26.203125, -24.6640625, -23.125, -21.5859375, -20.046875, -18.5078125, -16.96875, -15.4296875, -13.890625, -12.3515625, -10.8125, -9.2734375, -7.734375, -6.1953125, -4.65625, -3.1171875, -1.578125, -0.0390625, 1.5, 3.0390625, 4.578125, 6.1171875, 7.65625, 9.1953125, 10.734375, 12.2734375, 13.8125, 15.3515625, 16.890625, 18.4296875, 19.96875, 21.5078125, 23.046875, 24.5859375, 26.125, 27.6640625, 29.203125, 30.7421875, 32.28125, 33.8203125, 35.359375, 36.8984375, 38.4375, 39.9765625, 41.515625, 43.0546875, 44.59375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 7.0, 8.0, 6.0, 11.0, 5.0, 10.0, 19.0, 21.0, 31.0, 50.0, 44.0, 59.0, 66.0, 69.0, 70.0, 72.0, 76.0, 56.0, 54.0, 44.0, 53.0, 41.0, 19.0, 31.0, 25.0, 12.0, 10.0, 8.0, 8.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-30.5625, -29.804443359375, -29.04638671875, -28.288330078125, -27.5302734375, -26.772216796875, -26.01416015625, -25.256103515625, -24.498046875, -23.739990234375, -22.98193359375, -22.223876953125, -21.4658203125, -20.707763671875, -19.94970703125, -19.191650390625, -18.43359375, -17.675537109375, -16.91748046875, -16.159423828125, -15.4013671875, -14.643310546875, -13.88525390625, -13.127197265625, -12.369140625, -11.611083984375, -10.85302734375, -10.094970703125, -9.3369140625, -8.578857421875, -7.82080078125, -7.062744140625, -6.3046875, -5.546630859375, -4.78857421875, -4.030517578125, -3.2724609375, -2.514404296875, -1.75634765625, -0.998291015625, -0.240234375, 0.517822265625, 1.27587890625, 2.033935546875, 2.7919921875, 3.550048828125, 4.30810546875, 5.066162109375, 5.82421875, 6.582275390625, 7.34033203125, 8.098388671875, 8.8564453125, 9.614501953125, 10.37255859375, 11.130615234375, 11.888671875, 12.646728515625, 13.40478515625, 14.162841796875, 14.9208984375, 15.678955078125, 16.43701171875, 17.195068359375, 17.953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 14.0, 26.0, 51.0, 73.0, 96.0, 137.0, 141.0, 132.0, 109.0, 75.0, 44.0, 35.0, 21.0, 7.0, 9.0, 6.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.4290161132812, -618.9644165039062, -596.4998168945312, -574.0352783203125, -551.5706787109375, -529.1060791015625, -506.6414794921875, -484.1768798828125, -461.7123107910156, -439.2477111816406, -416.78314208984375, -394.31854248046875, -371.85394287109375, -349.3893737792969, -326.9247741699219, -304.460205078125, -281.99560546875, -259.531005859375, -237.06643676757812, -214.60183715820312, -192.1372528076172, -169.67266845703125, -147.20806884765625, -124.74348449707031, -102.27890014648438, -79.81431579589844, -57.34972381591797, -34.8851318359375, -12.420547485351562, 10.044036865234375, 32.508636474609375, 54.97322082519531, 77.4378662109375, 99.90245056152344, 122.3670425415039, 144.83163452148438, 167.2962188720703, 189.76080322265625, 212.22540283203125, 234.6899871826172, 257.1545715332031, 279.6191711425781, 302.083740234375, 324.54833984375, 347.012939453125, 369.4775085449219, 391.9421081542969, 414.40667724609375, 436.87127685546875, 459.33587646484375, 481.8004455566406, 504.2650451660156, 526.7296142578125, 549.1942138671875, 571.6588134765625, 594.1234130859375, 616.5880126953125, 639.0526123046875, 661.5172119140625, 683.9818115234375, 706.4463500976562, 728.9109497070312, 751.3755493164062, 773.8401489257812, 796.3046875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 10.0, 10.0, 8.0, 10.0, 22.0, 20.0, 19.0, 26.0, 19.0, 21.0, 30.0, 30.0, 48.0, 36.0, 39.0, 44.0, 56.0, 49.0, 51.0, 56.0, 49.0, 36.0, 37.0, 29.0, 30.0, 41.0, 27.0, 25.0, 17.0, 19.0, 15.0, 10.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-411.755126953125, -399.9296569824219, -388.1042175292969, -376.27874755859375, -364.4532775878906, -352.6278076171875, -340.8023681640625, -328.9768981933594, -317.15142822265625, -305.3259582519531, -293.5005187988281, -281.675048828125, -269.8495788574219, -258.02410888671875, -246.19866943359375, -234.37319946289062, -222.54774475097656, -210.7222900390625, -198.89682006835938, -187.0713653564453, -175.2458953857422, -163.42044067382812, -151.594970703125, -139.76951599121094, -127.94405364990234, -116.11859130859375, -104.29312896728516, -92.46766662597656, -80.6422119140625, -68.81674194335938, -56.99128723144531, -45.16582489013672, -33.340362548828125, -21.51490020751953, -9.68943977355957, 2.1360206604003906, 13.961483001708984, 25.786945343017578, 37.612403869628906, 49.4378662109375, 61.263328552246094, 73.08879089355469, 84.91425323486328, 96.73971557617188, 108.56517028808594, 120.39064025878906, 132.21609497070312, 144.04156494140625, 155.8670196533203, 167.69247436523438, 179.5179443359375, 191.34339904785156, 203.1688690185547, 214.99432373046875, 226.81979370117188, 238.64524841308594, 250.470703125, 262.2961730957031, 274.1216125488281, 285.94708251953125, 297.7725524902344, 309.5980224609375, 321.4234619140625, 333.2489318847656, 345.07440185546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 13.0, 28.0, 25.0, 64.0, 123.0, 283.0, 862.0, 3989.0, 32835.0, 3772369.0, 363993.0, 16077.0, 2495.0, 599.0, 216.0, 111.0, 63.0, 62.0, 27.0, 18.0, 10.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.75, -326.1328125, -313.515625, -300.8984375, -288.28125, -275.6640625, -263.046875, -250.4296875, -237.8125, -225.1953125, -212.578125, -199.9609375, -187.34375, -174.7265625, -162.109375, -149.4921875, -136.875, -124.2578125, -111.640625, -99.0234375, -86.40625, -73.7890625, -61.171875, -48.5546875, -35.9375, -23.3203125, -10.703125, 1.9140625, 14.53125, 27.1484375, 39.765625, 52.3828125, 65.0, 77.6171875, 90.234375, 102.8515625, 115.46875, 128.0859375, 140.703125, 153.3203125, 165.9375, 178.5546875, 191.171875, 203.7890625, 216.40625, 229.0234375, 241.640625, 254.2578125, 266.875, 279.4921875, 292.109375, 304.7265625, 317.34375, 329.9609375, 342.578125, 355.1953125, 367.8125, 380.4296875, 393.046875, 405.6640625, 418.28125, 430.8984375, 443.515625, 456.1328125, 468.75]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 21.0, 18.0, 33.0, 59.0, 63.0, 71.0, 67.0, 103.0, 92.0, 95.0, 91.0, 73.0, 46.0, 47.0, 36.0, 34.0, 17.0, 10.0, 11.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.188232421875, -16.56396484375, -15.939697265625, -15.3154296875, -14.691162109375, -14.06689453125, -13.442626953125, -12.818359375, -12.194091796875, -11.56982421875, -10.945556640625, -10.3212890625, -9.697021484375, -9.07275390625, -8.448486328125, -7.82421875, -7.199951171875, -6.57568359375, -5.951416015625, -5.3271484375, -4.702880859375, -4.07861328125, -3.454345703125, -2.830078125, -2.205810546875, -1.58154296875, -0.957275390625, -0.3330078125, 0.291259765625, 0.91552734375, 1.539794921875, 2.1640625, 2.788330078125, 3.41259765625, 4.036865234375, 4.6611328125, 5.285400390625, 5.90966796875, 6.533935546875, 7.158203125, 7.782470703125, 8.40673828125, 9.031005859375, 9.6552734375, 10.279541015625, 10.90380859375, 11.528076171875, 12.15234375, 12.776611328125, 13.40087890625, 14.025146484375, 14.6494140625, 15.273681640625, 15.89794921875, 16.522216796875, 17.146484375, 17.770751953125, 18.39501953125, 19.019287109375, 19.6435546875, 20.267822265625, 20.89208984375, 21.516357421875, 22.140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 12.0, 10.0, 33.0, 55.0, 84.0, 125.0, 184.0, 432.0, 759.0, 1523.0, 3455.0, 8292.0, 22839.0, 79408.0, 486297.0, 3275479.0, 237576.0, 50505.0, 15829.0, 6071.0, 2624.0, 1245.0, 607.0, 340.0, 199.0, 117.0, 68.0, 38.0, 13.0, 17.0, 13.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.125, -163.228515625, -158.33203125, -153.435546875, -148.5390625, -143.642578125, -138.74609375, -133.849609375, -128.953125, -124.056640625, -119.16015625, -114.263671875, -109.3671875, -104.470703125, -99.57421875, -94.677734375, -89.78125, -84.884765625, -79.98828125, -75.091796875, -70.1953125, -65.298828125, -60.40234375, -55.505859375, -50.609375, -45.712890625, -40.81640625, -35.919921875, -31.0234375, -26.126953125, -21.23046875, -16.333984375, -11.4375, -6.541015625, -1.64453125, 3.251953125, 8.1484375, 13.044921875, 17.94140625, 22.837890625, 27.734375, 32.630859375, 37.52734375, 42.423828125, 47.3203125, 52.216796875, 57.11328125, 62.009765625, 66.90625, 71.802734375, 76.69921875, 81.595703125, 86.4921875, 91.388671875, 96.28515625, 101.181640625, 106.078125, 110.974609375, 115.87109375, 120.767578125, 125.6640625, 130.560546875, 135.45703125, 140.353515625, 145.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 8.0, 5.0, 14.0, 10.0, 15.0, 15.0, 31.0, 38.0, 48.0, 93.0, 129.0, 238.0, 540.0, 1729.0, 533.0, 245.0, 111.0, 91.0, 60.0, 22.0, 30.0, 25.0, 10.0, 4.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -31.91943359375, -30.7138671875, -29.50830078125, -28.302734375, -27.09716796875, -25.8916015625, -24.68603515625, -23.48046875, -22.27490234375, -21.0693359375, -19.86376953125, -18.658203125, -17.45263671875, -16.2470703125, -15.04150390625, -13.8359375, -12.63037109375, -11.4248046875, -10.21923828125, -9.013671875, -7.80810546875, -6.6025390625, -5.39697265625, -4.19140625, -2.98583984375, -1.7802734375, -0.57470703125, 0.630859375, 1.83642578125, 3.0419921875, 4.24755859375, 5.453125, 6.65869140625, 7.8642578125, 9.06982421875, 10.275390625, 11.48095703125, 12.6865234375, 13.89208984375, 15.09765625, 16.30322265625, 17.5087890625, 18.71435546875, 19.919921875, 21.12548828125, 22.3310546875, 23.53662109375, 24.7421875, 25.94775390625, 27.1533203125, 28.35888671875, 29.564453125, 30.77001953125, 31.9755859375, 33.18115234375, 34.38671875, 35.59228515625, 36.7978515625, 38.00341796875, 39.208984375, 40.41455078125, 41.6201171875, 42.82568359375, 44.03125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 10.0, 8.0, 28.0, 51.0, 50.0, 72.0, 105.0, 127.0, 123.0, 114.0, 84.0, 81.0, 48.0, 31.0, 20.0, 16.0, 8.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.4905548095703, -242.75283813476562, -235.01512145996094, -227.2773895263672, -219.5396728515625, -211.8019561767578, -204.06423950195312, -196.32650756835938, -188.5887908935547, -180.85107421875, -173.1133575439453, -165.37562561035156, -157.63790893554688, -149.9001922607422, -142.1624755859375, -134.42474365234375, -126.6870346069336, -118.9493179321289, -111.21159362792969, -103.473876953125, -95.73615264892578, -87.9984359741211, -80.26071166992188, -72.52299499511719, -64.7852783203125, -57.04755783081055, -49.309837341308594, -41.572120666503906, -33.83439636230469, -26.0966796875, -18.358959197998047, -10.621238708496094, -2.883514404296875, 4.85420560836792, 12.591925621032715, 20.32964515686035, 28.067365646362305, 35.805084228515625, 43.54280471801758, 51.28052520751953, 59.018245697021484, 66.75596618652344, 74.49368286132812, 82.23140716552734, 89.96912384033203, 97.70684814453125, 105.44456481933594, 113.18228149414062, 120.92000579833984, 128.65773010253906, 136.39544677734375, 144.13316345214844, 151.87088012695312, 159.60861206054688, 167.34632873535156, 175.08404541015625, 182.82176208496094, 190.55947875976562, 198.2971954345703, 206.03492736816406, 213.77264404296875, 221.51036071777344, 229.24807739257812, 236.98580932617188, 244.72352600097656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 4.0, 12.0, 12.0, 19.0, 18.0, 27.0, 25.0, 23.0, 32.0, 33.0, 31.0, 40.0, 34.0, 36.0, 53.0, 35.0, 43.0, 49.0, 53.0, 51.0, 44.0, 45.0, 25.0, 26.0, 42.0, 30.0, 21.0, 15.0, 19.0, 18.0, 17.0, 7.0, 8.0, 6.0, 3.0, 5.0, 5.0, 1.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-117.79442596435547, -114.21016693115234, -110.62590789794922, -107.04164123535156, -103.45738220214844, -99.87312316894531, -96.28886413574219, -92.70460510253906, -89.12034606933594, -85.53608703613281, -81.95182800292969, -78.36756896972656, -74.7833023071289, -71.19904327392578, -67.61478424072266, -64.03052520751953, -60.446258544921875, -56.86199951171875, -53.27773666381836, -49.693477630615234, -46.109214782714844, -42.52495574951172, -38.940696716308594, -35.35643768310547, -31.772174835205078, -28.18791389465332, -24.603652954101562, -21.019393920898438, -17.43513298034668, -13.850872039794922, -10.266613006591797, -6.682352066040039, -3.09808349609375, 0.4861769676208496, 4.070437431335449, 7.654697418212891, 11.238958358764648, 14.823219299316406, 18.40747833251953, 21.99173927307129, 25.576000213623047, 29.160261154174805, 32.74452209472656, 36.32878112792969, 39.91304016113281, 43.4973030090332, 47.08156204223633, 50.66582489013672, 54.250083923339844, 57.83434295654297, 61.41860580444336, 65.00286865234375, 68.58712768554688, 72.17138671875, 75.75564575195312, 79.33990478515625, 82.92416381835938, 86.5084228515625, 90.09268188476562, 93.67694091796875, 97.2612075805664, 100.84546661376953, 104.42972564697266, 108.01398468017578, 111.59825134277344]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 14.0, 8.0, 31.0, 30.0, 33.0, 58.0, 90.0, 134.0, 161.0, 246.0, 376.0, 660.0, 1294.0, 2781.0, 6857.0, 18072.0, 52629.0, 152276.0, 348539.0, 289434.0, 112594.0, 38482.0, 13726.0, 5066.0, 2257.0, 1068.0, 582.0, 332.0, 218.0, 157.0, 94.0, 79.0, 56.0, 33.0, 28.0, 11.0, 8.0, 11.0, 9.0, 9.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-96.3125, -93.69921875, -91.0859375, -88.47265625, -85.859375, -83.24609375, -80.6328125, -78.01953125, -75.40625, -72.79296875, -70.1796875, -67.56640625, -64.953125, -62.33984375, -59.7265625, -57.11328125, -54.5, -51.88671875, -49.2734375, -46.66015625, -44.046875, -41.43359375, -38.8203125, -36.20703125, -33.59375, -30.98046875, -28.3671875, -25.75390625, -23.140625, -20.52734375, -17.9140625, -15.30078125, -12.6875, -10.07421875, -7.4609375, -4.84765625, -2.234375, 0.37890625, 2.9921875, 5.60546875, 8.21875, 10.83203125, 13.4453125, 16.05859375, 18.671875, 21.28515625, 23.8984375, 26.51171875, 29.125, 31.73828125, 34.3515625, 36.96484375, 39.578125, 42.19140625, 44.8046875, 47.41796875, 50.03125, 52.64453125, 55.2578125, 57.87109375, 60.484375, 63.09765625, 65.7109375, 68.32421875, 70.9375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 9.0, 20.0, 34.0, 37.0, 47.0, 62.0, 79.0, 83.0, 93.0, 102.0, 81.0, 88.0, 71.0, 52.0, 40.0, 39.0, 22.0, 17.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.106201171875, -17.46240234375, -16.818603515625, -16.1748046875, -15.531005859375, -14.88720703125, -14.243408203125, -13.599609375, -12.955810546875, -12.31201171875, -11.668212890625, -11.0244140625, -10.380615234375, -9.73681640625, -9.093017578125, -8.44921875, -7.805419921875, -7.16162109375, -6.517822265625, -5.8740234375, -5.230224609375, -4.58642578125, -3.942626953125, -3.298828125, -2.655029296875, -2.01123046875, -1.367431640625, -0.7236328125, -0.079833984375, 0.56396484375, 1.207763671875, 1.8515625, 2.495361328125, 3.13916015625, 3.782958984375, 4.4267578125, 5.070556640625, 5.71435546875, 6.358154296875, 7.001953125, 7.645751953125, 8.28955078125, 8.933349609375, 9.5771484375, 10.220947265625, 10.86474609375, 11.508544921875, 12.15234375, 12.796142578125, 13.43994140625, 14.083740234375, 14.7275390625, 15.371337890625, 16.01513671875, 16.658935546875, 17.302734375, 17.946533203125, 18.59033203125, 19.234130859375, 19.8779296875, 20.521728515625, 21.16552734375, 21.809326171875, 22.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 19.0, 16.0, 23.0, 43.0, 41.0, 72.0, 96.0, 124.0, 189.0, 272.0, 375.0, 563.0, 918.0, 1517.0, 2758.0, 5592.0, 11818.0, 26876.0, 64444.0, 144554.0, 267322.0, 264700.0, 142444.0, 62914.0, 26653.0, 11604.0, 5506.0, 2762.0, 1543.0, 902.0, 560.0, 363.0, 307.0, 195.0, 137.0, 83.0, 74.0, 46.0, 34.0, 29.0, 18.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.34375, -50.5380859375, -48.732421875, -46.9267578125, -45.12109375, -43.3154296875, -41.509765625, -39.7041015625, -37.8984375, -36.0927734375, -34.287109375, -32.4814453125, -30.67578125, -28.8701171875, -27.064453125, -25.2587890625, -23.453125, -21.6474609375, -19.841796875, -18.0361328125, -16.23046875, -14.4248046875, -12.619140625, -10.8134765625, -9.0078125, -7.2021484375, -5.396484375, -3.5908203125, -1.78515625, 0.0205078125, 1.826171875, 3.6318359375, 5.4375, 7.2431640625, 9.048828125, 10.8544921875, 12.66015625, 14.4658203125, 16.271484375, 18.0771484375, 19.8828125, 21.6884765625, 23.494140625, 25.2998046875, 27.10546875, 28.9111328125, 30.716796875, 32.5224609375, 34.328125, 36.1337890625, 37.939453125, 39.7451171875, 41.55078125, 43.3564453125, 45.162109375, 46.9677734375, 48.7734375, 50.5791015625, 52.384765625, 54.1904296875, 55.99609375, 57.8017578125, 59.607421875, 61.4130859375, 63.21875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 9.0, 8.0, 18.0, 7.0, 12.0, 15.0, 14.0, 23.0, 25.0, 35.0, 33.0, 45.0, 36.0, 52.0, 56.0, 46.0, 46.0, 36.0, 52.0, 50.0, 41.0, 53.0, 38.0, 40.0, 30.0, 34.0, 30.0, 22.0, 12.0, 13.0, 18.0, 12.0, 10.0, 6.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.75, -50.013671875, -48.27734375, -46.541015625, -44.8046875, -43.068359375, -41.33203125, -39.595703125, -37.859375, -36.123046875, -34.38671875, -32.650390625, -30.9140625, -29.177734375, -27.44140625, -25.705078125, -23.96875, -22.232421875, -20.49609375, -18.759765625, -17.0234375, -15.287109375, -13.55078125, -11.814453125, -10.078125, -8.341796875, -6.60546875, -4.869140625, -3.1328125, -1.396484375, 0.33984375, 2.076171875, 3.8125, 5.548828125, 7.28515625, 9.021484375, 10.7578125, 12.494140625, 14.23046875, 15.966796875, 17.703125, 19.439453125, 21.17578125, 22.912109375, 24.6484375, 26.384765625, 28.12109375, 29.857421875, 31.59375, 33.330078125, 35.06640625, 36.802734375, 38.5390625, 40.275390625, 42.01171875, 43.748046875, 45.484375, 47.220703125, 48.95703125, 50.693359375, 52.4296875, 54.166015625, 55.90234375, 57.638671875, 59.375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 16.0, 23.0, 27.0, 39.0, 41.0, 81.0, 123.0, 183.0, 306.0, 510.0, 1070.0, 2461.0, 6230.0, 20576.0, 85191.0, 336018.0, 423328.0, 128158.0, 29649.0, 8602.0, 2985.0, 1291.0, 664.0, 366.0, 187.0, 122.0, 73.0, 55.0, 40.0, 13.0, 19.0, 14.0, 16.0, 12.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.35986328125, -33.2197265625, -32.07958984375, -30.939453125, -29.79931640625, -28.6591796875, -27.51904296875, -26.37890625, -25.23876953125, -24.0986328125, -22.95849609375, -21.818359375, -20.67822265625, -19.5380859375, -18.39794921875, -17.2578125, -16.11767578125, -14.9775390625, -13.83740234375, -12.697265625, -11.55712890625, -10.4169921875, -9.27685546875, -8.13671875, -6.99658203125, -5.8564453125, -4.71630859375, -3.576171875, -2.43603515625, -1.2958984375, -0.15576171875, 0.984375, 2.12451171875, 3.2646484375, 4.40478515625, 5.544921875, 6.68505859375, 7.8251953125, 8.96533203125, 10.10546875, 11.24560546875, 12.3857421875, 13.52587890625, 14.666015625, 15.80615234375, 16.9462890625, 18.08642578125, 19.2265625, 20.36669921875, 21.5068359375, 22.64697265625, 23.787109375, 24.92724609375, 26.0673828125, 27.20751953125, 28.34765625, 29.48779296875, 30.6279296875, 31.76806640625, 32.908203125, 34.04833984375, 35.1884765625, 36.32861328125, 37.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 5.0, 9.0, 7.0, 5.0, 16.0, 18.0, 19.0, 32.0, 26.0, 26.0, 41.0, 47.0, 67.0, 100.0, 89.0, 92.0, 64.0, 50.0, 51.0, 45.0, 28.0, 35.0, 21.0, 21.0, 22.0, 9.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.004543304443359375, -0.004396557807922363, -0.0042498111724853516, -0.00410306453704834, -0.003956317901611328, -0.0038095712661743164, -0.0036628246307373047, -0.003516077995300293, -0.0033693313598632812, -0.0032225847244262695, -0.003075838088989258, -0.002929091453552246, -0.0027823448181152344, -0.0026355981826782227, -0.002488851547241211, -0.0023421049118041992, -0.0021953582763671875, -0.0020486116409301758, -0.001901865005493164, -0.0017551183700561523, -0.0016083717346191406, -0.001461625099182129, -0.0013148784637451172, -0.0011681318283081055, -0.0010213851928710938, -0.000874638557434082, -0.0007278919219970703, -0.0005811452865600586, -0.0004343986511230469, -0.00028765201568603516, -0.00014090538024902344, 5.841255187988281e-06, 0.000152587890625, 0.0002993345260620117, 0.00044608116149902344, 0.0005928277969360352, 0.0007395744323730469, 0.0008863210678100586, 0.0010330677032470703, 0.001179814338684082, 0.0013265609741210938, 0.0014733076095581055, 0.0016200542449951172, 0.001766800880432129, 0.0019135475158691406, 0.0020602941513061523, 0.002207040786743164, 0.0023537874221801758, 0.0025005340576171875, 0.0026472806930541992, 0.002794027328491211, 0.0029407739639282227, 0.0030875205993652344, 0.003234267234802246, 0.003381013870239258, 0.0035277605056762695, 0.0036745071411132812, 0.003821253776550293, 0.003968000411987305, 0.004114747047424316, 0.004261493682861328, 0.00440824031829834, 0.0045549869537353516, 0.004701733589172363, 0.004848480224609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 21.0, 23.0, 31.0, 54.0, 82.0, 123.0, 237.0, 382.0, 668.0, 1183.0, 2493.0, 5963.0, 17854.0, 75553.0, 349971.0, 442700.0, 112803.0, 24469.0, 7689.0, 2995.0, 1408.0, 737.0, 428.0, 247.0, 137.0, 96.0, 62.0, 36.0, 18.0, 14.0, 16.0, 7.0, 9.0, 6.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.59375, -39.3681640625, -38.142578125, -36.9169921875, -35.69140625, -34.4658203125, -33.240234375, -32.0146484375, -30.7890625, -29.5634765625, -28.337890625, -27.1123046875, -25.88671875, -24.6611328125, -23.435546875, -22.2099609375, -20.984375, -19.7587890625, -18.533203125, -17.3076171875, -16.08203125, -14.8564453125, -13.630859375, -12.4052734375, -11.1796875, -9.9541015625, -8.728515625, -7.5029296875, -6.27734375, -5.0517578125, -3.826171875, -2.6005859375, -1.375, -0.1494140625, 1.076171875, 2.3017578125, 3.52734375, 4.7529296875, 5.978515625, 7.2041015625, 8.4296875, 9.6552734375, 10.880859375, 12.1064453125, 13.33203125, 14.5576171875, 15.783203125, 17.0087890625, 18.234375, 19.4599609375, 20.685546875, 21.9111328125, 23.13671875, 24.3623046875, 25.587890625, 26.8134765625, 28.0390625, 29.2646484375, 30.490234375, 31.7158203125, 32.94140625, 34.1669921875, 35.392578125, 36.6181640625, 37.84375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 11.0, 14.0, 11.0, 17.0, 21.0, 23.0, 44.0, 48.0, 54.0, 58.0, 80.0, 92.0, 69.0, 78.0, 77.0, 52.0, 39.0, 48.0, 39.0, 27.0, 19.0, 16.0, 15.0, 8.0, 6.0, 10.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.453125, -21.758056640625, -21.06298828125, -20.367919921875, -19.6728515625, -18.977783203125, -18.28271484375, -17.587646484375, -16.892578125, -16.197509765625, -15.50244140625, -14.807373046875, -14.1123046875, -13.417236328125, -12.72216796875, -12.027099609375, -11.33203125, -10.636962890625, -9.94189453125, -9.246826171875, -8.5517578125, -7.856689453125, -7.16162109375, -6.466552734375, -5.771484375, -5.076416015625, -4.38134765625, -3.686279296875, -2.9912109375, -2.296142578125, -1.60107421875, -0.906005859375, -0.2109375, 0.484130859375, 1.17919921875, 1.874267578125, 2.5693359375, 3.264404296875, 3.95947265625, 4.654541015625, 5.349609375, 6.044677734375, 6.73974609375, 7.434814453125, 8.1298828125, 8.824951171875, 9.52001953125, 10.215087890625, 10.91015625, 11.605224609375, 12.30029296875, 12.995361328125, 13.6904296875, 14.385498046875, 15.08056640625, 15.775634765625, 16.470703125, 17.165771484375, 17.86083984375, 18.555908203125, 19.2509765625, 19.946044921875, 20.64111328125, 21.336181640625, 22.03125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 18.0, 14.0, 37.0, 61.0, 68.0, 82.0, 96.0, 129.0, 96.0, 92.0, 75.0, 54.0, 47.0, 37.0, 22.0, 13.0, 11.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-502.29571533203125, -489.33551025390625, -476.37530517578125, -463.4150695800781, -450.4548645019531, -437.4946594238281, -424.5344543457031, -411.57421875, -398.614013671875, -385.65380859375, -372.693603515625, -359.7333679199219, -346.7731628417969, -333.8129577636719, -320.8527526855469, -307.89251708984375, -294.93231201171875, -281.97210693359375, -269.01190185546875, -256.0516662597656, -243.09146118164062, -230.13125610351562, -217.17105102539062, -204.21083068847656, -191.25064086914062, -178.29043579101562, -165.33021545410156, -152.37001037597656, -139.4097900390625, -126.4495849609375, -113.48937225341797, -100.52915954589844, -87.56893920898438, -74.60872650146484, -61.64851379394531, -48.68830490112305, -35.728092193603516, -22.76788330078125, -9.807670593261719, 3.1525421142578125, 16.112754821777344, 29.072967529296875, 42.033180236816406, 54.99338912963867, 67.95359802246094, 80.91381072998047, 93.8740234375, 106.83423614501953, 119.79444885253906, 132.75465393066406, 145.71487426757812, 158.67507934570312, 171.6352996826172, 184.5955047607422, 197.55572509765625, 210.51593017578125, 223.47613525390625, 236.43634033203125, 249.3965606689453, 262.3567810058594, 275.3169860839844, 288.2771911621094, 301.2373962402344, 314.1976318359375, 327.1578369140625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 11.0, 4.0, 10.0, 17.0, 18.0, 15.0, 23.0, 28.0, 28.0, 46.0, 47.0, 34.0, 35.0, 58.0, 44.0, 49.0, 58.0, 57.0, 45.0, 39.0, 46.0, 43.0, 28.0, 44.0, 25.0, 36.0, 20.0, 14.0, 9.0, 18.0, 10.0, 5.0, 4.0, 11.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.86920166015625, -280.7148132324219, -270.5603942871094, -260.406005859375, -250.25161743164062, -240.0972137451172, -229.94281005859375, -219.78842163085938, -209.63401794433594, -199.4796142578125, -189.32522583007812, -179.1708221435547, -169.01641845703125, -158.86203002929688, -148.70762634277344, -138.55322265625, -128.39883422851562, -118.24443817138672, -108.09004211425781, -97.93563842773438, -87.78124237060547, -77.62684631347656, -67.47244262695312, -57.31804656982422, -47.16365051269531, -37.009254455566406, -26.854854583740234, -16.700456619262695, -6.546058654785156, 3.60833740234375, 13.762737274169922, 23.917137145996094, 34.071533203125, 44.225929260253906, 54.38032913208008, 64.53472900390625, 74.68912506103516, 84.84352111816406, 94.9979248046875, 105.1523208618164, 115.30671691894531, 125.46111297607422, 135.61550903320312, 145.76991271972656, 155.92431640625, 166.07870483398438, 176.2331085205078, 186.38751220703125, 196.54190063476562, 206.69630432128906, 216.85069274902344, 227.00509643554688, 237.15948486328125, 247.3138885498047, 257.4682922363281, 267.6226806640625, 277.777099609375, 287.9314880371094, 298.0859069824219, 308.24029541015625, 318.3946838378906, 328.549072265625, 338.7034912109375, 348.8578796386719, 359.01226806640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 8.0, 20.0, 33.0, 48.0, 73.0, 102.0, 181.0, 329.0, 610.0, 1199.0, 2964.0, 8620.0, 33589.0, 353145.0, 3695411.0, 74827.0, 14901.0, 4668.0, 1747.0, 799.0, 416.0, 225.0, 125.0, 69.0, 49.0, 27.0, 24.0, 15.0, 6.0, 11.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-145.0, -139.861328125, -134.72265625, -129.583984375, -124.4453125, -119.306640625, -114.16796875, -109.029296875, -103.890625, -98.751953125, -93.61328125, -88.474609375, -83.3359375, -78.197265625, -73.05859375, -67.919921875, -62.78125, -57.642578125, -52.50390625, -47.365234375, -42.2265625, -37.087890625, -31.94921875, -26.810546875, -21.671875, -16.533203125, -11.39453125, -6.255859375, -1.1171875, 4.021484375, 9.16015625, 14.298828125, 19.4375, 24.576171875, 29.71484375, 34.853515625, 39.9921875, 45.130859375, 50.26953125, 55.408203125, 60.546875, 65.685546875, 70.82421875, 75.962890625, 81.1015625, 86.240234375, 91.37890625, 96.517578125, 101.65625, 106.794921875, 111.93359375, 117.072265625, 122.2109375, 127.349609375, 132.48828125, 137.626953125, 142.765625, 147.904296875, 153.04296875, 158.181640625, 163.3203125, 168.458984375, 173.59765625, 178.736328125, 183.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 14.0, 21.0, 20.0, 19.0, 32.0, 46.0, 60.0, 65.0, 69.0, 82.0, 81.0, 82.0, 68.0, 76.0, 50.0, 54.0, 31.0, 41.0, 27.0, 16.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5390625, -14.9981689453125, -14.457275390625, -13.9163818359375, -13.37548828125, -12.8345947265625, -12.293701171875, -11.7528076171875, -11.2119140625, -10.6710205078125, -10.130126953125, -9.5892333984375, -9.04833984375, -8.5074462890625, -7.966552734375, -7.4256591796875, -6.884765625, -6.3438720703125, -5.802978515625, -5.2620849609375, -4.72119140625, -4.1802978515625, -3.639404296875, -3.0985107421875, -2.5576171875, -2.0167236328125, -1.475830078125, -0.9349365234375, -0.39404296875, 0.1468505859375, 0.687744140625, 1.2286376953125, 1.76953125, 2.3104248046875, 2.851318359375, 3.3922119140625, 3.93310546875, 4.4739990234375, 5.014892578125, 5.5557861328125, 6.0966796875, 6.6375732421875, 7.178466796875, 7.7193603515625, 8.26025390625, 8.8011474609375, 9.342041015625, 9.8829345703125, 10.423828125, 10.9647216796875, 11.505615234375, 12.0465087890625, 12.58740234375, 13.1282958984375, 13.669189453125, 14.2100830078125, 14.7509765625, 15.2918701171875, 15.832763671875, 16.3736572265625, 16.91455078125, 17.4554443359375, 17.996337890625, 18.5372314453125, 19.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 5.0, 7.0, 12.0, 12.0, 18.0, 28.0, 17.0, 27.0, 34.0, 36.0, 80.0, 101.0, 157.0, 327.0, 701.0, 1710.0, 4944.0, 16478.0, 69454.0, 576713.0, 3327656.0, 152370.0, 29879.0, 8311.0, 2920.0, 1191.0, 511.0, 217.0, 126.0, 61.0, 47.0, 33.0, 24.0, 16.0, 17.0, 8.0, 11.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.3125, -118.5166015625, -114.720703125, -110.9248046875, -107.12890625, -103.3330078125, -99.537109375, -95.7412109375, -91.9453125, -88.1494140625, -84.353515625, -80.5576171875, -76.76171875, -72.9658203125, -69.169921875, -65.3740234375, -61.578125, -57.7822265625, -53.986328125, -50.1904296875, -46.39453125, -42.5986328125, -38.802734375, -35.0068359375, -31.2109375, -27.4150390625, -23.619140625, -19.8232421875, -16.02734375, -12.2314453125, -8.435546875, -4.6396484375, -0.84375, 2.9521484375, 6.748046875, 10.5439453125, 14.33984375, 18.1357421875, 21.931640625, 25.7275390625, 29.5234375, 33.3193359375, 37.115234375, 40.9111328125, 44.70703125, 48.5029296875, 52.298828125, 56.0947265625, 59.890625, 63.6865234375, 67.482421875, 71.2783203125, 75.07421875, 78.8701171875, 82.666015625, 86.4619140625, 90.2578125, 94.0537109375, 97.849609375, 101.6455078125, 105.44140625, 109.2373046875, 113.033203125, 116.8291015625, 120.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 3.0, 6.0, 20.0, 29.0, 42.0, 63.0, 113.0, 214.0, 604.0, 2060.0, 440.0, 210.0, 108.0, 50.0, 39.0, 21.0, 20.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-54.9375, -53.75244140625, -52.5673828125, -51.38232421875, -50.197265625, -49.01220703125, -47.8271484375, -46.64208984375, -45.45703125, -44.27197265625, -43.0869140625, -41.90185546875, -40.716796875, -39.53173828125, -38.3466796875, -37.16162109375, -35.9765625, -34.79150390625, -33.6064453125, -32.42138671875, -31.236328125, -30.05126953125, -28.8662109375, -27.68115234375, -26.49609375, -25.31103515625, -24.1259765625, -22.94091796875, -21.755859375, -20.57080078125, -19.3857421875, -18.20068359375, -17.015625, -15.83056640625, -14.6455078125, -13.46044921875, -12.275390625, -11.09033203125, -9.9052734375, -8.72021484375, -7.53515625, -6.35009765625, -5.1650390625, -3.97998046875, -2.794921875, -1.60986328125, -0.4248046875, 0.76025390625, 1.9453125, 3.13037109375, 4.3154296875, 5.50048828125, 6.685546875, 7.87060546875, 9.0556640625, 10.24072265625, 11.42578125, 12.61083984375, 13.7958984375, 14.98095703125, 16.166015625, 17.35107421875, 18.5361328125, 19.72119140625, 20.90625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 4.0, 11.0, 19.0, 18.0, 34.0, 46.0, 75.0, 133.0, 120.0, 143.0, 123.0, 89.0, 73.0, 35.0, 28.0, 17.0, 7.0, 8.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.0135269165039, -115.53886413574219, -110.06420135498047, -104.58953857421875, -99.11488342285156, -93.64021301269531, -88.16555786132812, -82.6908950805664, -77.21623229980469, -71.74156951904297, -66.26690673828125, -60.7922477722168, -55.31758499145508, -49.84292221069336, -44.368263244628906, -38.89360046386719, -33.41893768310547, -27.94427490234375, -22.469614028930664, -16.994953155517578, -11.52029037475586, -6.045627593994141, -0.5709686279296875, 4.903694152832031, 10.37835693359375, 15.853018760681152, 21.327680587768555, 26.80234146118164, 32.27700424194336, 37.75166702270508, 43.22632598876953, 48.70098876953125, 54.17564392089844, 59.650306701660156, 65.12496948242188, 70.59962463378906, 76.07429504394531, 81.5489501953125, 87.02361297607422, 92.49827575683594, 97.97293853759766, 103.44760131835938, 108.9222640991211, 114.39692687988281, 119.87158203125, 125.34625244140625, 130.82090759277344, 136.29556274414062, 141.77023315429688, 147.24488830566406, 152.7195587158203, 158.1942138671875, 163.66888427734375, 169.14353942871094, 174.61819458007812, 180.09286499023438, 185.56753540039062, 191.0421905517578, 196.51686096191406, 201.99151611328125, 207.4661865234375, 212.9408416748047, 218.41549682617188, 223.89016723632812, 229.3648223876953]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 9.0, 13.0, 15.0, 19.0, 18.0, 24.0, 20.0, 31.0, 29.0, 34.0, 35.0, 29.0, 28.0, 51.0, 39.0, 38.0, 48.0, 47.0, 44.0, 42.0, 42.0, 37.0, 30.0, 29.0, 32.0, 27.0, 20.0, 15.0, 19.0, 13.0, 11.0, 13.0, 11.0, 9.0, 11.0, 11.0, 2.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-86.27619934082031, -83.82474517822266, -81.373291015625, -78.92182922363281, -76.47037506103516, -74.0189208984375, -71.56746673583984, -69.11601257324219, -66.66455078125, -64.21309661865234, -61.76163864135742, -59.310184478759766, -56.858726501464844, -54.40727233886719, -51.95581817626953, -49.50436019897461, -47.05290603637695, -44.6014518737793, -42.149993896484375, -39.69853973388672, -37.2470817565918, -34.79562759399414, -32.34416961669922, -29.892715454101562, -27.441259384155273, -24.989803314208984, -22.538347244262695, -20.086891174316406, -17.63543701171875, -15.183979988098145, -12.732524871826172, -10.281068801879883, -7.829612731933594, -5.378156661987305, -2.926701068878174, -0.47524547576904297, 1.976210594177246, 4.427666664123535, 6.879121780395508, 9.330577850341797, 11.782033920288086, 14.233489990234375, 16.684946060180664, 19.136402130126953, 21.58785629272461, 24.03931427001953, 26.490768432617188, 28.942224502563477, 31.393680572509766, 33.84513473510742, 36.296592712402344, 38.748046875, 41.19950485229492, 43.65095901489258, 46.1024169921875, 48.553871154785156, 51.00532531738281, 53.45677947998047, 55.90823745727539, 58.35969161987305, 60.81114959716797, 63.262603759765625, 65.71405792236328, 68.16551208496094, 70.61697387695312]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 24.0, 40.0, 42.0, 70.0, 80.0, 197.0, 271.0, 484.0, 1001.0, 2147.0, 5643.0, 18128.0, 66668.0, 255361.0, 471452.0, 164830.0, 42863.0, 11817.0, 3981.0, 1622.0, 755.0, 416.0, 231.0, 126.0, 86.0, 52.0, 48.0, 30.0, 17.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.875, -92.6064453125, -89.337890625, -86.0693359375, -82.80078125, -79.5322265625, -76.263671875, -72.9951171875, -69.7265625, -66.4580078125, -63.189453125, -59.9208984375, -56.65234375, -53.3837890625, -50.115234375, -46.8466796875, -43.578125, -40.3095703125, -37.041015625, -33.7724609375, -30.50390625, -27.2353515625, -23.966796875, -20.6982421875, -17.4296875, -14.1611328125, -10.892578125, -7.6240234375, -4.35546875, -1.0869140625, 2.181640625, 5.4501953125, 8.71875, 11.9873046875, 15.255859375, 18.5244140625, 21.79296875, 25.0615234375, 28.330078125, 31.5986328125, 34.8671875, 38.1357421875, 41.404296875, 44.6728515625, 47.94140625, 51.2099609375, 54.478515625, 57.7470703125, 61.015625, 64.2841796875, 67.552734375, 70.8212890625, 74.08984375, 77.3583984375, 80.626953125, 83.8955078125, 87.1640625, 90.4326171875, 93.701171875, 96.9697265625, 100.23828125, 103.5068359375, 106.775390625, 110.0439453125, 113.3125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 16.0, 12.0, 26.0, 22.0, 36.0, 46.0, 53.0, 72.0, 73.0, 101.0, 92.0, 75.0, 90.0, 67.0, 46.0, 46.0, 44.0, 25.0, 21.0, 11.0, 7.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.71875, -15.12451171875, -14.5302734375, -13.93603515625, -13.341796875, -12.74755859375, -12.1533203125, -11.55908203125, -10.96484375, -10.37060546875, -9.7763671875, -9.18212890625, -8.587890625, -7.99365234375, -7.3994140625, -6.80517578125, -6.2109375, -5.61669921875, -5.0224609375, -4.42822265625, -3.833984375, -3.23974609375, -2.6455078125, -2.05126953125, -1.45703125, -0.86279296875, -0.2685546875, 0.32568359375, 0.919921875, 1.51416015625, 2.1083984375, 2.70263671875, 3.296875, 3.89111328125, 4.4853515625, 5.07958984375, 5.673828125, 6.26806640625, 6.8623046875, 7.45654296875, 8.05078125, 8.64501953125, 9.2392578125, 9.83349609375, 10.427734375, 11.02197265625, 11.6162109375, 12.21044921875, 12.8046875, 13.39892578125, 13.9931640625, 14.58740234375, 15.181640625, 15.77587890625, 16.3701171875, 16.96435546875, 17.55859375, 18.15283203125, 18.7470703125, 19.34130859375, 19.935546875, 20.52978515625, 21.1240234375, 21.71826171875, 22.3125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 11.0, 14.0, 18.0, 28.0, 47.0, 61.0, 91.0, 97.0, 171.0, 214.0, 275.0, 466.0, 746.0, 1258.0, 2144.0, 4337.0, 9375.0, 21474.0, 54359.0, 133009.0, 275978.0, 293049.0, 145947.0, 60441.0, 24088.0, 10186.0, 4703.0, 2332.0, 1302.0, 776.0, 488.0, 328.0, 208.0, 140.0, 113.0, 71.0, 64.0, 44.0, 33.0, 14.0, 18.0, 10.0, 6.0, 3.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.375, -49.720703125, -48.06640625, -46.412109375, -44.7578125, -43.103515625, -41.44921875, -39.794921875, -38.140625, -36.486328125, -34.83203125, -33.177734375, -31.5234375, -29.869140625, -28.21484375, -26.560546875, -24.90625, -23.251953125, -21.59765625, -19.943359375, -18.2890625, -16.634765625, -14.98046875, -13.326171875, -11.671875, -10.017578125, -8.36328125, -6.708984375, -5.0546875, -3.400390625, -1.74609375, -0.091796875, 1.5625, 3.216796875, 4.87109375, 6.525390625, 8.1796875, 9.833984375, 11.48828125, 13.142578125, 14.796875, 16.451171875, 18.10546875, 19.759765625, 21.4140625, 23.068359375, 24.72265625, 26.376953125, 28.03125, 29.685546875, 31.33984375, 32.994140625, 34.6484375, 36.302734375, 37.95703125, 39.611328125, 41.265625, 42.919921875, 44.57421875, 46.228515625, 47.8828125, 49.537109375, 51.19140625, 52.845703125, 54.5]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 4.0, 13.0, 9.0, 14.0, 16.0, 14.0, 16.0, 24.0, 24.0, 27.0, 40.0, 32.0, 33.0, 43.0, 38.0, 50.0, 50.0, 60.0, 54.0, 45.0, 37.0, 50.0, 41.0, 44.0, 41.0, 30.0, 27.0, 15.0, 27.0, 17.0, 14.0, 9.0, 8.0, 11.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.76171875, -39.2109375, -37.66015625, -36.109375, -34.55859375, -33.0078125, -31.45703125, -29.90625, -28.35546875, -26.8046875, -25.25390625, -23.703125, -22.15234375, -20.6015625, -19.05078125, -17.5, -15.94921875, -14.3984375, -12.84765625, -11.296875, -9.74609375, -8.1953125, -6.64453125, -5.09375, -3.54296875, -1.9921875, -0.44140625, 1.109375, 2.66015625, 4.2109375, 5.76171875, 7.3125, 8.86328125, 10.4140625, 11.96484375, 13.515625, 15.06640625, 16.6171875, 18.16796875, 19.71875, 21.26953125, 22.8203125, 24.37109375, 25.921875, 27.47265625, 29.0234375, 30.57421875, 32.125, 33.67578125, 35.2265625, 36.77734375, 38.328125, 39.87890625, 41.4296875, 42.98046875, 44.53125, 46.08203125, 47.6328125, 49.18359375, 50.734375, 52.28515625, 53.8359375, 55.38671875, 56.9375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 17.0, 11.0, 29.0, 29.0, 48.0, 82.0, 128.0, 229.0, 472.0, 857.0, 1738.0, 3924.0, 11314.0, 45845.0, 279892.0, 552160.0, 117351.0, 22383.0, 6616.0, 2686.0, 1213.0, 655.0, 353.0, 202.0, 98.0, 68.0, 39.0, 27.0, 21.0, 9.0, 12.0, 7.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.65625, -41.2919921875, -39.927734375, -38.5634765625, -37.19921875, -35.8349609375, -34.470703125, -33.1064453125, -31.7421875, -30.3779296875, -29.013671875, -27.6494140625, -26.28515625, -24.9208984375, -23.556640625, -22.1923828125, -20.828125, -19.4638671875, -18.099609375, -16.7353515625, -15.37109375, -14.0068359375, -12.642578125, -11.2783203125, -9.9140625, -8.5498046875, -7.185546875, -5.8212890625, -4.45703125, -3.0927734375, -1.728515625, -0.3642578125, 1.0, 2.3642578125, 3.728515625, 5.0927734375, 6.45703125, 7.8212890625, 9.185546875, 10.5498046875, 11.9140625, 13.2783203125, 14.642578125, 16.0068359375, 17.37109375, 18.7353515625, 20.099609375, 21.4638671875, 22.828125, 24.1923828125, 25.556640625, 26.9208984375, 28.28515625, 29.6494140625, 31.013671875, 32.3779296875, 33.7421875, 35.1064453125, 36.470703125, 37.8349609375, 39.19921875, 40.5634765625, 41.927734375, 43.2919921875, 44.65625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 7.0, 10.0, 10.0, 13.0, 14.0, 22.0, 37.0, 41.0, 66.0, 82.0, 130.0, 145.0, 107.0, 81.0, 58.0, 38.0, 34.0, 29.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00690460205078125, -0.006703615188598633, -0.006502628326416016, -0.0063016414642333984, -0.006100654602050781, -0.005899667739868164, -0.005698680877685547, -0.00549769401550293, -0.0052967071533203125, -0.005095720291137695, -0.004894733428955078, -0.004693746566772461, -0.004492759704589844, -0.0042917728424072266, -0.004090785980224609, -0.003889799118041992, -0.003688812255859375, -0.003487825393676758, -0.0032868385314941406, -0.0030858516693115234, -0.0028848648071289062, -0.002683877944946289, -0.002482891082763672, -0.0022819042205810547, -0.0020809173583984375, -0.0018799304962158203, -0.0016789436340332031, -0.001477956771850586, -0.0012769699096679688, -0.0010759830474853516, -0.0008749961853027344, -0.0006740093231201172, -0.0004730224609375, -0.0002720355987548828, -7.104873657226562e-05, 0.00012993812561035156, 0.00033092498779296875, 0.0005319118499755859, 0.0007328987121582031, 0.0009338855743408203, 0.0011348724365234375, 0.0013358592987060547, 0.0015368461608886719, 0.001737833023071289, 0.0019388198852539062, 0.0021398067474365234, 0.0023407936096191406, 0.002541780471801758, 0.002742767333984375, 0.002943754196166992, 0.0031447410583496094, 0.0033457279205322266, 0.0035467147827148438, 0.003747701644897461, 0.003948688507080078, 0.004149675369262695, 0.0043506622314453125, 0.00455164909362793, 0.004752635955810547, 0.004953622817993164, 0.005154609680175781, 0.0053555965423583984, 0.005556583404541016, 0.005757570266723633, 0.00595855712890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 0.0, 3.0, 6.0, 2.0, 7.0, 6.0, 10.0, 24.0, 21.0, 28.0, 46.0, 77.0, 134.0, 200.0, 372.0, 728.0, 1535.0, 3540.0, 9782.0, 38165.0, 302387.0, 588049.0, 78453.0, 15701.0, 5084.0, 1994.0, 954.0, 486.0, 279.0, 173.0, 93.0, 62.0, 40.0, 36.0, 15.0, 15.0, 9.0, 6.0, 7.0, 9.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1875, -54.54443359375, -52.9013671875, -51.25830078125, -49.615234375, -47.97216796875, -46.3291015625, -44.68603515625, -43.04296875, -41.39990234375, -39.7568359375, -38.11376953125, -36.470703125, -34.82763671875, -33.1845703125, -31.54150390625, -29.8984375, -28.25537109375, -26.6123046875, -24.96923828125, -23.326171875, -21.68310546875, -20.0400390625, -18.39697265625, -16.75390625, -15.11083984375, -13.4677734375, -11.82470703125, -10.181640625, -8.53857421875, -6.8955078125, -5.25244140625, -3.609375, -1.96630859375, -0.3232421875, 1.31982421875, 2.962890625, 4.60595703125, 6.2490234375, 7.89208984375, 9.53515625, 11.17822265625, 12.8212890625, 14.46435546875, 16.107421875, 17.75048828125, 19.3935546875, 21.03662109375, 22.6796875, 24.32275390625, 25.9658203125, 27.60888671875, 29.251953125, 30.89501953125, 32.5380859375, 34.18115234375, 35.82421875, 37.46728515625, 39.1103515625, 40.75341796875, 42.396484375, 44.03955078125, 45.6826171875, 47.32568359375, 48.96875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 2.0, 6.0, 4.0, 7.0, 9.0, 8.0, 8.0, 21.0, 28.0, 26.0, 44.0, 61.0, 69.0, 80.0, 81.0, 104.0, 101.0, 85.0, 62.0, 46.0, 40.0, 32.0, 17.0, 16.0, 7.0, 9.0, 4.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.82421875, -30.9921875, -30.16015625, -29.328125, -28.49609375, -27.6640625, -26.83203125, -26.0, -25.16796875, -24.3359375, -23.50390625, -22.671875, -21.83984375, -21.0078125, -20.17578125, -19.34375, -18.51171875, -17.6796875, -16.84765625, -16.015625, -15.18359375, -14.3515625, -13.51953125, -12.6875, -11.85546875, -11.0234375, -10.19140625, -9.359375, -8.52734375, -7.6953125, -6.86328125, -6.03125, -5.19921875, -4.3671875, -3.53515625, -2.703125, -1.87109375, -1.0390625, -0.20703125, 0.625, 1.45703125, 2.2890625, 3.12109375, 3.953125, 4.78515625, 5.6171875, 6.44921875, 7.28125, 8.11328125, 8.9453125, 9.77734375, 10.609375, 11.44140625, 12.2734375, 13.10546875, 13.9375, 14.76953125, 15.6015625, 16.43359375, 17.265625, 18.09765625, 18.9296875, 19.76171875, 20.59375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 7.0, 9.0, 6.0, 19.0, 19.0, 29.0, 51.0, 59.0, 100.0, 92.0, 110.0, 121.0, 84.0, 90.0, 68.0, 39.0, 29.0, 21.0, 12.0, 10.0, 11.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-573.565673828125, -561.1333618164062, -548.7010498046875, -536.268798828125, -523.8364868164062, -511.4041748046875, -498.97186279296875, -486.53955078125, -474.10723876953125, -461.6749267578125, -449.2426452636719, -436.8103332519531, -424.3780212402344, -411.94573974609375, -399.513427734375, -387.08111572265625, -374.6488342285156, -362.2165222167969, -349.78424072265625, -337.3519287109375, -324.91961669921875, -312.4873046875, -300.0550231933594, -287.6227111816406, -275.1904296875, -262.75811767578125, -250.32582092285156, -237.89352416992188, -225.46121215820312, -213.02891540527344, -200.59661865234375, -188.164306640625, -175.73202514648438, -163.2997283935547, -150.86741638183594, -138.43511962890625, -126.00281524658203, -113.57051086425781, -101.13821411132812, -88.7059097290039, -76.27360534667969, -63.84130096435547, -51.409000396728516, -38.97669982910156, -26.544395446777344, -14.112091064453125, -1.6797943115234375, 10.752510070800781, 23.184814453125, 35.61711883544922, 48.04941940307617, 60.481719970703125, 72.91402435302734, 85.34632873535156, 97.77862548828125, 110.21092987060547, 122.64323425292969, 135.07553100585938, 147.50784301757812, 159.9401397705078, 172.3724365234375, 184.80474853515625, 197.23704528808594, 209.66934204101562, 222.10165405273438]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 6.0, 10.0, 11.0, 14.0, 11.0, 18.0, 29.0, 30.0, 35.0, 40.0, 49.0, 32.0, 40.0, 52.0, 42.0, 35.0, 46.0, 58.0, 51.0, 51.0, 49.0, 48.0, 29.0, 39.0, 35.0, 26.0, 23.0, 12.0, 19.0, 26.0, 2.0, 5.0, 4.0, 8.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-315.7646179199219, -306.2895202636719, -296.8144226074219, -287.3393249511719, -277.8642272949219, -268.3891296386719, -258.9140319824219, -249.4389190673828, -239.9638214111328, -230.4887237548828, -221.0136260986328, -211.5385284423828, -202.06341552734375, -192.58831787109375, -183.11322021484375, -173.63812255859375, -164.16302490234375, -154.68792724609375, -145.21282958984375, -135.73773193359375, -126.26262664794922, -116.78752899169922, -107.31242370605469, -97.83732604980469, -88.36222839355469, -78.88713073730469, -69.41203308105469, -59.936927795410156, -50.461830139160156, -40.986732482910156, -31.51163101196289, -22.036529541015625, -12.56146240234375, -3.086362838745117, 6.388736724853516, 15.863836288452148, 25.33893585205078, 34.81403350830078, 44.28913497924805, 53.76423645019531, 63.23933410644531, 72.71443176269531, 82.18952941894531, 91.66463470458984, 101.13973236083984, 110.61483001708984, 120.08993530273438, 129.56503295898438, 139.04013061523438, 148.51522827148438, 157.99032592773438, 167.46542358398438, 176.94052124023438, 186.41561889648438, 195.89073181152344, 205.36582946777344, 214.84092712402344, 224.31602478027344, 233.79112243652344, 243.26622009277344, 252.7413330078125, 262.2164306640625, 271.6915283203125, 281.1666259765625, 290.6417236328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 26.0, 38.0, 49.0, 64.0, 121.0, 238.0, 481.0, 916.0, 2287.0, 6420.0, 22276.0, 122367.0, 3535504.0, 438003.0, 47545.0, 11231.0, 3589.0, 1463.0, 688.0, 352.0, 192.0, 127.0, 62.0, 40.0, 38.0, 33.0, 21.0, 17.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-129.25, -124.591796875, -119.93359375, -115.275390625, -110.6171875, -105.958984375, -101.30078125, -96.642578125, -91.984375, -87.326171875, -82.66796875, -78.009765625, -73.3515625, -68.693359375, -64.03515625, -59.376953125, -54.71875, -50.060546875, -45.40234375, -40.744140625, -36.0859375, -31.427734375, -26.76953125, -22.111328125, -17.453125, -12.794921875, -8.13671875, -3.478515625, 1.1796875, 5.837890625, 10.49609375, 15.154296875, 19.8125, 24.470703125, 29.12890625, 33.787109375, 38.4453125, 43.103515625, 47.76171875, 52.419921875, 57.078125, 61.736328125, 66.39453125, 71.052734375, 75.7109375, 80.369140625, 85.02734375, 89.685546875, 94.34375, 99.001953125, 103.66015625, 108.318359375, 112.9765625, 117.634765625, 122.29296875, 126.951171875, 131.609375, 136.267578125, 140.92578125, 145.583984375, 150.2421875, 154.900390625, 159.55859375, 164.216796875, 168.875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 14.0, 20.0, 23.0, 31.0, 33.0, 58.0, 69.0, 96.0, 97.0, 84.0, 77.0, 74.0, 97.0, 60.0, 45.0, 40.0, 26.0, 17.0, 23.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.501220703125, -16.89306640625, -16.284912109375, -15.6767578125, -15.068603515625, -14.46044921875, -13.852294921875, -13.244140625, -12.635986328125, -12.02783203125, -11.419677734375, -10.8115234375, -10.203369140625, -9.59521484375, -8.987060546875, -8.37890625, -7.770751953125, -7.16259765625, -6.554443359375, -5.9462890625, -5.338134765625, -4.72998046875, -4.121826171875, -3.513671875, -2.905517578125, -2.29736328125, -1.689208984375, -1.0810546875, -0.472900390625, 0.13525390625, 0.743408203125, 1.3515625, 1.959716796875, 2.56787109375, 3.176025390625, 3.7841796875, 4.392333984375, 5.00048828125, 5.608642578125, 6.216796875, 6.824951171875, 7.43310546875, 8.041259765625, 8.6494140625, 9.257568359375, 9.86572265625, 10.473876953125, 11.08203125, 11.690185546875, 12.29833984375, 12.906494140625, 13.5146484375, 14.122802734375, 14.73095703125, 15.339111328125, 15.947265625, 16.555419921875, 17.16357421875, 17.771728515625, 18.3798828125, 18.988037109375, 19.59619140625, 20.204345703125, 20.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 10.0, 13.0, 15.0, 28.0, 27.0, 60.0, 51.0, 69.0, 89.0, 119.0, 185.0, 234.0, 328.0, 493.0, 893.0, 1551.0, 3168.0, 8295.0, 27271.0, 135507.0, 2376303.0, 1485477.0, 115666.0, 24127.0, 7263.0, 2980.0, 1485.0, 856.0, 549.0, 361.0, 214.0, 149.0, 102.0, 81.0, 80.0, 42.0, 31.0, 26.0, 24.0, 14.0, 7.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-109.0, -105.58984375, -102.1796875, -98.76953125, -95.359375, -91.94921875, -88.5390625, -85.12890625, -81.71875, -78.30859375, -74.8984375, -71.48828125, -68.078125, -64.66796875, -61.2578125, -57.84765625, -54.4375, -51.02734375, -47.6171875, -44.20703125, -40.796875, -37.38671875, -33.9765625, -30.56640625, -27.15625, -23.74609375, -20.3359375, -16.92578125, -13.515625, -10.10546875, -6.6953125, -3.28515625, 0.125, 3.53515625, 6.9453125, 10.35546875, 13.765625, 17.17578125, 20.5859375, 23.99609375, 27.40625, 30.81640625, 34.2265625, 37.63671875, 41.046875, 44.45703125, 47.8671875, 51.27734375, 54.6875, 58.09765625, 61.5078125, 64.91796875, 68.328125, 71.73828125, 75.1484375, 78.55859375, 81.96875, 85.37890625, 88.7890625, 92.19921875, 95.609375, 99.01953125, 102.4296875, 105.83984375, 109.25]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 5.0, 15.0, 25.0, 42.0, 63.0, 92.0, 167.0, 308.0, 709.0, 1652.0, 464.0, 236.0, 109.0, 69.0, 38.0, 27.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.875, -54.376953125, -52.87890625, -51.380859375, -49.8828125, -48.384765625, -46.88671875, -45.388671875, -43.890625, -42.392578125, -40.89453125, -39.396484375, -37.8984375, -36.400390625, -34.90234375, -33.404296875, -31.90625, -30.408203125, -28.91015625, -27.412109375, -25.9140625, -24.416015625, -22.91796875, -21.419921875, -19.921875, -18.423828125, -16.92578125, -15.427734375, -13.9296875, -12.431640625, -10.93359375, -9.435546875, -7.9375, -6.439453125, -4.94140625, -3.443359375, -1.9453125, -0.447265625, 1.05078125, 2.548828125, 4.046875, 5.544921875, 7.04296875, 8.541015625, 10.0390625, 11.537109375, 13.03515625, 14.533203125, 16.03125, 17.529296875, 19.02734375, 20.525390625, 22.0234375, 23.521484375, 25.01953125, 26.517578125, 28.015625, 29.513671875, 31.01171875, 32.509765625, 34.0078125, 35.505859375, 37.00390625, 38.501953125, 40.0]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 20.0, 25.0, 53.0, 66.0, 103.0, 117.0, 133.0, 116.0, 105.0, 70.0, 57.0, 45.0, 28.0, 12.0, 15.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.1314392089844, -355.24560546875, -346.35980224609375, -337.4739990234375, -328.5881652832031, -319.70233154296875, -310.8165283203125, -301.93072509765625, -293.0448913574219, -284.1590576171875, -275.27325439453125, -266.387451171875, -257.5016174316406, -248.6157989501953, -239.72998046875, -230.8441619873047, -221.95834350585938, -213.07252502441406, -204.18670654296875, -195.30088806152344, -186.41506958007812, -177.5292510986328, -168.6434326171875, -159.7576141357422, -150.87179565429688, -141.98597717285156, -133.10015869140625, -124.21434020996094, -115.32852172851562, -106.44270324707031, -97.556884765625, -88.67106628417969, -79.78526306152344, -70.89944458007812, -62.01362609863281, -53.1278076171875, -44.24198913574219, -35.356170654296875, -26.470352172851562, -17.58453369140625, -8.698715209960938, 0.187103271484375, 9.072921752929688, 17.958740234375, 26.844558715820312, 35.730377197265625, 44.61619567871094, 53.50201416015625, 62.38783264160156, 71.27365112304688, 80.15946960449219, 89.0452880859375, 97.93110656738281, 106.81692504882812, 115.70274353027344, 124.58856201171875, 133.47438049316406, 142.36019897460938, 151.2460174560547, 160.1318359375, 169.0176544189453, 177.90347290039062, 186.78929138183594, 195.67510986328125, 204.56092834472656]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 10.0, 8.0, 12.0, 23.0, 24.0, 27.0, 30.0, 35.0, 36.0, 40.0, 42.0, 41.0, 41.0, 40.0, 57.0, 60.0, 60.0, 37.0, 45.0, 36.0, 32.0, 33.0, 29.0, 39.0, 33.0, 21.0, 11.0, 18.0, 10.0, 15.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.99546813964844, -129.6334686279297, -125.27147674560547, -120.90947723388672, -116.5474853515625, -112.18548583984375, -107.823486328125, -103.46148681640625, -99.09949493408203, -94.73749542236328, -90.37550354003906, -86.01350402832031, -81.65150451660156, -77.28951263427734, -72.9275131225586, -68.56552124023438, -64.20352172851562, -59.84152603149414, -55.479530334472656, -51.117530822753906, -46.75553512573242, -42.39353942871094, -38.03153991699219, -33.6695442199707, -29.30754852294922, -24.945552825927734, -20.583555221557617, -16.2215576171875, -11.859561920166016, -7.497566223144531, -3.135568618774414, 1.2264289855957031, 5.588409423828125, 9.950406074523926, 14.312402725219727, 18.674400329589844, 23.036396026611328, 27.398391723632812, 31.76038932800293, 36.12238693237305, 40.48438262939453, 44.846378326416016, 49.2083740234375, 53.57037353515625, 57.932369232177734, 62.29436492919922, 66.65636444091797, 71.01835632324219, 75.38035583496094, 79.74235534667969, 84.1043472290039, 88.46634674072266, 92.82833862304688, 97.19033813476562, 101.55233764648438, 105.91433715820312, 110.27632904052734, 114.6383285522461, 119.00032043457031, 123.36231994628906, 127.72431945800781, 132.0863037109375, 136.44830322265625, 140.810302734375, 145.17230224609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 16.0, 27.0, 41.0, 62.0, 97.0, 153.0, 273.0, 511.0, 1087.0, 3045.0, 14729.0, 116540.0, 698525.0, 184847.0, 21902.0, 3983.0, 1342.0, 625.0, 278.0, 177.0, 116.0, 69.0, 31.0, 25.0, 15.0, 15.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.75, -174.84375, -168.9375, -163.03125, -157.125, -151.21875, -145.3125, -139.40625, -133.5, -127.59375, -121.6875, -115.78125, -109.875, -103.96875, -98.0625, -92.15625, -86.25, -80.34375, -74.4375, -68.53125, -62.625, -56.71875, -50.8125, -44.90625, -39.0, -33.09375, -27.1875, -21.28125, -15.375, -9.46875, -3.5625, 2.34375, 8.25, 14.15625, 20.0625, 25.96875, 31.875, 37.78125, 43.6875, 49.59375, 55.5, 61.40625, 67.3125, 73.21875, 79.125, 85.03125, 90.9375, 96.84375, 102.75, 108.65625, 114.5625, 120.46875, 126.375, 132.28125, 138.1875, 144.09375, 150.0, 155.90625, 161.8125, 167.71875, 173.625, 179.53125, 185.4375, 191.34375, 197.25]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 20.0, 31.0, 37.0, 54.0, 63.0, 74.0, 103.0, 83.0, 100.0, 87.0, 84.0, 75.0, 42.0, 30.0, 40.0, 23.0, 14.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.605712890625, -19.96142578125, -19.317138671875, -18.6728515625, -18.028564453125, -17.38427734375, -16.739990234375, -16.095703125, -15.451416015625, -14.80712890625, -14.162841796875, -13.5185546875, -12.874267578125, -12.22998046875, -11.585693359375, -10.94140625, -10.297119140625, -9.65283203125, -9.008544921875, -8.3642578125, -7.719970703125, -7.07568359375, -6.431396484375, -5.787109375, -5.142822265625, -4.49853515625, -3.854248046875, -3.2099609375, -2.565673828125, -1.92138671875, -1.277099609375, -0.6328125, 0.011474609375, 0.65576171875, 1.300048828125, 1.9443359375, 2.588623046875, 3.23291015625, 3.877197265625, 4.521484375, 5.165771484375, 5.81005859375, 6.454345703125, 7.0986328125, 7.742919921875, 8.38720703125, 9.031494140625, 9.67578125, 10.320068359375, 10.96435546875, 11.608642578125, 12.2529296875, 12.897216796875, 13.54150390625, 14.185791015625, 14.830078125, 15.474365234375, 16.11865234375, 16.762939453125, 17.4072265625, 18.051513671875, 18.69580078125, 19.340087890625, 19.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 10.0, 11.0, 11.0, 28.0, 37.0, 50.0, 75.0, 111.0, 155.0, 232.0, 366.0, 613.0, 1001.0, 1790.0, 3260.0, 6647.0, 13941.0, 30622.0, 67388.0, 147768.0, 296934.0, 255283.0, 119736.0, 54674.0, 24461.0, 11394.0, 5398.0, 2745.0, 1552.0, 816.0, 504.0, 303.0, 241.0, 112.0, 91.0, 61.0, 37.0, 25.0, 25.0, 15.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.65625, -46.2490234375, -44.841796875, -43.4345703125, -42.02734375, -40.6201171875, -39.212890625, -37.8056640625, -36.3984375, -34.9912109375, -33.583984375, -32.1767578125, -30.76953125, -29.3623046875, -27.955078125, -26.5478515625, -25.140625, -23.7333984375, -22.326171875, -20.9189453125, -19.51171875, -18.1044921875, -16.697265625, -15.2900390625, -13.8828125, -12.4755859375, -11.068359375, -9.6611328125, -8.25390625, -6.8466796875, -5.439453125, -4.0322265625, -2.625, -1.2177734375, 0.189453125, 1.5966796875, 3.00390625, 4.4111328125, 5.818359375, 7.2255859375, 8.6328125, 10.0400390625, 11.447265625, 12.8544921875, 14.26171875, 15.6689453125, 17.076171875, 18.4833984375, 19.890625, 21.2978515625, 22.705078125, 24.1123046875, 25.51953125, 26.9267578125, 28.333984375, 29.7412109375, 31.1484375, 32.5556640625, 33.962890625, 35.3701171875, 36.77734375, 38.1845703125, 39.591796875, 40.9990234375, 42.40625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 10.0, 5.0, 9.0, 15.0, 14.0, 12.0, 15.0, 18.0, 33.0, 23.0, 32.0, 31.0, 36.0, 41.0, 45.0, 42.0, 46.0, 31.0, 50.0, 45.0, 49.0, 43.0, 27.0, 39.0, 32.0, 40.0, 33.0, 21.0, 17.0, 16.0, 24.0, 20.0, 20.0, 13.0, 12.0, 6.0, 10.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.03125, -38.72265625, -37.4140625, -36.10546875, -34.796875, -33.48828125, -32.1796875, -30.87109375, -29.5625, -28.25390625, -26.9453125, -25.63671875, -24.328125, -23.01953125, -21.7109375, -20.40234375, -19.09375, -17.78515625, -16.4765625, -15.16796875, -13.859375, -12.55078125, -11.2421875, -9.93359375, -8.625, -7.31640625, -6.0078125, -4.69921875, -3.390625, -2.08203125, -0.7734375, 0.53515625, 1.84375, 3.15234375, 4.4609375, 5.76953125, 7.078125, 8.38671875, 9.6953125, 11.00390625, 12.3125, 13.62109375, 14.9296875, 16.23828125, 17.546875, 18.85546875, 20.1640625, 21.47265625, 22.78125, 24.08984375, 25.3984375, 26.70703125, 28.015625, 29.32421875, 30.6328125, 31.94140625, 33.25, 34.55859375, 35.8671875, 37.17578125, 38.484375, 39.79296875, 41.1015625, 42.41015625, 43.71875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 16.0, 24.0, 44.0, 72.0, 144.0, 319.0, 842.0, 2813.0, 13599.0, 111197.0, 660574.0, 228443.0, 24136.0, 4351.0, 1151.0, 428.0, 177.0, 91.0, 59.0, 22.0, 15.0, 11.0, 9.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.5595703125, -40.900390625, -39.2412109375, -37.58203125, -35.9228515625, -34.263671875, -32.6044921875, -30.9453125, -29.2861328125, -27.626953125, -25.9677734375, -24.30859375, -22.6494140625, -20.990234375, -19.3310546875, -17.671875, -16.0126953125, -14.353515625, -12.6943359375, -11.03515625, -9.3759765625, -7.716796875, -6.0576171875, -4.3984375, -2.7392578125, -1.080078125, 0.5791015625, 2.23828125, 3.8974609375, 5.556640625, 7.2158203125, 8.875, 10.5341796875, 12.193359375, 13.8525390625, 15.51171875, 17.1708984375, 18.830078125, 20.4892578125, 22.1484375, 23.8076171875, 25.466796875, 27.1259765625, 28.78515625, 30.4443359375, 32.103515625, 33.7626953125, 35.421875, 37.0810546875, 38.740234375, 40.3994140625, 42.05859375, 43.7177734375, 45.376953125, 47.0361328125, 48.6953125, 50.3544921875, 52.013671875, 53.6728515625, 55.33203125, 56.9912109375, 58.650390625, 60.3095703125, 61.96875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 8.0, 14.0, 17.0, 20.0, 27.0, 35.0, 38.0, 56.0, 54.0, 124.0, 133.0, 130.0, 77.0, 53.0, 48.0, 32.0, 33.0, 18.0, 19.0, 13.0, 9.0, 6.0, 1.0, 10.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00592803955078125, -0.005778014659881592, -0.005627989768981934, -0.005477964878082275, -0.005327939987182617, -0.005177915096282959, -0.005027890205383301, -0.004877865314483643, -0.004727840423583984, -0.004577815532684326, -0.004427790641784668, -0.00427776575088501, -0.0041277408599853516, -0.003977715969085693, -0.003827691078186035, -0.003677666187286377, -0.0035276412963867188, -0.0033776164054870605, -0.0032275915145874023, -0.003077566623687744, -0.002927541732788086, -0.0027775168418884277, -0.0026274919509887695, -0.0024774670600891113, -0.002327442169189453, -0.002177417278289795, -0.0020273923873901367, -0.0018773674964904785, -0.0017273426055908203, -0.0015773177146911621, -0.001427292823791504, -0.0012772679328918457, -0.0011272430419921875, -0.0009772181510925293, -0.0008271932601928711, -0.0006771683692932129, -0.0005271434783935547, -0.0003771185874938965, -0.00022709369659423828, -7.706880569458008e-05, 7.295608520507812e-05, 0.00022298097610473633, 0.00037300586700439453, 0.0005230307579040527, 0.0006730556488037109, 0.0008230805397033691, 0.0009731054306030273, 0.0011231303215026855, 0.0012731552124023438, 0.001423180103302002, 0.0015732049942016602, 0.0017232298851013184, 0.0018732547760009766, 0.0020232796669006348, 0.002173304557800293, 0.002323329448699951, 0.0024733543395996094, 0.0026233792304992676, 0.0027734041213989258, 0.002923429012298584, 0.003073453903198242, 0.0032234787940979004, 0.0033735036849975586, 0.003523528575897217, 0.003673553466796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 23.0, 19.0, 38.0, 54.0, 102.0, 130.0, 229.0, 359.0, 595.0, 1108.0, 2135.0, 4265.0, 10270.0, 28062.0, 94719.0, 309473.0, 390105.0, 140609.0, 40766.0, 13994.0, 5667.0, 2640.0, 1301.0, 708.0, 431.0, 248.0, 158.0, 102.0, 68.0, 44.0, 18.0, 23.0, 18.0, 16.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-27.078125, -26.236083984375, -25.39404296875, -24.552001953125, -23.7099609375, -22.867919921875, -22.02587890625, -21.183837890625, -20.341796875, -19.499755859375, -18.65771484375, -17.815673828125, -16.9736328125, -16.131591796875, -15.28955078125, -14.447509765625, -13.60546875, -12.763427734375, -11.92138671875, -11.079345703125, -10.2373046875, -9.395263671875, -8.55322265625, -7.711181640625, -6.869140625, -6.027099609375, -5.18505859375, -4.343017578125, -3.5009765625, -2.658935546875, -1.81689453125, -0.974853515625, -0.1328125, 0.709228515625, 1.55126953125, 2.393310546875, 3.2353515625, 4.077392578125, 4.91943359375, 5.761474609375, 6.603515625, 7.445556640625, 8.28759765625, 9.129638671875, 9.9716796875, 10.813720703125, 11.65576171875, 12.497802734375, 13.33984375, 14.181884765625, 15.02392578125, 15.865966796875, 16.7080078125, 17.550048828125, 18.39208984375, 19.234130859375, 20.076171875, 20.918212890625, 21.76025390625, 22.602294921875, 23.4443359375, 24.286376953125, 25.12841796875, 25.970458984375, 26.8125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 2.0, 8.0, 8.0, 22.0, 18.0, 26.0, 30.0, 45.0, 46.0, 66.0, 80.0, 107.0, 97.0, 83.0, 83.0, 69.0, 41.0, 46.0, 24.0, 20.0, 23.0, 16.0, 11.0, 3.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.564697265625, -20.83251953125, -20.100341796875, -19.3681640625, -18.635986328125, -17.90380859375, -17.171630859375, -16.439453125, -15.707275390625, -14.97509765625, -14.242919921875, -13.5107421875, -12.778564453125, -12.04638671875, -11.314208984375, -10.58203125, -9.849853515625, -9.11767578125, -8.385498046875, -7.6533203125, -6.921142578125, -6.18896484375, -5.456787109375, -4.724609375, -3.992431640625, -3.26025390625, -2.528076171875, -1.7958984375, -1.063720703125, -0.33154296875, 0.400634765625, 1.1328125, 1.864990234375, 2.59716796875, 3.329345703125, 4.0615234375, 4.793701171875, 5.52587890625, 6.258056640625, 6.990234375, 7.722412109375, 8.45458984375, 9.186767578125, 9.9189453125, 10.651123046875, 11.38330078125, 12.115478515625, 12.84765625, 13.579833984375, 14.31201171875, 15.044189453125, 15.7763671875, 16.508544921875, 17.24072265625, 17.972900390625, 18.705078125, 19.437255859375, 20.16943359375, 20.901611328125, 21.6337890625, 22.365966796875, 23.09814453125, 23.830322265625, 24.5625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 15.0, 32.0, 33.0, 35.0, 49.0, 50.0, 68.0, 65.0, 84.0, 110.0, 67.0, 69.0, 65.0, 56.0, 41.0, 35.0, 25.0, 22.0, 16.0, 11.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-231.17059326171875, -222.47744750976562, -213.7843017578125, -205.09115600585938, -196.39801025390625, -187.70486450195312, -179.01171875, -170.31857299804688, -161.62542724609375, -152.93228149414062, -144.2391357421875, -135.54598999023438, -126.85284423828125, -118.15969848632812, -109.46656036376953, -100.7734146118164, -92.08027648925781, -83.38713073730469, -74.69398498535156, -66.00083923339844, -57.30769729614258, -48.61455154418945, -39.921409606933594, -31.22826385498047, -22.535118103027344, -13.841973304748535, -5.148828506469727, 3.5443153381347656, 12.23746109008789, 20.930606842041016, 29.623748779296875, 38.31689453125, 47.010040283203125, 55.70318603515625, 64.39633178710938, 73.0894775390625, 81.78262329101562, 90.47576904296875, 99.16890716552734, 107.86205291748047, 116.5551986694336, 125.24834442138672, 133.9414825439453, 142.63462829589844, 151.32777404785156, 160.0209197998047, 168.7140655517578, 177.40721130371094, 186.10035705566406, 194.7935028076172, 203.4866485595703, 212.17979431152344, 220.87294006347656, 229.5660858154297, 238.25921630859375, 246.95236206054688, 255.6455078125, 264.3386535644531, 273.03179931640625, 281.7249450683594, 290.4180908203125, 299.1112365722656, 307.80438232421875, 316.4975280761719, 325.190673828125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 12.0, 10.0, 14.0, 14.0, 17.0, 19.0, 24.0, 21.0, 28.0, 27.0, 29.0, 44.0, 39.0, 50.0, 47.0, 49.0, 43.0, 42.0, 52.0, 39.0, 43.0, 44.0, 38.0, 25.0, 33.0, 23.0, 32.0, 15.0, 16.0, 18.0, 16.0, 11.0, 12.0, 11.0, 5.0, 6.0, 1.0, 4.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.33224487304688, -239.5975799560547, -231.8629150390625, -224.1282501220703, -216.39358520507812, -208.65892028808594, -200.92425537109375, -193.18960571289062, -185.45492553710938, -177.7202606201172, -169.985595703125, -162.2509307861328, -154.51626586914062, -146.78160095214844, -139.04693603515625, -131.31228637695312, -123.57762145996094, -115.84295654296875, -108.10829162597656, -100.37362670898438, -92.63896179199219, -84.904296875, -77.16963958740234, -69.43497467041016, -61.70030975341797, -53.96564483642578, -46.230979919433594, -38.49631881713867, -30.761653900146484, -23.026988983154297, -15.292327880859375, -7.5576629638671875, 0.1770172119140625, 7.911681175231934, 15.646345138549805, 23.38100814819336, 31.115673065185547, 38.850337982177734, 46.584999084472656, 54.319664001464844, 62.05432891845703, 69.78899383544922, 77.5236587524414, 85.25831604003906, 92.99298095703125, 100.72764587402344, 108.46231079101562, 116.19697570800781, 123.931640625, 131.6663055419922, 139.40097045898438, 147.13563537597656, 154.87030029296875, 162.60496520996094, 170.33963012695312, 178.07427978515625, 185.8089599609375, 193.5436248779297, 201.27828979492188, 209.01295471191406, 216.74761962890625, 224.48228454589844, 232.21694946289062, 239.95159912109375, 247.68626403808594]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 13.0, 14.0, 27.0, 38.0, 61.0, 95.0, 156.0, 275.0, 603.0, 1429.0, 4248.0, 21747.0, 704500.0, 3425192.0, 27719.0, 5160.0, 1566.0, 645.0, 277.0, 181.0, 81.0, 71.0, 46.0, 41.0, 21.0, 12.0, 15.0, 4.0, 6.0, 11.0, 2.0, 5.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.625, -202.154296875, -194.68359375, -187.212890625, -179.7421875, -172.271484375, -164.80078125, -157.330078125, -149.859375, -142.388671875, -134.91796875, -127.447265625, -119.9765625, -112.505859375, -105.03515625, -97.564453125, -90.09375, -82.623046875, -75.15234375, -67.681640625, -60.2109375, -52.740234375, -45.26953125, -37.798828125, -30.328125, -22.857421875, -15.38671875, -7.916015625, -0.4453125, 7.025390625, 14.49609375, 21.966796875, 29.4375, 36.908203125, 44.37890625, 51.849609375, 59.3203125, 66.791015625, 74.26171875, 81.732421875, 89.203125, 96.673828125, 104.14453125, 111.615234375, 119.0859375, 126.556640625, 134.02734375, 141.498046875, 148.96875, 156.439453125, 163.91015625, 171.380859375, 178.8515625, 186.322265625, 193.79296875, 201.263671875, 208.734375, 216.205078125, 223.67578125, 231.146484375, 238.6171875, 246.087890625, 253.55859375, 261.029296875, 268.5]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 14.0, 13.0, 32.0, 33.0, 43.0, 51.0, 69.0, 100.0, 81.0, 108.0, 94.0, 69.0, 67.0, 60.0, 43.0, 40.0, 25.0, 18.0, 12.0, 13.0, 1.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.5, -20.8583984375, -20.216796875, -19.5751953125, -18.93359375, -18.2919921875, -17.650390625, -17.0087890625, -16.3671875, -15.7255859375, -15.083984375, -14.4423828125, -13.80078125, -13.1591796875, -12.517578125, -11.8759765625, -11.234375, -10.5927734375, -9.951171875, -9.3095703125, -8.66796875, -8.0263671875, -7.384765625, -6.7431640625, -6.1015625, -5.4599609375, -4.818359375, -4.1767578125, -3.53515625, -2.8935546875, -2.251953125, -1.6103515625, -0.96875, -0.3271484375, 0.314453125, 0.9560546875, 1.59765625, 2.2392578125, 2.880859375, 3.5224609375, 4.1640625, 4.8056640625, 5.447265625, 6.0888671875, 6.73046875, 7.3720703125, 8.013671875, 8.6552734375, 9.296875, 9.9384765625, 10.580078125, 11.2216796875, 11.86328125, 12.5048828125, 13.146484375, 13.7880859375, 14.4296875, 15.0712890625, 15.712890625, 16.3544921875, 16.99609375, 17.6376953125, 18.279296875, 18.9208984375, 19.5625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 2.0, 9.0, 6.0, 9.0, 19.0, 11.0, 13.0, 20.0, 30.0, 44.0, 76.0, 137.0, 245.0, 429.0, 869.0, 1857.0, 4501.0, 11988.0, 38718.0, 180997.0, 3156470.0, 673631.0, 87048.0, 22948.0, 8061.0, 3177.0, 1372.0, 712.0, 327.0, 200.0, 108.0, 75.0, 52.0, 38.0, 14.0, 12.0, 12.0, 6.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-89.25, -86.52734375, -83.8046875, -81.08203125, -78.359375, -75.63671875, -72.9140625, -70.19140625, -67.46875, -64.74609375, -62.0234375, -59.30078125, -56.578125, -53.85546875, -51.1328125, -48.41015625, -45.6875, -42.96484375, -40.2421875, -37.51953125, -34.796875, -32.07421875, -29.3515625, -26.62890625, -23.90625, -21.18359375, -18.4609375, -15.73828125, -13.015625, -10.29296875, -7.5703125, -4.84765625, -2.125, 0.59765625, 3.3203125, 6.04296875, 8.765625, 11.48828125, 14.2109375, 16.93359375, 19.65625, 22.37890625, 25.1015625, 27.82421875, 30.546875, 33.26953125, 35.9921875, 38.71484375, 41.4375, 44.16015625, 46.8828125, 49.60546875, 52.328125, 55.05078125, 57.7734375, 60.49609375, 63.21875, 65.94140625, 68.6640625, 71.38671875, 74.109375, 76.83203125, 79.5546875, 82.27734375, 85.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 35.0, 35.0, 60.0, 91.0, 131.0, 183.0, 346.0, 1027.0, 1036.0, 350.0, 206.0, 128.0, 90.0, 63.0, 41.0, 26.0, 27.0, 26.0, 19.0, 17.0, 9.0, 4.0, 7.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.21875, -18.507080078125, -17.79541015625, -17.083740234375, -16.3720703125, -15.660400390625, -14.94873046875, -14.237060546875, -13.525390625, -12.813720703125, -12.10205078125, -11.390380859375, -10.6787109375, -9.967041015625, -9.25537109375, -8.543701171875, -7.83203125, -7.120361328125, -6.40869140625, -5.697021484375, -4.9853515625, -4.273681640625, -3.56201171875, -2.850341796875, -2.138671875, -1.427001953125, -0.71533203125, -0.003662109375, 0.7080078125, 1.419677734375, 2.13134765625, 2.843017578125, 3.5546875, 4.266357421875, 4.97802734375, 5.689697265625, 6.4013671875, 7.113037109375, 7.82470703125, 8.536376953125, 9.248046875, 9.959716796875, 10.67138671875, 11.383056640625, 12.0947265625, 12.806396484375, 13.51806640625, 14.229736328125, 14.94140625, 15.653076171875, 16.36474609375, 17.076416015625, 17.7880859375, 18.499755859375, 19.21142578125, 19.923095703125, 20.634765625, 21.346435546875, 22.05810546875, 22.769775390625, 23.4814453125, 24.193115234375, 24.90478515625, 25.616455078125, 26.328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 25.0, 45.0, 50.0, 79.0, 121.0, 123.0, 127.0, 92.0, 94.0, 65.0, 52.0, 30.0, 29.0, 10.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.47479248046875, -167.94744873046875, -161.42010498046875, -154.8927459716797, -148.3654022216797, -141.8380584716797, -135.3107147216797, -128.78335571289062, -122.25601196289062, -115.72866821289062, -109.2013168334961, -102.6739730834961, -96.14662170410156, -89.61927795410156, -83.09193420410156, -76.56458282470703, -70.03723907470703, -63.509891510009766, -56.9825439453125, -50.4552001953125, -43.92784881591797, -37.40050506591797, -30.873157501220703, -24.345809936523438, -17.818462371826172, -11.291114807128906, -4.763768196105957, 1.7635784149169922, 8.290925979614258, 14.81827163696289, 21.345619201660156, 27.872966766357422, 34.40031433105469, 40.92766189575195, 47.45500946044922, 53.98235321044922, 60.50970458984375, 67.03704833984375, 73.56439208984375, 80.09174346923828, 86.61909484863281, 93.14643859863281, 99.67378997802734, 106.20113372802734, 112.72848510742188, 119.25582885742188, 125.78317260742188, 132.31051635742188, 138.83786010742188, 145.36520385742188, 151.89254760742188, 158.41990661621094, 164.94725036621094, 171.47459411621094, 178.00193786621094, 184.529296875, 191.056640625, 197.583984375, 204.111328125, 210.63868713378906, 217.16603088378906, 223.69337463378906, 230.22071838378906, 236.74807739257812, 243.27542114257812]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 5.0, 9.0, 6.0, 9.0, 10.0, 19.0, 19.0, 24.0, 28.0, 28.0, 44.0, 31.0, 41.0, 46.0, 56.0, 61.0, 52.0, 43.0, 49.0, 45.0, 51.0, 33.0, 37.0, 36.0, 29.0, 29.0, 33.0, 25.0, 19.0, 17.0, 12.0, 15.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-113.060546875, -109.63899230957031, -106.21743774414062, -102.79588317871094, -99.37432861328125, -95.95277404785156, -92.5312271118164, -89.10967254638672, -85.68811798095703, -82.26656341552734, -78.84500885009766, -75.42345428466797, -72.00190734863281, -68.58035278320312, -65.15879821777344, -61.73724365234375, -58.31568908691406, -54.894134521484375, -51.47257995605469, -48.051029205322266, -44.62947463989258, -41.20792007446289, -37.78636932373047, -34.36481475830078, -30.943260192871094, -27.521705627441406, -24.10015296936035, -20.678600311279297, -17.25704574584961, -13.835491180419922, -10.413938522338867, -6.9923858642578125, -3.570831298828125, -0.1492776870727539, 3.272275924682617, 6.693829536437988, 10.11538314819336, 13.536937713623047, 16.9584903717041, 20.380043029785156, 23.801597595214844, 27.22315216064453, 30.644704818725586, 34.06625747680664, 37.48781204223633, 40.909366607666016, 44.33091735839844, 47.752471923828125, 51.17402648925781, 54.5955810546875, 58.01713562011719, 61.43868637084961, 64.86024475097656, 68.28179931640625, 71.7033462524414, 75.1249008178711, 78.54645538330078, 81.96800994873047, 85.38956451416016, 88.81111907958984, 92.232666015625, 95.65422058105469, 99.07577514648438, 102.49732971191406, 105.91888427734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 12.0, 19.0, 13.0, 29.0, 33.0, 42.0, 49.0, 74.0, 109.0, 193.0, 281.0, 503.0, 973.0, 1964.0, 4976.0, 15934.0, 65921.0, 330861.0, 486440.0, 104416.0, 23462.0, 6903.0, 2573.0, 1154.0, 609.0, 331.0, 228.0, 130.0, 100.0, 51.0, 44.0, 33.0, 27.0, 15.0, 11.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-134.75, -130.6845703125, -126.619140625, -122.5537109375, -118.48828125, -114.4228515625, -110.357421875, -106.2919921875, -102.2265625, -98.1611328125, -94.095703125, -90.0302734375, -85.96484375, -81.8994140625, -77.833984375, -73.7685546875, -69.703125, -65.6376953125, -61.572265625, -57.5068359375, -53.44140625, -49.3759765625, -45.310546875, -41.2451171875, -37.1796875, -33.1142578125, -29.048828125, -24.9833984375, -20.91796875, -16.8525390625, -12.787109375, -8.7216796875, -4.65625, -0.5908203125, 3.474609375, 7.5400390625, 11.60546875, 15.6708984375, 19.736328125, 23.8017578125, 27.8671875, 31.9326171875, 35.998046875, 40.0634765625, 44.12890625, 48.1943359375, 52.259765625, 56.3251953125, 60.390625, 64.4560546875, 68.521484375, 72.5869140625, 76.65234375, 80.7177734375, 84.783203125, 88.8486328125, 92.9140625, 96.9794921875, 101.044921875, 105.1103515625, 109.17578125, 113.2412109375, 117.306640625, 121.3720703125, 125.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 13.0, 14.0, 17.0, 25.0, 30.0, 31.0, 53.0, 72.0, 88.0, 80.0, 89.0, 86.0, 102.0, 76.0, 61.0, 41.0, 36.0, 21.0, 29.0, 14.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.796875, -21.151123046875, -20.50537109375, -19.859619140625, -19.2138671875, -18.568115234375, -17.92236328125, -17.276611328125, -16.630859375, -15.985107421875, -15.33935546875, -14.693603515625, -14.0478515625, -13.402099609375, -12.75634765625, -12.110595703125, -11.46484375, -10.819091796875, -10.17333984375, -9.527587890625, -8.8818359375, -8.236083984375, -7.59033203125, -6.944580078125, -6.298828125, -5.653076171875, -5.00732421875, -4.361572265625, -3.7158203125, -3.070068359375, -2.42431640625, -1.778564453125, -1.1328125, -0.487060546875, 0.15869140625, 0.804443359375, 1.4501953125, 2.095947265625, 2.74169921875, 3.387451171875, 4.033203125, 4.678955078125, 5.32470703125, 5.970458984375, 6.6162109375, 7.261962890625, 7.90771484375, 8.553466796875, 9.19921875, 9.844970703125, 10.49072265625, 11.136474609375, 11.7822265625, 12.427978515625, 13.07373046875, 13.719482421875, 14.365234375, 15.010986328125, 15.65673828125, 16.302490234375, 16.9482421875, 17.593994140625, 18.23974609375, 18.885498046875, 19.53125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 15.0, 14.0, 17.0, 23.0, 32.0, 47.0, 53.0, 50.0, 91.0, 119.0, 157.0, 198.0, 300.0, 488.0, 679.0, 1117.0, 1952.0, 3620.0, 7470.0, 15955.0, 35230.0, 81191.0, 184184.0, 327392.0, 214350.0, 95256.0, 41452.0, 18349.0, 8520.0, 4206.0, 2262.0, 1226.0, 802.0, 471.0, 352.0, 232.0, 163.0, 129.0, 108.0, 59.0, 53.0, 43.0, 23.0, 22.0, 18.0, 20.0, 14.0, 5.0, 7.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-43.96875, -42.5771484375, -41.185546875, -39.7939453125, -38.40234375, -37.0107421875, -35.619140625, -34.2275390625, -32.8359375, -31.4443359375, -30.052734375, -28.6611328125, -27.26953125, -25.8779296875, -24.486328125, -23.0947265625, -21.703125, -20.3115234375, -18.919921875, -17.5283203125, -16.13671875, -14.7451171875, -13.353515625, -11.9619140625, -10.5703125, -9.1787109375, -7.787109375, -6.3955078125, -5.00390625, -3.6123046875, -2.220703125, -0.8291015625, 0.5625, 1.9541015625, 3.345703125, 4.7373046875, 6.12890625, 7.5205078125, 8.912109375, 10.3037109375, 11.6953125, 13.0869140625, 14.478515625, 15.8701171875, 17.26171875, 18.6533203125, 20.044921875, 21.4365234375, 22.828125, 24.2197265625, 25.611328125, 27.0029296875, 28.39453125, 29.7861328125, 31.177734375, 32.5693359375, 33.9609375, 35.3525390625, 36.744140625, 38.1357421875, 39.52734375, 40.9189453125, 42.310546875, 43.7021484375, 45.09375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 6.0, 9.0, 12.0, 12.0, 20.0, 22.0, 22.0, 20.0, 24.0, 19.0, 35.0, 38.0, 37.0, 39.0, 44.0, 35.0, 62.0, 44.0, 37.0, 37.0, 35.0, 40.0, 27.0, 31.0, 36.0, 27.0, 27.0, 25.0, 29.0, 21.0, 14.0, 12.0, 15.0, 9.0, 9.0, 10.0, 10.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-43.6875, -42.39794921875, -41.1083984375, -39.81884765625, -38.529296875, -37.23974609375, -35.9501953125, -34.66064453125, -33.37109375, -32.08154296875, -30.7919921875, -29.50244140625, -28.212890625, -26.92333984375, -25.6337890625, -24.34423828125, -23.0546875, -21.76513671875, -20.4755859375, -19.18603515625, -17.896484375, -16.60693359375, -15.3173828125, -14.02783203125, -12.73828125, -11.44873046875, -10.1591796875, -8.86962890625, -7.580078125, -6.29052734375, -5.0009765625, -3.71142578125, -2.421875, -1.13232421875, 0.1572265625, 1.44677734375, 2.736328125, 4.02587890625, 5.3154296875, 6.60498046875, 7.89453125, 9.18408203125, 10.4736328125, 11.76318359375, 13.052734375, 14.34228515625, 15.6318359375, 16.92138671875, 18.2109375, 19.50048828125, 20.7900390625, 22.07958984375, 23.369140625, 24.65869140625, 25.9482421875, 27.23779296875, 28.52734375, 29.81689453125, 31.1064453125, 32.39599609375, 33.685546875, 34.97509765625, 36.2646484375, 37.55419921875, 38.84375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 26.0, 28.0, 44.0, 69.0, 154.0, 262.0, 551.0, 1308.0, 3106.0, 8829.0, 29028.0, 115661.0, 416514.0, 348925.0, 88900.0, 23030.0, 7278.0, 2641.0, 1171.0, 477.0, 280.0, 117.0, 59.0, 34.0, 15.0, 14.0, 14.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.34375, -25.36474609375, -24.3857421875, -23.40673828125, -22.427734375, -21.44873046875, -20.4697265625, -19.49072265625, -18.51171875, -17.53271484375, -16.5537109375, -15.57470703125, -14.595703125, -13.61669921875, -12.6376953125, -11.65869140625, -10.6796875, -9.70068359375, -8.7216796875, -7.74267578125, -6.763671875, -5.78466796875, -4.8056640625, -3.82666015625, -2.84765625, -1.86865234375, -0.8896484375, 0.08935546875, 1.068359375, 2.04736328125, 3.0263671875, 4.00537109375, 4.984375, 5.96337890625, 6.9423828125, 7.92138671875, 8.900390625, 9.87939453125, 10.8583984375, 11.83740234375, 12.81640625, 13.79541015625, 14.7744140625, 15.75341796875, 16.732421875, 17.71142578125, 18.6904296875, 19.66943359375, 20.6484375, 21.62744140625, 22.6064453125, 23.58544921875, 24.564453125, 25.54345703125, 26.5224609375, 27.50146484375, 28.48046875, 29.45947265625, 30.4384765625, 31.41748046875, 32.396484375, 33.37548828125, 34.3544921875, 35.33349609375, 36.3125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 20.0, 15.0, 29.0, 31.0, 30.0, 64.0, 72.0, 141.0, 141.0, 119.0, 76.0, 53.0, 36.0, 29.0, 30.0, 15.0, 20.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.004067182540893555, -0.003907680511474609, -0.003748178482055664, -0.0035886764526367188, -0.0034291744232177734, -0.003269672393798828, -0.003110170364379883, -0.0029506683349609375, -0.002791166305541992, -0.002631664276123047, -0.0024721622467041016, -0.0023126602172851562, -0.002153158187866211, -0.0019936561584472656, -0.0018341541290283203, -0.001674652099609375, -0.0015151500701904297, -0.0013556480407714844, -0.001196146011352539, -0.0010366439819335938, -0.0008771419525146484, -0.0007176399230957031, -0.0005581378936767578, -0.0003986358642578125, -0.0002391338348388672, -7.963180541992188e-05, 7.987022399902344e-05, 0.00023937225341796875, 0.00039887428283691406, 0.0005583763122558594, 0.0007178783416748047, 0.00087738037109375, 0.0010368824005126953, 0.0011963844299316406, 0.001355886459350586, 0.0015153884887695312, 0.0016748905181884766, 0.0018343925476074219, 0.001993894577026367, 0.0021533966064453125, 0.002312898635864258, 0.002472400665283203, 0.0026319026947021484, 0.0027914047241210938, 0.002950906753540039, 0.0031104087829589844, 0.0032699108123779297, 0.003429412841796875, 0.0035889148712158203, 0.0037484169006347656, 0.003907918930053711, 0.004067420959472656, 0.0042269229888916016, 0.004386425018310547, 0.004545927047729492, 0.0047054290771484375, 0.004864931106567383, 0.005024433135986328, 0.0051839351654052734, 0.005343437194824219, 0.005502939224243164, 0.005662441253662109, 0.005821943283081055, 0.0059814453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 9.0, 14.0, 15.0, 33.0, 33.0, 71.0, 117.0, 208.0, 333.0, 684.0, 1467.0, 3719.0, 10385.0, 37095.0, 161655.0, 497249.0, 254508.0, 57148.0, 15175.0, 4819.0, 1873.0, 876.0, 461.0, 238.0, 128.0, 83.0, 56.0, 31.0, 30.0, 8.0, 14.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.3125, -35.32177734375, -34.3310546875, -33.34033203125, -32.349609375, -31.35888671875, -30.3681640625, -29.37744140625, -28.38671875, -27.39599609375, -26.4052734375, -25.41455078125, -24.423828125, -23.43310546875, -22.4423828125, -21.45166015625, -20.4609375, -19.47021484375, -18.4794921875, -17.48876953125, -16.498046875, -15.50732421875, -14.5166015625, -13.52587890625, -12.53515625, -11.54443359375, -10.5537109375, -9.56298828125, -8.572265625, -7.58154296875, -6.5908203125, -5.60009765625, -4.609375, -3.61865234375, -2.6279296875, -1.63720703125, -0.646484375, 0.34423828125, 1.3349609375, 2.32568359375, 3.31640625, 4.30712890625, 5.2978515625, 6.28857421875, 7.279296875, 8.27001953125, 9.2607421875, 10.25146484375, 11.2421875, 12.23291015625, 13.2236328125, 14.21435546875, 15.205078125, 16.19580078125, 17.1865234375, 18.17724609375, 19.16796875, 20.15869140625, 21.1494140625, 22.14013671875, 23.130859375, 24.12158203125, 25.1123046875, 26.10302734375, 27.09375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 8.0, 15.0, 14.0, 23.0, 32.0, 34.0, 46.0, 44.0, 56.0, 55.0, 69.0, 67.0, 67.0, 59.0, 57.0, 57.0, 53.0, 49.0, 32.0, 26.0, 21.0, 14.0, 12.0, 11.0, 9.0, 5.0, 7.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.471435546875, -17.91162109375, -17.351806640625, -16.7919921875, -16.232177734375, -15.67236328125, -15.112548828125, -14.552734375, -13.992919921875, -13.43310546875, -12.873291015625, -12.3134765625, -11.753662109375, -11.19384765625, -10.634033203125, -10.07421875, -9.514404296875, -8.95458984375, -8.394775390625, -7.8349609375, -7.275146484375, -6.71533203125, -6.155517578125, -5.595703125, -5.035888671875, -4.47607421875, -3.916259765625, -3.3564453125, -2.796630859375, -2.23681640625, -1.677001953125, -1.1171875, -0.557373046875, 0.00244140625, 0.562255859375, 1.1220703125, 1.681884765625, 2.24169921875, 2.801513671875, 3.361328125, 3.921142578125, 4.48095703125, 5.040771484375, 5.6005859375, 6.160400390625, 6.72021484375, 7.280029296875, 7.83984375, 8.399658203125, 8.95947265625, 9.519287109375, 10.0791015625, 10.638916015625, 11.19873046875, 11.758544921875, 12.318359375, 12.878173828125, 13.43798828125, 13.997802734375, 14.5576171875, 15.117431640625, 15.67724609375, 16.237060546875, 16.796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 15.0, 32.0, 34.0, 53.0, 65.0, 92.0, 112.0, 103.0, 95.0, 112.0, 82.0, 62.0, 48.0, 24.0, 24.0, 18.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.0211181640625, -492.9909362792969, -480.96075439453125, -468.9305419921875, -456.9003601074219, -444.87017822265625, -432.8399963378906, -420.809814453125, -408.77960205078125, -396.7494201660156, -384.71923828125, -372.68902587890625, -360.6588439941406, -348.628662109375, -336.5984802246094, -324.56829833984375, -312.5380859375, -300.5079040527344, -288.47772216796875, -276.447509765625, -264.4173278808594, -252.38714599609375, -240.35696411132812, -228.32676696777344, -216.29660034179688, -204.26641845703125, -192.23622131347656, -180.20603942871094, -168.17584228515625, -156.14566040039062, -144.115478515625, -132.0852813720703, -120.05508422851562, -108.02489471435547, -95.99470520019531, -83.96452331542969, -71.934326171875, -59.90414047241211, -47.87395477294922, -35.84376525878906, -23.813575744628906, -11.783387184143066, 0.24680137634277344, 12.276988983154297, 24.307178497314453, 36.33736801147461, 48.3675537109375, 60.397743225097656, 72.42793273925781, 84.45812225341797, 96.48831176757812, 108.51849365234375, 120.54869079589844, 132.57887268066406, 144.60906982421875, 156.63925170898438, 168.66943359375, 180.69961547851562, 192.7298126220703, 204.75999450683594, 216.79019165039062, 228.82037353515625, 240.85055541992188, 252.88075256347656, 264.91094970703125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 7.0, 2.0, 2.0, 8.0, 8.0, 6.0, 7.0, 13.0, 15.0, 16.0, 22.0, 23.0, 24.0, 28.0, 28.0, 49.0, 43.0, 40.0, 30.0, 46.0, 56.0, 36.0, 47.0, 52.0, 44.0, 48.0, 32.0, 34.0, 38.0, 37.0, 31.0, 25.0, 28.0, 20.0, 10.0, 14.0, 13.0, 12.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.45175170898438, -184.69760131835938, -176.9434356689453, -169.1892852783203, -161.4351348876953, -153.68096923828125, -145.92681884765625, -138.17266845703125, -130.4185028076172, -122.66434478759766, -114.91019439697266, -107.15603637695312, -99.4018783569336, -91.64772033691406, -83.89356994628906, -76.13941192626953, -68.38526153564453, -60.631107330322266, -52.876949310302734, -45.12279510498047, -37.36863708496094, -29.614482879638672, -21.860328674316406, -14.106170654296875, -6.352016448974609, 1.4021391868591309, 9.156294822692871, 16.910449981689453, 24.66460609436035, 32.41876220703125, 40.172916412353516, 47.92707443237305, 55.68122863769531, 63.43538284301758, 71.18953704833984, 78.94369506835938, 86.6978530883789, 94.45201110839844, 102.20616149902344, 109.96031951904297, 117.7144775390625, 125.46863555908203, 133.22279357910156, 140.97694396972656, 148.73109436035156, 156.48526000976562, 164.23941040039062, 171.99356079101562, 179.74771118164062, 187.50186157226562, 195.2560272216797, 203.0101776123047, 210.7643280029297, 218.51849365234375, 226.27264404296875, 234.02679443359375, 241.7809600830078, 249.5351104736328, 257.2892761230469, 265.0434265136719, 272.7975769042969, 280.5517272949219, 288.305908203125, 296.06005859375, 303.814208984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 12.0, 7.0, 16.0, 25.0, 33.0, 51.0, 74.0, 103.0, 194.0, 408.0, 809.0, 2000.0, 6021.0, 27694.0, 427985.0, 3652438.0, 61417.0, 9781.0, 2902.0, 1113.0, 507.0, 229.0, 167.0, 102.0, 54.0, 29.0, 21.0, 22.0, 10.0, 11.0, 7.0, 8.0, 7.0, 10.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-169.125, -162.904296875, -156.68359375, -150.462890625, -144.2421875, -138.021484375, -131.80078125, -125.580078125, -119.359375, -113.138671875, -106.91796875, -100.697265625, -94.4765625, -88.255859375, -82.03515625, -75.814453125, -69.59375, -63.373046875, -57.15234375, -50.931640625, -44.7109375, -38.490234375, -32.26953125, -26.048828125, -19.828125, -13.607421875, -7.38671875, -1.166015625, 5.0546875, 11.275390625, 17.49609375, 23.716796875, 29.9375, 36.158203125, 42.37890625, 48.599609375, 54.8203125, 61.041015625, 67.26171875, 73.482421875, 79.703125, 85.923828125, 92.14453125, 98.365234375, 104.5859375, 110.806640625, 117.02734375, 123.248046875, 129.46875, 135.689453125, 141.91015625, 148.130859375, 154.3515625, 160.572265625, 166.79296875, 173.013671875, 179.234375, 185.455078125, 191.67578125, 197.896484375, 204.1171875, 210.337890625, 216.55859375, 222.779296875, 229.0]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 7.0, 13.0, 19.0, 23.0, 27.0, 33.0, 53.0, 76.0, 78.0, 81.0, 93.0, 91.0, 70.0, 64.0, 73.0, 48.0, 42.0, 26.0, 32.0, 13.0, 16.0, 8.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.671875, -20.0439453125, -19.416015625, -18.7880859375, -18.16015625, -17.5322265625, -16.904296875, -16.2763671875, -15.6484375, -15.0205078125, -14.392578125, -13.7646484375, -13.13671875, -12.5087890625, -11.880859375, -11.2529296875, -10.625, -9.9970703125, -9.369140625, -8.7412109375, -8.11328125, -7.4853515625, -6.857421875, -6.2294921875, -5.6015625, -4.9736328125, -4.345703125, -3.7177734375, -3.08984375, -2.4619140625, -1.833984375, -1.2060546875, -0.578125, 0.0498046875, 0.677734375, 1.3056640625, 1.93359375, 2.5615234375, 3.189453125, 3.8173828125, 4.4453125, 5.0732421875, 5.701171875, 6.3291015625, 6.95703125, 7.5849609375, 8.212890625, 8.8408203125, 9.46875, 10.0966796875, 10.724609375, 11.3525390625, 11.98046875, 12.6083984375, 13.236328125, 13.8642578125, 14.4921875, 15.1201171875, 15.748046875, 16.3759765625, 17.00390625, 17.6318359375, 18.259765625, 18.8876953125, 19.515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 9.0, 13.0, 11.0, 29.0, 27.0, 31.0, 52.0, 51.0, 88.0, 99.0, 172.0, 236.0, 404.0, 816.0, 1963.0, 6139.0, 27001.0, 221411.0, 3587066.0, 304115.0, 33067.0, 7202.0, 2117.0, 856.0, 411.0, 251.0, 158.0, 111.0, 93.0, 61.0, 56.0, 37.0, 31.0, 15.0, 15.0, 14.0, 15.0, 15.0, 1.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.625, -126.732421875, -122.83984375, -118.947265625, -115.0546875, -111.162109375, -107.26953125, -103.376953125, -99.484375, -95.591796875, -91.69921875, -87.806640625, -83.9140625, -80.021484375, -76.12890625, -72.236328125, -68.34375, -64.451171875, -60.55859375, -56.666015625, -52.7734375, -48.880859375, -44.98828125, -41.095703125, -37.203125, -33.310546875, -29.41796875, -25.525390625, -21.6328125, -17.740234375, -13.84765625, -9.955078125, -6.0625, -2.169921875, 1.72265625, 5.615234375, 9.5078125, 13.400390625, 17.29296875, 21.185546875, 25.078125, 28.970703125, 32.86328125, 36.755859375, 40.6484375, 44.541015625, 48.43359375, 52.326171875, 56.21875, 60.111328125, 64.00390625, 67.896484375, 71.7890625, 75.681640625, 79.57421875, 83.466796875, 87.359375, 91.251953125, 95.14453125, 99.037109375, 102.9296875, 106.822265625, 110.71484375, 114.607421875, 118.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 9.0, 1.0, 22.0, 24.0, 50.0, 76.0, 234.0, 792.0, 2004.0, 494.0, 177.0, 83.0, 53.0, 26.0, 15.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.8125, -56.7373046875, -54.662109375, -52.5869140625, -50.51171875, -48.4365234375, -46.361328125, -44.2861328125, -42.2109375, -40.1357421875, -38.060546875, -35.9853515625, -33.91015625, -31.8349609375, -29.759765625, -27.6845703125, -25.609375, -23.5341796875, -21.458984375, -19.3837890625, -17.30859375, -15.2333984375, -13.158203125, -11.0830078125, -9.0078125, -6.9326171875, -4.857421875, -2.7822265625, -0.70703125, 1.3681640625, 3.443359375, 5.5185546875, 7.59375, 9.6689453125, 11.744140625, 13.8193359375, 15.89453125, 17.9697265625, 20.044921875, 22.1201171875, 24.1953125, 26.2705078125, 28.345703125, 30.4208984375, 32.49609375, 34.5712890625, 36.646484375, 38.7216796875, 40.796875, 42.8720703125, 44.947265625, 47.0224609375, 49.09765625, 51.1728515625, 53.248046875, 55.3232421875, 57.3984375, 59.4736328125, 61.548828125, 63.6240234375, 65.69921875, 67.7744140625, 69.849609375, 71.9248046875, 74.0]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 12.0, 22.0, 24.0, 42.0, 64.0, 89.0, 116.0, 114.0, 122.0, 106.0, 92.0, 67.0, 49.0, 34.0, 18.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-282.52789306640625, -274.9053039550781, -267.28271484375, -259.6601257324219, -252.0375518798828, -244.4149627685547, -236.79237365722656, -229.16978454589844, -221.54721069335938, -213.92462158203125, -206.30203247070312, -198.679443359375, -191.05686950683594, -183.4342803955078, -175.8116912841797, -168.18910217285156, -160.56651306152344, -152.9439239501953, -145.3213348388672, -137.69876098632812, -130.076171875, -122.45358276367188, -114.83099365234375, -107.20840454101562, -99.58582305908203, -91.9632339477539, -84.34065246582031, -76.71806335449219, -69.09547424316406, -61.47289276123047, -53.850303649902344, -46.227718353271484, -38.60511779785156, -30.982532501220703, -23.35994529724121, -15.737358093261719, -8.11477279663086, -0.4921875, 7.130401611328125, 14.752986907958984, 22.375572204589844, 29.998157501220703, 37.62074279785156, 45.24333190917969, 52.86591720581055, 60.488502502441406, 68.11109161376953, 75.73367309570312, 83.35626220703125, 90.97885131835938, 98.60143280029297, 106.2240219116211, 113.84660339355469, 121.46919250488281, 129.09178161621094, 136.71437072753906, 144.33694458007812, 151.95953369140625, 159.58212280273438, 167.2047119140625, 174.82728576660156, 182.4498748779297, 190.0724639892578, 197.69505310058594, 205.31764221191406]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 12.0, 14.0, 12.0, 20.0, 28.0, 30.0, 33.0, 39.0, 44.0, 52.0, 68.0, 54.0, 42.0, 60.0, 68.0, 54.0, 62.0, 50.0, 43.0, 45.0, 29.0, 25.0, 31.0, 19.0, 13.0, 16.0, 7.0, 9.0, 4.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.14976501464844, -134.23031616210938, -129.3108673095703, -124.39141845703125, -119.47196960449219, -114.55252075195312, -109.63307189941406, -104.713623046875, -99.79417419433594, -94.87472534179688, -89.95527648925781, -85.03582763671875, -80.11637878417969, -75.19692993164062, -70.27748107910156, -65.3580322265625, -60.43858337402344, -55.519134521484375, -50.59968566894531, -45.68023681640625, -40.76078796386719, -35.841339111328125, -30.921890258789062, -26.00244140625, -21.082992553710938, -16.163543701171875, -11.244094848632812, -6.32464599609375, -1.4051971435546875, 3.514251708984375, 8.433700561523438, 13.3531494140625, 18.2725830078125, 23.192031860351562, 28.111480712890625, 33.03092956542969, 37.95037841796875, 42.86982727050781, 47.789276123046875, 52.70872497558594, 57.628173828125, 62.54762268066406, 67.46707153320312, 72.38652038574219, 77.30596923828125, 82.22541809082031, 87.14486694335938, 92.06431579589844, 96.9837646484375, 101.90321350097656, 106.82266235351562, 111.74211120605469, 116.66156005859375, 121.58100891113281, 126.50045776367188, 131.41990661621094, 136.33935546875, 141.25880432128906, 146.17825317382812, 151.0977020263672, 156.01715087890625, 160.9365997314453, 165.85604858398438, 170.77549743652344, 175.6949462890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 2.0, 1.0, 7.0, 11.0, 7.0, 27.0, 35.0, 45.0, 61.0, 95.0, 156.0, 294.0, 534.0, 1260.0, 3314.0, 12827.0, 74864.0, 702069.0, 215996.0, 27249.0, 6035.0, 1869.0, 827.0, 397.0, 208.0, 135.0, 94.0, 33.0, 29.0, 24.0, 8.0, 6.0, 11.0, 6.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.875, -140.615234375, -135.35546875, -130.095703125, -124.8359375, -119.576171875, -114.31640625, -109.056640625, -103.796875, -98.537109375, -93.27734375, -88.017578125, -82.7578125, -77.498046875, -72.23828125, -66.978515625, -61.71875, -56.458984375, -51.19921875, -45.939453125, -40.6796875, -35.419921875, -30.16015625, -24.900390625, -19.640625, -14.380859375, -9.12109375, -3.861328125, 1.3984375, 6.658203125, 11.91796875, 17.177734375, 22.4375, 27.697265625, 32.95703125, 38.216796875, 43.4765625, 48.736328125, 53.99609375, 59.255859375, 64.515625, 69.775390625, 75.03515625, 80.294921875, 85.5546875, 90.814453125, 96.07421875, 101.333984375, 106.59375, 111.853515625, 117.11328125, 122.373046875, 127.6328125, 132.892578125, 138.15234375, 143.412109375, 148.671875, 153.931640625, 159.19140625, 164.451171875, 169.7109375, 174.970703125, 180.23046875, 185.490234375, 190.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 10.0, 6.0, 23.0, 25.0, 25.0, 56.0, 66.0, 91.0, 73.0, 84.0, 100.0, 91.0, 63.0, 72.0, 52.0, 53.0, 34.0, 24.0, 16.0, 14.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.140625, -21.455078125, -20.76953125, -20.083984375, -19.3984375, -18.712890625, -18.02734375, -17.341796875, -16.65625, -15.970703125, -15.28515625, -14.599609375, -13.9140625, -13.228515625, -12.54296875, -11.857421875, -11.171875, -10.486328125, -9.80078125, -9.115234375, -8.4296875, -7.744140625, -7.05859375, -6.373046875, -5.6875, -5.001953125, -4.31640625, -3.630859375, -2.9453125, -2.259765625, -1.57421875, -0.888671875, -0.203125, 0.482421875, 1.16796875, 1.853515625, 2.5390625, 3.224609375, 3.91015625, 4.595703125, 5.28125, 5.966796875, 6.65234375, 7.337890625, 8.0234375, 8.708984375, 9.39453125, 10.080078125, 10.765625, 11.451171875, 12.13671875, 12.822265625, 13.5078125, 14.193359375, 14.87890625, 15.564453125, 16.25, 16.935546875, 17.62109375, 18.306640625, 18.9921875, 19.677734375, 20.36328125, 21.048828125, 21.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 5.0, 9.0, 14.0, 12.0, 26.0, 29.0, 39.0, 52.0, 68.0, 130.0, 151.0, 201.0, 296.0, 488.0, 762.0, 1426.0, 3002.0, 7243.0, 19648.0, 56119.0, 176815.0, 492100.0, 193624.0, 60424.0, 20890.0, 7869.0, 3161.0, 1535.0, 895.0, 482.0, 303.0, 221.0, 137.0, 101.0, 68.0, 55.0, 44.0, 27.0, 19.0, 21.0, 17.0, 9.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-60.8125, -58.943359375, -57.07421875, -55.205078125, -53.3359375, -51.466796875, -49.59765625, -47.728515625, -45.859375, -43.990234375, -42.12109375, -40.251953125, -38.3828125, -36.513671875, -34.64453125, -32.775390625, -30.90625, -29.037109375, -27.16796875, -25.298828125, -23.4296875, -21.560546875, -19.69140625, -17.822265625, -15.953125, -14.083984375, -12.21484375, -10.345703125, -8.4765625, -6.607421875, -4.73828125, -2.869140625, -1.0, 0.869140625, 2.73828125, 4.607421875, 6.4765625, 8.345703125, 10.21484375, 12.083984375, 13.953125, 15.822265625, 17.69140625, 19.560546875, 21.4296875, 23.298828125, 25.16796875, 27.037109375, 28.90625, 30.775390625, 32.64453125, 34.513671875, 36.3828125, 38.251953125, 40.12109375, 41.990234375, 43.859375, 45.728515625, 47.59765625, 49.466796875, 51.3359375, 53.205078125, 55.07421875, 56.943359375, 58.8125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 10.0, 8.0, 13.0, 15.0, 11.0, 16.0, 26.0, 22.0, 19.0, 32.0, 32.0, 40.0, 49.0, 37.0, 53.0, 43.0, 45.0, 51.0, 45.0, 58.0, 43.0, 40.0, 34.0, 33.0, 28.0, 30.0, 25.0, 26.0, 25.0, 22.0, 20.0, 11.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.56982421875, -41.0146484375, -39.45947265625, -37.904296875, -36.34912109375, -34.7939453125, -33.23876953125, -31.68359375, -30.12841796875, -28.5732421875, -27.01806640625, -25.462890625, -23.90771484375, -22.3525390625, -20.79736328125, -19.2421875, -17.68701171875, -16.1318359375, -14.57666015625, -13.021484375, -11.46630859375, -9.9111328125, -8.35595703125, -6.80078125, -5.24560546875, -3.6904296875, -2.13525390625, -0.580078125, 0.97509765625, 2.5302734375, 4.08544921875, 5.640625, 7.19580078125, 8.7509765625, 10.30615234375, 11.861328125, 13.41650390625, 14.9716796875, 16.52685546875, 18.08203125, 19.63720703125, 21.1923828125, 22.74755859375, 24.302734375, 25.85791015625, 27.4130859375, 28.96826171875, 30.5234375, 32.07861328125, 33.6337890625, 35.18896484375, 36.744140625, 38.29931640625, 39.8544921875, 41.40966796875, 42.96484375, 44.52001953125, 46.0751953125, 47.63037109375, 49.185546875, 50.74072265625, 52.2958984375, 53.85107421875, 55.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 8.0, 5.0, 12.0, 18.0, 32.0, 53.0, 79.0, 88.0, 188.0, 363.0, 808.0, 2150.0, 7335.0, 30634.0, 184535.0, 620785.0, 163534.0, 27562.0, 6629.0, 2052.0, 855.0, 368.0, 184.0, 98.0, 75.0, 32.0, 18.0, 14.0, 10.0, 9.0, 4.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.968017578125, -29.95166015625, -28.935302734375, -27.9189453125, -26.902587890625, -25.88623046875, -24.869873046875, -23.853515625, -22.837158203125, -21.82080078125, -20.804443359375, -19.7880859375, -18.771728515625, -17.75537109375, -16.739013671875, -15.72265625, -14.706298828125, -13.68994140625, -12.673583984375, -11.6572265625, -10.640869140625, -9.62451171875, -8.608154296875, -7.591796875, -6.575439453125, -5.55908203125, -4.542724609375, -3.5263671875, -2.510009765625, -1.49365234375, -0.477294921875, 0.5390625, 1.555419921875, 2.57177734375, 3.588134765625, 4.6044921875, 5.620849609375, 6.63720703125, 7.653564453125, 8.669921875, 9.686279296875, 10.70263671875, 11.718994140625, 12.7353515625, 13.751708984375, 14.76806640625, 15.784423828125, 16.80078125, 17.817138671875, 18.83349609375, 19.849853515625, 20.8662109375, 21.882568359375, 22.89892578125, 23.915283203125, 24.931640625, 25.947998046875, 26.96435546875, 27.980712890625, 28.9970703125, 30.013427734375, 31.02978515625, 32.046142578125, 33.0625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 14.0, 6.0, 15.0, 18.0, 35.0, 31.0, 52.0, 114.0, 190.0, 201.0, 103.0, 62.0, 30.0, 30.0, 18.0, 13.0, 19.0, 5.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0072479248046875, -0.007052063941955566, -0.006856203079223633, -0.006660342216491699, -0.006464481353759766, -0.006268620491027832, -0.0060727596282958984, -0.005876898765563965, -0.005681037902832031, -0.005485177040100098, -0.005289316177368164, -0.0050934553146362305, -0.004897594451904297, -0.004701733589172363, -0.00450587272644043, -0.004310011863708496, -0.0041141510009765625, -0.003918290138244629, -0.0037224292755126953, -0.0035265684127807617, -0.003330707550048828, -0.0031348466873168945, -0.002938985824584961, -0.0027431249618530273, -0.0025472640991210938, -0.00235140323638916, -0.0021555423736572266, -0.001959681510925293, -0.0017638206481933594, -0.0015679597854614258, -0.0013720989227294922, -0.0011762380599975586, -0.000980377197265625, -0.0007845163345336914, -0.0005886554718017578, -0.0003927946090698242, -0.00019693374633789062, -1.0728836059570312e-06, 0.00019478797912597656, 0.00039064884185791016, 0.0005865097045898438, 0.0007823705673217773, 0.000978231430053711, 0.0011740922927856445, 0.0013699531555175781, 0.0015658140182495117, 0.0017616748809814453, 0.001957535743713379, 0.0021533966064453125, 0.002349257469177246, 0.0025451183319091797, 0.0027409791946411133, 0.002936840057373047, 0.0031327009201049805, 0.003328561782836914, 0.0035244226455688477, 0.0037202835083007812, 0.003916144371032715, 0.0041120052337646484, 0.004307866096496582, 0.004503726959228516, 0.004699587821960449, 0.004895448684692383, 0.005091309547424316, 0.00528717041015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 10.0, 14.0, 16.0, 34.0, 49.0, 70.0, 117.0, 216.0, 344.0, 659.0, 1608.0, 4758.0, 17521.0, 81292.0, 549930.0, 326745.0, 47988.0, 11262.0, 3221.0, 1338.0, 557.0, 318.0, 167.0, 105.0, 81.0, 36.0, 21.0, 13.0, 14.0, 7.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.115234375, -32.13671875, -31.158203125, -30.1796875, -29.201171875, -28.22265625, -27.244140625, -26.265625, -25.287109375, -24.30859375, -23.330078125, -22.3515625, -21.373046875, -20.39453125, -19.416015625, -18.4375, -17.458984375, -16.48046875, -15.501953125, -14.5234375, -13.544921875, -12.56640625, -11.587890625, -10.609375, -9.630859375, -8.65234375, -7.673828125, -6.6953125, -5.716796875, -4.73828125, -3.759765625, -2.78125, -1.802734375, -0.82421875, 0.154296875, 1.1328125, 2.111328125, 3.08984375, 4.068359375, 5.046875, 6.025390625, 7.00390625, 7.982421875, 8.9609375, 9.939453125, 10.91796875, 11.896484375, 12.875, 13.853515625, 14.83203125, 15.810546875, 16.7890625, 17.767578125, 18.74609375, 19.724609375, 20.703125, 21.681640625, 22.66015625, 23.638671875, 24.6171875, 25.595703125, 26.57421875, 27.552734375, 28.53125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 7.0, 11.0, 5.0, 12.0, 12.0, 9.0, 19.0, 25.0, 42.0, 45.0, 73.0, 88.0, 144.0, 115.0, 107.0, 89.0, 45.0, 28.0, 35.0, 28.0, 12.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.760009765625, -18.11376953125, -17.467529296875, -16.8212890625, -16.175048828125, -15.52880859375, -14.882568359375, -14.236328125, -13.590087890625, -12.94384765625, -12.297607421875, -11.6513671875, -11.005126953125, -10.35888671875, -9.712646484375, -9.06640625, -8.420166015625, -7.77392578125, -7.127685546875, -6.4814453125, -5.835205078125, -5.18896484375, -4.542724609375, -3.896484375, -3.250244140625, -2.60400390625, -1.957763671875, -1.3115234375, -0.665283203125, -0.01904296875, 0.627197265625, 1.2734375, 1.919677734375, 2.56591796875, 3.212158203125, 3.8583984375, 4.504638671875, 5.15087890625, 5.797119140625, 6.443359375, 7.089599609375, 7.73583984375, 8.382080078125, 9.0283203125, 9.674560546875, 10.32080078125, 10.967041015625, 11.61328125, 12.259521484375, 12.90576171875, 13.552001953125, 14.1982421875, 14.844482421875, 15.49072265625, 16.136962890625, 16.783203125, 17.429443359375, 18.07568359375, 18.721923828125, 19.3681640625, 20.014404296875, 20.66064453125, 21.306884765625, 21.953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 7.0, 15.0, 36.0, 60.0, 105.0, 137.0, 187.0, 167.0, 100.0, 76.0, 56.0, 24.0, 17.0, 8.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-635.1976928710938, -617.8590698242188, -600.5204467773438, -583.1817626953125, -565.8431396484375, -548.5045166015625, -531.1658935546875, -513.8272705078125, -496.4886169433594, -479.1499938964844, -461.81134033203125, -444.47271728515625, -427.13409423828125, -409.7954406738281, -392.4568176269531, -375.1181640625, -357.779541015625, -340.44091796875, -323.1022644042969, -305.7636413574219, -288.42498779296875, -271.08636474609375, -253.74774169921875, -236.4091033935547, -219.07046508789062, -201.73182678222656, -184.3931884765625, -167.0545654296875, -149.71592712402344, -132.37728881835938, -115.03865814208984, -97.70002746582031, -80.36138916015625, -63.02275466918945, -45.684120178222656, -28.34548568725586, -11.006851196289062, 6.331787109375, 23.67041778564453, 41.00904846191406, 58.347686767578125, 75.68632507324219, 93.02495574951172, 110.36358642578125, 127.70222473144531, 145.04086303710938, 162.37948608398438, 179.71812438964844, 197.0567626953125, 214.39540100097656, 231.73403930664062, 249.07266235351562, 266.41131591796875, 283.74993896484375, 301.08856201171875, 318.42718505859375, 335.7658386230469, 353.1044616699219, 370.443115234375, 387.78173828125, 405.120361328125, 422.4590148925781, 439.7976379394531, 457.13629150390625, 474.47491455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 10.0, 11.0, 12.0, 13.0, 15.0, 22.0, 20.0, 23.0, 36.0, 24.0, 31.0, 23.0, 38.0, 35.0, 45.0, 47.0, 54.0, 32.0, 47.0, 37.0, 39.0, 47.0, 27.0, 38.0, 31.0, 28.0, 43.0, 18.0, 25.0, 13.0, 15.0, 15.0, 10.0, 14.0, 8.0, 10.0, 12.0, 4.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.2005615234375, -192.03567504882812, -184.8707733154297, -177.7058868408203, -170.54100036621094, -163.3760986328125, -156.21121215820312, -149.04632568359375, -141.88143920898438, -134.716552734375, -127.5516586303711, -120.38676452636719, -113.22187805175781, -106.0569839477539, -98.89208984375, -91.72720336914062, -84.56230163574219, -77.39740753173828, -70.2325210571289, -63.067626953125, -55.90273666381836, -48.73784637451172, -41.57295227050781, -34.40806198120117, -27.24317169189453, -20.07828140258789, -12.913389205932617, -5.748497009277344, 1.4163932800292969, 8.581283569335938, 15.746177673339844, 22.911067962646484, 30.075958251953125, 37.240848541259766, 44.405738830566406, 51.57063293457031, 58.73552322387695, 65.9004135131836, 73.0653076171875, 80.23019409179688, 87.39508819580078, 94.55998229980469, 101.72486877441406, 108.88976287841797, 116.05465698242188, 123.21954345703125, 130.38442993164062, 137.54933166503906, 144.71421813964844, 151.8791046142578, 159.04400634765625, 166.20889282226562, 173.373779296875, 180.53866577148438, 187.7035675048828, 194.8684539794922, 202.03335571289062, 209.1982421875, 216.36314392089844, 223.5280303955078, 230.6929168701172, 237.85781860351562, 245.022705078125, 252.18759155273438, 259.35247802734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 8.0, 11.0, 15.0, 35.0, 33.0, 54.0, 68.0, 88.0, 124.0, 219.0, 334.0, 627.0, 1204.0, 2703.0, 6777.0, 23233.0, 149712.0, 3793906.0, 176830.0, 25322.0, 7334.0, 2770.0, 1312.0, 619.0, 335.0, 181.0, 116.0, 73.0, 50.0, 37.0, 17.0, 21.0, 10.0, 18.0, 13.0, 12.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-143.375, -138.349609375, -133.32421875, -128.298828125, -123.2734375, -118.248046875, -113.22265625, -108.197265625, -103.171875, -98.146484375, -93.12109375, -88.095703125, -83.0703125, -78.044921875, -73.01953125, -67.994140625, -62.96875, -57.943359375, -52.91796875, -47.892578125, -42.8671875, -37.841796875, -32.81640625, -27.791015625, -22.765625, -17.740234375, -12.71484375, -7.689453125, -2.6640625, 2.361328125, 7.38671875, 12.412109375, 17.4375, 22.462890625, 27.48828125, 32.513671875, 37.5390625, 42.564453125, 47.58984375, 52.615234375, 57.640625, 62.666015625, 67.69140625, 72.716796875, 77.7421875, 82.767578125, 87.79296875, 92.818359375, 97.84375, 102.869140625, 107.89453125, 112.919921875, 117.9453125, 122.970703125, 127.99609375, 133.021484375, 138.046875, 143.072265625, 148.09765625, 153.123046875, 158.1484375, 163.173828125, 168.19921875, 173.224609375, 178.25]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 3.0, 6.0, 15.0, 16.0, 18.0, 29.0, 44.0, 45.0, 87.0, 83.0, 65.0, 78.0, 73.0, 75.0, 79.0, 60.0, 59.0, 53.0, 36.0, 21.0, 18.0, 12.0, 14.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.265625, -20.600830078125, -19.93603515625, -19.271240234375, -18.6064453125, -17.941650390625, -17.27685546875, -16.612060546875, -15.947265625, -15.282470703125, -14.61767578125, -13.952880859375, -13.2880859375, -12.623291015625, -11.95849609375, -11.293701171875, -10.62890625, -9.964111328125, -9.29931640625, -8.634521484375, -7.9697265625, -7.304931640625, -6.64013671875, -5.975341796875, -5.310546875, -4.645751953125, -3.98095703125, -3.316162109375, -2.6513671875, -1.986572265625, -1.32177734375, -0.656982421875, 0.0078125, 0.672607421875, 1.33740234375, 2.002197265625, 2.6669921875, 3.331787109375, 3.99658203125, 4.661376953125, 5.326171875, 5.990966796875, 6.65576171875, 7.320556640625, 7.9853515625, 8.650146484375, 9.31494140625, 9.979736328125, 10.64453125, 11.309326171875, 11.97412109375, 12.638916015625, 13.3037109375, 13.968505859375, 14.63330078125, 15.298095703125, 15.962890625, 16.627685546875, 17.29248046875, 17.957275390625, 18.6220703125, 19.286865234375, 19.95166015625, 20.616455078125, 21.28125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 13.0, 19.0, 31.0, 43.0, 51.0, 72.0, 85.0, 136.0, 221.0, 393.0, 801.0, 1890.0, 5603.0, 19964.0, 111748.0, 3106144.0, 859358.0, 66486.0, 14073.0, 4086.0, 1467.0, 636.0, 349.0, 190.0, 113.0, 76.0, 49.0, 47.0, 27.0, 20.0, 10.0, 11.0, 11.0, 9.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-114.125, -110.65234375, -107.1796875, -103.70703125, -100.234375, -96.76171875, -93.2890625, -89.81640625, -86.34375, -82.87109375, -79.3984375, -75.92578125, -72.453125, -68.98046875, -65.5078125, -62.03515625, -58.5625, -55.08984375, -51.6171875, -48.14453125, -44.671875, -41.19921875, -37.7265625, -34.25390625, -30.78125, -27.30859375, -23.8359375, -20.36328125, -16.890625, -13.41796875, -9.9453125, -6.47265625, -3.0, 0.47265625, 3.9453125, 7.41796875, 10.890625, 14.36328125, 17.8359375, 21.30859375, 24.78125, 28.25390625, 31.7265625, 35.19921875, 38.671875, 42.14453125, 45.6171875, 49.08984375, 52.5625, 56.03515625, 59.5078125, 62.98046875, 66.453125, 69.92578125, 73.3984375, 76.87109375, 80.34375, 83.81640625, 87.2890625, 90.76171875, 94.234375, 97.70703125, 101.1796875, 104.65234375, 108.125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 21.0, 30.0, 57.0, 95.0, 251.0, 569.0, 1898.0, 640.0, 223.0, 113.0, 55.0, 43.0, 21.0, 19.0, 7.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.8125, -62.3779296875, -60.943359375, -59.5087890625, -58.07421875, -56.6396484375, -55.205078125, -53.7705078125, -52.3359375, -50.9013671875, -49.466796875, -48.0322265625, -46.59765625, -45.1630859375, -43.728515625, -42.2939453125, -40.859375, -39.4248046875, -37.990234375, -36.5556640625, -35.12109375, -33.6865234375, -32.251953125, -30.8173828125, -29.3828125, -27.9482421875, -26.513671875, -25.0791015625, -23.64453125, -22.2099609375, -20.775390625, -19.3408203125, -17.90625, -16.4716796875, -15.037109375, -13.6025390625, -12.16796875, -10.7333984375, -9.298828125, -7.8642578125, -6.4296875, -4.9951171875, -3.560546875, -2.1259765625, -0.69140625, 0.7431640625, 2.177734375, 3.6123046875, 5.046875, 6.4814453125, 7.916015625, 9.3505859375, 10.78515625, 12.2197265625, 13.654296875, 15.0888671875, 16.5234375, 17.9580078125, 19.392578125, 20.8271484375, 22.26171875, 23.6962890625, 25.130859375, 26.5654296875, 28.0]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 13.0, 24.0, 64.0, 97.0, 123.0, 143.0, 159.0, 120.0, 116.0, 55.0, 37.0, 13.0, 10.0, 5.0, 4.0, 0.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-215.8210906982422, -207.04991149902344, -198.2787322998047, -189.50753784179688, -180.73635864257812, -171.96517944335938, -163.19400024414062, -154.42282104492188, -145.65164184570312, -136.88046264648438, -128.10928344726562, -119.33809661865234, -110.56690979003906, -101.79573059082031, -93.02455139160156, -84.25337219238281, -75.482177734375, -66.71099853515625, -57.93981170654297, -49.16863250732422, -40.3974494934082, -31.626266479492188, -22.855087280273438, -14.083904266357422, -5.312721252441406, 3.458460807800293, 12.229642868041992, 21.000823974609375, 29.77200698852539, 38.543190002441406, 47.314369201660156, 56.08555221557617, 64.85671997070312, 73.62789916992188, 82.39908599853516, 91.1702651977539, 99.94145202636719, 108.71263122558594, 117.48381042480469, 126.25498962402344, 135.02618408203125, 143.79736328125, 152.56854248046875, 161.3397216796875, 170.1109161376953, 178.88209533691406, 187.6532745361328, 196.42445373535156, 205.1956329345703, 213.96681213378906, 222.7379913330078, 231.50918579101562, 240.28036499023438, 249.05154418945312, 257.8227233886719, 266.5939025878906, 275.3650817871094, 284.1362609863281, 292.9074401855469, 301.6786193847656, 310.4497985839844, 319.22100830078125, 327.9921875, 336.76336669921875, 345.5345458984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 15.0, 7.0, 10.0, 9.0, 24.0, 22.0, 21.0, 33.0, 46.0, 44.0, 41.0, 33.0, 52.0, 76.0, 60.0, 64.0, 52.0, 44.0, 45.0, 44.0, 50.0, 33.0, 21.0, 30.0, 22.0, 14.0, 19.0, 19.0, 10.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.55390167236328, -98.66016387939453, -94.76643371582031, -90.87269592285156, -86.97895812988281, -83.08522033691406, -79.19148254394531, -75.2977523803711, -71.40401458740234, -67.5102767944336, -63.61654281616211, -59.722808837890625, -55.829071044921875, -51.935333251953125, -48.04159927368164, -44.147865295410156, -40.254127502441406, -36.360389709472656, -32.46665573120117, -28.572919845581055, -24.679183959960938, -20.78544807434082, -16.891712188720703, -12.997976303100586, -9.104240417480469, -5.210504531860352, -1.3167686462402344, 2.576967239379883, 6.470703125, 10.364439010620117, 14.258174896240234, 18.15191078186035, 22.045639038085938, 25.939374923706055, 29.833110809326172, 33.726844787597656, 37.620582580566406, 41.514320373535156, 45.40805435180664, 49.301788330078125, 53.195526123046875, 57.089263916015625, 60.98299789428711, 64.8767318725586, 68.77046966552734, 72.6642074584961, 76.55793762207031, 80.45167541503906, 84.34541320800781, 88.23915100097656, 92.13288879394531, 96.02661895751953, 99.92035675048828, 103.81409454345703, 107.70782470703125, 111.6015625, 115.49530029296875, 119.3890380859375, 123.28277587890625, 127.17650604248047, 131.07025146484375, 134.96397399902344, 138.8577117919922, 142.75144958496094, 146.6451873779297]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 9.0, 15.0, 21.0, 27.0, 54.0, 74.0, 110.0, 190.0, 297.0, 537.0, 1198.0, 3490.0, 14604.0, 84429.0, 753049.0, 159015.0, 23053.0, 5140.0, 1603.0, 721.0, 345.0, 229.0, 107.0, 72.0, 41.0, 38.0, 18.0, 22.0, 12.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-165.25, -160.1875, -155.125, -150.0625, -145.0, -139.9375, -134.875, -129.8125, -124.75, -119.6875, -114.625, -109.5625, -104.5, -99.4375, -94.375, -89.3125, -84.25, -79.1875, -74.125, -69.0625, -64.0, -58.9375, -53.875, -48.8125, -43.75, -38.6875, -33.625, -28.5625, -23.5, -18.4375, -13.375, -8.3125, -3.25, 1.8125, 6.875, 11.9375, 17.0, 22.0625, 27.125, 32.1875, 37.25, 42.3125, 47.375, 52.4375, 57.5, 62.5625, 67.625, 72.6875, 77.75, 82.8125, 87.875, 92.9375, 98.0, 103.0625, 108.125, 113.1875, 118.25, 123.3125, 128.375, 133.4375, 138.5, 143.5625, 148.625, 153.6875, 158.75]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 9.0, 13.0, 15.0, 18.0, 35.0, 33.0, 49.0, 57.0, 85.0, 60.0, 80.0, 80.0, 85.0, 85.0, 61.0, 60.0, 40.0, 40.0, 32.0, 17.0, 12.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.6875, -21.015625, -20.34375, -19.671875, -19.0, -18.328125, -17.65625, -16.984375, -16.3125, -15.640625, -14.96875, -14.296875, -13.625, -12.953125, -12.28125, -11.609375, -10.9375, -10.265625, -9.59375, -8.921875, -8.25, -7.578125, -6.90625, -6.234375, -5.5625, -4.890625, -4.21875, -3.546875, -2.875, -2.203125, -1.53125, -0.859375, -0.1875, 0.484375, 1.15625, 1.828125, 2.5, 3.171875, 3.84375, 4.515625, 5.1875, 5.859375, 6.53125, 7.203125, 7.875, 8.546875, 9.21875, 9.890625, 10.5625, 11.234375, 11.90625, 12.578125, 13.25, 13.921875, 14.59375, 15.265625, 15.9375, 16.609375, 17.28125, 17.953125, 18.625, 19.296875, 19.96875, 20.640625, 21.3125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 9.0, 20.0, 29.0, 37.0, 36.0, 65.0, 112.0, 151.0, 238.0, 378.0, 711.0, 1383.0, 2453.0, 5165.0, 10667.0, 22252.0, 48791.0, 136323.0, 452824.0, 237394.0, 70368.0, 30780.0, 14046.0, 6909.0, 3387.0, 1748.0, 903.0, 513.0, 301.0, 160.0, 101.0, 77.0, 53.0, 41.0, 29.0, 26.0, 12.0, 11.0, 9.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.5, -48.03125, -46.5625, -45.09375, -43.625, -42.15625, -40.6875, -39.21875, -37.75, -36.28125, -34.8125, -33.34375, -31.875, -30.40625, -28.9375, -27.46875, -26.0, -24.53125, -23.0625, -21.59375, -20.125, -18.65625, -17.1875, -15.71875, -14.25, -12.78125, -11.3125, -9.84375, -8.375, -6.90625, -5.4375, -3.96875, -2.5, -1.03125, 0.4375, 1.90625, 3.375, 4.84375, 6.3125, 7.78125, 9.25, 10.71875, 12.1875, 13.65625, 15.125, 16.59375, 18.0625, 19.53125, 21.0, 22.46875, 23.9375, 25.40625, 26.875, 28.34375, 29.8125, 31.28125, 32.75, 34.21875, 35.6875, 37.15625, 38.625, 40.09375, 41.5625, 43.03125, 44.5]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 1.0, 8.0, 8.0, 11.0, 14.0, 23.0, 13.0, 20.0, 33.0, 36.0, 35.0, 30.0, 38.0, 35.0, 40.0, 37.0, 41.0, 39.0, 47.0, 63.0, 41.0, 48.0, 44.0, 36.0, 44.0, 36.0, 31.0, 18.0, 25.0, 16.0, 13.0, 13.0, 13.0, 8.0, 6.0, 7.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.478515625, -43.95703125, -42.435546875, -40.9140625, -39.392578125, -37.87109375, -36.349609375, -34.828125, -33.306640625, -31.78515625, -30.263671875, -28.7421875, -27.220703125, -25.69921875, -24.177734375, -22.65625, -21.134765625, -19.61328125, -18.091796875, -16.5703125, -15.048828125, -13.52734375, -12.005859375, -10.484375, -8.962890625, -7.44140625, -5.919921875, -4.3984375, -2.876953125, -1.35546875, 0.166015625, 1.6875, 3.208984375, 4.73046875, 6.251953125, 7.7734375, 9.294921875, 10.81640625, 12.337890625, 13.859375, 15.380859375, 16.90234375, 18.423828125, 19.9453125, 21.466796875, 22.98828125, 24.509765625, 26.03125, 27.552734375, 29.07421875, 30.595703125, 32.1171875, 33.638671875, 35.16015625, 36.681640625, 38.203125, 39.724609375, 41.24609375, 42.767578125, 44.2890625, 45.810546875, 47.33203125, 48.853515625, 50.375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 22.0, 28.0, 39.0, 40.0, 100.0, 140.0, 293.0, 505.0, 986.0, 2528.0, 9193.0, 69883.0, 852383.0, 96106.0, 11124.0, 2806.0, 1097.0, 541.0, 286.0, 153.0, 76.0, 68.0, 34.0, 30.0, 16.0, 15.0, 8.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.65625, -45.79150390625, -43.9267578125, -42.06201171875, -40.197265625, -38.33251953125, -36.4677734375, -34.60302734375, -32.73828125, -30.87353515625, -29.0087890625, -27.14404296875, -25.279296875, -23.41455078125, -21.5498046875, -19.68505859375, -17.8203125, -15.95556640625, -14.0908203125, -12.22607421875, -10.361328125, -8.49658203125, -6.6318359375, -4.76708984375, -2.90234375, -1.03759765625, 0.8271484375, 2.69189453125, 4.556640625, 6.42138671875, 8.2861328125, 10.15087890625, 12.015625, 13.88037109375, 15.7451171875, 17.60986328125, 19.474609375, 21.33935546875, 23.2041015625, 25.06884765625, 26.93359375, 28.79833984375, 30.6630859375, 32.52783203125, 34.392578125, 36.25732421875, 38.1220703125, 39.98681640625, 41.8515625, 43.71630859375, 45.5810546875, 47.44580078125, 49.310546875, 51.17529296875, 53.0400390625, 54.90478515625, 56.76953125, 58.63427734375, 60.4990234375, 62.36376953125, 64.228515625, 66.09326171875, 67.9580078125, 69.82275390625, 71.6875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 3.0, 3.0, 6.0, 13.0, 11.0, 26.0, 20.0, 43.0, 130.0, 320.0, 214.0, 73.0, 34.0, 25.0, 22.0, 12.0, 6.0, 6.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0111541748046875, -0.010910391807556152, -0.010666608810424805, -0.010422825813293457, -0.01017904281616211, -0.009935259819030762, -0.009691476821899414, -0.009447693824768066, -0.009203910827636719, -0.008960127830505371, -0.008716344833374023, -0.008472561836242676, -0.008228778839111328, -0.00798499584197998, -0.007741212844848633, -0.007497429847717285, -0.0072536468505859375, -0.00700986385345459, -0.006766080856323242, -0.0065222978591918945, -0.006278514862060547, -0.006034731864929199, -0.0057909488677978516, -0.005547165870666504, -0.005303382873535156, -0.005059599876403809, -0.004815816879272461, -0.004572033882141113, -0.004328250885009766, -0.004084467887878418, -0.0038406848907470703, -0.0035969018936157227, -0.003353118896484375, -0.0031093358993530273, -0.0028655529022216797, -0.002621769905090332, -0.0023779869079589844, -0.0021342039108276367, -0.001890420913696289, -0.0016466379165649414, -0.0014028549194335938, -0.001159071922302246, -0.0009152889251708984, -0.0006715059280395508, -0.0004277229309082031, -0.00018393993377685547, 5.984306335449219e-05, 0.00030362606048583984, 0.0005474090576171875, 0.0007911920547485352, 0.0010349750518798828, 0.0012787580490112305, 0.0015225410461425781, 0.0017663240432739258, 0.0020101070404052734, 0.002253890037536621, 0.0024976730346679688, 0.0027414560317993164, 0.002985239028930664, 0.0032290220260620117, 0.0034728050231933594, 0.003716588020324707, 0.003960371017456055, 0.004204154014587402, 0.00444793701171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 8.0, 19.0, 35.0, 38.0, 49.0, 105.0, 173.0, 391.0, 1013.0, 3470.0, 19026.0, 316753.0, 671832.0, 28719.0, 4662.0, 1244.0, 503.0, 195.0, 100.0, 66.0, 36.0, 22.0, 16.0, 14.0, 7.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.375, -57.40234375, -55.4296875, -53.45703125, -51.484375, -49.51171875, -47.5390625, -45.56640625, -43.59375, -41.62109375, -39.6484375, -37.67578125, -35.703125, -33.73046875, -31.7578125, -29.78515625, -27.8125, -25.83984375, -23.8671875, -21.89453125, -19.921875, -17.94921875, -15.9765625, -14.00390625, -12.03125, -10.05859375, -8.0859375, -6.11328125, -4.140625, -2.16796875, -0.1953125, 1.77734375, 3.75, 5.72265625, 7.6953125, 9.66796875, 11.640625, 13.61328125, 15.5859375, 17.55859375, 19.53125, 21.50390625, 23.4765625, 25.44921875, 27.421875, 29.39453125, 31.3671875, 33.33984375, 35.3125, 37.28515625, 39.2578125, 41.23046875, 43.203125, 45.17578125, 47.1484375, 49.12109375, 51.09375, 53.06640625, 55.0390625, 57.01171875, 58.984375, 60.95703125, 62.9296875, 64.90234375, 66.875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 14.0, 19.0, 31.0, 42.0, 79.0, 180.0, 229.0, 157.0, 85.0, 38.0, 24.0, 15.0, 11.0, 11.0, 8.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.5615234375, -33.560546875, -32.5595703125, -31.55859375, -30.5576171875, -29.556640625, -28.5556640625, -27.5546875, -26.5537109375, -25.552734375, -24.5517578125, -23.55078125, -22.5498046875, -21.548828125, -20.5478515625, -19.546875, -18.5458984375, -17.544921875, -16.5439453125, -15.54296875, -14.5419921875, -13.541015625, -12.5400390625, -11.5390625, -10.5380859375, -9.537109375, -8.5361328125, -7.53515625, -6.5341796875, -5.533203125, -4.5322265625, -3.53125, -2.5302734375, -1.529296875, -0.5283203125, 0.47265625, 1.4736328125, 2.474609375, 3.4755859375, 4.4765625, 5.4775390625, 6.478515625, 7.4794921875, 8.48046875, 9.4814453125, 10.482421875, 11.4833984375, 12.484375, 13.4853515625, 14.486328125, 15.4873046875, 16.48828125, 17.4892578125, 18.490234375, 19.4912109375, 20.4921875, 21.4931640625, 22.494140625, 23.4951171875, 24.49609375, 25.4970703125, 26.498046875, 27.4990234375, 28.5]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 15.0, 38.0, 41.0, 83.0, 140.0, 158.0, 162.0, 150.0, 97.0, 57.0, 42.0, 11.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.3349151611328, -172.87261962890625, -155.4103240966797, -137.94802856445312, -120.4857406616211, -103.02344512939453, -85.5611572265625, -68.09886169433594, -50.636566162109375, -33.17427062988281, -15.711978912353516, 1.7503128051757812, 19.212608337402344, 36.674903869628906, 54.13719177246094, 71.5994873046875, 89.06178283691406, 106.52407836914062, 123.98637390136719, 141.44866943359375, 158.91094970703125, 176.37326049804688, 193.83554077148438, 211.29783630371094, 228.7601318359375, 246.22242736816406, 263.6847229003906, 281.1470031738281, 298.60931396484375, 316.07159423828125, 333.53387451171875, 350.9961853027344, 368.45843505859375, 385.92071533203125, 403.3830261230469, 420.8453063964844, 438.3076171875, 455.7698974609375, 473.232177734375, 490.6944885253906, 508.15679931640625, 525.6190795898438, 543.0813598632812, 560.543701171875, 578.0059814453125, 595.46826171875, 612.9305419921875, 630.392822265625, 647.8551025390625, 665.3173828125, 682.7796630859375, 700.2420043945312, 717.7042846679688, 735.1665649414062, 752.6288452148438, 770.0911865234375, 787.553466796875, 805.0157470703125, 822.47802734375, 839.9403686523438, 857.4026489257812, 874.8649291992188, 892.3272094726562, 909.78955078125, 927.2518310546875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 5.0, 10.0, 13.0, 15.0, 9.0, 25.0, 28.0, 16.0, 26.0, 37.0, 28.0, 32.0, 35.0, 37.0, 48.0, 57.0, 53.0, 48.0, 37.0, 42.0, 42.0, 40.0, 35.0, 34.0, 33.0, 31.0, 22.0, 22.0, 25.0, 23.0, 21.0, 12.0, 8.0, 12.0, 6.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.6279296875, -184.66299438476562, -177.6980438232422, -170.7331085205078, -163.76815795898438, -156.80322265625, -149.83828735351562, -142.8733367919922, -135.9084014892578, -128.94346618652344, -121.978515625, -115.01358032226562, -108.04863739013672, -101.08369445800781, -94.1187515258789, -87.15380859375, -80.1888656616211, -73.22392272949219, -66.25897979736328, -59.29404067993164, -52.3291015625, -45.364158630371094, -38.39921569824219, -31.434276580810547, -24.46933364868164, -17.504392623901367, -10.539450645446777, -3.5745086669921875, 3.390432357788086, 10.35537338256836, 17.320316314697266, 24.285255432128906, 31.250198364257812, 38.21514129638672, 45.18008041381836, 52.145023345947266, 59.109962463378906, 66.07490539550781, 73.03984832763672, 80.00479125976562, 86.9697265625, 93.9346694946289, 100.89961242675781, 107.86454772949219, 114.8294906616211, 121.79443359375, 128.75936889648438, 135.7243194580078, 142.68927001953125, 149.65420532226562, 156.61915588378906, 163.58409118652344, 170.54904174804688, 177.51397705078125, 184.47891235351562, 191.44386291503906, 198.40879821777344, 205.3737335205078, 212.33868408203125, 219.30361938476562, 226.26856994628906, 233.23350524902344, 240.19845581054688, 247.16339111328125, 254.12832641601562]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 16.0, 14.0, 23.0, 32.0, 37.0, 38.0, 57.0, 86.0, 135.0, 203.0, 301.0, 476.0, 851.0, 1540.0, 3284.0, 7747.0, 23431.0, 98074.0, 3262223.0, 699083.0, 66695.0, 17776.0, 6375.0, 2600.0, 1225.0, 662.0, 387.0, 255.0, 168.0, 110.0, 97.0, 58.0, 47.0, 32.0, 38.0, 18.0, 16.0, 12.0, 16.0, 6.0, 3.0, 5.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-145.125, -140.42578125, -135.7265625, -131.02734375, -126.328125, -121.62890625, -116.9296875, -112.23046875, -107.53125, -102.83203125, -98.1328125, -93.43359375, -88.734375, -84.03515625, -79.3359375, -74.63671875, -69.9375, -65.23828125, -60.5390625, -55.83984375, -51.140625, -46.44140625, -41.7421875, -37.04296875, -32.34375, -27.64453125, -22.9453125, -18.24609375, -13.546875, -8.84765625, -4.1484375, 0.55078125, 5.25, 9.94921875, 14.6484375, 19.34765625, 24.046875, 28.74609375, 33.4453125, 38.14453125, 42.84375, 47.54296875, 52.2421875, 56.94140625, 61.640625, 66.33984375, 71.0390625, 75.73828125, 80.4375, 85.13671875, 89.8359375, 94.53515625, 99.234375, 103.93359375, 108.6328125, 113.33203125, 118.03125, 122.73046875, 127.4296875, 132.12890625, 136.828125, 141.52734375, 146.2265625, 150.92578125, 155.625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 7.0, 6.0, 12.0, 7.0, 20.0, 22.0, 28.0, 54.0, 40.0, 64.0, 72.0, 77.0, 66.0, 102.0, 70.0, 70.0, 65.0, 67.0, 32.0, 34.0, 37.0, 13.0, 16.0, 6.0, 7.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.609375, -20.93505859375, -20.2607421875, -19.58642578125, -18.912109375, -18.23779296875, -17.5634765625, -16.88916015625, -16.21484375, -15.54052734375, -14.8662109375, -14.19189453125, -13.517578125, -12.84326171875, -12.1689453125, -11.49462890625, -10.8203125, -10.14599609375, -9.4716796875, -8.79736328125, -8.123046875, -7.44873046875, -6.7744140625, -6.10009765625, -5.42578125, -4.75146484375, -4.0771484375, -3.40283203125, -2.728515625, -2.05419921875, -1.3798828125, -0.70556640625, -0.03125, 0.64306640625, 1.3173828125, 1.99169921875, 2.666015625, 3.34033203125, 4.0146484375, 4.68896484375, 5.36328125, 6.03759765625, 6.7119140625, 7.38623046875, 8.060546875, 8.73486328125, 9.4091796875, 10.08349609375, 10.7578125, 11.43212890625, 12.1064453125, 12.78076171875, 13.455078125, 14.12939453125, 14.8037109375, 15.47802734375, 16.15234375, 16.82666015625, 17.5009765625, 18.17529296875, 18.849609375, 19.52392578125, 20.1982421875, 20.87255859375, 21.546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 9.0, 10.0, 14.0, 14.0, 18.0, 36.0, 41.0, 50.0, 63.0, 115.0, 157.0, 237.0, 415.0, 722.0, 1315.0, 2732.0, 6101.0, 14616.0, 39276.0, 129394.0, 922889.0, 2808316.0, 184037.0, 51014.0, 18247.0, 7418.0, 3343.0, 1592.0, 807.0, 477.0, 273.0, 177.0, 106.0, 72.0, 50.0, 32.0, 23.0, 15.0, 15.0, 12.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-86.4375, -83.904296875, -81.37109375, -78.837890625, -76.3046875, -73.771484375, -71.23828125, -68.705078125, -66.171875, -63.638671875, -61.10546875, -58.572265625, -56.0390625, -53.505859375, -50.97265625, -48.439453125, -45.90625, -43.373046875, -40.83984375, -38.306640625, -35.7734375, -33.240234375, -30.70703125, -28.173828125, -25.640625, -23.107421875, -20.57421875, -18.041015625, -15.5078125, -12.974609375, -10.44140625, -7.908203125, -5.375, -2.841796875, -0.30859375, 2.224609375, 4.7578125, 7.291015625, 9.82421875, 12.357421875, 14.890625, 17.423828125, 19.95703125, 22.490234375, 25.0234375, 27.556640625, 30.08984375, 32.623046875, 35.15625, 37.689453125, 40.22265625, 42.755859375, 45.2890625, 47.822265625, 50.35546875, 52.888671875, 55.421875, 57.955078125, 60.48828125, 63.021484375, 65.5546875, 68.087890625, 70.62109375, 73.154296875, 75.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 11.0, 22.0, 29.0, 33.0, 66.0, 71.0, 139.0, 279.0, 772.0, 1772.0, 373.0, 202.0, 102.0, 62.0, 43.0, 25.0, 9.0, 10.0, 15.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-54.46875, -53.208740234375, -51.94873046875, -50.688720703125, -49.4287109375, -48.168701171875, -46.90869140625, -45.648681640625, -44.388671875, -43.128662109375, -41.86865234375, -40.608642578125, -39.3486328125, -38.088623046875, -36.82861328125, -35.568603515625, -34.30859375, -33.048583984375, -31.78857421875, -30.528564453125, -29.2685546875, -28.008544921875, -26.74853515625, -25.488525390625, -24.228515625, -22.968505859375, -21.70849609375, -20.448486328125, -19.1884765625, -17.928466796875, -16.66845703125, -15.408447265625, -14.1484375, -12.888427734375, -11.62841796875, -10.368408203125, -9.1083984375, -7.848388671875, -6.58837890625, -5.328369140625, -4.068359375, -2.808349609375, -1.54833984375, -0.288330078125, 0.9716796875, 2.231689453125, 3.49169921875, 4.751708984375, 6.01171875, 7.271728515625, 8.53173828125, 9.791748046875, 11.0517578125, 12.311767578125, 13.57177734375, 14.831787109375, 16.091796875, 17.351806640625, 18.61181640625, 19.871826171875, 21.1318359375, 22.391845703125, 23.65185546875, 24.911865234375, 26.171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 22.0, 37.0, 61.0, 107.0, 161.0, 194.0, 174.0, 126.0, 62.0, 29.0, 20.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-550.94921875, -540.5137329101562, -530.0782470703125, -519.6427612304688, -509.207275390625, -498.7717590332031, -488.3362731933594, -477.9007873535156, -467.4653015136719, -457.0298156738281, -446.5943298339844, -436.1588439941406, -425.72332763671875, -415.287841796875, -404.85235595703125, -394.4168701171875, -383.98138427734375, -373.5458984375, -363.11041259765625, -352.6749267578125, -342.23944091796875, -331.8039245605469, -321.3684387207031, -310.9329528808594, -300.4974670410156, -290.0619812011719, -279.6264953613281, -269.1910095214844, -258.7554931640625, -248.3200225830078, -237.884521484375, -227.44903564453125, -217.01353454589844, -206.5780487060547, -196.14254760742188, -185.70706176757812, -175.27157592773438, -164.83609008789062, -154.40060424804688, -143.96510314941406, -133.5296173095703, -123.09413146972656, -112.65863800048828, -102.22314453125, -91.78765869140625, -81.3521728515625, -70.91667938232422, -60.48118591308594, -50.04570007324219, -39.61021041870117, -29.174720764160156, -18.73923110961914, -8.303741455078125, 2.1317481994628906, 12.567237854003906, 23.002731323242188, 33.43821716308594, 43.87370681762695, 54.30919647216797, 64.74468994140625, 75.18017578125, 85.61566162109375, 96.05115509033203, 106.48664855957031, 116.92213439941406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 0.0, 6.0, 4.0, 6.0, 6.0, 7.0, 7.0, 10.0, 15.0, 15.0, 14.0, 13.0, 25.0, 22.0, 28.0, 24.0, 20.0, 32.0, 37.0, 35.0, 37.0, 40.0, 38.0, 45.0, 39.0, 31.0, 40.0, 38.0, 35.0, 30.0, 24.0, 33.0, 22.0, 22.0, 24.0, 28.0, 22.0, 20.0, 21.0, 14.0, 14.0, 8.0, 11.0, 14.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-89.22309875488281, -86.47863006591797, -83.73416137695312, -80.98970031738281, -78.24523162841797, -75.50076293945312, -72.75629425048828, -70.01182556152344, -67.26736450195312, -64.52289581298828, -61.7784309387207, -59.03396224975586, -56.28949737548828, -53.54502868652344, -50.800559997558594, -48.05609130859375, -45.311622619628906, -42.56715393066406, -39.822689056396484, -37.07822036743164, -34.33375549316406, -31.58928680419922, -28.844818115234375, -26.100351333618164, -23.355884552001953, -20.611417770385742, -17.86695098876953, -15.122482299804688, -12.378015518188477, -9.633548736572266, -6.889080047607422, -4.144613265991211, -1.400146484375, 1.3443207740783691, 4.088788032531738, 6.833255767822266, 9.577722549438477, 12.322189331054688, 15.066658020019531, 17.811124801635742, 20.555591583251953, 23.300058364868164, 26.044525146484375, 28.78899383544922, 31.53346061706543, 34.27792739868164, 37.022396087646484, 39.76686096191406, 42.511329650878906, 45.25579833984375, 48.00026321411133, 50.74473190307617, 53.48919677734375, 56.233665466308594, 58.97813415527344, 61.72260284423828, 64.46707153320312, 67.21154022216797, 69.95600891113281, 72.70046997070312, 75.44493865966797, 78.18940734863281, 80.93387603759766, 83.6783447265625, 86.42280578613281]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 19.0, 31.0, 55.0, 71.0, 105.0, 195.0, 303.0, 551.0, 1176.0, 3177.0, 11266.0, 54645.0, 317257.0, 541564.0, 92486.0, 17933.0, 4441.0, 1615.0, 671.0, 390.0, 235.0, 144.0, 78.0, 52.0, 40.0, 11.0, 19.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.0625, -115.1142578125, -111.166015625, -107.2177734375, -103.26953125, -99.3212890625, -95.373046875, -91.4248046875, -87.4765625, -83.5283203125, -79.580078125, -75.6318359375, -71.68359375, -67.7353515625, -63.787109375, -59.8388671875, -55.890625, -51.9423828125, -47.994140625, -44.0458984375, -40.09765625, -36.1494140625, -32.201171875, -28.2529296875, -24.3046875, -20.3564453125, -16.408203125, -12.4599609375, -8.51171875, -4.5634765625, -0.615234375, 3.3330078125, 7.28125, 11.2294921875, 15.177734375, 19.1259765625, 23.07421875, 27.0224609375, 30.970703125, 34.9189453125, 38.8671875, 42.8154296875, 46.763671875, 50.7119140625, 54.66015625, 58.6083984375, 62.556640625, 66.5048828125, 70.453125, 74.4013671875, 78.349609375, 82.2978515625, 86.24609375, 90.1943359375, 94.142578125, 98.0908203125, 102.0390625, 105.9873046875, 109.935546875, 113.8837890625, 117.83203125, 121.7802734375, 125.728515625, 129.6767578125, 133.625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 9.0, 9.0, 21.0, 12.0, 21.0, 32.0, 46.0, 58.0, 49.0, 86.0, 77.0, 77.0, 89.0, 63.0, 63.0, 65.0, 59.0, 54.0, 28.0, 28.0, 16.0, 7.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.125, -21.4287109375, -20.732421875, -20.0361328125, -19.33984375, -18.6435546875, -17.947265625, -17.2509765625, -16.5546875, -15.8583984375, -15.162109375, -14.4658203125, -13.76953125, -13.0732421875, -12.376953125, -11.6806640625, -10.984375, -10.2880859375, -9.591796875, -8.8955078125, -8.19921875, -7.5029296875, -6.806640625, -6.1103515625, -5.4140625, -4.7177734375, -4.021484375, -3.3251953125, -2.62890625, -1.9326171875, -1.236328125, -0.5400390625, 0.15625, 0.8525390625, 1.548828125, 2.2451171875, 2.94140625, 3.6376953125, 4.333984375, 5.0302734375, 5.7265625, 6.4228515625, 7.119140625, 7.8154296875, 8.51171875, 9.2080078125, 9.904296875, 10.6005859375, 11.296875, 11.9931640625, 12.689453125, 13.3857421875, 14.08203125, 14.7783203125, 15.474609375, 16.1708984375, 16.8671875, 17.5634765625, 18.259765625, 18.9560546875, 19.65234375, 20.3486328125, 21.044921875, 21.7412109375, 22.4375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 13.0, 9.0, 22.0, 35.0, 40.0, 54.0, 89.0, 123.0, 147.0, 214.0, 327.0, 486.0, 970.0, 2074.0, 5295.0, 16433.0, 55532.0, 208369.0, 521224.0, 168286.0, 46473.0, 13825.0, 4417.0, 1765.0, 851.0, 501.0, 285.0, 199.0, 161.0, 90.0, 58.0, 53.0, 36.0, 24.0, 16.0, 18.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.8125, -67.841796875, -65.87109375, -63.900390625, -61.9296875, -59.958984375, -57.98828125, -56.017578125, -54.046875, -52.076171875, -50.10546875, -48.134765625, -46.1640625, -44.193359375, -42.22265625, -40.251953125, -38.28125, -36.310546875, -34.33984375, -32.369140625, -30.3984375, -28.427734375, -26.45703125, -24.486328125, -22.515625, -20.544921875, -18.57421875, -16.603515625, -14.6328125, -12.662109375, -10.69140625, -8.720703125, -6.75, -4.779296875, -2.80859375, -0.837890625, 1.1328125, 3.103515625, 5.07421875, 7.044921875, 9.015625, 10.986328125, 12.95703125, 14.927734375, 16.8984375, 18.869140625, 20.83984375, 22.810546875, 24.78125, 26.751953125, 28.72265625, 30.693359375, 32.6640625, 34.634765625, 36.60546875, 38.576171875, 40.546875, 42.517578125, 44.48828125, 46.458984375, 48.4296875, 50.400390625, 52.37109375, 54.341796875, 56.3125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 5.0, 8.0, 5.0, 13.0, 8.0, 8.0, 11.0, 14.0, 16.0, 15.0, 17.0, 22.0, 23.0, 35.0, 30.0, 33.0, 28.0, 38.0, 41.0, 29.0, 33.0, 48.0, 38.0, 39.0, 40.0, 41.0, 38.0, 38.0, 41.0, 33.0, 37.0, 15.0, 20.0, 19.0, 21.0, 13.0, 18.0, 10.0, 14.0, 8.0, 6.0, 10.0, 9.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.5625, -37.10888671875, -35.6552734375, -34.20166015625, -32.748046875, -31.29443359375, -29.8408203125, -28.38720703125, -26.93359375, -25.47998046875, -24.0263671875, -22.57275390625, -21.119140625, -19.66552734375, -18.2119140625, -16.75830078125, -15.3046875, -13.85107421875, -12.3974609375, -10.94384765625, -9.490234375, -8.03662109375, -6.5830078125, -5.12939453125, -3.67578125, -2.22216796875, -0.7685546875, 0.68505859375, 2.138671875, 3.59228515625, 5.0458984375, 6.49951171875, 7.953125, 9.40673828125, 10.8603515625, 12.31396484375, 13.767578125, 15.22119140625, 16.6748046875, 18.12841796875, 19.58203125, 21.03564453125, 22.4892578125, 23.94287109375, 25.396484375, 26.85009765625, 28.3037109375, 29.75732421875, 31.2109375, 32.66455078125, 34.1181640625, 35.57177734375, 37.025390625, 38.47900390625, 39.9326171875, 41.38623046875, 42.83984375, 44.29345703125, 45.7470703125, 47.20068359375, 48.654296875, 50.10791015625, 51.5615234375, 53.01513671875, 54.46875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 12.0, 14.0, 13.0, 36.0, 54.0, 71.0, 167.0, 279.0, 553.0, 1431.0, 3544.0, 10005.0, 31385.0, 103788.0, 414413.0, 352116.0, 89093.0, 27367.0, 8739.0, 3161.0, 1164.0, 552.0, 290.0, 129.0, 76.0, 30.0, 29.0, 15.0, 12.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -21.887939453125, -21.01025390625, -20.132568359375, -19.2548828125, -18.377197265625, -17.49951171875, -16.621826171875, -15.744140625, -14.866455078125, -13.98876953125, -13.111083984375, -12.2333984375, -11.355712890625, -10.47802734375, -9.600341796875, -8.72265625, -7.844970703125, -6.96728515625, -6.089599609375, -5.2119140625, -4.334228515625, -3.45654296875, -2.578857421875, -1.701171875, -0.823486328125, 0.05419921875, 0.931884765625, 1.8095703125, 2.687255859375, 3.56494140625, 4.442626953125, 5.3203125, 6.197998046875, 7.07568359375, 7.953369140625, 8.8310546875, 9.708740234375, 10.58642578125, 11.464111328125, 12.341796875, 13.219482421875, 14.09716796875, 14.974853515625, 15.8525390625, 16.730224609375, 17.60791015625, 18.485595703125, 19.36328125, 20.240966796875, 21.11865234375, 21.996337890625, 22.8740234375, 23.751708984375, 24.62939453125, 25.507080078125, 26.384765625, 27.262451171875, 28.14013671875, 29.017822265625, 29.8955078125, 30.773193359375, 31.65087890625, 32.528564453125, 33.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 13.0, 21.0, 23.0, 21.0, 34.0, 42.0, 62.0, 104.0, 183.0, 136.0, 86.0, 69.0, 31.0, 42.0, 30.0, 22.0, 14.0, 14.0, 6.0, 8.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00711822509765625, -0.006952166557312012, -0.0067861080169677734, -0.006620049476623535, -0.006453990936279297, -0.006287932395935059, -0.00612187385559082, -0.005955815315246582, -0.005789756774902344, -0.0056236982345581055, -0.005457639694213867, -0.005291581153869629, -0.005125522613525391, -0.004959464073181152, -0.004793405532836914, -0.004627346992492676, -0.0044612884521484375, -0.004295229911804199, -0.004129171371459961, -0.003963112831115723, -0.0037970542907714844, -0.003630995750427246, -0.003464937210083008, -0.0032988786697387695, -0.0031328201293945312, -0.002966761589050293, -0.0028007030487060547, -0.0026346445083618164, -0.002468585968017578, -0.00230252742767334, -0.0021364688873291016, -0.0019704103469848633, -0.001804351806640625, -0.0016382932662963867, -0.0014722347259521484, -0.0013061761856079102, -0.0011401176452636719, -0.0009740591049194336, -0.0008080005645751953, -0.000641942024230957, -0.00047588348388671875, -0.00030982494354248047, -0.0001437664031982422, 2.2292137145996094e-05, 0.00018835067749023438, 0.00035440921783447266, 0.0005204677581787109, 0.0006865262985229492, 0.0008525848388671875, 0.0010186433792114258, 0.001184701919555664, 0.0013507604598999023, 0.0015168190002441406, 0.001682877540588379, 0.0018489360809326172, 0.0020149946212768555, 0.0021810531616210938, 0.002347111701965332, 0.0025131702423095703, 0.0026792287826538086, 0.002845287322998047, 0.003011345863342285, 0.0031774044036865234, 0.0033434629440307617, 0.003509521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 18.0, 19.0, 26.0, 32.0, 48.0, 81.0, 112.0, 145.0, 264.0, 425.0, 806.0, 1679.0, 4152.0, 11972.0, 44153.0, 195948.0, 538912.0, 188145.0, 42307.0, 11777.0, 4041.0, 1641.0, 766.0, 400.0, 228.0, 139.0, 77.0, 67.0, 57.0, 26.0, 27.0, 17.0, 12.0, 6.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.2568359375, -31.232421875, -30.2080078125, -29.18359375, -28.1591796875, -27.134765625, -26.1103515625, -25.0859375, -24.0615234375, -23.037109375, -22.0126953125, -20.98828125, -19.9638671875, -18.939453125, -17.9150390625, -16.890625, -15.8662109375, -14.841796875, -13.8173828125, -12.79296875, -11.7685546875, -10.744140625, -9.7197265625, -8.6953125, -7.6708984375, -6.646484375, -5.6220703125, -4.59765625, -3.5732421875, -2.548828125, -1.5244140625, -0.5, 0.5244140625, 1.548828125, 2.5732421875, 3.59765625, 4.6220703125, 5.646484375, 6.6708984375, 7.6953125, 8.7197265625, 9.744140625, 10.7685546875, 11.79296875, 12.8173828125, 13.841796875, 14.8662109375, 15.890625, 16.9150390625, 17.939453125, 18.9638671875, 19.98828125, 21.0126953125, 22.037109375, 23.0615234375, 24.0859375, 25.1103515625, 26.134765625, 27.1591796875, 28.18359375, 29.2080078125, 30.232421875, 31.2568359375, 32.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 2.0, 11.0, 4.0, 5.0, 10.0, 10.0, 6.0, 19.0, 7.0, 16.0, 22.0, 37.0, 31.0, 38.0, 40.0, 61.0, 69.0, 69.0, 64.0, 63.0, 50.0, 57.0, 47.0, 51.0, 42.0, 37.0, 24.0, 20.0, 19.0, 14.0, 10.0, 8.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.390625, -19.777099609375, -19.16357421875, -18.550048828125, -17.9365234375, -17.322998046875, -16.70947265625, -16.095947265625, -15.482421875, -14.868896484375, -14.25537109375, -13.641845703125, -13.0283203125, -12.414794921875, -11.80126953125, -11.187744140625, -10.57421875, -9.960693359375, -9.34716796875, -8.733642578125, -8.1201171875, -7.506591796875, -6.89306640625, -6.279541015625, -5.666015625, -5.052490234375, -4.43896484375, -3.825439453125, -3.2119140625, -2.598388671875, -1.98486328125, -1.371337890625, -0.7578125, -0.144287109375, 0.46923828125, 1.082763671875, 1.6962890625, 2.309814453125, 2.92333984375, 3.536865234375, 4.150390625, 4.763916015625, 5.37744140625, 5.990966796875, 6.6044921875, 7.218017578125, 7.83154296875, 8.445068359375, 9.05859375, 9.672119140625, 10.28564453125, 10.899169921875, 11.5126953125, 12.126220703125, 12.73974609375, 13.353271484375, 13.966796875, 14.580322265625, 15.19384765625, 15.807373046875, 16.4208984375, 17.034423828125, 17.64794921875, 18.261474609375, 18.875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 7.0, 34.0, 149.0, 324.0, 317.0, 139.0, 31.0, 10.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.1203308105469, -269.69305419921875, -225.26580810546875, -180.8385467529297, -136.41128540039062, -91.98402404785156, -47.5567626953125, -3.129486083984375, 41.297760009765625, 85.72502136230469, 130.15228271484375, 174.5795440673828, 219.00680541992188, 263.43408203125, 307.861328125, 352.2886047363281, 396.7158508300781, 441.14312744140625, 485.57037353515625, 529.9976196289062, 574.4249267578125, 618.8521728515625, 663.2794189453125, 707.7066650390625, 752.1339111328125, 796.5611572265625, 840.9884033203125, 885.4157104492188, 929.8429565429688, 974.2702026367188, 1018.697509765625, 1063.124755859375, 1107.552001953125, 1151.979248046875, 1196.406494140625, 1240.833740234375, 1285.260986328125, 1329.6883544921875, 1374.1156005859375, 1418.5428466796875, 1462.9700927734375, 1507.3973388671875, 1551.8245849609375, 1596.2518310546875, 1640.67919921875, 1685.1064453125, 1729.53369140625, 1773.9609375, 1818.38818359375, 1862.8154296875, 1907.24267578125, 1951.669921875, 1996.09716796875, 2040.5245361328125, 2084.95166015625, 2129.37890625, 2173.80615234375, 2218.2333984375, 2262.66064453125, 2307.087890625, 2351.51513671875, 2395.9423828125, 2440.36962890625, 2484.796875, 2529.224365234375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 12.0, 10.0, 9.0, 10.0, 14.0, 11.0, 22.0, 14.0, 22.0, 29.0, 32.0, 22.0, 39.0, 40.0, 39.0, 34.0, 34.0, 43.0, 44.0, 40.0, 40.0, 35.0, 41.0, 28.0, 35.0, 40.0, 24.0, 37.0, 17.0, 26.0, 17.0, 24.0, 12.0, 17.0, 11.0, 10.0, 9.0, 6.0, 8.0, 7.0, 9.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-268.91546630859375, -261.24969482421875, -253.58389282226562, -245.91812133789062, -238.25233459472656, -230.5865478515625, -222.9207763671875, -215.25498962402344, -207.58920288085938, -199.9234161376953, -192.25762939453125, -184.59185791015625, -176.9260711669922, -169.26028442382812, -161.59451293945312, -153.92872619628906, -146.262939453125, -138.59715270996094, -130.93136596679688, -123.26559448242188, -115.59980773925781, -107.93402099609375, -100.26824188232422, -92.60246276855469, -84.93667602539062, -77.27088928222656, -69.60511016845703, -61.939327239990234, -54.27354431152344, -46.60776138305664, -38.941978454589844, -31.276195526123047, -23.610397338867188, -15.94461441040039, -8.278831481933594, -0.6130485534667969, 7.052734375, 14.718517303466797, 22.384300231933594, 30.05008316040039, 37.71586608886719, 45.381649017333984, 53.04743194580078, 60.71321487426758, 68.37899780273438, 76.04478454589844, 83.71056365966797, 91.3763427734375, 99.04212951660156, 106.70791625976562, 114.37369537353516, 122.03947448730469, 129.70526123046875, 137.3710479736328, 145.03683471679688, 152.70260620117188, 160.36839294433594, 168.0341796875, 175.699951171875, 183.36573791503906, 191.03152465820312, 198.6973114013672, 206.36309814453125, 214.02886962890625, 221.6946563720703]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 6.0, 23.0, 42.0, 44.0, 57.0, 108.0, 172.0, 286.0, 498.0, 885.0, 1770.0, 4170.0, 12197.0, 50039.0, 403614.0, 3489321.0, 186247.0, 30339.0, 8207.0, 3036.0, 1296.0, 721.0, 402.0, 265.0, 155.0, 92.0, 70.0, 59.0, 38.0, 31.0, 16.0, 6.0, 12.0, 10.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.875, -137.19921875, -132.5234375, -127.84765625, -123.171875, -118.49609375, -113.8203125, -109.14453125, -104.46875, -99.79296875, -95.1171875, -90.44140625, -85.765625, -81.08984375, -76.4140625, -71.73828125, -67.0625, -62.38671875, -57.7109375, -53.03515625, -48.359375, -43.68359375, -39.0078125, -34.33203125, -29.65625, -24.98046875, -20.3046875, -15.62890625, -10.953125, -6.27734375, -1.6015625, 3.07421875, 7.75, 12.42578125, 17.1015625, 21.77734375, 26.453125, 31.12890625, 35.8046875, 40.48046875, 45.15625, 49.83203125, 54.5078125, 59.18359375, 63.859375, 68.53515625, 73.2109375, 77.88671875, 82.5625, 87.23828125, 91.9140625, 96.58984375, 101.265625, 105.94140625, 110.6171875, 115.29296875, 119.96875, 124.64453125, 129.3203125, 133.99609375, 138.671875, 143.34765625, 148.0234375, 152.69921875, 157.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 16.0, 20.0, 20.0, 26.0, 43.0, 42.0, 56.0, 88.0, 55.0, 80.0, 82.0, 71.0, 74.0, 70.0, 60.0, 51.0, 39.0, 33.0, 16.0, 18.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.640625, -20.948974609375, -20.25732421875, -19.565673828125, -18.8740234375, -18.182373046875, -17.49072265625, -16.799072265625, -16.107421875, -15.415771484375, -14.72412109375, -14.032470703125, -13.3408203125, -12.649169921875, -11.95751953125, -11.265869140625, -10.57421875, -9.882568359375, -9.19091796875, -8.499267578125, -7.8076171875, -7.115966796875, -6.42431640625, -5.732666015625, -5.041015625, -4.349365234375, -3.65771484375, -2.966064453125, -2.2744140625, -1.582763671875, -0.89111328125, -0.199462890625, 0.4921875, 1.183837890625, 1.87548828125, 2.567138671875, 3.2587890625, 3.950439453125, 4.64208984375, 5.333740234375, 6.025390625, 6.717041015625, 7.40869140625, 8.100341796875, 8.7919921875, 9.483642578125, 10.17529296875, 10.866943359375, 11.55859375, 12.250244140625, 12.94189453125, 13.633544921875, 14.3251953125, 15.016845703125, 15.70849609375, 16.400146484375, 17.091796875, 17.783447265625, 18.47509765625, 19.166748046875, 19.8583984375, 20.550048828125, 21.24169921875, 21.933349609375, 22.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 12.0, 12.0, 30.0, 29.0, 35.0, 51.0, 75.0, 98.0, 154.0, 210.0, 353.0, 583.0, 1387.0, 4442.0, 21850.0, 157064.0, 3244146.0, 686403.0, 62185.0, 10351.0, 2526.0, 946.0, 485.0, 268.0, 161.0, 124.0, 76.0, 69.0, 35.0, 29.0, 16.0, 15.0, 18.0, 9.0, 9.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-139.625, -135.6103515625, -131.595703125, -127.5810546875, -123.56640625, -119.5517578125, -115.537109375, -111.5224609375, -107.5078125, -103.4931640625, -99.478515625, -95.4638671875, -91.44921875, -87.4345703125, -83.419921875, -79.4052734375, -75.390625, -71.3759765625, -67.361328125, -63.3466796875, -59.33203125, -55.3173828125, -51.302734375, -47.2880859375, -43.2734375, -39.2587890625, -35.244140625, -31.2294921875, -27.21484375, -23.2001953125, -19.185546875, -15.1708984375, -11.15625, -7.1416015625, -3.126953125, 0.8876953125, 4.90234375, 8.9169921875, 12.931640625, 16.9462890625, 20.9609375, 24.9755859375, 28.990234375, 33.0048828125, 37.01953125, 41.0341796875, 45.048828125, 49.0634765625, 53.078125, 57.0927734375, 61.107421875, 65.1220703125, 69.13671875, 73.1513671875, 77.166015625, 81.1806640625, 85.1953125, 89.2099609375, 93.224609375, 97.2392578125, 101.25390625, 105.2685546875, 109.283203125, 113.2978515625, 117.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 17.0, 30.0, 59.0, 142.0, 333.0, 1158.0, 1628.0, 394.0, 158.0, 69.0, 44.0, 27.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.7470703125, -65.244140625, -62.7412109375, -60.23828125, -57.7353515625, -55.232421875, -52.7294921875, -50.2265625, -47.7236328125, -45.220703125, -42.7177734375, -40.21484375, -37.7119140625, -35.208984375, -32.7060546875, -30.203125, -27.7001953125, -25.197265625, -22.6943359375, -20.19140625, -17.6884765625, -15.185546875, -12.6826171875, -10.1796875, -7.6767578125, -5.173828125, -2.6708984375, -0.16796875, 2.3349609375, 4.837890625, 7.3408203125, 9.84375, 12.3466796875, 14.849609375, 17.3525390625, 19.85546875, 22.3583984375, 24.861328125, 27.3642578125, 29.8671875, 32.3701171875, 34.873046875, 37.3759765625, 39.87890625, 42.3818359375, 44.884765625, 47.3876953125, 49.890625, 52.3935546875, 54.896484375, 57.3994140625, 59.90234375, 62.4052734375, 64.908203125, 67.4111328125, 69.9140625, 72.4169921875, 74.919921875, 77.4228515625, 79.92578125, 82.4287109375, 84.931640625, 87.4345703125, 89.9375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 7.0, 8.0, 20.0, 24.0, 34.0, 41.0, 53.0, 70.0, 79.0, 87.0, 107.0, 82.0, 71.0, 79.0, 55.0, 56.0, 36.0, 22.0, 13.0, 15.0, 9.0, 4.0, 9.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-211.2149200439453, -203.9550018310547, -196.69508361816406, -189.43516540527344, -182.1752471923828, -174.9153289794922, -167.65541076660156, -160.39549255371094, -153.1355743408203, -145.8756561279297, -138.61573791503906, -131.35581970214844, -124.09590148925781, -116.83598327636719, -109.57606506347656, -102.31614685058594, -95.05622863769531, -87.79631042480469, -80.53639221191406, -73.27647399902344, -66.01655578613281, -58.75663757324219, -51.49671936035156, -44.23680114746094, -36.97688293457031, -29.716964721679688, -22.457046508789062, -15.197128295898438, -7.9372100830078125, -0.6772918701171875, 6.5826263427734375, 13.842544555664062, 21.10247802734375, 28.362396240234375, 35.622314453125, 42.882232666015625, 50.14215087890625, 57.402069091796875, 64.6619873046875, 71.92190551757812, 79.18182373046875, 86.44174194335938, 93.70166015625, 100.96157836914062, 108.22149658203125, 115.48141479492188, 122.7413330078125, 130.00125122070312, 137.26116943359375, 144.52108764648438, 151.781005859375, 159.04092407226562, 166.30084228515625, 173.56076049804688, 180.8206787109375, 188.08059692382812, 195.34051513671875, 202.60043334960938, 209.8603515625, 217.12026977539062, 224.38018798828125, 231.64010620117188, 238.9000244140625, 246.15994262695312, 253.41986083984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 9.0, 10.0, 11.0, 21.0, 19.0, 21.0, 27.0, 28.0, 28.0, 32.0, 47.0, 37.0, 52.0, 60.0, 38.0, 38.0, 59.0, 43.0, 36.0, 49.0, 46.0, 42.0, 45.0, 26.0, 32.0, 16.0, 28.0, 25.0, 22.0, 13.0, 8.0, 13.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-126.20563507080078, -121.4463882446289, -116.68714141845703, -111.92789459228516, -107.16864776611328, -102.4094009399414, -97.65015411376953, -92.89090728759766, -88.13166046142578, -83.3724136352539, -78.61316680908203, -73.85391998291016, -69.09467315673828, -64.3354263305664, -59.57617950439453, -54.816932678222656, -50.05768585205078, -45.298439025878906, -40.53919219970703, -35.779945373535156, -31.02069854736328, -26.261451721191406, -21.50220489501953, -16.742958068847656, -11.983711242675781, -7.224464416503906, -2.4652175903320312, 2.2940292358398438, 7.053276062011719, 11.812522888183594, 16.57176971435547, 21.331016540527344, 26.090255737304688, 30.849502563476562, 35.60874938964844, 40.36799621582031, 45.12724304199219, 49.88648986816406, 54.64573669433594, 59.40498352050781, 64.16423034667969, 68.92347717285156, 73.68272399902344, 78.44197082519531, 83.20121765136719, 87.96046447753906, 92.71971130371094, 97.47895812988281, 102.23820495605469, 106.99745178222656, 111.75669860839844, 116.51594543457031, 121.27519226074219, 126.03443908691406, 130.79368591308594, 135.5529327392578, 140.3121795654297, 145.07142639160156, 149.83067321777344, 154.5899200439453, 159.3491668701172, 164.10841369628906, 168.86766052246094, 173.6269073486328, 178.3861541748047]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 9.0, 9.0, 10.0, 26.0, 18.0, 31.0, 66.0, 98.0, 177.0, 341.0, 613.0, 1445.0, 3971.0, 16158.0, 98447.0, 581589.0, 293256.0, 39792.0, 8039.0, 2416.0, 979.0, 489.0, 250.0, 139.0, 58.0, 31.0, 35.0, 21.0, 13.0, 14.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-113.125, -109.05078125, -104.9765625, -100.90234375, -96.828125, -92.75390625, -88.6796875, -84.60546875, -80.53125, -76.45703125, -72.3828125, -68.30859375, -64.234375, -60.16015625, -56.0859375, -52.01171875, -47.9375, -43.86328125, -39.7890625, -35.71484375, -31.640625, -27.56640625, -23.4921875, -19.41796875, -15.34375, -11.26953125, -7.1953125, -3.12109375, 0.953125, 5.02734375, 9.1015625, 13.17578125, 17.25, 21.32421875, 25.3984375, 29.47265625, 33.546875, 37.62109375, 41.6953125, 45.76953125, 49.84375, 53.91796875, 57.9921875, 62.06640625, 66.140625, 70.21484375, 74.2890625, 78.36328125, 82.4375, 86.51171875, 90.5859375, 94.66015625, 98.734375, 102.80859375, 106.8828125, 110.95703125, 115.03125, 119.10546875, 123.1796875, 127.25390625, 131.328125, 135.40234375, 139.4765625, 143.55078125, 147.625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 24.0, 10.0, 28.0, 39.0, 51.0, 58.0, 76.0, 67.0, 77.0, 73.0, 75.0, 89.0, 70.0, 56.0, 44.0, 40.0, 40.0, 23.0, 7.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.65625, -20.92138671875, -20.1865234375, -19.45166015625, -18.716796875, -17.98193359375, -17.2470703125, -16.51220703125, -15.77734375, -15.04248046875, -14.3076171875, -13.57275390625, -12.837890625, -12.10302734375, -11.3681640625, -10.63330078125, -9.8984375, -9.16357421875, -8.4287109375, -7.69384765625, -6.958984375, -6.22412109375, -5.4892578125, -4.75439453125, -4.01953125, -3.28466796875, -2.5498046875, -1.81494140625, -1.080078125, -0.34521484375, 0.3896484375, 1.12451171875, 1.859375, 2.59423828125, 3.3291015625, 4.06396484375, 4.798828125, 5.53369140625, 6.2685546875, 7.00341796875, 7.73828125, 8.47314453125, 9.2080078125, 9.94287109375, 10.677734375, 11.41259765625, 12.1474609375, 12.88232421875, 13.6171875, 14.35205078125, 15.0869140625, 15.82177734375, 16.556640625, 17.29150390625, 18.0263671875, 18.76123046875, 19.49609375, 20.23095703125, 20.9658203125, 21.70068359375, 22.435546875, 23.17041015625, 23.9052734375, 24.64013671875, 25.375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 8.0, 8.0, 15.0, 20.0, 36.0, 44.0, 63.0, 92.0, 112.0, 179.0, 235.0, 319.0, 521.0, 898.0, 1672.0, 3566.0, 8933.0, 25334.0, 83466.0, 328810.0, 426043.0, 114575.0, 33360.0, 11262.0, 4282.0, 1934.0, 992.0, 545.0, 374.0, 222.0, 179.0, 122.0, 88.0, 58.0, 64.0, 35.0, 26.0, 13.0, 11.0, 4.0, 8.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.0625, -60.001953125, -57.94140625, -55.880859375, -53.8203125, -51.759765625, -49.69921875, -47.638671875, -45.578125, -43.517578125, -41.45703125, -39.396484375, -37.3359375, -35.275390625, -33.21484375, -31.154296875, -29.09375, -27.033203125, -24.97265625, -22.912109375, -20.8515625, -18.791015625, -16.73046875, -14.669921875, -12.609375, -10.548828125, -8.48828125, -6.427734375, -4.3671875, -2.306640625, -0.24609375, 1.814453125, 3.875, 5.935546875, 7.99609375, 10.056640625, 12.1171875, 14.177734375, 16.23828125, 18.298828125, 20.359375, 22.419921875, 24.48046875, 26.541015625, 28.6015625, 30.662109375, 32.72265625, 34.783203125, 36.84375, 38.904296875, 40.96484375, 43.025390625, 45.0859375, 47.146484375, 49.20703125, 51.267578125, 53.328125, 55.388671875, 57.44921875, 59.509765625, 61.5703125, 63.630859375, 65.69140625, 67.751953125, 69.8125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 6.0, 8.0, 11.0, 13.0, 18.0, 22.0, 19.0, 33.0, 21.0, 35.0, 40.0, 37.0, 36.0, 49.0, 52.0, 50.0, 59.0, 60.0, 59.0, 44.0, 42.0, 40.0, 41.0, 35.0, 28.0, 24.0, 11.0, 25.0, 22.0, 11.0, 7.0, 8.0, 9.0, 5.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.8125, -66.6806640625, -64.548828125, -62.4169921875, -60.28515625, -58.1533203125, -56.021484375, -53.8896484375, -51.7578125, -49.6259765625, -47.494140625, -45.3623046875, -43.23046875, -41.0986328125, -38.966796875, -36.8349609375, -34.703125, -32.5712890625, -30.439453125, -28.3076171875, -26.17578125, -24.0439453125, -21.912109375, -19.7802734375, -17.6484375, -15.5166015625, -13.384765625, -11.2529296875, -9.12109375, -6.9892578125, -4.857421875, -2.7255859375, -0.59375, 1.5380859375, 3.669921875, 5.8017578125, 7.93359375, 10.0654296875, 12.197265625, 14.3291015625, 16.4609375, 18.5927734375, 20.724609375, 22.8564453125, 24.98828125, 27.1201171875, 29.251953125, 31.3837890625, 33.515625, 35.6474609375, 37.779296875, 39.9111328125, 42.04296875, 44.1748046875, 46.306640625, 48.4384765625, 50.5703125, 52.7021484375, 54.833984375, 56.9658203125, 59.09765625, 61.2294921875, 63.361328125, 65.4931640625, 67.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 17.0, 25.0, 34.0, 50.0, 104.0, 174.0, 349.0, 742.0, 2026.0, 8144.0, 43827.0, 261641.0, 546005.0, 152831.0, 24955.0, 4902.0, 1434.0, 561.0, 294.0, 169.0, 98.0, 51.0, 37.0, 18.0, 13.0, 13.0, 9.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.609375, -30.600830078125, -29.59228515625, -28.583740234375, -27.5751953125, -26.566650390625, -25.55810546875, -24.549560546875, -23.541015625, -22.532470703125, -21.52392578125, -20.515380859375, -19.5068359375, -18.498291015625, -17.48974609375, -16.481201171875, -15.47265625, -14.464111328125, -13.45556640625, -12.447021484375, -11.4384765625, -10.429931640625, -9.42138671875, -8.412841796875, -7.404296875, -6.395751953125, -5.38720703125, -4.378662109375, -3.3701171875, -2.361572265625, -1.35302734375, -0.344482421875, 0.6640625, 1.672607421875, 2.68115234375, 3.689697265625, 4.6982421875, 5.706787109375, 6.71533203125, 7.723876953125, 8.732421875, 9.740966796875, 10.74951171875, 11.758056640625, 12.7666015625, 13.775146484375, 14.78369140625, 15.792236328125, 16.80078125, 17.809326171875, 18.81787109375, 19.826416015625, 20.8349609375, 21.843505859375, 22.85205078125, 23.860595703125, 24.869140625, 25.877685546875, 26.88623046875, 27.894775390625, 28.9033203125, 29.911865234375, 30.92041015625, 31.928955078125, 32.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 17.0, 11.0, 19.0, 23.0, 35.0, 41.0, 65.0, 87.0, 97.0, 93.0, 111.0, 88.0, 52.0, 54.0, 45.0, 36.0, 28.0, 21.0, 19.0, 6.0, 10.0, 12.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.0048789381980896, -0.004733920097351074, -0.004588901996612549, -0.0044438838958740234, -0.004298865795135498, -0.004153847694396973, -0.004008829593658447, -0.003863811492919922, -0.0037187933921813965, -0.003573775291442871, -0.0034287571907043457, -0.0032837390899658203, -0.003138720989227295, -0.0029937028884887695, -0.002848684787750244, -0.0027036666870117188, -0.0025586485862731934, -0.002413630485534668, -0.0022686123847961426, -0.002123594284057617, -0.001978576183319092, -0.0018335580825805664, -0.001688539981842041, -0.0015435218811035156, -0.0013985037803649902, -0.0012534856796264648, -0.0011084675788879395, -0.0009634494781494141, -0.0008184313774108887, -0.0006734132766723633, -0.0005283951759338379, -0.0003833770751953125, -0.0002383589744567871, -9.334087371826172e-05, 5.167722702026367e-05, 0.00019669532775878906, 0.00034171342849731445, 0.00048673152923583984, 0.0006317496299743652, 0.0007767677307128906, 0.000921785831451416, 0.0010668039321899414, 0.0012118220329284668, 0.0013568401336669922, 0.0015018582344055176, 0.001646876335144043, 0.0017918944358825684, 0.0019369125366210938, 0.002081930637359619, 0.0022269487380981445, 0.00237196683883667, 0.0025169849395751953, 0.0026620030403137207, 0.002807021141052246, 0.0029520392417907715, 0.003097057342529297, 0.0032420754432678223, 0.0033870935440063477, 0.003532111644744873, 0.0036771297454833984, 0.003822147846221924, 0.003967165946960449, 0.004112184047698975, 0.0042572021484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 14.0, 16.0, 33.0, 54.0, 92.0, 173.0, 249.0, 501.0, 982.0, 2387.0, 7658.0, 36065.0, 194647.0, 529780.0, 221065.0, 41417.0, 8537.0, 2658.0, 1001.0, 493.0, 287.0, 147.0, 104.0, 54.0, 32.0, 31.0, 18.0, 11.0, 12.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -33.168212890625, -32.14892578125, -31.129638671875, -30.1103515625, -29.091064453125, -28.07177734375, -27.052490234375, -26.033203125, -25.013916015625, -23.99462890625, -22.975341796875, -21.9560546875, -20.936767578125, -19.91748046875, -18.898193359375, -17.87890625, -16.859619140625, -15.84033203125, -14.821044921875, -13.8017578125, -12.782470703125, -11.76318359375, -10.743896484375, -9.724609375, -8.705322265625, -7.68603515625, -6.666748046875, -5.6474609375, -4.628173828125, -3.60888671875, -2.589599609375, -1.5703125, -0.551025390625, 0.46826171875, 1.487548828125, 2.5068359375, 3.526123046875, 4.54541015625, 5.564697265625, 6.583984375, 7.603271484375, 8.62255859375, 9.641845703125, 10.6611328125, 11.680419921875, 12.69970703125, 13.718994140625, 14.73828125, 15.757568359375, 16.77685546875, 17.796142578125, 18.8154296875, 19.834716796875, 20.85400390625, 21.873291015625, 22.892578125, 23.911865234375, 24.93115234375, 25.950439453125, 26.9697265625, 27.989013671875, 29.00830078125, 30.027587890625, 31.046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 10.0, 10.0, 9.0, 11.0, 25.0, 28.0, 38.0, 35.0, 62.0, 70.0, 79.0, 91.0, 95.0, 82.0, 64.0, 73.0, 51.0, 40.0, 26.0, 28.0, 18.0, 17.0, 13.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.71875, -26.935791015625, -26.15283203125, -25.369873046875, -24.5869140625, -23.803955078125, -23.02099609375, -22.238037109375, -21.455078125, -20.672119140625, -19.88916015625, -19.106201171875, -18.3232421875, -17.540283203125, -16.75732421875, -15.974365234375, -15.19140625, -14.408447265625, -13.62548828125, -12.842529296875, -12.0595703125, -11.276611328125, -10.49365234375, -9.710693359375, -8.927734375, -8.144775390625, -7.36181640625, -6.578857421875, -5.7958984375, -5.012939453125, -4.22998046875, -3.447021484375, -2.6640625, -1.881103515625, -1.09814453125, -0.315185546875, 0.4677734375, 1.250732421875, 2.03369140625, 2.816650390625, 3.599609375, 4.382568359375, 5.16552734375, 5.948486328125, 6.7314453125, 7.514404296875, 8.29736328125, 9.080322265625, 9.86328125, 10.646240234375, 11.42919921875, 12.212158203125, 12.9951171875, 13.778076171875, 14.56103515625, 15.343994140625, 16.126953125, 16.909912109375, 17.69287109375, 18.475830078125, 19.2587890625, 20.041748046875, 20.82470703125, 21.607666015625, 22.390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 13.0, 6.0, 21.0, 45.0, 78.0, 89.0, 132.0, 145.0, 124.0, 121.0, 70.0, 62.0, 42.0, 23.0, 10.0, 8.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-862.804931640625, -845.1047973632812, -827.4046630859375, -809.7045288085938, -792.00439453125, -774.3042602539062, -756.6041259765625, -738.904052734375, -721.203857421875, -703.5037231445312, -685.8035888671875, -668.1034545898438, -650.4033203125, -632.7031860351562, -615.0030517578125, -597.302978515625, -579.6028442382812, -561.9027099609375, -544.2025756835938, -526.50244140625, -508.80230712890625, -491.1021728515625, -473.4020690917969, -455.7019348144531, -438.0018005371094, -420.3016662597656, -402.6015319824219, -384.9013977050781, -367.2012939453125, -349.50115966796875, -331.801025390625, -314.10089111328125, -296.40069580078125, -278.7005615234375, -261.00042724609375, -243.30030822753906, -225.6001739501953, -207.90003967285156, -190.19992065429688, -172.49978637695312, -154.79965209960938, -137.09951782226562, -119.3993911743164, -101.69926452636719, -83.99913024902344, -66.29899597167969, -48.59886932373047, -30.89874267578125, -13.1986083984375, 4.501522064208984, 22.20165252685547, 39.90178298950195, 57.60191345214844, 75.30204772949219, 93.0021743774414, 110.70230102539062, 128.40243530273438, 146.10256958007812, 163.80270385742188, 181.50282287597656, 199.2029571533203, 216.90309143066406, 234.60321044921875, 252.3033447265625, 270.00347900390625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 12.0, 19.0, 17.0, 20.0, 27.0, 31.0, 37.0, 44.0, 36.0, 56.0, 55.0, 55.0, 67.0, 52.0, 52.0, 50.0, 56.0, 56.0, 53.0, 37.0, 34.0, 26.0, 22.0, 15.0, 17.0, 9.0, 6.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.99365234375, -448.9089660644531, -436.82427978515625, -424.7395935058594, -412.6549072265625, -400.5702209472656, -388.48553466796875, -376.40081787109375, -364.316162109375, -352.2314758300781, -340.14678955078125, -328.0621032714844, -315.9774169921875, -303.8927307128906, -291.80804443359375, -279.72332763671875, -267.6386413574219, -255.553955078125, -243.46926879882812, -231.38458251953125, -219.29989624023438, -207.2152099609375, -195.13050842285156, -183.0458221435547, -170.9611358642578, -158.87644958496094, -146.79176330566406, -134.70706176757812, -122.62238311767578, -110.5376968383789, -98.4530029296875, -86.36831665039062, -74.28363037109375, -62.198944091796875, -50.114253997802734, -38.029563903808594, -25.94487762451172, -13.860191345214844, -1.7754974365234375, 10.309188842773438, 22.393875122070312, 34.47856140136719, 46.56325149536133, 58.64794158935547, 70.73262786865234, 82.81731414794922, 94.90200805664062, 106.9866943359375, 119.07138061523438, 131.15606689453125, 143.24075317382812, 155.325439453125, 167.41012573242188, 179.49481201171875, 191.5795135498047, 203.66419982910156, 215.74888610839844, 227.8335723876953, 239.9182586669922, 252.00296020507812, 264.087646484375, 276.1723327636719, 288.25701904296875, 300.3417053222656, 312.4263916015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 9.0, 19.0, 20.0, 35.0, 42.0, 94.0, 152.0, 220.0, 453.0, 952.0, 2554.0, 8702.0, 58596.0, 4066785.0, 44032.0, 7387.0, 2336.0, 917.0, 407.0, 189.0, 135.0, 87.0, 43.0, 21.0, 24.0, 14.0, 15.0, 5.0, 5.0, 3.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.75, -213.5, -206.25, -199.0, -191.75, -184.5, -177.25, -170.0, -162.75, -155.5, -148.25, -141.0, -133.75, -126.5, -119.25, -112.0, -104.75, -97.5, -90.25, -83.0, -75.75, -68.5, -61.25, -54.0, -46.75, -39.5, -32.25, -25.0, -17.75, -10.5, -3.25, 4.0, 11.25, 18.5, 25.75, 33.0, 40.25, 47.5, 54.75, 62.0, 69.25, 76.5, 83.75, 91.0, 98.25, 105.5, 112.75, 120.0, 127.25, 134.5, 141.75, 149.0, 156.25, 163.5, 170.75, 178.0, 185.25, 192.5, 199.75, 207.0, 214.25, 221.5, 228.75, 236.0, 243.25]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 10.0, 6.0, 7.0, 10.0, 31.0, 20.0, 29.0, 42.0, 36.0, 54.0, 69.0, 63.0, 72.0, 60.0, 61.0, 77.0, 54.0, 58.0, 40.0, 42.0, 32.0, 31.0, 16.0, 17.0, 20.0, 8.0, 12.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.359375, -19.64990234375, -18.9404296875, -18.23095703125, -17.521484375, -16.81201171875, -16.1025390625, -15.39306640625, -14.68359375, -13.97412109375, -13.2646484375, -12.55517578125, -11.845703125, -11.13623046875, -10.4267578125, -9.71728515625, -9.0078125, -8.29833984375, -7.5888671875, -6.87939453125, -6.169921875, -5.46044921875, -4.7509765625, -4.04150390625, -3.33203125, -2.62255859375, -1.9130859375, -1.20361328125, -0.494140625, 0.21533203125, 0.9248046875, 1.63427734375, 2.34375, 3.05322265625, 3.7626953125, 4.47216796875, 5.181640625, 5.89111328125, 6.6005859375, 7.31005859375, 8.01953125, 8.72900390625, 9.4384765625, 10.14794921875, 10.857421875, 11.56689453125, 12.2763671875, 12.98583984375, 13.6953125, 14.40478515625, 15.1142578125, 15.82373046875, 16.533203125, 17.24267578125, 17.9521484375, 18.66162109375, 19.37109375, 20.08056640625, 20.7900390625, 21.49951171875, 22.208984375, 22.91845703125, 23.6279296875, 24.33740234375, 25.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 8.0, 18.0, 27.0, 50.0, 103.0, 215.0, 519.0, 1113.0, 2900.0, 8706.0, 43873.0, 3901007.0, 207708.0, 19636.0, 5155.0, 1818.0, 781.0, 321.0, 145.0, 75.0, 38.0, 20.0, 15.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.375, -158.0771484375, -153.779296875, -149.4814453125, -145.18359375, -140.8857421875, -136.587890625, -132.2900390625, -127.9921875, -123.6943359375, -119.396484375, -115.0986328125, -110.80078125, -106.5029296875, -102.205078125, -97.9072265625, -93.609375, -89.3115234375, -85.013671875, -80.7158203125, -76.41796875, -72.1201171875, -67.822265625, -63.5244140625, -59.2265625, -54.9287109375, -50.630859375, -46.3330078125, -42.03515625, -37.7373046875, -33.439453125, -29.1416015625, -24.84375, -20.5458984375, -16.248046875, -11.9501953125, -7.65234375, -3.3544921875, 0.943359375, 5.2412109375, 9.5390625, 13.8369140625, 18.134765625, 22.4326171875, 26.73046875, 31.0283203125, 35.326171875, 39.6240234375, 43.921875, 48.2197265625, 52.517578125, 56.8154296875, 61.11328125, 65.4111328125, 69.708984375, 74.0068359375, 78.3046875, 82.6025390625, 86.900390625, 91.1982421875, 95.49609375, 99.7939453125, 104.091796875, 108.3896484375, 112.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 7.0, 20.0, 20.0, 26.0, 43.0, 100.0, 177.0, 2657.0, 599.0, 150.0, 88.0, 53.0, 27.0, 27.0, 12.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.359375, -16.9130859375, -16.466796875, -16.0205078125, -15.57421875, -15.1279296875, -14.681640625, -14.2353515625, -13.7890625, -13.3427734375, -12.896484375, -12.4501953125, -12.00390625, -11.5576171875, -11.111328125, -10.6650390625, -10.21875, -9.7724609375, -9.326171875, -8.8798828125, -8.43359375, -7.9873046875, -7.541015625, -7.0947265625, -6.6484375, -6.2021484375, -5.755859375, -5.3095703125, -4.86328125, -4.4169921875, -3.970703125, -3.5244140625, -3.078125, -2.6318359375, -2.185546875, -1.7392578125, -1.29296875, -0.8466796875, -0.400390625, 0.0458984375, 0.4921875, 0.9384765625, 1.384765625, 1.8310546875, 2.27734375, 2.7236328125, 3.169921875, 3.6162109375, 4.0625, 4.5087890625, 4.955078125, 5.4013671875, 5.84765625, 6.2939453125, 6.740234375, 7.1865234375, 7.6328125, 8.0791015625, 8.525390625, 8.9716796875, 9.41796875, 9.8642578125, 10.310546875, 10.7568359375, 11.203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 12.0, 4.0, 9.0, 19.0, 13.0, 42.0, 51.0, 57.0, 70.0, 82.0, 88.0, 86.0, 91.0, 88.0, 73.0, 70.0, 39.0, 36.0, 23.0, 10.0, 9.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-87.95367431640625, -85.9128646850586, -83.87205505371094, -81.83124542236328, -79.79043579101562, -77.74961853027344, -75.70880889892578, -73.66799926757812, -71.62718963623047, -69.58638000488281, -67.54557037353516, -65.5047607421875, -63.46394729614258, -61.42313766479492, -59.38232421875, -57.341514587402344, -55.30070495605469, -53.25989532470703, -51.219085693359375, -49.17827224731445, -47.1374626159668, -45.09665298461914, -43.05583953857422, -41.01502990722656, -38.974220275878906, -36.93341064453125, -34.892601013183594, -32.85178756713867, -30.810977935791016, -28.77016830444336, -26.72935676574707, -24.68854522705078, -22.647735595703125, -20.60692596435547, -18.56611442565918, -16.52530288696289, -14.484493255615234, -12.443682670593262, -10.402872085571289, -8.362061500549316, -6.321250915527344, -4.280440330505371, -2.2396297454833984, -0.19881916046142578, 1.8419914245605469, 3.8828020095825195, 5.923612594604492, 7.964423179626465, 10.005233764648438, 12.04604434967041, 14.086854934692383, 16.127666473388672, 18.168476104736328, 20.209285736083984, 22.250097274780273, 24.290908813476562, 26.33171844482422, 28.372528076171875, 30.413339614868164, 32.45415115356445, 34.49496078491211, 36.535770416259766, 38.57658386230469, 40.617393493652344, 42.658203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 13.0, 16.0, 23.0, 22.0, 26.0, 31.0, 26.0, 39.0, 37.0, 45.0, 40.0, 44.0, 43.0, 33.0, 33.0, 47.0, 38.0, 36.0, 34.0, 43.0, 40.0, 25.0, 29.0, 25.0, 27.0, 22.0, 17.0, 13.0, 10.0, 14.0, 14.0, 7.0, 7.0, 7.0, 11.0, 3.0, 3.0, 1.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-34.16252899169922, -33.09475326538086, -32.0269775390625, -30.95920181274414, -29.89142608642578, -28.823650360107422, -27.75587272644043, -26.68809700012207, -25.62032127380371, -24.55254554748535, -23.484769821166992, -22.416994094848633, -21.34921646118164, -20.28144073486328, -19.213665008544922, -18.145889282226562, -17.078113555908203, -16.010337829589844, -14.942562103271484, -13.874785423278809, -12.80700969696045, -11.73923397064209, -10.671457290649414, -9.603681564331055, -8.535905838012695, -7.468130111694336, -6.400353908538818, -5.332577705383301, -4.264801979064941, -3.197026252746582, -2.1292500495910645, -1.0614738464355469, 0.0063018798828125, 1.074077844619751, 2.1418538093566895, 3.209629774093628, 4.277405738830566, 5.345181465148926, 6.412957668304443, 7.480733871459961, 8.54850959777832, 9.61628532409668, 10.684061050415039, 11.751837730407715, 12.819613456726074, 13.887389183044434, 14.95516586303711, 16.02294158935547, 17.090717315673828, 18.158493041992188, 19.226268768310547, 20.294044494628906, 21.361820220947266, 22.429595947265625, 23.497373580932617, 24.565149307250977, 25.632925033569336, 26.700700759887695, 27.768476486206055, 28.836252212524414, 29.904029846191406, 30.971805572509766, 32.039581298828125, 33.107357025146484, 34.175132751464844]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 10.0, 24.0, 34.0, 39.0, 44.0, 58.0, 118.0, 176.0, 265.0, 430.0, 680.0, 1137.0, 2198.0, 4648.0, 10888.0, 27319.0, 72210.0, 197389.0, 367353.0, 225728.0, 83004.0, 31511.0, 12307.0, 5325.0, 2413.0, 1270.0, 665.0, 429.0, 270.0, 183.0, 125.0, 78.0, 57.0, 46.0, 30.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-60.09375, -58.3037109375, -56.513671875, -54.7236328125, -52.93359375, -51.1435546875, -49.353515625, -47.5634765625, -45.7734375, -43.9833984375, -42.193359375, -40.4033203125, -38.61328125, -36.8232421875, -35.033203125, -33.2431640625, -31.453125, -29.6630859375, -27.873046875, -26.0830078125, -24.29296875, -22.5029296875, -20.712890625, -18.9228515625, -17.1328125, -15.3427734375, -13.552734375, -11.7626953125, -9.97265625, -8.1826171875, -6.392578125, -4.6025390625, -2.8125, -1.0224609375, 0.767578125, 2.5576171875, 4.34765625, 6.1376953125, 7.927734375, 9.7177734375, 11.5078125, 13.2978515625, 15.087890625, 16.8779296875, 18.66796875, 20.4580078125, 22.248046875, 24.0380859375, 25.828125, 27.6181640625, 29.408203125, 31.1982421875, 32.98828125, 34.7783203125, 36.568359375, 38.3583984375, 40.1484375, 41.9384765625, 43.728515625, 45.5185546875, 47.30859375, 49.0986328125, 50.888671875, 52.6787109375, 54.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 7.0, 11.0, 14.0, 11.0, 22.0, 30.0, 40.0, 40.0, 47.0, 46.0, 49.0, 62.0, 81.0, 52.0, 64.0, 76.0, 52.0, 50.0, 39.0, 42.0, 24.0, 35.0, 26.0, 18.0, 16.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.9375, -20.229248046875, -19.52099609375, -18.812744140625, -18.1044921875, -17.396240234375, -16.68798828125, -15.979736328125, -15.271484375, -14.563232421875, -13.85498046875, -13.146728515625, -12.4384765625, -11.730224609375, -11.02197265625, -10.313720703125, -9.60546875, -8.897216796875, -8.18896484375, -7.480712890625, -6.7724609375, -6.064208984375, -5.35595703125, -4.647705078125, -3.939453125, -3.231201171875, -2.52294921875, -1.814697265625, -1.1064453125, -0.398193359375, 0.31005859375, 1.018310546875, 1.7265625, 2.434814453125, 3.14306640625, 3.851318359375, 4.5595703125, 5.267822265625, 5.97607421875, 6.684326171875, 7.392578125, 8.100830078125, 8.80908203125, 9.517333984375, 10.2255859375, 10.933837890625, 11.64208984375, 12.350341796875, 13.05859375, 13.766845703125, 14.47509765625, 15.183349609375, 15.8916015625, 16.599853515625, 17.30810546875, 18.016357421875, 18.724609375, 19.432861328125, 20.14111328125, 20.849365234375, 21.5576171875, 22.265869140625, 22.97412109375, 23.682373046875, 24.390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 12.0, 26.0, 35.0, 65.0, 80.0, 168.0, 246.0, 403.0, 723.0, 1325.0, 3873.0, 21812.0, 213083.0, 697701.0, 92719.0, 11213.0, 2508.0, 1048.0, 567.0, 350.0, 195.0, 126.0, 87.0, 62.0, 40.0, 16.0, 16.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.3125, -110.01171875, -106.7109375, -103.41015625, -100.109375, -96.80859375, -93.5078125, -90.20703125, -86.90625, -83.60546875, -80.3046875, -77.00390625, -73.703125, -70.40234375, -67.1015625, -63.80078125, -60.5, -57.19921875, -53.8984375, -50.59765625, -47.296875, -43.99609375, -40.6953125, -37.39453125, -34.09375, -30.79296875, -27.4921875, -24.19140625, -20.890625, -17.58984375, -14.2890625, -10.98828125, -7.6875, -4.38671875, -1.0859375, 2.21484375, 5.515625, 8.81640625, 12.1171875, 15.41796875, 18.71875, 22.01953125, 25.3203125, 28.62109375, 31.921875, 35.22265625, 38.5234375, 41.82421875, 45.125, 48.42578125, 51.7265625, 55.02734375, 58.328125, 61.62890625, 64.9296875, 68.23046875, 71.53125, 74.83203125, 78.1328125, 81.43359375, 84.734375, 88.03515625, 91.3359375, 94.63671875, 97.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 12.0, 5.0, 16.0, 10.0, 13.0, 19.0, 23.0, 33.0, 22.0, 32.0, 33.0, 34.0, 32.0, 41.0, 37.0, 42.0, 40.0, 46.0, 47.0, 42.0, 46.0, 53.0, 31.0, 48.0, 29.0, 22.0, 28.0, 22.0, 18.0, 25.0, 16.0, 11.0, 7.0, 13.0, 10.0, 7.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.23046875, -60.0234375, -57.81640625, -55.609375, -53.40234375, -51.1953125, -48.98828125, -46.78125, -44.57421875, -42.3671875, -40.16015625, -37.953125, -35.74609375, -33.5390625, -31.33203125, -29.125, -26.91796875, -24.7109375, -22.50390625, -20.296875, -18.08984375, -15.8828125, -13.67578125, -11.46875, -9.26171875, -7.0546875, -4.84765625, -2.640625, -0.43359375, 1.7734375, 3.98046875, 6.1875, 8.39453125, 10.6015625, 12.80859375, 15.015625, 17.22265625, 19.4296875, 21.63671875, 23.84375, 26.05078125, 28.2578125, 30.46484375, 32.671875, 34.87890625, 37.0859375, 39.29296875, 41.5, 43.70703125, 45.9140625, 48.12109375, 50.328125, 52.53515625, 54.7421875, 56.94921875, 59.15625, 61.36328125, 63.5703125, 65.77734375, 67.984375, 70.19140625, 72.3984375, 74.60546875, 76.8125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 6.0, 7.0, 14.0, 13.0, 17.0, 27.0, 43.0, 58.0, 64.0, 102.0, 171.0, 256.0, 483.0, 852.0, 1675.0, 3644.0, 8717.0, 22809.0, 74167.0, 291430.0, 454634.0, 130355.0, 36271.0, 12627.0, 5143.0, 2313.0, 1130.0, 570.0, 325.0, 214.0, 130.0, 85.0, 55.0, 47.0, 21.0, 17.0, 14.0, 14.0, 10.0, 11.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.8125, -21.065673828125, -20.31884765625, -19.572021484375, -18.8251953125, -18.078369140625, -17.33154296875, -16.584716796875, -15.837890625, -15.091064453125, -14.34423828125, -13.597412109375, -12.8505859375, -12.103759765625, -11.35693359375, -10.610107421875, -9.86328125, -9.116455078125, -8.36962890625, -7.622802734375, -6.8759765625, -6.129150390625, -5.38232421875, -4.635498046875, -3.888671875, -3.141845703125, -2.39501953125, -1.648193359375, -0.9013671875, -0.154541015625, 0.59228515625, 1.339111328125, 2.0859375, 2.832763671875, 3.57958984375, 4.326416015625, 5.0732421875, 5.820068359375, 6.56689453125, 7.313720703125, 8.060546875, 8.807373046875, 9.55419921875, 10.301025390625, 11.0478515625, 11.794677734375, 12.54150390625, 13.288330078125, 14.03515625, 14.781982421875, 15.52880859375, 16.275634765625, 17.0224609375, 17.769287109375, 18.51611328125, 19.262939453125, 20.009765625, 20.756591796875, 21.50341796875, 22.250244140625, 22.9970703125, 23.743896484375, 24.49072265625, 25.237548828125, 25.984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 12.0, 14.0, 22.0, 19.0, 30.0, 34.0, 50.0, 48.0, 74.0, 73.0, 82.0, 80.0, 73.0, 76.0, 62.0, 37.0, 36.0, 27.0, 34.0, 14.0, 20.0, 8.0, 8.0, 10.0, 8.0, 5.0, 2.0, 1.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0038967132568359375, -0.0037879645824432373, -0.003679215908050537, -0.003570467233657837, -0.0034617185592651367, -0.0033529698848724365, -0.0032442212104797363, -0.003135472536087036, -0.003026723861694336, -0.0029179751873016357, -0.0028092265129089355, -0.0027004778385162354, -0.002591729164123535, -0.002482980489730835, -0.0023742318153381348, -0.0022654831409454346, -0.0021567344665527344, -0.002047985792160034, -0.001939237117767334, -0.0018304884433746338, -0.0017217397689819336, -0.0016129910945892334, -0.0015042424201965332, -0.001395493745803833, -0.0012867450714111328, -0.0011779963970184326, -0.0010692477226257324, -0.0009604990482330322, -0.000851750373840332, -0.0007430016994476318, -0.0006342530250549316, -0.0005255043506622314, -0.00041675567626953125, -0.00030800700187683105, -0.00019925832748413086, -9.050965309143066e-05, 1.823902130126953e-05, 0.00012698769569396973, 0.00023573637008666992, 0.0003444850444793701, 0.0004532337188720703, 0.0005619823932647705, 0.0006707310676574707, 0.0007794797420501709, 0.0008882284164428711, 0.0009969770908355713, 0.0011057257652282715, 0.0012144744396209717, 0.0013232231140136719, 0.001431971788406372, 0.0015407204627990723, 0.0016494691371917725, 0.0017582178115844727, 0.0018669664859771729, 0.001975715160369873, 0.0020844638347625732, 0.0021932125091552734, 0.0023019611835479736, 0.002410709857940674, 0.002519458532333374, 0.0026282072067260742, 0.0027369558811187744, 0.0028457045555114746, 0.002954453229904175, 0.003063201904296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 22.0, 34.0, 41.0, 60.0, 119.0, 200.0, 422.0, 1075.0, 4072.0, 25106.0, 385583.0, 587790.0, 36429.0, 5204.0, 1378.0, 511.0, 207.0, 114.0, 59.0, 31.0, 30.0, 18.0, 10.0, 13.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0625, -57.37890625, -55.6953125, -54.01171875, -52.328125, -50.64453125, -48.9609375, -47.27734375, -45.59375, -43.91015625, -42.2265625, -40.54296875, -38.859375, -37.17578125, -35.4921875, -33.80859375, -32.125, -30.44140625, -28.7578125, -27.07421875, -25.390625, -23.70703125, -22.0234375, -20.33984375, -18.65625, -16.97265625, -15.2890625, -13.60546875, -11.921875, -10.23828125, -8.5546875, -6.87109375, -5.1875, -3.50390625, -1.8203125, -0.13671875, 1.546875, 3.23046875, 4.9140625, 6.59765625, 8.28125, 9.96484375, 11.6484375, 13.33203125, 15.015625, 16.69921875, 18.3828125, 20.06640625, 21.75, 23.43359375, 25.1171875, 26.80078125, 28.484375, 30.16796875, 31.8515625, 33.53515625, 35.21875, 36.90234375, 38.5859375, 40.26953125, 41.953125, 43.63671875, 45.3203125, 47.00390625, 48.6875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 20.0, 35.0, 48.0, 61.0, 80.0, 130.0, 132.0, 146.0, 101.0, 90.0, 38.0, 39.0, 21.0, 7.0, 14.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.21875, -50.93603515625, -49.6533203125, -48.37060546875, -47.087890625, -45.80517578125, -44.5224609375, -43.23974609375, -41.95703125, -40.67431640625, -39.3916015625, -38.10888671875, -36.826171875, -35.54345703125, -34.2607421875, -32.97802734375, -31.6953125, -30.41259765625, -29.1298828125, -27.84716796875, -26.564453125, -25.28173828125, -23.9990234375, -22.71630859375, -21.43359375, -20.15087890625, -18.8681640625, -17.58544921875, -16.302734375, -15.02001953125, -13.7373046875, -12.45458984375, -11.171875, -9.88916015625, -8.6064453125, -7.32373046875, -6.041015625, -4.75830078125, -3.4755859375, -2.19287109375, -0.91015625, 0.37255859375, 1.6552734375, 2.93798828125, 4.220703125, 5.50341796875, 6.7861328125, 8.06884765625, 9.3515625, 10.63427734375, 11.9169921875, 13.19970703125, 14.482421875, 15.76513671875, 17.0478515625, 18.33056640625, 19.61328125, 20.89599609375, 22.1787109375, 23.46142578125, 24.744140625, 26.02685546875, 27.3095703125, 28.59228515625, 29.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 27.0, 47.0, 68.0, 110.0, 169.0, 162.0, 133.0, 100.0, 77.0, 48.0, 23.0, 14.0, 4.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-349.2296142578125, -328.0545654296875, -306.8795166015625, -285.7044982910156, -264.5294494628906, -243.35440063476562, -222.1793670654297, -201.00433349609375, -179.82928466796875, -158.65423583984375, -137.4792022705078, -116.30416107177734, -95.12911987304688, -73.9540786743164, -52.77903747558594, -31.60400390625, -10.428955078125, 10.746086120605469, 31.921127319335938, 53.096168518066406, 74.27120971679688, 95.44625091552734, 116.62129211425781, 137.79632568359375, 158.97137451171875, 180.14642333984375, 201.3214569091797, 222.49649047851562, 243.67153930664062, 264.8465881347656, 286.0216064453125, 307.1966552734375, 328.3717041015625, 349.5467529296875, 370.7218017578125, 391.8968200683594, 413.0718688964844, 434.2469177246094, 455.42193603515625, 476.59698486328125, 497.77203369140625, 518.9470825195312, 540.1221313476562, 561.2971801757812, 582.47216796875, 603.647216796875, 624.822265625, 645.997314453125, 667.17236328125, 688.347412109375, 709.5224609375, 730.697509765625, 751.87255859375, 773.0475463867188, 794.2225952148438, 815.3976440429688, 836.5726928710938, 857.7477416992188, 878.9227905273438, 900.0978393554688, 921.2728271484375, 942.4478759765625, 963.6229248046875, 984.7979736328125, 1005.9730224609375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 8.0, 10.0, 9.0, 24.0, 12.0, 33.0, 22.0, 26.0, 32.0, 32.0, 21.0, 35.0, 42.0, 47.0, 42.0, 50.0, 43.0, 43.0, 38.0, 39.0, 26.0, 42.0, 42.0, 43.0, 34.0, 32.0, 19.0, 24.0, 23.0, 16.0, 10.0, 9.0, 9.0, 7.0, 6.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.5670166015625, -322.6954345703125, -311.8238525390625, -300.9522705078125, -290.0806884765625, -279.2091064453125, -268.3375244140625, -257.4659423828125, -246.5943603515625, -235.7227783203125, -224.8511962890625, -213.9796142578125, -203.1080322265625, -192.2364501953125, -181.3648681640625, -170.4932861328125, -159.6217041015625, -148.7501220703125, -137.8785400390625, -127.0069580078125, -116.1353759765625, -105.2637939453125, -94.3922119140625, -83.5206298828125, -72.6490478515625, -61.7774658203125, -50.9058837890625, -40.0343017578125, -29.1627197265625, -18.2911376953125, -7.4195556640625, 3.4520263671875, 14.3236083984375, 25.1951904296875, 36.0667724609375, 46.9383544921875, 57.8099365234375, 68.6815185546875, 79.5531005859375, 90.4246826171875, 101.2962646484375, 112.1678466796875, 123.0394287109375, 133.9110107421875, 144.7825927734375, 155.6541748046875, 166.5257568359375, 177.3973388671875, 188.2689208984375, 199.1405029296875, 210.0120849609375, 220.8836669921875, 231.7552490234375, 242.6268310546875, 253.4984130859375, 264.3699951171875, 275.2415771484375, 286.1131591796875, 296.9847412109375, 307.8563232421875, 318.7279052734375, 329.5994873046875, 340.4710693359375, 351.3426513671875, 362.2142333984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 14.0, 23.0, 24.0, 47.0, 85.0, 123.0, 200.0, 359.0, 725.0, 1604.0, 4013.0, 13559.0, 87485.0, 3984518.0, 81205.0, 13106.0, 3961.0, 1565.0, 696.0, 363.0, 229.0, 132.0, 68.0, 51.0, 32.0, 12.0, 21.0, 14.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.0, -132.015625, -127.03125, -122.046875, -117.0625, -112.078125, -107.09375, -102.109375, -97.125, -92.140625, -87.15625, -82.171875, -77.1875, -72.203125, -67.21875, -62.234375, -57.25, -52.265625, -47.28125, -42.296875, -37.3125, -32.328125, -27.34375, -22.359375, -17.375, -12.390625, -7.40625, -2.421875, 2.5625, 7.546875, 12.53125, 17.515625, 22.5, 27.484375, 32.46875, 37.453125, 42.4375, 47.421875, 52.40625, 57.390625, 62.375, 67.359375, 72.34375, 77.328125, 82.3125, 87.296875, 92.28125, 97.265625, 102.25, 107.234375, 112.21875, 117.203125, 122.1875, 127.171875, 132.15625, 137.140625, 142.125, 147.109375, 152.09375, 157.078125, 162.0625, 167.046875, 172.03125, 177.015625, 182.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 11.0, 20.0, 19.0, 26.0, 37.0, 23.0, 39.0, 55.0, 44.0, 53.0, 66.0, 70.0, 65.0, 75.0, 59.0, 59.0, 53.0, 31.0, 33.0, 38.0, 34.0, 13.0, 18.0, 7.0, 5.0, 9.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.3125, -20.600341796875, -19.88818359375, -19.176025390625, -18.4638671875, -17.751708984375, -17.03955078125, -16.327392578125, -15.615234375, -14.903076171875, -14.19091796875, -13.478759765625, -12.7666015625, -12.054443359375, -11.34228515625, -10.630126953125, -9.91796875, -9.205810546875, -8.49365234375, -7.781494140625, -7.0693359375, -6.357177734375, -5.64501953125, -4.932861328125, -4.220703125, -3.508544921875, -2.79638671875, -2.084228515625, -1.3720703125, -0.659912109375, 0.05224609375, 0.764404296875, 1.4765625, 2.188720703125, 2.90087890625, 3.613037109375, 4.3251953125, 5.037353515625, 5.74951171875, 6.461669921875, 7.173828125, 7.885986328125, 8.59814453125, 9.310302734375, 10.0224609375, 10.734619140625, 11.44677734375, 12.158935546875, 12.87109375, 13.583251953125, 14.29541015625, 15.007568359375, 15.7197265625, 16.431884765625, 17.14404296875, 17.856201171875, 18.568359375, 19.280517578125, 19.99267578125, 20.704833984375, 21.4169921875, 22.129150390625, 22.84130859375, 23.553466796875, 24.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 11.0, 12.0, 11.0, 20.0, 20.0, 48.0, 70.0, 99.0, 142.0, 228.0, 394.0, 651.0, 1264.0, 2619.0, 5856.0, 16034.0, 55093.0, 508501.0, 3491311.0, 77198.0, 20740.0, 7470.0, 3093.0, 1449.0, 818.0, 401.0, 263.0, 159.0, 102.0, 56.0, 34.0, 29.0, 19.0, 20.0, 5.0, 8.0, 7.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.4033203125, -67.806640625, -65.2099609375, -62.61328125, -60.0166015625, -57.419921875, -54.8232421875, -52.2265625, -49.6298828125, -47.033203125, -44.4365234375, -41.83984375, -39.2431640625, -36.646484375, -34.0498046875, -31.453125, -28.8564453125, -26.259765625, -23.6630859375, -21.06640625, -18.4697265625, -15.873046875, -13.2763671875, -10.6796875, -8.0830078125, -5.486328125, -2.8896484375, -0.29296875, 2.3037109375, 4.900390625, 7.4970703125, 10.09375, 12.6904296875, 15.287109375, 17.8837890625, 20.48046875, 23.0771484375, 25.673828125, 28.2705078125, 30.8671875, 33.4638671875, 36.060546875, 38.6572265625, 41.25390625, 43.8505859375, 46.447265625, 49.0439453125, 51.640625, 54.2373046875, 56.833984375, 59.4306640625, 62.02734375, 64.6240234375, 67.220703125, 69.8173828125, 72.4140625, 75.0107421875, 77.607421875, 80.2041015625, 82.80078125, 85.3974609375, 87.994140625, 90.5908203125, 93.1875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 14.0, 14.0, 32.0, 41.0, 76.0, 97.0, 230.0, 2551.0, 556.0, 166.0, 89.0, 42.0, 36.0, 28.0, 25.0, 13.0, 16.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.4805908203125, -10.953369140625, -10.4261474609375, -9.89892578125, -9.3717041015625, -8.844482421875, -8.3172607421875, -7.7900390625, -7.2628173828125, -6.735595703125, -6.2083740234375, -5.68115234375, -5.1539306640625, -4.626708984375, -4.0994873046875, -3.572265625, -3.0450439453125, -2.517822265625, -1.9906005859375, -1.46337890625, -0.9361572265625, -0.408935546875, 0.1182861328125, 0.6455078125, 1.1727294921875, 1.699951171875, 2.2271728515625, 2.75439453125, 3.2816162109375, 3.808837890625, 4.3360595703125, 4.86328125, 5.3905029296875, 5.917724609375, 6.4449462890625, 6.97216796875, 7.4993896484375, 8.026611328125, 8.5538330078125, 9.0810546875, 9.6082763671875, 10.135498046875, 10.6627197265625, 11.18994140625, 11.7171630859375, 12.244384765625, 12.7716064453125, 13.298828125, 13.8260498046875, 14.353271484375, 14.8804931640625, 15.40771484375, 15.9349365234375, 16.462158203125, 16.9893798828125, 17.5166015625, 18.0438232421875, 18.571044921875, 19.0982666015625, 19.62548828125, 20.1527099609375, 20.679931640625, 21.2071533203125, 21.734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 15.0, 33.0, 33.0, 81.0, 99.0, 131.0, 158.0, 122.0, 109.0, 84.0, 46.0, 34.0, 19.0, 9.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.72802734375, -83.01950073242188, -79.31096649169922, -75.6024398803711, -71.89390563964844, -68.18537902832031, -64.47685241699219, -60.7683219909668, -57.059791564941406, -53.351261138916016, -49.642730712890625, -45.9342041015625, -42.22567367553711, -38.51714324951172, -34.808616638183594, -31.100086212158203, -27.391555786132812, -23.683025360107422, -19.974496841430664, -16.265968322753906, -12.557437896728516, -8.848907470703125, -5.140378952026367, -1.4318504333496094, 2.2766799926757812, 5.9852094650268555, 9.69373893737793, 13.402268409729004, 17.110797882080078, 20.81932830810547, 24.527856826782227, 28.236385345458984, 31.944915771484375, 35.653446197509766, 39.361976623535156, 43.07050323486328, 46.77903366088867, 50.48756408691406, 54.19609069824219, 57.90462112426758, 61.61315155029297, 65.3216781616211, 69.03021240234375, 72.73873901367188, 76.447265625, 80.15579986572266, 83.86432647705078, 87.57286071777344, 91.28138732910156, 94.98991394042969, 98.69844818115234, 102.40697479248047, 106.11550903320312, 109.82403564453125, 113.53256225585938, 117.2410888671875, 120.94962310791016, 124.65814971923828, 128.36668395996094, 132.07521057128906, 135.7837371826172, 139.49227905273438, 143.2008056640625, 146.90933227539062, 150.61785888671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 6.0, 7.0, 11.0, 22.0, 18.0, 23.0, 26.0, 24.0, 29.0, 26.0, 41.0, 27.0, 25.0, 35.0, 47.0, 45.0, 33.0, 38.0, 60.0, 44.0, 34.0, 33.0, 34.0, 29.0, 32.0, 24.0, 27.0, 21.0, 17.0, 15.0, 21.0, 23.0, 16.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-44.682899475097656, -43.43684768676758, -42.190792083740234, -40.944740295410156, -39.69868850708008, -38.45263671875, -37.206581115722656, -35.96052932739258, -34.7144775390625, -33.46842575073242, -32.22237014770508, -30.976318359375, -29.730266571044922, -28.48421287536621, -27.2381591796875, -25.992107391357422, -24.74605369567871, -23.5, -22.253948211669922, -21.00789451599121, -19.761842727661133, -18.515789031982422, -17.269737243652344, -16.023683547973633, -14.777630805969238, -13.531578063964844, -12.28552532196045, -11.039472579956055, -9.793418884277344, -8.547367095947266, -7.301313400268555, -6.05526065826416, -4.809207916259766, -3.563155174255371, -2.3171021938323975, -1.0710492134094238, 0.1750035285949707, 1.4210562705993652, 2.667109489440918, 3.9131622314453125, 5.159214973449707, 6.405267715454102, 7.651320457458496, 8.89737319946289, 10.143426895141602, 11.38947868347168, 12.63553237915039, 13.881585121154785, 15.12763786315918, 16.37369155883789, 17.61974334716797, 18.86579704284668, 20.111848831176758, 21.35790252685547, 22.603954315185547, 23.850008010864258, 25.09606170654297, 26.34211540222168, 27.588167190551758, 28.83422088623047, 30.080272674560547, 31.326326370239258, 32.57238006591797, 33.81843185424805, 35.064483642578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 24.0, 19.0, 18.0, 54.0, 81.0, 111.0, 192.0, 298.0, 601.0, 1187.0, 2622.0, 5884.0, 16027.0, 47227.0, 148620.0, 367751.0, 299356.0, 104417.0, 33644.0, 11794.0, 4521.0, 1835.0, 986.0, 481.0, 271.0, 186.0, 107.0, 73.0, 39.0, 36.0, 20.0, 17.0, 12.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4375, -49.822265625, -48.20703125, -46.591796875, -44.9765625, -43.361328125, -41.74609375, -40.130859375, -38.515625, -36.900390625, -35.28515625, -33.669921875, -32.0546875, -30.439453125, -28.82421875, -27.208984375, -25.59375, -23.978515625, -22.36328125, -20.748046875, -19.1328125, -17.517578125, -15.90234375, -14.287109375, -12.671875, -11.056640625, -9.44140625, -7.826171875, -6.2109375, -4.595703125, -2.98046875, -1.365234375, 0.25, 1.865234375, 3.48046875, 5.095703125, 6.7109375, 8.326171875, 9.94140625, 11.556640625, 13.171875, 14.787109375, 16.40234375, 18.017578125, 19.6328125, 21.248046875, 22.86328125, 24.478515625, 26.09375, 27.708984375, 29.32421875, 30.939453125, 32.5546875, 34.169921875, 35.78515625, 37.400390625, 39.015625, 40.630859375, 42.24609375, 43.861328125, 45.4765625, 47.091796875, 48.70703125, 50.322265625, 51.9375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 6.0, 14.0, 21.0, 29.0, 24.0, 21.0, 24.0, 35.0, 48.0, 50.0, 47.0, 58.0, 67.0, 41.0, 67.0, 57.0, 57.0, 61.0, 49.0, 36.0, 41.0, 34.0, 26.0, 20.0, 11.0, 11.0, 9.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.421875, -21.691650390625, -20.96142578125, -20.231201171875, -19.5009765625, -18.770751953125, -18.04052734375, -17.310302734375, -16.580078125, -15.849853515625, -15.11962890625, -14.389404296875, -13.6591796875, -12.928955078125, -12.19873046875, -11.468505859375, -10.73828125, -10.008056640625, -9.27783203125, -8.547607421875, -7.8173828125, -7.087158203125, -6.35693359375, -5.626708984375, -4.896484375, -4.166259765625, -3.43603515625, -2.705810546875, -1.9755859375, -1.245361328125, -0.51513671875, 0.215087890625, 0.9453125, 1.675537109375, 2.40576171875, 3.135986328125, 3.8662109375, 4.596435546875, 5.32666015625, 6.056884765625, 6.787109375, 7.517333984375, 8.24755859375, 8.977783203125, 9.7080078125, 10.438232421875, 11.16845703125, 11.898681640625, 12.62890625, 13.359130859375, 14.08935546875, 14.819580078125, 15.5498046875, 16.280029296875, 17.01025390625, 17.740478515625, 18.470703125, 19.200927734375, 19.93115234375, 20.661376953125, 21.3916015625, 22.121826171875, 22.85205078125, 23.582275390625, 24.3125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 10.0, 14.0, 33.0, 52.0, 102.0, 205.0, 445.0, 873.0, 2228.0, 15214.0, 672271.0, 344929.0, 8897.0, 1811.0, 760.0, 350.0, 206.0, 84.0, 34.0, 20.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.0, -142.083984375, -137.16796875, -132.251953125, -127.3359375, -122.419921875, -117.50390625, -112.587890625, -107.671875, -102.755859375, -97.83984375, -92.923828125, -88.0078125, -83.091796875, -78.17578125, -73.259765625, -68.34375, -63.427734375, -58.51171875, -53.595703125, -48.6796875, -43.763671875, -38.84765625, -33.931640625, -29.015625, -24.099609375, -19.18359375, -14.267578125, -9.3515625, -4.435546875, 0.48046875, 5.396484375, 10.3125, 15.228515625, 20.14453125, 25.060546875, 29.9765625, 34.892578125, 39.80859375, 44.724609375, 49.640625, 54.556640625, 59.47265625, 64.388671875, 69.3046875, 74.220703125, 79.13671875, 84.052734375, 88.96875, 93.884765625, 98.80078125, 103.716796875, 108.6328125, 113.548828125, 118.46484375, 123.380859375, 128.296875, 133.212890625, 138.12890625, 143.044921875, 147.9609375, 152.876953125, 157.79296875, 162.708984375, 167.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 0.0, 11.0, 10.0, 12.0, 9.0, 22.0, 16.0, 14.0, 34.0, 25.0, 32.0, 31.0, 40.0, 38.0, 44.0, 48.0, 40.0, 39.0, 62.0, 51.0, 37.0, 61.0, 38.0, 38.0, 34.0, 29.0, 37.0, 33.0, 18.0, 19.0, 9.0, 5.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.0, -77.3701171875, -74.740234375, -72.1103515625, -69.48046875, -66.8505859375, -64.220703125, -61.5908203125, -58.9609375, -56.3310546875, -53.701171875, -51.0712890625, -48.44140625, -45.8115234375, -43.181640625, -40.5517578125, -37.921875, -35.2919921875, -32.662109375, -30.0322265625, -27.40234375, -24.7724609375, -22.142578125, -19.5126953125, -16.8828125, -14.2529296875, -11.623046875, -8.9931640625, -6.36328125, -3.7333984375, -1.103515625, 1.5263671875, 4.15625, 6.7861328125, 9.416015625, 12.0458984375, 14.67578125, 17.3056640625, 19.935546875, 22.5654296875, 25.1953125, 27.8251953125, 30.455078125, 33.0849609375, 35.71484375, 38.3447265625, 40.974609375, 43.6044921875, 46.234375, 48.8642578125, 51.494140625, 54.1240234375, 56.75390625, 59.3837890625, 62.013671875, 64.6435546875, 67.2734375, 69.9033203125, 72.533203125, 75.1630859375, 77.79296875, 80.4228515625, 83.052734375, 85.6826171875, 88.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 16.0, 24.0, 44.0, 59.0, 113.0, 265.0, 767.0, 3195.0, 44200.0, 955077.0, 40290.0, 3187.0, 778.0, 272.0, 118.0, 68.0, 29.0, 17.0, 11.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.2490234375, -73.748046875, -71.2470703125, -68.74609375, -66.2451171875, -63.744140625, -61.2431640625, -58.7421875, -56.2412109375, -53.740234375, -51.2392578125, -48.73828125, -46.2373046875, -43.736328125, -41.2353515625, -38.734375, -36.2333984375, -33.732421875, -31.2314453125, -28.73046875, -26.2294921875, -23.728515625, -21.2275390625, -18.7265625, -16.2255859375, -13.724609375, -11.2236328125, -8.72265625, -6.2216796875, -3.720703125, -1.2197265625, 1.28125, 3.7822265625, 6.283203125, 8.7841796875, 11.28515625, 13.7861328125, 16.287109375, 18.7880859375, 21.2890625, 23.7900390625, 26.291015625, 28.7919921875, 31.29296875, 33.7939453125, 36.294921875, 38.7958984375, 41.296875, 43.7978515625, 46.298828125, 48.7998046875, 51.30078125, 53.8017578125, 56.302734375, 58.8037109375, 61.3046875, 63.8056640625, 66.306640625, 68.8076171875, 71.30859375, 73.8095703125, 76.310546875, 78.8115234375, 81.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 3.0, 9.0, 12.0, 15.0, 19.0, 30.0, 38.0, 48.0, 55.0, 63.0, 103.0, 108.0, 95.0, 93.0, 71.0, 52.0, 40.0, 32.0, 23.0, 15.0, 6.0, 11.0, 6.0, 9.0, 6.0, 5.0, 1.0, 6.0, 2.0, 4.0, 2.0], "bins": [-0.00531005859375, -0.005191385746002197, -0.0050727128982543945, -0.004954040050506592, -0.004835367202758789, -0.004716694355010986, -0.004598021507263184, -0.004479348659515381, -0.004360675811767578, -0.004242002964019775, -0.004123330116271973, -0.00400465726852417, -0.003885984420776367, -0.0037673115730285645, -0.0036486387252807617, -0.003529965877532959, -0.0034112930297851562, -0.0032926201820373535, -0.0031739473342895508, -0.003055274486541748, -0.0029366016387939453, -0.0028179287910461426, -0.00269925594329834, -0.002580583095550537, -0.0024619102478027344, -0.0023432374000549316, -0.002224564552307129, -0.002105891704559326, -0.0019872188568115234, -0.0018685460090637207, -0.001749873161315918, -0.0016312003135681152, -0.0015125274658203125, -0.0013938546180725098, -0.001275181770324707, -0.0011565089225769043, -0.0010378360748291016, -0.0009191632270812988, -0.0008004903793334961, -0.0006818175315856934, -0.0005631446838378906, -0.0004444718360900879, -0.00032579898834228516, -0.00020712614059448242, -8.845329284667969e-05, 3.0219554901123047e-05, 0.00014889240264892578, 0.0002675652503967285, 0.00038623809814453125, 0.000504910945892334, 0.0006235837936401367, 0.0007422566413879395, 0.0008609294891357422, 0.000979602336883545, 0.0010982751846313477, 0.0012169480323791504, 0.0013356208801269531, 0.0014542937278747559, 0.0015729665756225586, 0.0016916394233703613, 0.001810312271118164, 0.0019289851188659668, 0.0020476579666137695, 0.0021663308143615723, 0.002285003662109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 4.0, 13.0, 21.0, 22.0, 41.0, 75.0, 117.0, 192.0, 400.0, 1115.0, 3756.0, 25911.0, 784818.0, 217924.0, 10466.0, 2254.0, 739.0, 284.0, 151.0, 77.0, 64.0, 42.0, 21.0, 15.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8125, -59.8056640625, -57.798828125, -55.7919921875, -53.78515625, -51.7783203125, -49.771484375, -47.7646484375, -45.7578125, -43.7509765625, -41.744140625, -39.7373046875, -37.73046875, -35.7236328125, -33.716796875, -31.7099609375, -29.703125, -27.6962890625, -25.689453125, -23.6826171875, -21.67578125, -19.6689453125, -17.662109375, -15.6552734375, -13.6484375, -11.6416015625, -9.634765625, -7.6279296875, -5.62109375, -3.6142578125, -1.607421875, 0.3994140625, 2.40625, 4.4130859375, 6.419921875, 8.4267578125, 10.43359375, 12.4404296875, 14.447265625, 16.4541015625, 18.4609375, 20.4677734375, 22.474609375, 24.4814453125, 26.48828125, 28.4951171875, 30.501953125, 32.5087890625, 34.515625, 36.5224609375, 38.529296875, 40.5361328125, 42.54296875, 44.5498046875, 46.556640625, 48.5634765625, 50.5703125, 52.5771484375, 54.583984375, 56.5908203125, 58.59765625, 60.6044921875, 62.611328125, 64.6181640625, 66.625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 5.0, 22.0, 46.0, 107.0, 217.0, 205.0, 193.0, 107.0, 35.0, 23.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.859375, -28.842041015625, -26.82470703125, -24.807373046875, -22.7900390625, -20.772705078125, -18.75537109375, -16.738037109375, -14.720703125, -12.703369140625, -10.68603515625, -8.668701171875, -6.6513671875, -4.634033203125, -2.61669921875, -0.599365234375, 1.41796875, 3.435302734375, 5.45263671875, 7.469970703125, 9.4873046875, 11.504638671875, 13.52197265625, 15.539306640625, 17.556640625, 19.573974609375, 21.59130859375, 23.608642578125, 25.6259765625, 27.643310546875, 29.66064453125, 31.677978515625, 33.6953125, 35.712646484375, 37.72998046875, 39.747314453125, 41.7646484375, 43.781982421875, 45.79931640625, 47.816650390625, 49.833984375, 51.851318359375, 53.86865234375, 55.885986328125, 57.9033203125, 59.920654296875, 61.93798828125, 63.955322265625, 65.97265625, 67.989990234375, 70.00732421875, 72.024658203125, 74.0419921875, 76.059326171875, 78.07666015625, 80.093994140625, 82.111328125, 84.128662109375, 86.14599609375, 88.163330078125, 90.1806640625, 92.197998046875, 94.21533203125, 96.232666015625, 98.25]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 8.0, 16.0, 85.0, 198.0, 320.0, 240.0, 97.0, 26.0, 13.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.1193542480469, -271.5897216796875, -231.06005859375, -190.53042602539062, -150.0007781982422, -109.47113037109375, -68.94149780273438, -28.411834716796875, 12.1177978515625, 52.64744186401367, 93.17708587646484, 133.70672607421875, 174.2363739013672, 214.76602172851562, 255.295654296875, 295.8253173828125, 336.3549499511719, 376.88458251953125, 417.41424560546875, 457.9438781738281, 498.4735107421875, 539.003173828125, 579.5328369140625, 620.0625, 660.5921020507812, 701.1217651367188, 741.6513671875, 782.1810302734375, 822.710693359375, 863.2403564453125, 903.7699584960938, 944.2996215820312, 984.8292236328125, 1025.35888671875, 1065.8885498046875, 1106.418212890625, 1146.94775390625, 1187.4774169921875, 1228.007080078125, 1268.5367431640625, 1309.06640625, 1349.5960693359375, 1390.125732421875, 1430.6552734375, 1471.1849365234375, 1511.714599609375, 1552.2442626953125, 1592.77392578125, 1633.303466796875, 1673.8331298828125, 1714.36279296875, 1754.892333984375, 1795.4219970703125, 1835.95166015625, 1876.4813232421875, 1917.010986328125, 1957.5406494140625, 1998.0703125, 2038.5999755859375, 2079.129638671875, 2119.6591796875, 2160.18896484375, 2200.718505859375, 2241.248046875, 2281.77783203125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 7.0, 7.0, 19.0, 9.0, 6.0, 12.0, 12.0, 19.0, 25.0, 20.0, 37.0, 40.0, 31.0, 57.0, 39.0, 52.0, 47.0, 37.0, 56.0, 59.0, 50.0, 43.0, 50.0, 43.0, 32.0, 25.0, 27.0, 21.0, 21.0, 13.0, 14.0, 14.0, 10.0, 9.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-373.48114013671875, -361.5601806640625, -349.6391906738281, -337.7182312011719, -325.7972412109375, -313.87628173828125, -301.955322265625, -290.0343322753906, -278.1133728027344, -266.1924133300781, -254.27142333984375, -242.3504638671875, -230.4294891357422, -218.50851440429688, -206.58753967285156, -194.66656494140625, -182.74559020996094, -170.82461547851562, -158.9036407470703, -146.982666015625, -135.06170654296875, -123.14073181152344, -111.21975708007812, -99.29878997802734, -87.37781524658203, -75.45684051513672, -63.53587341308594, -51.614898681640625, -39.69392776489258, -27.77295684814453, -15.851982116699219, -3.9310150146484375, 7.989959716796875, 19.910930633544922, 31.8319034576416, 43.75287628173828, 55.67384719848633, 67.59481811523438, 79.51579284667969, 91.43675994873047, 103.35773468017578, 115.2787094116211, 127.19967651367188, 139.1206512451172, 151.0416259765625, 162.96258544921875, 174.88357543945312, 186.80453491210938, 198.7255096435547, 210.646484375, 222.5674591064453, 234.48843383789062, 246.40939331054688, 258.33038330078125, 270.2513427734375, 282.17230224609375, 294.0932922363281, 306.0142517089844, 317.93524169921875, 329.856201171875, 341.7771911621094, 353.6981506347656, 365.619140625, 377.54010009765625, 389.4610595703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 12.0, 22.0, 26.0, 36.0, 66.0, 76.0, 130.0, 195.0, 325.0, 607.0, 994.0, 2014.0, 4417.0, 10664.0, 44278.0, 4059196.0, 50600.0, 11242.0, 4514.0, 2124.0, 1149.0, 575.0, 364.0, 211.0, 154.0, 89.0, 58.0, 43.0, 18.0, 20.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-119.6875, -115.8916015625, -112.095703125, -108.2998046875, -104.50390625, -100.7080078125, -96.912109375, -93.1162109375, -89.3203125, -85.5244140625, -81.728515625, -77.9326171875, -74.13671875, -70.3408203125, -66.544921875, -62.7490234375, -58.953125, -55.1572265625, -51.361328125, -47.5654296875, -43.76953125, -39.9736328125, -36.177734375, -32.3818359375, -28.5859375, -24.7900390625, -20.994140625, -17.1982421875, -13.40234375, -9.6064453125, -5.810546875, -2.0146484375, 1.78125, 5.5771484375, 9.373046875, 13.1689453125, 16.96484375, 20.7607421875, 24.556640625, 28.3525390625, 32.1484375, 35.9443359375, 39.740234375, 43.5361328125, 47.33203125, 51.1279296875, 54.923828125, 58.7197265625, 62.515625, 66.3115234375, 70.107421875, 73.9033203125, 77.69921875, 81.4951171875, 85.291015625, 89.0869140625, 92.8828125, 96.6787109375, 100.474609375, 104.2705078125, 108.06640625, 111.8623046875, 115.658203125, 119.4541015625, 123.25]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 11.0, 2.0, 11.0, 14.0, 27.0, 33.0, 39.0, 40.0, 47.0, 51.0, 64.0, 75.0, 63.0, 80.0, 62.0, 73.0, 56.0, 51.0, 43.0, 26.0, 27.0, 22.0, 17.0, 16.0, 13.0, 8.0, 10.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.875, -28.02734375, -27.1796875, -26.33203125, -25.484375, -24.63671875, -23.7890625, -22.94140625, -22.09375, -21.24609375, -20.3984375, -19.55078125, -18.703125, -17.85546875, -17.0078125, -16.16015625, -15.3125, -14.46484375, -13.6171875, -12.76953125, -11.921875, -11.07421875, -10.2265625, -9.37890625, -8.53125, -7.68359375, -6.8359375, -5.98828125, -5.140625, -4.29296875, -3.4453125, -2.59765625, -1.75, -0.90234375, -0.0546875, 0.79296875, 1.640625, 2.48828125, 3.3359375, 4.18359375, 5.03125, 5.87890625, 6.7265625, 7.57421875, 8.421875, 9.26953125, 10.1171875, 10.96484375, 11.8125, 12.66015625, 13.5078125, 14.35546875, 15.203125, 16.05078125, 16.8984375, 17.74609375, 18.59375, 19.44140625, 20.2890625, 21.13671875, 21.984375, 22.83203125, 23.6796875, 24.52734375, 25.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 6.0, 7.0, 15.0, 27.0, 28.0, 30.0, 74.0, 84.0, 137.0, 169.0, 269.0, 476.0, 734.0, 1479.0, 2870.0, 6762.0, 19320.0, 187115.0, 3928118.0, 30077.0, 8869.0, 3675.0, 1661.0, 855.0, 467.0, 292.0, 208.0, 132.0, 92.0, 67.0, 39.0, 32.0, 32.0, 24.0, 15.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.3125, -75.0693359375, -71.826171875, -68.5830078125, -65.33984375, -62.0966796875, -58.853515625, -55.6103515625, -52.3671875, -49.1240234375, -45.880859375, -42.6376953125, -39.39453125, -36.1513671875, -32.908203125, -29.6650390625, -26.421875, -23.1787109375, -19.935546875, -16.6923828125, -13.44921875, -10.2060546875, -6.962890625, -3.7197265625, -0.4765625, 2.7666015625, 6.009765625, 9.2529296875, 12.49609375, 15.7392578125, 18.982421875, 22.2255859375, 25.46875, 28.7119140625, 31.955078125, 35.1982421875, 38.44140625, 41.6845703125, 44.927734375, 48.1708984375, 51.4140625, 54.6572265625, 57.900390625, 61.1435546875, 64.38671875, 67.6298828125, 70.873046875, 74.1162109375, 77.359375, 80.6025390625, 83.845703125, 87.0888671875, 90.33203125, 93.5751953125, 96.818359375, 100.0615234375, 103.3046875, 106.5478515625, 109.791015625, 113.0341796875, 116.27734375, 119.5205078125, 122.763671875, 126.0068359375, 129.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 8.0, 6.0, 8.0, 12.0, 40.0, 83.0, 3285.0, 439.0, 93.0, 31.0, 20.0, 13.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.69482421875, -22.9521484375, -22.20947265625, -21.466796875, -20.72412109375, -19.9814453125, -19.23876953125, -18.49609375, -17.75341796875, -17.0107421875, -16.26806640625, -15.525390625, -14.78271484375, -14.0400390625, -13.29736328125, -12.5546875, -11.81201171875, -11.0693359375, -10.32666015625, -9.583984375, -8.84130859375, -8.0986328125, -7.35595703125, -6.61328125, -5.87060546875, -5.1279296875, -4.38525390625, -3.642578125, -2.89990234375, -2.1572265625, -1.41455078125, -0.671875, 0.07080078125, 0.8134765625, 1.55615234375, 2.298828125, 3.04150390625, 3.7841796875, 4.52685546875, 5.26953125, 6.01220703125, 6.7548828125, 7.49755859375, 8.240234375, 8.98291015625, 9.7255859375, 10.46826171875, 11.2109375, 11.95361328125, 12.6962890625, 13.43896484375, 14.181640625, 14.92431640625, 15.6669921875, 16.40966796875, 17.15234375, 17.89501953125, 18.6376953125, 19.38037109375, 20.123046875, 20.86572265625, 21.6083984375, 22.35107421875, 23.09375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 10.0, 5.0, 9.0, 11.0, 26.0, 28.0, 40.0, 58.0, 73.0, 95.0, 104.0, 90.0, 102.0, 101.0, 78.0, 48.0, 42.0, 24.0, 20.0, 13.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.728843688964844, -48.334014892578125, -45.939186096191406, -43.54435729980469, -41.14952850341797, -38.75469970703125, -36.35987091064453, -33.96504211425781, -31.570215225219727, -29.175386428833008, -26.78055763244629, -24.385730743408203, -21.990901947021484, -19.596073150634766, -17.201244354248047, -14.806415557861328, -12.41158676147461, -10.01675796508789, -7.62192964553833, -5.2271013259887695, -2.832272529602051, -0.43744373321533203, 1.9573841094970703, 4.352212905883789, 6.747041702270508, 9.141870498657227, 11.536699295043945, 13.931527137756348, 16.32635498046875, 18.72118377685547, 21.116012573242188, 23.510841369628906, 25.905670166015625, 28.300498962402344, 30.695327758789062, 33.09015655517578, 35.4849853515625, 37.87981414794922, 40.27464294433594, 42.669471740722656, 45.064300537109375, 47.459129333496094, 49.85395812988281, 52.24878692626953, 54.64361572265625, 57.03844451904297, 59.43327331542969, 61.828102111816406, 64.22293090820312, 66.61775970458984, 69.01258850097656, 71.40741729736328, 73.80224609375, 76.19707489013672, 78.59190368652344, 80.98673248291016, 83.38155364990234, 85.77638244628906, 88.17121124267578, 90.5660400390625, 92.96086883544922, 95.35569763183594, 97.75052642822266, 100.14535522460938, 102.5401840209961]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 7.0, 9.0, 5.0, 12.0, 9.0, 21.0, 19.0, 21.0, 27.0, 32.0, 25.0, 23.0, 31.0, 42.0, 30.0, 43.0, 28.0, 41.0, 42.0, 43.0, 40.0, 45.0, 36.0, 32.0, 47.0, 37.0, 29.0, 18.0, 32.0, 25.0, 19.0, 11.0, 12.0, 10.0, 6.0, 16.0, 7.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-33.992958068847656, -32.957664489746094, -31.9223690032959, -30.887075424194336, -29.851781845092773, -28.816486358642578, -27.781192779541016, -26.745899200439453, -25.71060562133789, -24.675312042236328, -23.640016555786133, -22.60472297668457, -21.569429397583008, -20.534133911132812, -19.49884033203125, -18.463546752929688, -17.428251266479492, -16.39295768737793, -15.35766315460205, -14.322368621826172, -13.28707504272461, -12.25178050994873, -11.216485977172852, -10.181192398071289, -9.14589786529541, -8.110603332519531, -7.075309753417969, -6.04001522064209, -5.004721164703369, -3.9694271087646484, -2.9341325759887695, -1.8988385200500488, -0.8635444641113281, 0.17174971103668213, 1.2070438861846924, 2.242338180541992, 3.277632236480713, 4.312926292419434, 5.3482208251953125, 6.383514881134033, 7.418808937072754, 8.454103469848633, 9.489397048950195, 10.524691581726074, 11.559986114501953, 12.595279693603516, 13.630574226379395, 14.665868759155273, 15.701162338256836, 16.7364559173584, 17.771751403808594, 18.807044982910156, 19.84233856201172, 20.87763214111328, 21.912927627563477, 22.94822120666504, 23.983516693115234, 25.018810272216797, 26.054105758666992, 27.089399337768555, 28.124692916870117, 29.159988403320312, 30.195281982421875, 31.230575561523438, 32.265869140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 16.0, 33.0, 31.0, 86.0, 149.0, 265.0, 518.0, 1157.0, 2775.0, 8022.0, 27098.0, 105403.0, 383085.0, 377551.0, 103199.0, 26142.0, 7956.0, 2824.0, 1135.0, 497.0, 259.0, 141.0, 75.0, 36.0, 31.0, 22.0, 10.0, 12.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.84375, -57.00439453125, -55.1650390625, -53.32568359375, -51.486328125, -49.64697265625, -47.8076171875, -45.96826171875, -44.12890625, -42.28955078125, -40.4501953125, -38.61083984375, -36.771484375, -34.93212890625, -33.0927734375, -31.25341796875, -29.4140625, -27.57470703125, -25.7353515625, -23.89599609375, -22.056640625, -20.21728515625, -18.3779296875, -16.53857421875, -14.69921875, -12.85986328125, -11.0205078125, -9.18115234375, -7.341796875, -5.50244140625, -3.6630859375, -1.82373046875, 0.015625, 1.85498046875, 3.6943359375, 5.53369140625, 7.373046875, 9.21240234375, 11.0517578125, 12.89111328125, 14.73046875, 16.56982421875, 18.4091796875, 20.24853515625, 22.087890625, 23.92724609375, 25.7666015625, 27.60595703125, 29.4453125, 31.28466796875, 33.1240234375, 34.96337890625, 36.802734375, 38.64208984375, 40.4814453125, 42.32080078125, 44.16015625, 45.99951171875, 47.8388671875, 49.67822265625, 51.517578125, 53.35693359375, 55.1962890625, 57.03564453125, 58.875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 5.0, 5.0, 11.0, 8.0, 13.0, 13.0, 27.0, 24.0, 31.0, 41.0, 42.0, 58.0, 46.0, 57.0, 65.0, 69.0, 45.0, 73.0, 64.0, 64.0, 45.0, 39.0, 26.0, 27.0, 17.0, 17.0, 20.0, 7.0, 11.0, 9.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.96875, -27.1396484375, -26.310546875, -25.4814453125, -24.65234375, -23.8232421875, -22.994140625, -22.1650390625, -21.3359375, -20.5068359375, -19.677734375, -18.8486328125, -18.01953125, -17.1904296875, -16.361328125, -15.5322265625, -14.703125, -13.8740234375, -13.044921875, -12.2158203125, -11.38671875, -10.5576171875, -9.728515625, -8.8994140625, -8.0703125, -7.2412109375, -6.412109375, -5.5830078125, -4.75390625, -3.9248046875, -3.095703125, -2.2666015625, -1.4375, -0.6083984375, 0.220703125, 1.0498046875, 1.87890625, 2.7080078125, 3.537109375, 4.3662109375, 5.1953125, 6.0244140625, 6.853515625, 7.6826171875, 8.51171875, 9.3408203125, 10.169921875, 10.9990234375, 11.828125, 12.6572265625, 13.486328125, 14.3154296875, 15.14453125, 15.9736328125, 16.802734375, 17.6318359375, 18.4609375, 19.2900390625, 20.119140625, 20.9482421875, 21.77734375, 22.6064453125, 23.435546875, 24.2646484375, 25.09375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 18.0, 24.0, 36.0, 43.0, 93.0, 126.0, 194.0, 314.0, 477.0, 875.0, 1686.0, 5586.0, 46802.0, 706049.0, 263027.0, 16880.0, 3305.0, 1240.0, 647.0, 438.0, 232.0, 163.0, 104.0, 68.0, 39.0, 25.0, 20.0, 15.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -65.71484375, -62.5546875, -59.39453125, -56.234375, -53.07421875, -49.9140625, -46.75390625, -43.59375, -40.43359375, -37.2734375, -34.11328125, -30.953125, -27.79296875, -24.6328125, -21.47265625, -18.3125, -15.15234375, -11.9921875, -8.83203125, -5.671875, -2.51171875, 0.6484375, 3.80859375, 6.96875, 10.12890625, 13.2890625, 16.44921875, 19.609375, 22.76953125, 25.9296875, 29.08984375, 32.25, 35.41015625, 38.5703125, 41.73046875, 44.890625, 48.05078125, 51.2109375, 54.37109375, 57.53125, 60.69140625, 63.8515625, 67.01171875, 70.171875, 73.33203125, 76.4921875, 79.65234375, 82.8125, 85.97265625, 89.1328125, 92.29296875, 95.453125, 98.61328125, 101.7734375, 104.93359375, 108.09375, 111.25390625, 114.4140625, 117.57421875, 120.734375, 123.89453125, 127.0546875, 130.21484375, 133.375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 10.0, 8.0, 17.0, 21.0, 18.0, 29.0, 39.0, 42.0, 57.0, 59.0, 63.0, 76.0, 78.0, 66.0, 72.0, 68.0, 58.0, 51.0, 39.0, 37.0, 29.0, 19.0, 12.0, 13.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-185.25, -180.783203125, -176.31640625, -171.849609375, -167.3828125, -162.916015625, -158.44921875, -153.982421875, -149.515625, -145.048828125, -140.58203125, -136.115234375, -131.6484375, -127.181640625, -122.71484375, -118.248046875, -113.78125, -109.314453125, -104.84765625, -100.380859375, -95.9140625, -91.447265625, -86.98046875, -82.513671875, -78.046875, -73.580078125, -69.11328125, -64.646484375, -60.1796875, -55.712890625, -51.24609375, -46.779296875, -42.3125, -37.845703125, -33.37890625, -28.912109375, -24.4453125, -19.978515625, -15.51171875, -11.044921875, -6.578125, -2.111328125, 2.35546875, 6.822265625, 11.2890625, 15.755859375, 20.22265625, 24.689453125, 29.15625, 33.623046875, 38.08984375, 42.556640625, 47.0234375, 51.490234375, 55.95703125, 60.423828125, 64.890625, 69.357421875, 73.82421875, 78.291015625, 82.7578125, 87.224609375, 91.69140625, 96.158203125, 100.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 9.0, 11.0, 14.0, 28.0, 27.0, 38.0, 64.0, 87.0, 130.0, 242.0, 481.0, 1224.0, 4872.0, 40474.0, 774147.0, 208867.0, 13804.0, 2385.0, 802.0, 320.0, 201.0, 87.0, 62.0, 43.0, 29.0, 25.0, 11.0, 11.0, 11.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.76708984375, -40.3154296875, -38.86376953125, -37.412109375, -35.96044921875, -34.5087890625, -33.05712890625, -31.60546875, -30.15380859375, -28.7021484375, -27.25048828125, -25.798828125, -24.34716796875, -22.8955078125, -21.44384765625, -19.9921875, -18.54052734375, -17.0888671875, -15.63720703125, -14.185546875, -12.73388671875, -11.2822265625, -9.83056640625, -8.37890625, -6.92724609375, -5.4755859375, -4.02392578125, -2.572265625, -1.12060546875, 0.3310546875, 1.78271484375, 3.234375, 4.68603515625, 6.1376953125, 7.58935546875, 9.041015625, 10.49267578125, 11.9443359375, 13.39599609375, 14.84765625, 16.29931640625, 17.7509765625, 19.20263671875, 20.654296875, 22.10595703125, 23.5576171875, 25.00927734375, 26.4609375, 27.91259765625, 29.3642578125, 30.81591796875, 32.267578125, 33.71923828125, 35.1708984375, 36.62255859375, 38.07421875, 39.52587890625, 40.9775390625, 42.42919921875, 43.880859375, 45.33251953125, 46.7841796875, 48.23583984375, 49.6875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 6.0, 8.0, 8.0, 20.0, 14.0, 24.0, 36.0, 40.0, 56.0, 93.0, 113.0, 129.0, 112.0, 92.0, 66.0, 36.0, 31.0, 17.0, 17.0, 16.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003875732421875, -0.0037534236907958984, -0.003631114959716797, -0.0035088062286376953, -0.0033864974975585938, -0.003264188766479492, -0.0031418800354003906, -0.003019571304321289, -0.0028972625732421875, -0.002774953842163086, -0.0026526451110839844, -0.002530336380004883, -0.0024080276489257812, -0.0022857189178466797, -0.002163410186767578, -0.0020411014556884766, -0.001918792724609375, -0.0017964839935302734, -0.0016741752624511719, -0.0015518665313720703, -0.0014295578002929688, -0.0013072490692138672, -0.0011849403381347656, -0.001062631607055664, -0.0009403228759765625, -0.0008180141448974609, -0.0006957054138183594, -0.0005733966827392578, -0.00045108795166015625, -0.0003287792205810547, -0.00020647048950195312, -8.416175842285156e-05, 3.814697265625e-05, 0.00016045570373535156, 0.0002827644348144531, 0.0004050731658935547, 0.0005273818969726562, 0.0006496906280517578, 0.0007719993591308594, 0.0008943080902099609, 0.0010166168212890625, 0.001138925552368164, 0.0012612342834472656, 0.0013835430145263672, 0.0015058517456054688, 0.0016281604766845703, 0.0017504692077636719, 0.0018727779388427734, 0.001995086669921875, 0.0021173954010009766, 0.002239704132080078, 0.0023620128631591797, 0.0024843215942382812, 0.002606630325317383, 0.0027289390563964844, 0.002851247787475586, 0.0029735565185546875, 0.003095865249633789, 0.0032181739807128906, 0.003340482711791992, 0.0034627914428710938, 0.0035851001739501953, 0.003707408905029297, 0.0038297176361083984, 0.0039520263671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 13.0, 29.0, 64.0, 102.0, 196.0, 421.0, 1246.0, 7709.0, 188352.0, 823240.0, 23409.0, 2547.0, 691.0, 268.0, 119.0, 69.0, 37.0, 18.0, 8.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.49609375, -62.4296875, -60.36328125, -58.296875, -56.23046875, -54.1640625, -52.09765625, -50.03125, -47.96484375, -45.8984375, -43.83203125, -41.765625, -39.69921875, -37.6328125, -35.56640625, -33.5, -31.43359375, -29.3671875, -27.30078125, -25.234375, -23.16796875, -21.1015625, -19.03515625, -16.96875, -14.90234375, -12.8359375, -10.76953125, -8.703125, -6.63671875, -4.5703125, -2.50390625, -0.4375, 1.62890625, 3.6953125, 5.76171875, 7.828125, 9.89453125, 11.9609375, 14.02734375, 16.09375, 18.16015625, 20.2265625, 22.29296875, 24.359375, 26.42578125, 28.4921875, 30.55859375, 32.625, 34.69140625, 36.7578125, 38.82421875, 40.890625, 42.95703125, 45.0234375, 47.08984375, 49.15625, 51.22265625, 53.2890625, 55.35546875, 57.421875, 59.48828125, 61.5546875, 63.62109375, 65.6875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 1.0, 7.0, 8.0, 9.0, 13.0, 22.0, 18.0, 32.0, 58.0, 56.0, 83.0, 126.0, 118.0, 113.0, 87.0, 70.0, 59.0, 35.0, 22.0, 12.0, 9.0, 7.0, 6.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9375, -29.84814453125, -28.7587890625, -27.66943359375, -26.580078125, -25.49072265625, -24.4013671875, -23.31201171875, -22.22265625, -21.13330078125, -20.0439453125, -18.95458984375, -17.865234375, -16.77587890625, -15.6865234375, -14.59716796875, -13.5078125, -12.41845703125, -11.3291015625, -10.23974609375, -9.150390625, -8.06103515625, -6.9716796875, -5.88232421875, -4.79296875, -3.70361328125, -2.6142578125, -1.52490234375, -0.435546875, 0.65380859375, 1.7431640625, 2.83251953125, 3.921875, 5.01123046875, 6.1005859375, 7.18994140625, 8.279296875, 9.36865234375, 10.4580078125, 11.54736328125, 12.63671875, 13.72607421875, 14.8154296875, 15.90478515625, 16.994140625, 18.08349609375, 19.1728515625, 20.26220703125, 21.3515625, 22.44091796875, 23.5302734375, 24.61962890625, 25.708984375, 26.79833984375, 27.8876953125, 28.97705078125, 30.06640625, 31.15576171875, 32.2451171875, 33.33447265625, 34.423828125, 35.51318359375, 36.6025390625, 37.69189453125, 38.78125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 20.0, 70.0, 176.0, 306.0, 261.0, 111.0, 27.0, 17.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-839.79931640625, -805.8283081054688, -771.8572387695312, -737.88623046875, -703.9151611328125, -669.9441528320312, -635.97314453125, -602.0020751953125, -568.031005859375, -534.0599975585938, -500.08892822265625, -466.117919921875, -432.1468505859375, -398.17584228515625, -364.2048034667969, -330.2337646484375, -296.26275634765625, -262.2917175292969, -228.3206787109375, -194.3496551513672, -160.3786163330078, -126.40757751464844, -92.43655395507812, -58.46551513671875, -24.494476318359375, 9.476558685302734, 43.447593688964844, 77.41862487792969, 111.38966369628906, 145.36070251464844, 179.33172607421875, 213.30276489257812, 247.2738037109375, 281.2448425292969, 315.21588134765625, 349.1868896484375, 383.157958984375, 417.12896728515625, 451.1000061035156, 485.071044921875, 519.0421142578125, 553.0131225585938, 586.9841918945312, 620.9552001953125, 654.92626953125, 688.8972778320312, 722.8682861328125, 756.83935546875, 790.8103637695312, 824.7813720703125, 858.75244140625, 892.7234497070312, 926.6945190429688, 960.66552734375, 994.6365966796875, 1028.607666015625, 1062.57861328125, 1096.5496826171875, 1130.5206298828125, 1164.49169921875, 1198.4627685546875, 1232.433837890625, 1266.40478515625, 1300.3758544921875, 1334.346923828125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 4.0, 7.0, 16.0, 7.0, 15.0, 18.0, 20.0, 27.0, 10.0, 26.0, 32.0, 34.0, 38.0, 31.0, 34.0, 38.0, 49.0, 32.0, 43.0, 44.0, 49.0, 45.0, 39.0, 41.0, 37.0, 35.0, 34.0, 30.0, 32.0, 18.0, 24.0, 16.0, 13.0, 8.0, 8.0, 7.0, 10.0, 3.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-383.5564270019531, -372.88934326171875, -362.22222900390625, -351.5551452636719, -340.8880615234375, -330.220947265625, -319.5538635253906, -308.88677978515625, -298.21966552734375, -287.5525817871094, -276.8854675292969, -266.2183837890625, -255.55128479003906, -244.88418579101562, -234.21710205078125, -223.5500030517578, -212.88290405273438, -202.21580505371094, -191.5487060546875, -180.88162231445312, -170.2145233154297, -159.54742431640625, -148.88034057617188, -138.21324157714844, -127.546142578125, -116.87904357910156, -106.21195220947266, -95.54486083984375, -84.87776184082031, -74.21066284179688, -63.54357147216797, -52.87648010253906, -42.2093505859375, -31.542255401611328, -20.875160217285156, -10.208065032958984, 0.4590301513671875, 11.12612533569336, 21.79322052001953, 32.46031188964844, 43.127410888671875, 53.79450607299805, 64.46160125732422, 75.12869262695312, 85.79579162597656, 96.462890625, 107.1299819946289, 117.79707336425781, 128.46417236328125, 139.1312713623047, 149.79837036132812, 160.4654541015625, 171.13255310058594, 181.79965209960938, 192.46673583984375, 203.1338348388672, 213.80093383789062, 224.46803283691406, 235.1351318359375, 245.80221557617188, 256.46929931640625, 267.13641357421875, 277.8034973144531, 288.4705810546875, 299.1376953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 8.0, 4.0, 13.0, 16.0, 35.0, 41.0, 61.0, 102.0, 170.0, 321.0, 633.0, 1458.0, 3431.0, 9323.0, 38308.0, 3936131.0, 174795.0, 19267.0, 5754.0, 2209.0, 1034.0, 493.0, 266.0, 144.0, 81.0, 66.0, 32.0, 23.0, 17.0, 11.0, 10.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.3125, -97.79296875, -94.2734375, -90.75390625, -87.234375, -83.71484375, -80.1953125, -76.67578125, -73.15625, -69.63671875, -66.1171875, -62.59765625, -59.078125, -55.55859375, -52.0390625, -48.51953125, -45.0, -41.48046875, -37.9609375, -34.44140625, -30.921875, -27.40234375, -23.8828125, -20.36328125, -16.84375, -13.32421875, -9.8046875, -6.28515625, -2.765625, 0.75390625, 4.2734375, 7.79296875, 11.3125, 14.83203125, 18.3515625, 21.87109375, 25.390625, 28.91015625, 32.4296875, 35.94921875, 39.46875, 42.98828125, 46.5078125, 50.02734375, 53.546875, 57.06640625, 60.5859375, 64.10546875, 67.625, 71.14453125, 74.6640625, 78.18359375, 81.703125, 85.22265625, 88.7421875, 92.26171875, 95.78125, 99.30078125, 102.8203125, 106.33984375, 109.859375, 113.37890625, 116.8984375, 120.41796875, 123.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 11.0, 16.0, 33.0, 24.0, 39.0, 47.0, 62.0, 78.0, 77.0, 76.0, 93.0, 78.0, 81.0, 54.0, 47.0, 45.0, 32.0, 22.0, 26.0, 15.0, 6.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-41.6875, -40.64501953125, -39.6025390625, -38.56005859375, -37.517578125, -36.47509765625, -35.4326171875, -34.39013671875, -33.34765625, -32.30517578125, -31.2626953125, -30.22021484375, -29.177734375, -28.13525390625, -27.0927734375, -26.05029296875, -25.0078125, -23.96533203125, -22.9228515625, -21.88037109375, -20.837890625, -19.79541015625, -18.7529296875, -17.71044921875, -16.66796875, -15.62548828125, -14.5830078125, -13.54052734375, -12.498046875, -11.45556640625, -10.4130859375, -9.37060546875, -8.328125, -7.28564453125, -6.2431640625, -5.20068359375, -4.158203125, -3.11572265625, -2.0732421875, -1.03076171875, 0.01171875, 1.05419921875, 2.0966796875, 3.13916015625, 4.181640625, 5.22412109375, 6.2666015625, 7.30908203125, 8.3515625, 9.39404296875, 10.4365234375, 11.47900390625, 12.521484375, 13.56396484375, 14.6064453125, 15.64892578125, 16.69140625, 17.73388671875, 18.7763671875, 19.81884765625, 20.861328125, 21.90380859375, 22.9462890625, 23.98876953125, 25.03125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 5.0, 6.0, 6.0, 15.0, 19.0, 34.0, 40.0, 56.0, 66.0, 113.0, 201.0, 293.0, 412.0, 630.0, 1142.0, 2163.0, 4407.0, 10245.0, 30675.0, 194341.0, 3821474.0, 92151.0, 20431.0, 7490.0, 3495.0, 1753.0, 936.0, 603.0, 328.0, 242.0, 163.0, 116.0, 61.0, 39.0, 45.0, 17.0, 18.0, 21.0, 8.0, 9.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.34375, -57.4501953125, -55.556640625, -53.6630859375, -51.76953125, -49.8759765625, -47.982421875, -46.0888671875, -44.1953125, -42.3017578125, -40.408203125, -38.5146484375, -36.62109375, -34.7275390625, -32.833984375, -30.9404296875, -29.046875, -27.1533203125, -25.259765625, -23.3662109375, -21.47265625, -19.5791015625, -17.685546875, -15.7919921875, -13.8984375, -12.0048828125, -10.111328125, -8.2177734375, -6.32421875, -4.4306640625, -2.537109375, -0.6435546875, 1.25, 3.1435546875, 5.037109375, 6.9306640625, 8.82421875, 10.7177734375, 12.611328125, 14.5048828125, 16.3984375, 18.2919921875, 20.185546875, 22.0791015625, 23.97265625, 25.8662109375, 27.759765625, 29.6533203125, 31.546875, 33.4404296875, 35.333984375, 37.2275390625, 39.12109375, 41.0146484375, 42.908203125, 44.8017578125, 46.6953125, 48.5888671875, 50.482421875, 52.3759765625, 54.26953125, 56.1630859375, 58.056640625, 59.9501953125, 61.84375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 8.0, 6.0, 6.0, 17.0, 30.0, 37.0, 50.0, 62.0, 124.0, 378.0, 2708.0, 300.0, 116.0, 66.0, 41.0, 30.0, 22.0, 11.0, 6.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.78125, -19.15185546875, -18.5224609375, -17.89306640625, -17.263671875, -16.63427734375, -16.0048828125, -15.37548828125, -14.74609375, -14.11669921875, -13.4873046875, -12.85791015625, -12.228515625, -11.59912109375, -10.9697265625, -10.34033203125, -9.7109375, -9.08154296875, -8.4521484375, -7.82275390625, -7.193359375, -6.56396484375, -5.9345703125, -5.30517578125, -4.67578125, -4.04638671875, -3.4169921875, -2.78759765625, -2.158203125, -1.52880859375, -0.8994140625, -0.27001953125, 0.359375, 0.98876953125, 1.6181640625, 2.24755859375, 2.876953125, 3.50634765625, 4.1357421875, 4.76513671875, 5.39453125, 6.02392578125, 6.6533203125, 7.28271484375, 7.912109375, 8.54150390625, 9.1708984375, 9.80029296875, 10.4296875, 11.05908203125, 11.6884765625, 12.31787109375, 12.947265625, 13.57666015625, 14.2060546875, 14.83544921875, 15.46484375, 16.09423828125, 16.7236328125, 17.35302734375, 17.982421875, 18.61181640625, 19.2412109375, 19.87060546875, 20.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 17.0, 20.0, 20.0, 25.0, 42.0, 40.0, 68.0, 70.0, 98.0, 114.0, 96.0, 93.0, 74.0, 59.0, 53.0, 30.0, 27.0, 14.0, 13.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.06675720214844, -99.00914001464844, -95.95153045654297, -92.8939208984375, -89.8363037109375, -86.7786865234375, -83.72107696533203, -80.66346740722656, -77.60585021972656, -74.54823303222656, -71.4906234741211, -68.43301391601562, -65.37539672851562, -62.31778335571289, -59.260169982910156, -56.20255661010742, -53.14494323730469, -50.08732986450195, -47.02971649169922, -43.972103118896484, -40.91448974609375, -37.856876373291016, -34.79926300048828, -31.741649627685547, -28.684036254882812, -25.626422882080078, -22.568809509277344, -19.51119613647461, -16.453582763671875, -13.39596939086914, -10.338356018066406, -7.280742645263672, -4.2231292724609375, -1.1655158996582031, 1.8920974731445312, 4.949710845947266, 8.00732421875, 11.064937591552734, 14.122550964355469, 17.180164337158203, 20.237777709960938, 23.295391082763672, 26.353004455566406, 29.41061782836914, 32.468231201171875, 35.52584457397461, 38.583457946777344, 41.64107131958008, 44.69868469238281, 47.75629806518555, 50.81391143798828, 53.871524810791016, 56.92913818359375, 59.986751556396484, 63.04436492919922, 66.10197448730469, 69.15959167480469, 72.21720886230469, 75.27481842041016, 78.33242797851562, 81.39004516601562, 84.44766235351562, 87.5052719116211, 90.56288146972656, 93.62049865722656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 11.0, 9.0, 9.0, 6.0, 20.0, 15.0, 20.0, 17.0, 14.0, 22.0, 26.0, 33.0, 33.0, 46.0, 40.0, 43.0, 44.0, 50.0, 46.0, 48.0, 48.0, 46.0, 53.0, 47.0, 34.0, 35.0, 36.0, 26.0, 16.0, 29.0, 16.0, 16.0, 12.0, 10.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.46294403076172, -61.66453170776367, -59.866119384765625, -58.06770706176758, -56.26929473876953, -54.470882415771484, -52.67247009277344, -50.87405776977539, -49.075645446777344, -47.2772331237793, -45.47882080078125, -43.6804084777832, -41.881996154785156, -40.08358383178711, -38.28517150878906, -36.486759185791016, -34.68834686279297, -32.88993453979492, -31.091522216796875, -29.293109893798828, -27.49469757080078, -25.696285247802734, -23.897872924804688, -22.09946060180664, -20.301044464111328, -18.50263214111328, -16.704219818115234, -14.905807495117188, -13.10739517211914, -11.308981895446777, -9.51056957244873, -7.712157249450684, -5.913745880126953, -4.115333557128906, -2.3169209957122803, -0.5185084342956543, 1.2799038887023926, 3.0783166885375977, 4.8767290115356445, 6.675141334533691, 8.473553657531738, 10.271965980529785, 12.070378303527832, 13.868791580200195, 15.667203903198242, 17.46561622619629, 19.264028549194336, 21.062440872192383, 22.86085319519043, 24.659265518188477, 26.457677841186523, 28.25609016418457, 30.054502487182617, 31.852916717529297, 33.651329040527344, 35.44974136352539, 37.24815368652344, 39.046566009521484, 40.84497833251953, 42.64339065551758, 44.441802978515625, 46.24021530151367, 48.03862762451172, 49.837039947509766, 51.63545227050781]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 8.0, 7.0, 16.0, 17.0, 29.0, 43.0, 63.0, 111.0, 156.0, 227.0, 372.0, 652.0, 1175.0, 2221.0, 4894.0, 11477.0, 29517.0, 81389.0, 224506.0, 399909.0, 182838.0, 66699.0, 24105.0, 9448.0, 4109.0, 1983.0, 1047.0, 572.0, 348.0, 194.0, 135.0, 91.0, 43.0, 45.0, 28.0, 14.0, 11.0, 12.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.21875, -60.29833984375, -58.3779296875, -56.45751953125, -54.537109375, -52.61669921875, -50.6962890625, -48.77587890625, -46.85546875, -44.93505859375, -43.0146484375, -41.09423828125, -39.173828125, -37.25341796875, -35.3330078125, -33.41259765625, -31.4921875, -29.57177734375, -27.6513671875, -25.73095703125, -23.810546875, -21.89013671875, -19.9697265625, -18.04931640625, -16.12890625, -14.20849609375, -12.2880859375, -10.36767578125, -8.447265625, -6.52685546875, -4.6064453125, -2.68603515625, -0.765625, 1.15478515625, 3.0751953125, 4.99560546875, 6.916015625, 8.83642578125, 10.7568359375, 12.67724609375, 14.59765625, 16.51806640625, 18.4384765625, 20.35888671875, 22.279296875, 24.19970703125, 26.1201171875, 28.04052734375, 29.9609375, 31.88134765625, 33.8017578125, 35.72216796875, 37.642578125, 39.56298828125, 41.4833984375, 43.40380859375, 45.32421875, 47.24462890625, 49.1650390625, 51.08544921875, 53.005859375, 54.92626953125, 56.8466796875, 58.76708984375, 60.6875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 7.0, 11.0, 12.0, 15.0, 17.0, 23.0, 35.0, 44.0, 41.0, 62.0, 56.0, 65.0, 69.0, 82.0, 68.0, 73.0, 54.0, 58.0, 38.0, 36.0, 29.0, 28.0, 25.0, 12.0, 10.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.625, -32.701416015625, -31.77783203125, -30.854248046875, -29.9306640625, -29.007080078125, -28.08349609375, -27.159912109375, -26.236328125, -25.312744140625, -24.38916015625, -23.465576171875, -22.5419921875, -21.618408203125, -20.69482421875, -19.771240234375, -18.84765625, -17.924072265625, -17.00048828125, -16.076904296875, -15.1533203125, -14.229736328125, -13.30615234375, -12.382568359375, -11.458984375, -10.535400390625, -9.61181640625, -8.688232421875, -7.7646484375, -6.841064453125, -5.91748046875, -4.993896484375, -4.0703125, -3.146728515625, -2.22314453125, -1.299560546875, -0.3759765625, 0.547607421875, 1.47119140625, 2.394775390625, 3.318359375, 4.241943359375, 5.16552734375, 6.089111328125, 7.0126953125, 7.936279296875, 8.85986328125, 9.783447265625, 10.70703125, 11.630615234375, 12.55419921875, 13.477783203125, 14.4013671875, 15.324951171875, 16.24853515625, 17.172119140625, 18.095703125, 19.019287109375, 19.94287109375, 20.866455078125, 21.7900390625, 22.713623046875, 23.63720703125, 24.560791015625, 25.484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 13.0, 21.0, 16.0, 23.0, 30.0, 36.0, 58.0, 87.0, 104.0, 183.0, 277.0, 418.0, 777.0, 1479.0, 4427.0, 18393.0, 135911.0, 712175.0, 146622.0, 19379.0, 4485.0, 1551.0, 753.0, 412.0, 278.0, 169.0, 120.0, 92.0, 62.0, 51.0, 24.0, 30.0, 21.0, 16.0, 4.0, 6.0, 8.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -77.9453125, -74.890625, -71.8359375, -68.78125, -65.7265625, -62.671875, -59.6171875, -56.5625, -53.5078125, -50.453125, -47.3984375, -44.34375, -41.2890625, -38.234375, -35.1796875, -32.125, -29.0703125, -26.015625, -22.9609375, -19.90625, -16.8515625, -13.796875, -10.7421875, -7.6875, -4.6328125, -1.578125, 1.4765625, 4.53125, 7.5859375, 10.640625, 13.6953125, 16.75, 19.8046875, 22.859375, 25.9140625, 28.96875, 32.0234375, 35.078125, 38.1328125, 41.1875, 44.2421875, 47.296875, 50.3515625, 53.40625, 56.4609375, 59.515625, 62.5703125, 65.625, 68.6796875, 71.734375, 74.7890625, 77.84375, 80.8984375, 83.953125, 87.0078125, 90.0625, 93.1171875, 96.171875, 99.2265625, 102.28125, 105.3359375, 108.390625, 111.4453125, 114.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 9.0, 14.0, 11.0, 10.0, 19.0, 22.0, 22.0, 21.0, 26.0, 42.0, 39.0, 45.0, 48.0, 50.0, 53.0, 60.0, 43.0, 48.0, 50.0, 53.0, 45.0, 29.0, 34.0, 32.0, 31.0, 20.0, 29.0, 17.0, 20.0, 12.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-96.0, -93.3427734375, -90.685546875, -88.0283203125, -85.37109375, -82.7138671875, -80.056640625, -77.3994140625, -74.7421875, -72.0849609375, -69.427734375, -66.7705078125, -64.11328125, -61.4560546875, -58.798828125, -56.1416015625, -53.484375, -50.8271484375, -48.169921875, -45.5126953125, -42.85546875, -40.1982421875, -37.541015625, -34.8837890625, -32.2265625, -29.5693359375, -26.912109375, -24.2548828125, -21.59765625, -18.9404296875, -16.283203125, -13.6259765625, -10.96875, -8.3115234375, -5.654296875, -2.9970703125, -0.33984375, 2.3173828125, 4.974609375, 7.6318359375, 10.2890625, 12.9462890625, 15.603515625, 18.2607421875, 20.91796875, 23.5751953125, 26.232421875, 28.8896484375, 31.546875, 34.2041015625, 36.861328125, 39.5185546875, 42.17578125, 44.8330078125, 47.490234375, 50.1474609375, 52.8046875, 55.4619140625, 58.119140625, 60.7763671875, 63.43359375, 66.0908203125, 68.748046875, 71.4052734375, 74.0625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 5.0, 12.0, 15.0, 21.0, 41.0, 48.0, 90.0, 196.0, 401.0, 867.0, 2558.0, 10359.0, 68254.0, 604173.0, 316037.0, 35899.0, 6373.0, 1809.0, 698.0, 325.0, 168.0, 83.0, 57.0, 37.0, 12.0, 7.0, 11.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -21.081787109375, -20.11669921875, -19.151611328125, -18.1865234375, -17.221435546875, -16.25634765625, -15.291259765625, -14.326171875, -13.361083984375, -12.39599609375, -11.430908203125, -10.4658203125, -9.500732421875, -8.53564453125, -7.570556640625, -6.60546875, -5.640380859375, -4.67529296875, -3.710205078125, -2.7451171875, -1.780029296875, -0.81494140625, 0.150146484375, 1.115234375, 2.080322265625, 3.04541015625, 4.010498046875, 4.9755859375, 5.940673828125, 6.90576171875, 7.870849609375, 8.8359375, 9.801025390625, 10.76611328125, 11.731201171875, 12.6962890625, 13.661376953125, 14.62646484375, 15.591552734375, 16.556640625, 17.521728515625, 18.48681640625, 19.451904296875, 20.4169921875, 21.382080078125, 22.34716796875, 23.312255859375, 24.27734375, 25.242431640625, 26.20751953125, 27.172607421875, 28.1376953125, 29.102783203125, 30.06787109375, 31.032958984375, 31.998046875, 32.963134765625, 33.92822265625, 34.893310546875, 35.8583984375, 36.823486328125, 37.78857421875, 38.753662109375, 39.71875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 9.0, 15.0, 17.0, 21.0, 27.0, 23.0, 31.0, 45.0, 75.0, 107.0, 131.0, 119.0, 73.0, 56.0, 55.0, 42.0, 28.0, 30.0, 17.0, 14.0, 15.0, 6.0, 4.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004326164722442627, -0.004166245460510254, -0.004006326198577881, -0.003846406936645508, -0.0036864876747131348, -0.0035265684127807617, -0.0033666491508483887, -0.0032067298889160156, -0.0030468106269836426, -0.0028868913650512695, -0.0027269721031188965, -0.0025670528411865234, -0.0024071335792541504, -0.0022472143173217773, -0.0020872950553894043, -0.0019273757934570312, -0.0017674565315246582, -0.0016075372695922852, -0.0014476180076599121, -0.001287698745727539, -0.001127779483795166, -0.000967860221862793, -0.0008079409599304199, -0.0006480216979980469, -0.00048810243606567383, -0.0003281831741333008, -0.00016826391220092773, -8.344650268554688e-06, 0.00015157461166381836, 0.0003114938735961914, 0.00047141313552856445, 0.0006313323974609375, 0.0007912516593933105, 0.0009511709213256836, 0.0011110901832580566, 0.0012710094451904297, 0.0014309287071228027, 0.0015908479690551758, 0.0017507672309875488, 0.0019106864929199219, 0.002070605754852295, 0.002230525016784668, 0.002390444278717041, 0.002550363540649414, 0.002710282802581787, 0.00287020206451416, 0.003030121326446533, 0.0031900405883789062, 0.0033499598503112793, 0.0035098791122436523, 0.0036697983741760254, 0.0038297176361083984, 0.0039896368980407715, 0.0041495561599731445, 0.004309475421905518, 0.004469394683837891, 0.004629313945770264, 0.004789233207702637, 0.00494915246963501, 0.005109071731567383, 0.005268990993499756, 0.005428910255432129, 0.005588829517364502, 0.005748748779296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 8.0, 12.0, 29.0, 57.0, 72.0, 170.0, 306.0, 666.0, 1739.0, 7314.0, 76359.0, 799994.0, 147079.0, 11071.0, 2084.0, 804.0, 352.0, 186.0, 122.0, 55.0, 25.0, 11.0, 15.0, 10.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -28.777587890625, -27.44580078125, -26.114013671875, -24.7822265625, -23.450439453125, -22.11865234375, -20.786865234375, -19.455078125, -18.123291015625, -16.79150390625, -15.459716796875, -14.1279296875, -12.796142578125, -11.46435546875, -10.132568359375, -8.80078125, -7.468994140625, -6.13720703125, -4.805419921875, -3.4736328125, -2.141845703125, -0.81005859375, 0.521728515625, 1.853515625, 3.185302734375, 4.51708984375, 5.848876953125, 7.1806640625, 8.512451171875, 9.84423828125, 11.176025390625, 12.5078125, 13.839599609375, 15.17138671875, 16.503173828125, 17.8349609375, 19.166748046875, 20.49853515625, 21.830322265625, 23.162109375, 24.493896484375, 25.82568359375, 27.157470703125, 28.4892578125, 29.821044921875, 31.15283203125, 32.484619140625, 33.81640625, 35.148193359375, 36.47998046875, 37.811767578125, 39.1435546875, 40.475341796875, 41.80712890625, 43.138916015625, 44.470703125, 45.802490234375, 47.13427734375, 48.466064453125, 49.7978515625, 51.129638671875, 52.46142578125, 53.793212890625, 55.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 3.0, 7.0, 9.0, 12.0, 19.0, 17.0, 26.0, 32.0, 26.0, 26.0, 36.0, 42.0, 64.0, 45.0, 45.0, 71.0, 62.0, 56.0, 60.0, 47.0, 49.0, 44.0, 29.0, 32.0, 20.0, 15.0, 14.0, 17.0, 9.0, 14.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.25, -19.65625, -19.0625, -18.46875, -17.875, -17.28125, -16.6875, -16.09375, -15.5, -14.90625, -14.3125, -13.71875, -13.125, -12.53125, -11.9375, -11.34375, -10.75, -10.15625, -9.5625, -8.96875, -8.375, -7.78125, -7.1875, -6.59375, -6.0, -5.40625, -4.8125, -4.21875, -3.625, -3.03125, -2.4375, -1.84375, -1.25, -0.65625, -0.0625, 0.53125, 1.125, 1.71875, 2.3125, 2.90625, 3.5, 4.09375, 4.6875, 5.28125, 5.875, 6.46875, 7.0625, 7.65625, 8.25, 8.84375, 9.4375, 10.03125, 10.625, 11.21875, 11.8125, 12.40625, 13.0, 13.59375, 14.1875, 14.78125, 15.375, 15.96875, 16.5625, 17.15625, 17.75]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 10.0, 56.0, 245.0, 430.0, 210.0, 44.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-664.328369140625, -600.9441528320312, -537.5599975585938, -474.17578125, -410.7915954589844, -347.40740966796875, -284.023193359375, -220.63900756835938, -157.25482177734375, -93.8706283569336, -30.486434936523438, 32.89776611328125, 96.28195190429688, 159.6661376953125, 223.05035400390625, 286.4345397949219, 349.8187255859375, 413.2029113769531, 476.58709716796875, 539.9713134765625, 603.35546875, 666.7396850585938, 730.1239013671875, 793.508056640625, 856.8922729492188, 920.2764892578125, 983.66064453125, 1047.044921875, 1110.4290771484375, 1173.813232421875, 1237.197509765625, 1300.5816650390625, 1363.9658203125, 1427.3499755859375, 1490.7342529296875, 1554.118408203125, 1617.5025634765625, 1680.88671875, 1744.27099609375, 1807.6551513671875, 1871.039306640625, 1934.4234619140625, 1997.8077392578125, 2061.19189453125, 2124.576171875, 2187.960205078125, 2251.344482421875, 2314.728759765625, 2378.11279296875, 2441.4970703125, 2504.881103515625, 2568.265380859375, 2631.649658203125, 2695.03369140625, 2758.41796875, 2821.80224609375, 2885.1865234375, 2948.57080078125, 3011.954833984375, 3075.339111328125, 3138.723388671875, 3202.107421875, 3265.49169921875, 3328.8759765625, 3392.260009765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 1.0, 4.0, 4.0, 10.0, 14.0, 15.0, 7.0, 14.0, 16.0, 32.0, 18.0, 37.0, 41.0, 36.0, 55.0, 62.0, 63.0, 56.0, 56.0, 52.0, 54.0, 40.0, 39.0, 55.0, 38.0, 28.0, 29.0, 22.0, 27.0, 17.0, 10.0, 13.0, 7.0, 8.0, 8.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.4562683105469, -313.5807800292969, -300.705322265625, -287.829833984375, -274.9543762207031, -262.0788879394531, -249.2034149169922, -236.32794189453125, -223.4524688720703, -210.57699584960938, -197.70152282714844, -184.8260498046875, -171.9505615234375, -159.07510375976562, -146.19961547851562, -133.3241424560547, -120.44866943359375, -107.57319641113281, -94.69772338867188, -81.8222427368164, -68.94676971435547, -56.07129669189453, -43.19581604003906, -30.320343017578125, -17.444869995117188, -4.569395065307617, 8.306079864501953, 21.181556701660156, 34.057029724121094, 46.93250274658203, 59.8079833984375, 72.68345642089844, 85.5589599609375, 98.43443298339844, 111.30990600585938, 124.18538665771484, 137.06085205078125, 149.93634033203125, 162.8118133544922, 175.68728637695312, 188.56275939941406, 201.438232421875, 214.31370544433594, 227.18917846679688, 240.06466674804688, 252.94012451171875, 265.81561279296875, 278.69110107421875, 291.5665588378906, 304.4420471191406, 317.3175048828125, 330.1929931640625, 343.0684509277344, 355.9439392089844, 368.81939697265625, 381.69488525390625, 394.57037353515625, 407.44586181640625, 420.3213195800781, 433.1968078613281, 446.072265625, 458.94775390625, 471.8232421875, 484.6986999511719, 497.57415771484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 13.0, 18.0, 34.0, 41.0, 74.0, 160.0, 303.0, 750.0, 1757.0, 5009.0, 18738.0, 108123.0, 2945614.0, 1031156.0, 63566.0, 12635.0, 3696.0, 1359.0, 596.0, 285.0, 133.0, 90.0, 39.0, 37.0, 22.0, 17.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.240234375, -62.98046875, -60.720703125, -58.4609375, -56.201171875, -53.94140625, -51.681640625, -49.421875, -47.162109375, -44.90234375, -42.642578125, -40.3828125, -38.123046875, -35.86328125, -33.603515625, -31.34375, -29.083984375, -26.82421875, -24.564453125, -22.3046875, -20.044921875, -17.78515625, -15.525390625, -13.265625, -11.005859375, -8.74609375, -6.486328125, -4.2265625, -1.966796875, 0.29296875, 2.552734375, 4.8125, 7.072265625, 9.33203125, 11.591796875, 13.8515625, 16.111328125, 18.37109375, 20.630859375, 22.890625, 25.150390625, 27.41015625, 29.669921875, 31.9296875, 34.189453125, 36.44921875, 38.708984375, 40.96875, 43.228515625, 45.48828125, 47.748046875, 50.0078125, 52.267578125, 54.52734375, 56.787109375, 59.046875, 61.306640625, 63.56640625, 65.826171875, 68.0859375, 70.345703125, 72.60546875, 74.865234375, 77.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 16.0, 16.0, 20.0, 33.0, 37.0, 31.0, 33.0, 42.0, 61.0, 68.0, 63.0, 76.0, 54.0, 61.0, 48.0, 60.0, 42.0, 37.0, 31.0, 26.0, 27.0, 20.0, 10.0, 15.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.265625, -20.547119140625, -19.82861328125, -19.110107421875, -18.3916015625, -17.673095703125, -16.95458984375, -16.236083984375, -15.517578125, -14.799072265625, -14.08056640625, -13.362060546875, -12.6435546875, -11.925048828125, -11.20654296875, -10.488037109375, -9.76953125, -9.051025390625, -8.33251953125, -7.614013671875, -6.8955078125, -6.177001953125, -5.45849609375, -4.739990234375, -4.021484375, -3.302978515625, -2.58447265625, -1.865966796875, -1.1474609375, -0.428955078125, 0.28955078125, 1.008056640625, 1.7265625, 2.445068359375, 3.16357421875, 3.882080078125, 4.6005859375, 5.319091796875, 6.03759765625, 6.756103515625, 7.474609375, 8.193115234375, 8.91162109375, 9.630126953125, 10.3486328125, 11.067138671875, 11.78564453125, 12.504150390625, 13.22265625, 13.941162109375, 14.65966796875, 15.378173828125, 16.0966796875, 16.815185546875, 17.53369140625, 18.252197265625, 18.970703125, 19.689208984375, 20.40771484375, 21.126220703125, 21.8447265625, 22.563232421875, 23.28173828125, 24.000244140625, 24.71875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 8.0, 7.0, 8.0, 17.0, 17.0, 31.0, 49.0, 125.0, 205.0, 427.0, 1051.0, 3144.0, 12364.0, 76986.0, 2855718.0, 1178103.0, 52257.0, 9431.0, 2583.0, 836.0, 407.0, 195.0, 122.0, 66.0, 31.0, 29.0, 19.0, 16.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-86.6875, -84.2041015625, -81.720703125, -79.2373046875, -76.75390625, -74.2705078125, -71.787109375, -69.3037109375, -66.8203125, -64.3369140625, -61.853515625, -59.3701171875, -56.88671875, -54.4033203125, -51.919921875, -49.4365234375, -46.953125, -44.4697265625, -41.986328125, -39.5029296875, -37.01953125, -34.5361328125, -32.052734375, -29.5693359375, -27.0859375, -24.6025390625, -22.119140625, -19.6357421875, -17.15234375, -14.6689453125, -12.185546875, -9.7021484375, -7.21875, -4.7353515625, -2.251953125, 0.2314453125, 2.71484375, 5.1982421875, 7.681640625, 10.1650390625, 12.6484375, 15.1318359375, 17.615234375, 20.0986328125, 22.58203125, 25.0654296875, 27.548828125, 30.0322265625, 32.515625, 34.9990234375, 37.482421875, 39.9658203125, 42.44921875, 44.9326171875, 47.416015625, 49.8994140625, 52.3828125, 54.8662109375, 57.349609375, 59.8330078125, 62.31640625, 64.7998046875, 67.283203125, 69.7666015625, 72.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 15.0, 15.0, 20.0, 25.0, 56.0, 90.0, 144.0, 300.0, 633.0, 1146.0, 749.0, 349.0, 197.0, 114.0, 65.0, 41.0, 38.0, 16.0, 9.0, 7.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.25439453125, -47.1650390625, -45.07568359375, -42.986328125, -40.89697265625, -38.8076171875, -36.71826171875, -34.62890625, -32.53955078125, -30.4501953125, -28.36083984375, -26.271484375, -24.18212890625, -22.0927734375, -20.00341796875, -17.9140625, -15.82470703125, -13.7353515625, -11.64599609375, -9.556640625, -7.46728515625, -5.3779296875, -3.28857421875, -1.19921875, 0.89013671875, 2.9794921875, 5.06884765625, 7.158203125, 9.24755859375, 11.3369140625, 13.42626953125, 15.515625, 17.60498046875, 19.6943359375, 21.78369140625, 23.873046875, 25.96240234375, 28.0517578125, 30.14111328125, 32.23046875, 34.31982421875, 36.4091796875, 38.49853515625, 40.587890625, 42.67724609375, 44.7666015625, 46.85595703125, 48.9453125, 51.03466796875, 53.1240234375, 55.21337890625, 57.302734375, 59.39208984375, 61.4814453125, 63.57080078125, 65.66015625, 67.74951171875, 69.8388671875, 71.92822265625, 74.017578125, 76.10693359375, 78.1962890625, 80.28564453125, 82.375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 11.0, 26.0, 53.0, 138.0, 232.0, 226.0, 133.0, 93.0, 42.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-734.3699951171875, -711.4608154296875, -688.5516357421875, -665.6424560546875, -642.7332763671875, -619.8240966796875, -596.9149169921875, -574.0057373046875, -551.0965576171875, -528.1873779296875, -505.2781982421875, -482.3690185546875, -459.4598388671875, -436.5506591796875, -413.6414794921875, -390.7322998046875, -367.8231201171875, -344.9139404296875, -322.0047607421875, -299.0955810546875, -276.1864013671875, -253.2772216796875, -230.3680419921875, -207.4588623046875, -184.5496826171875, -161.6405029296875, -138.7313232421875, -115.8221435546875, -92.9129638671875, -70.0037841796875, -47.0946044921875, -24.1854248046875, -1.27618408203125, 21.63299560546875, 44.54217529296875, 67.45135498046875, 90.36053466796875, 113.26971435546875, 136.17889404296875, 159.08807373046875, 181.99725341796875, 204.90643310546875, 227.81561279296875, 250.72479248046875, 273.63397216796875, 296.54315185546875, 319.45233154296875, 342.36151123046875, 365.27069091796875, 388.17987060546875, 411.08905029296875, 433.99822998046875, 456.90740966796875, 479.81658935546875, 502.72576904296875, 525.6349487304688, 548.5441284179688, 571.4533081054688, 594.3624877929688, 617.2716674804688, 640.1808471679688, 663.0900268554688, 685.9992065429688, 708.9083862304688, 731.8175659179688]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 14.0, 16.0, 13.0, 20.0, 17.0, 34.0, 26.0, 43.0, 30.0, 40.0, 42.0, 49.0, 54.0, 44.0, 61.0, 57.0, 57.0, 52.0, 40.0, 30.0, 49.0, 31.0, 30.0, 30.0, 16.0, 24.0, 16.0, 8.0, 9.0, 10.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-266.94854736328125, -258.3462829589844, -249.74400329589844, -241.1417236328125, -232.53945922851562, -223.93719482421875, -215.3349151611328, -206.73263549804688, -198.13037109375, -189.52810668945312, -180.9258270263672, -172.32354736328125, -163.72128295898438, -155.1190185546875, -146.51673889160156, -137.91445922851562, -129.31219482421875, -120.70992279052734, -112.10765075683594, -103.50537872314453, -94.90310668945312, -86.30083465576172, -77.69856262207031, -69.0962905883789, -60.4940185546875, -51.891746520996094, -43.28947448730469, -34.68720245361328, -26.084930419921875, -17.48265838623047, -8.880386352539062, -0.27811431884765625, 8.32415771484375, 16.926429748535156, 25.528701782226562, 34.13097381591797, 42.733245849609375, 51.33551788330078, 59.93778991699219, 68.5400619506836, 77.142333984375, 85.7446060180664, 94.34687805175781, 102.94915008544922, 111.55142211914062, 120.15369415283203, 128.75596618652344, 137.35824584960938, 145.96051025390625, 154.56277465820312, 163.16505432128906, 171.767333984375, 180.36959838867188, 188.97186279296875, 197.5741424560547, 206.17642211914062, 214.7786865234375, 223.38095092773438, 231.9832305908203, 240.58551025390625, 249.18777465820312, 257.7900390625, 266.392333984375, 274.9945983886719, 283.59686279296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 7.0, 15.0, 17.0, 31.0, 48.0, 93.0, 119.0, 215.0, 371.0, 835.0, 1771.0, 3938.0, 10504.0, 31021.0, 99929.0, 392748.0, 367411.0, 93260.0, 28984.0, 10039.0, 3878.0, 1718.0, 742.0, 347.0, 198.0, 133.0, 67.0, 34.0, 28.0, 15.0, 10.0, 6.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-74.5, -72.58837890625, -70.6767578125, -68.76513671875, -66.853515625, -64.94189453125, -63.0302734375, -61.11865234375, -59.20703125, -57.29541015625, -55.3837890625, -53.47216796875, -51.560546875, -49.64892578125, -47.7373046875, -45.82568359375, -43.9140625, -42.00244140625, -40.0908203125, -38.17919921875, -36.267578125, -34.35595703125, -32.4443359375, -30.53271484375, -28.62109375, -26.70947265625, -24.7978515625, -22.88623046875, -20.974609375, -19.06298828125, -17.1513671875, -15.23974609375, -13.328125, -11.41650390625, -9.5048828125, -7.59326171875, -5.681640625, -3.77001953125, -1.8583984375, 0.05322265625, 1.96484375, 3.87646484375, 5.7880859375, 7.69970703125, 9.611328125, 11.52294921875, 13.4345703125, 15.34619140625, 17.2578125, 19.16943359375, 21.0810546875, 22.99267578125, 24.904296875, 26.81591796875, 28.7275390625, 30.63916015625, 32.55078125, 34.46240234375, 36.3740234375, 38.28564453125, 40.197265625, 42.10888671875, 44.0205078125, 45.93212890625, 47.84375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 14.0, 16.0, 13.0, 24.0, 26.0, 45.0, 30.0, 47.0, 67.0, 61.0, 50.0, 73.0, 54.0, 66.0, 67.0, 40.0, 45.0, 43.0, 48.0, 36.0, 25.0, 21.0, 14.0, 14.0, 11.0, 3.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.078125, -21.35009765625, -20.6220703125, -19.89404296875, -19.166015625, -18.43798828125, -17.7099609375, -16.98193359375, -16.25390625, -15.52587890625, -14.7978515625, -14.06982421875, -13.341796875, -12.61376953125, -11.8857421875, -11.15771484375, -10.4296875, -9.70166015625, -8.9736328125, -8.24560546875, -7.517578125, -6.78955078125, -6.0615234375, -5.33349609375, -4.60546875, -3.87744140625, -3.1494140625, -2.42138671875, -1.693359375, -0.96533203125, -0.2373046875, 0.49072265625, 1.21875, 1.94677734375, 2.6748046875, 3.40283203125, 4.130859375, 4.85888671875, 5.5869140625, 6.31494140625, 7.04296875, 7.77099609375, 8.4990234375, 9.22705078125, 9.955078125, 10.68310546875, 11.4111328125, 12.13916015625, 12.8671875, 13.59521484375, 14.3232421875, 15.05126953125, 15.779296875, 16.50732421875, 17.2353515625, 17.96337890625, 18.69140625, 19.41943359375, 20.1474609375, 20.87548828125, 21.603515625, 22.33154296875, 23.0595703125, 23.78759765625, 24.515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 13.0, 15.0, 19.0, 28.0, 38.0, 56.0, 85.0, 135.0, 238.0, 433.0, 821.0, 1879.0, 6205.0, 66074.0, 857591.0, 102792.0, 7960.0, 2121.0, 874.0, 438.0, 250.0, 173.0, 100.0, 60.0, 40.0, 19.0, 20.0, 18.0, 12.0, 2.0, 8.0, 2.0, 6.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.8125, -124.115234375, -120.41796875, -116.720703125, -113.0234375, -109.326171875, -105.62890625, -101.931640625, -98.234375, -94.537109375, -90.83984375, -87.142578125, -83.4453125, -79.748046875, -76.05078125, -72.353515625, -68.65625, -64.958984375, -61.26171875, -57.564453125, -53.8671875, -50.169921875, -46.47265625, -42.775390625, -39.078125, -35.380859375, -31.68359375, -27.986328125, -24.2890625, -20.591796875, -16.89453125, -13.197265625, -9.5, -5.802734375, -2.10546875, 1.591796875, 5.2890625, 8.986328125, 12.68359375, 16.380859375, 20.078125, 23.775390625, 27.47265625, 31.169921875, 34.8671875, 38.564453125, 42.26171875, 45.958984375, 49.65625, 53.353515625, 57.05078125, 60.748046875, 64.4453125, 68.142578125, 71.83984375, 75.537109375, 79.234375, 82.931640625, 86.62890625, 90.326171875, 94.0234375, 97.720703125, 101.41796875, 105.115234375, 108.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 9.0, 13.0, 14.0, 13.0, 21.0, 20.0, 27.0, 32.0, 28.0, 26.0, 27.0, 46.0, 35.0, 43.0, 48.0, 52.0, 39.0, 43.0, 58.0, 39.0, 45.0, 33.0, 46.0, 41.0, 36.0, 18.0, 21.0, 26.0, 28.0, 17.0, 10.0, 4.0, 10.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-77.8125, -75.61474609375, -73.4169921875, -71.21923828125, -69.021484375, -66.82373046875, -64.6259765625, -62.42822265625, -60.23046875, -58.03271484375, -55.8349609375, -53.63720703125, -51.439453125, -49.24169921875, -47.0439453125, -44.84619140625, -42.6484375, -40.45068359375, -38.2529296875, -36.05517578125, -33.857421875, -31.65966796875, -29.4619140625, -27.26416015625, -25.06640625, -22.86865234375, -20.6708984375, -18.47314453125, -16.275390625, -14.07763671875, -11.8798828125, -9.68212890625, -7.484375, -5.28662109375, -3.0888671875, -0.89111328125, 1.306640625, 3.50439453125, 5.7021484375, 7.89990234375, 10.09765625, 12.29541015625, 14.4931640625, 16.69091796875, 18.888671875, 21.08642578125, 23.2841796875, 25.48193359375, 27.6796875, 29.87744140625, 32.0751953125, 34.27294921875, 36.470703125, 38.66845703125, 40.8662109375, 43.06396484375, 45.26171875, 47.45947265625, 49.6572265625, 51.85498046875, 54.052734375, 56.25048828125, 58.4482421875, 60.64599609375, 62.84375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 1.0, 9.0, 15.0, 23.0, 40.0, 49.0, 71.0, 139.0, 265.0, 743.0, 3135.0, 36056.0, 909496.0, 91629.0, 5102.0, 1009.0, 341.0, 171.0, 73.0, 61.0, 46.0, 24.0, 10.0, 7.0, 5.0, 11.0, 1.0, 6.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -41.77294921875, -40.0771484375, -38.38134765625, -36.685546875, -34.98974609375, -33.2939453125, -31.59814453125, -29.90234375, -28.20654296875, -26.5107421875, -24.81494140625, -23.119140625, -21.42333984375, -19.7275390625, -18.03173828125, -16.3359375, -14.64013671875, -12.9443359375, -11.24853515625, -9.552734375, -7.85693359375, -6.1611328125, -4.46533203125, -2.76953125, -1.07373046875, 0.6220703125, 2.31787109375, 4.013671875, 5.70947265625, 7.4052734375, 9.10107421875, 10.796875, 12.49267578125, 14.1884765625, 15.88427734375, 17.580078125, 19.27587890625, 20.9716796875, 22.66748046875, 24.36328125, 26.05908203125, 27.7548828125, 29.45068359375, 31.146484375, 32.84228515625, 34.5380859375, 36.23388671875, 37.9296875, 39.62548828125, 41.3212890625, 43.01708984375, 44.712890625, 46.40869140625, 48.1044921875, 49.80029296875, 51.49609375, 53.19189453125, 54.8876953125, 56.58349609375, 58.279296875, 59.97509765625, 61.6708984375, 63.36669921875, 65.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 1.0, 7.0, 5.0, 5.0, 7.0, 14.0, 14.0, 19.0, 10.0, 22.0, 32.0, 39.0, 46.0, 74.0, 84.0, 132.0, 118.0, 81.0, 61.0, 51.0, 30.0, 23.0, 21.0, 12.0, 18.0, 10.0, 13.0, 5.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035114288330078125, -0.0033857524394989014, -0.0032600760459899902, -0.003134399652481079, -0.003008723258972168, -0.002883046865463257, -0.0027573704719543457, -0.0026316940784454346, -0.0025060176849365234, -0.0023803412914276123, -0.002254664897918701, -0.00212898850440979, -0.002003312110900879, -0.0018776357173919678, -0.0017519593238830566, -0.0016262829303741455, -0.0015006065368652344, -0.0013749301433563232, -0.0012492537498474121, -0.001123577356338501, -0.0009979009628295898, -0.0008722245693206787, -0.0007465481758117676, -0.0006208717823028564, -0.0004951953887939453, -0.0003695189952850342, -0.00024384260177612305, -0.00011816620826721191, 7.510185241699219e-06, 0.00013318657875061035, 0.0002588629722595215, 0.0003845393657684326, 0.0005102157592773438, 0.0006358921527862549, 0.000761568546295166, 0.0008872449398040771, 0.0010129213333129883, 0.0011385977268218994, 0.0012642741203308105, 0.0013899505138397217, 0.0015156269073486328, 0.001641303300857544, 0.001766979694366455, 0.0018926560878753662, 0.0020183324813842773, 0.0021440088748931885, 0.0022696852684020996, 0.0023953616619110107, 0.002521038055419922, 0.002646714448928833, 0.002772390842437744, 0.0028980672359466553, 0.0030237436294555664, 0.0031494200229644775, 0.0032750964164733887, 0.0034007728099823, 0.003526449203491211, 0.003652125597000122, 0.003777801990509033, 0.0039034783840179443, 0.0040291547775268555, 0.004154831171035767, 0.004280507564544678, 0.004406183958053589, 0.0045318603515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 22.0, 31.0, 38.0, 64.0, 89.0, 130.0, 255.0, 477.0, 1075.0, 3029.0, 14420.0, 254126.0, 735664.0, 31528.0, 4734.0, 1441.0, 626.0, 311.0, 160.0, 100.0, 59.0, 49.0, 25.0, 22.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -43.076171875, -41.77734375, -40.478515625, -39.1796875, -37.880859375, -36.58203125, -35.283203125, -33.984375, -32.685546875, -31.38671875, -30.087890625, -28.7890625, -27.490234375, -26.19140625, -24.892578125, -23.59375, -22.294921875, -20.99609375, -19.697265625, -18.3984375, -17.099609375, -15.80078125, -14.501953125, -13.203125, -11.904296875, -10.60546875, -9.306640625, -8.0078125, -6.708984375, -5.41015625, -4.111328125, -2.8125, -1.513671875, -0.21484375, 1.083984375, 2.3828125, 3.681640625, 4.98046875, 6.279296875, 7.578125, 8.876953125, 10.17578125, 11.474609375, 12.7734375, 14.072265625, 15.37109375, 16.669921875, 17.96875, 19.267578125, 20.56640625, 21.865234375, 23.1640625, 24.462890625, 25.76171875, 27.060546875, 28.359375, 29.658203125, 30.95703125, 32.255859375, 33.5546875, 34.853515625, 36.15234375, 37.451171875, 38.75]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 14.0, 23.0, 28.0, 42.0, 62.0, 78.0, 136.0, 159.0, 142.0, 114.0, 78.0, 39.0, 22.0, 19.0, 10.0, 8.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.78125, -48.555908203125, -47.33056640625, -46.105224609375, -44.8798828125, -43.654541015625, -42.42919921875, -41.203857421875, -39.978515625, -38.753173828125, -37.52783203125, -36.302490234375, -35.0771484375, -33.851806640625, -32.62646484375, -31.401123046875, -30.17578125, -28.950439453125, -27.72509765625, -26.499755859375, -25.2744140625, -24.049072265625, -22.82373046875, -21.598388671875, -20.373046875, -19.147705078125, -17.92236328125, -16.697021484375, -15.4716796875, -14.246337890625, -13.02099609375, -11.795654296875, -10.5703125, -9.344970703125, -8.11962890625, -6.894287109375, -5.6689453125, -4.443603515625, -3.21826171875, -1.992919921875, -0.767578125, 0.457763671875, 1.68310546875, 2.908447265625, 4.1337890625, 5.359130859375, 6.58447265625, 7.809814453125, 9.03515625, 10.260498046875, 11.48583984375, 12.711181640625, 13.9365234375, 15.161865234375, 16.38720703125, 17.612548828125, 18.837890625, 20.063232421875, 21.28857421875, 22.513916015625, 23.7392578125, 24.964599609375, 26.18994140625, 27.415283203125, 28.640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 14.0, 32.0, 88.0, 198.0, 270.0, 204.0, 104.0, 43.0, 23.0, 14.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.6337890625, -474.1600036621094, -449.68621826171875, -425.21240234375, -400.7386169433594, -376.26483154296875, -351.791015625, -327.3172302246094, -302.84344482421875, -278.3696594238281, -253.89585876464844, -229.42205810546875, -204.94827270507812, -180.4744873046875, -156.0006866455078, -131.52688598632812, -107.0531005859375, -82.57930755615234, -58.10551452636719, -33.63172149658203, -9.157928466796875, 15.315864562988281, 39.78965759277344, 64.26345825195312, 88.73724365234375, 113.2110366821289, 137.68482971191406, 162.15863037109375, 186.63241577148438, 211.106201171875, 235.5800018310547, 260.0538024902344, 284.527587890625, 309.0013732910156, 333.47515869140625, 357.948974609375, 382.4227600097656, 406.89654541015625, 431.370361328125, 455.8441467285156, 480.31793212890625, 504.7917175292969, 529.2655029296875, 553.7393188476562, 578.213134765625, 602.6868896484375, 627.1607055664062, 651.634521484375, 676.1082763671875, 700.5820922851562, 725.0558471679688, 749.5296630859375, 774.00341796875, 798.4772338867188, 822.9510498046875, 847.4248046875, 871.8986206054688, 896.3724365234375, 920.84619140625, 945.3200073242188, 969.7938232421875, 994.267578125, 1018.7413940429688, 1043.2152099609375, 1067.68896484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 5.0, 12.0, 14.0, 9.0, 20.0, 21.0, 27.0, 22.0, 28.0, 36.0, 36.0, 29.0, 45.0, 58.0, 48.0, 49.0, 74.0, 55.0, 59.0, 50.0, 43.0, 42.0, 35.0, 31.0, 19.0, 15.0, 28.0, 20.0, 16.0, 7.0, 9.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.7347412109375, -330.76318359375, -320.7916259765625, -310.820068359375, -300.8485107421875, -290.876953125, -280.9053955078125, -270.933837890625, -260.9622802734375, -250.99072265625, -241.0191650390625, -231.047607421875, -221.0760498046875, -211.1044921875, -201.13291931152344, -191.16136169433594, -181.18978881835938, -171.21823120117188, -161.24667358398438, -151.27511596679688, -141.30355834960938, -131.33200073242188, -121.36042785644531, -111.38887023925781, -101.41731262207031, -91.44575500488281, -81.47419738769531, -71.50263214111328, -61.53107452392578, -51.55951690673828, -41.587955474853516, -31.61639404296875, -21.644805908203125, -11.673246383666992, -1.7016868591308594, 8.269872665405273, 18.241432189941406, 28.212989807128906, 38.18455123901367, 48.15611267089844, 58.12767028808594, 68.09922790527344, 78.07078552246094, 88.04235076904297, 98.01390838623047, 107.98546600341797, 117.95703125, 127.9285888671875, 137.900146484375, 147.8717041015625, 157.84326171875, 167.8148193359375, 177.786376953125, 187.7579345703125, 197.72950744628906, 207.70106506347656, 217.67262268066406, 227.64418029785156, 237.61573791503906, 247.58729553222656, 257.5588684082031, 267.5304260253906, 277.5019836425781, 287.4735412597656, 297.4450988769531]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 21.0, 21.0, 29.0, 33.0, 55.0, 131.0, 183.0, 329.0, 696.0, 1556.0, 3804.0, 10465.0, 38890.0, 292841.0, 3507547.0, 282224.0, 38204.0, 10391.0, 3764.0, 1567.0, 643.0, 342.0, 208.0, 103.0, 66.0, 56.0, 36.0, 19.0, 14.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.37060546875, -42.8662109375, -41.36181640625, -39.857421875, -38.35302734375, -36.8486328125, -35.34423828125, -33.83984375, -32.33544921875, -30.8310546875, -29.32666015625, -27.822265625, -26.31787109375, -24.8134765625, -23.30908203125, -21.8046875, -20.30029296875, -18.7958984375, -17.29150390625, -15.787109375, -14.28271484375, -12.7783203125, -11.27392578125, -9.76953125, -8.26513671875, -6.7607421875, -5.25634765625, -3.751953125, -2.24755859375, -0.7431640625, 0.76123046875, 2.265625, 3.77001953125, 5.2744140625, 6.77880859375, 8.283203125, 9.78759765625, 11.2919921875, 12.79638671875, 14.30078125, 15.80517578125, 17.3095703125, 18.81396484375, 20.318359375, 21.82275390625, 23.3271484375, 24.83154296875, 26.3359375, 27.84033203125, 29.3447265625, 30.84912109375, 32.353515625, 33.85791015625, 35.3623046875, 36.86669921875, 38.37109375, 39.87548828125, 41.3798828125, 42.88427734375, 44.388671875, 45.89306640625, 47.3974609375, 48.90185546875, 50.40625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 14.0, 6.0, 7.0, 15.0, 12.0, 25.0, 30.0, 37.0, 45.0, 57.0, 64.0, 63.0, 65.0, 55.0, 60.0, 83.0, 65.0, 56.0, 35.0, 39.0, 43.0, 27.0, 22.0, 16.0, 11.0, 13.0, 14.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.625, -21.889404296875, -21.15380859375, -20.418212890625, -19.6826171875, -18.947021484375, -18.21142578125, -17.475830078125, -16.740234375, -16.004638671875, -15.26904296875, -14.533447265625, -13.7978515625, -13.062255859375, -12.32666015625, -11.591064453125, -10.85546875, -10.119873046875, -9.38427734375, -8.648681640625, -7.9130859375, -7.177490234375, -6.44189453125, -5.706298828125, -4.970703125, -4.235107421875, -3.49951171875, -2.763916015625, -2.0283203125, -1.292724609375, -0.55712890625, 0.178466796875, 0.9140625, 1.649658203125, 2.38525390625, 3.120849609375, 3.8564453125, 4.592041015625, 5.32763671875, 6.063232421875, 6.798828125, 7.534423828125, 8.27001953125, 9.005615234375, 9.7412109375, 10.476806640625, 11.21240234375, 11.947998046875, 12.68359375, 13.419189453125, 14.15478515625, 14.890380859375, 15.6259765625, 16.361572265625, 17.09716796875, 17.832763671875, 18.568359375, 19.303955078125, 20.03955078125, 20.775146484375, 21.5107421875, 22.246337890625, 22.98193359375, 23.717529296875, 24.453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 10.0, 20.0, 22.0, 37.0, 54.0, 99.0, 133.0, 273.0, 480.0, 777.0, 1427.0, 2820.0, 5508.0, 11802.0, 29706.0, 92721.0, 521512.0, 2881772.0, 499189.0, 92201.0, 29738.0, 11998.0, 5513.0, 2918.0, 1571.0, 863.0, 457.0, 235.0, 139.0, 93.0, 56.0, 35.0, 17.0, 19.0, 12.0, 3.0, 10.0, 4.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.796875, -29.81884765625, -28.8408203125, -27.86279296875, -26.884765625, -25.90673828125, -24.9287109375, -23.95068359375, -22.97265625, -21.99462890625, -21.0166015625, -20.03857421875, -19.060546875, -18.08251953125, -17.1044921875, -16.12646484375, -15.1484375, -14.17041015625, -13.1923828125, -12.21435546875, -11.236328125, -10.25830078125, -9.2802734375, -8.30224609375, -7.32421875, -6.34619140625, -5.3681640625, -4.39013671875, -3.412109375, -2.43408203125, -1.4560546875, -0.47802734375, 0.5, 1.47802734375, 2.4560546875, 3.43408203125, 4.412109375, 5.39013671875, 6.3681640625, 7.34619140625, 8.32421875, 9.30224609375, 10.2802734375, 11.25830078125, 12.236328125, 13.21435546875, 14.1923828125, 15.17041015625, 16.1484375, 17.12646484375, 18.1044921875, 19.08251953125, 20.060546875, 21.03857421875, 22.0166015625, 22.99462890625, 23.97265625, 24.95068359375, 25.9287109375, 26.90673828125, 27.884765625, 28.86279296875, 29.8408203125, 30.81884765625, 31.796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 19.0, 18.0, 21.0, 24.0, 54.0, 65.0, 94.0, 136.0, 251.0, 463.0, 834.0, 794.0, 486.0, 255.0, 182.0, 112.0, 66.0, 38.0, 34.0, 29.0, 7.0, 14.0, 13.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.7666015625, -34.533203125, -33.2998046875, -32.06640625, -30.8330078125, -29.599609375, -28.3662109375, -27.1328125, -25.8994140625, -24.666015625, -23.4326171875, -22.19921875, -20.9658203125, -19.732421875, -18.4990234375, -17.265625, -16.0322265625, -14.798828125, -13.5654296875, -12.33203125, -11.0986328125, -9.865234375, -8.6318359375, -7.3984375, -6.1650390625, -4.931640625, -3.6982421875, -2.46484375, -1.2314453125, 0.001953125, 1.2353515625, 2.46875, 3.7021484375, 4.935546875, 6.1689453125, 7.40234375, 8.6357421875, 9.869140625, 11.1025390625, 12.3359375, 13.5693359375, 14.802734375, 16.0361328125, 17.26953125, 18.5029296875, 19.736328125, 20.9697265625, 22.203125, 23.4365234375, 24.669921875, 25.9033203125, 27.13671875, 28.3701171875, 29.603515625, 30.8369140625, 32.0703125, 33.3037109375, 34.537109375, 35.7705078125, 37.00390625, 38.2373046875, 39.470703125, 40.7041015625, 41.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 5.0, 10.0, 22.0, 70.0, 141.0, 275.0, 243.0, 143.0, 48.0, 20.0, 10.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.0661010742188, -501.0537414550781, -483.0414123535156, -465.029052734375, -447.0167236328125, -429.0043640136719, -410.99200439453125, -392.97967529296875, -374.9673156738281, -356.9549560546875, -338.942626953125, -320.9302673339844, -302.91790771484375, -284.90557861328125, -266.8932189941406, -248.88087463378906, -230.8685302734375, -212.85618591308594, -194.84384155273438, -176.83148193359375, -158.8191375732422, -140.80679321289062, -122.79444122314453, -104.78208923339844, -86.76974487304688, -68.75740051269531, -50.74504852294922, -32.73270034790039, -14.720352172851562, 3.2919921875, 21.304344177246094, 39.31669616699219, 57.32904052734375, 75.34138488769531, 93.3537368774414, 111.3660888671875, 129.37843322753906, 147.39077758789062, 165.40313720703125, 183.4154815673828, 201.42782592773438, 219.44017028808594, 237.4525146484375, 255.46487426757812, 273.47723388671875, 291.48956298828125, 309.5019226074219, 327.5142822265625, 345.526611328125, 363.5389709472656, 381.5513000488281, 399.56365966796875, 417.57598876953125, 435.5883483886719, 453.6007080078125, 471.613037109375, 489.6253967285156, 507.63775634765625, 525.6500854492188, 543.6624145507812, 561.6748046875, 579.6871337890625, 597.699462890625, 615.7118530273438, 633.7241821289062]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 13.0, 17.0, 6.0, 12.0, 24.0, 22.0, 25.0, 25.0, 39.0, 44.0, 44.0, 48.0, 49.0, 63.0, 65.0, 61.0, 63.0, 63.0, 50.0, 39.0, 32.0, 31.0, 30.0, 33.0, 22.0, 22.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-232.88919067382812, -226.7714080810547, -220.65362548828125, -214.53582763671875, -208.4180450439453, -202.30026245117188, -196.18247985839844, -190.064697265625, -183.9468994140625, -177.82911682128906, -171.71133422851562, -165.59353637695312, -159.4757537841797, -153.35797119140625, -147.2401885986328, -141.12240600585938, -135.00462341308594, -128.8868408203125, -122.76905059814453, -116.6512680053711, -110.53347778320312, -104.41569519042969, -98.29791259765625, -92.18013000488281, -86.06233978271484, -79.9445571899414, -73.82676696777344, -67.708984375, -61.5911979675293, -55.473411560058594, -49.355628967285156, -43.23784255981445, -37.12005615234375, -31.002269744873047, -24.884485244750977, -18.766700744628906, -12.648914337158203, -6.5311279296875, -0.4133453369140625, 5.704441070556641, 11.822227478027344, 17.940013885498047, 24.057798385620117, 30.175582885742188, 36.29336929321289, 42.411155700683594, 48.52893829345703, 54.646724700927734, 60.76451110839844, 66.88229370117188, 73.00008392333984, 79.11786651611328, 85.23565673828125, 91.35343933105469, 97.47122192382812, 103.58900451660156, 109.70679473876953, 115.82457733154297, 121.94236755371094, 128.06015014648438, 134.1779327392578, 140.29571533203125, 146.41351318359375, 152.5312957763672, 158.64907836914062]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 7.0, 15.0, 18.0, 11.0, 29.0, 57.0, 78.0, 123.0, 177.0, 317.0, 534.0, 1027.0, 1856.0, 3789.0, 8344.0, 19460.0, 50334.0, 155024.0, 431578.0, 249975.0, 76224.0, 27791.0, 11331.0, 5163.0, 2327.0, 1284.0, 658.0, 354.0, 238.0, 131.0, 72.0, 78.0, 40.0, 24.0, 25.0, 12.0, 14.0, 5.0, 5.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.3125, -41.9013671875, -40.490234375, -39.0791015625, -37.66796875, -36.2568359375, -34.845703125, -33.4345703125, -32.0234375, -30.6123046875, -29.201171875, -27.7900390625, -26.37890625, -24.9677734375, -23.556640625, -22.1455078125, -20.734375, -19.3232421875, -17.912109375, -16.5009765625, -15.08984375, -13.6787109375, -12.267578125, -10.8564453125, -9.4453125, -8.0341796875, -6.623046875, -5.2119140625, -3.80078125, -2.3896484375, -0.978515625, 0.4326171875, 1.84375, 3.2548828125, 4.666015625, 6.0771484375, 7.48828125, 8.8994140625, 10.310546875, 11.7216796875, 13.1328125, 14.5439453125, 15.955078125, 17.3662109375, 18.77734375, 20.1884765625, 21.599609375, 23.0107421875, 24.421875, 25.8330078125, 27.244140625, 28.6552734375, 30.06640625, 31.4775390625, 32.888671875, 34.2998046875, 35.7109375, 37.1220703125, 38.533203125, 39.9443359375, 41.35546875, 42.7666015625, 44.177734375, 45.5888671875, 47.0]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 8.0, 16.0, 10.0, 20.0, 19.0, 31.0, 27.0, 43.0, 55.0, 54.0, 59.0, 71.0, 60.0, 46.0, 66.0, 68.0, 54.0, 45.0, 44.0, 34.0, 29.0, 24.0, 30.0, 18.0, 12.0, 14.0, 11.0, 3.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.921875, -20.2099609375, -19.498046875, -18.7861328125, -18.07421875, -17.3623046875, -16.650390625, -15.9384765625, -15.2265625, -14.5146484375, -13.802734375, -13.0908203125, -12.37890625, -11.6669921875, -10.955078125, -10.2431640625, -9.53125, -8.8193359375, -8.107421875, -7.3955078125, -6.68359375, -5.9716796875, -5.259765625, -4.5478515625, -3.8359375, -3.1240234375, -2.412109375, -1.7001953125, -0.98828125, -0.2763671875, 0.435546875, 1.1474609375, 1.859375, 2.5712890625, 3.283203125, 3.9951171875, 4.70703125, 5.4189453125, 6.130859375, 6.8427734375, 7.5546875, 8.2666015625, 8.978515625, 9.6904296875, 10.40234375, 11.1142578125, 11.826171875, 12.5380859375, 13.25, 13.9619140625, 14.673828125, 15.3857421875, 16.09765625, 16.8095703125, 17.521484375, 18.2333984375, 18.9453125, 19.6572265625, 20.369140625, 21.0810546875, 21.79296875, 22.5048828125, 23.216796875, 23.9287109375, 24.640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 5.0, 5.0, 10.0, 9.0, 17.0, 26.0, 21.0, 33.0, 48.0, 74.0, 108.0, 165.0, 255.0, 483.0, 927.0, 2213.0, 6987.0, 30102.0, 194346.0, 680504.0, 105142.0, 18817.0, 4656.0, 1690.0, 790.0, 409.0, 263.0, 145.0, 76.0, 48.0, 47.0, 35.0, 29.0, 20.0, 11.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-87.0625, -84.90478515625, -82.7470703125, -80.58935546875, -78.431640625, -76.27392578125, -74.1162109375, -71.95849609375, -69.80078125, -67.64306640625, -65.4853515625, -63.32763671875, -61.169921875, -59.01220703125, -56.8544921875, -54.69677734375, -52.5390625, -50.38134765625, -48.2236328125, -46.06591796875, -43.908203125, -41.75048828125, -39.5927734375, -37.43505859375, -35.27734375, -33.11962890625, -30.9619140625, -28.80419921875, -26.646484375, -24.48876953125, -22.3310546875, -20.17333984375, -18.015625, -15.85791015625, -13.7001953125, -11.54248046875, -9.384765625, -7.22705078125, -5.0693359375, -2.91162109375, -0.75390625, 1.40380859375, 3.5615234375, 5.71923828125, 7.876953125, 10.03466796875, 12.1923828125, 14.35009765625, 16.5078125, 18.66552734375, 20.8232421875, 22.98095703125, 25.138671875, 27.29638671875, 29.4541015625, 31.61181640625, 33.76953125, 35.92724609375, 38.0849609375, 40.24267578125, 42.400390625, 44.55810546875, 46.7158203125, 48.87353515625, 51.03125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 5.0, 12.0, 6.0, 8.0, 15.0, 13.0, 16.0, 15.0, 23.0, 23.0, 27.0, 22.0, 19.0, 35.0, 26.0, 32.0, 32.0, 37.0, 37.0, 24.0, 42.0, 37.0, 42.0, 47.0, 23.0, 42.0, 33.0, 46.0, 32.0, 30.0, 23.0, 28.0, 19.0, 20.0, 13.0, 19.0, 10.0, 10.0, 8.0, 7.0, 3.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.25, -49.5703125, -47.890625, -46.2109375, -44.53125, -42.8515625, -41.171875, -39.4921875, -37.8125, -36.1328125, -34.453125, -32.7734375, -31.09375, -29.4140625, -27.734375, -26.0546875, -24.375, -22.6953125, -21.015625, -19.3359375, -17.65625, -15.9765625, -14.296875, -12.6171875, -10.9375, -9.2578125, -7.578125, -5.8984375, -4.21875, -2.5390625, -0.859375, 0.8203125, 2.5, 4.1796875, 5.859375, 7.5390625, 9.21875, 10.8984375, 12.578125, 14.2578125, 15.9375, 17.6171875, 19.296875, 20.9765625, 22.65625, 24.3359375, 26.015625, 27.6953125, 29.375, 31.0546875, 32.734375, 34.4140625, 36.09375, 37.7734375, 39.453125, 41.1328125, 42.8125, 44.4921875, 46.171875, 47.8515625, 49.53125, 51.2109375, 52.890625, 54.5703125, 56.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 7.0, 0.0, 3.0, 10.0, 9.0, 15.0, 20.0, 25.0, 41.0, 59.0, 101.0, 250.0, 528.0, 1472.0, 6477.0, 74201.0, 863922.0, 91378.0, 7305.0, 1645.0, 525.0, 229.0, 119.0, 58.0, 44.0, 21.0, 16.0, 13.0, 8.0, 8.0, 5.0, 1.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.71875, -36.4833984375, -35.248046875, -34.0126953125, -32.77734375, -31.5419921875, -30.306640625, -29.0712890625, -27.8359375, -26.6005859375, -25.365234375, -24.1298828125, -22.89453125, -21.6591796875, -20.423828125, -19.1884765625, -17.953125, -16.7177734375, -15.482421875, -14.2470703125, -13.01171875, -11.7763671875, -10.541015625, -9.3056640625, -8.0703125, -6.8349609375, -5.599609375, -4.3642578125, -3.12890625, -1.8935546875, -0.658203125, 0.5771484375, 1.8125, 3.0478515625, 4.283203125, 5.5185546875, 6.75390625, 7.9892578125, 9.224609375, 10.4599609375, 11.6953125, 12.9306640625, 14.166015625, 15.4013671875, 16.63671875, 17.8720703125, 19.107421875, 20.3427734375, 21.578125, 22.8134765625, 24.048828125, 25.2841796875, 26.51953125, 27.7548828125, 28.990234375, 30.2255859375, 31.4609375, 32.6962890625, 33.931640625, 35.1669921875, 36.40234375, 37.6376953125, 38.873046875, 40.1083984375, 41.34375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 12.0, 4.0, 10.0, 11.0, 11.0, 16.0, 16.0, 22.0, 31.0, 39.0, 53.0, 51.0, 62.0, 78.0, 119.0, 97.0, 66.0, 60.0, 49.0, 38.0, 29.0, 24.0, 16.0, 9.0, 7.0, 14.0, 6.0, 8.0, 2.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031871795654296875, -0.0030864179134368896, -0.002985656261444092, -0.002884894609451294, -0.002784132957458496, -0.0026833713054656982, -0.0025826096534729004, -0.0024818480014801025, -0.0023810863494873047, -0.002280324697494507, -0.002179563045501709, -0.002078801393508911, -0.0019780397415161133, -0.0018772780895233154, -0.0017765164375305176, -0.0016757547855377197, -0.0015749931335449219, -0.001474231481552124, -0.0013734698295593262, -0.0012727081775665283, -0.0011719465255737305, -0.0010711848735809326, -0.0009704232215881348, -0.0008696615695953369, -0.0007688999176025391, -0.0006681382656097412, -0.0005673766136169434, -0.0004666149616241455, -0.00036585330963134766, -0.0002650916576385498, -0.00016433000564575195, -6.35683536529541e-05, 3.719329833984375e-05, 0.0001379549503326416, 0.00023871660232543945, 0.0003394782543182373, 0.00044023990631103516, 0.000541001558303833, 0.0006417632102966309, 0.0007425248622894287, 0.0008432865142822266, 0.0009440481662750244, 0.0010448098182678223, 0.0011455714702606201, 0.001246333122253418, 0.0013470947742462158, 0.0014478564262390137, 0.0015486180782318115, 0.0016493797302246094, 0.0017501413822174072, 0.001850903034210205, 0.001951664686203003, 0.0020524263381958008, 0.0021531879901885986, 0.0022539496421813965, 0.0023547112941741943, 0.002455472946166992, 0.00255623459815979, 0.002656996250152588, 0.0027577579021453857, 0.0028585195541381836, 0.0029592812061309814, 0.0030600428581237793, 0.003160804510116577, 0.003261566162109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 11.0, 16.0, 15.0, 32.0, 49.0, 78.0, 124.0, 197.0, 381.0, 763.0, 1741.0, 4964.0, 20367.0, 166016.0, 735871.0, 96833.0, 14318.0, 3791.0, 1410.0, 672.0, 377.0, 176.0, 113.0, 83.0, 52.0, 25.0, 22.0, 16.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.581787109375, -21.75732421875, -20.932861328125, -20.1083984375, -19.283935546875, -18.45947265625, -17.635009765625, -16.810546875, -15.986083984375, -15.16162109375, -14.337158203125, -13.5126953125, -12.688232421875, -11.86376953125, -11.039306640625, -10.21484375, -9.390380859375, -8.56591796875, -7.741455078125, -6.9169921875, -6.092529296875, -5.26806640625, -4.443603515625, -3.619140625, -2.794677734375, -1.97021484375, -1.145751953125, -0.3212890625, 0.503173828125, 1.32763671875, 2.152099609375, 2.9765625, 3.801025390625, 4.62548828125, 5.449951171875, 6.2744140625, 7.098876953125, 7.92333984375, 8.747802734375, 9.572265625, 10.396728515625, 11.22119140625, 12.045654296875, 12.8701171875, 13.694580078125, 14.51904296875, 15.343505859375, 16.16796875, 16.992431640625, 17.81689453125, 18.641357421875, 19.4658203125, 20.290283203125, 21.11474609375, 21.939208984375, 22.763671875, 23.588134765625, 24.41259765625, 25.237060546875, 26.0615234375, 26.885986328125, 27.71044921875, 28.534912109375, 29.359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 11.0, 19.0, 22.0, 43.0, 44.0, 58.0, 58.0, 95.0, 106.0, 110.0, 94.0, 72.0, 68.0, 47.0, 46.0, 27.0, 14.0, 6.0, 11.0, 10.0, 8.0, 1.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.597412109375, -20.88232421875, -20.167236328125, -19.4521484375, -18.737060546875, -18.02197265625, -17.306884765625, -16.591796875, -15.876708984375, -15.16162109375, -14.446533203125, -13.7314453125, -13.016357421875, -12.30126953125, -11.586181640625, -10.87109375, -10.156005859375, -9.44091796875, -8.725830078125, -8.0107421875, -7.295654296875, -6.58056640625, -5.865478515625, -5.150390625, -4.435302734375, -3.72021484375, -3.005126953125, -2.2900390625, -1.574951171875, -0.85986328125, -0.144775390625, 0.5703125, 1.285400390625, 2.00048828125, 2.715576171875, 3.4306640625, 4.145751953125, 4.86083984375, 5.575927734375, 6.291015625, 7.006103515625, 7.72119140625, 8.436279296875, 9.1513671875, 9.866455078125, 10.58154296875, 11.296630859375, 12.01171875, 12.726806640625, 13.44189453125, 14.156982421875, 14.8720703125, 15.587158203125, 16.30224609375, 17.017333984375, 17.732421875, 18.447509765625, 19.16259765625, 19.877685546875, 20.5927734375, 21.307861328125, 22.02294921875, 22.738037109375, 23.453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 14.0, 37.0, 83.0, 142.0, 202.0, 229.0, 148.0, 66.0, 32.0, 13.0, 6.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-354.76593017578125, -336.0225524902344, -317.2791748046875, -298.5357971191406, -279.79241943359375, -261.04901123046875, -242.30563354492188, -223.562255859375, -204.81887817382812, -186.07550048828125, -167.33212280273438, -148.58872985839844, -129.84535217285156, -111.10197448730469, -92.35858917236328, -73.61520385742188, -54.871826171875, -36.12844467163086, -17.38506317138672, 1.3583183288574219, 20.101699829101562, 38.84507751464844, 57.588462829589844, 76.33184814453125, 95.07522583007812, 113.818603515625, 132.56198120117188, 151.3053741455078, 170.0487518310547, 188.79212951660156, 207.5355224609375, 226.27890014648438, 245.0223388671875, 263.7657165527344, 282.50909423828125, 301.2524719238281, 319.995849609375, 338.7392578125, 357.4826354980469, 376.22601318359375, 394.9693908691406, 413.7127685546875, 432.4561462402344, 451.19952392578125, 469.94293212890625, 488.686279296875, 507.4296875, 526.173095703125, 544.9164428710938, 563.6598510742188, 582.4031982421875, 601.1466064453125, 619.8899536132812, 638.6333618164062, 657.376708984375, 676.1201171875, 694.863525390625, 713.60693359375, 732.3502807617188, 751.0936889648438, 769.8370361328125, 788.5804443359375, 807.3237915039062, 826.0671997070312, 844.810546875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 7.0, 4.0, 13.0, 13.0, 16.0, 15.0, 17.0, 21.0, 28.0, 22.0, 23.0, 36.0, 39.0, 42.0, 35.0, 46.0, 44.0, 56.0, 52.0, 38.0, 47.0, 38.0, 37.0, 34.0, 29.0, 34.0, 31.0, 26.0, 22.0, 25.0, 13.0, 13.0, 8.0, 14.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-239.80885314941406, -232.10250854492188, -224.39614868164062, -216.68980407714844, -208.98345947265625, -201.27711486816406, -193.57077026367188, -185.86441040039062, -178.15806579589844, -170.45172119140625, -162.745361328125, -155.0390167236328, -147.33267211914062, -139.62632751464844, -131.91998291015625, -124.213623046875, -116.50727844238281, -108.80093383789062, -101.0945816040039, -93.38822937011719, -85.681884765625, -77.97554016113281, -70.2691879272461, -62.56283950805664, -54.85649108886719, -47.150142669677734, -39.44379425048828, -31.737445831298828, -24.031097412109375, -16.324748992919922, -8.618400573730469, -0.9120521545410156, 6.794281005859375, 14.500629425048828, 22.20697784423828, 29.913326263427734, 37.61967468261719, 45.32602310180664, 53.032371520996094, 60.73871994018555, 68.445068359375, 76.15141296386719, 83.8577651977539, 91.56411743164062, 99.27046203613281, 106.976806640625, 114.68315887451172, 122.38951110839844, 130.09585571289062, 137.8022003173828, 145.508544921875, 153.21490478515625, 160.92124938964844, 168.62759399414062, 176.33395385742188, 184.04029846191406, 191.74664306640625, 199.45298767089844, 207.15933227539062, 214.86569213867188, 222.57203674316406, 230.27838134765625, 237.9847412109375, 245.6910858154297, 253.39743041992188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 5.0, 13.0, 17.0, 14.0, 30.0, 39.0, 59.0, 100.0, 165.0, 301.0, 518.0, 1005.0, 2194.0, 4992.0, 12806.0, 38807.0, 147231.0, 895032.0, 2398496.0, 544207.0, 102121.0, 28669.0, 9783.0, 3852.0, 1763.0, 837.0, 460.0, 266.0, 151.0, 89.0, 68.0, 46.0, 37.0, 30.0, 14.0, 12.0, 15.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.46875, -22.6416015625, -21.814453125, -20.9873046875, -20.16015625, -19.3330078125, -18.505859375, -17.6787109375, -16.8515625, -16.0244140625, -15.197265625, -14.3701171875, -13.54296875, -12.7158203125, -11.888671875, -11.0615234375, -10.234375, -9.4072265625, -8.580078125, -7.7529296875, -6.92578125, -6.0986328125, -5.271484375, -4.4443359375, -3.6171875, -2.7900390625, -1.962890625, -1.1357421875, -0.30859375, 0.5185546875, 1.345703125, 2.1728515625, 3.0, 3.8271484375, 4.654296875, 5.4814453125, 6.30859375, 7.1357421875, 7.962890625, 8.7900390625, 9.6171875, 10.4443359375, 11.271484375, 12.0986328125, 12.92578125, 13.7529296875, 14.580078125, 15.4072265625, 16.234375, 17.0615234375, 17.888671875, 18.7158203125, 19.54296875, 20.3701171875, 21.197265625, 22.0244140625, 22.8515625, 23.6787109375, 24.505859375, 25.3330078125, 26.16015625, 26.9873046875, 27.814453125, 28.6416015625, 29.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 11.0, 8.0, 13.0, 23.0, 33.0, 30.0, 39.0, 42.0, 66.0, 65.0, 56.0, 50.0, 62.0, 83.0, 68.0, 54.0, 57.0, 51.0, 37.0, 40.0, 30.0, 21.0, 14.0, 9.0, 13.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-22.296875, -21.5703125, -20.84375, -20.1171875, -19.390625, -18.6640625, -17.9375, -17.2109375, -16.484375, -15.7578125, -15.03125, -14.3046875, -13.578125, -12.8515625, -12.125, -11.3984375, -10.671875, -9.9453125, -9.21875, -8.4921875, -7.765625, -7.0390625, -6.3125, -5.5859375, -4.859375, -4.1328125, -3.40625, -2.6796875, -1.953125, -1.2265625, -0.5, 0.2265625, 0.953125, 1.6796875, 2.40625, 3.1328125, 3.859375, 4.5859375, 5.3125, 6.0390625, 6.765625, 7.4921875, 8.21875, 8.9453125, 9.671875, 10.3984375, 11.125, 11.8515625, 12.578125, 13.3046875, 14.03125, 14.7578125, 15.484375, 16.2109375, 16.9375, 17.6640625, 18.390625, 19.1171875, 19.84375, 20.5703125, 21.296875, 22.0234375, 22.75, 23.4765625, 24.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 0.0, 5.0, 14.0, 13.0, 18.0, 24.0, 41.0, 70.0, 105.0, 217.0, 412.0, 949.0, 2695.0, 8453.0, 34324.0, 196254.0, 2555527.0, 1248742.0, 113224.0, 23144.0, 6357.0, 2123.0, 765.0, 375.0, 164.0, 106.0, 53.0, 47.0, 16.0, 17.0, 10.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.591796875, -38.30859375, -37.025390625, -35.7421875, -34.458984375, -33.17578125, -31.892578125, -30.609375, -29.326171875, -28.04296875, -26.759765625, -25.4765625, -24.193359375, -22.91015625, -21.626953125, -20.34375, -19.060546875, -17.77734375, -16.494140625, -15.2109375, -13.927734375, -12.64453125, -11.361328125, -10.078125, -8.794921875, -7.51171875, -6.228515625, -4.9453125, -3.662109375, -2.37890625, -1.095703125, 0.1875, 1.470703125, 2.75390625, 4.037109375, 5.3203125, 6.603515625, 7.88671875, 9.169921875, 10.453125, 11.736328125, 13.01953125, 14.302734375, 15.5859375, 16.869140625, 18.15234375, 19.435546875, 20.71875, 22.001953125, 23.28515625, 24.568359375, 25.8515625, 27.134765625, 28.41796875, 29.701171875, 30.984375, 32.267578125, 33.55078125, 34.833984375, 36.1171875, 37.400390625, 38.68359375, 39.966796875, 41.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 7.0, 9.0, 12.0, 15.0, 12.0, 20.0, 29.0, 37.0, 44.0, 58.0, 76.0, 105.0, 130.0, 192.0, 296.0, 389.0, 503.0, 505.0, 430.0, 313.0, 224.0, 156.0, 127.0, 87.0, 54.0, 42.0, 40.0, 35.0, 25.0, 22.0, 16.0, 8.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -29.074951171875, -28.04052734375, -27.006103515625, -25.9716796875, -24.937255859375, -23.90283203125, -22.868408203125, -21.833984375, -20.799560546875, -19.76513671875, -18.730712890625, -17.6962890625, -16.661865234375, -15.62744140625, -14.593017578125, -13.55859375, -12.524169921875, -11.48974609375, -10.455322265625, -9.4208984375, -8.386474609375, -7.35205078125, -6.317626953125, -5.283203125, -4.248779296875, -3.21435546875, -2.179931640625, -1.1455078125, -0.111083984375, 0.92333984375, 1.957763671875, 2.9921875, 4.026611328125, 5.06103515625, 6.095458984375, 7.1298828125, 8.164306640625, 9.19873046875, 10.233154296875, 11.267578125, 12.302001953125, 13.33642578125, 14.370849609375, 15.4052734375, 16.439697265625, 17.47412109375, 18.508544921875, 19.54296875, 20.577392578125, 21.61181640625, 22.646240234375, 23.6806640625, 24.715087890625, 25.74951171875, 26.783935546875, 27.818359375, 28.852783203125, 29.88720703125, 30.921630859375, 31.9560546875, 32.990478515625, 34.02490234375, 35.059326171875, 36.09375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 13.0, 19.0, 25.0, 63.0, 154.0, 198.0, 206.0, 161.0, 80.0, 43.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.93560791015625, -351.4669189453125, -333.9981994628906, -316.52947998046875, -299.060791015625, -281.59210205078125, -264.1233825683594, -246.65467834472656, -229.18597412109375, -211.71726989746094, -194.24856567382812, -176.7798614501953, -159.3111572265625, -141.8424530029297, -124.37374877929688, -106.90504455566406, -89.43634033203125, -71.96763610839844, -54.498931884765625, -37.03022766113281, -19.5615234375, -2.0928192138671875, 15.375885009765625, 32.84458923339844, 50.31329345703125, 67.78199768066406, 85.25070190429688, 102.71940612792969, 120.1881103515625, 137.6568145751953, 155.12551879882812, 172.59422302246094, 190.0628662109375, 207.5315704345703, 225.00027465820312, 242.46897888183594, 259.93768310546875, 277.4063720703125, 294.8750915527344, 312.34381103515625, 329.8125, 347.28118896484375, 364.7499084472656, 382.2186279296875, 399.68731689453125, 417.156005859375, 434.6247253417969, 452.09344482421875, 469.5621337890625, 487.03082275390625, 504.4995422363281, 521.96826171875, 539.4369506835938, 556.9056396484375, 574.3743896484375, 591.8430786132812, 609.311767578125, 626.7804565429688, 644.2491455078125, 661.7178955078125, 679.1865844726562, 696.6552734375, 714.1240234375, 731.5927124023438, 749.0614013671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 25.0, 16.0, 35.0, 36.0, 47.0, 49.0, 65.0, 56.0, 52.0, 84.0, 81.0, 71.0, 64.0, 61.0, 40.0, 42.0, 34.0, 29.0, 23.0, 11.0, 17.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.9528045654297, -219.63490295410156, -210.3170166015625, -200.99911499023438, -191.68121337890625, -182.36331176757812, -173.04541015625, -163.72752380371094, -154.4096221923828, -145.0917205810547, -135.77383422851562, -126.4559326171875, -117.13803100585938, -107.82012939453125, -98.50223541259766, -89.18434143066406, -79.86643981933594, -70.54853820800781, -61.23064422607422, -51.91274642944336, -42.5948486328125, -33.27695083618164, -23.95905303955078, -14.641159057617188, -5.3232574462890625, 3.994640350341797, 13.312538146972656, 22.630435943603516, 31.948333740234375, 41.266231536865234, 50.584129333496094, 59.90202331542969, 69.21990966796875, 78.53781127929688, 87.85570526123047, 97.17359924316406, 106.49150085449219, 115.80940246582031, 125.1272964477539, 134.4451904296875, 143.76309204101562, 153.08099365234375, 162.39889526367188, 171.71678161621094, 181.03468322753906, 190.3525848388672, 199.67047119140625, 208.98837280273438, 218.3062744140625, 227.62417602539062, 236.94207763671875, 246.2599639892578, 255.57786560058594, 264.895751953125, 274.2136535644531, 283.53155517578125, 292.8494567871094, 302.1673583984375, 311.4852600097656, 320.80316162109375, 330.12103271484375, 339.4389343261719, 348.7568359375, 358.0747375488281, 367.39263916015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 14.0, 11.0, 14.0, 17.0, 28.0, 43.0, 62.0, 77.0, 118.0, 162.0, 280.0, 440.0, 772.0, 1412.0, 2620.0, 5191.0, 11386.0, 27034.0, 65894.0, 157826.0, 332175.0, 255070.0, 108109.0, 44473.0, 18664.0, 8127.0, 3883.0, 1930.0, 1061.0, 602.0, 345.0, 214.0, 140.0, 97.0, 56.0, 58.0, 41.0, 38.0, 18.0, 16.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-35.96875, -34.87158203125, -33.7744140625, -32.67724609375, -31.580078125, -30.48291015625, -29.3857421875, -28.28857421875, -27.19140625, -26.09423828125, -24.9970703125, -23.89990234375, -22.802734375, -21.70556640625, -20.6083984375, -19.51123046875, -18.4140625, -17.31689453125, -16.2197265625, -15.12255859375, -14.025390625, -12.92822265625, -11.8310546875, -10.73388671875, -9.63671875, -8.53955078125, -7.4423828125, -6.34521484375, -5.248046875, -4.15087890625, -3.0537109375, -1.95654296875, -0.859375, 0.23779296875, 1.3349609375, 2.43212890625, 3.529296875, 4.62646484375, 5.7236328125, 6.82080078125, 7.91796875, 9.01513671875, 10.1123046875, 11.20947265625, 12.306640625, 13.40380859375, 14.5009765625, 15.59814453125, 16.6953125, 17.79248046875, 18.8896484375, 19.98681640625, 21.083984375, 22.18115234375, 23.2783203125, 24.37548828125, 25.47265625, 26.56982421875, 27.6669921875, 28.76416015625, 29.861328125, 30.95849609375, 32.0556640625, 33.15283203125, 34.25]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 12.0, 2.0, 9.0, 11.0, 13.0, 24.0, 30.0, 23.0, 38.0, 45.0, 54.0, 58.0, 59.0, 61.0, 72.0, 64.0, 62.0, 56.0, 55.0, 43.0, 47.0, 41.0, 35.0, 29.0, 17.0, 12.0, 10.0, 3.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.3125, -20.599365234375, -19.88623046875, -19.173095703125, -18.4599609375, -17.746826171875, -17.03369140625, -16.320556640625, -15.607421875, -14.894287109375, -14.18115234375, -13.468017578125, -12.7548828125, -12.041748046875, -11.32861328125, -10.615478515625, -9.90234375, -9.189208984375, -8.47607421875, -7.762939453125, -7.0498046875, -6.336669921875, -5.62353515625, -4.910400390625, -4.197265625, -3.484130859375, -2.77099609375, -2.057861328125, -1.3447265625, -0.631591796875, 0.08154296875, 0.794677734375, 1.5078125, 2.220947265625, 2.93408203125, 3.647216796875, 4.3603515625, 5.073486328125, 5.78662109375, 6.499755859375, 7.212890625, 7.926025390625, 8.63916015625, 9.352294921875, 10.0654296875, 10.778564453125, 11.49169921875, 12.204833984375, 12.91796875, 13.631103515625, 14.34423828125, 15.057373046875, 15.7705078125, 16.483642578125, 17.19677734375, 17.909912109375, 18.623046875, 19.336181640625, 20.04931640625, 20.762451171875, 21.4755859375, 22.188720703125, 22.90185546875, 23.614990234375, 24.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 4.0, 18.0, 15.0, 26.0, 32.0, 39.0, 60.0, 91.0, 155.0, 205.0, 368.0, 604.0, 1089.0, 2167.0, 5434.0, 30777.0, 475876.0, 490164.0, 30936.0, 5622.0, 2171.0, 1049.0, 620.0, 347.0, 221.0, 140.0, 89.0, 75.0, 44.0, 28.0, 21.0, 16.0, 17.0, 7.0, 8.0, 8.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.1875, -100.3212890625, -97.455078125, -94.5888671875, -91.72265625, -88.8564453125, -85.990234375, -83.1240234375, -80.2578125, -77.3916015625, -74.525390625, -71.6591796875, -68.79296875, -65.9267578125, -63.060546875, -60.1943359375, -57.328125, -54.4619140625, -51.595703125, -48.7294921875, -45.86328125, -42.9970703125, -40.130859375, -37.2646484375, -34.3984375, -31.5322265625, -28.666015625, -25.7998046875, -22.93359375, -20.0673828125, -17.201171875, -14.3349609375, -11.46875, -8.6025390625, -5.736328125, -2.8701171875, -0.00390625, 2.8623046875, 5.728515625, 8.5947265625, 11.4609375, 14.3271484375, 17.193359375, 20.0595703125, 22.92578125, 25.7919921875, 28.658203125, 31.5244140625, 34.390625, 37.2568359375, 40.123046875, 42.9892578125, 45.85546875, 48.7216796875, 51.587890625, 54.4541015625, 57.3203125, 60.1865234375, 63.052734375, 65.9189453125, 68.78515625, 71.6513671875, 74.517578125, 77.3837890625, 80.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 1.0, 8.0, 8.0, 7.0, 9.0, 14.0, 17.0, 22.0, 22.0, 37.0, 30.0, 32.0, 32.0, 52.0, 58.0, 34.0, 53.0, 54.0, 46.0, 51.0, 38.0, 39.0, 35.0, 44.0, 36.0, 40.0, 29.0, 30.0, 32.0, 13.0, 16.0, 18.0, 12.0, 7.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.0, -66.5927734375, -64.185546875, -61.7783203125, -59.37109375, -56.9638671875, -54.556640625, -52.1494140625, -49.7421875, -47.3349609375, -44.927734375, -42.5205078125, -40.11328125, -37.7060546875, -35.298828125, -32.8916015625, -30.484375, -28.0771484375, -25.669921875, -23.2626953125, -20.85546875, -18.4482421875, -16.041015625, -13.6337890625, -11.2265625, -8.8193359375, -6.412109375, -4.0048828125, -1.59765625, 0.8095703125, 3.216796875, 5.6240234375, 8.03125, 10.4384765625, 12.845703125, 15.2529296875, 17.66015625, 20.0673828125, 22.474609375, 24.8818359375, 27.2890625, 29.6962890625, 32.103515625, 34.5107421875, 36.91796875, 39.3251953125, 41.732421875, 44.1396484375, 46.546875, 48.9541015625, 51.361328125, 53.7685546875, 56.17578125, 58.5830078125, 60.990234375, 63.3974609375, 65.8046875, 68.2119140625, 70.619140625, 73.0263671875, 75.43359375, 77.8408203125, 80.248046875, 82.6552734375, 85.0625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 11.0, 13.0, 16.0, 27.0, 30.0, 61.0, 104.0, 144.0, 303.0, 625.0, 1649.0, 7050.0, 57928.0, 744085.0, 212395.0, 18881.0, 3225.0, 973.0, 433.0, 218.0, 122.0, 78.0, 44.0, 28.0, 24.0, 11.0, 15.0, 12.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.546875, -24.7900390625, -24.033203125, -23.2763671875, -22.51953125, -21.7626953125, -21.005859375, -20.2490234375, -19.4921875, -18.7353515625, -17.978515625, -17.2216796875, -16.46484375, -15.7080078125, -14.951171875, -14.1943359375, -13.4375, -12.6806640625, -11.923828125, -11.1669921875, -10.41015625, -9.6533203125, -8.896484375, -8.1396484375, -7.3828125, -6.6259765625, -5.869140625, -5.1123046875, -4.35546875, -3.5986328125, -2.841796875, -2.0849609375, -1.328125, -0.5712890625, 0.185546875, 0.9423828125, 1.69921875, 2.4560546875, 3.212890625, 3.9697265625, 4.7265625, 5.4833984375, 6.240234375, 6.9970703125, 7.75390625, 8.5107421875, 9.267578125, 10.0244140625, 10.78125, 11.5380859375, 12.294921875, 13.0517578125, 13.80859375, 14.5654296875, 15.322265625, 16.0791015625, 16.8359375, 17.5927734375, 18.349609375, 19.1064453125, 19.86328125, 20.6201171875, 21.376953125, 22.1337890625, 22.890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 6.0, 9.0, 15.0, 16.0, 12.0, 19.0, 19.0, 21.0, 29.0, 39.0, 52.0, 39.0, 75.0, 108.0, 106.0, 92.0, 61.0, 46.0, 45.0, 31.0, 20.0, 20.0, 15.0, 14.0, 7.0, 12.0, 9.0, 8.0, 13.0, 5.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00330352783203125, -0.003193795680999756, -0.0030840635299682617, -0.0029743313789367676, -0.0028645992279052734, -0.0027548670768737793, -0.002645134925842285, -0.002535402774810791, -0.002425670623779297, -0.0023159384727478027, -0.0022062063217163086, -0.0020964741706848145, -0.0019867420196533203, -0.0018770098686218262, -0.001767277717590332, -0.0016575455665588379, -0.0015478134155273438, -0.0014380812644958496, -0.0013283491134643555, -0.0012186169624328613, -0.0011088848114013672, -0.000999152660369873, -0.0008894205093383789, -0.0007796883583068848, -0.0006699562072753906, -0.0005602240562438965, -0.00045049190521240234, -0.0003407597541809082, -0.00023102760314941406, -0.00012129545211791992, -1.1563301086425781e-05, 9.816884994506836e-05, 0.0002079010009765625, 0.00031763315200805664, 0.0004273653030395508, 0.0005370974540710449, 0.0006468296051025391, 0.0007565617561340332, 0.0008662939071655273, 0.0009760260581970215, 0.0010857582092285156, 0.0011954903602600098, 0.001305222511291504, 0.001414954662322998, 0.0015246868133544922, 0.0016344189643859863, 0.0017441511154174805, 0.0018538832664489746, 0.0019636154174804688, 0.002073347568511963, 0.002183079719543457, 0.002292811870574951, 0.0024025440216064453, 0.0025122761726379395, 0.0026220083236694336, 0.0027317404747009277, 0.002841472625732422, 0.002951204776763916, 0.00306093692779541, 0.0031706690788269043, 0.0032804012298583984, 0.0033901333808898926, 0.0034998655319213867, 0.003609597682952881, 0.003719329833984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 16.0, 18.0, 28.0, 59.0, 46.0, 67.0, 84.0, 154.0, 224.0, 330.0, 518.0, 869.0, 1738.0, 3684.0, 10095.0, 41938.0, 302061.0, 596766.0, 66708.0, 13624.0, 4622.0, 2009.0, 1043.0, 604.0, 360.0, 253.0, 166.0, 129.0, 84.0, 47.0, 31.0, 34.0, 25.0, 23.0, 16.0, 5.0, 8.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.0146484375, -13.498046875, -12.9814453125, -12.46484375, -11.9482421875, -11.431640625, -10.9150390625, -10.3984375, -9.8818359375, -9.365234375, -8.8486328125, -8.33203125, -7.8154296875, -7.298828125, -6.7822265625, -6.265625, -5.7490234375, -5.232421875, -4.7158203125, -4.19921875, -3.6826171875, -3.166015625, -2.6494140625, -2.1328125, -1.6162109375, -1.099609375, -0.5830078125, -0.06640625, 0.4501953125, 0.966796875, 1.4833984375, 2.0, 2.5166015625, 3.033203125, 3.5498046875, 4.06640625, 4.5830078125, 5.099609375, 5.6162109375, 6.1328125, 6.6494140625, 7.166015625, 7.6826171875, 8.19921875, 8.7158203125, 9.232421875, 9.7490234375, 10.265625, 10.7822265625, 11.298828125, 11.8154296875, 12.33203125, 12.8486328125, 13.365234375, 13.8818359375, 14.3984375, 14.9150390625, 15.431640625, 15.9482421875, 16.46484375, 16.9814453125, 17.498046875, 18.0146484375, 18.53125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 14.0, 18.0, 11.0, 21.0, 30.0, 28.0, 32.0, 38.0, 48.0, 66.0, 55.0, 72.0, 86.0, 68.0, 80.0, 61.0, 54.0, 41.0, 35.0, 20.0, 30.0, 23.0, 15.0, 14.0, 2.0, 10.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.3974609375, -14.888671875, -14.3798828125, -13.87109375, -13.3623046875, -12.853515625, -12.3447265625, -11.8359375, -11.3271484375, -10.818359375, -10.3095703125, -9.80078125, -9.2919921875, -8.783203125, -8.2744140625, -7.765625, -7.2568359375, -6.748046875, -6.2392578125, -5.73046875, -5.2216796875, -4.712890625, -4.2041015625, -3.6953125, -3.1865234375, -2.677734375, -2.1689453125, -1.66015625, -1.1513671875, -0.642578125, -0.1337890625, 0.375, 0.8837890625, 1.392578125, 1.9013671875, 2.41015625, 2.9189453125, 3.427734375, 3.9365234375, 4.4453125, 4.9541015625, 5.462890625, 5.9716796875, 6.48046875, 6.9892578125, 7.498046875, 8.0068359375, 8.515625, 9.0244140625, 9.533203125, 10.0419921875, 10.55078125, 11.0595703125, 11.568359375, 12.0771484375, 12.5859375, 13.0947265625, 13.603515625, 14.1123046875, 14.62109375, 15.1298828125, 15.638671875, 16.1474609375, 16.65625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 10.0, 16.0, 15.0, 26.0, 65.0, 117.0, 190.0, 245.0, 139.0, 94.0, 39.0, 20.0, 7.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-676.3380737304688, -661.01611328125, -645.694091796875, -630.3721313476562, -615.0501708984375, -599.7281494140625, -584.4061889648438, -569.084228515625, -553.76220703125, -538.4402465820312, -523.1182250976562, -507.7962646484375, -492.4742736816406, -477.15228271484375, -461.830322265625, -446.5083312988281, -431.18634033203125, -415.8643493652344, -400.5423889160156, -385.22039794921875, -369.8984069824219, -354.576416015625, -339.25445556640625, -323.9324645996094, -308.6105041503906, -293.28851318359375, -277.966552734375, -262.6445617675781, -247.32257080078125, -232.00059509277344, -216.67861938476562, -201.35662841796875, -186.03463745117188, -170.71266174316406, -155.3906707763672, -140.06869506835938, -124.7467041015625, -109.42472839355469, -94.10274505615234, -78.78076171875, -63.458778381347656, -48.13679504394531, -32.81481170654297, -17.49283218383789, -2.170848846435547, 13.151130676269531, 28.473114013671875, 43.79509735107422, 59.11708068847656, 74.4390640258789, 89.76104736328125, 105.08302307128906, 120.40501403808594, 135.72698974609375, 151.04898071289062, 166.37095642089844, 181.69293212890625, 197.01490783691406, 212.33689880371094, 227.65887451171875, 242.98086547851562, 258.3028564453125, 273.62481689453125, 288.9468078613281, 304.268798828125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 4.0, 9.0, 12.0, 6.0, 21.0, 15.0, 18.0, 37.0, 28.0, 36.0, 42.0, 26.0, 34.0, 55.0, 61.0, 63.0, 94.0, 65.0, 50.0, 39.0, 34.0, 32.0, 31.0, 27.0, 30.0, 19.0, 14.0, 17.0, 19.0, 5.0, 10.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-347.7723388671875, -337.8692321777344, -327.96612548828125, -318.0630187988281, -308.159912109375, -298.2568054199219, -288.35369873046875, -278.45062255859375, -268.5474853515625, -258.6443786621094, -248.74127197265625, -238.83816528320312, -228.93505859375, -219.03195190429688, -209.1288604736328, -199.2257537841797, -189.32266235351562, -179.4195556640625, -169.51644897460938, -159.61334228515625, -149.71023559570312, -139.80712890625, -129.90403747558594, -120.00093078613281, -110.09782409667969, -100.19471740722656, -90.29161071777344, -80.38851165771484, -70.48540496826172, -60.582298278808594, -50.679195404052734, -40.776092529296875, -30.872955322265625, -20.969850540161133, -11.06674575805664, -1.1636409759521484, 8.739463806152344, 18.64257049560547, 28.545673370361328, 38.44877624511719, 48.35188293457031, 58.25498962402344, 68.15809631347656, 78.06119537353516, 87.96430206298828, 97.8674087524414, 107.7705078125, 117.67361450195312, 127.57672119140625, 137.47982788085938, 147.3829345703125, 157.28604125976562, 167.18914794921875, 177.09225463867188, 186.99534606933594, 196.89845275878906, 206.8015594482422, 216.7046661376953, 226.60777282714844, 236.51087951660156, 246.41397094726562, 256.31707763671875, 266.2201843261719, 276.123291015625, 286.0263977050781]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 22.0, 37.0, 55.0, 120.0, 229.0, 470.0, 1176.0, 3073.0, 10243.0, 42843.0, 326889.0, 2895487.0, 813525.0, 77343.0, 15426.0, 4471.0, 1523.0, 670.0, 281.0, 147.0, 82.0, 53.0, 41.0, 14.0, 17.0, 10.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.486083984375, -27.45654296875, -26.427001953125, -25.3974609375, -24.367919921875, -23.33837890625, -22.308837890625, -21.279296875, -20.249755859375, -19.22021484375, -18.190673828125, -17.1611328125, -16.131591796875, -15.10205078125, -14.072509765625, -13.04296875, -12.013427734375, -10.98388671875, -9.954345703125, -8.9248046875, -7.895263671875, -6.86572265625, -5.836181640625, -4.806640625, -3.777099609375, -2.74755859375, -1.718017578125, -0.6884765625, 0.341064453125, 1.37060546875, 2.400146484375, 3.4296875, 4.459228515625, 5.48876953125, 6.518310546875, 7.5478515625, 8.577392578125, 9.60693359375, 10.636474609375, 11.666015625, 12.695556640625, 13.72509765625, 14.754638671875, 15.7841796875, 16.813720703125, 17.84326171875, 18.872802734375, 19.90234375, 20.931884765625, 21.96142578125, 22.990966796875, 24.0205078125, 25.050048828125, 26.07958984375, 27.109130859375, 28.138671875, 29.168212890625, 30.19775390625, 31.227294921875, 32.2568359375, 33.286376953125, 34.31591796875, 35.345458984375, 36.375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 8.0, 13.0, 8.0, 19.0, 26.0, 31.0, 28.0, 43.0, 47.0, 48.0, 44.0, 55.0, 65.0, 59.0, 63.0, 54.0, 64.0, 44.0, 44.0, 44.0, 40.0, 31.0, 20.0, 25.0, 17.0, 13.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.515625, -18.83740234375, -18.1591796875, -17.48095703125, -16.802734375, -16.12451171875, -15.4462890625, -14.76806640625, -14.08984375, -13.41162109375, -12.7333984375, -12.05517578125, -11.376953125, -10.69873046875, -10.0205078125, -9.34228515625, -8.6640625, -7.98583984375, -7.3076171875, -6.62939453125, -5.951171875, -5.27294921875, -4.5947265625, -3.91650390625, -3.23828125, -2.56005859375, -1.8818359375, -1.20361328125, -0.525390625, 0.15283203125, 0.8310546875, 1.50927734375, 2.1875, 2.86572265625, 3.5439453125, 4.22216796875, 4.900390625, 5.57861328125, 6.2568359375, 6.93505859375, 7.61328125, 8.29150390625, 8.9697265625, 9.64794921875, 10.326171875, 11.00439453125, 11.6826171875, 12.36083984375, 13.0390625, 13.71728515625, 14.3955078125, 15.07373046875, 15.751953125, 16.43017578125, 17.1083984375, 17.78662109375, 18.46484375, 19.14306640625, 19.8212890625, 20.49951171875, 21.177734375, 21.85595703125, 22.5341796875, 23.21240234375, 23.890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 6.0, 13.0, 14.0, 17.0, 33.0, 58.0, 88.0, 157.0, 297.0, 664.0, 1554.0, 4203.0, 13980.0, 64304.0, 719418.0, 3113223.0, 223387.0, 36680.0, 9658.0, 3442.0, 1452.0, 674.0, 334.0, 230.0, 145.0, 81.0, 49.0, 35.0, 24.0, 15.0, 7.0, 12.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.875, -40.578125, -39.28125, -37.984375, -36.6875, -35.390625, -34.09375, -32.796875, -31.5, -30.203125, -28.90625, -27.609375, -26.3125, -25.015625, -23.71875, -22.421875, -21.125, -19.828125, -18.53125, -17.234375, -15.9375, -14.640625, -13.34375, -12.046875, -10.75, -9.453125, -8.15625, -6.859375, -5.5625, -4.265625, -2.96875, -1.671875, -0.375, 0.921875, 2.21875, 3.515625, 4.8125, 6.109375, 7.40625, 8.703125, 10.0, 11.296875, 12.59375, 13.890625, 15.1875, 16.484375, 17.78125, 19.078125, 20.375, 21.671875, 22.96875, 24.265625, 25.5625, 26.859375, 28.15625, 29.453125, 30.75, 32.046875, 33.34375, 34.640625, 35.9375, 37.234375, 38.53125, 39.828125, 41.125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 7.0, 7.0, 17.0, 15.0, 30.0, 50.0, 65.0, 143.0, 281.0, 551.0, 877.0, 847.0, 520.0, 246.0, 133.0, 86.0, 58.0, 40.0, 23.0, 19.0, 16.0, 10.0, 5.0, 8.0, 4.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.625, -30.90234375, -29.1796875, -27.45703125, -25.734375, -24.01171875, -22.2890625, -20.56640625, -18.84375, -17.12109375, -15.3984375, -13.67578125, -11.953125, -10.23046875, -8.5078125, -6.78515625, -5.0625, -3.33984375, -1.6171875, 0.10546875, 1.828125, 3.55078125, 5.2734375, 6.99609375, 8.71875, 10.44140625, 12.1640625, 13.88671875, 15.609375, 17.33203125, 19.0546875, 20.77734375, 22.5, 24.22265625, 25.9453125, 27.66796875, 29.390625, 31.11328125, 32.8359375, 34.55859375, 36.28125, 38.00390625, 39.7265625, 41.44921875, 43.171875, 44.89453125, 46.6171875, 48.33984375, 50.0625, 51.78515625, 53.5078125, 55.23046875, 56.953125, 58.67578125, 60.3984375, 62.12109375, 63.84375, 65.56640625, 67.2890625, 69.01171875, 70.734375, 72.45703125, 74.1796875, 75.90234375, 77.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 31.0, 64.0, 131.0, 216.0, 263.0, 143.0, 75.0, 31.0, 15.0, 5.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-428.302734375, -410.3797607421875, -392.456787109375, -374.5338439941406, -356.6108703613281, -338.6878967285156, -320.76495361328125, -302.84197998046875, -284.91900634765625, -266.99603271484375, -249.0730743408203, -231.15011596679688, -213.22714233398438, -195.30416870117188, -177.38121032714844, -159.458251953125, -141.5352783203125, -123.61231231689453, -105.68934631347656, -87.7663803100586, -69.84341430664062, -51.920448303222656, -33.99748229980469, -16.07451629638672, 1.84844970703125, 19.77141571044922, 37.69438171386719, 55.617347717285156, 73.54031372070312, 91.4632797241211, 109.38624572753906, 127.30921173095703, 145.23223876953125, 163.15521240234375, 181.0781707763672, 199.00112915039062, 216.92410278320312, 234.84707641601562, 252.77003479003906, 270.6929931640625, 288.615966796875, 306.5389404296875, 324.4619140625, 342.3848571777344, 360.3078308105469, 378.2308044433594, 396.15374755859375, 414.07672119140625, 431.99969482421875, 449.92266845703125, 467.84564208984375, 485.7685852050781, 503.6915588378906, 521.614501953125, 539.5374755859375, 557.46044921875, 575.3834228515625, 593.306396484375, 611.2293701171875, 629.15234375, 647.0753173828125, 664.9982299804688, 682.9212036132812, 700.8441772460938, 718.7671508789062]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 10.0, 11.0, 20.0, 13.0, 19.0, 40.0, 39.0, 50.0, 55.0, 52.0, 61.0, 66.0, 57.0, 71.0, 74.0, 67.0, 58.0, 54.0, 35.0, 32.0, 38.0, 20.0, 20.0, 12.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-404.4827880859375, -395.73114013671875, -386.9794921875, -378.22784423828125, -369.4761962890625, -360.72454833984375, -351.972900390625, -343.22125244140625, -334.4696044921875, -325.71795654296875, -316.96630859375, -308.21466064453125, -299.4630126953125, -290.71136474609375, -281.959716796875, -273.20806884765625, -264.4563903808594, -255.70474243164062, -246.95309448242188, -238.20144653320312, -229.44979858398438, -220.69815063476562, -211.9464874267578, -203.19483947753906, -194.4431915283203, -185.69154357910156, -176.9398956298828, -168.18824768066406, -159.43658447265625, -150.6849365234375, -141.93328857421875, -133.181640625, -124.43002319335938, -115.67837524414062, -106.92672729492188, -98.1750717163086, -89.42342376708984, -80.6717758178711, -71.92012023925781, -63.16847229003906, -54.41682434082031, -45.66517639160156, -36.91352462768555, -28.161874771118164, -19.41022491455078, -10.658576965332031, -1.9069252014160156, 6.8447265625, 15.59637451171875, 24.348024368286133, 33.099674224853516, 41.85132598876953, 50.60297393798828, 59.35462188720703, 68.10627746582031, 76.85792541503906, 85.60957336425781, 94.36122131347656, 103.11286926269531, 111.8645248413086, 120.61617279052734, 129.36782836914062, 138.11947631835938, 146.87112426757812, 155.62277221679688]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 11.0, 10.0, 14.0, 20.0, 35.0, 42.0, 54.0, 86.0, 141.0, 198.0, 360.0, 573.0, 1098.0, 1866.0, 3598.0, 6731.0, 13620.0, 30019.0, 71353.0, 190099.0, 372944.0, 212491.0, 79620.0, 33091.0, 14969.0, 7093.0, 3609.0, 1986.0, 1087.0, 638.0, 431.0, 245.0, 155.0, 78.0, 55.0, 51.0, 26.0, 19.0, 15.0, 9.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.607666015625, -29.60595703125, -28.604248046875, -27.6025390625, -26.600830078125, -25.59912109375, -24.597412109375, -23.595703125, -22.593994140625, -21.59228515625, -20.590576171875, -19.5888671875, -18.587158203125, -17.58544921875, -16.583740234375, -15.58203125, -14.580322265625, -13.57861328125, -12.576904296875, -11.5751953125, -10.573486328125, -9.57177734375, -8.570068359375, -7.568359375, -6.566650390625, -5.56494140625, -4.563232421875, -3.5615234375, -2.559814453125, -1.55810546875, -0.556396484375, 0.4453125, 1.447021484375, 2.44873046875, 3.450439453125, 4.4521484375, 5.453857421875, 6.45556640625, 7.457275390625, 8.458984375, 9.460693359375, 10.46240234375, 11.464111328125, 12.4658203125, 13.467529296875, 14.46923828125, 15.470947265625, 16.47265625, 17.474365234375, 18.47607421875, 19.477783203125, 20.4794921875, 21.481201171875, 22.48291015625, 23.484619140625, 24.486328125, 25.488037109375, 26.48974609375, 27.491455078125, 28.4931640625, 29.494873046875, 30.49658203125, 31.498291015625, 32.5]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 14.0, 9.0, 14.0, 23.0, 18.0, 23.0, 32.0, 39.0, 43.0, 42.0, 67.0, 57.0, 50.0, 53.0, 78.0, 63.0, 55.0, 48.0, 61.0, 38.0, 29.0, 28.0, 22.0, 22.0, 18.0, 6.0, 5.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.53125, -18.848388671875, -18.16552734375, -17.482666015625, -16.7998046875, -16.116943359375, -15.43408203125, -14.751220703125, -14.068359375, -13.385498046875, -12.70263671875, -12.019775390625, -11.3369140625, -10.654052734375, -9.97119140625, -9.288330078125, -8.60546875, -7.922607421875, -7.23974609375, -6.556884765625, -5.8740234375, -5.191162109375, -4.50830078125, -3.825439453125, -3.142578125, -2.459716796875, -1.77685546875, -1.093994140625, -0.4111328125, 0.271728515625, 0.95458984375, 1.637451171875, 2.3203125, 3.003173828125, 3.68603515625, 4.368896484375, 5.0517578125, 5.734619140625, 6.41748046875, 7.100341796875, 7.783203125, 8.466064453125, 9.14892578125, 9.831787109375, 10.5146484375, 11.197509765625, 11.88037109375, 12.563232421875, 13.24609375, 13.928955078125, 14.61181640625, 15.294677734375, 15.9775390625, 16.660400390625, 17.34326171875, 18.026123046875, 18.708984375, 19.391845703125, 20.07470703125, 20.757568359375, 21.4404296875, 22.123291015625, 22.80615234375, 23.489013671875, 24.171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 15.0, 23.0, 32.0, 41.0, 63.0, 96.0, 156.0, 204.0, 369.0, 530.0, 866.0, 1657.0, 3743.0, 13423.0, 85766.0, 748121.0, 162616.0, 20902.0, 5027.0, 2028.0, 1063.0, 642.0, 378.0, 249.0, 163.0, 110.0, 76.0, 63.0, 29.0, 22.0, 15.0, 14.0, 7.0, 6.0, 7.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-77.0, -74.7109375, -72.421875, -70.1328125, -67.84375, -65.5546875, -63.265625, -60.9765625, -58.6875, -56.3984375, -54.109375, -51.8203125, -49.53125, -47.2421875, -44.953125, -42.6640625, -40.375, -38.0859375, -35.796875, -33.5078125, -31.21875, -28.9296875, -26.640625, -24.3515625, -22.0625, -19.7734375, -17.484375, -15.1953125, -12.90625, -10.6171875, -8.328125, -6.0390625, -3.75, -1.4609375, 0.828125, 3.1171875, 5.40625, 7.6953125, 9.984375, 12.2734375, 14.5625, 16.8515625, 19.140625, 21.4296875, 23.71875, 26.0078125, 28.296875, 30.5859375, 32.875, 35.1640625, 37.453125, 39.7421875, 42.03125, 44.3203125, 46.609375, 48.8984375, 51.1875, 53.4765625, 55.765625, 58.0546875, 60.34375, 62.6328125, 64.921875, 67.2109375, 69.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 5.0, 6.0, 6.0, 5.0, 6.0, 6.0, 16.0, 15.0, 14.0, 17.0, 25.0, 36.0, 24.0, 32.0, 32.0, 50.0, 45.0, 40.0, 39.0, 47.0, 47.0, 53.0, 48.0, 52.0, 31.0, 39.0, 32.0, 36.0, 25.0, 19.0, 25.0, 27.0, 13.0, 19.0, 14.0, 14.0, 9.0, 10.0, 1.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-69.1875, -67.2275390625, -65.267578125, -63.3076171875, -61.34765625, -59.3876953125, -57.427734375, -55.4677734375, -53.5078125, -51.5478515625, -49.587890625, -47.6279296875, -45.66796875, -43.7080078125, -41.748046875, -39.7880859375, -37.828125, -35.8681640625, -33.908203125, -31.9482421875, -29.98828125, -28.0283203125, -26.068359375, -24.1083984375, -22.1484375, -20.1884765625, -18.228515625, -16.2685546875, -14.30859375, -12.3486328125, -10.388671875, -8.4287109375, -6.46875, -4.5087890625, -2.548828125, -0.5888671875, 1.37109375, 3.3310546875, 5.291015625, 7.2509765625, 9.2109375, 11.1708984375, 13.130859375, 15.0908203125, 17.05078125, 19.0107421875, 20.970703125, 22.9306640625, 24.890625, 26.8505859375, 28.810546875, 30.7705078125, 32.73046875, 34.6904296875, 36.650390625, 38.6103515625, 40.5703125, 42.5302734375, 44.490234375, 46.4501953125, 48.41015625, 50.3701171875, 52.330078125, 54.2900390625, 56.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 7.0, 12.0, 17.0, 19.0, 38.0, 43.0, 77.0, 92.0, 172.0, 375.0, 731.0, 2084.0, 8908.0, 64161.0, 776486.0, 171333.0, 18342.0, 3527.0, 1047.0, 456.0, 222.0, 134.0, 77.0, 45.0, 35.0, 31.0, 24.0, 14.0, 11.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.79931640625, -16.1455078125, -15.49169921875, -14.837890625, -14.18408203125, -13.5302734375, -12.87646484375, -12.22265625, -11.56884765625, -10.9150390625, -10.26123046875, -9.607421875, -8.95361328125, -8.2998046875, -7.64599609375, -6.9921875, -6.33837890625, -5.6845703125, -5.03076171875, -4.376953125, -3.72314453125, -3.0693359375, -2.41552734375, -1.76171875, -1.10791015625, -0.4541015625, 0.19970703125, 0.853515625, 1.50732421875, 2.1611328125, 2.81494140625, 3.46875, 4.12255859375, 4.7763671875, 5.43017578125, 6.083984375, 6.73779296875, 7.3916015625, 8.04541015625, 8.69921875, 9.35302734375, 10.0068359375, 10.66064453125, 11.314453125, 11.96826171875, 12.6220703125, 13.27587890625, 13.9296875, 14.58349609375, 15.2373046875, 15.89111328125, 16.544921875, 17.19873046875, 17.8525390625, 18.50634765625, 19.16015625, 19.81396484375, 20.4677734375, 21.12158203125, 21.775390625, 22.42919921875, 23.0830078125, 23.73681640625, 24.390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 6.0, 7.0, 14.0, 10.0, 17.0, 12.0, 22.0, 27.0, 48.0, 48.0, 82.0, 119.0, 138.0, 111.0, 70.0, 48.0, 43.0, 26.0, 23.0, 17.0, 17.0, 22.0, 13.0, 8.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.00366973876953125, -0.003556668758392334, -0.003443598747253418, -0.003330528736114502, -0.003217458724975586, -0.00310438871383667, -0.002991318702697754, -0.002878248691558838, -0.002765178680419922, -0.002652108669281006, -0.00253903865814209, -0.002425968647003174, -0.002312898635864258, -0.002199828624725342, -0.0020867586135864258, -0.0019736886024475098, -0.0018606185913085938, -0.0017475485801696777, -0.0016344785690307617, -0.0015214085578918457, -0.0014083385467529297, -0.0012952685356140137, -0.0011821985244750977, -0.0010691285133361816, -0.0009560585021972656, -0.0008429884910583496, -0.0007299184799194336, -0.0006168484687805176, -0.0005037784576416016, -0.00039070844650268555, -0.00027763843536376953, -0.00016456842422485352, -5.14984130859375e-05, 6.157159805297852e-05, 0.00017464160919189453, 0.00028771162033081055, 0.00040078163146972656, 0.0005138516426086426, 0.0006269216537475586, 0.0007399916648864746, 0.0008530616760253906, 0.0009661316871643066, 0.0010792016983032227, 0.0011922717094421387, 0.0013053417205810547, 0.0014184117317199707, 0.0015314817428588867, 0.0016445517539978027, 0.0017576217651367188, 0.0018706917762756348, 0.0019837617874145508, 0.002096831798553467, 0.002209901809692383, 0.002322971820831299, 0.002436041831970215, 0.002549111843109131, 0.002662181854248047, 0.002775251865386963, 0.002888321876525879, 0.003001391887664795, 0.003114461898803711, 0.003227531909942627, 0.003340601921081543, 0.003453671932220459, 0.003566741943359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 23.0, 16.0, 22.0, 39.0, 70.0, 167.0, 315.0, 547.0, 1277.0, 3435.0, 14415.0, 161009.0, 797280.0, 57896.0, 7933.0, 2291.0, 950.0, 427.0, 210.0, 101.0, 63.0, 23.0, 20.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.8173828125, -21.181640625, -20.5458984375, -19.91015625, -19.2744140625, -18.638671875, -18.0029296875, -17.3671875, -16.7314453125, -16.095703125, -15.4599609375, -14.82421875, -14.1884765625, -13.552734375, -12.9169921875, -12.28125, -11.6455078125, -11.009765625, -10.3740234375, -9.73828125, -9.1025390625, -8.466796875, -7.8310546875, -7.1953125, -6.5595703125, -5.923828125, -5.2880859375, -4.65234375, -4.0166015625, -3.380859375, -2.7451171875, -2.109375, -1.4736328125, -0.837890625, -0.2021484375, 0.43359375, 1.0693359375, 1.705078125, 2.3408203125, 2.9765625, 3.6123046875, 4.248046875, 4.8837890625, 5.51953125, 6.1552734375, 6.791015625, 7.4267578125, 8.0625, 8.6982421875, 9.333984375, 9.9697265625, 10.60546875, 11.2412109375, 11.876953125, 12.5126953125, 13.1484375, 13.7841796875, 14.419921875, 15.0556640625, 15.69140625, 16.3271484375, 16.962890625, 17.5986328125, 18.234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 9.0, 9.0, 9.0, 24.0, 13.0, 11.0, 16.0, 28.0, 39.0, 37.0, 61.0, 59.0, 70.0, 79.0, 65.0, 90.0, 61.0, 52.0, 38.0, 45.0, 34.0, 27.0, 28.0, 20.0, 7.0, 16.0, 7.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.099853515625, -9.73095703125, -9.362060546875, -8.9931640625, -8.624267578125, -8.25537109375, -7.886474609375, -7.517578125, -7.148681640625, -6.77978515625, -6.410888671875, -6.0419921875, -5.673095703125, -5.30419921875, -4.935302734375, -4.56640625, -4.197509765625, -3.82861328125, -3.459716796875, -3.0908203125, -2.721923828125, -2.35302734375, -1.984130859375, -1.615234375, -1.246337890625, -0.87744140625, -0.508544921875, -0.1396484375, 0.229248046875, 0.59814453125, 0.967041015625, 1.3359375, 1.704833984375, 2.07373046875, 2.442626953125, 2.8115234375, 3.180419921875, 3.54931640625, 3.918212890625, 4.287109375, 4.656005859375, 5.02490234375, 5.393798828125, 5.7626953125, 6.131591796875, 6.50048828125, 6.869384765625, 7.23828125, 7.607177734375, 7.97607421875, 8.344970703125, 8.7138671875, 9.082763671875, 9.45166015625, 9.820556640625, 10.189453125, 10.558349609375, 10.92724609375, 11.296142578125, 11.6650390625, 12.033935546875, 12.40283203125, 12.771728515625, 13.140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 14.0, 39.0, 65.0, 182.0, 284.0, 193.0, 107.0, 49.0, 23.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-566.0093383789062, -550.6088256835938, -535.2083740234375, -519.807861328125, -504.4073791503906, -489.00689697265625, -473.6064147949219, -458.2059326171875, -442.805419921875, -427.4049377441406, -412.00445556640625, -396.60394287109375, -381.2034606933594, -365.802978515625, -350.4024963378906, -335.00201416015625, -319.60150146484375, -304.2010192871094, -288.800537109375, -273.4000244140625, -257.9995422363281, -242.59906005859375, -227.19857788085938, -211.79808044433594, -196.39761352539062, -180.99713134765625, -165.5966339111328, -150.19615173339844, -134.795654296875, -119.39517211914062, -103.99468231201172, -88.59419250488281, -73.19369506835938, -57.79320526123047, -42.39271545410156, -26.992229461669922, -11.591739654541016, 3.808746337890625, 19.20923614501953, 34.60972595214844, 50.010215759277344, 65.41070556640625, 80.81119537353516, 96.21168518066406, 111.61216735839844, 127.01265716552734, 142.41314697265625, 157.81362915039062, 173.21412658691406, 188.61460876464844, 204.01510620117188, 219.41558837890625, 234.8160858154297, 250.21656799316406, 265.6170654296875, 281.0175476074219, 296.41802978515625, 311.8185119628906, 327.218994140625, 342.6195068359375, 358.0199890136719, 373.42047119140625, 388.8209533691406, 404.221435546875, 419.6219482421875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 3.0, 4.0, 10.0, 13.0, 12.0, 10.0, 21.0, 23.0, 24.0, 17.0, 26.0, 30.0, 24.0, 29.0, 34.0, 38.0, 48.0, 58.0, 72.0, 65.0, 52.0, 44.0, 41.0, 30.0, 38.0, 34.0, 25.0, 21.0, 26.0, 15.0, 17.0, 14.0, 17.0, 11.0, 10.0, 6.0, 8.0, 4.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.12289428710938, -191.53216552734375, -183.94142150878906, -176.35069274902344, -168.75994873046875, -161.16921997070312, -153.5784912109375, -145.9877471923828, -138.3970184326172, -130.80628967285156, -123.21554565429688, -115.62481689453125, -108.0340805053711, -100.44334411621094, -92.85260772705078, -85.26187133789062, -77.67113494873047, -70.08039855957031, -62.48966598510742, -54.898929595947266, -47.308197021484375, -39.71746063232422, -32.12672424316406, -24.535991668701172, -16.945255279541016, -9.354520797729492, -1.7637853622436523, 5.8269500732421875, 13.417684555053711, 21.008419036865234, 28.59915542602539, 36.18988800048828, 43.78062438964844, 51.371360778808594, 58.962093353271484, 66.55282592773438, 74.14356231689453, 81.73429870605469, 89.32503509521484, 96.915771484375, 104.50650024414062, 112.09723663330078, 119.68797302246094, 127.27870178222656, 134.86944580078125, 142.46017456054688, 150.0509033203125, 157.6416473388672, 165.23239135742188, 172.8231201171875, 180.4138641357422, 188.0045928955078, 195.5953369140625, 203.18606567382812, 210.77679443359375, 218.36753845214844, 225.95826721191406, 233.5489959716797, 241.13973999023438, 248.73046875, 256.3211975097656, 263.91192626953125, 271.502685546875, 279.0934143066406, 286.68414306640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 6.0, 12.0, 22.0, 20.0, 20.0, 43.0, 60.0, 68.0, 96.0, 165.0, 274.0, 484.0, 878.0, 1573.0, 3396.0, 7974.0, 24701.0, 124338.0, 1216053.0, 2452150.0, 297871.0, 43155.0, 11485.0, 4564.0, 2169.0, 1064.0, 610.0, 380.0, 217.0, 128.0, 84.0, 52.0, 35.0, 34.0, 25.0, 21.0, 9.0, 12.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.833984375, -24.01171875, -23.189453125, -22.3671875, -21.544921875, -20.72265625, -19.900390625, -19.078125, -18.255859375, -17.43359375, -16.611328125, -15.7890625, -14.966796875, -14.14453125, -13.322265625, -12.5, -11.677734375, -10.85546875, -10.033203125, -9.2109375, -8.388671875, -7.56640625, -6.744140625, -5.921875, -5.099609375, -4.27734375, -3.455078125, -2.6328125, -1.810546875, -0.98828125, -0.166015625, 0.65625, 1.478515625, 2.30078125, 3.123046875, 3.9453125, 4.767578125, 5.58984375, 6.412109375, 7.234375, 8.056640625, 8.87890625, 9.701171875, 10.5234375, 11.345703125, 12.16796875, 12.990234375, 13.8125, 14.634765625, 15.45703125, 16.279296875, 17.1015625, 17.923828125, 18.74609375, 19.568359375, 20.390625, 21.212890625, 22.03515625, 22.857421875, 23.6796875, 24.501953125, 25.32421875, 26.146484375, 26.96875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 7.0, 6.0, 11.0, 13.0, 12.0, 28.0, 18.0, 22.0, 28.0, 38.0, 46.0, 50.0, 47.0, 65.0, 64.0, 53.0, 47.0, 57.0, 66.0, 61.0, 48.0, 40.0, 33.0, 22.0, 22.0, 34.0, 21.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.640625, -17.972412109375, -17.30419921875, -16.635986328125, -15.9677734375, -15.299560546875, -14.63134765625, -13.963134765625, -13.294921875, -12.626708984375, -11.95849609375, -11.290283203125, -10.6220703125, -9.953857421875, -9.28564453125, -8.617431640625, -7.94921875, -7.281005859375, -6.61279296875, -5.944580078125, -5.2763671875, -4.608154296875, -3.93994140625, -3.271728515625, -2.603515625, -1.935302734375, -1.26708984375, -0.598876953125, 0.0693359375, 0.737548828125, 1.40576171875, 2.073974609375, 2.7421875, 3.410400390625, 4.07861328125, 4.746826171875, 5.4150390625, 6.083251953125, 6.75146484375, 7.419677734375, 8.087890625, 8.756103515625, 9.42431640625, 10.092529296875, 10.7607421875, 11.428955078125, 12.09716796875, 12.765380859375, 13.43359375, 14.101806640625, 14.77001953125, 15.438232421875, 16.1064453125, 16.774658203125, 17.44287109375, 18.111083984375, 18.779296875, 19.447509765625, 20.11572265625, 20.783935546875, 21.4521484375, 22.120361328125, 22.78857421875, 23.456787109375, 24.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 7.0, 15.0, 15.0, 35.0, 45.0, 60.0, 114.0, 210.0, 432.0, 1112.0, 3151.0, 11685.0, 72234.0, 2225509.0, 1798473.0, 64908.0, 11227.0, 3010.0, 1031.0, 435.0, 211.0, 123.0, 67.0, 62.0, 37.0, 16.0, 21.0, 11.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.3603515625, -31.908203125, -30.4560546875, -29.00390625, -27.5517578125, -26.099609375, -24.6474609375, -23.1953125, -21.7431640625, -20.291015625, -18.8388671875, -17.38671875, -15.9345703125, -14.482421875, -13.0302734375, -11.578125, -10.1259765625, -8.673828125, -7.2216796875, -5.76953125, -4.3173828125, -2.865234375, -1.4130859375, 0.0390625, 1.4912109375, 2.943359375, 4.3955078125, 5.84765625, 7.2998046875, 8.751953125, 10.2041015625, 11.65625, 13.1083984375, 14.560546875, 16.0126953125, 17.46484375, 18.9169921875, 20.369140625, 21.8212890625, 23.2734375, 24.7255859375, 26.177734375, 27.6298828125, 29.08203125, 30.5341796875, 31.986328125, 33.4384765625, 34.890625, 36.3427734375, 37.794921875, 39.2470703125, 40.69921875, 42.1513671875, 43.603515625, 45.0556640625, 46.5078125, 47.9599609375, 49.412109375, 50.8642578125, 52.31640625, 53.7685546875, 55.220703125, 56.6728515625, 58.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 15.0, 19.0, 24.0, 30.0, 47.0, 85.0, 134.0, 210.0, 393.0, 632.0, 790.0, 639.0, 434.0, 210.0, 140.0, 73.0, 48.0, 26.0, 23.0, 30.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.5625, -29.32080078125, -28.0791015625, -26.83740234375, -25.595703125, -24.35400390625, -23.1123046875, -21.87060546875, -20.62890625, -19.38720703125, -18.1455078125, -16.90380859375, -15.662109375, -14.42041015625, -13.1787109375, -11.93701171875, -10.6953125, -9.45361328125, -8.2119140625, -6.97021484375, -5.728515625, -4.48681640625, -3.2451171875, -2.00341796875, -0.76171875, 0.47998046875, 1.7216796875, 2.96337890625, 4.205078125, 5.44677734375, 6.6884765625, 7.93017578125, 9.171875, 10.41357421875, 11.6552734375, 12.89697265625, 14.138671875, 15.38037109375, 16.6220703125, 17.86376953125, 19.10546875, 20.34716796875, 21.5888671875, 22.83056640625, 24.072265625, 25.31396484375, 26.5556640625, 27.79736328125, 29.0390625, 30.28076171875, 31.5224609375, 32.76416015625, 34.005859375, 35.24755859375, 36.4892578125, 37.73095703125, 38.97265625, 40.21435546875, 41.4560546875, 42.69775390625, 43.939453125, 45.18115234375, 46.4228515625, 47.66455078125, 48.90625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 14.0, 37.0, 157.0, 356.0, 287.0, 99.0, 24.0, 13.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-724.652587890625, -702.5910034179688, -680.5293579101562, -658.4677734375, -636.4061279296875, -614.3445434570312, -592.282958984375, -570.2213134765625, -548.1597290039062, -526.09814453125, -504.0364990234375, -481.97491455078125, -459.9132995605469, -437.8516845703125, -415.7900695800781, -393.72845458984375, -371.6668395996094, -349.605224609375, -327.5436096191406, -305.48199462890625, -283.42041015625, -261.3587951660156, -239.29718017578125, -217.23558044433594, -195.17396545410156, -173.1123504638672, -151.05075073242188, -128.9891357421875, -106.92752838134766, -84.86592102050781, -62.80430603027344, -40.742706298828125, -18.68109130859375, 3.3805179595947266, 25.442127227783203, 47.50373840332031, 69.56534576416016, 91.626953125, 113.68856811523438, 135.7501678466797, 157.81178283691406, 179.87339782714844, 201.93499755859375, 223.99661254882812, 246.0582275390625, 268.11981201171875, 290.18145751953125, 312.2430419921875, 334.3046569824219, 356.36627197265625, 378.4278869628906, 400.489501953125, 422.55108642578125, 444.6127014160156, 466.67431640625, 488.73590087890625, 510.79754638671875, 532.859130859375, 554.9207763671875, 576.9823608398438, 599.0440063476562, 621.1055908203125, 643.167236328125, 665.2288208007812, 687.2904052734375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 8.0, 16.0, 13.0, 19.0, 17.0, 13.0, 27.0, 38.0, 35.0, 30.0, 35.0, 43.0, 43.0, 41.0, 55.0, 50.0, 45.0, 58.0, 48.0, 42.0, 41.0, 45.0, 24.0, 24.0, 30.0, 23.0, 15.0, 12.0, 21.0, 13.0, 15.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.69329833984375, -141.41461181640625, -136.13592529296875, -130.85723876953125, -125.57854461669922, -120.29985809326172, -115.02116394042969, -109.74247741699219, -104.46379089355469, -99.18510437011719, -93.90641784667969, -88.62772369384766, -83.34903717041016, -78.07035064697266, -72.79165649414062, -67.51296997070312, -62.234283447265625, -56.955596923828125, -51.67690658569336, -46.398216247558594, -41.119529724121094, -35.840843200683594, -30.562152862548828, -25.283462524414062, -20.004776000976562, -14.72608757019043, -9.447399139404297, -4.168710708618164, 1.1099777221679688, 6.388666152954102, 11.667354583740234, 16.946044921875, 22.2247314453125, 27.503419876098633, 32.782108306884766, 38.06079864501953, 43.33948516845703, 48.61817169189453, 53.8968620300293, 59.17555236816406, 64.45423889160156, 69.73292541503906, 75.01161193847656, 80.2903060913086, 85.5689926147461, 90.8476791381836, 96.12637329101562, 101.40505981445312, 106.68374633789062, 111.96243286132812, 117.24111938476562, 122.51981353759766, 127.79850006103516, 133.0771942138672, 138.3558807373047, 143.6345672607422, 148.9132537841797, 154.1919403076172, 159.4706268310547, 164.7493133544922, 170.02801513671875, 175.30670166015625, 180.58538818359375, 185.86407470703125, 191.14276123046875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 9.0, 22.0, 28.0, 45.0, 49.0, 98.0, 129.0, 223.0, 418.0, 755.0, 1435.0, 3012.0, 6507.0, 15646.0, 42884.0, 126853.0, 319138.0, 325674.0, 131781.0, 44615.0, 16171.0, 6740.0, 3004.0, 1442.0, 791.0, 415.0, 226.0, 141.0, 81.0, 61.0, 52.0, 25.0, 23.0, 9.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.375, -23.56298828125, -22.7509765625, -21.93896484375, -21.126953125, -20.31494140625, -19.5029296875, -18.69091796875, -17.87890625, -17.06689453125, -16.2548828125, -15.44287109375, -14.630859375, -13.81884765625, -13.0068359375, -12.19482421875, -11.3828125, -10.57080078125, -9.7587890625, -8.94677734375, -8.134765625, -7.32275390625, -6.5107421875, -5.69873046875, -4.88671875, -4.07470703125, -3.2626953125, -2.45068359375, -1.638671875, -0.82666015625, -0.0146484375, 0.79736328125, 1.609375, 2.42138671875, 3.2333984375, 4.04541015625, 4.857421875, 5.66943359375, 6.4814453125, 7.29345703125, 8.10546875, 8.91748046875, 9.7294921875, 10.54150390625, 11.353515625, 12.16552734375, 12.9775390625, 13.78955078125, 14.6015625, 15.41357421875, 16.2255859375, 17.03759765625, 17.849609375, 18.66162109375, 19.4736328125, 20.28564453125, 21.09765625, 21.90966796875, 22.7216796875, 23.53369140625, 24.345703125, 25.15771484375, 25.9697265625, 26.78173828125, 27.59375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 7.0, 12.0, 12.0, 15.0, 17.0, 18.0, 30.0, 29.0, 35.0, 41.0, 60.0, 59.0, 54.0, 67.0, 47.0, 51.0, 46.0, 56.0, 42.0, 42.0, 44.0, 33.0, 33.0, 27.0, 28.0, 21.0, 13.0, 17.0, 6.0, 7.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.109375, -16.468994140625, -15.82861328125, -15.188232421875, -14.5478515625, -13.907470703125, -13.26708984375, -12.626708984375, -11.986328125, -11.345947265625, -10.70556640625, -10.065185546875, -9.4248046875, -8.784423828125, -8.14404296875, -7.503662109375, -6.86328125, -6.222900390625, -5.58251953125, -4.942138671875, -4.3017578125, -3.661376953125, -3.02099609375, -2.380615234375, -1.740234375, -1.099853515625, -0.45947265625, 0.180908203125, 0.8212890625, 1.461669921875, 2.10205078125, 2.742431640625, 3.3828125, 4.023193359375, 4.66357421875, 5.303955078125, 5.9443359375, 6.584716796875, 7.22509765625, 7.865478515625, 8.505859375, 9.146240234375, 9.78662109375, 10.427001953125, 11.0673828125, 11.707763671875, 12.34814453125, 12.988525390625, 13.62890625, 14.269287109375, 14.90966796875, 15.550048828125, 16.1904296875, 16.830810546875, 17.47119140625, 18.111572265625, 18.751953125, 19.392333984375, 20.03271484375, 20.673095703125, 21.3134765625, 21.953857421875, 22.59423828125, 23.234619140625, 23.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 16.0, 25.0, 39.0, 51.0, 81.0, 146.0, 308.0, 714.0, 2034.0, 7183.0, 37290.0, 298868.0, 621885.0, 64353.0, 10954.0, 2798.0, 925.0, 408.0, 184.0, 115.0, 59.0, 31.0, 19.0, 15.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0625, -48.4013671875, -46.740234375, -45.0791015625, -43.41796875, -41.7568359375, -40.095703125, -38.4345703125, -36.7734375, -35.1123046875, -33.451171875, -31.7900390625, -30.12890625, -28.4677734375, -26.806640625, -25.1455078125, -23.484375, -21.8232421875, -20.162109375, -18.5009765625, -16.83984375, -15.1787109375, -13.517578125, -11.8564453125, -10.1953125, -8.5341796875, -6.873046875, -5.2119140625, -3.55078125, -1.8896484375, -0.228515625, 1.4326171875, 3.09375, 4.7548828125, 6.416015625, 8.0771484375, 9.73828125, 11.3994140625, 13.060546875, 14.7216796875, 16.3828125, 18.0439453125, 19.705078125, 21.3662109375, 23.02734375, 24.6884765625, 26.349609375, 28.0107421875, 29.671875, 31.3330078125, 32.994140625, 34.6552734375, 36.31640625, 37.9775390625, 39.638671875, 41.2998046875, 42.9609375, 44.6220703125, 46.283203125, 47.9443359375, 49.60546875, 51.2666015625, 52.927734375, 54.5888671875, 56.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 9.0, 15.0, 24.0, 17.0, 18.0, 24.0, 31.0, 26.0, 32.0, 44.0, 47.0, 44.0, 48.0, 50.0, 47.0, 42.0, 36.0, 50.0, 42.0, 50.0, 45.0, 39.0, 35.0, 29.0, 28.0, 19.0, 16.0, 13.0, 12.0, 12.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-73.125, -71.17919921875, -69.2333984375, -67.28759765625, -65.341796875, -63.39599609375, -61.4501953125, -59.50439453125, -57.55859375, -55.61279296875, -53.6669921875, -51.72119140625, -49.775390625, -47.82958984375, -45.8837890625, -43.93798828125, -41.9921875, -40.04638671875, -38.1005859375, -36.15478515625, -34.208984375, -32.26318359375, -30.3173828125, -28.37158203125, -26.42578125, -24.47998046875, -22.5341796875, -20.58837890625, -18.642578125, -16.69677734375, -14.7509765625, -12.80517578125, -10.859375, -8.91357421875, -6.9677734375, -5.02197265625, -3.076171875, -1.13037109375, 0.8154296875, 2.76123046875, 4.70703125, 6.65283203125, 8.5986328125, 10.54443359375, 12.490234375, 14.43603515625, 16.3818359375, 18.32763671875, 20.2734375, 22.21923828125, 24.1650390625, 26.11083984375, 28.056640625, 30.00244140625, 31.9482421875, 33.89404296875, 35.83984375, 37.78564453125, 39.7314453125, 41.67724609375, 43.623046875, 45.56884765625, 47.5146484375, 49.46044921875, 51.40625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 9.0, 11.0, 25.0, 39.0, 58.0, 84.0, 145.0, 283.0, 582.0, 1147.0, 3358.0, 11381.0, 50913.0, 287257.0, 591155.0, 78452.0, 16296.0, 4434.0, 1496.0, 646.0, 283.0, 152.0, 105.0, 61.0, 39.0, 34.0, 26.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.796875, -10.498046875, -10.19921875, -9.900390625, -9.6015625, -9.302734375, -9.00390625, -8.705078125, -8.40625, -8.107421875, -7.80859375, -7.509765625, -7.2109375, -6.912109375, -6.61328125, -6.314453125, -6.015625, -5.716796875, -5.41796875, -5.119140625, -4.8203125, -4.521484375, -4.22265625, -3.923828125, -3.625, -3.326171875, -3.02734375, -2.728515625, -2.4296875, -2.130859375, -1.83203125, -1.533203125, -1.234375, -0.935546875, -0.63671875, -0.337890625, -0.0390625, 0.259765625, 0.55859375, 0.857421875, 1.15625, 1.455078125, 1.75390625, 2.052734375, 2.3515625, 2.650390625, 2.94921875, 3.248046875, 3.546875, 3.845703125, 4.14453125, 4.443359375, 4.7421875, 5.041015625, 5.33984375, 5.638671875, 5.9375, 6.236328125, 6.53515625, 6.833984375, 7.1328125, 7.431640625, 7.73046875, 8.029296875, 8.328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 12.0, 7.0, 10.0, 9.0, 29.0, 35.0, 50.0, 65.0, 80.0, 107.0, 135.0, 115.0, 103.0, 60.0, 47.0, 38.0, 18.0, 22.0, 14.0, 3.0, 9.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023784637451171875, -0.0023027658462524414, -0.0022270679473876953, -0.0021513700485229492, -0.002075672149658203, -0.001999974250793457, -0.001924276351928711, -0.0018485784530639648, -0.0017728805541992188, -0.0016971826553344727, -0.0016214847564697266, -0.0015457868576049805, -0.0014700889587402344, -0.0013943910598754883, -0.0013186931610107422, -0.001242995262145996, -0.00116729736328125, -0.001091599464416504, -0.0010159015655517578, -0.0009402036666870117, -0.0008645057678222656, -0.0007888078689575195, -0.0007131099700927734, -0.0006374120712280273, -0.0005617141723632812, -0.00048601627349853516, -0.00041031837463378906, -0.00033462047576904297, -0.0002589225769042969, -0.00018322467803955078, -0.00010752677917480469, -3.1828880310058594e-05, 4.38690185546875e-05, 0.0001195669174194336, 0.0001952648162841797, 0.0002709627151489258, 0.0003466606140136719, 0.00042235851287841797, 0.0004980564117431641, 0.0005737543106079102, 0.0006494522094726562, 0.0007251501083374023, 0.0008008480072021484, 0.0008765459060668945, 0.0009522438049316406, 0.0010279417037963867, 0.0011036396026611328, 0.001179337501525879, 0.001255035400390625, 0.001330733299255371, 0.0014064311981201172, 0.0014821290969848633, 0.0015578269958496094, 0.0016335248947143555, 0.0017092227935791016, 0.0017849206924438477, 0.0018606185913085938, 0.0019363164901733398, 0.002012014389038086, 0.002087712287902832, 0.002163410186767578, 0.0022391080856323242, 0.0023148059844970703, 0.0023905038833618164, 0.0024662017822265625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 8.0, 6.0, 10.0, 10.0, 11.0, 19.0, 32.0, 39.0, 53.0, 94.0, 160.0, 341.0, 707.0, 1543.0, 4042.0, 13263.0, 61250.0, 481474.0, 405758.0, 59754.0, 12928.0, 4072.0, 1516.0, 671.0, 323.0, 185.0, 103.0, 59.0, 38.0, 26.0, 18.0, 12.0, 11.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.919921875, -7.58984375, -7.259765625, -6.9296875, -6.599609375, -6.26953125, -5.939453125, -5.609375, -5.279296875, -4.94921875, -4.619140625, -4.2890625, -3.958984375, -3.62890625, -3.298828125, -2.96875, -2.638671875, -2.30859375, -1.978515625, -1.6484375, -1.318359375, -0.98828125, -0.658203125, -0.328125, 0.001953125, 0.33203125, 0.662109375, 0.9921875, 1.322265625, 1.65234375, 1.982421875, 2.3125, 2.642578125, 2.97265625, 3.302734375, 3.6328125, 3.962890625, 4.29296875, 4.623046875, 4.953125, 5.283203125, 5.61328125, 5.943359375, 6.2734375, 6.603515625, 6.93359375, 7.263671875, 7.59375, 7.923828125, 8.25390625, 8.583984375, 8.9140625, 9.244140625, 9.57421875, 9.904296875, 10.234375, 10.564453125, 10.89453125, 11.224609375, 11.5546875, 11.884765625, 12.21484375, 12.544921875, 12.875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 11.0, 11.0, 6.0, 17.0, 21.0, 27.0, 27.0, 43.0, 46.0, 52.0, 55.0, 70.0, 69.0, 68.0, 69.0, 61.0, 66.0, 56.0, 38.0, 23.0, 30.0, 16.0, 19.0, 10.0, 14.0, 10.0, 11.0, 4.0, 4.0, 6.0, 8.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.078125, -6.827392578125, -6.57666015625, -6.325927734375, -6.0751953125, -5.824462890625, -5.57373046875, -5.322998046875, -5.072265625, -4.821533203125, -4.57080078125, -4.320068359375, -4.0693359375, -3.818603515625, -3.56787109375, -3.317138671875, -3.06640625, -2.815673828125, -2.56494140625, -2.314208984375, -2.0634765625, -1.812744140625, -1.56201171875, -1.311279296875, -1.060546875, -0.809814453125, -0.55908203125, -0.308349609375, -0.0576171875, 0.193115234375, 0.44384765625, 0.694580078125, 0.9453125, 1.196044921875, 1.44677734375, 1.697509765625, 1.9482421875, 2.198974609375, 2.44970703125, 2.700439453125, 2.951171875, 3.201904296875, 3.45263671875, 3.703369140625, 3.9541015625, 4.204833984375, 4.45556640625, 4.706298828125, 4.95703125, 5.207763671875, 5.45849609375, 5.709228515625, 5.9599609375, 6.210693359375, 6.46142578125, 6.712158203125, 6.962890625, 7.213623046875, 7.46435546875, 7.715087890625, 7.9658203125, 8.216552734375, 8.46728515625, 8.718017578125, 8.96875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 14.0, 17.0, 39.0, 89.0, 168.0, 310.0, 181.0, 98.0, 33.0, 27.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-606.7669677734375, -594.0113525390625, -581.2557373046875, -568.5000610351562, -555.7444458007812, -542.9888305664062, -530.2332153320312, -517.4776000976562, -504.7219543457031, -491.9663391113281, -479.210693359375, -466.455078125, -453.699462890625, -440.9438171386719, -428.1882019042969, -415.43255615234375, -402.67694091796875, -389.92132568359375, -377.1656799316406, -364.4100646972656, -351.6544189453125, -338.8988037109375, -326.1431884765625, -313.3875732421875, -300.6319274902344, -287.8763122558594, -275.12066650390625, -262.36505126953125, -249.6094207763672, -236.85379028320312, -224.09817504882812, -211.34254455566406, -198.58688354492188, -185.8312530517578, -173.07562255859375, -160.32000732421875, -147.5643768310547, -134.80874633789062, -122.0531234741211, -109.29750061035156, -96.5418701171875, -83.78623962402344, -71.0306167602539, -58.27499008178711, -45.51936340332031, -32.763736724853516, -20.00811004638672, -7.2524871826171875, 5.503143310546875, 18.258769989013672, 31.01439666748047, 43.770023345947266, 56.52565002441406, 69.28128051757812, 82.03690338134766, 94.79252624511719, 107.54815673828125, 120.30378723144531, 133.05941772460938, 145.81503295898438, 158.57066345214844, 171.3262939453125, 184.0819091796875, 196.83753967285156, 209.59317016601562]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 9.0, 11.0, 11.0, 11.0, 17.0, 24.0, 17.0, 29.0, 28.0, 35.0, 33.0, 33.0, 46.0, 49.0, 79.0, 86.0, 84.0, 41.0, 44.0, 32.0, 31.0, 33.0, 22.0, 29.0, 33.0, 13.0, 13.0, 17.0, 12.0, 6.0, 11.0, 9.0, 8.0, 9.0, 1.0, 5.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.49673461914062, -212.74285888671875, -204.9889678955078, -197.23509216308594, -189.48121643066406, -181.72732543945312, -173.97344970703125, -166.21957397460938, -158.46568298339844, -150.71180725097656, -142.95791625976562, -135.20404052734375, -127.45015716552734, -119.69627380371094, -111.94239807128906, -104.18851470947266, -96.43463897705078, -88.68075561523438, -80.9268798828125, -73.1729965209961, -65.41911315917969, -57.66523361206055, -49.911354064941406, -42.157470703125, -34.40359115600586, -26.649709701538086, -18.895828247070312, -11.141948699951172, -3.3880672454833984, 4.365814208984375, 12.119693756103516, 19.873577117919922, 27.627456665039062, 35.3813362121582, 43.13521957397461, 50.88909912109375, 58.642982482910156, 66.39686584472656, 74.15074157714844, 81.90462493896484, 89.65850830078125, 97.41239166259766, 105.16626739501953, 112.92015075683594, 120.67403411865234, 128.42791748046875, 136.18179321289062, 143.9356689453125, 151.68954467773438, 159.44342041015625, 167.1973114013672, 174.95118713378906, 182.70506286621094, 190.45895385742188, 198.21282958984375, 205.96670532226562, 213.72059631347656, 221.47447204589844, 229.22836303710938, 236.98223876953125, 244.73611450195312, 252.49000549316406, 260.243896484375, 267.9977722167969, 275.75164794921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 14.0, 14.0, 25.0, 33.0, 44.0, 88.0, 137.0, 222.0, 362.0, 639.0, 1305.0, 2677.0, 5859.0, 14531.0, 45595.0, 197626.0, 991298.0, 2075615.0, 668873.0, 136142.0, 33735.0, 10826.0, 4293.0, 1928.0, 978.0, 579.0, 303.0, 172.0, 109.0, 76.0, 42.0, 33.0, 22.0, 13.0, 13.0, 14.0, 8.0, 1.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.640625, -15.14208984375, -14.6435546875, -14.14501953125, -13.646484375, -13.14794921875, -12.6494140625, -12.15087890625, -11.65234375, -11.15380859375, -10.6552734375, -10.15673828125, -9.658203125, -9.15966796875, -8.6611328125, -8.16259765625, -7.6640625, -7.16552734375, -6.6669921875, -6.16845703125, -5.669921875, -5.17138671875, -4.6728515625, -4.17431640625, -3.67578125, -3.17724609375, -2.6787109375, -2.18017578125, -1.681640625, -1.18310546875, -0.6845703125, -0.18603515625, 0.3125, 0.81103515625, 1.3095703125, 1.80810546875, 2.306640625, 2.80517578125, 3.3037109375, 3.80224609375, 4.30078125, 4.79931640625, 5.2978515625, 5.79638671875, 6.294921875, 6.79345703125, 7.2919921875, 7.79052734375, 8.2890625, 8.78759765625, 9.2861328125, 9.78466796875, 10.283203125, 10.78173828125, 11.2802734375, 11.77880859375, 12.27734375, 12.77587890625, 13.2744140625, 13.77294921875, 14.271484375, 14.77001953125, 15.2685546875, 15.76708984375, 16.265625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 1.0, 6.0, 2.0, 7.0, 6.0, 11.0, 13.0, 18.0, 16.0, 25.0, 32.0, 30.0, 21.0, 37.0, 43.0, 51.0, 55.0, 56.0, 50.0, 54.0, 46.0, 43.0, 67.0, 35.0, 43.0, 41.0, 41.0, 34.0, 23.0, 20.0, 20.0, 14.0, 11.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.890625, -15.289306640625, -14.68798828125, -14.086669921875, -13.4853515625, -12.884033203125, -12.28271484375, -11.681396484375, -11.080078125, -10.478759765625, -9.87744140625, -9.276123046875, -8.6748046875, -8.073486328125, -7.47216796875, -6.870849609375, -6.26953125, -5.668212890625, -5.06689453125, -4.465576171875, -3.8642578125, -3.262939453125, -2.66162109375, -2.060302734375, -1.458984375, -0.857666015625, -0.25634765625, 0.344970703125, 0.9462890625, 1.547607421875, 2.14892578125, 2.750244140625, 3.3515625, 3.952880859375, 4.55419921875, 5.155517578125, 5.7568359375, 6.358154296875, 6.95947265625, 7.560791015625, 8.162109375, 8.763427734375, 9.36474609375, 9.966064453125, 10.5673828125, 11.168701171875, 11.77001953125, 12.371337890625, 12.97265625, 13.573974609375, 14.17529296875, 14.776611328125, 15.3779296875, 15.979248046875, 16.58056640625, 17.181884765625, 17.783203125, 18.384521484375, 18.98583984375, 19.587158203125, 20.1884765625, 20.789794921875, 21.39111328125, 21.992431640625, 22.59375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 19.0, 19.0, 38.0, 61.0, 101.0, 137.0, 398.0, 1271.0, 6478.0, 54622.0, 2897339.0, 1196139.0, 31236.0, 4521.0, 1044.0, 373.0, 178.0, 105.0, 71.0, 36.0, 20.0, 18.0, 10.0, 11.0, 4.0, 5.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.78125, -52.36181640625, -50.9423828125, -49.52294921875, -48.103515625, -46.68408203125, -45.2646484375, -43.84521484375, -42.42578125, -41.00634765625, -39.5869140625, -38.16748046875, -36.748046875, -35.32861328125, -33.9091796875, -32.48974609375, -31.0703125, -29.65087890625, -28.2314453125, -26.81201171875, -25.392578125, -23.97314453125, -22.5537109375, -21.13427734375, -19.71484375, -18.29541015625, -16.8759765625, -15.45654296875, -14.037109375, -12.61767578125, -11.1982421875, -9.77880859375, -8.359375, -6.93994140625, -5.5205078125, -4.10107421875, -2.681640625, -1.26220703125, 0.1572265625, 1.57666015625, 2.99609375, 4.41552734375, 5.8349609375, 7.25439453125, 8.673828125, 10.09326171875, 11.5126953125, 12.93212890625, 14.3515625, 15.77099609375, 17.1904296875, 18.60986328125, 20.029296875, 21.44873046875, 22.8681640625, 24.28759765625, 25.70703125, 27.12646484375, 28.5458984375, 29.96533203125, 31.384765625, 32.80419921875, 34.2236328125, 35.64306640625, 37.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 14.0, 10.0, 20.0, 34.0, 51.0, 70.0, 184.0, 267.0, 462.0, 757.0, 749.0, 600.0, 363.0, 184.0, 117.0, 44.0, 44.0, 26.0, 20.0, 8.0, 9.0, 6.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.305908203125, -18.18994140625, -17.073974609375, -15.9580078125, -14.842041015625, -13.72607421875, -12.610107421875, -11.494140625, -10.378173828125, -9.26220703125, -8.146240234375, -7.0302734375, -5.914306640625, -4.79833984375, -3.682373046875, -2.56640625, -1.450439453125, -0.33447265625, 0.781494140625, 1.8974609375, 3.013427734375, 4.12939453125, 5.245361328125, 6.361328125, 7.477294921875, 8.59326171875, 9.709228515625, 10.8251953125, 11.941162109375, 13.05712890625, 14.173095703125, 15.2890625, 16.405029296875, 17.52099609375, 18.636962890625, 19.7529296875, 20.868896484375, 21.98486328125, 23.100830078125, 24.216796875, 25.332763671875, 26.44873046875, 27.564697265625, 28.6806640625, 29.796630859375, 30.91259765625, 32.028564453125, 33.14453125, 34.260498046875, 35.37646484375, 36.492431640625, 37.6083984375, 38.724365234375, 39.84033203125, 40.956298828125, 42.072265625, 43.188232421875, 44.30419921875, 45.420166015625, 46.5361328125, 47.652099609375, 48.76806640625, 49.884033203125, 51.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 40.0, 89.0, 195.0, 266.0, 189.0, 112.0, 58.0, 20.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.63174438476562, -215.13035583496094, -203.62896728515625, -192.12759399414062, -180.62620544433594, -169.12481689453125, -157.62344360351562, -146.12205505371094, -134.62066650390625, -123.11927795410156, -111.6178970336914, -100.11651611328125, -88.61512756347656, -77.11373901367188, -65.61235809326172, -54.11097717285156, -42.609588623046875, -31.108203887939453, -19.60681915283203, -8.10543441772461, 3.3959503173828125, 14.897335052490234, 26.398719787597656, 37.90010070800781, 49.4014892578125, 60.90287399291992, 72.40425872802734, 83.9056396484375, 95.40702819824219, 106.90841674804688, 118.40979766845703, 129.9111785888672, 141.41253662109375, 152.91392517089844, 164.41531372070312, 175.91668701171875, 187.41807556152344, 198.91946411132812, 210.42083740234375, 221.92222595214844, 233.42361450195312, 244.9250030517578, 256.4263916015625, 267.9277648925781, 279.42913818359375, 290.9305419921875, 302.4319152832031, 313.93328857421875, 325.4346923828125, 336.9360656738281, 348.4374694824219, 359.9388427734375, 371.44024658203125, 382.9416198730469, 394.4429931640625, 405.94439697265625, 417.4457702636719, 428.9471435546875, 440.44854736328125, 451.9499206542969, 463.4512939453125, 474.95269775390625, 486.4540710449219, 497.9554443359375, 509.45684814453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 15.0, 14.0, 16.0, 16.0, 24.0, 21.0, 35.0, 36.0, 31.0, 58.0, 43.0, 69.0, 55.0, 61.0, 73.0, 61.0, 56.0, 44.0, 37.0, 42.0, 42.0, 24.0, 24.0, 22.0, 15.0, 11.0, 7.0, 7.0, 5.0, 4.0, 10.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.08407592773438, -167.24609375, -162.4081268310547, -157.57015991210938, -152.732177734375, -147.89419555664062, -143.0562286376953, -138.21826171875, -133.38027954101562, -128.54229736328125, -123.70433044433594, -118.8663558959961, -114.02838134765625, -109.1904067993164, -104.35243225097656, -99.51445770263672, -94.67648315429688, -89.83850860595703, -85.00053405761719, -80.16255950927734, -75.3245849609375, -70.48661041259766, -65.64863586425781, -60.81066131591797, -55.972686767578125, -51.13471221923828, -46.29673767089844, -41.458763122558594, -36.62078857421875, -31.782814025878906, -26.944839477539062, -22.10686492919922, -17.268905639648438, -12.430931091308594, -7.59295654296875, -2.7549819946289062, 2.0829925537109375, 6.920967102050781, 11.758941650390625, 16.59691619873047, 21.434890747070312, 26.272865295410156, 31.11083984375, 35.948814392089844, 40.78678894042969, 45.62476348876953, 50.462738037109375, 55.30071258544922, 60.13868713378906, 64.9766616821289, 69.81463623046875, 74.6526107788086, 79.49058532714844, 84.32855987548828, 89.16653442382812, 94.00450897216797, 98.84248352050781, 103.68045806884766, 108.5184326171875, 113.35640716552734, 118.19438171386719, 123.03235626220703, 127.87033081054688, 132.70831298828125, 137.54627990722656]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 17.0, 15.0, 20.0, 30.0, 43.0, 73.0, 121.0, 197.0, 361.0, 598.0, 1092.0, 2155.0, 4328.0, 9998.0, 23598.0, 60687.0, 164255.0, 345789.0, 265438.0, 102615.0, 38464.0, 15242.0, 6796.0, 3018.0, 1555.0, 811.0, 490.0, 266.0, 164.0, 115.0, 68.0, 49.0, 24.0, 23.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375, -18.701416015625, -18.02783203125, -17.354248046875, -16.6806640625, -16.007080078125, -15.33349609375, -14.659912109375, -13.986328125, -13.312744140625, -12.63916015625, -11.965576171875, -11.2919921875, -10.618408203125, -9.94482421875, -9.271240234375, -8.59765625, -7.924072265625, -7.25048828125, -6.576904296875, -5.9033203125, -5.229736328125, -4.55615234375, -3.882568359375, -3.208984375, -2.535400390625, -1.86181640625, -1.188232421875, -0.5146484375, 0.158935546875, 0.83251953125, 1.506103515625, 2.1796875, 2.853271484375, 3.52685546875, 4.200439453125, 4.8740234375, 5.547607421875, 6.22119140625, 6.894775390625, 7.568359375, 8.241943359375, 8.91552734375, 9.589111328125, 10.2626953125, 10.936279296875, 11.60986328125, 12.283447265625, 12.95703125, 13.630615234375, 14.30419921875, 14.977783203125, 15.6513671875, 16.324951171875, 16.99853515625, 17.672119140625, 18.345703125, 19.019287109375, 19.69287109375, 20.366455078125, 21.0400390625, 21.713623046875, 22.38720703125, 23.060791015625, 23.734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 4.0, 14.0, 8.0, 10.0, 24.0, 20.0, 30.0, 26.0, 32.0, 29.0, 37.0, 52.0, 60.0, 45.0, 55.0, 58.0, 43.0, 57.0, 57.0, 50.0, 41.0, 36.0, 40.0, 31.0, 20.0, 24.0, 24.0, 20.0, 11.0, 7.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.42822265625, -14.8251953125, -14.22216796875, -13.619140625, -13.01611328125, -12.4130859375, -11.81005859375, -11.20703125, -10.60400390625, -10.0009765625, -9.39794921875, -8.794921875, -8.19189453125, -7.5888671875, -6.98583984375, -6.3828125, -5.77978515625, -5.1767578125, -4.57373046875, -3.970703125, -3.36767578125, -2.7646484375, -2.16162109375, -1.55859375, -0.95556640625, -0.3525390625, 0.25048828125, 0.853515625, 1.45654296875, 2.0595703125, 2.66259765625, 3.265625, 3.86865234375, 4.4716796875, 5.07470703125, 5.677734375, 6.28076171875, 6.8837890625, 7.48681640625, 8.08984375, 8.69287109375, 9.2958984375, 9.89892578125, 10.501953125, 11.10498046875, 11.7080078125, 12.31103515625, 12.9140625, 13.51708984375, 14.1201171875, 14.72314453125, 15.326171875, 15.92919921875, 16.5322265625, 17.13525390625, 17.73828125, 18.34130859375, 18.9443359375, 19.54736328125, 20.150390625, 20.75341796875, 21.3564453125, 21.95947265625, 22.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 17.0, 12.0, 14.0, 17.0, 31.0, 39.0, 40.0, 73.0, 81.0, 135.0, 175.0, 251.0, 363.0, 544.0, 949.0, 1759.0, 4064.0, 11319.0, 40445.0, 178185.0, 626778.0, 135235.0, 31314.0, 9227.0, 3369.0, 1569.0, 804.0, 561.0, 339.0, 226.0, 145.0, 122.0, 83.0, 61.0, 52.0, 35.0, 26.0, 24.0, 14.0, 11.0, 11.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.921875, -30.905517578125, -29.88916015625, -28.872802734375, -27.8564453125, -26.840087890625, -25.82373046875, -24.807373046875, -23.791015625, -22.774658203125, -21.75830078125, -20.741943359375, -19.7255859375, -18.709228515625, -17.69287109375, -16.676513671875, -15.66015625, -14.643798828125, -13.62744140625, -12.611083984375, -11.5947265625, -10.578369140625, -9.56201171875, -8.545654296875, -7.529296875, -6.512939453125, -5.49658203125, -4.480224609375, -3.4638671875, -2.447509765625, -1.43115234375, -0.414794921875, 0.6015625, 1.617919921875, 2.63427734375, 3.650634765625, 4.6669921875, 5.683349609375, 6.69970703125, 7.716064453125, 8.732421875, 9.748779296875, 10.76513671875, 11.781494140625, 12.7978515625, 13.814208984375, 14.83056640625, 15.846923828125, 16.86328125, 17.879638671875, 18.89599609375, 19.912353515625, 20.9287109375, 21.945068359375, 22.96142578125, 23.977783203125, 24.994140625, 26.010498046875, 27.02685546875, 28.043212890625, 29.0595703125, 30.075927734375, 31.09228515625, 32.108642578125, 33.125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 7.0, 16.0, 16.0, 14.0, 15.0, 30.0, 29.0, 37.0, 31.0, 30.0, 41.0, 36.0, 49.0, 50.0, 64.0, 49.0, 60.0, 33.0, 45.0, 32.0, 41.0, 29.0, 31.0, 31.0, 23.0, 30.0, 24.0, 19.0, 14.0, 13.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -48.87646484375, -47.0966796875, -45.31689453125, -43.537109375, -41.75732421875, -39.9775390625, -38.19775390625, -36.41796875, -34.63818359375, -32.8583984375, -31.07861328125, -29.298828125, -27.51904296875, -25.7392578125, -23.95947265625, -22.1796875, -20.39990234375, -18.6201171875, -16.84033203125, -15.060546875, -13.28076171875, -11.5009765625, -9.72119140625, -7.94140625, -6.16162109375, -4.3818359375, -2.60205078125, -0.822265625, 0.95751953125, 2.7373046875, 4.51708984375, 6.296875, 8.07666015625, 9.8564453125, 11.63623046875, 13.416015625, 15.19580078125, 16.9755859375, 18.75537109375, 20.53515625, 22.31494140625, 24.0947265625, 25.87451171875, 27.654296875, 29.43408203125, 31.2138671875, 32.99365234375, 34.7734375, 36.55322265625, 38.3330078125, 40.11279296875, 41.892578125, 43.67236328125, 45.4521484375, 47.23193359375, 49.01171875, 50.79150390625, 52.5712890625, 54.35107421875, 56.130859375, 57.91064453125, 59.6904296875, 61.47021484375, 63.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 13.0, 15.0, 10.0, 26.0, 43.0, 55.0, 98.0, 193.0, 295.0, 580.0, 1318.0, 3135.0, 8912.0, 29052.0, 142221.0, 719361.0, 106591.0, 24078.0, 7479.0, 2745.0, 1127.0, 526.0, 260.0, 152.0, 91.0, 46.0, 47.0, 29.0, 15.0, 7.0, 13.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.59765625, -6.34796142578125, -6.0982666015625, -5.84857177734375, -5.598876953125, -5.34918212890625, -5.0994873046875, -4.84979248046875, -4.60009765625, -4.35040283203125, -4.1007080078125, -3.85101318359375, -3.601318359375, -3.35162353515625, -3.1019287109375, -2.85223388671875, -2.6025390625, -2.35284423828125, -2.1031494140625, -1.85345458984375, -1.603759765625, -1.35406494140625, -1.1043701171875, -0.85467529296875, -0.60498046875, -0.35528564453125, -0.1055908203125, 0.14410400390625, 0.393798828125, 0.64349365234375, 0.8931884765625, 1.14288330078125, 1.392578125, 1.64227294921875, 1.8919677734375, 2.14166259765625, 2.391357421875, 2.64105224609375, 2.8907470703125, 3.14044189453125, 3.39013671875, 3.63983154296875, 3.8895263671875, 4.13922119140625, 4.388916015625, 4.63861083984375, 4.8883056640625, 5.13800048828125, 5.3876953125, 5.63739013671875, 5.8870849609375, 6.13677978515625, 6.386474609375, 6.63616943359375, 6.8858642578125, 7.13555908203125, 7.38525390625, 7.63494873046875, 7.8846435546875, 8.13433837890625, 8.384033203125, 8.63372802734375, 8.8834228515625, 9.13311767578125, 9.3828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 1.0, 4.0, 6.0, 7.0, 9.0, 16.0, 16.0, 29.0, 49.0, 86.0, 129.0, 181.0, 170.0, 111.0, 54.0, 37.0, 24.0, 17.0, 16.0, 16.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029430389404296875, -0.0028631985187530518, -0.002783358097076416, -0.0027035176753997803, -0.0026236772537231445, -0.002543836832046509, -0.002463996410369873, -0.0023841559886932373, -0.0023043155670166016, -0.002224475145339966, -0.00214463472366333, -0.0020647943019866943, -0.0019849538803100586, -0.0019051134586334229, -0.0018252730369567871, -0.0017454326152801514, -0.0016655921936035156, -0.0015857517719268799, -0.0015059113502502441, -0.0014260709285736084, -0.0013462305068969727, -0.001266390085220337, -0.0011865496635437012, -0.0011067092418670654, -0.0010268688201904297, -0.0009470283985137939, -0.0008671879768371582, -0.0007873475551605225, -0.0007075071334838867, -0.000627666711807251, -0.0005478262901306152, -0.0004679858684539795, -0.00038814544677734375, -0.000308305025100708, -0.00022846460342407227, -0.00014862418174743652, -6.878376007080078e-05, 1.1056661605834961e-05, 9.08970832824707e-05, 0.00017073750495910645, 0.0002505779266357422, 0.00033041834831237793, 0.00041025876998901367, 0.0004900991916656494, 0.0005699396133422852, 0.0006497800350189209, 0.0007296204566955566, 0.0008094608783721924, 0.0008893013000488281, 0.0009691417217254639, 0.0010489821434020996, 0.0011288225650787354, 0.001208662986755371, 0.0012885034084320068, 0.0013683438301086426, 0.0014481842517852783, 0.001528024673461914, 0.0016078650951385498, 0.0016877055168151855, 0.0017675459384918213, 0.001847386360168457, 0.0019272267818450928, 0.0020070672035217285, 0.0020869076251983643, 0.002166748046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 13.0, 11.0, 14.0, 25.0, 36.0, 42.0, 51.0, 95.0, 179.0, 229.0, 393.0, 781.0, 1599.0, 3568.0, 10009.0, 34870.0, 170444.0, 687990.0, 101815.0, 23666.0, 7097.0, 2740.0, 1292.0, 630.0, 367.0, 203.0, 117.0, 83.0, 63.0, 31.0, 30.0, 23.0, 11.0, 12.0, 11.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9571533203125, -7.703369140625, -7.4495849609375, -7.19580078125, -6.9420166015625, -6.688232421875, -6.4344482421875, -6.1806640625, -5.9268798828125, -5.673095703125, -5.4193115234375, -5.16552734375, -4.9117431640625, -4.657958984375, -4.4041748046875, -4.150390625, -3.8966064453125, -3.642822265625, -3.3890380859375, -3.13525390625, -2.8814697265625, -2.627685546875, -2.3739013671875, -2.1201171875, -1.8663330078125, -1.612548828125, -1.3587646484375, -1.10498046875, -0.8511962890625, -0.597412109375, -0.3436279296875, -0.08984375, 0.1639404296875, 0.417724609375, 0.6715087890625, 0.92529296875, 1.1790771484375, 1.432861328125, 1.6866455078125, 1.9404296875, 2.1942138671875, 2.447998046875, 2.7017822265625, 2.95556640625, 3.2093505859375, 3.463134765625, 3.7169189453125, 3.970703125, 4.2244873046875, 4.478271484375, 4.7320556640625, 4.98583984375, 5.2396240234375, 5.493408203125, 5.7471923828125, 6.0009765625, 6.2547607421875, 6.508544921875, 6.7623291015625, 7.01611328125, 7.2698974609375, 7.523681640625, 7.7774658203125, 8.03125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 10.0, 8.0, 17.0, 18.0, 23.0, 38.0, 33.0, 43.0, 70.0, 76.0, 88.0, 89.0, 89.0, 77.0, 67.0, 39.0, 46.0, 38.0, 25.0, 21.0, 13.0, 11.0, 9.0, 10.0, 1.0, 4.0, 1.0, 6.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.569580078125, -7.29541015625, -7.021240234375, -6.7470703125, -6.472900390625, -6.19873046875, -5.924560546875, -5.650390625, -5.376220703125, -5.10205078125, -4.827880859375, -4.5537109375, -4.279541015625, -4.00537109375, -3.731201171875, -3.45703125, -3.182861328125, -2.90869140625, -2.634521484375, -2.3603515625, -2.086181640625, -1.81201171875, -1.537841796875, -1.263671875, -0.989501953125, -0.71533203125, -0.441162109375, -0.1669921875, 0.107177734375, 0.38134765625, 0.655517578125, 0.9296875, 1.203857421875, 1.47802734375, 1.752197265625, 2.0263671875, 2.300537109375, 2.57470703125, 2.848876953125, 3.123046875, 3.397216796875, 3.67138671875, 3.945556640625, 4.2197265625, 4.493896484375, 4.76806640625, 5.042236328125, 5.31640625, 5.590576171875, 5.86474609375, 6.138916015625, 6.4130859375, 6.687255859375, 6.96142578125, 7.235595703125, 7.509765625, 7.783935546875, 8.05810546875, 8.332275390625, 8.6064453125, 8.880615234375, 9.15478515625, 9.428955078125, 9.703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 12.0, 28.0, 42.0, 98.0, 198.0, 342.0, 133.0, 72.0, 31.0, 16.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-318.91046142578125, -308.029052734375, -297.1476745605469, -286.2662658691406, -275.3848876953125, -264.50347900390625, -253.6220703125, -242.7406768798828, -231.85928344726562, -220.97789001464844, -210.09649658203125, -199.215087890625, -188.3336944580078, -177.45230102539062, -166.57089233398438, -155.6894989013672, -144.80810546875, -133.9267120361328, -123.0453109741211, -112.16390991210938, -101.28251647949219, -90.401123046875, -79.51972198486328, -68.63832092285156, -57.756927490234375, -46.87553024291992, -35.99413299560547, -25.112735748291016, -14.231338500976562, -3.3499412536621094, 7.531455993652344, 18.412857055664062, 29.294281005859375, 40.17567825317383, 51.05707550048828, 61.938472747802734, 72.81986999511719, 83.70126342773438, 94.5826644897461, 105.46406555175781, 116.345458984375, 127.22685241699219, 138.10824584960938, 148.98965454101562, 159.8710479736328, 170.75244140625, 181.63385009765625, 192.51524353027344, 203.39663696289062, 214.2780303955078, 225.159423828125, 236.04083251953125, 246.92222595214844, 257.8036193847656, 268.6850280761719, 279.56640625, 290.44781494140625, 301.3292236328125, 312.2106018066406, 323.0920104980469, 333.973388671875, 344.85479736328125, 355.7362060546875, 366.61761474609375, 377.4989929199219]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 12.0, 9.0, 5.0, 14.0, 17.0, 20.0, 15.0, 13.0, 26.0, 26.0, 26.0, 26.0, 37.0, 46.0, 70.0, 79.0, 93.0, 85.0, 53.0, 32.0, 40.0, 38.0, 27.0, 26.0, 20.0, 16.0, 14.0, 15.0, 14.0, 17.0, 7.0, 11.0, 10.0, 2.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-212.47348022460938, -205.71902465820312, -198.96456909179688, -192.2101287841797, -185.45567321777344, -178.7012176513672, -171.94677734375, -165.19232177734375, -158.4378662109375, -151.68341064453125, -144.928955078125, -138.1745147705078, -131.42005920410156, -124.66560363769531, -117.9111557006836, -111.15670776367188, -104.40225219726562, -97.64779663085938, -90.89334869384766, -84.13890075683594, -77.38444519042969, -70.62998962402344, -63.87554168701172, -57.121089935302734, -50.36663818359375, -43.612186431884766, -36.85773468017578, -30.103282928466797, -23.348831176757812, -16.594379425048828, -9.839927673339844, -3.0854759216308594, 3.668975830078125, 10.42342758178711, 17.177879333496094, 23.932331085205078, 30.686782836914062, 37.44123458862305, 44.19568634033203, 50.950138092041016, 57.70458984375, 64.45904541015625, 71.21349334716797, 77.96794128417969, 84.72239685058594, 91.47685241699219, 98.2313003540039, 104.98574829101562, 111.74020385742188, 118.49465942382812, 125.24910736083984, 132.00355529785156, 138.7580108642578, 145.51246643066406, 152.26690673828125, 159.0213623046875, 165.77581787109375, 172.5302734375, 179.28472900390625, 186.03916931152344, 192.7936248779297, 199.54808044433594, 206.30252075195312, 213.05697631835938, 219.81143188476562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 13.0, 17.0, 20.0, 30.0, 75.0, 125.0, 294.0, 709.0, 2756.0, 15258.0, 167309.0, 2613241.0, 1317059.0, 67194.0, 7507.0, 1602.0, 549.0, 241.0, 106.0, 61.0, 38.0, 30.0, 18.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -20.989013671875, -19.93115234375, -18.873291015625, -17.8154296875, -16.757568359375, -15.69970703125, -14.641845703125, -13.583984375, -12.526123046875, -11.46826171875, -10.410400390625, -9.3525390625, -8.294677734375, -7.23681640625, -6.178955078125, -5.12109375, -4.063232421875, -3.00537109375, -1.947509765625, -0.8896484375, 0.168212890625, 1.22607421875, 2.283935546875, 3.341796875, 4.399658203125, 5.45751953125, 6.515380859375, 7.5732421875, 8.631103515625, 9.68896484375, 10.746826171875, 11.8046875, 12.862548828125, 13.92041015625, 14.978271484375, 16.0361328125, 17.093994140625, 18.15185546875, 19.209716796875, 20.267578125, 21.325439453125, 22.38330078125, 23.441162109375, 24.4990234375, 25.556884765625, 26.61474609375, 27.672607421875, 28.73046875, 29.788330078125, 30.84619140625, 31.904052734375, 32.9619140625, 34.019775390625, 35.07763671875, 36.135498046875, 37.193359375, 38.251220703125, 39.30908203125, 40.366943359375, 41.4248046875, 42.482666015625, 43.54052734375, 44.598388671875, 45.65625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 4.0, 8.0, 10.0, 12.0, 9.0, 25.0, 21.0, 24.0, 32.0, 37.0, 47.0, 42.0, 44.0, 54.0, 48.0, 53.0, 55.0, 60.0, 56.0, 56.0, 51.0, 39.0, 36.0, 37.0, 33.0, 18.0, 20.0, 15.0, 13.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -15.98681640625, -15.3798828125, -14.77294921875, -14.166015625, -13.55908203125, -12.9521484375, -12.34521484375, -11.73828125, -11.13134765625, -10.5244140625, -9.91748046875, -9.310546875, -8.70361328125, -8.0966796875, -7.48974609375, -6.8828125, -6.27587890625, -5.6689453125, -5.06201171875, -4.455078125, -3.84814453125, -3.2412109375, -2.63427734375, -2.02734375, -1.42041015625, -0.8134765625, -0.20654296875, 0.400390625, 1.00732421875, 1.6142578125, 2.22119140625, 2.828125, 3.43505859375, 4.0419921875, 4.64892578125, 5.255859375, 5.86279296875, 6.4697265625, 7.07666015625, 7.68359375, 8.29052734375, 8.8974609375, 9.50439453125, 10.111328125, 10.71826171875, 11.3251953125, 11.93212890625, 12.5390625, 13.14599609375, 13.7529296875, 14.35986328125, 14.966796875, 15.57373046875, 16.1806640625, 16.78759765625, 17.39453125, 18.00146484375, 18.6083984375, 19.21533203125, 19.822265625, 20.42919921875, 21.0361328125, 21.64306640625, 22.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 6.0, 9.0, 20.0, 14.0, 19.0, 30.0, 39.0, 55.0, 114.0, 194.0, 385.0, 980.0, 3459.0, 16478.0, 228685.0, 3649084.0, 271282.0, 17771.0, 3626.0, 1134.0, 386.0, 183.0, 107.0, 72.0, 31.0, 26.0, 18.0, 16.0, 12.0, 10.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-39.71875, -38.49755859375, -37.2763671875, -36.05517578125, -34.833984375, -33.61279296875, -32.3916015625, -31.17041015625, -29.94921875, -28.72802734375, -27.5068359375, -26.28564453125, -25.064453125, -23.84326171875, -22.6220703125, -21.40087890625, -20.1796875, -18.95849609375, -17.7373046875, -16.51611328125, -15.294921875, -14.07373046875, -12.8525390625, -11.63134765625, -10.41015625, -9.18896484375, -7.9677734375, -6.74658203125, -5.525390625, -4.30419921875, -3.0830078125, -1.86181640625, -0.640625, 0.58056640625, 1.8017578125, 3.02294921875, 4.244140625, 5.46533203125, 6.6865234375, 7.90771484375, 9.12890625, 10.35009765625, 11.5712890625, 12.79248046875, 14.013671875, 15.23486328125, 16.4560546875, 17.67724609375, 18.8984375, 20.11962890625, 21.3408203125, 22.56201171875, 23.783203125, 25.00439453125, 26.2255859375, 27.44677734375, 28.66796875, 29.88916015625, 31.1103515625, 32.33154296875, 33.552734375, 34.77392578125, 35.9951171875, 37.21630859375, 38.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 9.0, 12.0, 12.0, 19.0, 39.0, 43.0, 76.0, 134.0, 195.0, 272.0, 446.0, 599.0, 652.0, 542.0, 342.0, 238.0, 146.0, 80.0, 70.0, 54.0, 19.0, 15.0, 16.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.015625, -29.030029296875, -28.04443359375, -27.058837890625, -26.0732421875, -25.087646484375, -24.10205078125, -23.116455078125, -22.130859375, -21.145263671875, -20.15966796875, -19.174072265625, -18.1884765625, -17.202880859375, -16.21728515625, -15.231689453125, -14.24609375, -13.260498046875, -12.27490234375, -11.289306640625, -10.3037109375, -9.318115234375, -8.33251953125, -7.346923828125, -6.361328125, -5.375732421875, -4.39013671875, -3.404541015625, -2.4189453125, -1.433349609375, -0.44775390625, 0.537841796875, 1.5234375, 2.509033203125, 3.49462890625, 4.480224609375, 5.4658203125, 6.451416015625, 7.43701171875, 8.422607421875, 9.408203125, 10.393798828125, 11.37939453125, 12.364990234375, 13.3505859375, 14.336181640625, 15.32177734375, 16.307373046875, 17.29296875, 18.278564453125, 19.26416015625, 20.249755859375, 21.2353515625, 22.220947265625, 23.20654296875, 24.192138671875, 25.177734375, 26.163330078125, 27.14892578125, 28.134521484375, 29.1201171875, 30.105712890625, 31.09130859375, 32.076904296875, 33.0625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 11.0, 20.0, 41.0, 117.0, 264.0, 309.0, 165.0, 48.0, 14.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-675.2928466796875, -660.3777465820312, -645.4627075195312, -630.547607421875, -615.632568359375, -600.7174682617188, -585.8024291992188, -570.8873291015625, -555.9722900390625, -541.0571899414062, -526.1421508789062, -511.2270812988281, -496.31201171875, -481.3969421386719, -466.48187255859375, -451.5667724609375, -436.6517028808594, -421.73663330078125, -406.8215637207031, -391.906494140625, -376.9914245605469, -362.07635498046875, -347.1612548828125, -332.2462158203125, -317.33111572265625, -302.4160461425781, -287.5009765625, -272.5859069824219, -257.67083740234375, -242.75576782226562, -227.84068298339844, -212.9256134033203, -198.01052856445312, -183.095458984375, -168.18038940429688, -153.26531982421875, -138.35025024414062, -123.43517303466797, -108.52009582519531, -93.60502624511719, -78.68995666503906, -63.77488708496094, -48.85981369018555, -33.944740295410156, -19.02967071533203, -4.114601135253906, 10.80047607421875, 25.715545654296875, 40.630615234375, 55.545684814453125, 70.46075439453125, 85.3758316040039, 100.29090118408203, 115.20597076416016, 130.1210479736328, 145.03611755371094, 159.95118713378906, 174.8662567138672, 189.7813262939453, 204.6964111328125, 219.61148071289062, 234.52655029296875, 249.44161987304688, 264.356689453125, 279.2717590332031]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 15.0, 16.0, 10.0, 12.0, 18.0, 15.0, 16.0, 24.0, 24.0, 28.0, 18.0, 34.0, 47.0, 33.0, 39.0, 41.0, 36.0, 30.0, 40.0, 36.0, 35.0, 43.0, 27.0, 36.0, 33.0, 26.0, 28.0, 31.0, 29.0, 25.0, 20.0, 22.0, 21.0, 11.0, 12.0, 8.0, 9.0, 6.0, 11.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-129.9894561767578, -126.17731475830078, -122.36516571044922, -118.55302429199219, -114.74087524414062, -110.9287338256836, -107.11659240722656, -103.304443359375, -99.49230194091797, -95.68016052246094, -91.86801147460938, -88.05587005615234, -84.24372863769531, -80.43157958984375, -76.61943817138672, -72.80729675292969, -68.99514770507812, -65.1830062866211, -61.37085723876953, -57.5587158203125, -53.7465705871582, -49.934425354003906, -46.122283935546875, -42.31013870239258, -38.49799346923828, -34.685848236083984, -30.87370491027832, -27.061561584472656, -23.24941635131836, -19.437271118164062, -15.625127792358398, -11.812984466552734, -8.000839233398438, -4.188694953918457, -0.37655067443847656, 3.435593605041504, 7.247737884521484, 11.059883117675781, 14.872026443481445, 18.68416976928711, 22.496315002441406, 26.308460235595703, 30.120603561401367, 33.93274688720703, 37.74489212036133, 41.557037353515625, 45.369178771972656, 49.18132400512695, 52.99346923828125, 56.80561447143555, 60.617759704589844, 64.42990112304688, 68.24205017089844, 72.05419158935547, 75.8663330078125, 79.67848205566406, 83.4906234741211, 87.30276489257812, 91.11491394042969, 94.92705535888672, 98.73919677734375, 102.55134582519531, 106.36348724365234, 110.17562866210938, 113.98777770996094]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 3.0, 16.0, 16.0, 35.0, 62.0, 88.0, 122.0, 221.0, 287.0, 476.0, 856.0, 1562.0, 3030.0, 6335.0, 13825.0, 34181.0, 92223.0, 254336.0, 375443.0, 163774.0, 59249.0, 22749.0, 9858.0, 4482.0, 2278.0, 1231.0, 657.0, 429.0, 255.0, 156.0, 90.0, 68.0, 37.0, 44.0, 27.0, 16.0, 10.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.546875, -23.809326171875, -23.07177734375, -22.334228515625, -21.5966796875, -20.859130859375, -20.12158203125, -19.384033203125, -18.646484375, -17.908935546875, -17.17138671875, -16.433837890625, -15.6962890625, -14.958740234375, -14.22119140625, -13.483642578125, -12.74609375, -12.008544921875, -11.27099609375, -10.533447265625, -9.7958984375, -9.058349609375, -8.32080078125, -7.583251953125, -6.845703125, -6.108154296875, -5.37060546875, -4.633056640625, -3.8955078125, -3.157958984375, -2.42041015625, -1.682861328125, -0.9453125, -0.207763671875, 0.52978515625, 1.267333984375, 2.0048828125, 2.742431640625, 3.47998046875, 4.217529296875, 4.955078125, 5.692626953125, 6.43017578125, 7.167724609375, 7.9052734375, 8.642822265625, 9.38037109375, 10.117919921875, 10.85546875, 11.593017578125, 12.33056640625, 13.068115234375, 13.8056640625, 14.543212890625, 15.28076171875, 16.018310546875, 16.755859375, 17.493408203125, 18.23095703125, 18.968505859375, 19.7060546875, 20.443603515625, 21.18115234375, 21.918701171875, 22.65625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 7.0, 8.0, 3.0, 15.0, 22.0, 24.0, 31.0, 37.0, 26.0, 48.0, 41.0, 43.0, 46.0, 49.0, 58.0, 73.0, 61.0, 43.0, 58.0, 39.0, 47.0, 34.0, 23.0, 35.0, 29.0, 22.0, 13.0, 9.0, 7.0, 9.0, 5.0, 2.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.0166015625, -15.408203125, -14.7998046875, -14.19140625, -13.5830078125, -12.974609375, -12.3662109375, -11.7578125, -11.1494140625, -10.541015625, -9.9326171875, -9.32421875, -8.7158203125, -8.107421875, -7.4990234375, -6.890625, -6.2822265625, -5.673828125, -5.0654296875, -4.45703125, -3.8486328125, -3.240234375, -2.6318359375, -2.0234375, -1.4150390625, -0.806640625, -0.1982421875, 0.41015625, 1.0185546875, 1.626953125, 2.2353515625, 2.84375, 3.4521484375, 4.060546875, 4.6689453125, 5.27734375, 5.8857421875, 6.494140625, 7.1025390625, 7.7109375, 8.3193359375, 8.927734375, 9.5361328125, 10.14453125, 10.7529296875, 11.361328125, 11.9697265625, 12.578125, 13.1865234375, 13.794921875, 14.4033203125, 15.01171875, 15.6201171875, 16.228515625, 16.8369140625, 17.4453125, 18.0537109375, 18.662109375, 19.2705078125, 19.87890625, 20.4873046875, 21.095703125, 21.7041015625, 22.3125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 13.0, 15.0, 21.0, 24.0, 35.0, 50.0, 55.0, 67.0, 115.0, 108.0, 198.0, 224.0, 325.0, 514.0, 753.0, 1226.0, 2198.0, 4966.0, 15461.0, 69731.0, 677927.0, 220224.0, 36122.0, 9548.0, 3515.0, 1849.0, 1021.0, 638.0, 421.0, 330.0, 225.0, 131.0, 123.0, 90.0, 58.0, 43.0, 39.0, 34.0, 30.0, 17.0, 15.0, 9.0, 16.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-42.09375, -40.88427734375, -39.6748046875, -38.46533203125, -37.255859375, -36.04638671875, -34.8369140625, -33.62744140625, -32.41796875, -31.20849609375, -29.9990234375, -28.78955078125, -27.580078125, -26.37060546875, -25.1611328125, -23.95166015625, -22.7421875, -21.53271484375, -20.3232421875, -19.11376953125, -17.904296875, -16.69482421875, -15.4853515625, -14.27587890625, -13.06640625, -11.85693359375, -10.6474609375, -9.43798828125, -8.228515625, -7.01904296875, -5.8095703125, -4.60009765625, -3.390625, -2.18115234375, -0.9716796875, 0.23779296875, 1.447265625, 2.65673828125, 3.8662109375, 5.07568359375, 6.28515625, 7.49462890625, 8.7041015625, 9.91357421875, 11.123046875, 12.33251953125, 13.5419921875, 14.75146484375, 15.9609375, 17.17041015625, 18.3798828125, 19.58935546875, 20.798828125, 22.00830078125, 23.2177734375, 24.42724609375, 25.63671875, 26.84619140625, 28.0556640625, 29.26513671875, 30.474609375, 31.68408203125, 32.8935546875, 34.10302734375, 35.3125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 12.0, 14.0, 19.0, 14.0, 27.0, 26.0, 23.0, 34.0, 32.0, 31.0, 43.0, 39.0, 51.0, 42.0, 48.0, 46.0, 44.0, 53.0, 52.0, 41.0, 34.0, 40.0, 31.0, 30.0, 26.0, 22.0, 14.0, 16.0, 11.0, 12.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-65.5, -63.67626953125, -61.8525390625, -60.02880859375, -58.205078125, -56.38134765625, -54.5576171875, -52.73388671875, -50.91015625, -49.08642578125, -47.2626953125, -45.43896484375, -43.615234375, -41.79150390625, -39.9677734375, -38.14404296875, -36.3203125, -34.49658203125, -32.6728515625, -30.84912109375, -29.025390625, -27.20166015625, -25.3779296875, -23.55419921875, -21.73046875, -19.90673828125, -18.0830078125, -16.25927734375, -14.435546875, -12.61181640625, -10.7880859375, -8.96435546875, -7.140625, -5.31689453125, -3.4931640625, -1.66943359375, 0.154296875, 1.97802734375, 3.8017578125, 5.62548828125, 7.44921875, 9.27294921875, 11.0966796875, 12.92041015625, 14.744140625, 16.56787109375, 18.3916015625, 20.21533203125, 22.0390625, 23.86279296875, 25.6865234375, 27.51025390625, 29.333984375, 31.15771484375, 32.9814453125, 34.80517578125, 36.62890625, 38.45263671875, 40.2763671875, 42.10009765625, 43.923828125, 45.74755859375, 47.5712890625, 49.39501953125, 51.21875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 5.0, 7.0, 13.0, 12.0, 17.0, 33.0, 53.0, 61.0, 57.0, 141.0, 263.0, 566.0, 1407.0, 5103.0, 32928.0, 900049.0, 95150.0, 9066.0, 2100.0, 745.0, 301.0, 167.0, 93.0, 61.0, 35.0, 40.0, 18.0, 12.0, 10.0, 7.0, 5.0, 8.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8748779296875, -12.468505859375, -12.0621337890625, -11.65576171875, -11.2493896484375, -10.843017578125, -10.4366455078125, -10.0302734375, -9.6239013671875, -9.217529296875, -8.8111572265625, -8.40478515625, -7.9984130859375, -7.592041015625, -7.1856689453125, -6.779296875, -6.3729248046875, -5.966552734375, -5.5601806640625, -5.15380859375, -4.7474365234375, -4.341064453125, -3.9346923828125, -3.5283203125, -3.1219482421875, -2.715576171875, -2.3092041015625, -1.90283203125, -1.4964599609375, -1.090087890625, -0.6837158203125, -0.27734375, 0.1290283203125, 0.535400390625, 0.9417724609375, 1.34814453125, 1.7545166015625, 2.160888671875, 2.5672607421875, 2.9736328125, 3.3800048828125, 3.786376953125, 4.1927490234375, 4.59912109375, 5.0054931640625, 5.411865234375, 5.8182373046875, 6.224609375, 6.6309814453125, 7.037353515625, 7.4437255859375, 7.85009765625, 8.2564697265625, 8.662841796875, 9.0692138671875, 9.4755859375, 9.8819580078125, 10.288330078125, 10.6947021484375, 11.10107421875, 11.5074462890625, 11.913818359375, 12.3201904296875, 12.7265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 11.0, 3.0, 11.0, 20.0, 40.0, 60.0, 157.0, 299.0, 176.0, 86.0, 35.0, 27.0, 12.0, 14.0, 5.0, 8.0, 7.0, 1.0, 5.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00255584716796875, -0.00244748592376709, -0.0023391246795654297, -0.0022307634353637695, -0.0021224021911621094, -0.0020140409469604492, -0.001905679702758789, -0.001797318458557129, -0.0016889572143554688, -0.0015805959701538086, -0.0014722347259521484, -0.0013638734817504883, -0.0012555122375488281, -0.001147150993347168, -0.0010387897491455078, -0.0009304285049438477, -0.0008220672607421875, -0.0007137060165405273, -0.0006053447723388672, -0.000496983528137207, -0.0003886222839355469, -0.0002802610397338867, -0.00017189979553222656, -6.35385513305664e-05, 4.482269287109375e-05, 0.0001531839370727539, 0.00026154518127441406, 0.0003699064254760742, 0.0004782676696777344, 0.0005866289138793945, 0.0006949901580810547, 0.0008033514022827148, 0.000911712646484375, 0.0010200738906860352, 0.0011284351348876953, 0.0012367963790893555, 0.0013451576232910156, 0.0014535188674926758, 0.001561880111694336, 0.001670241355895996, 0.0017786026000976562, 0.0018869638442993164, 0.0019953250885009766, 0.0021036863327026367, 0.002212047576904297, 0.002320408821105957, 0.002428770065307617, 0.0025371313095092773, 0.0026454925537109375, 0.0027538537979125977, 0.002862215042114258, 0.002970576286315918, 0.003078937530517578, 0.0031872987747192383, 0.0032956600189208984, 0.0034040212631225586, 0.0035123825073242188, 0.003620743751525879, 0.003729104995727539, 0.0038374662399291992, 0.003945827484130859, 0.0040541887283325195, 0.00416254997253418, 0.00427091121673584, 0.0043792724609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 26.0, 22.0, 30.0, 37.0, 48.0, 54.0, 75.0, 99.0, 155.0, 261.0, 332.0, 606.0, 900.0, 1755.0, 3424.0, 7188.0, 18987.0, 74523.0, 681406.0, 199580.0, 36747.0, 11378.0, 5020.0, 2286.0, 1347.0, 750.0, 467.0, 298.0, 184.0, 147.0, 105.0, 90.0, 48.0, 48.0, 30.0, 23.0, 15.0, 11.0, 11.0, 7.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.7421875, -5.5555419921875, -5.368896484375, -5.1822509765625, -4.99560546875, -4.8089599609375, -4.622314453125, -4.4356689453125, -4.2490234375, -4.0623779296875, -3.875732421875, -3.6890869140625, -3.50244140625, -3.3157958984375, -3.129150390625, -2.9425048828125, -2.755859375, -2.5692138671875, -2.382568359375, -2.1959228515625, -2.00927734375, -1.8226318359375, -1.635986328125, -1.4493408203125, -1.2626953125, -1.0760498046875, -0.889404296875, -0.7027587890625, -0.51611328125, -0.3294677734375, -0.142822265625, 0.0438232421875, 0.23046875, 0.4171142578125, 0.603759765625, 0.7904052734375, 0.97705078125, 1.1636962890625, 1.350341796875, 1.5369873046875, 1.7236328125, 1.9102783203125, 2.096923828125, 2.2835693359375, 2.47021484375, 2.6568603515625, 2.843505859375, 3.0301513671875, 3.216796875, 3.4034423828125, 3.590087890625, 3.7767333984375, 3.96337890625, 4.1500244140625, 4.336669921875, 4.5233154296875, 4.7099609375, 4.8966064453125, 5.083251953125, 5.2698974609375, 5.45654296875, 5.6431884765625, 5.829833984375, 6.0164794921875, 6.203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 8.0, 5.0, 13.0, 14.0, 14.0, 20.0, 22.0, 28.0, 41.0, 50.0, 87.0, 101.0, 112.0, 114.0, 83.0, 58.0, 58.0, 40.0, 24.0, 23.0, 13.0, 16.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.4920654296875, -7.241943359375, -6.9918212890625, -6.74169921875, -6.4915771484375, -6.241455078125, -5.9913330078125, -5.7412109375, -5.4910888671875, -5.240966796875, -4.9908447265625, -4.74072265625, -4.4906005859375, -4.240478515625, -3.9903564453125, -3.740234375, -3.4901123046875, -3.239990234375, -2.9898681640625, -2.73974609375, -2.4896240234375, -2.239501953125, -1.9893798828125, -1.7392578125, -1.4891357421875, -1.239013671875, -0.9888916015625, -0.73876953125, -0.4886474609375, -0.238525390625, 0.0115966796875, 0.26171875, 0.5118408203125, 0.761962890625, 1.0120849609375, 1.26220703125, 1.5123291015625, 1.762451171875, 2.0125732421875, 2.2626953125, 2.5128173828125, 2.762939453125, 3.0130615234375, 3.26318359375, 3.5133056640625, 3.763427734375, 4.0135498046875, 4.263671875, 4.5137939453125, 4.763916015625, 5.0140380859375, 5.26416015625, 5.5142822265625, 5.764404296875, 6.0145263671875, 6.2646484375, 6.5147705078125, 6.764892578125, 7.0150146484375, 7.26513671875, 7.5152587890625, 7.765380859375, 8.0155029296875, 8.265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 11.0, 17.0, 34.0, 45.0, 81.0, 176.0, 329.0, 133.0, 62.0, 37.0, 22.0, 15.0, 7.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-201.1312255859375, -192.88150024414062, -184.63177490234375, -176.38204956054688, -168.13232421875, -159.88259887695312, -151.63287353515625, -143.38314819335938, -135.1334228515625, -126.88369750976562, -118.63397216796875, -110.38424682617188, -102.134521484375, -93.88479614257812, -85.63507080078125, -77.38534545898438, -69.1356201171875, -60.885894775390625, -52.63616943359375, -44.386444091796875, -36.13671875, -27.886993408203125, -19.63726806640625, -11.387542724609375, -3.1378173828125, 5.111907958984375, 13.36163330078125, 21.611358642578125, 29.861083984375, 38.110809326171875, 46.36053466796875, 54.610260009765625, 62.860015869140625, 71.1097412109375, 79.35946655273438, 87.60919189453125, 95.85891723632812, 104.108642578125, 112.35836791992188, 120.60809326171875, 128.85781860351562, 137.1075439453125, 145.35726928710938, 153.60699462890625, 161.85671997070312, 170.1064453125, 178.35617065429688, 186.60589599609375, 194.85562133789062, 203.1053466796875, 211.35507202148438, 219.60479736328125, 227.85452270507812, 236.104248046875, 244.35397338867188, 252.60369873046875, 260.8534240722656, 269.1031494140625, 277.3528747558594, 285.60260009765625, 293.8523254394531, 302.10205078125, 310.3517761230469, 318.60150146484375, 326.8512268066406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 10.0, 12.0, 13.0, 11.0, 10.0, 18.0, 20.0, 23.0, 24.0, 26.0, 28.0, 25.0, 27.0, 71.0, 89.0, 122.0, 114.0, 47.0, 35.0, 37.0, 26.0, 20.0, 20.0, 16.0, 20.0, 24.0, 14.0, 17.0, 10.0, 11.0, 14.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.0072784423828, -200.46408081054688, -192.9208984375, -185.37770080566406, -177.83450317382812, -170.29132080078125, -162.7481231689453, -155.20492553710938, -147.6617431640625, -140.11854553222656, -132.5753631591797, -125.03216552734375, -117.48897552490234, -109.94578552246094, -102.402587890625, -94.8593978881836, -87.31620788574219, -79.77301788330078, -72.22982788085938, -64.68663024902344, -57.14344024658203, -49.600250244140625, -42.05705642700195, -34.51386260986328, -26.970672607421875, -19.427480697631836, -11.884288787841797, -4.341096878051758, 3.2020950317382812, 10.745285034179688, 18.28847885131836, 25.83167266845703, 33.374847412109375, 40.91803741455078, 48.46123123168945, 56.004425048828125, 63.54761505126953, 71.09080505371094, 78.63400268554688, 86.17719268798828, 93.72038269042969, 101.2635726928711, 108.8067626953125, 116.34996032714844, 123.89315032958984, 131.43634033203125, 138.9795379638672, 146.52273559570312, 154.06591796875, 161.60911560058594, 169.1522979736328, 176.69549560546875, 184.23867797851562, 191.78187561035156, 199.3250732421875, 206.86825561523438, 214.4114532470703, 221.95465087890625, 229.49783325195312, 237.04103088378906, 244.584228515625, 252.12741088867188, 259.67059326171875, 267.21380615234375, 274.7569885253906]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 7.0, 12.0, 17.0, 19.0, 36.0, 61.0, 70.0, 128.0, 188.0, 350.0, 568.0, 999.0, 2220.0, 6292.0, 22037.0, 128437.0, 1080382.0, 2386092.0, 490875.0, 57563.0, 10795.0, 3471.0, 1548.0, 864.0, 484.0, 264.0, 174.0, 100.0, 58.0, 44.0, 37.0, 25.0, 18.0, 13.0, 11.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.6875, -23.815185546875, -22.94287109375, -22.070556640625, -21.1982421875, -20.325927734375, -19.45361328125, -18.581298828125, -17.708984375, -16.836669921875, -15.96435546875, -15.092041015625, -14.2197265625, -13.347412109375, -12.47509765625, -11.602783203125, -10.73046875, -9.858154296875, -8.98583984375, -8.113525390625, -7.2412109375, -6.368896484375, -5.49658203125, -4.624267578125, -3.751953125, -2.879638671875, -2.00732421875, -1.135009765625, -0.2626953125, 0.609619140625, 1.48193359375, 2.354248046875, 3.2265625, 4.098876953125, 4.97119140625, 5.843505859375, 6.7158203125, 7.588134765625, 8.46044921875, 9.332763671875, 10.205078125, 11.077392578125, 11.94970703125, 12.822021484375, 13.6943359375, 14.566650390625, 15.43896484375, 16.311279296875, 17.18359375, 18.055908203125, 18.92822265625, 19.800537109375, 20.6728515625, 21.545166015625, 22.41748046875, 23.289794921875, 24.162109375, 25.034423828125, 25.90673828125, 26.779052734375, 27.6513671875, 28.523681640625, 29.39599609375, 30.268310546875, 31.140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 7.0, 19.0, 21.0, 25.0, 33.0, 45.0, 41.0, 43.0, 39.0, 60.0, 55.0, 74.0, 56.0, 56.0, 70.0, 56.0, 48.0, 46.0, 25.0, 37.0, 27.0, 23.0, 23.0, 11.0, 10.0, 11.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.030517578125, -15.42041015625, -14.810302734375, -14.2001953125, -13.590087890625, -12.97998046875, -12.369873046875, -11.759765625, -11.149658203125, -10.53955078125, -9.929443359375, -9.3193359375, -8.709228515625, -8.09912109375, -7.489013671875, -6.87890625, -6.268798828125, -5.65869140625, -5.048583984375, -4.4384765625, -3.828369140625, -3.21826171875, -2.608154296875, -1.998046875, -1.387939453125, -0.77783203125, -0.167724609375, 0.4423828125, 1.052490234375, 1.66259765625, 2.272705078125, 2.8828125, 3.492919921875, 4.10302734375, 4.713134765625, 5.3232421875, 5.933349609375, 6.54345703125, 7.153564453125, 7.763671875, 8.373779296875, 8.98388671875, 9.593994140625, 10.2041015625, 10.814208984375, 11.42431640625, 12.034423828125, 12.64453125, 13.254638671875, 13.86474609375, 14.474853515625, 15.0849609375, 15.695068359375, 16.30517578125, 16.915283203125, 17.525390625, 18.135498046875, 18.74560546875, 19.355712890625, 19.9658203125, 20.575927734375, 21.18603515625, 21.796142578125, 22.40625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 9.0, 12.0, 13.0, 30.0, 38.0, 36.0, 86.0, 147.0, 273.0, 516.0, 1359.0, 4894.0, 45361.0, 3962462.0, 167551.0, 8266.0, 1832.0, 646.0, 300.0, 172.0, 83.0, 64.0, 41.0, 18.0, 21.0, 11.0, 10.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.6875, -69.1865234375, -66.685546875, -64.1845703125, -61.68359375, -59.1826171875, -56.681640625, -54.1806640625, -51.6796875, -49.1787109375, -46.677734375, -44.1767578125, -41.67578125, -39.1748046875, -36.673828125, -34.1728515625, -31.671875, -29.1708984375, -26.669921875, -24.1689453125, -21.66796875, -19.1669921875, -16.666015625, -14.1650390625, -11.6640625, -9.1630859375, -6.662109375, -4.1611328125, -1.66015625, 0.8408203125, 3.341796875, 5.8427734375, 8.34375, 10.8447265625, 13.345703125, 15.8466796875, 18.34765625, 20.8486328125, 23.349609375, 25.8505859375, 28.3515625, 30.8525390625, 33.353515625, 35.8544921875, 38.35546875, 40.8564453125, 43.357421875, 45.8583984375, 48.359375, 50.8603515625, 53.361328125, 55.8623046875, 58.36328125, 60.8642578125, 63.365234375, 65.8662109375, 68.3671875, 70.8681640625, 73.369140625, 75.8701171875, 78.37109375, 80.8720703125, 83.373046875, 85.8740234375, 88.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 13.0, 6.0, 7.0, 11.0, 21.0, 22.0, 44.0, 56.0, 73.0, 130.0, 204.0, 303.0, 539.0, 701.0, 663.0, 504.0, 285.0, 180.0, 97.0, 61.0, 43.0, 42.0, 16.0, 10.0, 12.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -50.50341796875, -48.9755859375, -47.44775390625, -45.919921875, -44.39208984375, -42.8642578125, -41.33642578125, -39.80859375, -38.28076171875, -36.7529296875, -35.22509765625, -33.697265625, -32.16943359375, -30.6416015625, -29.11376953125, -27.5859375, -26.05810546875, -24.5302734375, -23.00244140625, -21.474609375, -19.94677734375, -18.4189453125, -16.89111328125, -15.36328125, -13.83544921875, -12.3076171875, -10.77978515625, -9.251953125, -7.72412109375, -6.1962890625, -4.66845703125, -3.140625, -1.61279296875, -0.0849609375, 1.44287109375, 2.970703125, 4.49853515625, 6.0263671875, 7.55419921875, 9.08203125, 10.60986328125, 12.1376953125, 13.66552734375, 15.193359375, 16.72119140625, 18.2490234375, 19.77685546875, 21.3046875, 22.83251953125, 24.3603515625, 25.88818359375, 27.416015625, 28.94384765625, 30.4716796875, 31.99951171875, 33.52734375, 35.05517578125, 36.5830078125, 38.11083984375, 39.638671875, 41.16650390625, 42.6943359375, 44.22216796875, 45.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 10.0, 16.0, 25.0, 35.0, 80.0, 158.0, 240.0, 173.0, 116.0, 53.0, 34.0, 13.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.818603515625, -325.2418518066406, -309.66510009765625, -294.0883483886719, -278.5115966796875, -262.934814453125, -247.35806274414062, -231.78131103515625, -216.20455932617188, -200.6278076171875, -185.05105590820312, -169.4742889404297, -153.8975372314453, -138.32078552246094, -122.74402618408203, -107.16726684570312, -91.59051513671875, -76.01376342773438, -60.43700408935547, -44.86024856567383, -29.283493041992188, -13.706741333007812, 1.8700180053710938, 17.44677734375, 33.023529052734375, 48.600284576416016, 64.17704010009766, 79.75379943847656, 95.33055114746094, 110.90730285644531, 126.48406219482422, 142.06082153320312, 157.6375732421875, 173.21432495117188, 188.79107666015625, 204.3678436279297, 219.94459533691406, 235.52134704589844, 251.09811401367188, 266.67486572265625, 282.2516174316406, 297.828369140625, 313.4051208496094, 328.98187255859375, 344.55865478515625, 360.1353759765625, 375.712158203125, 391.2889099121094, 406.86566162109375, 422.4424133300781, 438.0191650390625, 453.5959167480469, 469.17266845703125, 484.74945068359375, 500.3262023925781, 515.9029541015625, 531.479736328125, 547.0565185546875, 562.6332397460938, 578.2100219726562, 593.7867431640625, 609.363525390625, 624.9402465820312, 640.5170288085938, 656.09375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 13.0, 9.0, 17.0, 29.0, 19.0, 27.0, 28.0, 45.0, 41.0, 43.0, 53.0, 63.0, 68.0, 54.0, 73.0, 47.0, 48.0, 30.0, 41.0, 49.0, 36.0, 33.0, 15.0, 20.0, 20.0, 17.0, 13.0, 6.0, 10.0, 6.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-266.8985900878906, -258.9678039550781, -251.03701782226562, -243.10623168945312, -235.17544555664062, -227.24465942382812, -219.31385803222656, -211.38307189941406, -203.45228576660156, -195.52149963378906, -187.59071350097656, -179.65992736816406, -171.7291259765625, -163.79833984375, -155.8675537109375, -147.936767578125, -140.0059814453125, -132.0751953125, -124.1444091796875, -116.21361541748047, -108.28282928466797, -100.35204315185547, -92.42124938964844, -84.49046325683594, -76.55967712402344, -68.62889099121094, -60.69810104370117, -52.767311096191406, -44.836524963378906, -36.905738830566406, -28.97494888305664, -21.044158935546875, -13.113388061523438, -5.182600021362305, 2.748188018798828, 10.678976058959961, 18.609764099121094, 26.540550231933594, 34.47134017944336, 42.402130126953125, 50.332916259765625, 58.263702392578125, 66.19448852539062, 74.12528228759766, 82.05606842041016, 89.98685455322266, 97.91764831542969, 105.84843444824219, 113.77922058105469, 121.71000671386719, 129.6407928466797, 137.5715789794922, 145.50238037109375, 153.43316650390625, 161.36395263671875, 169.29473876953125, 177.22552490234375, 185.15631103515625, 193.08709716796875, 201.01788330078125, 208.94866943359375, 216.87945556640625, 224.8102569580078, 232.7410430908203, 240.6718292236328]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 9.0, 16.0, 24.0, 28.0, 45.0, 76.0, 101.0, 180.0, 307.0, 466.0, 771.0, 1520.0, 3077.0, 6498.0, 15982.0, 44897.0, 145213.0, 444968.0, 262200.0, 77619.0, 25582.0, 9835.0, 4389.0, 2043.0, 1115.0, 619.0, 338.0, 217.0, 111.0, 95.0, 70.0, 32.0, 32.0, 23.0, 8.0, 14.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.703125, -23.970947265625, -23.23876953125, -22.506591796875, -21.7744140625, -21.042236328125, -20.31005859375, -19.577880859375, -18.845703125, -18.113525390625, -17.38134765625, -16.649169921875, -15.9169921875, -15.184814453125, -14.45263671875, -13.720458984375, -12.98828125, -12.256103515625, -11.52392578125, -10.791748046875, -10.0595703125, -9.327392578125, -8.59521484375, -7.863037109375, -7.130859375, -6.398681640625, -5.66650390625, -4.934326171875, -4.2021484375, -3.469970703125, -2.73779296875, -2.005615234375, -1.2734375, -0.541259765625, 0.19091796875, 0.923095703125, 1.6552734375, 2.387451171875, 3.11962890625, 3.851806640625, 4.583984375, 5.316162109375, 6.04833984375, 6.780517578125, 7.5126953125, 8.244873046875, 8.97705078125, 9.709228515625, 10.44140625, 11.173583984375, 11.90576171875, 12.637939453125, 13.3701171875, 14.102294921875, 14.83447265625, 15.566650390625, 16.298828125, 17.031005859375, 17.76318359375, 18.495361328125, 19.2275390625, 19.959716796875, 20.69189453125, 21.424072265625, 22.15625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 16.0, 22.0, 23.0, 28.0, 44.0, 37.0, 26.0, 61.0, 55.0, 61.0, 44.0, 47.0, 50.0, 49.0, 59.0, 54.0, 52.0, 42.0, 34.0, 35.0, 22.0, 25.0, 20.0, 9.0, 10.0, 13.0, 10.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.984375, -17.385986328125, -16.78759765625, -16.189208984375, -15.5908203125, -14.992431640625, -14.39404296875, -13.795654296875, -13.197265625, -12.598876953125, -12.00048828125, -11.402099609375, -10.8037109375, -10.205322265625, -9.60693359375, -9.008544921875, -8.41015625, -7.811767578125, -7.21337890625, -6.614990234375, -6.0166015625, -5.418212890625, -4.81982421875, -4.221435546875, -3.623046875, -3.024658203125, -2.42626953125, -1.827880859375, -1.2294921875, -0.631103515625, -0.03271484375, 0.565673828125, 1.1640625, 1.762451171875, 2.36083984375, 2.959228515625, 3.5576171875, 4.156005859375, 4.75439453125, 5.352783203125, 5.951171875, 6.549560546875, 7.14794921875, 7.746337890625, 8.3447265625, 8.943115234375, 9.54150390625, 10.139892578125, 10.73828125, 11.336669921875, 11.93505859375, 12.533447265625, 13.1318359375, 13.730224609375, 14.32861328125, 14.927001953125, 15.525390625, 16.123779296875, 16.72216796875, 17.320556640625, 17.9189453125, 18.517333984375, 19.11572265625, 19.714111328125, 20.3125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 13.0, 26.0, 36.0, 42.0, 53.0, 86.0, 134.0, 205.0, 448.0, 985.0, 2988.0, 18795.0, 647429.0, 359052.0, 14020.0, 2409.0, 806.0, 418.0, 227.0, 109.0, 87.0, 57.0, 32.0, 27.0, 17.0, 10.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.83935546875, -31.5224609375, -30.20556640625, -28.888671875, -27.57177734375, -26.2548828125, -24.93798828125, -23.62109375, -22.30419921875, -20.9873046875, -19.67041015625, -18.353515625, -17.03662109375, -15.7197265625, -14.40283203125, -13.0859375, -11.76904296875, -10.4521484375, -9.13525390625, -7.818359375, -6.50146484375, -5.1845703125, -3.86767578125, -2.55078125, -1.23388671875, 0.0830078125, 1.39990234375, 2.716796875, 4.03369140625, 5.3505859375, 6.66748046875, 7.984375, 9.30126953125, 10.6181640625, 11.93505859375, 13.251953125, 14.56884765625, 15.8857421875, 17.20263671875, 18.51953125, 19.83642578125, 21.1533203125, 22.47021484375, 23.787109375, 25.10400390625, 26.4208984375, 27.73779296875, 29.0546875, 30.37158203125, 31.6884765625, 33.00537109375, 34.322265625, 35.63916015625, 36.9560546875, 38.27294921875, 39.58984375, 40.90673828125, 42.2236328125, 43.54052734375, 44.857421875, 46.17431640625, 47.4912109375, 48.80810546875, 50.125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 7.0, 16.0, 20.0, 23.0, 33.0, 41.0, 29.0, 79.0, 73.0, 102.0, 83.0, 98.0, 92.0, 60.0, 42.0, 29.0, 35.0, 27.0, 26.0, 18.0, 10.0, 6.0, 4.0, 8.0, 0.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.375, -71.69140625, -69.0078125, -66.32421875, -63.640625, -60.95703125, -58.2734375, -55.58984375, -52.90625, -50.22265625, -47.5390625, -44.85546875, -42.171875, -39.48828125, -36.8046875, -34.12109375, -31.4375, -28.75390625, -26.0703125, -23.38671875, -20.703125, -18.01953125, -15.3359375, -12.65234375, -9.96875, -7.28515625, -4.6015625, -1.91796875, 0.765625, 3.44921875, 6.1328125, 8.81640625, 11.5, 14.18359375, 16.8671875, 19.55078125, 22.234375, 24.91796875, 27.6015625, 30.28515625, 32.96875, 35.65234375, 38.3359375, 41.01953125, 43.703125, 46.38671875, 49.0703125, 51.75390625, 54.4375, 57.12109375, 59.8046875, 62.48828125, 65.171875, 67.85546875, 70.5390625, 73.22265625, 75.90625, 78.58984375, 81.2734375, 83.95703125, 86.640625, 89.32421875, 92.0078125, 94.69140625, 97.375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 10.0, 11.0, 11.0, 12.0, 32.0, 41.0, 60.0, 129.0, 246.0, 539.0, 1708.0, 8848.0, 170716.0, 848523.0, 14102.0, 2247.0, 671.0, 292.0, 131.0, 64.0, 50.0, 41.0, 14.0, 13.0, 10.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.5897216796875, -6.370849609375, -6.1519775390625, -5.93310546875, -5.7142333984375, -5.495361328125, -5.2764892578125, -5.0576171875, -4.8387451171875, -4.619873046875, -4.4010009765625, -4.18212890625, -3.9632568359375, -3.744384765625, -3.5255126953125, -3.306640625, -3.0877685546875, -2.868896484375, -2.6500244140625, -2.43115234375, -2.2122802734375, -1.993408203125, -1.7745361328125, -1.5556640625, -1.3367919921875, -1.117919921875, -0.8990478515625, -0.68017578125, -0.4613037109375, -0.242431640625, -0.0235595703125, 0.1953125, 0.4141845703125, 0.633056640625, 0.8519287109375, 1.07080078125, 1.2896728515625, 1.508544921875, 1.7274169921875, 1.9462890625, 2.1651611328125, 2.384033203125, 2.6029052734375, 2.82177734375, 3.0406494140625, 3.259521484375, 3.4783935546875, 3.697265625, 3.9161376953125, 4.135009765625, 4.3538818359375, 4.57275390625, 4.7916259765625, 5.010498046875, 5.2293701171875, 5.4482421875, 5.6671142578125, 5.885986328125, 6.1048583984375, 6.32373046875, 6.5426025390625, 6.761474609375, 6.9803466796875, 7.19921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 9.0, 6.0, 10.0, 9.0, 16.0, 21.0, 23.0, 32.0, 42.0, 53.0, 60.0, 90.0, 94.0, 91.0, 82.0, 85.0, 73.0, 47.0, 21.0, 21.0, 26.0, 10.0, 10.0, 14.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008563995361328125, -0.0008327588438987732, -0.0008091181516647339, -0.0007854774594306946, -0.0007618367671966553, -0.000738196074962616, -0.0007145553827285767, -0.0006909146904945374, -0.000667273998260498, -0.0006436333060264587, -0.0006199926137924194, -0.0005963519215583801, -0.0005727112293243408, -0.0005490705370903015, -0.0005254298448562622, -0.0005017891526222229, -0.0004781484603881836, -0.0004545077681541443, -0.000430867075920105, -0.0004072263836860657, -0.00038358569145202637, -0.00035994499921798706, -0.00033630430698394775, -0.00031266361474990845, -0.00028902292251586914, -0.00026538223028182983, -0.00024174153804779053, -0.00021810084581375122, -0.00019446015357971191, -0.0001708194613456726, -0.0001471787691116333, -0.000123538076877594, -9.989738464355469e-05, -7.625669240951538e-05, -5.2616000175476074e-05, -2.8975307941436768e-05, -5.334615707397461e-06, 1.8306076526641846e-05, 4.194676876068115e-05, 6.558746099472046e-05, 8.922815322875977e-05, 0.00011286884546279907, 0.00013650953769683838, 0.00016015022993087769, 0.000183790922164917, 0.0002074316143989563, 0.0002310723066329956, 0.0002547129988670349, 0.0002783536911010742, 0.0003019943833351135, 0.00032563507556915283, 0.00034927576780319214, 0.00037291646003723145, 0.00039655715227127075, 0.00042019784450531006, 0.00044383853673934937, 0.00046747922897338867, 0.000491119921207428, 0.0005147606134414673, 0.0005384013056755066, 0.0005620419979095459, 0.0005856826901435852, 0.0006093233823776245, 0.0006329640746116638, 0.0006566047668457031]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 14.0, 19.0, 30.0, 52.0, 69.0, 111.0, 200.0, 326.0, 565.0, 1187.0, 2597.0, 7025.0, 23391.0, 154762.0, 780903.0, 56076.0, 12888.0, 4442.0, 1932.0, 773.0, 469.0, 255.0, 150.0, 89.0, 60.0, 43.0, 30.0, 15.0, 9.0, 15.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5543212890625, -3.440673828125, -3.3270263671875, -3.21337890625, -3.0997314453125, -2.986083984375, -2.8724365234375, -2.7587890625, -2.6451416015625, -2.531494140625, -2.4178466796875, -2.30419921875, -2.1905517578125, -2.076904296875, -1.9632568359375, -1.849609375, -1.7359619140625, -1.622314453125, -1.5086669921875, -1.39501953125, -1.2813720703125, -1.167724609375, -1.0540771484375, -0.9404296875, -0.8267822265625, -0.713134765625, -0.5994873046875, -0.48583984375, -0.3721923828125, -0.258544921875, -0.1448974609375, -0.03125, 0.0823974609375, 0.196044921875, 0.3096923828125, 0.42333984375, 0.5369873046875, 0.650634765625, 0.7642822265625, 0.8779296875, 0.9915771484375, 1.105224609375, 1.2188720703125, 1.33251953125, 1.4461669921875, 1.559814453125, 1.6734619140625, 1.787109375, 1.9007568359375, 2.014404296875, 2.1280517578125, 2.24169921875, 2.3553466796875, 2.468994140625, 2.5826416015625, 2.6962890625, 2.8099365234375, 2.923583984375, 3.0372314453125, 3.15087890625, 3.2645263671875, 3.378173828125, 3.4918212890625, 3.60546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 0.0, 11.0, 6.0, 8.0, 8.0, 11.0, 7.0, 17.0, 22.0, 23.0, 61.0, 85.0, 133.0, 167.0, 126.0, 98.0, 56.0, 48.0, 25.0, 20.0, 10.0, 16.0, 10.0, 14.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73651123046875, -5.5433349609375, -5.35015869140625, -5.156982421875, -4.96380615234375, -4.7706298828125, -4.57745361328125, -4.38427734375, -4.19110107421875, -3.9979248046875, -3.80474853515625, -3.611572265625, -3.41839599609375, -3.2252197265625, -3.03204345703125, -2.8388671875, -2.64569091796875, -2.4525146484375, -2.25933837890625, -2.066162109375, -1.87298583984375, -1.6798095703125, -1.48663330078125, -1.29345703125, -1.10028076171875, -0.9071044921875, -0.71392822265625, -0.520751953125, -0.32757568359375, -0.1343994140625, 0.05877685546875, 0.251953125, 0.44512939453125, 0.6383056640625, 0.83148193359375, 1.024658203125, 1.21783447265625, 1.4110107421875, 1.60418701171875, 1.79736328125, 1.99053955078125, 2.1837158203125, 2.37689208984375, 2.570068359375, 2.76324462890625, 2.9564208984375, 3.14959716796875, 3.3427734375, 3.53594970703125, 3.7291259765625, 3.92230224609375, 4.115478515625, 4.30865478515625, 4.5018310546875, 4.69500732421875, 4.88818359375, 5.08135986328125, 5.2745361328125, 5.46771240234375, 5.660888671875, 5.85406494140625, 6.0472412109375, 6.24041748046875, 6.43359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 33.0, 65.0, 280.0, 453.0, 97.0, 29.0, 14.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-443.47271728515625, -431.5397033691406, -419.6067199707031, -407.6737060546875, -395.7406921386719, -383.80767822265625, -371.87469482421875, -359.9416809082031, -348.0086669921875, -336.0756530761719, -324.1426696777344, -312.20965576171875, -300.2766418457031, -288.3436279296875, -276.41064453125, -264.4776306152344, -252.54464721679688, -240.6116485595703, -228.6786346435547, -216.74563598632812, -204.8126220703125, -192.87962341308594, -180.94662475585938, -169.01361083984375, -157.0806121826172, -145.14761352539062, -133.214599609375, -121.28160095214844, -109.34859466552734, -97.41558837890625, -85.48258972167969, -73.5495834350586, -61.616607666015625, -49.68360137939453, -37.7505989074707, -25.817596435546875, -13.884590148925781, -1.9515838623046875, 9.981414794921875, 21.91442108154297, 33.84742736816406, 45.780433654785156, 57.713436126708984, 69.64643859863281, 81.5794448852539, 93.512451171875, 105.44544982910156, 117.37845611572266, 129.31146240234375, 141.2444610595703, 153.17747497558594, 165.1104736328125, 177.04348754882812, 188.9764862060547, 200.90948486328125, 212.84249877929688, 224.77549743652344, 236.70849609375, 248.64151000976562, 260.57452392578125, 272.50750732421875, 284.4405212402344, 296.37353515625, 308.3065185546875, 320.2395324707031]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 11.0, 13.0, 12.0, 17.0, 17.0, 18.0, 17.0, 26.0, 18.0, 37.0, 126.0, 123.0, 59.0, 109.0, 154.0, 35.0, 23.0, 33.0, 22.0, 19.0, 15.0, 24.0, 15.0, 9.0, 8.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-227.55841064453125, -220.78248596191406, -214.00656127929688, -207.23065185546875, -200.45472717285156, -193.67880249023438, -186.9028778076172, -180.126953125, -173.35104370117188, -166.5751190185547, -159.7991943359375, -153.02328491210938, -146.2473602294922, -139.471435546875, -132.6955108642578, -125.91959381103516, -119.14366912841797, -112.36774444580078, -105.59182739257812, -98.81590270996094, -92.03998565673828, -85.2640609741211, -78.48814392089844, -71.71221923828125, -64.93629455566406, -58.16037368774414, -51.38445281982422, -44.60852813720703, -37.832611083984375, -31.056686401367188, -24.280765533447266, -17.504844665527344, -10.728927612304688, -3.9530062675476074, 2.8229150772094727, 9.598836898803711, 16.374757766723633, 23.150680541992188, 29.92660140991211, 36.70252227783203, 43.47844314575195, 50.254364013671875, 57.0302848815918, 63.80620574951172, 70.5821304321289, 77.35804748535156, 84.13397216796875, 90.90989685058594, 97.6858139038086, 104.46173858642578, 111.23765563964844, 118.01358032226562, 124.78949737548828, 131.5654296875, 138.34133911132812, 145.1172637939453, 151.8931884765625, 158.6691131591797, 165.44503784179688, 172.220947265625, 178.9968719482422, 185.77279663085938, 192.54872131347656, 199.32464599609375, 206.10055541992188]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 8.0, 8.0, 5.0, 15.0, 18.0, 19.0, 23.0, 25.0, 21.0, 43.0, 32.0, 37.0, 62.0, 216.0, 182.0, 56.0, 44.0, 29.0, 20.0, 24.0, 19.0, 16.0, 20.0, 16.0, 7.0, 13.0, 5.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.8740234375, -16.310546875, -15.7470703125, -15.18359375, -14.6201171875, -14.056640625, -13.4931640625, -12.9296875, -12.3662109375, -11.802734375, -11.2392578125, -10.67578125, -10.1123046875, -9.548828125, -8.9853515625, -8.421875, -7.8583984375, -7.294921875, -6.7314453125, -6.16796875, -5.6044921875, -5.041015625, -4.4775390625, -3.9140625, -3.3505859375, -2.787109375, -2.2236328125, -1.66015625, -1.0966796875, -0.533203125, 0.0302734375, 0.59375, 1.1572265625, 1.720703125, 2.2841796875, 2.84765625, 3.4111328125, 3.974609375, 4.5380859375, 5.1015625, 5.6650390625, 6.228515625, 6.7919921875, 7.35546875, 7.9189453125, 8.482421875, 9.0458984375, 9.609375, 10.1728515625, 10.736328125, 11.2998046875, 11.86328125, 12.4267578125, 12.990234375, 13.5537109375, 14.1171875, 14.6806640625, 15.244140625, 15.8076171875, 16.37109375, 16.9345703125, 17.498046875, 18.0615234375, 18.625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 3.0, 8.0, 14.0, 15.0, 18.0, 18.0, 27.0, 28.0, 46.0, 93.0, 232.0, 562.0, 2174.0, 17322.0, 8354671.0, 10760.0, 1648.0, 466.0, 205.0, 96.0, 55.0, 18.0, 26.0, 20.0, 14.0, 6.0, 11.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-205.54661560058594, -199.00250244140625, -192.45838928222656, -185.91427612304688, -179.3701629638672, -172.8260498046875, -166.28192138671875, -159.73782348632812, -153.19369506835938, -146.6495819091797, -140.10546875, -133.5613555908203, -127.01724243164062, -120.47312927246094, -113.92900848388672, -107.38489532470703, -100.84078979492188, -94.29667663574219, -87.7525634765625, -81.20845031738281, -74.66433715820312, -68.12022399902344, -61.57610321044922, -55.03199005126953, -48.487876892089844, -41.943763732910156, -35.39965057373047, -28.855533599853516, -22.311420440673828, -15.76730728149414, -9.223190307617188, -2.6790771484375, 3.865020751953125, 10.409134864807129, 16.953248977661133, 23.497364044189453, 30.04147720336914, 36.58559036254883, 43.12970733642578, 49.67382049560547, 56.217933654785156, 62.762046813964844, 69.30615997314453, 75.85028076171875, 82.39439392089844, 88.93850708007812, 95.48262023925781, 102.0267333984375, 108.57084655761719, 115.11495971679688, 121.65907287597656, 128.20318603515625, 134.74729919433594, 141.29141235351562, 147.83554077148438, 154.379638671875, 160.92376708984375, 167.46788024902344, 174.01199340820312, 180.5561065673828, 187.1002197265625, 193.6443328857422, 200.18844604492188, 206.73257446289062, 213.27667236328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-186.46343994140625, -180.51824951171875, -174.5730743408203, -168.6278839111328, -162.68270874023438, -156.73751831054688, -150.79232788085938, -144.84715270996094, -138.90196228027344, -132.95677185058594, -127.0115966796875, -121.06640625, -115.12122344970703, -109.17604064941406, -103.2308578491211, -97.28567504882812, -91.34049224853516, -85.39530944824219, -79.45012664794922, -73.50494384765625, -67.55975341796875, -61.61457061767578, -55.66938781738281, -49.72420120239258, -43.77901840209961, -37.83383560180664, -31.888648986816406, -25.943466186523438, -19.998281478881836, -14.053096771240234, -8.107913970947266, -2.1627273559570312, 3.7824554443359375, 9.727640151977539, 15.672823905944824, 21.61800765991211, 27.56319236755371, 33.50837707519531, 39.45355987548828, 45.398746490478516, 51.343929290771484, 57.28911209106445, 63.23429870605469, 69.17948150634766, 75.12466430664062, 81.06985473632812, 87.01502990722656, 92.96022033691406, 98.90540313720703, 104.8505859375, 110.79576873779297, 116.74095153808594, 122.68614196777344, 128.63131713867188, 134.57650756835938, 140.52169799804688, 146.4668731689453, 152.4120635986328, 158.35723876953125, 164.30242919921875, 170.2476043701172, 176.1927947998047, 182.13796997070312, 188.08316040039062, 194.02835083007812]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 9.0, 15.0, 22.0, 35.0, 56.0, 79.0, 109.0, 200.0, 277.0, 471.0, 821.0, 1544.0, 2840.0, 5131.0, 9703.0, 18230.0, 34522.0, 65765.0, 112609.0, 117542.0, 72353.0, 38075.0, 20099.0, 10735.0, 5643.0, 3206.0, 1728.0, 933.0, 517.0, 380.0, 216.0, 143.0, 77.0, 48.0, 38.0, 24.0, 23.0, 15.0, 1.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.5625, -80.2734375, -77.984375, -75.6953125, -73.40625, -71.1171875, -68.828125, -66.5390625, -64.25, -61.9609375, -59.671875, -57.3828125, -55.09375, -52.8046875, -50.515625, -48.2265625, -45.9375, -43.6484375, -41.359375, -39.0703125, -36.78125, -34.4921875, -32.203125, -29.9140625, -27.625, -25.3359375, -23.046875, -20.7578125, -18.46875, -16.1796875, -13.890625, -11.6015625, -9.3125, -7.0234375, -4.734375, -2.4453125, -0.15625, 2.1328125, 4.421875, 6.7109375, 9.0, 11.2890625, 13.578125, 15.8671875, 18.15625, 20.4453125, 22.734375, 25.0234375, 27.3125, 29.6015625, 31.890625, 34.1796875, 36.46875, 38.7578125, 41.046875, 43.3359375, 45.625, 47.9140625, 50.203125, 52.4921875, 54.78125, 57.0703125, 59.359375, 61.6484375, 63.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 15.0, 21.0, 31.0, 26.0, 39.0, 45.0, 51.0, 62.0, 79.0, 63.0, 55.0, 62.0, 68.0, 66.0, 54.0, 53.0, 33.0, 33.0, 19.0, 19.0, 11.0, 15.0, 9.0, 4.0, 6.0, 9.0, 3.0, 9.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.6123046875, -16.990234375, -16.3681640625, -15.74609375, -15.1240234375, -14.501953125, -13.8798828125, -13.2578125, -12.6357421875, -12.013671875, -11.3916015625, -10.76953125, -10.1474609375, -9.525390625, -8.9033203125, -8.28125, -7.6591796875, -7.037109375, -6.4150390625, -5.79296875, -5.1708984375, -4.548828125, -3.9267578125, -3.3046875, -2.6826171875, -2.060546875, -1.4384765625, -0.81640625, -0.1943359375, 0.427734375, 1.0498046875, 1.671875, 2.2939453125, 2.916015625, 3.5380859375, 4.16015625, 4.7822265625, 5.404296875, 6.0263671875, 6.6484375, 7.2705078125, 7.892578125, 8.5146484375, 9.13671875, 9.7587890625, 10.380859375, 11.0029296875, 11.625, 12.2470703125, 12.869140625, 13.4912109375, 14.11328125, 14.7353515625, 15.357421875, 15.9794921875, 16.6015625, 17.2236328125, 17.845703125, 18.4677734375, 19.08984375, 19.7119140625, 20.333984375, 20.9560546875, 21.578125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 17.0, 19.0, 21.0, 30.0, 49.0, 72.0, 62.0, 64.0, 39.0, 35.0, 15.0, 15.0, 9.0, 10.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.70374298095703, -110.53536987304688, -107.36700439453125, -104.1986312866211, -101.03025817871094, -97.86189270019531, -94.69351959228516, -91.525146484375, -88.35678100585938, -85.18840789794922, -82.0200424194336, -78.85166931152344, -75.68330383300781, -72.51493072509766, -69.3465576171875, -66.17819213867188, -63.00981903076172, -59.84144973754883, -56.67308044433594, -53.50470733642578, -50.33633804321289, -47.16796875, -43.999595642089844, -40.83122634887695, -37.66285705566406, -34.49448776245117, -31.32611656188965, -28.157745361328125, -24.989376068115234, -21.821006774902344, -18.65263557434082, -15.484264373779297, -12.315902709960938, -9.14753246307373, -5.979162216186523, -2.8107919692993164, 0.3575782775878906, 3.5259485244750977, 6.694318771362305, 9.862689971923828, 13.031059265136719, 16.19942855834961, 19.367799758911133, 22.536170959472656, 25.704540252685547, 28.872909545898438, 32.041282653808594, 35.209651947021484, 38.378021240234375, 41.546390533447266, 44.714759826660156, 47.88313293457031, 51.0515022277832, 54.219871520996094, 57.38824462890625, 60.55661392211914, 63.72498321533203, 66.89335632324219, 70.06172180175781, 73.23009490966797, 76.39846801757812, 79.56683349609375, 82.7352066040039, 85.90357971191406, 89.07194519042969]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 12.0, 30.0, 55.0, 74.0, 85.0, 58.0, 39.0, 24.0, 16.0, 8.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.78057098388672, -66.1164321899414, -63.452293395996094, -60.78815460205078, -58.12401580810547, -55.459877014160156, -52.795738220214844, -50.13159942626953, -47.46746063232422, -44.803321838378906, -42.139183044433594, -39.47504425048828, -36.81090545654297, -34.146766662597656, -31.482627868652344, -28.81848907470703, -26.15435028076172, -23.490211486816406, -20.826072692871094, -18.16193389892578, -15.497795104980469, -12.833656311035156, -10.169517517089844, -7.505378723144531, -4.841239929199219, -2.1771011352539062, 0.48703765869140625, 3.1511764526367188, 5.815315246582031, 8.479454040527344, 11.143592834472656, 13.807731628417969, 16.47186279296875, 19.136001586914062, 21.800140380859375, 24.464279174804688, 27.12841796875, 29.792556762695312, 32.456695556640625, 35.12083435058594, 37.78497314453125, 40.44911193847656, 43.113250732421875, 45.77738952636719, 48.4415283203125, 51.10566711425781, 53.769805908203125, 56.43394470214844, 59.09808349609375, 61.76222229003906, 64.42636108398438, 67.09049987792969, 69.754638671875, 72.41877746582031, 75.08291625976562, 77.74705505371094, 80.41119384765625, 83.07533264160156, 85.73947143554688, 88.40361022949219, 91.0677490234375, 93.73188781738281, 96.39602661132812, 99.06016540527344, 101.72430419921875]}, "eval/loss": 0.9598673582077026, "eval/wer": 0.14415540607575847, "eval/runtime": 868.6571, "eval/samples_per_second": 3.041, "eval/steps_per_second": 0.381, "train/train_runtime": 116020.8621, "train/train_samples_per_second": 4.919, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 2.37383288616657} \ No newline at end of file +{"train/loss": 0.292, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 117345, "_timestamp": 1646778584, "_step": 17852, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 21.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 5.0, 4.0, 1.0, 2.0, 7.0, 14.0, 29.0, 30270.0, 111.0, 20.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-701.0, -687.619140625, -674.23828125, -660.857421875, -647.4765625, -634.095703125, -620.71484375, -607.333984375, -593.953125, -580.572265625, -567.19140625, -553.810546875, -540.4296875, -527.048828125, -513.66796875, -500.287109375, -486.90625, -473.525390625, -460.14453125, -446.763671875, -433.3828125, -420.001953125, -406.62109375, -393.240234375, -379.859375, -366.478515625, -353.09765625, -339.716796875, -326.3359375, -312.955078125, -299.57421875, -286.193359375, -272.8125, -259.431640625, -246.05078125, -232.669921875, -219.2890625, -205.908203125, -192.52734375, -179.146484375, -165.765625, -152.384765625, -139.00390625, -125.623046875, -112.2421875, -98.861328125, -85.48046875, -72.099609375, -58.71875, -45.337890625, -31.95703125, -18.576171875, -5.1953125, 8.185546875, 21.56640625, 34.947265625, 48.328125, 61.708984375, 75.08984375, 88.470703125, 101.8515625, 115.232421875, 128.61328125, 141.994140625, 155.375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 12.0, 8.0, 5.0, 20.0, 8.0, 20.0, 29.0, 29.0, 35.0, 42.0, 47.0, 64.0, 55.0, 58.0, 58.0, 55.0, 71.0, 52.0, 41.0, 54.0, 44.0, 29.0, 31.0, 34.0, 16.0, 26.0, 18.0, 15.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-213.13580322265625, -208.03428649902344, -202.93275451660156, -197.83123779296875, -192.72970581054688, -187.62818908691406, -182.5266571044922, -177.42514038085938, -172.3236083984375, -167.2220916748047, -162.1205596923828, -157.01904296875, -151.91751098632812, -146.8159942626953, -141.71446228027344, -136.61294555664062, -131.5114288330078, -126.40990447998047, -121.30838012695312, -116.20685577392578, -111.10533142089844, -106.00381469726562, -100.90229034423828, -95.80076599121094, -90.6992416381836, -85.59771728515625, -80.4961929321289, -75.39466857910156, -70.29315185546875, -65.19161987304688, -60.09010314941406, -54.98857879638672, -49.88706970214844, -44.785545349121094, -39.68402099609375, -34.58250045776367, -29.480976104736328, -24.379451751708984, -19.277929306030273, -14.176406860351562, -9.074882507324219, -3.9733591079711914, 1.128164291381836, 6.229687690734863, 11.33121109008789, 16.432735443115234, 21.534257888793945, 26.635780334472656, 31.7373046875, 36.838829040527344, 41.94035339355469, 47.041873931884766, 52.14339828491211, 57.24492263793945, 62.34644317626953, 67.44796752929688, 72.54949188232422, 77.65101623535156, 82.7525405883789, 87.85406494140625, 92.95558166503906, 98.05711364746094, 103.15863037109375, 108.2601547241211, 113.36167907714844]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 7.0, 7.0, 12.0, 14.0, 24.0, 10.0, 25.0, 32.0, 41.0, 31.0, 27.0, 32.0, 44.0, 45.0, 43.0, 42.0, 45.0, 47.0, 49.0, 36.0, 32.0, 32.0, 27.0, 28.0, 30.0, 33.0, 27.0, 22.0, 22.0, 21.0, 14.0, 17.0, 13.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.2356185913086, -120.41963195800781, -116.60365295410156, -112.78766632080078, -108.9716796875, -105.15570068359375, -101.33971405029297, -97.52372741699219, -93.70774841308594, -89.89176177978516, -86.0757827758789, -82.25979614257812, -78.44381713867188, -74.6278305053711, -70.81184387207031, -66.99586486816406, -63.17987823486328, -59.363895416259766, -55.54791259765625, -51.73192596435547, -47.91594314575195, -44.09996032714844, -40.283973693847656, -36.46799087524414, -32.652008056640625, -28.83602523803711, -25.02004051208496, -21.204055786132812, -17.388072967529297, -13.572090148925781, -9.756105422973633, -5.940120697021484, -2.1241378784179688, 1.6918458938598633, 5.507829666137695, 9.323813438415527, 13.13979721069336, 16.955780029296875, 20.771764755249023, 24.587749481201172, 28.403732299804688, 32.2197151184082, 36.03569793701172, 39.8516845703125, 43.667667388916016, 47.48365020751953, 51.29963684082031, 55.11561965942383, 58.931602478027344, 62.74758529663086, 66.56356811523438, 70.37955474853516, 74.19554138183594, 78.01152038574219, 81.82750701904297, 85.64349365234375, 89.45947265625, 93.27545928955078, 97.09143829345703, 100.90742492675781, 104.72340393066406, 108.53939056396484, 112.35537719726562, 116.17135620117188, 119.98734283447266]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 18.0, 25.0, 27.0, 50.0, 81.0, 145.0, 194.0, 351.0, 504.0, 780.0, 1315.0, 2016.0, 3131.0, 4959.0, 7612.0, 11577.0, 16624.0, 24222.0, 33958.0, 45803.0, 60119.0, 75042.0, 89462.0, 101695.0, 127668.0, 97477.0, 83977.0, 69542.0, 54968.0, 41591.0, 29967.0, 21211.0, 14441.0, 9894.0, 6441.0, 4196.0, 2752.0, 1717.0, 1086.0, 735.0, 434.0, 274.0, 163.0, 113.0, 77.0, 35.0, 27.0, 14.0, 14.0, 11.0, 10.0, 6.0, 3.0, 1.0, 1.0], "bins": [-404.75, -392.6015625, -380.453125, -368.3046875, -356.15625, -344.0078125, -331.859375, -319.7109375, -307.5625, -295.4140625, -283.265625, -271.1171875, -258.96875, -246.8203125, -234.671875, -222.5234375, -210.375, -198.2265625, -186.078125, -173.9296875, -161.78125, -149.6328125, -137.484375, -125.3359375, -113.1875, -101.0390625, -88.890625, -76.7421875, -64.59375, -52.4453125, -40.296875, -28.1484375, -16.0, -3.8515625, 8.296875, 20.4453125, 32.59375, 44.7421875, 56.890625, 69.0390625, 81.1875, 93.3359375, 105.484375, 117.6328125, 129.78125, 141.9296875, 154.078125, 166.2265625, 178.375, 190.5234375, 202.671875, 214.8203125, 226.96875, 239.1171875, 251.265625, 263.4140625, 275.5625, 287.7109375, 299.859375, 312.0078125, 324.15625, 336.3046875, 348.453125, 360.6015625, 372.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 6.0, 8.0, 15.0, 9.0, 12.0, 14.0, 22.0, 18.0, 33.0, 18.0, 33.0, 19.0, 43.0, 42.0, 45.0, 43.0, 41.0, 41.0, 62.0, 42.0, 41.0, 45.0, 38.0, 38.0, 33.0, 27.0, 26.0, 27.0, 24.0, 28.0, 18.0, 12.0, 15.0, 13.0, 10.0, 10.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.875, -182.82421875, -176.7734375, -170.72265625, -164.671875, -158.62109375, -152.5703125, -146.51953125, -140.46875, -134.41796875, -128.3671875, -122.31640625, -116.265625, -110.21484375, -104.1640625, -98.11328125, -92.0625, -86.01171875, -79.9609375, -73.91015625, -67.859375, -61.80859375, -55.7578125, -49.70703125, -43.65625, -37.60546875, -31.5546875, -25.50390625, -19.453125, -13.40234375, -7.3515625, -1.30078125, 4.75, 10.80078125, 16.8515625, 22.90234375, 28.953125, 35.00390625, 41.0546875, 47.10546875, 53.15625, 59.20703125, 65.2578125, 71.30859375, 77.359375, 83.41015625, 89.4609375, 95.51171875, 101.5625, 107.61328125, 113.6640625, 119.71484375, 125.765625, 131.81640625, 137.8671875, 143.91796875, 149.96875, 156.01953125, 162.0703125, 168.12109375, 174.171875, 180.22265625, 186.2734375, 192.32421875, 198.375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 3.0, 6.0, 8.0, 14.0, 19.0, 13.0, 19.0, 24.0, 44.0, 31.0, 23.0, 44.0, 41.0, 49.0, 42.0, 52.0, 54.0, 43.0, 52.0, 55.0, 45.0, 43.0, 50.0, 36.0, 32.0, 24.0, 26.0, 20.0, 14.0, 20.0, 15.0, 11.0, 12.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.77110290527344, -142.3655548095703, -137.96002197265625, -133.55447387695312, -129.14894104003906, -124.74339294433594, -120.33785247802734, -115.93231201171875, -111.52677154541016, -107.12123107910156, -102.71569061279297, -98.31015014648438, -93.90460205078125, -89.49906921386719, -85.09352111816406, -80.68798065185547, -76.28244018554688, -71.87689971923828, -67.47135925292969, -63.06581497192383, -58.660274505615234, -54.25473403930664, -49.84918975830078, -45.44364929199219, -41.038108825683594, -36.632568359375, -32.227027893066406, -27.821483612060547, -23.415943145751953, -19.01040267944336, -14.604860305786133, -10.199317932128906, -5.793792724609375, -1.3882513046264648, 3.0172901153564453, 7.4228315353393555, 11.828372955322266, 16.23391342163086, 20.639455795288086, 25.044998168945312, 29.450538635253906, 33.8560791015625, 38.261619567871094, 42.66716384887695, 47.07270431518555, 51.47824478149414, 55.8837890625, 60.289329528808594, 64.69486999511719, 69.10041046142578, 73.50595092773438, 77.91149139404297, 82.31703186035156, 86.72257995605469, 91.12812042236328, 95.53366088867188, 99.93920135498047, 104.34474182128906, 108.75028228759766, 113.15582275390625, 117.56137084960938, 121.96690368652344, 126.37245178222656, 130.77798461914062, 135.18353271484375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 7.0, 6.0, 4.0, 9.0, 6.0, 7.0, 19.0, 17.0, 10.0, 24.0, 20.0, 25.0, 19.0, 22.0, 28.0, 40.0, 37.0, 28.0, 42.0, 48.0, 45.0, 38.0, 39.0, 46.0, 39.0, 47.0, 42.0, 35.0, 41.0, 38.0, 28.0, 27.0, 30.0, 16.0, 12.0, 13.0, 12.0, 14.0, 4.0, 8.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-136.23291015625, -132.0714569091797, -127.9100112915039, -123.7485580444336, -119.58710479736328, -115.4256591796875, -111.26420593261719, -107.10275268554688, -102.94129943847656, -98.77984619140625, -94.61840057373047, -90.45694732666016, -86.29549407958984, -82.13404846191406, -77.97259521484375, -73.81114196777344, -69.64969635009766, -65.48824310302734, -61.3267936706543, -57.16534423828125, -53.00389099121094, -48.84244155883789, -44.680992126464844, -40.51953887939453, -36.358089447021484, -32.19664001464844, -28.035186767578125, -23.873737335205078, -19.7122859954834, -15.550834655761719, -11.389385223388672, -7.227933883666992, -3.0664825439453125, 1.094968318939209, 5.2564191818237305, 9.417869567871094, 13.579320907592773, 17.740772247314453, 21.9022216796875, 26.06367301940918, 30.22512435913086, 34.386573791503906, 38.54802703857422, 42.709476470947266, 46.87092590332031, 51.032379150390625, 55.19382858276367, 59.35527801513672, 63.51673126220703, 67.67818450927734, 71.83963012695312, 76.00108337402344, 80.16253662109375, 84.32398986816406, 88.48543548583984, 92.64688873291016, 96.80833435058594, 100.96978759765625, 105.13123321533203, 109.29268646240234, 113.45413970947266, 117.61558532714844, 121.77703857421875, 125.93849182128906, 130.09994506835938]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 11.0, 12.0, 18.0, 19.0, 39.0, 56.0, 104.0, 204.0, 300.0, 481.0, 816.0, 1275.0, 2071.0, 3549.0, 5819.0, 9740.0, 16663.0, 28230.0, 47989.0, 82882.0, 144040.0, 251088.0, 432745.0, 714245.0, 885607.0, 642858.0, 385436.0, 224792.0, 130596.0, 75765.0, 43935.0, 25837.0, 15019.0, 8889.0, 5280.0, 3147.0, 1873.0, 1113.0, 662.0, 431.0, 261.0, 168.0, 83.0, 48.0, 31.0, 27.0, 15.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-208.375, -201.517578125, -194.66015625, -187.802734375, -180.9453125, -174.087890625, -167.23046875, -160.373046875, -153.515625, -146.658203125, -139.80078125, -132.943359375, -126.0859375, -119.228515625, -112.37109375, -105.513671875, -98.65625, -91.798828125, -84.94140625, -78.083984375, -71.2265625, -64.369140625, -57.51171875, -50.654296875, -43.796875, -36.939453125, -30.08203125, -23.224609375, -16.3671875, -9.509765625, -2.65234375, 4.205078125, 11.0625, 17.919921875, 24.77734375, 31.634765625, 38.4921875, 45.349609375, 52.20703125, 59.064453125, 65.921875, 72.779296875, 79.63671875, 86.494140625, 93.3515625, 100.208984375, 107.06640625, 113.923828125, 120.78125, 127.638671875, 134.49609375, 141.353515625, 148.2109375, 155.068359375, 161.92578125, 168.783203125, 175.640625, 182.498046875, 189.35546875, 196.212890625, 203.0703125, 209.927734375, 216.78515625, 223.642578125, 230.5]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 9.0, 6.0, 8.0, 3.0, 6.0, 18.0, 17.0, 16.0, 10.0, 14.0, 24.0, 25.0, 30.0, 24.0, 27.0, 39.0, 48.0, 47.0, 36.0, 33.0, 41.0, 45.0, 44.0, 36.0, 41.0, 26.0, 49.0, 40.0, 35.0, 39.0, 18.0, 27.0, 28.0, 20.0, 11.0, 14.0, 12.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.0, -111.431640625, -107.86328125, -104.294921875, -100.7265625, -97.158203125, -93.58984375, -90.021484375, -86.453125, -82.884765625, -79.31640625, -75.748046875, -72.1796875, -68.611328125, -65.04296875, -61.474609375, -57.90625, -54.337890625, -50.76953125, -47.201171875, -43.6328125, -40.064453125, -36.49609375, -32.927734375, -29.359375, -25.791015625, -22.22265625, -18.654296875, -15.0859375, -11.517578125, -7.94921875, -4.380859375, -0.8125, 2.755859375, 6.32421875, 9.892578125, 13.4609375, 17.029296875, 20.59765625, 24.166015625, 27.734375, 31.302734375, 34.87109375, 38.439453125, 42.0078125, 45.576171875, 49.14453125, 52.712890625, 56.28125, 59.849609375, 63.41796875, 66.986328125, 70.5546875, 74.123046875, 77.69140625, 81.259765625, 84.828125, 88.396484375, 91.96484375, 95.533203125, 99.1015625, 102.669921875, 106.23828125, 109.806640625, 113.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 7.0, 7.0, 14.0, 16.0, 18.0, 34.0, 72.0, 121.0, 154.0, 280.0, 479.0, 819.0, 1399.0, 2416.0, 3963.0, 7097.0, 12505.0, 22166.0, 38226.0, 66934.0, 113626.0, 191997.0, 312977.0, 481061.0, 672622.0, 730343.0, 568556.0, 380966.0, 239674.0, 144990.0, 85483.0, 49339.0, 28158.0, 16106.0, 9226.0, 5097.0, 2875.0, 1788.0, 1085.0, 632.0, 344.0, 221.0, 137.0, 87.0, 54.0, 39.0, 31.0, 19.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-144.25, -139.7734375, -135.296875, -130.8203125, -126.34375, -121.8671875, -117.390625, -112.9140625, -108.4375, -103.9609375, -99.484375, -95.0078125, -90.53125, -86.0546875, -81.578125, -77.1015625, -72.625, -68.1484375, -63.671875, -59.1953125, -54.71875, -50.2421875, -45.765625, -41.2890625, -36.8125, -32.3359375, -27.859375, -23.3828125, -18.90625, -14.4296875, -9.953125, -5.4765625, -1.0, 3.4765625, 7.953125, 12.4296875, 16.90625, 21.3828125, 25.859375, 30.3359375, 34.8125, 39.2890625, 43.765625, 48.2421875, 52.71875, 57.1953125, 61.671875, 66.1484375, 70.625, 75.1015625, 79.578125, 84.0546875, 88.53125, 93.0078125, 97.484375, 101.9609375, 106.4375, 110.9140625, 115.390625, 119.8671875, 124.34375, 128.8203125, 133.296875, 137.7734375, 142.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 12.0, 12.0, 12.0, 21.0, 14.0, 22.0, 20.0, 46.0, 57.0, 62.0, 88.0, 98.0, 131.0, 117.0, 153.0, 170.0, 210.0, 266.0, 260.0, 292.0, 290.0, 244.0, 251.0, 191.0, 167.0, 145.0, 164.0, 103.0, 90.0, 80.0, 60.0, 53.0, 38.0, 38.0, 14.0, 20.0, 24.0, 7.0, 12.0, 3.0, 5.0, 0.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.21875, -56.3203125, -54.421875, -52.5234375, -50.625, -48.7265625, -46.828125, -44.9296875, -43.03125, -41.1328125, -39.234375, -37.3359375, -35.4375, -33.5390625, -31.640625, -29.7421875, -27.84375, -25.9453125, -24.046875, -22.1484375, -20.25, -18.3515625, -16.453125, -14.5546875, -12.65625, -10.7578125, -8.859375, -6.9609375, -5.0625, -3.1640625, -1.265625, 0.6328125, 2.53125, 4.4296875, 6.328125, 8.2265625, 10.125, 12.0234375, 13.921875, 15.8203125, 17.71875, 19.6171875, 21.515625, 23.4140625, 25.3125, 27.2109375, 29.109375, 31.0078125, 32.90625, 34.8046875, 36.703125, 38.6015625, 40.5, 42.3984375, 44.296875, 46.1953125, 48.09375, 49.9921875, 51.890625, 53.7890625, 55.6875, 57.5859375, 59.484375, 61.3828125, 63.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 5.0, 3.0, 8.0, 14.0, 12.0, 20.0, 20.0, 26.0, 26.0, 33.0, 31.0, 43.0, 39.0, 56.0, 50.0, 49.0, 60.0, 62.0, 62.0, 38.0, 45.0, 36.0, 44.0, 32.0, 33.0, 30.0, 24.0, 25.0, 23.0, 11.0, 8.0, 5.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-166.92550659179688, -162.397705078125, -157.86990356445312, -153.34210205078125, -148.81430053710938, -144.28648376464844, -139.75868225097656, -135.2308807373047, -130.7030792236328, -126.17527770996094, -121.64747619628906, -117.11966705322266, -112.59186553955078, -108.0640640258789, -103.5362548828125, -99.00845336914062, -94.48065185546875, -89.95285034179688, -85.425048828125, -80.8972396850586, -76.36943817138672, -71.84163665771484, -67.31382751464844, -62.78602600097656, -58.25822448730469, -53.73042297363281, -49.20261764526367, -44.67481231689453, -40.147010803222656, -35.61920928955078, -31.09140396118164, -26.563600540161133, -22.035781860351562, -17.507978439331055, -12.980175018310547, -8.452371597290039, -3.9245681762695312, 0.6032352447509766, 5.131038665771484, 9.658842086791992, 14.1866455078125, 18.714448928833008, 23.242252349853516, 27.770055770874023, 32.29785919189453, 36.825660705566406, 41.35346603393555, 45.88127136230469, 50.40907287597656, 54.93687438964844, 59.46467971801758, 63.99248504638672, 68.5202865600586, 73.04808807373047, 77.57589721679688, 82.10369873046875, 86.63150024414062, 91.1593017578125, 95.68710327148438, 100.21491241455078, 104.74271392822266, 109.27051544189453, 113.79832458496094, 118.32612609863281, 122.85392761230469]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 10.0, 9.0, 7.0, 12.0, 18.0, 13.0, 14.0, 16.0, 15.0, 35.0, 27.0, 23.0, 34.0, 24.0, 49.0, 39.0, 32.0, 42.0, 47.0, 40.0, 43.0, 32.0, 37.0, 45.0, 30.0, 41.0, 32.0, 27.0, 27.0, 34.0, 25.0, 23.0, 19.0, 10.0, 16.0, 13.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.46715545654297, -115.53140258789062, -111.59565734863281, -107.65990447998047, -103.72415161132812, -99.78840637207031, -95.85265350341797, -91.91690063476562, -87.98115539550781, -84.04540252685547, -80.10965728759766, -76.17390441894531, -72.23815155029297, -68.30239868164062, -64.36665344238281, -60.43090057373047, -56.495147705078125, -52.55939865112305, -48.6236457824707, -44.687896728515625, -40.75214385986328, -36.8163948059082, -32.880645751953125, -28.944894790649414, -25.009143829345703, -21.073392868041992, -17.13764190673828, -13.201892852783203, -9.266141891479492, -5.330390930175781, -1.3946418762207031, 2.541109085083008, 6.4768524169921875, 10.412603378295898, 14.348353385925293, 18.284103393554688, 22.2198543548584, 26.15560531616211, 30.091354370117188, 34.02710723876953, 37.96285629272461, 41.89860534667969, 45.83435821533203, 49.77010726928711, 53.70585632324219, 57.64160919189453, 61.57735824584961, 65.51310729980469, 69.44886016845703, 73.38461303710938, 77.32035827636719, 81.25611114501953, 85.19186401367188, 89.12760925292969, 93.06336212158203, 96.99911499023438, 100.93486022949219, 104.87061309814453, 108.80635833740234, 112.74211120605469, 116.67786407470703, 120.61361694335938, 124.54936218261719, 128.485107421875, 132.42086791992188]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 3.0, 8.0, 6.0, 14.0, 25.0, 46.0, 54.0, 78.0, 123.0, 170.0, 289.0, 426.0, 753.0, 1063.0, 1747.0, 2700.0, 4267.0, 6539.0, 10310.0, 16185.0, 25888.0, 41322.0, 66798.0, 106493.0, 153691.0, 177951.0, 151808.0, 104255.0, 65440.0, 40768.0, 25368.0, 15885.0, 10177.0, 6536.0, 4114.0, 2565.0, 1673.0, 1069.0, 676.0, 444.0, 298.0, 162.0, 124.0, 84.0, 51.0, 36.0, 29.0, 21.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-193.75, -187.962890625, -182.17578125, -176.388671875, -170.6015625, -164.814453125, -159.02734375, -153.240234375, -147.453125, -141.666015625, -135.87890625, -130.091796875, -124.3046875, -118.517578125, -112.73046875, -106.943359375, -101.15625, -95.369140625, -89.58203125, -83.794921875, -78.0078125, -72.220703125, -66.43359375, -60.646484375, -54.859375, -49.072265625, -43.28515625, -37.498046875, -31.7109375, -25.923828125, -20.13671875, -14.349609375, -8.5625, -2.775390625, 3.01171875, 8.798828125, 14.5859375, 20.373046875, 26.16015625, 31.947265625, 37.734375, 43.521484375, 49.30859375, 55.095703125, 60.8828125, 66.669921875, 72.45703125, 78.244140625, 84.03125, 89.818359375, 95.60546875, 101.392578125, 107.1796875, 112.966796875, 118.75390625, 124.541015625, 130.328125, 136.115234375, 141.90234375, 147.689453125, 153.4765625, 159.263671875, 165.05078125, 170.837890625, 176.625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 8.0, 4.0, 10.0, 5.0, 22.0, 23.0, 18.0, 28.0, 25.0, 22.0, 24.0, 27.0, 26.0, 30.0, 36.0, 42.0, 44.0, 42.0, 34.0, 36.0, 30.0, 44.0, 41.0, 44.0, 42.0, 40.0, 35.0, 25.0, 26.0, 25.0, 19.0, 17.0, 16.0, 16.0, 11.0, 6.0, 16.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.4375, -89.125, -85.8125, -82.5, -79.1875, -75.875, -72.5625, -69.25, -65.9375, -62.625, -59.3125, -56.0, -52.6875, -49.375, -46.0625, -42.75, -39.4375, -36.125, -32.8125, -29.5, -26.1875, -22.875, -19.5625, -16.25, -12.9375, -9.625, -6.3125, -3.0, 0.3125, 3.625, 6.9375, 10.25, 13.5625, 16.875, 20.1875, 23.5, 26.8125, 30.125, 33.4375, 36.75, 40.0625, 43.375, 46.6875, 50.0, 53.3125, 56.625, 59.9375, 63.25, 66.5625, 69.875, 73.1875, 76.5, 79.8125, 83.125, 86.4375, 89.75, 93.0625, 96.375, 99.6875, 103.0, 106.3125, 109.625, 112.9375, 116.25, 119.5625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 12.0, 20.0, 44.0, 38.0, 68.0, 96.0, 112.0, 182.0, 267.0, 360.0, 517.0, 766.0, 1233.0, 2073.0, 3145.0, 5135.0, 8740.0, 15803.0, 29857.0, 61687.0, 141734.0, 294670.0, 258318.0, 113885.0, 50816.0, 25364.0, 13497.0, 7643.0, 4415.0, 2845.0, 1700.0, 1137.0, 757.0, 506.0, 324.0, 225.0, 190.0, 87.0, 85.0, 53.0, 38.0, 32.0, 24.0, 13.0, 6.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-319.0, -308.66796875, -298.3359375, -288.00390625, -277.671875, -267.33984375, -257.0078125, -246.67578125, -236.34375, -226.01171875, -215.6796875, -205.34765625, -195.015625, -184.68359375, -174.3515625, -164.01953125, -153.6875, -143.35546875, -133.0234375, -122.69140625, -112.359375, -102.02734375, -91.6953125, -81.36328125, -71.03125, -60.69921875, -50.3671875, -40.03515625, -29.703125, -19.37109375, -9.0390625, 1.29296875, 11.625, 21.95703125, 32.2890625, 42.62109375, 52.953125, 63.28515625, 73.6171875, 83.94921875, 94.28125, 104.61328125, 114.9453125, 125.27734375, 135.609375, 145.94140625, 156.2734375, 166.60546875, 176.9375, 187.26953125, 197.6015625, 207.93359375, 218.265625, 228.59765625, 238.9296875, 249.26171875, 259.59375, 269.92578125, 280.2578125, 290.58984375, 300.921875, 311.25390625, 321.5859375, 331.91796875, 342.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 7.0, 8.0, 8.0, 14.0, 15.0, 5.0, 18.0, 12.0, 27.0, 16.0, 23.0, 27.0, 35.0, 41.0, 42.0, 39.0, 41.0, 41.0, 53.0, 44.0, 40.0, 40.0, 42.0, 27.0, 40.0, 33.0, 33.0, 30.0, 25.0, 22.0, 14.0, 22.0, 18.0, 15.0, 19.0, 9.0, 13.0, 13.0, 8.0, 5.0, 1.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -72.580078125, -70.09765625, -67.615234375, -65.1328125, -62.650390625, -60.16796875, -57.685546875, -55.203125, -52.720703125, -50.23828125, -47.755859375, -45.2734375, -42.791015625, -40.30859375, -37.826171875, -35.34375, -32.861328125, -30.37890625, -27.896484375, -25.4140625, -22.931640625, -20.44921875, -17.966796875, -15.484375, -13.001953125, -10.51953125, -8.037109375, -5.5546875, -3.072265625, -0.58984375, 1.892578125, 4.375, 6.857421875, 9.33984375, 11.822265625, 14.3046875, 16.787109375, 19.26953125, 21.751953125, 24.234375, 26.716796875, 29.19921875, 31.681640625, 34.1640625, 36.646484375, 39.12890625, 41.611328125, 44.09375, 46.576171875, 49.05859375, 51.541015625, 54.0234375, 56.505859375, 58.98828125, 61.470703125, 63.953125, 66.435546875, 68.91796875, 71.400390625, 73.8828125, 76.365234375, 78.84765625, 81.330078125, 83.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 38.0, 51.0, 73.0, 104.0, 154.0, 249.0, 368.0, 640.0, 1245.0, 3131.0, 13068.0, 101937.0, 652468.0, 240525.0, 25595.0, 5021.0, 1667.0, 825.0, 466.0, 276.0, 185.0, 114.0, 81.0, 52.0, 42.0, 26.0, 26.0, 17.0, 7.0, 7.0, 8.0, 1.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.5, -337.5, -326.5, -315.5, -304.5, -293.5, -282.5, -271.5, -260.5, -249.5, -238.5, -227.5, -216.5, -205.5, -194.5, -183.5, -172.5, -161.5, -150.5, -139.5, -128.5, -117.5, -106.5, -95.5, -84.5, -73.5, -62.5, -51.5, -40.5, -29.5, -18.5, -7.5, 3.5, 14.5, 25.5, 36.5, 47.5, 58.5, 69.5, 80.5, 91.5, 102.5, 113.5, 124.5, 135.5, 146.5, 157.5, 168.5, 179.5, 190.5, 201.5, 212.5, 223.5, 234.5, 245.5, 256.5, 267.5, 278.5, 289.5, 300.5, 311.5, 322.5, 333.5, 344.5, 355.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 9.0, 9.0, 14.0, 25.0, 26.0, 50.0, 141.0, 228.0, 214.0, 147.0, 60.0, 32.0, 14.0, 15.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224151611328125, -0.021712303161621094, -0.021009445190429688, -0.02030658721923828, -0.019603729248046875, -0.01890087127685547, -0.018198013305664062, -0.017495155334472656, -0.01679229736328125, -0.016089439392089844, -0.015386581420898438, -0.014683723449707031, -0.013980865478515625, -0.013278007507324219, -0.012575149536132812, -0.011872291564941406, -0.01116943359375, -0.010466575622558594, -0.009763717651367188, -0.009060859680175781, -0.008358001708984375, -0.007655143737792969, -0.0069522857666015625, -0.006249427795410156, -0.00554656982421875, -0.004843711853027344, -0.0041408538818359375, -0.0034379959106445312, -0.002735137939453125, -0.0020322799682617188, -0.0013294219970703125, -0.0006265640258789062, 7.62939453125e-05, 0.0007791519165039062, 0.0014820098876953125, 0.0021848678588867188, 0.002887725830078125, 0.0035905838012695312, 0.0042934417724609375, 0.004996299743652344, 0.00569915771484375, 0.006402015686035156, 0.0071048736572265625, 0.007807731628417969, 0.008510589599609375, 0.009213447570800781, 0.009916305541992188, 0.010619163513183594, 0.011322021484375, 0.012024879455566406, 0.012727737426757812, 0.013430595397949219, 0.014133453369140625, 0.014836311340332031, 0.015539169311523438, 0.016242027282714844, 0.01694488525390625, 0.017647743225097656, 0.018350601196289062, 0.01905345916748047, 0.019756317138671875, 0.02045917510986328, 0.021162033081054688, 0.021864891052246094, 0.0225677490234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 14.0, 9.0, 13.0, 38.0, 39.0, 57.0, 73.0, 77.0, 113.0, 143.0, 153.0, 237.0, 274.0, 452.0, 642.0, 962.0, 1613.0, 3250.0, 7974.0, 23796.0, 78933.0, 222650.0, 355951.0, 228150.0, 81691.0, 24898.0, 8077.0, 3357.0, 1655.0, 868.0, 595.0, 456.0, 324.0, 252.0, 198.0, 139.0, 104.0, 77.0, 53.0, 47.0, 35.0, 31.0, 20.0, 19.0, 13.0, 7.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-213.625, -207.435546875, -201.24609375, -195.056640625, -188.8671875, -182.677734375, -176.48828125, -170.298828125, -164.109375, -157.919921875, -151.73046875, -145.541015625, -139.3515625, -133.162109375, -126.97265625, -120.783203125, -114.59375, -108.404296875, -102.21484375, -96.025390625, -89.8359375, -83.646484375, -77.45703125, -71.267578125, -65.078125, -58.888671875, -52.69921875, -46.509765625, -40.3203125, -34.130859375, -27.94140625, -21.751953125, -15.5625, -9.373046875, -3.18359375, 3.005859375, 9.1953125, 15.384765625, 21.57421875, 27.763671875, 33.953125, 40.142578125, 46.33203125, 52.521484375, 58.7109375, 64.900390625, 71.08984375, 77.279296875, 83.46875, 89.658203125, 95.84765625, 102.037109375, 108.2265625, 114.416015625, 120.60546875, 126.794921875, 132.984375, 139.173828125, 145.36328125, 151.552734375, 157.7421875, 163.931640625, 170.12109375, 176.310546875, 182.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 10.0, 18.0, 24.0, 25.0, 28.0, 34.0, 53.0, 52.0, 78.0, 88.0, 71.0, 81.0, 75.0, 80.0, 53.0, 56.0, 39.0, 43.0, 14.0, 14.0, 16.0, 7.0, 6.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-60.6875, -58.99365234375, -57.2998046875, -55.60595703125, -53.912109375, -52.21826171875, -50.5244140625, -48.83056640625, -47.13671875, -45.44287109375, -43.7490234375, -42.05517578125, -40.361328125, -38.66748046875, -36.9736328125, -35.27978515625, -33.5859375, -31.89208984375, -30.1982421875, -28.50439453125, -26.810546875, -25.11669921875, -23.4228515625, -21.72900390625, -20.03515625, -18.34130859375, -16.6474609375, -14.95361328125, -13.259765625, -11.56591796875, -9.8720703125, -8.17822265625, -6.484375, -4.79052734375, -3.0966796875, -1.40283203125, 0.291015625, 1.98486328125, 3.6787109375, 5.37255859375, 7.06640625, 8.76025390625, 10.4541015625, 12.14794921875, 13.841796875, 15.53564453125, 17.2294921875, 18.92333984375, 20.6171875, 22.31103515625, 24.0048828125, 25.69873046875, 27.392578125, 29.08642578125, 30.7802734375, 32.47412109375, 34.16796875, 35.86181640625, 37.5556640625, 39.24951171875, 40.943359375, 42.63720703125, 44.3310546875, 46.02490234375, 47.71875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 16.0, 16.0, 20.0, 15.0, 21.0, 28.0, 21.0, 48.0, 33.0, 45.0, 53.0, 47.0, 42.0, 43.0, 57.0, 39.0, 47.0, 60.0, 39.0, 37.0, 45.0, 29.0, 24.0, 19.0, 33.0, 11.0, 11.0, 12.0, 12.0, 7.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-123.48811340332031, -119.9590835571289, -116.43004608154297, -112.90101623535156, -109.37197875976562, -105.84294891357422, -102.31391906738281, -98.78488159179688, -95.25584411621094, -91.72681427001953, -88.1977767944336, -84.66874694824219, -81.13970947265625, -77.61067962646484, -74.08164978027344, -70.5526123046875, -67.0235824584961, -63.49454879760742, -59.96551513671875, -56.436485290527344, -52.907447814941406, -49.37841796875, -45.84938430786133, -42.320350646972656, -38.791316986083984, -35.26228332519531, -31.73324966430664, -28.2042179107666, -24.67518424987793, -21.146150588989258, -17.61711883544922, -14.088085174560547, -10.559043884277344, -7.03001070022583, -3.5009775161743164, 0.028055191040039062, 3.557088851928711, 7.086122512817383, 10.615154266357422, 14.144187927246094, 17.673221588134766, 21.202255249023438, 24.73128890991211, 28.26032066345215, 31.78935432434082, 35.318389892578125, 38.84741973876953, 42.3764533996582, 45.905487060546875, 49.43452072143555, 52.96355438232422, 56.492584228515625, 60.02162170410156, 63.55065155029297, 67.07968139648438, 70.60871887207031, 74.13775634765625, 77.66678619384766, 81.1958236694336, 84.724853515625, 88.25389099121094, 91.78292083740234, 95.31195068359375, 98.84098815917969, 102.3700180053711]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 8.0, 6.0, 12.0, 11.0, 13.0, 16.0, 17.0, 17.0, 29.0, 29.0, 36.0, 24.0, 35.0, 35.0, 52.0, 40.0, 39.0, 43.0, 29.0, 37.0, 40.0, 43.0, 35.0, 45.0, 34.0, 37.0, 37.0, 23.0, 28.0, 24.0, 14.0, 20.0, 14.0, 15.0, 13.0, 8.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.05889129638672, -110.54922485351562, -107.03955841064453, -103.52989196777344, -100.02022552490234, -96.51055908203125, -93.00089263916016, -89.49122619628906, -85.98155975341797, -82.47189331054688, -78.96222686767578, -75.45256042480469, -71.9428939819336, -68.4332275390625, -64.9235610961914, -61.41389465332031, -57.90422439575195, -54.39455795288086, -50.884891510009766, -47.37522506713867, -43.86555862426758, -40.35588836669922, -36.846221923828125, -33.33655548095703, -29.82689094543457, -26.317224502563477, -22.807558059692383, -19.297889709472656, -15.788224220275879, -12.278556823730469, -8.768890380859375, -5.259223937988281, -1.7495574951171875, 1.7601091861724854, 5.269775867462158, 8.77944278717041, 12.289109230041504, 15.798776626586914, 19.308443069458008, 22.8181095123291, 26.327775955200195, 29.83744239807129, 33.347110748291016, 36.85677719116211, 40.3664436340332, 43.8761100769043, 47.38577651977539, 50.895442962646484, 54.40510940551758, 57.91477584838867, 61.424442291259766, 64.93411254882812, 68.44377899169922, 71.95344543457031, 75.4631118774414, 78.9727783203125, 82.4824447631836, 85.99211120605469, 89.50177764892578, 93.01144409179688, 96.52111053466797, 100.03077697753906, 103.54044342041016, 107.05010986328125, 110.55977630615234]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 10.0, 16.0, 26.0, 45.0, 67.0, 100.0, 162.0, 245.0, 415.0, 665.0, 999.0, 1570.0, 2462.0, 3730.0, 5804.0, 8949.0, 13743.0, 20482.0, 29909.0, 42420.0, 57996.0, 75721.0, 93355.0, 106658.0, 111350.0, 106843.0, 94144.0, 77013.0, 59177.0, 43402.0, 30517.0, 20662.0, 13984.0, 9234.0, 6000.0, 3825.0, 2513.0, 1558.0, 1045.0, 609.0, 388.0, 246.0, 180.0, 120.0, 83.0, 41.0, 38.0, 17.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0], "bins": [-128.5, -124.7783203125, -121.056640625, -117.3349609375, -113.61328125, -109.8916015625, -106.169921875, -102.4482421875, -98.7265625, -95.0048828125, -91.283203125, -87.5615234375, -83.83984375, -80.1181640625, -76.396484375, -72.6748046875, -68.953125, -65.2314453125, -61.509765625, -57.7880859375, -54.06640625, -50.3447265625, -46.623046875, -42.9013671875, -39.1796875, -35.4580078125, -31.736328125, -28.0146484375, -24.29296875, -20.5712890625, -16.849609375, -13.1279296875, -9.40625, -5.6845703125, -1.962890625, 1.7587890625, 5.48046875, 9.2021484375, 12.923828125, 16.6455078125, 20.3671875, 24.0888671875, 27.810546875, 31.5322265625, 35.25390625, 38.9755859375, 42.697265625, 46.4189453125, 50.140625, 53.8623046875, 57.583984375, 61.3056640625, 65.02734375, 68.7490234375, 72.470703125, 76.1923828125, 79.9140625, 83.6357421875, 87.357421875, 91.0791015625, 94.80078125, 98.5224609375, 102.244140625, 105.9658203125, 109.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 3.0, 8.0, 7.0, 3.0, 7.0, 11.0, 10.0, 20.0, 18.0, 18.0, 23.0, 27.0, 26.0, 35.0, 36.0, 36.0, 51.0, 40.0, 42.0, 35.0, 46.0, 37.0, 33.0, 44.0, 41.0, 34.0, 43.0, 33.0, 34.0, 40.0, 25.0, 21.0, 20.0, 16.0, 13.0, 13.0, 11.0, 12.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.3125, -96.953125, -93.59375, -90.234375, -86.875, -83.515625, -80.15625, -76.796875, -73.4375, -70.078125, -66.71875, -63.359375, -60.0, -56.640625, -53.28125, -49.921875, -46.5625, -43.203125, -39.84375, -36.484375, -33.125, -29.765625, -26.40625, -23.046875, -19.6875, -16.328125, -12.96875, -9.609375, -6.25, -2.890625, 0.46875, 3.828125, 7.1875, 10.546875, 13.90625, 17.265625, 20.625, 23.984375, 27.34375, 30.703125, 34.0625, 37.421875, 40.78125, 44.140625, 47.5, 50.859375, 54.21875, 57.578125, 60.9375, 64.296875, 67.65625, 71.015625, 74.375, 77.734375, 81.09375, 84.453125, 87.8125, 91.171875, 94.53125, 97.890625, 101.25, 104.609375, 107.96875, 111.328125, 114.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 6.0, 9.0, 16.0, 30.0, 57.0, 78.0, 126.0, 177.0, 329.0, 507.0, 848.0, 1282.0, 2054.0, 3007.0, 4726.0, 7360.0, 11442.0, 17330.0, 26307.0, 37483.0, 53059.0, 70238.0, 88302.0, 104195.0, 112638.0, 110688.0, 100270.0, 83339.0, 64655.0, 47858.0, 33491.0, 23198.0, 15260.0, 10139.0, 6412.0, 4179.0, 2718.0, 1725.0, 1113.0, 690.0, 468.0, 283.0, 167.0, 113.0, 75.0, 42.0, 31.0, 20.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-120.25, -116.697265625, -113.14453125, -109.591796875, -106.0390625, -102.486328125, -98.93359375, -95.380859375, -91.828125, -88.275390625, -84.72265625, -81.169921875, -77.6171875, -74.064453125, -70.51171875, -66.958984375, -63.40625, -59.853515625, -56.30078125, -52.748046875, -49.1953125, -45.642578125, -42.08984375, -38.537109375, -34.984375, -31.431640625, -27.87890625, -24.326171875, -20.7734375, -17.220703125, -13.66796875, -10.115234375, -6.5625, -3.009765625, 0.54296875, 4.095703125, 7.6484375, 11.201171875, 14.75390625, 18.306640625, 21.859375, 25.412109375, 28.96484375, 32.517578125, 36.0703125, 39.623046875, 43.17578125, 46.728515625, 50.28125, 53.833984375, 57.38671875, 60.939453125, 64.4921875, 68.044921875, 71.59765625, 75.150390625, 78.703125, 82.255859375, 85.80859375, 89.361328125, 92.9140625, 96.466796875, 100.01953125, 103.572265625, 107.125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 7.0, 17.0, 12.0, 17.0, 24.0, 27.0, 21.0, 22.0, 21.0, 36.0, 29.0, 34.0, 45.0, 41.0, 39.0, 52.0, 54.0, 45.0, 31.0, 43.0, 29.0, 42.0, 31.0, 40.0, 36.0, 23.0, 23.0, 20.0, 21.0, 15.0, 18.0, 13.0, 13.0, 8.0, 8.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.724609375, -65.38671875, -63.048828125, -60.7109375, -58.373046875, -56.03515625, -53.697265625, -51.359375, -49.021484375, -46.68359375, -44.345703125, -42.0078125, -39.669921875, -37.33203125, -34.994140625, -32.65625, -30.318359375, -27.98046875, -25.642578125, -23.3046875, -20.966796875, -18.62890625, -16.291015625, -13.953125, -11.615234375, -9.27734375, -6.939453125, -4.6015625, -2.263671875, 0.07421875, 2.412109375, 4.75, 7.087890625, 9.42578125, 11.763671875, 14.1015625, 16.439453125, 18.77734375, 21.115234375, 23.453125, 25.791015625, 28.12890625, 30.466796875, 32.8046875, 35.142578125, 37.48046875, 39.818359375, 42.15625, 44.494140625, 46.83203125, 49.169921875, 51.5078125, 53.845703125, 56.18359375, 58.521484375, 60.859375, 63.197265625, 65.53515625, 67.873046875, 70.2109375, 72.548828125, 74.88671875, 77.224609375, 79.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 12.0, 8.0, 22.0, 26.0, 46.0, 61.0, 95.0, 159.0, 248.0, 437.0, 656.0, 1043.0, 1769.0, 3079.0, 5282.0, 9518.0, 17000.0, 30473.0, 52508.0, 85355.0, 124592.0, 158090.0, 164186.0, 141159.0, 100504.0, 64472.0, 38083.0, 21639.0, 11928.0, 6684.0, 3827.0, 2181.0, 1285.0, 772.0, 463.0, 312.0, 202.0, 129.0, 76.0, 52.0, 39.0, 20.0, 32.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0], "bins": [-55.84375, -54.25732421875, -52.6708984375, -51.08447265625, -49.498046875, -47.91162109375, -46.3251953125, -44.73876953125, -43.15234375, -41.56591796875, -39.9794921875, -38.39306640625, -36.806640625, -35.22021484375, -33.6337890625, -32.04736328125, -30.4609375, -28.87451171875, -27.2880859375, -25.70166015625, -24.115234375, -22.52880859375, -20.9423828125, -19.35595703125, -17.76953125, -16.18310546875, -14.5966796875, -13.01025390625, -11.423828125, -9.83740234375, -8.2509765625, -6.66455078125, -5.078125, -3.49169921875, -1.9052734375, -0.31884765625, 1.267578125, 2.85400390625, 4.4404296875, 6.02685546875, 7.61328125, 9.19970703125, 10.7861328125, 12.37255859375, 13.958984375, 15.54541015625, 17.1318359375, 18.71826171875, 20.3046875, 21.89111328125, 23.4775390625, 25.06396484375, 26.650390625, 28.23681640625, 29.8232421875, 31.40966796875, 32.99609375, 34.58251953125, 36.1689453125, 37.75537109375, 39.341796875, 40.92822265625, 42.5146484375, 44.10107421875, 45.6875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 13.0, 10.0, 12.0, 11.0, 16.0, 30.0, 26.0, 19.0, 43.0, 24.0, 45.0, 58.0, 59.0, 50.0, 56.0, 70.0, 62.0, 46.0, 44.0, 42.0, 36.0, 42.0, 20.0, 24.0, 23.0, 29.0, 16.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.004869401454925537, -0.004714846611022949, -0.004560291767120361, -0.0044057369232177734, -0.0042511820793151855, -0.004096627235412598, -0.00394207239151001, -0.003787517547607422, -0.003632962703704834, -0.003478407859802246, -0.003323853015899658, -0.0031692981719970703, -0.0030147433280944824, -0.0028601884841918945, -0.0027056336402893066, -0.0025510787963867188, -0.002396523952484131, -0.002241969108581543, -0.002087414264678955, -0.0019328594207763672, -0.0017783045768737793, -0.0016237497329711914, -0.0014691948890686035, -0.0013146400451660156, -0.0011600852012634277, -0.0010055303573608398, -0.000850975513458252, -0.0006964206695556641, -0.0005418658256530762, -0.0003873109817504883, -0.0002327561378479004, -7.82012939453125e-05, 7.635354995727539e-05, 0.00023090839385986328, 0.00038546323776245117, 0.0005400180816650391, 0.000694572925567627, 0.0008491277694702148, 0.0010036826133728027, 0.0011582374572753906, 0.0013127923011779785, 0.0014673471450805664, 0.0016219019889831543, 0.0017764568328857422, 0.00193101167678833, 0.002085566520690918, 0.002240121364593506, 0.0023946762084960938, 0.0025492310523986816, 0.0027037858963012695, 0.0028583407402038574, 0.0030128955841064453, 0.003167450428009033, 0.003322005271911621, 0.003476560115814209, 0.003631114959716797, 0.0037856698036193848, 0.003940224647521973, 0.0040947794914245605, 0.0042493343353271484, 0.004403889179229736, 0.004558444023132324, 0.004712998867034912, 0.0048675537109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 11.0, 11.0, 15.0, 36.0, 57.0, 87.0, 137.0, 224.0, 339.0, 612.0, 945.0, 1485.0, 2461.0, 4082.0, 6315.0, 10539.0, 16916.0, 26703.0, 40596.0, 60094.0, 83482.0, 107337.0, 123756.0, 128587.0, 118232.0, 98046.0, 73392.0, 51555.0, 34181.0, 22071.0, 13922.0, 8645.0, 5290.0, 3233.0, 2011.0, 1208.0, 699.0, 495.0, 291.0, 166.0, 118.0, 61.0, 48.0, 27.0, 17.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-40.21875, -39.0458984375, -37.873046875, -36.7001953125, -35.52734375, -34.3544921875, -33.181640625, -32.0087890625, -30.8359375, -29.6630859375, -28.490234375, -27.3173828125, -26.14453125, -24.9716796875, -23.798828125, -22.6259765625, -21.453125, -20.2802734375, -19.107421875, -17.9345703125, -16.76171875, -15.5888671875, -14.416015625, -13.2431640625, -12.0703125, -10.8974609375, -9.724609375, -8.5517578125, -7.37890625, -6.2060546875, -5.033203125, -3.8603515625, -2.6875, -1.5146484375, -0.341796875, 0.8310546875, 2.00390625, 3.1767578125, 4.349609375, 5.5224609375, 6.6953125, 7.8681640625, 9.041015625, 10.2138671875, 11.38671875, 12.5595703125, 13.732421875, 14.9052734375, 16.078125, 17.2509765625, 18.423828125, 19.5966796875, 20.76953125, 21.9423828125, 23.115234375, 24.2880859375, 25.4609375, 26.6337890625, 27.806640625, 28.9794921875, 30.15234375, 31.3251953125, 32.498046875, 33.6708984375, 34.84375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 3.0, 12.0, 10.0, 11.0, 10.0, 16.0, 13.0, 20.0, 22.0, 35.0, 32.0, 38.0, 39.0, 35.0, 27.0, 42.0, 44.0, 43.0, 49.0, 52.0, 45.0, 32.0, 40.0, 36.0, 26.0, 29.0, 23.0, 35.0, 24.0, 23.0, 15.0, 16.0, 14.0, 19.0, 12.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1796875, -12.7508544921875, -12.322021484375, -11.8931884765625, -11.46435546875, -11.0355224609375, -10.606689453125, -10.1778564453125, -9.7490234375, -9.3201904296875, -8.891357421875, -8.4625244140625, -8.03369140625, -7.6048583984375, -7.176025390625, -6.7471923828125, -6.318359375, -5.8895263671875, -5.460693359375, -5.0318603515625, -4.60302734375, -4.1741943359375, -3.745361328125, -3.3165283203125, -2.8876953125, -2.4588623046875, -2.030029296875, -1.6011962890625, -1.17236328125, -0.7435302734375, -0.314697265625, 0.1141357421875, 0.54296875, 0.9718017578125, 1.400634765625, 1.8294677734375, 2.25830078125, 2.6871337890625, 3.115966796875, 3.5447998046875, 3.9736328125, 4.4024658203125, 4.831298828125, 5.2601318359375, 5.68896484375, 6.1177978515625, 6.546630859375, 6.9754638671875, 7.404296875, 7.8331298828125, 8.261962890625, 8.6907958984375, 9.11962890625, 9.5484619140625, 9.977294921875, 10.4061279296875, 10.8349609375, 11.2637939453125, 11.692626953125, 12.1214599609375, 12.55029296875, 12.9791259765625, 13.407958984375, 13.8367919921875, 14.265625]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 3.0, 6.0, 8.0, 9.0, 10.0, 20.0, 8.0, 20.0, 18.0, 20.0, 28.0, 39.0, 32.0, 41.0, 34.0, 52.0, 48.0, 33.0, 50.0, 50.0, 52.0, 32.0, 41.0, 43.0, 31.0, 25.0, 29.0, 35.0, 21.0, 23.0, 20.0, 22.0, 10.0, 13.0, 12.0, 9.0, 10.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.63424682617188, -102.45063018798828, -99.26700592041016, -96.08338928222656, -92.89977264404297, -89.71615600585938, -86.53253173828125, -83.34891510009766, -80.16529846191406, -76.98168182373047, -73.79805755615234, -70.61444091796875, -67.43082427978516, -64.24720764160156, -61.06358337402344, -57.879966735839844, -54.69634246826172, -51.51272201538086, -48.329105377197266, -45.145484924316406, -41.96186828613281, -38.77824783325195, -35.594627380371094, -32.4110107421875, -29.22739028930664, -26.043771743774414, -22.860153198242188, -19.676532745361328, -16.4929141998291, -13.309295654296875, -10.125675201416016, -6.942056655883789, -3.7584381103515625, -0.5748190879821777, 2.608799934387207, 5.79241943359375, 8.976037979125977, 12.159656524658203, 15.343276977539062, 18.52689552307129, 21.710514068603516, 24.894132614135742, 28.07775115966797, 31.261371612548828, 34.44499206542969, 37.62860870361328, 40.81222915649414, 43.995849609375, 47.179466247558594, 50.36308670043945, 53.54670333862305, 56.730323791503906, 59.9139404296875, 63.09756088256836, 66.28118133544922, 69.46479797363281, 72.64842224121094, 75.83203887939453, 79.01566314697266, 82.19927978515625, 85.38289642333984, 88.56651306152344, 91.75013732910156, 94.93375396728516, 98.11737060546875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 9.0, 4.0, 15.0, 8.0, 10.0, 5.0, 23.0, 17.0, 27.0, 34.0, 24.0, 28.0, 29.0, 37.0, 25.0, 33.0, 42.0, 42.0, 48.0, 39.0, 45.0, 47.0, 49.0, 34.0, 36.0, 25.0, 35.0, 33.0, 25.0, 28.0, 11.0, 22.0, 19.0, 20.0, 13.0, 8.0, 11.0, 6.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-103.10801696777344, -99.7562484741211, -96.40447998046875, -93.0527114868164, -89.70094299316406, -86.34918212890625, -82.9974136352539, -79.64564514160156, -76.29387664794922, -72.94210815429688, -69.59033966064453, -66.23857116699219, -62.88680648803711, -59.535037994384766, -56.18327331542969, -52.831504821777344, -49.479736328125, -46.127967834472656, -42.77619934082031, -39.424434661865234, -36.07266616821289, -32.72089767456055, -29.369131088256836, -26.017364501953125, -22.66559600830078, -19.313827514648438, -15.962060928344727, -12.6102933883667, -9.258525848388672, -5.906757354736328, -2.554990768432617, 0.7967758178710938, 4.148536682128906, 7.500304222106934, 10.852071762084961, 14.203839302062988, 17.555606842041016, 20.90737533569336, 24.25914192199707, 27.61090850830078, 30.962677001953125, 34.31444549560547, 37.66621398925781, 41.01797866821289, 44.369747161865234, 47.72151565551758, 51.073280334472656, 54.425048828125, 57.776817321777344, 61.12858581542969, 64.48035430908203, 67.83212280273438, 71.18388366699219, 74.53565979003906, 77.88742065429688, 81.23918914794922, 84.59095764160156, 87.9427261352539, 91.29449462890625, 94.6462631225586, 97.99803161621094, 101.34979248046875, 104.7015609741211, 108.05332946777344, 111.40509796142578]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 18.0, 16.0, 42.0, 55.0, 82.0, 124.0, 205.0, 284.0, 506.0, 839.0, 1201.0, 1915.0, 3001.0, 4740.0, 7415.0, 11432.0, 18164.0, 28515.0, 45302.0, 72567.0, 116309.0, 186892.0, 301315.0, 479835.0, 685372.0, 728753.0, 553730.0, 359369.0, 222573.0, 137114.0, 84601.0, 53004.0, 33094.0, 20608.0, 12945.0, 8387.0, 5061.0, 3299.0, 2095.0, 1281.0, 884.0, 483.0, 296.0, 198.0, 128.0, 74.0, 69.0, 31.0, 24.0, 12.0, 9.0, 5.0, 0.0, 2.0, 5.0], "bins": [-126.5, -122.7978515625, -119.095703125, -115.3935546875, -111.69140625, -107.9892578125, -104.287109375, -100.5849609375, -96.8828125, -93.1806640625, -89.478515625, -85.7763671875, -82.07421875, -78.3720703125, -74.669921875, -70.9677734375, -67.265625, -63.5634765625, -59.861328125, -56.1591796875, -52.45703125, -48.7548828125, -45.052734375, -41.3505859375, -37.6484375, -33.9462890625, -30.244140625, -26.5419921875, -22.83984375, -19.1376953125, -15.435546875, -11.7333984375, -8.03125, -4.3291015625, -0.626953125, 3.0751953125, 6.77734375, 10.4794921875, 14.181640625, 17.8837890625, 21.5859375, 25.2880859375, 28.990234375, 32.6923828125, 36.39453125, 40.0966796875, 43.798828125, 47.5009765625, 51.203125, 54.9052734375, 58.607421875, 62.3095703125, 66.01171875, 69.7138671875, 73.416015625, 77.1181640625, 80.8203125, 84.5224609375, 88.224609375, 91.9267578125, 95.62890625, 99.3310546875, 103.033203125, 106.7353515625, 110.4375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 7.0, 7.0, 7.0, 14.0, 7.0, 8.0, 19.0, 19.0, 25.0, 24.0, 23.0, 31.0, 31.0, 19.0, 40.0, 38.0, 27.0, 37.0, 37.0, 44.0, 49.0, 41.0, 43.0, 51.0, 40.0, 33.0, 29.0, 35.0, 31.0, 28.0, 22.0, 25.0, 11.0, 19.0, 12.0, 9.0, 9.0, 12.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.3154296875, -73.880859375, -71.4462890625, -69.01171875, -66.5771484375, -64.142578125, -61.7080078125, -59.2734375, -56.8388671875, -54.404296875, -51.9697265625, -49.53515625, -47.1005859375, -44.666015625, -42.2314453125, -39.796875, -37.3623046875, -34.927734375, -32.4931640625, -30.05859375, -27.6240234375, -25.189453125, -22.7548828125, -20.3203125, -17.8857421875, -15.451171875, -13.0166015625, -10.58203125, -8.1474609375, -5.712890625, -3.2783203125, -0.84375, 1.5908203125, 4.025390625, 6.4599609375, 8.89453125, 11.3291015625, 13.763671875, 16.1982421875, 18.6328125, 21.0673828125, 23.501953125, 25.9365234375, 28.37109375, 30.8056640625, 33.240234375, 35.6748046875, 38.109375, 40.5439453125, 42.978515625, 45.4130859375, 47.84765625, 50.2822265625, 52.716796875, 55.1513671875, 57.5859375, 60.0205078125, 62.455078125, 64.8896484375, 67.32421875, 69.7587890625, 72.193359375, 74.6279296875, 77.0625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 5.0, 15.0, 12.0, 17.0, 41.0, 61.0, 100.0, 147.0, 213.0, 379.0, 598.0, 894.0, 1312.0, 2177.0, 3169.0, 4970.0, 7807.0, 12269.0, 19277.0, 29765.0, 45658.0, 70772.0, 108606.0, 162912.0, 240745.0, 342966.0, 458233.0, 554155.0, 559100.0, 470688.0, 353240.0, 250162.0, 170511.0, 113501.0, 74304.0, 48075.0, 31156.0, 20133.0, 12762.0, 8481.0, 5268.0, 3437.0, 2309.0, 1345.0, 860.0, 566.0, 411.0, 267.0, 165.0, 95.0, 70.0, 40.0, 22.0, 15.0, 19.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-76.125, -73.75, -71.375, -69.0, -66.625, -64.25, -61.875, -59.5, -57.125, -54.75, -52.375, -50.0, -47.625, -45.25, -42.875, -40.5, -38.125, -35.75, -33.375, -31.0, -28.625, -26.25, -23.875, -21.5, -19.125, -16.75, -14.375, -12.0, -9.625, -7.25, -4.875, -2.5, -0.125, 2.25, 4.625, 7.0, 9.375, 11.75, 14.125, 16.5, 18.875, 21.25, 23.625, 26.0, 28.375, 30.75, 33.125, 35.5, 37.875, 40.25, 42.625, 45.0, 47.375, 49.75, 52.125, 54.5, 56.875, 59.25, 61.625, 64.0, 66.375, 68.75, 71.125, 73.5, 75.875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 11.0, 6.0, 6.0, 10.0, 13.0, 14.0, 15.0, 35.0, 27.0, 33.0, 43.0, 40.0, 60.0, 69.0, 85.0, 95.0, 128.0, 157.0, 175.0, 186.0, 221.0, 214.0, 247.0, 260.0, 236.0, 214.0, 191.0, 155.0, 163.0, 166.0, 126.0, 115.0, 107.0, 81.0, 78.0, 64.0, 34.0, 37.0, 35.0, 33.0, 26.0, 17.0, 15.0, 8.0, 5.0, 6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.1875, -36.017578125, -34.84765625, -33.677734375, -32.5078125, -31.337890625, -30.16796875, -28.998046875, -27.828125, -26.658203125, -25.48828125, -24.318359375, -23.1484375, -21.978515625, -20.80859375, -19.638671875, -18.46875, -17.298828125, -16.12890625, -14.958984375, -13.7890625, -12.619140625, -11.44921875, -10.279296875, -9.109375, -7.939453125, -6.76953125, -5.599609375, -4.4296875, -3.259765625, -2.08984375, -0.919921875, 0.25, 1.419921875, 2.58984375, 3.759765625, 4.9296875, 6.099609375, 7.26953125, 8.439453125, 9.609375, 10.779296875, 11.94921875, 13.119140625, 14.2890625, 15.458984375, 16.62890625, 17.798828125, 18.96875, 20.138671875, 21.30859375, 22.478515625, 23.6484375, 24.818359375, 25.98828125, 27.158203125, 28.328125, 29.498046875, 30.66796875, 31.837890625, 33.0078125, 34.177734375, 35.34765625, 36.517578125, 37.6875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 6.0, 7.0, 3.0, 14.0, 9.0, 6.0, 11.0, 24.0, 23.0, 30.0, 33.0, 28.0, 34.0, 33.0, 48.0, 56.0, 55.0, 40.0, 48.0, 58.0, 49.0, 66.0, 46.0, 32.0, 40.0, 28.0, 23.0, 29.0, 28.0, 20.0, 29.0, 5.0, 10.0, 7.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-107.5115966796875, -104.39836883544922, -101.28514099121094, -98.17191314697266, -95.05868530273438, -91.9454574584961, -88.83222961425781, -85.718994140625, -82.60577392578125, -79.49254608154297, -76.37931823730469, -73.2660903930664, -70.15286254882812, -67.03963470458984, -63.9264030456543, -60.813175201416016, -57.69994354248047, -54.58671569824219, -51.473487854003906, -48.360260009765625, -45.247032165527344, -42.13380432128906, -39.020572662353516, -35.907344818115234, -32.79411697387695, -29.680889129638672, -26.56766128540039, -23.454431533813477, -20.341203689575195, -17.227975845336914, -14.11474609375, -11.001518249511719, -7.888282775878906, -4.775054454803467, -1.6618261337280273, 1.4514026641845703, 4.564630508422852, 7.677858352661133, 10.791088104248047, 13.904315948486328, 17.01754379272461, 20.13077163696289, 23.243999481201172, 26.357229232788086, 29.470457077026367, 32.58368682861328, 35.69691467285156, 38.810142517089844, 41.923370361328125, 45.036598205566406, 48.14982604980469, 51.26305389404297, 54.37628173828125, 57.48950958251953, 60.60274124145508, 63.71596908569336, 66.82919311523438, 69.94242095947266, 73.05564880371094, 76.16887664794922, 79.2821044921875, 82.39533233642578, 85.50856018066406, 88.62179565429688, 91.73502349853516]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 17.0, 9.0, 12.0, 18.0, 20.0, 15.0, 21.0, 28.0, 23.0, 29.0, 44.0, 26.0, 36.0, 27.0, 39.0, 38.0, 38.0, 41.0, 45.0, 52.0, 44.0, 35.0, 38.0, 36.0, 25.0, 36.0, 25.0, 23.0, 20.0, 10.0, 21.0, 19.0, 16.0, 12.0, 12.0, 6.0, 9.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.69476318359375, -85.98043060302734, -83.26609802246094, -80.55176544189453, -77.83743286132812, -75.12310028076172, -72.40876770019531, -69.69444274902344, -66.9801025390625, -64.2657699584961, -61.55143737792969, -58.83710479736328, -56.122772216796875, -53.40843963623047, -50.69411087036133, -47.97977828979492, -45.26544952392578, -42.551116943359375, -39.83678436279297, -37.12245178222656, -34.408119201660156, -31.693788528442383, -28.97945785522461, -26.265125274658203, -23.550792694091797, -20.83646011352539, -18.122127532958984, -15.407796859741211, -12.693464279174805, -9.979131698608398, -7.264801025390625, -4.550468444824219, -1.8361358642578125, 0.8781962394714355, 3.5925283432006836, 6.306859970092773, 9.02119255065918, 11.735525131225586, 14.44985580444336, 17.164188385009766, 19.878520965576172, 22.592853546142578, 25.307186126708984, 28.021516799926758, 30.735849380493164, 33.45018005371094, 36.164512634277344, 38.87884521484375, 41.593177795410156, 44.30751037597656, 47.02184295654297, 49.736175537109375, 52.45050811767578, 55.16484069824219, 57.87916946411133, 60.593502044677734, 63.30783462524414, 66.02216339111328, 68.73649597167969, 71.4508285522461, 74.1651611328125, 76.8794937133789, 79.59382629394531, 82.30815887451172, 85.02249145507812]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 8.0, 13.0, 10.0, 18.0, 24.0, 40.0, 75.0, 110.0, 162.0, 237.0, 319.0, 533.0, 775.0, 1206.0, 1866.0, 2795.0, 4185.0, 6224.0, 9631.0, 14216.0, 21871.0, 32120.0, 45296.0, 63159.0, 83099.0, 101993.0, 114397.0, 116141.0, 106513.0, 89964.0, 70189.0, 51239.0, 36426.0, 24771.0, 16721.0, 11045.0, 7268.0, 4724.0, 3102.0, 2070.0, 1365.0, 881.0, 558.0, 384.0, 272.0, 183.0, 137.0, 75.0, 50.0, 34.0, 20.0, 12.0, 12.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0], "bins": [-144.5, -140.0078125, -135.515625, -131.0234375, -126.53125, -122.0390625, -117.546875, -113.0546875, -108.5625, -104.0703125, -99.578125, -95.0859375, -90.59375, -86.1015625, -81.609375, -77.1171875, -72.625, -68.1328125, -63.640625, -59.1484375, -54.65625, -50.1640625, -45.671875, -41.1796875, -36.6875, -32.1953125, -27.703125, -23.2109375, -18.71875, -14.2265625, -9.734375, -5.2421875, -0.75, 3.7421875, 8.234375, 12.7265625, 17.21875, 21.7109375, 26.203125, 30.6953125, 35.1875, 39.6796875, 44.171875, 48.6640625, 53.15625, 57.6484375, 62.140625, 66.6328125, 71.125, 75.6171875, 80.109375, 84.6015625, 89.09375, 93.5859375, 98.078125, 102.5703125, 107.0625, 111.5546875, 116.046875, 120.5390625, 125.03125, 129.5234375, 134.015625, 138.5078125, 143.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 6.0, 7.0, 16.0, 16.0, 11.0, 21.0, 20.0, 24.0, 17.0, 27.0, 30.0, 30.0, 33.0, 38.0, 27.0, 30.0, 35.0, 53.0, 49.0, 49.0, 45.0, 40.0, 43.0, 37.0, 37.0, 26.0, 22.0, 27.0, 22.0, 19.0, 22.0, 18.0, 18.0, 15.0, 13.0, 11.0, 8.0, 12.0, 6.0, 2.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.875, -53.9306640625, -51.986328125, -50.0419921875, -48.09765625, -46.1533203125, -44.208984375, -42.2646484375, -40.3203125, -38.3759765625, -36.431640625, -34.4873046875, -32.54296875, -30.5986328125, -28.654296875, -26.7099609375, -24.765625, -22.8212890625, -20.876953125, -18.9326171875, -16.98828125, -15.0439453125, -13.099609375, -11.1552734375, -9.2109375, -7.2666015625, -5.322265625, -3.3779296875, -1.43359375, 0.5107421875, 2.455078125, 4.3994140625, 6.34375, 8.2880859375, 10.232421875, 12.1767578125, 14.12109375, 16.0654296875, 18.009765625, 19.9541015625, 21.8984375, 23.8427734375, 25.787109375, 27.7314453125, 29.67578125, 31.6201171875, 33.564453125, 35.5087890625, 37.453125, 39.3974609375, 41.341796875, 43.2861328125, 45.23046875, 47.1748046875, 49.119140625, 51.0634765625, 53.0078125, 54.9521484375, 56.896484375, 58.8408203125, 60.78515625, 62.7294921875, 64.673828125, 66.6181640625, 68.5625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 13.0, 14.0, 25.0, 25.0, 56.0, 78.0, 113.0, 154.0, 215.0, 333.0, 455.0, 683.0, 1003.0, 1581.0, 2488.0, 3983.0, 6339.0, 10862.0, 19018.0, 34540.0, 63644.0, 116296.0, 194703.0, 227364.0, 160084.0, 90650.0, 49290.0, 26208.0, 14921.0, 8748.0, 5227.0, 3234.0, 2094.0, 1320.0, 883.0, 603.0, 385.0, 276.0, 186.0, 130.0, 110.0, 57.0, 57.0, 23.0, 25.0, 16.0, 18.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-253.625, -246.005859375, -238.38671875, -230.767578125, -223.1484375, -215.529296875, -207.91015625, -200.291015625, -192.671875, -185.052734375, -177.43359375, -169.814453125, -162.1953125, -154.576171875, -146.95703125, -139.337890625, -131.71875, -124.099609375, -116.48046875, -108.861328125, -101.2421875, -93.623046875, -86.00390625, -78.384765625, -70.765625, -63.146484375, -55.52734375, -47.908203125, -40.2890625, -32.669921875, -25.05078125, -17.431640625, -9.8125, -2.193359375, 5.42578125, 13.044921875, 20.6640625, 28.283203125, 35.90234375, 43.521484375, 51.140625, 58.759765625, 66.37890625, 73.998046875, 81.6171875, 89.236328125, 96.85546875, 104.474609375, 112.09375, 119.712890625, 127.33203125, 134.951171875, 142.5703125, 150.189453125, 157.80859375, 165.427734375, 173.046875, 180.666015625, 188.28515625, 195.904296875, 203.5234375, 211.142578125, 218.76171875, 226.380859375, 234.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 10.0, 17.0, 11.0, 10.0, 17.0, 19.0, 25.0, 16.0, 32.0, 24.0, 33.0, 28.0, 24.0, 33.0, 37.0, 38.0, 42.0, 45.0, 41.0, 42.0, 39.0, 44.0, 38.0, 36.0, 34.0, 35.0, 33.0, 22.0, 19.0, 13.0, 13.0, 25.0, 15.0, 18.0, 13.0, 11.0, 7.0, 4.0, 6.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.375, -44.8154296875, -43.255859375, -41.6962890625, -40.13671875, -38.5771484375, -37.017578125, -35.4580078125, -33.8984375, -32.3388671875, -30.779296875, -29.2197265625, -27.66015625, -26.1005859375, -24.541015625, -22.9814453125, -21.421875, -19.8623046875, -18.302734375, -16.7431640625, -15.18359375, -13.6240234375, -12.064453125, -10.5048828125, -8.9453125, -7.3857421875, -5.826171875, -4.2666015625, -2.70703125, -1.1474609375, 0.412109375, 1.9716796875, 3.53125, 5.0908203125, 6.650390625, 8.2099609375, 9.76953125, 11.3291015625, 12.888671875, 14.4482421875, 16.0078125, 17.5673828125, 19.126953125, 20.6865234375, 22.24609375, 23.8056640625, 25.365234375, 26.9248046875, 28.484375, 30.0439453125, 31.603515625, 33.1630859375, 34.72265625, 36.2822265625, 37.841796875, 39.4013671875, 40.9609375, 42.5205078125, 44.080078125, 45.6396484375, 47.19921875, 48.7587890625, 50.318359375, 51.8779296875, 53.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 7.0, 11.0, 21.0, 31.0, 48.0, 66.0, 79.0, 110.0, 178.0, 247.0, 385.0, 568.0, 896.0, 1382.0, 2158.0, 3533.0, 5699.0, 10460.0, 21792.0, 58661.0, 205606.0, 466803.0, 174912.0, 50860.0, 19762.0, 9685.0, 5517.0, 3273.0, 2040.0, 1283.0, 846.0, 531.0, 340.0, 239.0, 151.0, 106.0, 80.0, 56.0, 36.0, 24.0, 23.0, 8.0, 7.0, 7.0, 4.0, 5.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-245.25, -237.44921875, -229.6484375, -221.84765625, -214.046875, -206.24609375, -198.4453125, -190.64453125, -182.84375, -175.04296875, -167.2421875, -159.44140625, -151.640625, -143.83984375, -136.0390625, -128.23828125, -120.4375, -112.63671875, -104.8359375, -97.03515625, -89.234375, -81.43359375, -73.6328125, -65.83203125, -58.03125, -50.23046875, -42.4296875, -34.62890625, -26.828125, -19.02734375, -11.2265625, -3.42578125, 4.375, 12.17578125, 19.9765625, 27.77734375, 35.578125, 43.37890625, 51.1796875, 58.98046875, 66.78125, 74.58203125, 82.3828125, 90.18359375, 97.984375, 105.78515625, 113.5859375, 121.38671875, 129.1875, 136.98828125, 144.7890625, 152.58984375, 160.390625, 168.19140625, 175.9921875, 183.79296875, 191.59375, 199.39453125, 207.1953125, 214.99609375, 222.796875, 230.59765625, 238.3984375, 246.19921875, 254.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 10.0, 15.0, 11.0, 24.0, 31.0, 34.0, 56.0, 60.0, 94.0, 99.0, 100.0, 103.0, 98.0, 57.0, 50.0, 36.0, 32.0, 13.0, 12.0, 10.0, 4.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0230712890625, -0.02243518829345703, -0.021799087524414062, -0.021162986755371094, -0.020526885986328125, -0.019890785217285156, -0.019254684448242188, -0.01861858367919922, -0.01798248291015625, -0.01734638214111328, -0.016710281372070312, -0.016074180603027344, -0.015438079833984375, -0.014801979064941406, -0.014165878295898438, -0.013529777526855469, -0.0128936767578125, -0.012257575988769531, -0.011621475219726562, -0.010985374450683594, -0.010349273681640625, -0.009713172912597656, -0.009077072143554688, -0.008440971374511719, -0.00780487060546875, -0.007168769836425781, -0.0065326690673828125, -0.005896568298339844, -0.005260467529296875, -0.004624366760253906, -0.0039882659912109375, -0.0033521652221679688, -0.002716064453125, -0.0020799636840820312, -0.0014438629150390625, -0.0008077621459960938, -0.000171661376953125, 0.00046443939208984375, 0.0011005401611328125, 0.0017366409301757812, 0.00237274169921875, 0.0030088424682617188, 0.0036449432373046875, 0.004281044006347656, 0.004917144775390625, 0.005553245544433594, 0.0061893463134765625, 0.006825447082519531, 0.0074615478515625, 0.008097648620605469, 0.008733749389648438, 0.009369850158691406, 0.010005950927734375, 0.010642051696777344, 0.011278152465820312, 0.011914253234863281, 0.01255035400390625, 0.013186454772949219, 0.013822555541992188, 0.014458656311035156, 0.015094757080078125, 0.015730857849121094, 0.016366958618164062, 0.01700305938720703, 0.01763916015625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 18.0, 16.0, 35.0, 36.0, 69.0, 95.0, 127.0, 184.0, 259.0, 387.0, 544.0, 768.0, 1225.0, 1772.0, 2759.0, 4394.0, 7298.0, 13809.0, 30660.0, 79612.0, 211850.0, 344514.0, 206924.0, 78026.0, 29707.0, 13659.0, 7199.0, 4261.0, 2768.0, 1750.0, 1282.0, 758.0, 531.0, 385.0, 266.0, 174.0, 135.0, 84.0, 59.0, 42.0, 39.0, 19.0, 15.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-147.75, -143.337890625, -138.92578125, -134.513671875, -130.1015625, -125.689453125, -121.27734375, -116.865234375, -112.453125, -108.041015625, -103.62890625, -99.216796875, -94.8046875, -90.392578125, -85.98046875, -81.568359375, -77.15625, -72.744140625, -68.33203125, -63.919921875, -59.5078125, -55.095703125, -50.68359375, -46.271484375, -41.859375, -37.447265625, -33.03515625, -28.623046875, -24.2109375, -19.798828125, -15.38671875, -10.974609375, -6.5625, -2.150390625, 2.26171875, 6.673828125, 11.0859375, 15.498046875, 19.91015625, 24.322265625, 28.734375, 33.146484375, 37.55859375, 41.970703125, 46.3828125, 50.794921875, 55.20703125, 59.619140625, 64.03125, 68.443359375, 72.85546875, 77.267578125, 81.6796875, 86.091796875, 90.50390625, 94.916015625, 99.328125, 103.740234375, 108.15234375, 112.564453125, 116.9765625, 121.388671875, 125.80078125, 130.212890625, 134.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 6.0, 13.0, 28.0, 38.0, 66.0, 84.0, 116.0, 128.0, 126.0, 106.0, 67.0, 66.0, 35.0, 28.0, 18.0, 9.0, 11.0, 5.0, 3.0, 1.0, 2.0, 8.0, 1.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.53125, -60.6923828125, -58.853515625, -57.0146484375, -55.17578125, -53.3369140625, -51.498046875, -49.6591796875, -47.8203125, -45.9814453125, -44.142578125, -42.3037109375, -40.46484375, -38.6259765625, -36.787109375, -34.9482421875, -33.109375, -31.2705078125, -29.431640625, -27.5927734375, -25.75390625, -23.9150390625, -22.076171875, -20.2373046875, -18.3984375, -16.5595703125, -14.720703125, -12.8818359375, -11.04296875, -9.2041015625, -7.365234375, -5.5263671875, -3.6875, -1.8486328125, -0.009765625, 1.8291015625, 3.66796875, 5.5068359375, 7.345703125, 9.1845703125, 11.0234375, 12.8623046875, 14.701171875, 16.5400390625, 18.37890625, 20.2177734375, 22.056640625, 23.8955078125, 25.734375, 27.5732421875, 29.412109375, 31.2509765625, 33.08984375, 34.9287109375, 36.767578125, 38.6064453125, 40.4453125, 42.2841796875, 44.123046875, 45.9619140625, 47.80078125, 49.6396484375, 51.478515625, 53.3173828125, 55.15625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 11.0, 13.0, 13.0, 15.0, 16.0, 20.0, 20.0, 31.0, 33.0, 27.0, 36.0, 57.0, 37.0, 51.0, 49.0, 46.0, 40.0, 50.0, 45.0, 55.0, 33.0, 43.0, 32.0, 30.0, 21.0, 26.0, 21.0, 20.0, 12.0, 14.0, 11.0, 5.0, 7.0, 14.0, 1.0, 3.0, 9.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.33639526367188, -70.1641845703125, -67.99197387695312, -65.81976318359375, -63.647552490234375, -61.475341796875, -59.30312728881836, -57.130916595458984, -54.95870590209961, -52.786495208740234, -50.61428451538086, -48.442073822021484, -46.269859313964844, -44.09764862060547, -41.925437927246094, -39.75322723388672, -37.581016540527344, -35.40880584716797, -33.236595153808594, -31.064382553100586, -28.89217185974121, -26.719961166381836, -24.547748565673828, -22.375537872314453, -20.203327178955078, -18.031116485595703, -15.858904838562012, -13.68669319152832, -11.514482498168945, -9.34227180480957, -7.170060157775879, -4.9978485107421875, -2.8256454467773438, -0.6534342765808105, 1.5187768936157227, 3.690988063812256, 5.863199234008789, 8.035409927368164, 10.207621574401855, 12.379833221435547, 14.552043914794922, 16.724254608154297, 18.896465301513672, 21.06867790222168, 23.240888595581055, 25.41309928894043, 27.585311889648438, 29.757522583007812, 31.929733276367188, 34.10194396972656, 36.27415466308594, 38.44636535644531, 40.61857604980469, 42.79078674316406, 44.9630012512207, 47.13521194458008, 49.30742263793945, 51.47963333129883, 53.6518440246582, 55.82405471801758, 57.99626922607422, 60.168479919433594, 62.34069061279297, 64.51290130615234, 66.68511199951172]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 6.0, 12.0, 13.0, 12.0, 14.0, 25.0, 20.0, 18.0, 24.0, 27.0, 31.0, 32.0, 27.0, 33.0, 42.0, 32.0, 41.0, 45.0, 48.0, 43.0, 40.0, 37.0, 33.0, 36.0, 26.0, 32.0, 34.0, 28.0, 19.0, 28.0, 21.0, 12.0, 16.0, 17.0, 22.0, 9.0, 8.0, 6.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-74.7188720703125, -72.49765014648438, -70.27642822265625, -68.05520629882812, -65.833984375, -63.612762451171875, -61.391536712646484, -59.17031478881836, -56.949092864990234, -54.72787094116211, -52.506649017333984, -50.28542709350586, -48.06420135498047, -45.842979431152344, -43.62175750732422, -41.400535583496094, -39.17931365966797, -36.958091735839844, -34.73686981201172, -32.515647888183594, -30.294424057006836, -28.07320213317871, -25.851978302001953, -23.630756378173828, -21.409534454345703, -19.188312530517578, -16.967090606689453, -14.745866775512695, -12.52464485168457, -10.303422927856445, -8.082200050354004, -5.8609771728515625, -3.6397552490234375, -1.4185328483581543, 0.8026895523071289, 3.023911952972412, 5.245134353637695, 7.46635627746582, 9.687579154968262, 11.908802032470703, 14.130023956298828, 16.351245880126953, 18.572467803955078, 20.793691635131836, 23.01491355895996, 25.236135482788086, 27.457359313964844, 29.67858123779297, 31.899803161621094, 34.12102508544922, 36.342247009277344, 38.56346893310547, 40.784690856933594, 43.00591278076172, 45.22713851928711, 47.448360443115234, 49.66958236694336, 51.890804290771484, 54.11202621459961, 56.333248138427734, 58.554473876953125, 60.77569580078125, 62.996917724609375, 65.2181396484375, 67.43936157226562]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 12.0, 24.0, 38.0, 56.0, 78.0, 118.0, 186.0, 297.0, 453.0, 709.0, 1081.0, 1822.0, 3001.0, 4544.0, 7477.0, 11655.0, 18677.0, 28747.0, 43543.0, 63891.0, 89948.0, 116111.0, 133377.0, 133466.0, 115317.0, 89295.0, 63516.0, 43298.0, 28446.0, 18325.0, 11753.0, 7213.0, 4430.0, 2819.0, 1817.0, 1094.0, 727.0, 438.0, 253.0, 161.0, 121.0, 80.0, 61.0, 24.0, 22.0, 14.0, 6.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-61.3125, -59.267578125, -57.22265625, -55.177734375, -53.1328125, -51.087890625, -49.04296875, -46.998046875, -44.953125, -42.908203125, -40.86328125, -38.818359375, -36.7734375, -34.728515625, -32.68359375, -30.638671875, -28.59375, -26.548828125, -24.50390625, -22.458984375, -20.4140625, -18.369140625, -16.32421875, -14.279296875, -12.234375, -10.189453125, -8.14453125, -6.099609375, -4.0546875, -2.009765625, 0.03515625, 2.080078125, 4.125, 6.169921875, 8.21484375, 10.259765625, 12.3046875, 14.349609375, 16.39453125, 18.439453125, 20.484375, 22.529296875, 24.57421875, 26.619140625, 28.6640625, 30.708984375, 32.75390625, 34.798828125, 36.84375, 38.888671875, 40.93359375, 42.978515625, 45.0234375, 47.068359375, 49.11328125, 51.158203125, 53.203125, 55.248046875, 57.29296875, 59.337890625, 61.3828125, 63.427734375, 65.47265625, 67.517578125, 69.5625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 6.0, 11.0, 6.0, 17.0, 15.0, 14.0, 22.0, 20.0, 18.0, 27.0, 30.0, 31.0, 31.0, 41.0, 48.0, 41.0, 44.0, 39.0, 43.0, 50.0, 42.0, 50.0, 36.0, 33.0, 39.0, 30.0, 26.0, 31.0, 24.0, 12.0, 18.0, 19.0, 15.0, 14.0, 14.0, 9.0, 9.0, 5.0, 5.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.625, -70.4365234375, -68.248046875, -66.0595703125, -63.87109375, -61.6826171875, -59.494140625, -57.3056640625, -55.1171875, -52.9287109375, -50.740234375, -48.5517578125, -46.36328125, -44.1748046875, -41.986328125, -39.7978515625, -37.609375, -35.4208984375, -33.232421875, -31.0439453125, -28.85546875, -26.6669921875, -24.478515625, -22.2900390625, -20.1015625, -17.9130859375, -15.724609375, -13.5361328125, -11.34765625, -9.1591796875, -6.970703125, -4.7822265625, -2.59375, -0.4052734375, 1.783203125, 3.9716796875, 6.16015625, 8.3486328125, 10.537109375, 12.7255859375, 14.9140625, 17.1025390625, 19.291015625, 21.4794921875, 23.66796875, 25.8564453125, 28.044921875, 30.2333984375, 32.421875, 34.6103515625, 36.798828125, 38.9873046875, 41.17578125, 43.3642578125, 45.552734375, 47.7412109375, 49.9296875, 52.1181640625, 54.306640625, 56.4951171875, 58.68359375, 60.8720703125, 63.060546875, 65.2490234375, 67.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 11.0, 15.0, 20.0, 35.0, 37.0, 46.0, 96.0, 130.0, 186.0, 331.0, 433.0, 593.0, 969.0, 1316.0, 1964.0, 2848.0, 4191.0, 6259.0, 9320.0, 14155.0, 21104.0, 31531.0, 46057.0, 66168.0, 92208.0, 118402.0, 134560.0, 129536.0, 107743.0, 80742.0, 57574.0, 39456.0, 26401.0, 17748.0, 11854.0, 7807.0, 5331.0, 3657.0, 2418.0, 1649.0, 1176.0, 791.0, 508.0, 373.0, 267.0, 177.0, 128.0, 75.0, 49.0, 39.0, 28.0, 12.0, 6.0, 11.0, 3.0, 2.0, 2.0, 3.0], "bins": [-79.125, -76.7119140625, -74.298828125, -71.8857421875, -69.47265625, -67.0595703125, -64.646484375, -62.2333984375, -59.8203125, -57.4072265625, -54.994140625, -52.5810546875, -50.16796875, -47.7548828125, -45.341796875, -42.9287109375, -40.515625, -38.1025390625, -35.689453125, -33.2763671875, -30.86328125, -28.4501953125, -26.037109375, -23.6240234375, -21.2109375, -18.7978515625, -16.384765625, -13.9716796875, -11.55859375, -9.1455078125, -6.732421875, -4.3193359375, -1.90625, 0.5068359375, 2.919921875, 5.3330078125, 7.74609375, 10.1591796875, 12.572265625, 14.9853515625, 17.3984375, 19.8115234375, 22.224609375, 24.6376953125, 27.05078125, 29.4638671875, 31.876953125, 34.2900390625, 36.703125, 39.1162109375, 41.529296875, 43.9423828125, 46.35546875, 48.7685546875, 51.181640625, 53.5947265625, 56.0078125, 58.4208984375, 60.833984375, 63.2470703125, 65.66015625, 68.0732421875, 70.486328125, 72.8994140625, 75.3125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 11.0, 10.0, 12.0, 18.0, 15.0, 15.0, 22.0, 24.0, 28.0, 29.0, 39.0, 30.0, 36.0, 32.0, 35.0, 38.0, 39.0, 41.0, 28.0, 41.0, 40.0, 56.0, 32.0, 30.0, 31.0, 33.0, 29.0, 26.0, 21.0, 22.0, 17.0, 17.0, 18.0, 8.0, 9.0, 9.0, 10.0, 3.0, 2.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-57.59375, -55.91259765625, -54.2314453125, -52.55029296875, -50.869140625, -49.18798828125, -47.5068359375, -45.82568359375, -44.14453125, -42.46337890625, -40.7822265625, -39.10107421875, -37.419921875, -35.73876953125, -34.0576171875, -32.37646484375, -30.6953125, -29.01416015625, -27.3330078125, -25.65185546875, -23.970703125, -22.28955078125, -20.6083984375, -18.92724609375, -17.24609375, -15.56494140625, -13.8837890625, -12.20263671875, -10.521484375, -8.84033203125, -7.1591796875, -5.47802734375, -3.796875, -2.11572265625, -0.4345703125, 1.24658203125, 2.927734375, 4.60888671875, 6.2900390625, 7.97119140625, 9.65234375, 11.33349609375, 13.0146484375, 14.69580078125, 16.376953125, 18.05810546875, 19.7392578125, 21.42041015625, 23.1015625, 24.78271484375, 26.4638671875, 28.14501953125, 29.826171875, 31.50732421875, 33.1884765625, 34.86962890625, 36.55078125, 38.23193359375, 39.9130859375, 41.59423828125, 43.275390625, 44.95654296875, 46.6376953125, 48.31884765625, 50.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 5.0, 4.0, 9.0, 7.0, 15.0, 28.0, 32.0, 49.0, 52.0, 88.0, 148.0, 197.0, 287.0, 406.0, 529.0, 843.0, 1275.0, 1832.0, 2737.0, 3984.0, 6319.0, 9915.0, 16671.0, 28621.0, 51787.0, 97416.0, 172311.0, 229689.0, 183586.0, 105237.0, 55843.0, 30232.0, 17689.0, 10731.0, 6636.0, 4281.0, 2955.0, 1965.0, 1332.0, 851.0, 606.0, 413.0, 271.0, 200.0, 145.0, 100.0, 69.0, 52.0, 33.0, 26.0, 26.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.9375, -69.4189453125, -66.900390625, -64.3818359375, -61.86328125, -59.3447265625, -56.826171875, -54.3076171875, -51.7890625, -49.2705078125, -46.751953125, -44.2333984375, -41.71484375, -39.1962890625, -36.677734375, -34.1591796875, -31.640625, -29.1220703125, -26.603515625, -24.0849609375, -21.56640625, -19.0478515625, -16.529296875, -14.0107421875, -11.4921875, -8.9736328125, -6.455078125, -3.9365234375, -1.41796875, 1.1005859375, 3.619140625, 6.1376953125, 8.65625, 11.1748046875, 13.693359375, 16.2119140625, 18.73046875, 21.2490234375, 23.767578125, 26.2861328125, 28.8046875, 31.3232421875, 33.841796875, 36.3603515625, 38.87890625, 41.3974609375, 43.916015625, 46.4345703125, 48.953125, 51.4716796875, 53.990234375, 56.5087890625, 59.02734375, 61.5458984375, 64.064453125, 66.5830078125, 69.1015625, 71.6201171875, 74.138671875, 76.6572265625, 79.17578125, 81.6943359375, 84.212890625, 86.7314453125, 89.25]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 6.0, 8.0, 10.0, 5.0, 14.0, 22.0, 32.0, 48.0, 59.0, 87.0, 96.0, 126.0, 113.0, 93.0, 77.0, 58.0, 38.0, 34.0, 17.0, 11.0, 7.0, 12.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01236724853515625, -0.011964917182922363, -0.011562585830688477, -0.01116025447845459, -0.010757923126220703, -0.010355591773986816, -0.00995326042175293, -0.009550929069519043, -0.009148597717285156, -0.00874626636505127, -0.008343935012817383, -0.007941603660583496, -0.007539272308349609, -0.007136940956115723, -0.006734609603881836, -0.006332278251647949, -0.0059299468994140625, -0.005527615547180176, -0.005125284194946289, -0.004722952842712402, -0.004320621490478516, -0.003918290138244629, -0.003515958786010742, -0.0031136274337768555, -0.0027112960815429688, -0.002308964729309082, -0.0019066333770751953, -0.0015043020248413086, -0.0011019706726074219, -0.0006996393203735352, -0.00029730796813964844, 0.00010502338409423828, 0.000507354736328125, 0.0009096860885620117, 0.0013120174407958984, 0.0017143487930297852, 0.002116680145263672, 0.0025190114974975586, 0.0029213428497314453, 0.003323674201965332, 0.0037260055541992188, 0.0041283369064331055, 0.004530668258666992, 0.004932999610900879, 0.005335330963134766, 0.005737662315368652, 0.006139993667602539, 0.006542325019836426, 0.0069446563720703125, 0.007346987724304199, 0.007749319076538086, 0.008151650428771973, 0.00855398178100586, 0.008956313133239746, 0.009358644485473633, 0.00976097583770752, 0.010163307189941406, 0.010565638542175293, 0.01096796989440918, 0.011370301246643066, 0.011772632598876953, 0.01217496395111084, 0.012577295303344727, 0.012979626655578613, 0.0133819580078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 15.0, 8.0, 13.0, 19.0, 29.0, 40.0, 64.0, 83.0, 109.0, 187.0, 242.0, 371.0, 544.0, 843.0, 1214.0, 1889.0, 2840.0, 4486.0, 7143.0, 11606.0, 18710.0, 31895.0, 54584.0, 96629.0, 158445.0, 207203.0, 177132.0, 112300.0, 64831.0, 37063.0, 21812.0, 13054.0, 8234.0, 5100.0, 3349.0, 2167.0, 1425.0, 954.0, 659.0, 390.0, 260.0, 174.0, 137.0, 95.0, 73.0, 36.0, 31.0, 29.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-69.6875, -67.552734375, -65.41796875, -63.283203125, -61.1484375, -59.013671875, -56.87890625, -54.744140625, -52.609375, -50.474609375, -48.33984375, -46.205078125, -44.0703125, -41.935546875, -39.80078125, -37.666015625, -35.53125, -33.396484375, -31.26171875, -29.126953125, -26.9921875, -24.857421875, -22.72265625, -20.587890625, -18.453125, -16.318359375, -14.18359375, -12.048828125, -9.9140625, -7.779296875, -5.64453125, -3.509765625, -1.375, 0.759765625, 2.89453125, 5.029296875, 7.1640625, 9.298828125, 11.43359375, 13.568359375, 15.703125, 17.837890625, 19.97265625, 22.107421875, 24.2421875, 26.376953125, 28.51171875, 30.646484375, 32.78125, 34.916015625, 37.05078125, 39.185546875, 41.3203125, 43.455078125, 45.58984375, 47.724609375, 49.859375, 51.994140625, 54.12890625, 56.263671875, 58.3984375, 60.533203125, 62.66796875, 64.802734375, 66.9375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 6.0, 4.0, 16.0, 12.0, 10.0, 19.0, 16.0, 22.0, 24.0, 24.0, 38.0, 43.0, 49.0, 54.0, 63.0, 68.0, 64.0, 58.0, 59.0, 52.0, 45.0, 43.0, 48.0, 25.0, 26.0, 19.0, 25.0, 11.0, 11.0, 9.0, 9.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.75, -22.947998046875, -22.14599609375, -21.343994140625, -20.5419921875, -19.739990234375, -18.93798828125, -18.135986328125, -17.333984375, -16.531982421875, -15.72998046875, -14.927978515625, -14.1259765625, -13.323974609375, -12.52197265625, -11.719970703125, -10.91796875, -10.115966796875, -9.31396484375, -8.511962890625, -7.7099609375, -6.907958984375, -6.10595703125, -5.303955078125, -4.501953125, -3.699951171875, -2.89794921875, -2.095947265625, -1.2939453125, -0.491943359375, 0.31005859375, 1.112060546875, 1.9140625, 2.716064453125, 3.51806640625, 4.320068359375, 5.1220703125, 5.924072265625, 6.72607421875, 7.528076171875, 8.330078125, 9.132080078125, 9.93408203125, 10.736083984375, 11.5380859375, 12.340087890625, 13.14208984375, 13.944091796875, 14.74609375, 15.548095703125, 16.35009765625, 17.152099609375, 17.9541015625, 18.756103515625, 19.55810546875, 20.360107421875, 21.162109375, 21.964111328125, 22.76611328125, 23.568115234375, 24.3701171875, 25.172119140625, 25.97412109375, 26.776123046875, 27.578125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 7.0, 9.0, 11.0, 14.0, 14.0, 24.0, 23.0, 28.0, 24.0, 29.0, 28.0, 39.0, 37.0, 46.0, 41.0, 44.0, 45.0, 53.0, 50.0, 42.0, 40.0, 34.0, 36.0, 28.0, 33.0, 26.0, 30.0, 23.0, 28.0, 23.0, 15.0, 17.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.84236907958984, -68.74482727050781, -66.64729309082031, -64.54975128173828, -62.452213287353516, -60.35467529296875, -58.25713348388672, -56.15959548950195, -54.06205749511719, -51.96451950073242, -49.86697769165039, -47.769439697265625, -45.67190170288086, -43.574363708496094, -41.47682189941406, -39.3792839050293, -37.281742095947266, -35.1842041015625, -33.08666229248047, -30.989124298095703, -28.891586303710938, -26.79404640197754, -24.69650650024414, -22.598968505859375, -20.501428604125977, -18.403888702392578, -16.306350708007812, -14.208810806274414, -12.111271858215332, -10.01373291015625, -7.916193008422852, -5.8186540603637695, -3.7211151123046875, -1.6235759258270264, 0.47396326065063477, 2.571502685546875, 4.669041633605957, 6.766580581665039, 8.864120483398438, 10.96165943145752, 13.059198379516602, 15.156737327575684, 17.254276275634766, 19.351816177368164, 21.449356079101562, 23.546894073486328, 25.644433975219727, 27.741973876953125, 29.83951187133789, 31.93705177307129, 34.03459167480469, 36.13212966918945, 38.22966766357422, 40.32720947265625, 42.424747467041016, 44.52228546142578, 46.61982727050781, 48.71736526489258, 50.81490707397461, 52.912445068359375, 55.00998306274414, 57.107521057128906, 59.20506286621094, 61.3026008605957, 63.40013885498047]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 6.0, 0.0, 3.0, 4.0, 8.0, 10.0, 14.0, 11.0, 15.0, 17.0, 18.0, 25.0, 31.0, 36.0, 21.0, 32.0, 36.0, 35.0, 38.0, 48.0, 35.0, 35.0, 48.0, 50.0, 40.0, 31.0, 41.0, 31.0, 35.0, 32.0, 24.0, 21.0, 37.0, 16.0, 22.0, 14.0, 15.0, 8.0, 13.0, 12.0, 6.0, 11.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-82.25519561767578, -79.89909362792969, -77.5429916381836, -75.1868896484375, -72.83078002929688, -70.47467803955078, -68.11857604980469, -65.7624740600586, -63.4063720703125, -61.050270080566406, -58.69416427612305, -56.33806228637695, -53.98196029663086, -51.6258544921875, -49.269752502441406, -46.91365051269531, -44.55754470825195, -42.20144271850586, -39.8453369140625, -37.489234924316406, -35.13313293457031, -32.77703094482422, -30.42092514038086, -28.064823150634766, -25.70871925354004, -23.352615356445312, -20.99651336669922, -18.640409469604492, -16.284305572509766, -13.928203582763672, -11.572099685668945, -9.215997695922852, -6.859893798828125, -4.503790855407715, -2.1476874351501465, 0.20841598510742188, 2.564518928527832, 4.920621871948242, 7.276725769042969, 9.632827758789062, 11.988931655883789, 14.3450345993042, 16.70113754272461, 19.057241439819336, 21.413345336914062, 23.769447326660156, 26.125551223754883, 28.481653213500977, 30.837757110595703, 33.1938591003418, 35.549964904785156, 37.90606689453125, 40.262168884277344, 42.61827087402344, 44.9743766784668, 47.33047866821289, 49.68658447265625, 52.042686462402344, 54.3987922668457, 56.7548942565918, 59.11099624633789, 61.46710205078125, 63.823204040527344, 66.17930603027344, 68.53540802001953]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 8.0, 9.0, 15.0, 28.0, 34.0, 55.0, 94.0, 144.0, 299.0, 537.0, 910.0, 1701.0, 3022.0, 5942.0, 11319.0, 22160.0, 44759.0, 92201.0, 196775.0, 425776.0, 817788.0, 1052723.0, 774938.0, 392618.0, 181550.0, 85167.0, 41000.0, 20661.0, 10382.0, 5406.0, 2776.0, 1512.0, 829.0, 459.0, 295.0, 143.0, 94.0, 50.0, 40.0, 26.0, 13.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.6875, -84.1708984375, -81.654296875, -79.1376953125, -76.62109375, -74.1044921875, -71.587890625, -69.0712890625, -66.5546875, -64.0380859375, -61.521484375, -59.0048828125, -56.48828125, -53.9716796875, -51.455078125, -48.9384765625, -46.421875, -43.9052734375, -41.388671875, -38.8720703125, -36.35546875, -33.8388671875, -31.322265625, -28.8056640625, -26.2890625, -23.7724609375, -21.255859375, -18.7392578125, -16.22265625, -13.7060546875, -11.189453125, -8.6728515625, -6.15625, -3.6396484375, -1.123046875, 1.3935546875, 3.91015625, 6.4267578125, 8.943359375, 11.4599609375, 13.9765625, 16.4931640625, 19.009765625, 21.5263671875, 24.04296875, 26.5595703125, 29.076171875, 31.5927734375, 34.109375, 36.6259765625, 39.142578125, 41.6591796875, 44.17578125, 46.6923828125, 49.208984375, 51.7255859375, 54.2421875, 56.7587890625, 59.275390625, 61.7919921875, 64.30859375, 66.8251953125, 69.341796875, 71.8583984375, 74.375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 16.0, 18.0, 21.0, 21.0, 22.0, 20.0, 28.0, 30.0, 35.0, 46.0, 47.0, 39.0, 32.0, 27.0, 47.0, 49.0, 47.0, 30.0, 39.0, 48.0, 35.0, 24.0, 28.0, 35.0, 26.0, 23.0, 25.0, 18.0, 21.0, 10.0, 11.0, 13.0, 10.0, 9.0, 8.0, 3.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-65.0625, -63.27490234375, -61.4873046875, -59.69970703125, -57.912109375, -56.12451171875, -54.3369140625, -52.54931640625, -50.76171875, -48.97412109375, -47.1865234375, -45.39892578125, -43.611328125, -41.82373046875, -40.0361328125, -38.24853515625, -36.4609375, -34.67333984375, -32.8857421875, -31.09814453125, -29.310546875, -27.52294921875, -25.7353515625, -23.94775390625, -22.16015625, -20.37255859375, -18.5849609375, -16.79736328125, -15.009765625, -13.22216796875, -11.4345703125, -9.64697265625, -7.859375, -6.07177734375, -4.2841796875, -2.49658203125, -0.708984375, 1.07861328125, 2.8662109375, 4.65380859375, 6.44140625, 8.22900390625, 10.0166015625, 11.80419921875, 13.591796875, 15.37939453125, 17.1669921875, 18.95458984375, 20.7421875, 22.52978515625, 24.3173828125, 26.10498046875, 27.892578125, 29.68017578125, 31.4677734375, 33.25537109375, 35.04296875, 36.83056640625, 38.6181640625, 40.40576171875, 42.193359375, 43.98095703125, 45.7685546875, 47.55615234375, 49.34375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 11.0, 14.0, 22.0, 45.0, 57.0, 128.0, 212.0, 392.0, 697.0, 1231.0, 2222.0, 4284.0, 7743.0, 14628.0, 27537.0, 52178.0, 98188.0, 182586.0, 330433.0, 552318.0, 778712.0, 792791.0, 579803.0, 350044.0, 195364.0, 104400.0, 55414.0, 29086.0, 15386.0, 8341.0, 4481.0, 2457.0, 1365.0, 729.0, 424.0, 230.0, 141.0, 85.0, 40.0, 22.0, 11.0, 11.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-75.5625, -73.40673828125, -71.2509765625, -69.09521484375, -66.939453125, -64.78369140625, -62.6279296875, -60.47216796875, -58.31640625, -56.16064453125, -54.0048828125, -51.84912109375, -49.693359375, -47.53759765625, -45.3818359375, -43.22607421875, -41.0703125, -38.91455078125, -36.7587890625, -34.60302734375, -32.447265625, -30.29150390625, -28.1357421875, -25.97998046875, -23.82421875, -21.66845703125, -19.5126953125, -17.35693359375, -15.201171875, -13.04541015625, -10.8896484375, -8.73388671875, -6.578125, -4.42236328125, -2.2666015625, -0.11083984375, 2.044921875, 4.20068359375, 6.3564453125, 8.51220703125, 10.66796875, 12.82373046875, 14.9794921875, 17.13525390625, 19.291015625, 21.44677734375, 23.6025390625, 25.75830078125, 27.9140625, 30.06982421875, 32.2255859375, 34.38134765625, 36.537109375, 38.69287109375, 40.8486328125, 43.00439453125, 45.16015625, 47.31591796875, 49.4716796875, 51.62744140625, 53.783203125, 55.93896484375, 58.0947265625, 60.25048828125, 62.40625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 8.0, 13.0, 9.0, 31.0, 28.0, 30.0, 38.0, 50.0, 52.0, 68.0, 92.0, 111.0, 142.0, 154.0, 169.0, 194.0, 199.0, 239.0, 284.0, 257.0, 274.0, 237.0, 208.0, 193.0, 176.0, 174.0, 127.0, 123.0, 70.0, 70.0, 52.0, 48.0, 34.0, 29.0, 20.0, 13.0, 13.0, 11.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.140625, -27.32080078125, -26.5009765625, -25.68115234375, -24.861328125, -24.04150390625, -23.2216796875, -22.40185546875, -21.58203125, -20.76220703125, -19.9423828125, -19.12255859375, -18.302734375, -17.48291015625, -16.6630859375, -15.84326171875, -15.0234375, -14.20361328125, -13.3837890625, -12.56396484375, -11.744140625, -10.92431640625, -10.1044921875, -9.28466796875, -8.46484375, -7.64501953125, -6.8251953125, -6.00537109375, -5.185546875, -4.36572265625, -3.5458984375, -2.72607421875, -1.90625, -1.08642578125, -0.2666015625, 0.55322265625, 1.373046875, 2.19287109375, 3.0126953125, 3.83251953125, 4.65234375, 5.47216796875, 6.2919921875, 7.11181640625, 7.931640625, 8.75146484375, 9.5712890625, 10.39111328125, 11.2109375, 12.03076171875, 12.8505859375, 13.67041015625, 14.490234375, 15.31005859375, 16.1298828125, 16.94970703125, 17.76953125, 18.58935546875, 19.4091796875, 20.22900390625, 21.048828125, 21.86865234375, 22.6884765625, 23.50830078125, 24.328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 9.0, 10.0, 11.0, 12.0, 18.0, 19.0, 26.0, 36.0, 31.0, 28.0, 37.0, 43.0, 35.0, 45.0, 48.0, 57.0, 49.0, 60.0, 43.0, 49.0, 45.0, 45.0, 36.0, 40.0, 32.0, 19.0, 28.0, 17.0, 12.0, 10.0, 13.0, 3.0, 13.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.50790023803711, -59.4245719909668, -57.341243743896484, -55.257911682128906, -53.174583435058594, -51.09125518798828, -49.00792694091797, -46.924598693847656, -44.841270446777344, -42.75794219970703, -40.67461395263672, -38.591285705566406, -36.50795364379883, -34.424625396728516, -32.3412971496582, -30.25796890258789, -28.174636840820312, -26.09130859375, -24.007978439331055, -21.924650192260742, -19.841320037841797, -17.757991790771484, -15.674663543701172, -13.591334342956543, -11.508005142211914, -9.424675941467285, -7.3413472175598145, -5.258018493652344, -3.174689292907715, -1.091360092163086, 0.9919681549072266, 3.0752973556518555, 5.158622741699219, 7.241951942443848, 9.325281143188477, 11.408609390258789, 13.491938591003418, 15.575267791748047, 17.65859603881836, 19.741924285888672, 21.825254440307617, 23.90858268737793, 25.991912841796875, 28.075241088867188, 30.1585693359375, 32.24189758300781, 34.325225830078125, 36.4085578918457, 38.491886138916016, 40.57521438598633, 42.65854263305664, 44.74187469482422, 46.82520294189453, 48.908531188964844, 50.991859436035156, 53.07518768310547, 55.15851593017578, 57.241844177246094, 59.325172424316406, 61.40850067138672, 63.4918327331543, 65.57516479492188, 67.65849304199219, 69.7418212890625, 71.82514953613281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 5.0, 7.0, 5.0, 7.0, 16.0, 11.0, 8.0, 15.0, 26.0, 29.0, 28.0, 24.0, 38.0, 38.0, 36.0, 34.0, 41.0, 38.0, 38.0, 35.0, 36.0, 41.0, 40.0, 29.0, 33.0, 39.0, 31.0, 37.0, 23.0, 38.0, 22.0, 13.0, 19.0, 19.0, 14.0, 6.0, 14.0, 12.0, 9.0, 6.0, 3.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-71.58344268798828, -69.53543853759766, -67.48743438720703, -65.43943786621094, -63.39143371582031, -61.34342956542969, -59.29542541503906, -57.24742126464844, -55.19942092895508, -53.15141677856445, -51.103416442871094, -49.05541229248047, -47.007408142089844, -44.959407806396484, -42.91140365600586, -40.8634033203125, -38.815399169921875, -36.76739501953125, -34.71939468383789, -32.671390533447266, -30.623388290405273, -28.57538604736328, -26.527381896972656, -24.479379653930664, -22.431377410888672, -20.38337516784668, -18.335372924804688, -16.287368774414062, -14.23936653137207, -12.191364288330078, -10.14336109161377, -8.095357894897461, -6.047351837158203, -3.9993491172790527, -1.9513463973999023, 0.09665632247924805, 2.1446590423583984, 4.192661285400391, 6.240664482116699, 8.288667678833008, 10.336669921875, 12.384672164916992, 14.4326753616333, 16.48067855834961, 18.5286808013916, 20.576683044433594, 22.62468719482422, 24.67268943786621, 26.720691680908203, 28.768693923950195, 30.816696166992188, 32.86470031738281, 34.91270446777344, 36.9607048034668, 39.00870895385742, 41.05670928955078, 43.104713439941406, 45.15271759033203, 47.20071792602539, 49.248722076416016, 51.296722412109375, 53.3447265625, 55.392730712890625, 57.44073486328125, 59.48873519897461]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 6.0, 14.0, 10.0, 18.0, 25.0, 35.0, 52.0, 75.0, 109.0, 149.0, 202.0, 326.0, 461.0, 686.0, 1141.0, 1852.0, 2952.0, 4841.0, 8641.0, 14481.0, 25283.0, 45857.0, 81637.0, 143225.0, 212320.0, 203014.0, 130139.0, 73959.0, 41175.0, 23126.0, 13162.0, 7566.0, 4505.0, 2699.0, 1664.0, 990.0, 693.0, 486.0, 307.0, 212.0, 143.0, 105.0, 56.0, 41.0, 43.0, 11.0, 16.0, 8.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-212.375, -205.921875, -199.46875, -193.015625, -186.5625, -180.109375, -173.65625, -167.203125, -160.75, -154.296875, -147.84375, -141.390625, -134.9375, -128.484375, -122.03125, -115.578125, -109.125, -102.671875, -96.21875, -89.765625, -83.3125, -76.859375, -70.40625, -63.953125, -57.5, -51.046875, -44.59375, -38.140625, -31.6875, -25.234375, -18.78125, -12.328125, -5.875, 0.578125, 7.03125, 13.484375, 19.9375, 26.390625, 32.84375, 39.296875, 45.75, 52.203125, 58.65625, 65.109375, 71.5625, 78.015625, 84.46875, 90.921875, 97.375, 103.828125, 110.28125, 116.734375, 123.1875, 129.640625, 136.09375, 142.546875, 149.0, 155.453125, 161.90625, 168.359375, 174.8125, 181.265625, 187.71875, 194.171875, 200.625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 14.0, 14.0, 26.0, 23.0, 23.0, 27.0, 34.0, 44.0, 37.0, 35.0, 41.0, 37.0, 27.0, 46.0, 44.0, 33.0, 39.0, 42.0, 37.0, 29.0, 32.0, 21.0, 35.0, 30.0, 22.0, 21.0, 13.0, 22.0, 17.0, 10.0, 12.0, 6.0, 6.0, 8.0, 6.0, 8.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.28125, -57.58837890625, -55.8955078125, -54.20263671875, -52.509765625, -50.81689453125, -49.1240234375, -47.43115234375, -45.73828125, -44.04541015625, -42.3525390625, -40.65966796875, -38.966796875, -37.27392578125, -35.5810546875, -33.88818359375, -32.1953125, -30.50244140625, -28.8095703125, -27.11669921875, -25.423828125, -23.73095703125, -22.0380859375, -20.34521484375, -18.65234375, -16.95947265625, -15.2666015625, -13.57373046875, -11.880859375, -10.18798828125, -8.4951171875, -6.80224609375, -5.109375, -3.41650390625, -1.7236328125, -0.03076171875, 1.662109375, 3.35498046875, 5.0478515625, 6.74072265625, 8.43359375, 10.12646484375, 11.8193359375, 13.51220703125, 15.205078125, 16.89794921875, 18.5908203125, 20.28369140625, 21.9765625, 23.66943359375, 25.3623046875, 27.05517578125, 28.748046875, 30.44091796875, 32.1337890625, 33.82666015625, 35.51953125, 37.21240234375, 38.9052734375, 40.59814453125, 42.291015625, 43.98388671875, 45.6767578125, 47.36962890625, 49.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 6.0, 1.0, 11.0, 12.0, 18.0, 22.0, 38.0, 53.0, 91.0, 123.0, 159.0, 266.0, 379.0, 608.0, 980.0, 1598.0, 2556.0, 4200.0, 7067.0, 12334.0, 22326.0, 41958.0, 82661.0, 170457.0, 279383.0, 206331.0, 101843.0, 50639.0, 26649.0, 14676.0, 8306.0, 4893.0, 2781.0, 1814.0, 1109.0, 764.0, 479.0, 295.0, 213.0, 138.0, 100.0, 70.0, 38.0, 36.0, 27.0, 11.0, 15.0, 12.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-225.125, -218.43359375, -211.7421875, -205.05078125, -198.359375, -191.66796875, -184.9765625, -178.28515625, -171.59375, -164.90234375, -158.2109375, -151.51953125, -144.828125, -138.13671875, -131.4453125, -124.75390625, -118.0625, -111.37109375, -104.6796875, -97.98828125, -91.296875, -84.60546875, -77.9140625, -71.22265625, -64.53125, -57.83984375, -51.1484375, -44.45703125, -37.765625, -31.07421875, -24.3828125, -17.69140625, -11.0, -4.30859375, 2.3828125, 9.07421875, 15.765625, 22.45703125, 29.1484375, 35.83984375, 42.53125, 49.22265625, 55.9140625, 62.60546875, 69.296875, 75.98828125, 82.6796875, 89.37109375, 96.0625, 102.75390625, 109.4453125, 116.13671875, 122.828125, 129.51953125, 136.2109375, 142.90234375, 149.59375, 156.28515625, 162.9765625, 169.66796875, 176.359375, 183.05078125, 189.7421875, 196.43359375, 203.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 9.0, 12.0, 13.0, 12.0, 21.0, 17.0, 32.0, 24.0, 27.0, 41.0, 38.0, 47.0, 39.0, 39.0, 48.0, 43.0, 46.0, 52.0, 46.0, 46.0, 35.0, 51.0, 44.0, 32.0, 27.0, 20.0, 20.0, 22.0, 17.0, 10.0, 11.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.75, -61.7626953125, -59.775390625, -57.7880859375, -55.80078125, -53.8134765625, -51.826171875, -49.8388671875, -47.8515625, -45.8642578125, -43.876953125, -41.8896484375, -39.90234375, -37.9150390625, -35.927734375, -33.9404296875, -31.953125, -29.9658203125, -27.978515625, -25.9912109375, -24.00390625, -22.0166015625, -20.029296875, -18.0419921875, -16.0546875, -14.0673828125, -12.080078125, -10.0927734375, -8.10546875, -6.1181640625, -4.130859375, -2.1435546875, -0.15625, 1.8310546875, 3.818359375, 5.8056640625, 7.79296875, 9.7802734375, 11.767578125, 13.7548828125, 15.7421875, 17.7294921875, 19.716796875, 21.7041015625, 23.69140625, 25.6787109375, 27.666015625, 29.6533203125, 31.640625, 33.6279296875, 35.615234375, 37.6025390625, 39.58984375, 41.5771484375, 43.564453125, 45.5517578125, 47.5390625, 49.5263671875, 51.513671875, 53.5009765625, 55.48828125, 57.4755859375, 59.462890625, 61.4501953125, 63.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 8.0, 9.0, 12.0, 16.0, 27.0, 35.0, 44.0, 66.0, 85.0, 121.0, 173.0, 290.0, 415.0, 585.0, 963.0, 1503.0, 2504.0, 4149.0, 7397.0, 14005.0, 27936.0, 60832.0, 150946.0, 348750.0, 247563.0, 95088.0, 40846.0, 19754.0, 10286.0, 5613.0, 3126.0, 1888.0, 1164.0, 739.0, 501.0, 331.0, 236.0, 136.0, 124.0, 79.0, 57.0, 41.0, 29.0, 29.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0], "bins": [-150.25, -145.9267578125, -141.603515625, -137.2802734375, -132.95703125, -128.6337890625, -124.310546875, -119.9873046875, -115.6640625, -111.3408203125, -107.017578125, -102.6943359375, -98.37109375, -94.0478515625, -89.724609375, -85.4013671875, -81.078125, -76.7548828125, -72.431640625, -68.1083984375, -63.78515625, -59.4619140625, -55.138671875, -50.8154296875, -46.4921875, -42.1689453125, -37.845703125, -33.5224609375, -29.19921875, -24.8759765625, -20.552734375, -16.2294921875, -11.90625, -7.5830078125, -3.259765625, 1.0634765625, 5.38671875, 9.7099609375, 14.033203125, 18.3564453125, 22.6796875, 27.0029296875, 31.326171875, 35.6494140625, 39.97265625, 44.2958984375, 48.619140625, 52.9423828125, 57.265625, 61.5888671875, 65.912109375, 70.2353515625, 74.55859375, 78.8818359375, 83.205078125, 87.5283203125, 91.8515625, 96.1748046875, 100.498046875, 104.8212890625, 109.14453125, 113.4677734375, 117.791015625, 122.1142578125, 126.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 2.0, 7.0, 7.0, 8.0, 16.0, 22.0, 16.0, 31.0, 51.0, 59.0, 87.0, 127.0, 120.0, 121.0, 83.0, 64.0, 43.0, 28.0, 12.0, 22.0, 15.0, 6.0, 8.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01058197021484375, -0.010209918022155762, -0.009837865829467773, -0.009465813636779785, -0.009093761444091797, -0.008721709251403809, -0.00834965705871582, -0.007977604866027832, -0.007605552673339844, -0.0072335004806518555, -0.006861448287963867, -0.006489396095275879, -0.006117343902587891, -0.005745291709899902, -0.005373239517211914, -0.005001187324523926, -0.0046291351318359375, -0.004257082939147949, -0.003885030746459961, -0.0035129785537719727, -0.0031409263610839844, -0.002768874168395996, -0.002396821975708008, -0.0020247697830200195, -0.0016527175903320312, -0.001280665397644043, -0.0009086132049560547, -0.0005365610122680664, -0.00016450881958007812, 0.00020754337310791016, 0.0005795955657958984, 0.0009516477584838867, 0.001323699951171875, 0.0016957521438598633, 0.0020678043365478516, 0.00243985652923584, 0.002811908721923828, 0.0031839609146118164, 0.0035560131072998047, 0.003928065299987793, 0.004300117492675781, 0.0046721696853637695, 0.005044221878051758, 0.005416274070739746, 0.005788326263427734, 0.006160378456115723, 0.006532430648803711, 0.006904482841491699, 0.0072765350341796875, 0.007648587226867676, 0.008020639419555664, 0.008392691612243652, 0.00876474380493164, 0.009136795997619629, 0.009508848190307617, 0.009880900382995605, 0.010252952575683594, 0.010625004768371582, 0.01099705696105957, 0.011369109153747559, 0.011741161346435547, 0.012113213539123535, 0.012485265731811523, 0.012857317924499512, 0.0132293701171875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 1.0, 10.0, 11.0, 13.0, 20.0, 29.0, 51.0, 56.0, 91.0, 114.0, 167.0, 241.0, 323.0, 499.0, 663.0, 926.0, 1420.0, 2112.0, 3354.0, 5621.0, 10124.0, 19827.0, 41169.0, 93400.0, 210790.0, 302237.0, 191986.0, 84172.0, 37122.0, 18013.0, 9376.0, 5170.0, 3052.0, 2000.0, 1354.0, 858.0, 626.0, 401.0, 326.0, 235.0, 166.0, 129.0, 75.0, 78.0, 46.0, 33.0, 29.0, 14.0, 14.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-115.375, -112.0244140625, -108.673828125, -105.3232421875, -101.97265625, -98.6220703125, -95.271484375, -91.9208984375, -88.5703125, -85.2197265625, -81.869140625, -78.5185546875, -75.16796875, -71.8173828125, -68.466796875, -65.1162109375, -61.765625, -58.4150390625, -55.064453125, -51.7138671875, -48.36328125, -45.0126953125, -41.662109375, -38.3115234375, -34.9609375, -31.6103515625, -28.259765625, -24.9091796875, -21.55859375, -18.2080078125, -14.857421875, -11.5068359375, -8.15625, -4.8056640625, -1.455078125, 1.8955078125, 5.24609375, 8.5966796875, 11.947265625, 15.2978515625, 18.6484375, 21.9990234375, 25.349609375, 28.7001953125, 32.05078125, 35.4013671875, 38.751953125, 42.1025390625, 45.453125, 48.8037109375, 52.154296875, 55.5048828125, 58.85546875, 62.2060546875, 65.556640625, 68.9072265625, 72.2578125, 75.6083984375, 78.958984375, 82.3095703125, 85.66015625, 89.0107421875, 92.361328125, 95.7119140625, 99.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 13.0, 15.0, 20.0, 19.0, 28.0, 32.0, 65.0, 52.0, 67.0, 98.0, 98.0, 94.0, 81.0, 53.0, 53.0, 44.0, 23.0, 26.0, 18.0, 16.0, 16.0, 6.0, 8.0, 8.0, 0.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.16845703125, -41.8056640625, -40.44287109375, -39.080078125, -37.71728515625, -36.3544921875, -34.99169921875, -33.62890625, -32.26611328125, -30.9033203125, -29.54052734375, -28.177734375, -26.81494140625, -25.4521484375, -24.08935546875, -22.7265625, -21.36376953125, -20.0009765625, -18.63818359375, -17.275390625, -15.91259765625, -14.5498046875, -13.18701171875, -11.82421875, -10.46142578125, -9.0986328125, -7.73583984375, -6.373046875, -5.01025390625, -3.6474609375, -2.28466796875, -0.921875, 0.44091796875, 1.8037109375, 3.16650390625, 4.529296875, 5.89208984375, 7.2548828125, 8.61767578125, 9.98046875, 11.34326171875, 12.7060546875, 14.06884765625, 15.431640625, 16.79443359375, 18.1572265625, 19.52001953125, 20.8828125, 22.24560546875, 23.6083984375, 24.97119140625, 26.333984375, 27.69677734375, 29.0595703125, 30.42236328125, 31.78515625, 33.14794921875, 34.5107421875, 35.87353515625, 37.236328125, 38.59912109375, 39.9619140625, 41.32470703125, 42.6875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 14.0, 18.0, 16.0, 38.0, 33.0, 35.0, 48.0, 39.0, 64.0, 52.0, 58.0, 66.0, 53.0, 56.0, 54.0, 44.0, 48.0, 40.0, 46.0, 25.0, 27.0, 26.0, 13.0, 11.0, 9.0, 11.0, 9.0, 4.0, 6.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23002624511719, -67.13697814941406, -65.04393768310547, -62.95089340209961, -60.85784912109375, -58.76480484008789, -56.67176055908203, -54.57871627807617, -52.48567199707031, -50.39262771606445, -48.299583435058594, -46.206539154052734, -44.113494873046875, -42.020450592041016, -39.927406311035156, -37.8343620300293, -35.74131774902344, -33.64827346801758, -31.55522918701172, -29.46218490600586, -27.369140625, -25.27609634399414, -23.18305206298828, -21.090007781982422, -18.996963500976562, -16.903919219970703, -14.810874938964844, -12.717830657958984, -10.624786376953125, -8.531742095947266, -6.438697814941406, -4.345653533935547, -2.2526168823242188, -0.15957260131835938, 1.9334716796875, 4.026515960693359, 6.119560241699219, 8.212604522705078, 10.305648803710938, 12.398693084716797, 14.491737365722656, 16.584781646728516, 18.677825927734375, 20.770870208740234, 22.863914489746094, 24.956958770751953, 27.050003051757812, 29.143047332763672, 31.23609161376953, 33.32913589477539, 35.42218017578125, 37.51522445678711, 39.60826873779297, 41.70131301879883, 43.79435729980469, 45.88740158081055, 47.980445861816406, 50.073490142822266, 52.166534423828125, 54.259578704833984, 56.352622985839844, 58.4456672668457, 60.53871154785156, 62.63175582885742, 64.72480010986328]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 8.0, 12.0, 16.0, 13.0, 16.0, 24.0, 17.0, 32.0, 32.0, 39.0, 39.0, 37.0, 35.0, 51.0, 45.0, 46.0, 56.0, 45.0, 44.0, 46.0, 52.0, 37.0, 33.0, 29.0, 31.0, 29.0, 18.0, 27.0, 16.0, 11.0, 15.0, 10.0, 6.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.37081909179688, -71.34426879882812, -69.3177261352539, -67.29117584228516, -65.2646255493164, -63.23807907104492, -61.21153259277344, -59.18498229980469, -57.15843200683594, -55.13188552856445, -53.1053352355957, -51.07878875732422, -49.05223846435547, -47.025691986083984, -44.9991455078125, -42.97259521484375, -40.946048736572266, -38.91950225830078, -36.89295196533203, -34.86640548706055, -32.8398551940918, -30.813308715820312, -28.786760330200195, -26.760211944580078, -24.73366355895996, -22.707115173339844, -20.680566787719727, -18.65401840209961, -16.627471923828125, -14.600922584533691, -12.57437515258789, -10.547826766967773, -8.521278381347656, -6.494729995727539, -4.46818208694458, -2.441634178161621, -0.4150857925415039, 1.6114625930786133, 3.638010025024414, 5.664558410644531, 7.691106796264648, 9.717655181884766, 11.744203567504883, 13.770750999450684, 15.7972993850708, 17.823848724365234, 19.85039520263672, 21.876943588256836, 23.903491973876953, 25.93004035949707, 27.956588745117188, 29.983135223388672, 32.00968551635742, 34.036231994628906, 36.062782287597656, 38.08932876586914, 40.115875244140625, 42.14242172241211, 44.16897201538086, 46.195518493652344, 48.222068786621094, 50.24861526489258, 52.27516174316406, 54.30171203613281, 56.32826232910156]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 14.0, 26.0, 35.0, 41.0, 66.0, 100.0, 157.0, 215.0, 340.0, 532.0, 671.0, 1036.0, 1562.0, 2443.0, 3686.0, 5468.0, 8493.0, 12559.0, 19438.0, 28922.0, 42544.0, 60025.0, 82178.0, 103700.0, 119772.0, 122973.0, 113078.0, 92472.0, 70804.0, 50452.0, 35098.0, 23602.0, 15647.0, 10376.0, 6709.0, 4525.0, 2933.0, 2003.0, 1223.0, 857.0, 559.0, 407.0, 257.0, 185.0, 112.0, 70.0, 68.0, 42.0, 29.0, 18.0, 9.0, 5.0, 5.0, 0.0, 4.0, 2.0], "bins": [-43.875, -42.55517578125, -41.2353515625, -39.91552734375, -38.595703125, -37.27587890625, -35.9560546875, -34.63623046875, -33.31640625, -31.99658203125, -30.6767578125, -29.35693359375, -28.037109375, -26.71728515625, -25.3974609375, -24.07763671875, -22.7578125, -21.43798828125, -20.1181640625, -18.79833984375, -17.478515625, -16.15869140625, -14.8388671875, -13.51904296875, -12.19921875, -10.87939453125, -9.5595703125, -8.23974609375, -6.919921875, -5.60009765625, -4.2802734375, -2.96044921875, -1.640625, -0.32080078125, 0.9990234375, 2.31884765625, 3.638671875, 4.95849609375, 6.2783203125, 7.59814453125, 8.91796875, 10.23779296875, 11.5576171875, 12.87744140625, 14.197265625, 15.51708984375, 16.8369140625, 18.15673828125, 19.4765625, 20.79638671875, 22.1162109375, 23.43603515625, 24.755859375, 26.07568359375, 27.3955078125, 28.71533203125, 30.03515625, 31.35498046875, 32.6748046875, 33.99462890625, 35.314453125, 36.63427734375, 37.9541015625, 39.27392578125, 40.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 12.0, 5.0, 7.0, 11.0, 17.0, 13.0, 17.0, 22.0, 19.0, 33.0, 38.0, 46.0, 37.0, 44.0, 48.0, 43.0, 45.0, 50.0, 54.0, 40.0, 55.0, 45.0, 35.0, 41.0, 39.0, 28.0, 30.0, 24.0, 16.0, 20.0, 13.0, 17.0, 11.0, 5.0, 5.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-69.1875, -67.30078125, -65.4140625, -63.52734375, -61.640625, -59.75390625, -57.8671875, -55.98046875, -54.09375, -52.20703125, -50.3203125, -48.43359375, -46.546875, -44.66015625, -42.7734375, -40.88671875, -39.0, -37.11328125, -35.2265625, -33.33984375, -31.453125, -29.56640625, -27.6796875, -25.79296875, -23.90625, -22.01953125, -20.1328125, -18.24609375, -16.359375, -14.47265625, -12.5859375, -10.69921875, -8.8125, -6.92578125, -5.0390625, -3.15234375, -1.265625, 0.62109375, 2.5078125, 4.39453125, 6.28125, 8.16796875, 10.0546875, 11.94140625, 13.828125, 15.71484375, 17.6015625, 19.48828125, 21.375, 23.26171875, 25.1484375, 27.03515625, 28.921875, 30.80859375, 32.6953125, 34.58203125, 36.46875, 38.35546875, 40.2421875, 42.12890625, 44.015625, 45.90234375, 47.7890625, 49.67578125, 51.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 16.0, 25.0, 36.0, 68.0, 71.0, 116.0, 177.0, 246.0, 398.0, 637.0, 959.0, 1549.0, 2320.0, 3580.0, 5734.0, 9485.0, 15195.0, 24534.0, 40083.0, 64904.0, 101147.0, 142122.0, 165885.0, 153991.0, 115217.0, 75889.0, 47534.0, 28849.0, 17851.0, 10986.0, 6919.0, 4316.0, 2703.0, 1761.0, 1157.0, 723.0, 470.0, 267.0, 188.0, 145.0, 104.0, 67.0, 36.0, 31.0, 10.0, 15.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-58.5625, -56.77001953125, -54.9775390625, -53.18505859375, -51.392578125, -49.60009765625, -47.8076171875, -46.01513671875, -44.22265625, -42.43017578125, -40.6376953125, -38.84521484375, -37.052734375, -35.26025390625, -33.4677734375, -31.67529296875, -29.8828125, -28.09033203125, -26.2978515625, -24.50537109375, -22.712890625, -20.92041015625, -19.1279296875, -17.33544921875, -15.54296875, -13.75048828125, -11.9580078125, -10.16552734375, -8.373046875, -6.58056640625, -4.7880859375, -2.99560546875, -1.203125, 0.58935546875, 2.3818359375, 4.17431640625, 5.966796875, 7.75927734375, 9.5517578125, 11.34423828125, 13.13671875, 14.92919921875, 16.7216796875, 18.51416015625, 20.306640625, 22.09912109375, 23.8916015625, 25.68408203125, 27.4765625, 29.26904296875, 31.0615234375, 32.85400390625, 34.646484375, 36.43896484375, 38.2314453125, 40.02392578125, 41.81640625, 43.60888671875, 45.4013671875, 47.19384765625, 48.986328125, 50.77880859375, 52.5712890625, 54.36376953125, 56.15625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 0.0, 2.0, 9.0, 9.0, 13.0, 12.0, 19.0, 24.0, 15.0, 30.0, 27.0, 35.0, 30.0, 51.0, 40.0, 47.0, 48.0, 53.0, 63.0, 52.0, 41.0, 41.0, 53.0, 44.0, 43.0, 31.0, 31.0, 35.0, 13.0, 22.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.25, -53.6064453125, -51.962890625, -50.3193359375, -48.67578125, -47.0322265625, -45.388671875, -43.7451171875, -42.1015625, -40.4580078125, -38.814453125, -37.1708984375, -35.52734375, -33.8837890625, -32.240234375, -30.5966796875, -28.953125, -27.3095703125, -25.666015625, -24.0224609375, -22.37890625, -20.7353515625, -19.091796875, -17.4482421875, -15.8046875, -14.1611328125, -12.517578125, -10.8740234375, -9.23046875, -7.5869140625, -5.943359375, -4.2998046875, -2.65625, -1.0126953125, 0.630859375, 2.2744140625, 3.91796875, 5.5615234375, 7.205078125, 8.8486328125, 10.4921875, 12.1357421875, 13.779296875, 15.4228515625, 17.06640625, 18.7099609375, 20.353515625, 21.9970703125, 23.640625, 25.2841796875, 26.927734375, 28.5712890625, 30.21484375, 31.8583984375, 33.501953125, 35.1455078125, 36.7890625, 38.4326171875, 40.076171875, 41.7197265625, 43.36328125, 45.0068359375, 46.650390625, 48.2939453125, 49.9375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 13.0, 12.0, 26.0, 32.0, 44.0, 71.0, 83.0, 144.0, 199.0, 274.0, 404.0, 624.0, 885.0, 1424.0, 2237.0, 3713.0, 6424.0, 11413.0, 21477.0, 42368.0, 86334.0, 176113.0, 269101.0, 208176.0, 106242.0, 51545.0, 26173.0, 13593.0, 7571.0, 4494.0, 2602.0, 1568.0, 1046.0, 698.0, 439.0, 313.0, 221.0, 137.0, 88.0, 68.0, 47.0, 38.0, 25.0, 18.0, 11.0, 10.0, 2.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-82.625, -80.09375, -77.5625, -75.03125, -72.5, -69.96875, -67.4375, -64.90625, -62.375, -59.84375, -57.3125, -54.78125, -52.25, -49.71875, -47.1875, -44.65625, -42.125, -39.59375, -37.0625, -34.53125, -32.0, -29.46875, -26.9375, -24.40625, -21.875, -19.34375, -16.8125, -14.28125, -11.75, -9.21875, -6.6875, -4.15625, -1.625, 0.90625, 3.4375, 5.96875, 8.5, 11.03125, 13.5625, 16.09375, 18.625, 21.15625, 23.6875, 26.21875, 28.75, 31.28125, 33.8125, 36.34375, 38.875, 41.40625, 43.9375, 46.46875, 49.0, 51.53125, 54.0625, 56.59375, 59.125, 61.65625, 64.1875, 66.71875, 69.25, 71.78125, 74.3125, 76.84375, 79.375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 10.0, 8.0, 5.0, 12.0, 12.0, 22.0, 24.0, 20.0, 35.0, 42.0, 42.0, 54.0, 53.0, 49.0, 63.0, 65.0, 57.0, 53.0, 57.0, 41.0, 42.0, 34.0, 19.0, 25.0, 20.0, 21.0, 20.0, 12.0, 11.0, 9.0, 10.0, 1.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00479888916015625, -0.0046347975730896, -0.004470705986022949, -0.004306614398956299, -0.0041425228118896484, -0.003978431224822998, -0.0038143396377563477, -0.0036502480506896973, -0.003486156463623047, -0.0033220648765563965, -0.003157973289489746, -0.0029938817024230957, -0.0028297901153564453, -0.002665698528289795, -0.0025016069412231445, -0.002337515354156494, -0.0021734237670898438, -0.0020093321800231934, -0.001845240592956543, -0.0016811490058898926, -0.0015170574188232422, -0.0013529658317565918, -0.0011888742446899414, -0.001024782657623291, -0.0008606910705566406, -0.0006965994834899902, -0.0005325078964233398, -0.00036841630935668945, -0.00020432472229003906, -4.023313522338867e-05, 0.00012385845184326172, 0.0002879500389099121, 0.0004520416259765625, 0.0006161332130432129, 0.0007802248001098633, 0.0009443163871765137, 0.001108407974243164, 0.0012724995613098145, 0.0014365911483764648, 0.0016006827354431152, 0.0017647743225097656, 0.001928865909576416, 0.0020929574966430664, 0.002257049083709717, 0.002421140670776367, 0.0025852322578430176, 0.002749323844909668, 0.0029134154319763184, 0.0030775070190429688, 0.003241598606109619, 0.0034056901931762695, 0.00356978178024292, 0.0037338733673095703, 0.0038979649543762207, 0.004062056541442871, 0.0042261481285095215, 0.004390239715576172, 0.004554331302642822, 0.004718422889709473, 0.004882514476776123, 0.0050466060638427734, 0.005210697650909424, 0.005374789237976074, 0.005538880825042725, 0.005702972412109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 6.0, 12.0, 23.0, 23.0, 59.0, 72.0, 114.0, 172.0, 241.0, 414.0, 661.0, 1092.0, 2008.0, 3642.0, 6591.0, 12860.0, 26916.0, 58426.0, 130060.0, 259502.0, 274922.0, 144786.0, 65647.0, 29621.0, 14242.0, 7247.0, 3930.0, 2085.0, 1222.0, 730.0, 416.0, 256.0, 179.0, 111.0, 88.0, 58.0, 32.0, 27.0, 8.0, 17.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.8125, -85.07421875, -82.3359375, -79.59765625, -76.859375, -74.12109375, -71.3828125, -68.64453125, -65.90625, -63.16796875, -60.4296875, -57.69140625, -54.953125, -52.21484375, -49.4765625, -46.73828125, -44.0, -41.26171875, -38.5234375, -35.78515625, -33.046875, -30.30859375, -27.5703125, -24.83203125, -22.09375, -19.35546875, -16.6171875, -13.87890625, -11.140625, -8.40234375, -5.6640625, -2.92578125, -0.1875, 2.55078125, 5.2890625, 8.02734375, 10.765625, 13.50390625, 16.2421875, 18.98046875, 21.71875, 24.45703125, 27.1953125, 29.93359375, 32.671875, 35.41015625, 38.1484375, 40.88671875, 43.625, 46.36328125, 49.1015625, 51.83984375, 54.578125, 57.31640625, 60.0546875, 62.79296875, 65.53125, 68.26953125, 71.0078125, 73.74609375, 76.484375, 79.22265625, 81.9609375, 84.69921875, 87.4375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 20.0, 17.0, 10.0, 13.0, 17.0, 24.0, 30.0, 47.0, 46.0, 51.0, 67.0, 58.0, 66.0, 57.0, 48.0, 47.0, 52.0, 44.0, 44.0, 39.0, 30.0, 39.0, 19.0, 19.0, 12.0, 12.0, 12.0, 9.0, 12.0, 5.0, 2.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.40625, -20.74658203125, -20.0869140625, -19.42724609375, -18.767578125, -18.10791015625, -17.4482421875, -16.78857421875, -16.12890625, -15.46923828125, -14.8095703125, -14.14990234375, -13.490234375, -12.83056640625, -12.1708984375, -11.51123046875, -10.8515625, -10.19189453125, -9.5322265625, -8.87255859375, -8.212890625, -7.55322265625, -6.8935546875, -6.23388671875, -5.57421875, -4.91455078125, -4.2548828125, -3.59521484375, -2.935546875, -2.27587890625, -1.6162109375, -0.95654296875, -0.296875, 0.36279296875, 1.0224609375, 1.68212890625, 2.341796875, 3.00146484375, 3.6611328125, 4.32080078125, 4.98046875, 5.64013671875, 6.2998046875, 6.95947265625, 7.619140625, 8.27880859375, 8.9384765625, 9.59814453125, 10.2578125, 10.91748046875, 11.5771484375, 12.23681640625, 12.896484375, 13.55615234375, 14.2158203125, 14.87548828125, 15.53515625, 16.19482421875, 16.8544921875, 17.51416015625, 18.173828125, 18.83349609375, 19.4931640625, 20.15283203125, 20.8125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 11.0, 8.0, 10.0, 19.0, 11.0, 18.0, 19.0, 31.0, 32.0, 45.0, 45.0, 50.0, 53.0, 63.0, 57.0, 76.0, 51.0, 59.0, 45.0, 45.0, 59.0, 42.0, 31.0, 24.0, 19.0, 24.0, 15.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-74.30104064941406, -72.1893310546875, -70.07762145996094, -67.96591186523438, -65.85420227050781, -63.742496490478516, -61.63079071044922, -59.519081115722656, -57.407371520996094, -55.29566192626953, -53.18395233154297, -51.07224655151367, -48.96053695678711, -46.84882736206055, -44.73712158203125, -42.62541198730469, -40.513702392578125, -38.40199279785156, -36.290283203125, -34.1785774230957, -32.06686782836914, -29.955158233642578, -27.84345054626465, -25.73174285888672, -23.620033264160156, -21.508323669433594, -19.396615982055664, -17.284908294677734, -15.173198699951172, -13.061490058898926, -10.94978141784668, -8.838072776794434, -6.726371765136719, -4.614663124084473, -2.5029544830322266, -0.39124584197998047, 1.7204627990722656, 3.8321714401245117, 5.943880081176758, 8.055588722229004, 10.16729736328125, 12.279006004333496, 14.390714645385742, 16.502422332763672, 18.614131927490234, 20.725841522216797, 22.837549209594727, 24.949256896972656, 27.06096649169922, 29.17267608642578, 31.28438377380371, 33.39609146118164, 35.5078010559082, 37.619510650634766, 39.73121643066406, 41.842926025390625, 43.95463562011719, 46.06634521484375, 48.17805480957031, 50.28976058959961, 52.40147018432617, 54.513179779052734, 56.62488555908203, 58.736595153808594, 60.848304748535156]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 6.0, 4.0, 4.0, 7.0, 7.0, 7.0, 12.0, 18.0, 14.0, 23.0, 26.0, 30.0, 26.0, 31.0, 42.0, 34.0, 45.0, 32.0, 41.0, 52.0, 46.0, 48.0, 47.0, 41.0, 40.0, 47.0, 48.0, 32.0, 29.0, 19.0, 23.0, 26.0, 13.0, 17.0, 16.0, 11.0, 17.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.2049560546875, -68.05781555175781, -65.91067504882812, -63.76353454589844, -61.61639404296875, -59.46925354003906, -57.32210922241211, -55.17496871948242, -53.027828216552734, -50.88068771362305, -48.73354721069336, -46.58640670776367, -44.43926239013672, -42.29212188720703, -40.144981384277344, -37.997840881347656, -35.85070037841797, -33.70355987548828, -31.556419372558594, -29.409276962280273, -27.262136459350586, -25.1149959564209, -22.967853546142578, -20.82071304321289, -18.673572540283203, -16.526432037353516, -14.379290580749512, -12.232149124145508, -10.08500862121582, -7.937868118286133, -5.790726661682129, -3.643585205078125, -1.4964370727539062, 0.6507039070129395, 2.797844886779785, 4.944985866546631, 7.092126846313477, 9.239267349243164, 11.386408805847168, 13.533550262451172, 15.68069076538086, 17.827831268310547, 19.974971771240234, 22.122114181518555, 24.269254684448242, 26.41639518737793, 28.56353759765625, 30.710678100585938, 32.857818603515625, 35.00495910644531, 37.152099609375, 39.29924011230469, 41.446380615234375, 43.59352111816406, 45.740665435791016, 47.8878059387207, 50.03494644165039, 52.18208694458008, 54.329227447509766, 56.47636795043945, 58.623512268066406, 60.770652770996094, 62.91779327392578, 65.06493377685547, 67.21207427978516]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 8.0, 13.0, 26.0, 36.0, 52.0, 104.0, 144.0, 198.0, 332.0, 473.0, 806.0, 1353.0, 2379.0, 3962.0, 6753.0, 11954.0, 20958.0, 37621.0, 70564.0, 133206.0, 259327.0, 491185.0, 779244.0, 879261.0, 674995.0, 391103.0, 201879.0, 103449.0, 54656.0, 29454.0, 16266.0, 9317.0, 5266.0, 3075.0, 1837.0, 1105.0, 705.0, 440.0, 278.0, 203.0, 91.0, 82.0, 33.0, 34.0, 16.0, 17.0, 12.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-49.09375, -47.66259765625, -46.2314453125, -44.80029296875, -43.369140625, -41.93798828125, -40.5068359375, -39.07568359375, -37.64453125, -36.21337890625, -34.7822265625, -33.35107421875, -31.919921875, -30.48876953125, -29.0576171875, -27.62646484375, -26.1953125, -24.76416015625, -23.3330078125, -21.90185546875, -20.470703125, -19.03955078125, -17.6083984375, -16.17724609375, -14.74609375, -13.31494140625, -11.8837890625, -10.45263671875, -9.021484375, -7.59033203125, -6.1591796875, -4.72802734375, -3.296875, -1.86572265625, -0.4345703125, 0.99658203125, 2.427734375, 3.85888671875, 5.2900390625, 6.72119140625, 8.15234375, 9.58349609375, 11.0146484375, 12.44580078125, 13.876953125, 15.30810546875, 16.7392578125, 18.17041015625, 19.6015625, 21.03271484375, 22.4638671875, 23.89501953125, 25.326171875, 26.75732421875, 28.1884765625, 29.61962890625, 31.05078125, 32.48193359375, 33.9130859375, 35.34423828125, 36.775390625, 38.20654296875, 39.6376953125, 41.06884765625, 42.5]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 5.0, 2.0, 11.0, 10.0, 17.0, 21.0, 19.0, 27.0, 32.0, 31.0, 34.0, 20.0, 35.0, 41.0, 40.0, 35.0, 48.0, 56.0, 49.0, 40.0, 39.0, 41.0, 37.0, 45.0, 39.0, 31.0, 27.0, 26.0, 20.0, 17.0, 14.0, 28.0, 13.0, 12.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-50.0625, -48.55517578125, -47.0478515625, -45.54052734375, -44.033203125, -42.52587890625, -41.0185546875, -39.51123046875, -38.00390625, -36.49658203125, -34.9892578125, -33.48193359375, -31.974609375, -30.46728515625, -28.9599609375, -27.45263671875, -25.9453125, -24.43798828125, -22.9306640625, -21.42333984375, -19.916015625, -18.40869140625, -16.9013671875, -15.39404296875, -13.88671875, -12.37939453125, -10.8720703125, -9.36474609375, -7.857421875, -6.35009765625, -4.8427734375, -3.33544921875, -1.828125, -0.32080078125, 1.1865234375, 2.69384765625, 4.201171875, 5.70849609375, 7.2158203125, 8.72314453125, 10.23046875, 11.73779296875, 13.2451171875, 14.75244140625, 16.259765625, 17.76708984375, 19.2744140625, 20.78173828125, 22.2890625, 23.79638671875, 25.3037109375, 26.81103515625, 28.318359375, 29.82568359375, 31.3330078125, 32.84033203125, 34.34765625, 35.85498046875, 37.3623046875, 38.86962890625, 40.376953125, 41.88427734375, 43.3916015625, 44.89892578125, 46.40625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 13.0, 9.0, 27.0, 42.0, 49.0, 75.0, 118.0, 172.0, 279.0, 415.0, 636.0, 1002.0, 1685.0, 2592.0, 4152.0, 6585.0, 11203.0, 18485.0, 30812.0, 51205.0, 86540.0, 146329.0, 241643.0, 382777.0, 565210.0, 698068.0, 654968.0, 486479.0, 317157.0, 194887.0, 116839.0, 69570.0, 41301.0, 24434.0, 14788.0, 8944.0, 5494.0, 3331.0, 2198.0, 1362.0, 850.0, 514.0, 376.0, 232.0, 137.0, 102.0, 69.0, 40.0, 33.0, 23.0, 13.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-39.4375, -38.19677734375, -36.9560546875, -35.71533203125, -34.474609375, -33.23388671875, -31.9931640625, -30.75244140625, -29.51171875, -28.27099609375, -27.0302734375, -25.78955078125, -24.548828125, -23.30810546875, -22.0673828125, -20.82666015625, -19.5859375, -18.34521484375, -17.1044921875, -15.86376953125, -14.623046875, -13.38232421875, -12.1416015625, -10.90087890625, -9.66015625, -8.41943359375, -7.1787109375, -5.93798828125, -4.697265625, -3.45654296875, -2.2158203125, -0.97509765625, 0.265625, 1.50634765625, 2.7470703125, 3.98779296875, 5.228515625, 6.46923828125, 7.7099609375, 8.95068359375, 10.19140625, 11.43212890625, 12.6728515625, 13.91357421875, 15.154296875, 16.39501953125, 17.6357421875, 18.87646484375, 20.1171875, 21.35791015625, 22.5986328125, 23.83935546875, 25.080078125, 26.32080078125, 27.5615234375, 28.80224609375, 30.04296875, 31.28369140625, 32.5244140625, 33.76513671875, 35.005859375, 36.24658203125, 37.4873046875, 38.72802734375, 39.96875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 11.0, 18.0, 10.0, 19.0, 19.0, 24.0, 46.0, 52.0, 66.0, 58.0, 93.0, 120.0, 123.0, 138.0, 194.0, 198.0, 206.0, 243.0, 248.0, 246.0, 294.0, 228.0, 229.0, 221.0, 196.0, 164.0, 139.0, 105.0, 77.0, 72.0, 46.0, 36.0, 31.0, 22.0, 17.0, 16.0, 8.0, 7.0, 5.0, 7.0, 2.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.050537109375, -15.44482421875, -14.839111328125, -14.2333984375, -13.627685546875, -13.02197265625, -12.416259765625, -11.810546875, -11.204833984375, -10.59912109375, -9.993408203125, -9.3876953125, -8.781982421875, -8.17626953125, -7.570556640625, -6.96484375, -6.359130859375, -5.75341796875, -5.147705078125, -4.5419921875, -3.936279296875, -3.33056640625, -2.724853515625, -2.119140625, -1.513427734375, -0.90771484375, -0.302001953125, 0.3037109375, 0.909423828125, 1.51513671875, 2.120849609375, 2.7265625, 3.332275390625, 3.93798828125, 4.543701171875, 5.1494140625, 5.755126953125, 6.36083984375, 6.966552734375, 7.572265625, 8.177978515625, 8.78369140625, 9.389404296875, 9.9951171875, 10.600830078125, 11.20654296875, 11.812255859375, 12.41796875, 13.023681640625, 13.62939453125, 14.235107421875, 14.8408203125, 15.446533203125, 16.05224609375, 16.657958984375, 17.263671875, 17.869384765625, 18.47509765625, 19.080810546875, 19.6865234375, 20.292236328125, 20.89794921875, 21.503662109375, 22.109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 7.0, 9.0, 23.0, 17.0, 17.0, 29.0, 38.0, 43.0, 42.0, 43.0, 69.0, 72.0, 63.0, 88.0, 55.0, 56.0, 59.0, 45.0, 52.0, 38.0, 22.0, 20.0, 13.0, 11.0, 17.0, 7.0, 7.0, 10.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-70.68123626708984, -68.78840637207031, -66.89556884765625, -65.00273895263672, -63.10990905761719, -61.21707534790039, -59.324241638183594, -57.43141174316406, -55.538578033447266, -53.64574432373047, -51.75291442871094, -49.86008071899414, -47.967247009277344, -46.07441711425781, -44.181583404541016, -42.28874969482422, -40.39591979980469, -38.50308609008789, -36.61025619506836, -34.71742248535156, -32.82459259033203, -30.931758880615234, -29.038925170898438, -27.146093368530273, -25.25326156616211, -23.360429763793945, -21.46759796142578, -19.574764251708984, -17.68193244934082, -15.789100646972656, -13.896267890930176, -12.003435134887695, -10.110599517822266, -8.217767715454102, -6.324934959411621, -4.432102680206299, -2.5392704010009766, -0.6464385986328125, 1.246394157409668, 3.1392269134521484, 5.0320587158203125, 6.924890995025635, 8.817723274230957, 10.710556030273438, 12.603387832641602, 14.496219635009766, 16.389053344726562, 18.281885147094727, 20.17471694946289, 22.067548751831055, 23.96038055419922, 25.853214263916016, 27.74604606628418, 29.638877868652344, 31.53171157836914, 33.42454528808594, 35.31737518310547, 37.210208892822266, 39.1030387878418, 40.995872497558594, 42.888702392578125, 44.78153610229492, 46.67436981201172, 48.56719970703125, 50.46003341674805]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 10.0, 15.0, 18.0, 35.0, 24.0, 24.0, 27.0, 23.0, 38.0, 31.0, 25.0, 29.0, 43.0, 48.0, 48.0, 44.0, 42.0, 40.0, 47.0, 36.0, 38.0, 48.0, 30.0, 27.0, 20.0, 27.0, 23.0, 23.0, 23.0, 14.0, 16.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.50748062133789, -51.859893798828125, -50.212310791015625, -48.56472396850586, -46.917137145996094, -45.269554138183594, -43.62196731567383, -41.97438049316406, -40.32679748535156, -38.6792106628418, -37.0316276550293, -35.38404083251953, -33.73645782470703, -32.088871002197266, -30.4412841796875, -28.793699264526367, -27.146114349365234, -25.4985294342041, -23.85094451904297, -22.203357696533203, -20.55577278137207, -18.908187866210938, -17.260601043701172, -15.613016128540039, -13.965431213378906, -12.317846298217773, -10.670260429382324, -9.022674560546875, -7.375089645385742, -5.727504730224609, -4.07991886138916, -2.432332992553711, -0.7847480773925781, 0.8628373146057129, 2.510422706604004, 4.158008098602295, 5.805593490600586, 7.453178405761719, 9.100764274597168, 10.748350143432617, 12.39593505859375, 14.043519973754883, 15.691105842590332, 17.33869171142578, 18.986276626586914, 20.633861541748047, 22.281448364257812, 23.929033279418945, 25.576618194580078, 27.22420310974121, 28.871788024902344, 30.51937484741211, 32.166961669921875, 33.814544677734375, 35.46213150024414, 37.109718322753906, 38.757301330566406, 40.40488815307617, 42.05247116088867, 43.70005798339844, 45.34764099121094, 46.9952278137207, 48.64281463623047, 50.29039764404297, 51.937984466552734]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 10.0, 12.0, 21.0, 26.0, 37.0, 56.0, 57.0, 101.0, 134.0, 181.0, 297.0, 412.0, 624.0, 960.0, 1478.0, 2340.0, 3902.0, 6608.0, 12109.0, 24410.0, 57485.0, 151646.0, 330137.0, 266277.0, 105670.0, 40949.0, 18672.0, 9676.0, 5321.0, 3162.0, 1935.0, 1280.0, 793.0, 565.0, 374.0, 271.0, 174.0, 123.0, 87.0, 59.0, 38.0, 21.0, 17.0, 16.0, 8.0, 5.0, 8.0, 1.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-146.25, -141.50390625, -136.7578125, -132.01171875, -127.265625, -122.51953125, -117.7734375, -113.02734375, -108.28125, -103.53515625, -98.7890625, -94.04296875, -89.296875, -84.55078125, -79.8046875, -75.05859375, -70.3125, -65.56640625, -60.8203125, -56.07421875, -51.328125, -46.58203125, -41.8359375, -37.08984375, -32.34375, -27.59765625, -22.8515625, -18.10546875, -13.359375, -8.61328125, -3.8671875, 0.87890625, 5.625, 10.37109375, 15.1171875, 19.86328125, 24.609375, 29.35546875, 34.1015625, 38.84765625, 43.59375, 48.33984375, 53.0859375, 57.83203125, 62.578125, 67.32421875, 72.0703125, 76.81640625, 81.5625, 86.30859375, 91.0546875, 95.80078125, 100.546875, 105.29296875, 110.0390625, 114.78515625, 119.53125, 124.27734375, 129.0234375, 133.76953125, 138.515625, 143.26171875, 148.0078125, 152.75390625, 157.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 4.0, 12.0, 15.0, 23.0, 16.0, 20.0, 23.0, 26.0, 28.0, 23.0, 33.0, 27.0, 34.0, 38.0, 46.0, 50.0, 41.0, 49.0, 40.0, 34.0, 49.0, 42.0, 38.0, 36.0, 31.0, 34.0, 23.0, 25.0, 23.0, 17.0, 16.0, 17.0, 12.0, 13.0, 7.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.8125, -47.3427734375, -45.873046875, -44.4033203125, -42.93359375, -41.4638671875, -39.994140625, -38.5244140625, -37.0546875, -35.5849609375, -34.115234375, -32.6455078125, -31.17578125, -29.7060546875, -28.236328125, -26.7666015625, -25.296875, -23.8271484375, -22.357421875, -20.8876953125, -19.41796875, -17.9482421875, -16.478515625, -15.0087890625, -13.5390625, -12.0693359375, -10.599609375, -9.1298828125, -7.66015625, -6.1904296875, -4.720703125, -3.2509765625, -1.78125, -0.3115234375, 1.158203125, 2.6279296875, 4.09765625, 5.5673828125, 7.037109375, 8.5068359375, 9.9765625, 11.4462890625, 12.916015625, 14.3857421875, 15.85546875, 17.3251953125, 18.794921875, 20.2646484375, 21.734375, 23.2041015625, 24.673828125, 26.1435546875, 27.61328125, 29.0830078125, 30.552734375, 32.0224609375, 33.4921875, 34.9619140625, 36.431640625, 37.9013671875, 39.37109375, 40.8408203125, 42.310546875, 43.7802734375, 45.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 21.0, 16.0, 25.0, 24.0, 29.0, 38.0, 49.0, 70.0, 99.0, 148.0, 198.0, 275.0, 403.0, 745.0, 1094.0, 1820.0, 3082.0, 5800.0, 11212.0, 23412.0, 58049.0, 184377.0, 450701.0, 195368.0, 61147.0, 24677.0, 11510.0, 5791.0, 3235.0, 1812.0, 1107.0, 694.0, 436.0, 266.0, 193.0, 178.0, 95.0, 83.0, 64.0, 55.0, 27.0, 28.0, 19.0, 18.0, 13.0, 8.0, 9.0, 2.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-177.5, -171.869140625, -166.23828125, -160.607421875, -154.9765625, -149.345703125, -143.71484375, -138.083984375, -132.453125, -126.822265625, -121.19140625, -115.560546875, -109.9296875, -104.298828125, -98.66796875, -93.037109375, -87.40625, -81.775390625, -76.14453125, -70.513671875, -64.8828125, -59.251953125, -53.62109375, -47.990234375, -42.359375, -36.728515625, -31.09765625, -25.466796875, -19.8359375, -14.205078125, -8.57421875, -2.943359375, 2.6875, 8.318359375, 13.94921875, 19.580078125, 25.2109375, 30.841796875, 36.47265625, 42.103515625, 47.734375, 53.365234375, 58.99609375, 64.626953125, 70.2578125, 75.888671875, 81.51953125, 87.150390625, 92.78125, 98.412109375, 104.04296875, 109.673828125, 115.3046875, 120.935546875, 126.56640625, 132.197265625, 137.828125, 143.458984375, 149.08984375, 154.720703125, 160.3515625, 165.982421875, 171.61328125, 177.244140625, 182.875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 13.0, 14.0, 12.0, 23.0, 32.0, 34.0, 44.0, 50.0, 62.0, 66.0, 93.0, 89.0, 66.0, 61.0, 54.0, 63.0, 48.0, 42.0, 31.0, 21.0, 11.0, 18.0, 15.0, 7.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.63623046875, -53.7724609375, -51.90869140625, -50.044921875, -48.18115234375, -46.3173828125, -44.45361328125, -42.58984375, -40.72607421875, -38.8623046875, -36.99853515625, -35.134765625, -33.27099609375, -31.4072265625, -29.54345703125, -27.6796875, -25.81591796875, -23.9521484375, -22.08837890625, -20.224609375, -18.36083984375, -16.4970703125, -14.63330078125, -12.76953125, -10.90576171875, -9.0419921875, -7.17822265625, -5.314453125, -3.45068359375, -1.5869140625, 0.27685546875, 2.140625, 4.00439453125, 5.8681640625, 7.73193359375, 9.595703125, 11.45947265625, 13.3232421875, 15.18701171875, 17.05078125, 18.91455078125, 20.7783203125, 22.64208984375, 24.505859375, 26.36962890625, 28.2333984375, 30.09716796875, 31.9609375, 33.82470703125, 35.6884765625, 37.55224609375, 39.416015625, 41.27978515625, 43.1435546875, 45.00732421875, 46.87109375, 48.73486328125, 50.5986328125, 52.46240234375, 54.326171875, 56.18994140625, 58.0537109375, 59.91748046875, 61.78125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 18.0, 12.0, 34.0, 54.0, 94.0, 160.0, 268.0, 476.0, 735.0, 1270.0, 2412.0, 4545.0, 9413.0, 22137.0, 62632.0, 240190.0, 470686.0, 156502.0, 44489.0, 16725.0, 7347.0, 3738.0, 1969.0, 1117.0, 592.0, 356.0, 206.0, 117.0, 80.0, 60.0, 36.0, 30.0, 18.0, 8.0, 7.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.625, -85.7978515625, -82.970703125, -80.1435546875, -77.31640625, -74.4892578125, -71.662109375, -68.8349609375, -66.0078125, -63.1806640625, -60.353515625, -57.5263671875, -54.69921875, -51.8720703125, -49.044921875, -46.2177734375, -43.390625, -40.5634765625, -37.736328125, -34.9091796875, -32.08203125, -29.2548828125, -26.427734375, -23.6005859375, -20.7734375, -17.9462890625, -15.119140625, -12.2919921875, -9.46484375, -6.6376953125, -3.810546875, -0.9833984375, 1.84375, 4.6708984375, 7.498046875, 10.3251953125, 13.15234375, 15.9794921875, 18.806640625, 21.6337890625, 24.4609375, 27.2880859375, 30.115234375, 32.9423828125, 35.76953125, 38.5966796875, 41.423828125, 44.2509765625, 47.078125, 49.9052734375, 52.732421875, 55.5595703125, 58.38671875, 61.2138671875, 64.041015625, 66.8681640625, 69.6953125, 72.5224609375, 75.349609375, 78.1767578125, 81.00390625, 83.8310546875, 86.658203125, 89.4853515625, 92.3125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 9.0, 3.0, 6.0, 2.0, 4.0, 6.0, 14.0, 13.0, 20.0, 24.0, 42.0, 97.0, 141.0, 178.0, 148.0, 109.0, 58.0, 41.0, 21.0, 22.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0064239501953125, -0.00625300407409668, -0.006082057952880859, -0.005911111831665039, -0.005740165710449219, -0.0055692195892333984, -0.005398273468017578, -0.005227327346801758, -0.0050563812255859375, -0.004885435104370117, -0.004714488983154297, -0.0045435428619384766, -0.004372596740722656, -0.004201650619506836, -0.004030704498291016, -0.0038597583770751953, -0.003688812255859375, -0.0035178661346435547, -0.0033469200134277344, -0.003175973892211914, -0.0030050277709960938, -0.0028340816497802734, -0.002663135528564453, -0.002492189407348633, -0.0023212432861328125, -0.002150297164916992, -0.001979351043701172, -0.0018084049224853516, -0.0016374588012695312, -0.001466512680053711, -0.0012955665588378906, -0.0011246204376220703, -0.00095367431640625, -0.0007827281951904297, -0.0006117820739746094, -0.00044083595275878906, -0.00026988983154296875, -9.894371032714844e-05, 7.200241088867188e-05, 0.0002429485321044922, 0.0004138946533203125, 0.0005848407745361328, 0.0007557868957519531, 0.0009267330169677734, 0.0010976791381835938, 0.001268625259399414, 0.0014395713806152344, 0.0016105175018310547, 0.001781463623046875, 0.0019524097442626953, 0.0021233558654785156, 0.002294301986694336, 0.0024652481079101562, 0.0026361942291259766, 0.002807140350341797, 0.002978086471557617, 0.0031490325927734375, 0.003319978713989258, 0.003490924835205078, 0.0036618709564208984, 0.0038328170776367188, 0.004003763198852539, 0.004174709320068359, 0.00434565544128418, 0.0045166015625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 9.0, 12.0, 18.0, 20.0, 31.0, 58.0, 82.0, 118.0, 151.0, 224.0, 349.0, 533.0, 819.0, 1255.0, 2040.0, 3329.0, 5468.0, 9783.0, 18869.0, 38845.0, 89453.0, 202259.0, 300046.0, 203097.0, 89200.0, 39088.0, 19007.0, 9854.0, 5610.0, 3155.0, 2026.0, 1263.0, 800.0, 552.0, 380.0, 253.0, 157.0, 99.0, 73.0, 47.0, 37.0, 26.0, 18.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-59.59375, -57.81494140625, -56.0361328125, -54.25732421875, -52.478515625, -50.69970703125, -48.9208984375, -47.14208984375, -45.36328125, -43.58447265625, -41.8056640625, -40.02685546875, -38.248046875, -36.46923828125, -34.6904296875, -32.91162109375, -31.1328125, -29.35400390625, -27.5751953125, -25.79638671875, -24.017578125, -22.23876953125, -20.4599609375, -18.68115234375, -16.90234375, -15.12353515625, -13.3447265625, -11.56591796875, -9.787109375, -8.00830078125, -6.2294921875, -4.45068359375, -2.671875, -0.89306640625, 0.8857421875, 2.66455078125, 4.443359375, 6.22216796875, 8.0009765625, 9.77978515625, 11.55859375, 13.33740234375, 15.1162109375, 16.89501953125, 18.673828125, 20.45263671875, 22.2314453125, 24.01025390625, 25.7890625, 27.56787109375, 29.3466796875, 31.12548828125, 32.904296875, 34.68310546875, 36.4619140625, 38.24072265625, 40.01953125, 41.79833984375, 43.5771484375, 45.35595703125, 47.134765625, 48.91357421875, 50.6923828125, 52.47119140625, 54.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 6.0, 7.0, 14.0, 11.0, 17.0, 23.0, 26.0, 41.0, 44.0, 61.0, 82.0, 82.0, 105.0, 85.0, 90.0, 71.0, 58.0, 41.0, 35.0, 23.0, 18.0, 12.0, 7.0, 4.0, 8.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -23.889404296875, -23.06005859375, -22.230712890625, -21.4013671875, -20.572021484375, -19.74267578125, -18.913330078125, -18.083984375, -17.254638671875, -16.42529296875, -15.595947265625, -14.7666015625, -13.937255859375, -13.10791015625, -12.278564453125, -11.44921875, -10.619873046875, -9.79052734375, -8.961181640625, -8.1318359375, -7.302490234375, -6.47314453125, -5.643798828125, -4.814453125, -3.985107421875, -3.15576171875, -2.326416015625, -1.4970703125, -0.667724609375, 0.16162109375, 0.990966796875, 1.8203125, 2.649658203125, 3.47900390625, 4.308349609375, 5.1376953125, 5.967041015625, 6.79638671875, 7.625732421875, 8.455078125, 9.284423828125, 10.11376953125, 10.943115234375, 11.7724609375, 12.601806640625, 13.43115234375, 14.260498046875, 15.08984375, 15.919189453125, 16.74853515625, 17.577880859375, 18.4072265625, 19.236572265625, 20.06591796875, 20.895263671875, 21.724609375, 22.553955078125, 23.38330078125, 24.212646484375, 25.0419921875, 25.871337890625, 26.70068359375, 27.530029296875, 28.359375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 2.0, 0.0, 6.0, 9.0, 14.0, 14.0, 16.0, 30.0, 22.0, 32.0, 38.0, 57.0, 54.0, 39.0, 58.0, 54.0, 72.0, 64.0, 57.0, 53.0, 56.0, 49.0, 46.0, 34.0, 22.0, 30.0, 18.0, 9.0, 6.0, 13.0, 5.0, 8.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.05623245239258, -48.432655334472656, -46.809078216552734, -45.18550109863281, -43.56192398071289, -41.93834686279297, -40.31477355957031, -38.69119644165039, -37.06761932373047, -35.44404220581055, -33.820465087890625, -32.1968879699707, -30.573312759399414, -28.949735641479492, -27.32615852355957, -25.70258331298828, -24.079004287719727, -22.455427169799805, -20.831850051879883, -19.208274841308594, -17.584697723388672, -15.96112060546875, -14.337543487548828, -12.713967323303223, -11.0903902053833, -9.466813087463379, -7.843236923217773, -6.219659805297852, -4.596083164215088, -2.972506523132324, -1.3489294052124023, 0.2746467590332031, 1.898223876953125, 3.5218005180358887, 5.145377159118652, 6.768954277038574, 8.39253044128418, 10.016107559204102, 11.639684677124023, 13.263260841369629, 14.88683795928955, 16.510414123535156, 18.133991241455078, 19.757568359375, 21.381145477294922, 23.004722595214844, 24.628299713134766, 26.251874923706055, 27.875452041625977, 29.4990291595459, 31.12260627746582, 32.74618148803711, 34.36975860595703, 35.99333572387695, 37.616912841796875, 39.2404899597168, 40.86406707763672, 42.48764419555664, 44.11122131347656, 45.734798431396484, 47.358375549316406, 48.98194885253906, 50.60552978515625, 52.229103088378906, 53.85268020629883]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 8.0, 11.0, 15.0, 12.0, 17.0, 22.0, 20.0, 32.0, 22.0, 27.0, 31.0, 24.0, 28.0, 41.0, 40.0, 50.0, 55.0, 27.0, 41.0, 41.0, 35.0, 28.0, 36.0, 36.0, 39.0, 23.0, 27.0, 29.0, 23.0, 21.0, 18.0, 15.0, 19.0, 13.0, 11.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-41.95718002319336, -40.70591735839844, -39.45465087890625, -38.20338821411133, -36.952125549316406, -35.700862884521484, -34.44960021972656, -33.198333740234375, -31.947071075439453, -30.69580841064453, -29.444543838500977, -28.193279266357422, -26.9420166015625, -25.690753936767578, -24.439489364624023, -23.18822479248047, -21.936962127685547, -20.685699462890625, -19.43443489074707, -18.183170318603516, -16.931907653808594, -15.680644035339355, -14.429380416870117, -13.178116798400879, -11.92685317993164, -10.675589561462402, -9.424325942993164, -8.173062324523926, -6.9217987060546875, -5.670535087585449, -4.419271469116211, -3.1680078506469727, -1.9167442321777344, -0.6654806137084961, 0.5857830047607422, 1.8370466232299805, 3.0883102416992188, 4.339573860168457, 5.590837478637695, 6.842101097106934, 8.093364715576172, 9.34462833404541, 10.595891952514648, 11.847155570983887, 13.098419189453125, 14.349682807922363, 15.600946426391602, 16.852210998535156, 18.103473663330078, 19.354736328125, 20.606000900268555, 21.85726547241211, 23.10852813720703, 24.359790802001953, 25.611055374145508, 26.862319946289062, 28.113582611083984, 29.364845275878906, 30.61610984802246, 31.867374420166016, 33.11863708496094, 34.36989974975586, 35.62116241455078, 36.87242889404297, 38.12369155883789]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 18.0, 29.0, 32.0, 56.0, 89.0, 120.0, 229.0, 321.0, 508.0, 769.0, 1218.0, 1986.0, 3195.0, 5218.0, 7978.0, 13360.0, 21682.0, 34792.0, 54989.0, 82508.0, 117315.0, 147298.0, 152921.0, 130741.0, 95787.0, 64495.0, 41984.0, 25982.0, 16393.0, 9931.0, 6185.0, 3803.0, 2401.0, 1495.0, 992.0, 608.0, 398.0, 248.0, 162.0, 110.0, 59.0, 60.0, 33.0, 12.0, 18.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-41.125, -39.88623046875, -38.6474609375, -37.40869140625, -36.169921875, -34.93115234375, -33.6923828125, -32.45361328125, -31.21484375, -29.97607421875, -28.7373046875, -27.49853515625, -26.259765625, -25.02099609375, -23.7822265625, -22.54345703125, -21.3046875, -20.06591796875, -18.8271484375, -17.58837890625, -16.349609375, -15.11083984375, -13.8720703125, -12.63330078125, -11.39453125, -10.15576171875, -8.9169921875, -7.67822265625, -6.439453125, -5.20068359375, -3.9619140625, -2.72314453125, -1.484375, -0.24560546875, 0.9931640625, 2.23193359375, 3.470703125, 4.70947265625, 5.9482421875, 7.18701171875, 8.42578125, 9.66455078125, 10.9033203125, 12.14208984375, 13.380859375, 14.61962890625, 15.8583984375, 17.09716796875, 18.3359375, 19.57470703125, 20.8134765625, 22.05224609375, 23.291015625, 24.52978515625, 25.7685546875, 27.00732421875, 28.24609375, 29.48486328125, 30.7236328125, 31.96240234375, 33.201171875, 34.43994140625, 35.6787109375, 36.91748046875, 38.15625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 7.0, 11.0, 6.0, 8.0, 21.0, 19.0, 14.0, 17.0, 19.0, 31.0, 23.0, 27.0, 31.0, 27.0, 37.0, 39.0, 37.0, 38.0, 45.0, 49.0, 39.0, 33.0, 36.0, 32.0, 41.0, 32.0, 33.0, 33.0, 24.0, 25.0, 26.0, 27.0, 18.0, 19.0, 13.0, 10.0, 3.0, 10.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-37.4375, -36.24951171875, -35.0615234375, -33.87353515625, -32.685546875, -31.49755859375, -30.3095703125, -29.12158203125, -27.93359375, -26.74560546875, -25.5576171875, -24.36962890625, -23.181640625, -21.99365234375, -20.8056640625, -19.61767578125, -18.4296875, -17.24169921875, -16.0537109375, -14.86572265625, -13.677734375, -12.48974609375, -11.3017578125, -10.11376953125, -8.92578125, -7.73779296875, -6.5498046875, -5.36181640625, -4.173828125, -2.98583984375, -1.7978515625, -0.60986328125, 0.578125, 1.76611328125, 2.9541015625, 4.14208984375, 5.330078125, 6.51806640625, 7.7060546875, 8.89404296875, 10.08203125, 11.27001953125, 12.4580078125, 13.64599609375, 14.833984375, 16.02197265625, 17.2099609375, 18.39794921875, 19.5859375, 20.77392578125, 21.9619140625, 23.14990234375, 24.337890625, 25.52587890625, 26.7138671875, 27.90185546875, 29.08984375, 30.27783203125, 31.4658203125, 32.65380859375, 33.841796875, 35.02978515625, 36.2177734375, 37.40576171875, 38.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 12.0, 11.0, 19.0, 23.0, 32.0, 71.0, 109.0, 139.0, 238.0, 316.0, 511.0, 736.0, 1154.0, 1763.0, 2675.0, 4248.0, 6646.0, 10092.0, 15752.0, 24521.0, 37484.0, 56261.0, 81122.0, 109266.0, 131553.0, 137465.0, 123154.0, 97196.0, 69339.0, 47437.0, 31581.0, 20340.0, 13259.0, 8595.0, 5374.0, 3503.0, 2245.0, 1526.0, 925.0, 639.0, 434.0, 266.0, 163.0, 126.0, 81.0, 45.0, 42.0, 16.0, 17.0, 8.0, 7.0, 8.0, 4.0, 7.0, 1.0, 3.0, 2.0], "bins": [-32.40625, -31.402587890625, -30.39892578125, -29.395263671875, -28.3916015625, -27.387939453125, -26.38427734375, -25.380615234375, -24.376953125, -23.373291015625, -22.36962890625, -21.365966796875, -20.3623046875, -19.358642578125, -18.35498046875, -17.351318359375, -16.34765625, -15.343994140625, -14.34033203125, -13.336669921875, -12.3330078125, -11.329345703125, -10.32568359375, -9.322021484375, -8.318359375, -7.314697265625, -6.31103515625, -5.307373046875, -4.3037109375, -3.300048828125, -2.29638671875, -1.292724609375, -0.2890625, 0.714599609375, 1.71826171875, 2.721923828125, 3.7255859375, 4.729248046875, 5.73291015625, 6.736572265625, 7.740234375, 8.743896484375, 9.74755859375, 10.751220703125, 11.7548828125, 12.758544921875, 13.76220703125, 14.765869140625, 15.76953125, 16.773193359375, 17.77685546875, 18.780517578125, 19.7841796875, 20.787841796875, 21.79150390625, 22.795166015625, 23.798828125, 24.802490234375, 25.80615234375, 26.809814453125, 27.8134765625, 28.817138671875, 29.82080078125, 30.824462890625, 31.828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 6.0, 13.0, 7.0, 15.0, 16.0, 16.0, 13.0, 21.0, 18.0, 25.0, 26.0, 37.0, 23.0, 27.0, 31.0, 45.0, 38.0, 38.0, 42.0, 48.0, 31.0, 38.0, 46.0, 44.0, 34.0, 29.0, 31.0, 29.0, 24.0, 13.0, 25.0, 24.0, 14.0, 17.0, 12.0, 12.0, 12.0, 7.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.921875, -21.212646484375, -20.50341796875, -19.794189453125, -19.0849609375, -18.375732421875, -17.66650390625, -16.957275390625, -16.248046875, -15.538818359375, -14.82958984375, -14.120361328125, -13.4111328125, -12.701904296875, -11.99267578125, -11.283447265625, -10.57421875, -9.864990234375, -9.15576171875, -8.446533203125, -7.7373046875, -7.028076171875, -6.31884765625, -5.609619140625, -4.900390625, -4.191162109375, -3.48193359375, -2.772705078125, -2.0634765625, -1.354248046875, -0.64501953125, 0.064208984375, 0.7734375, 1.482666015625, 2.19189453125, 2.901123046875, 3.6103515625, 4.319580078125, 5.02880859375, 5.738037109375, 6.447265625, 7.156494140625, 7.86572265625, 8.574951171875, 9.2841796875, 9.993408203125, 10.70263671875, 11.411865234375, 12.12109375, 12.830322265625, 13.53955078125, 14.248779296875, 14.9580078125, 15.667236328125, 16.37646484375, 17.085693359375, 17.794921875, 18.504150390625, 19.21337890625, 19.922607421875, 20.6318359375, 21.341064453125, 22.05029296875, 22.759521484375, 23.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 8.0, 5.0, 12.0, 20.0, 17.0, 27.0, 43.0, 46.0, 80.0, 93.0, 139.0, 168.0, 248.0, 352.0, 498.0, 770.0, 1068.0, 1859.0, 3158.0, 6060.0, 12692.0, 31188.0, 84872.0, 233400.0, 360935.0, 193120.0, 68165.0, 25631.0, 10820.0, 5189.0, 2798.0, 1664.0, 1090.0, 699.0, 426.0, 338.0, 214.0, 181.0, 133.0, 77.0, 55.0, 44.0, 45.0, 36.0, 15.0, 19.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.5625, -47.98388671875, -46.4052734375, -44.82666015625, -43.248046875, -41.66943359375, -40.0908203125, -38.51220703125, -36.93359375, -35.35498046875, -33.7763671875, -32.19775390625, -30.619140625, -29.04052734375, -27.4619140625, -25.88330078125, -24.3046875, -22.72607421875, -21.1474609375, -19.56884765625, -17.990234375, -16.41162109375, -14.8330078125, -13.25439453125, -11.67578125, -10.09716796875, -8.5185546875, -6.93994140625, -5.361328125, -3.78271484375, -2.2041015625, -0.62548828125, 0.953125, 2.53173828125, 4.1103515625, 5.68896484375, 7.267578125, 8.84619140625, 10.4248046875, 12.00341796875, 13.58203125, 15.16064453125, 16.7392578125, 18.31787109375, 19.896484375, 21.47509765625, 23.0537109375, 24.63232421875, 26.2109375, 27.78955078125, 29.3681640625, 30.94677734375, 32.525390625, 34.10400390625, 35.6826171875, 37.26123046875, 38.83984375, 40.41845703125, 41.9970703125, 43.57568359375, 45.154296875, 46.73291015625, 48.3115234375, 49.89013671875, 51.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 5.0, 7.0, 15.0, 26.0, 31.0, 60.0, 69.0, 90.0, 135.0, 138.0, 120.0, 93.0, 66.0, 40.0, 38.0, 19.0, 6.0, 14.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00440216064453125, -0.004246711730957031, -0.0040912628173828125, -0.003935813903808594, -0.003780364990234375, -0.0036249160766601562, -0.0034694671630859375, -0.0033140182495117188, -0.0031585693359375, -0.0030031204223632812, -0.0028476715087890625, -0.0026922225952148438, -0.002536773681640625, -0.0023813247680664062, -0.0022258758544921875, -0.0020704269409179688, -0.00191497802734375, -0.0017595291137695312, -0.0016040802001953125, -0.0014486312866210938, -0.001293182373046875, -0.0011377334594726562, -0.0009822845458984375, -0.0008268356323242188, -0.00067138671875, -0.0005159378051757812, -0.0003604888916015625, -0.00020503997802734375, -4.9591064453125e-05, 0.00010585784912109375, 0.0002613067626953125, 0.00041675567626953125, 0.00057220458984375, 0.0007276535034179688, 0.0008831024169921875, 0.0010385513305664062, 0.001194000244140625, 0.0013494491577148438, 0.0015048980712890625, 0.0016603469848632812, 0.0018157958984375, 0.0019712448120117188, 0.0021266937255859375, 0.0022821426391601562, 0.002437591552734375, 0.0025930404663085938, 0.0027484893798828125, 0.0029039382934570312, 0.00305938720703125, 0.0032148361206054688, 0.0033702850341796875, 0.0035257339477539062, 0.003681182861328125, 0.0038366317749023438, 0.0039920806884765625, 0.004147529602050781, 0.004302978515625, 0.004458427429199219, 0.0046138763427734375, 0.004769325256347656, 0.004924774169921875, 0.005080223083496094, 0.0052356719970703125, 0.005391120910644531, 0.00554656982421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 6.0, 13.0, 22.0, 32.0, 41.0, 58.0, 75.0, 116.0, 165.0, 279.0, 324.0, 506.0, 808.0, 1139.0, 1765.0, 2661.0, 4071.0, 6740.0, 11136.0, 18846.0, 32743.0, 57284.0, 97009.0, 149795.0, 188198.0, 172547.0, 122548.0, 74373.0, 43168.0, 24369.0, 14175.0, 8729.0, 5229.0, 3240.0, 2137.0, 1349.0, 951.0, 571.0, 418.0, 266.0, 204.0, 130.0, 109.0, 60.0, 52.0, 38.0, 14.0, 10.0, 19.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.183349609375, -22.42919921875, -21.675048828125, -20.9208984375, -20.166748046875, -19.41259765625, -18.658447265625, -17.904296875, -17.150146484375, -16.39599609375, -15.641845703125, -14.8876953125, -14.133544921875, -13.37939453125, -12.625244140625, -11.87109375, -11.116943359375, -10.36279296875, -9.608642578125, -8.8544921875, -8.100341796875, -7.34619140625, -6.592041015625, -5.837890625, -5.083740234375, -4.32958984375, -3.575439453125, -2.8212890625, -2.067138671875, -1.31298828125, -0.558837890625, 0.1953125, 0.949462890625, 1.70361328125, 2.457763671875, 3.2119140625, 3.966064453125, 4.72021484375, 5.474365234375, 6.228515625, 6.982666015625, 7.73681640625, 8.490966796875, 9.2451171875, 9.999267578125, 10.75341796875, 11.507568359375, 12.26171875, 13.015869140625, 13.77001953125, 14.524169921875, 15.2783203125, 16.032470703125, 16.78662109375, 17.540771484375, 18.294921875, 19.049072265625, 19.80322265625, 20.557373046875, 21.3115234375, 22.065673828125, 22.81982421875, 23.573974609375, 24.328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 9.0, 6.0, 8.0, 9.0, 14.0, 11.0, 16.0, 28.0, 33.0, 33.0, 33.0, 47.0, 50.0, 72.0, 71.0, 62.0, 78.0, 58.0, 54.0, 49.0, 44.0, 43.0, 27.0, 31.0, 25.0, 13.0, 12.0, 16.0, 12.0, 9.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.7421875, -10.4505615234375, -10.158935546875, -9.8673095703125, -9.57568359375, -9.2840576171875, -8.992431640625, -8.7008056640625, -8.4091796875, -8.1175537109375, -7.825927734375, -7.5343017578125, -7.24267578125, -6.9510498046875, -6.659423828125, -6.3677978515625, -6.076171875, -5.7845458984375, -5.492919921875, -5.2012939453125, -4.90966796875, -4.6180419921875, -4.326416015625, -4.0347900390625, -3.7431640625, -3.4515380859375, -3.159912109375, -2.8682861328125, -2.57666015625, -2.2850341796875, -1.993408203125, -1.7017822265625, -1.41015625, -1.1185302734375, -0.826904296875, -0.5352783203125, -0.24365234375, 0.0479736328125, 0.339599609375, 0.6312255859375, 0.9228515625, 1.2144775390625, 1.506103515625, 1.7977294921875, 2.08935546875, 2.3809814453125, 2.672607421875, 2.9642333984375, 3.255859375, 3.5474853515625, 3.839111328125, 4.1307373046875, 4.42236328125, 4.7139892578125, 5.005615234375, 5.2972412109375, 5.5888671875, 5.8804931640625, 6.172119140625, 6.4637451171875, 6.75537109375, 7.0469970703125, 7.338623046875, 7.6302490234375, 7.921875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 13.0, 20.0, 23.0, 23.0, 30.0, 35.0, 39.0, 53.0, 57.0, 49.0, 57.0, 79.0, 57.0, 65.0, 70.0, 62.0, 58.0, 40.0, 27.0, 26.0, 20.0, 20.0, 15.0, 7.0, 2.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.41061019897461, -48.828453063964844, -47.246299743652344, -45.66414260864258, -44.08198547363281, -42.49983215332031, -40.91767501831055, -39.33551788330078, -37.75336456298828, -36.171207427978516, -34.589054107666016, -33.00689697265625, -31.424741744995117, -29.842586517333984, -28.26042938232422, -26.678274154663086, -25.09611701965332, -23.513961791992188, -21.931804656982422, -20.34964942932129, -18.767494201660156, -17.18533706665039, -15.603181838989258, -14.021026611328125, -12.438870429992676, -10.856714248657227, -9.274559020996094, -7.6924028396606445, -6.1102471351623535, -4.5280914306640625, -2.9459352493286133, -1.3637800216674805, 0.21837615966796875, 1.8005319833755493, 3.38268780708313, 4.96484375, 6.546999454498291, 8.129155158996582, 9.711311340332031, 11.293466567993164, 12.875622749328613, 14.457778930664062, 16.039934158325195, 17.622089385986328, 19.204246520996094, 20.786401748657227, 22.36855697631836, 23.950714111328125, 25.532869338989258, 27.11502456665039, 28.697181701660156, 30.27933692932129, 31.861492156982422, 33.44364929199219, 35.02580261230469, 36.60795974731445, 38.19011688232422, 39.772274017333984, 41.354427337646484, 42.93658447265625, 44.518741607666016, 46.100894927978516, 47.68305206298828, 49.26520538330078, 50.84736251831055]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 4.0, 5.0, 12.0, 10.0, 9.0, 13.0, 20.0, 14.0, 25.0, 19.0, 20.0, 26.0, 36.0, 40.0, 30.0, 36.0, 47.0, 39.0, 39.0, 42.0, 26.0, 33.0, 41.0, 48.0, 37.0, 34.0, 32.0, 28.0, 39.0, 27.0, 22.0, 28.0, 20.0, 17.0, 15.0, 19.0, 12.0, 7.0, 4.0, 1.0, 4.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.945762634277344, -39.7737922668457, -38.60182189941406, -37.429847717285156, -36.257877349853516, -35.085906982421875, -33.913936614990234, -32.741966247558594, -31.56999397277832, -30.39802360534668, -29.226051330566406, -28.054080963134766, -26.882110595703125, -25.71013832092285, -24.53816795349121, -23.366195678710938, -22.194225311279297, -21.022254943847656, -19.850282669067383, -18.678312301635742, -17.50634002685547, -16.334369659423828, -15.162399291992188, -13.99042797088623, -12.818456649780273, -11.646485328674316, -10.47451400756836, -9.302543640136719, -8.130572319030762, -6.958600997924805, -5.786630153656006, -4.614659309387207, -3.44268798828125, -2.270716905593872, -1.0987458229064941, 0.07322525978088379, 1.2451963424682617, 2.4171676635742188, 3.5891385078430176, 4.761109352111816, 5.933080673217773, 7.1050519943237305, 8.277023315429688, 9.448993682861328, 10.620965003967285, 11.792936325073242, 12.964906692504883, 14.13687801361084, 15.308849334716797, 16.480819702148438, 17.65279197692871, 18.82476234436035, 19.996734619140625, 21.168704986572266, 22.340675354003906, 23.512645721435547, 24.68461799621582, 25.85658836364746, 27.028560638427734, 28.200531005859375, 29.372501373291016, 30.54447364807129, 31.71644401550293, 32.8884162902832, 34.060386657714844]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 5.0, 8.0, 13.0, 30.0, 52.0, 75.0, 94.0, 171.0, 263.0, 385.0, 645.0, 949.0, 1478.0, 2152.0, 3267.0, 5214.0, 8384.0, 12862.0, 21182.0, 34367.0, 57172.0, 96861.0, 166869.0, 286547.0, 470811.0, 664112.0, 733194.0, 611312.0, 409949.0, 245962.0, 142854.0, 84457.0, 49803.0, 30466.0, 19128.0, 11910.0, 7491.0, 4870.0, 3087.0, 2018.0, 1289.0, 861.0, 536.0, 376.0, 242.0, 176.0, 133.0, 67.0, 52.0, 32.0, 22.0, 10.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-26.28125, -25.41552734375, -24.5498046875, -23.68408203125, -22.818359375, -21.95263671875, -21.0869140625, -20.22119140625, -19.35546875, -18.48974609375, -17.6240234375, -16.75830078125, -15.892578125, -15.02685546875, -14.1611328125, -13.29541015625, -12.4296875, -11.56396484375, -10.6982421875, -9.83251953125, -8.966796875, -8.10107421875, -7.2353515625, -6.36962890625, -5.50390625, -4.63818359375, -3.7724609375, -2.90673828125, -2.041015625, -1.17529296875, -0.3095703125, 0.55615234375, 1.421875, 2.28759765625, 3.1533203125, 4.01904296875, 4.884765625, 5.75048828125, 6.6162109375, 7.48193359375, 8.34765625, 9.21337890625, 10.0791015625, 10.94482421875, 11.810546875, 12.67626953125, 13.5419921875, 14.40771484375, 15.2734375, 16.13916015625, 17.0048828125, 17.87060546875, 18.736328125, 19.60205078125, 20.4677734375, 21.33349609375, 22.19921875, 23.06494140625, 23.9306640625, 24.79638671875, 25.662109375, 26.52783203125, 27.3935546875, 28.25927734375, 29.125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 3.0, 9.0, 9.0, 16.0, 15.0, 13.0, 15.0, 20.0, 18.0, 14.0, 23.0, 27.0, 25.0, 30.0, 32.0, 30.0, 35.0, 37.0, 37.0, 44.0, 32.0, 39.0, 35.0, 36.0, 23.0, 37.0, 29.0, 21.0, 34.0, 27.0, 44.0, 22.0, 24.0, 22.0, 19.0, 18.0, 17.0, 12.0, 12.0, 9.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0], "bins": [-26.0, -25.259033203125, -24.51806640625, -23.777099609375, -23.0361328125, -22.295166015625, -21.55419921875, -20.813232421875, -20.072265625, -19.331298828125, -18.59033203125, -17.849365234375, -17.1083984375, -16.367431640625, -15.62646484375, -14.885498046875, -14.14453125, -13.403564453125, -12.66259765625, -11.921630859375, -11.1806640625, -10.439697265625, -9.69873046875, -8.957763671875, -8.216796875, -7.475830078125, -6.73486328125, -5.993896484375, -5.2529296875, -4.511962890625, -3.77099609375, -3.030029296875, -2.2890625, -1.548095703125, -0.80712890625, -0.066162109375, 0.6748046875, 1.415771484375, 2.15673828125, 2.897705078125, 3.638671875, 4.379638671875, 5.12060546875, 5.861572265625, 6.6025390625, 7.343505859375, 8.08447265625, 8.825439453125, 9.56640625, 10.307373046875, 11.04833984375, 11.789306640625, 12.5302734375, 13.271240234375, 14.01220703125, 14.753173828125, 15.494140625, 16.235107421875, 16.97607421875, 17.717041015625, 18.4580078125, 19.198974609375, 19.93994140625, 20.680908203125, 21.421875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 13.0, 28.0, 36.0, 47.0, 74.0, 94.0, 163.0, 272.0, 367.0, 608.0, 961.0, 1476.0, 2503.0, 3905.0, 6369.0, 10576.0, 17554.0, 30280.0, 51555.0, 88417.0, 152494.0, 259206.0, 422624.0, 626253.0, 749351.0, 650134.0, 447870.0, 276649.0, 163944.0, 95059.0, 55061.0, 32055.0, 18930.0, 11283.0, 7012.0, 4055.0, 2524.0, 1575.0, 1047.0, 629.0, 427.0, 254.0, 180.0, 118.0, 74.0, 53.0, 38.0, 26.0, 15.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.507080078125, -26.57666015625, -25.646240234375, -24.7158203125, -23.785400390625, -22.85498046875, -21.924560546875, -20.994140625, -20.063720703125, -19.13330078125, -18.202880859375, -17.2724609375, -16.342041015625, -15.41162109375, -14.481201171875, -13.55078125, -12.620361328125, -11.68994140625, -10.759521484375, -9.8291015625, -8.898681640625, -7.96826171875, -7.037841796875, -6.107421875, -5.177001953125, -4.24658203125, -3.316162109375, -2.3857421875, -1.455322265625, -0.52490234375, 0.405517578125, 1.3359375, 2.266357421875, 3.19677734375, 4.127197265625, 5.0576171875, 5.988037109375, 6.91845703125, 7.848876953125, 8.779296875, 9.709716796875, 10.64013671875, 11.570556640625, 12.5009765625, 13.431396484375, 14.36181640625, 15.292236328125, 16.22265625, 17.153076171875, 18.08349609375, 19.013916015625, 19.9443359375, 20.874755859375, 21.80517578125, 22.735595703125, 23.666015625, 24.596435546875, 25.52685546875, 26.457275390625, 27.3876953125, 28.318115234375, 29.24853515625, 30.178955078125, 31.109375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 14.0, 11.0, 20.0, 27.0, 27.0, 28.0, 50.0, 54.0, 65.0, 82.0, 94.0, 93.0, 133.0, 157.0, 140.0, 195.0, 211.0, 230.0, 229.0, 235.0, 260.0, 200.0, 209.0, 183.0, 178.0, 144.0, 124.0, 131.0, 107.0, 72.0, 77.0, 55.0, 48.0, 30.0, 35.0, 15.0, 16.0, 19.0, 11.0, 9.0, 11.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.328125, -9.976806640625, -9.62548828125, -9.274169921875, -8.9228515625, -8.571533203125, -8.22021484375, -7.868896484375, -7.517578125, -7.166259765625, -6.81494140625, -6.463623046875, -6.1123046875, -5.760986328125, -5.40966796875, -5.058349609375, -4.70703125, -4.355712890625, -4.00439453125, -3.653076171875, -3.3017578125, -2.950439453125, -2.59912109375, -2.247802734375, -1.896484375, -1.545166015625, -1.19384765625, -0.842529296875, -0.4912109375, -0.139892578125, 0.21142578125, 0.562744140625, 0.9140625, 1.265380859375, 1.61669921875, 1.968017578125, 2.3193359375, 2.670654296875, 3.02197265625, 3.373291015625, 3.724609375, 4.075927734375, 4.42724609375, 4.778564453125, 5.1298828125, 5.481201171875, 5.83251953125, 6.183837890625, 6.53515625, 6.886474609375, 7.23779296875, 7.589111328125, 7.9404296875, 8.291748046875, 8.64306640625, 8.994384765625, 9.345703125, 9.697021484375, 10.04833984375, 10.399658203125, 10.7509765625, 11.102294921875, 11.45361328125, 11.804931640625, 12.15625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 3.0, 4.0, 7.0, 6.0, 8.0, 9.0, 14.0, 24.0, 23.0, 20.0, 29.0, 25.0, 36.0, 37.0, 46.0, 43.0, 63.0, 45.0, 69.0, 46.0, 51.0, 40.0, 51.0, 53.0, 40.0, 33.0, 24.0, 20.0, 20.0, 12.0, 20.0, 13.0, 9.0, 15.0, 11.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.933067321777344, -34.862876892089844, -33.792686462402344, -32.72249221801758, -31.652301788330078, -30.582111358642578, -29.511919021606445, -28.441726684570312, -27.371536254882812, -26.301345825195312, -25.23115348815918, -24.160961151123047, -23.090770721435547, -22.020580291748047, -20.950387954711914, -19.88019561767578, -18.81000518798828, -17.73981475830078, -16.66962242126465, -15.599431037902832, -14.529239654541016, -13.4590482711792, -12.388856887817383, -11.318665504455566, -10.24847412109375, -9.178282737731934, -8.108091354370117, -7.037899971008301, -5.967708587646484, -4.897517204284668, -3.8273258209228516, -2.757134437561035, -1.6869392395019531, -0.6167478561401367, 0.4534435272216797, 1.523634910583496, 2.5938262939453125, 3.664017677307129, 4.734209060668945, 5.804400444030762, 6.874591827392578, 7.9447832107543945, 9.014974594116211, 10.085165977478027, 11.155357360839844, 12.22554874420166, 13.295740127563477, 14.365931510925293, 15.43612289428711, 16.50631332397461, 17.576505661010742, 18.646697998046875, 19.716888427734375, 20.787078857421875, 21.857271194458008, 22.92746353149414, 23.99765396118164, 25.06784439086914, 26.138036727905273, 27.208229064941406, 28.278419494628906, 29.348609924316406, 30.41880226135254, 31.488994598388672, 32.55918502807617]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 2.0, 10.0, 6.0, 8.0, 5.0, 16.0, 15.0, 27.0, 21.0, 24.0, 34.0, 29.0, 31.0, 36.0, 25.0, 34.0, 44.0, 46.0, 53.0, 31.0, 44.0, 50.0, 42.0, 38.0, 37.0, 40.0, 33.0, 29.0, 28.0, 25.0, 17.0, 13.0, 15.0, 17.0, 15.0, 10.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.264554977416992, -28.384599685668945, -27.5046443939209, -26.62468910217285, -25.744733810424805, -24.864778518676758, -23.984825134277344, -23.104869842529297, -22.22491455078125, -21.344959259033203, -20.465003967285156, -19.58504867553711, -18.705093383789062, -17.825138092041016, -16.94518280029297, -16.065227508544922, -15.185272216796875, -14.305316925048828, -13.425361633300781, -12.545406341552734, -11.665451049804688, -10.78549575805664, -9.90554141998291, -9.025586128234863, -8.145630836486816, -7.2656755447387695, -6.385720252990723, -5.505765438079834, -4.625810146331787, -3.7458548545837402, -2.8659000396728516, -1.9859447479248047, -1.1059894561767578, -0.2260342836380005, 0.6539208889007568, 1.5338759422302246, 2.4138312339782715, 3.2937865257263184, 4.173741340637207, 5.053696632385254, 5.933651924133301, 6.813607215881348, 7.6935625076293945, 8.573516845703125, 9.453472137451172, 10.333427429199219, 11.213382720947266, 12.093338012695312, 12.97329330444336, 13.853248596191406, 14.733203887939453, 15.6131591796875, 16.493114471435547, 17.373069763183594, 18.25302505493164, 19.132980346679688, 20.012935638427734, 20.89289093017578, 21.772846221923828, 22.652801513671875, 23.532756805419922, 24.41271209716797, 25.292667388916016, 26.172622680664062, 27.052576065063477]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 14.0, 35.0, 33.0, 60.0, 78.0, 108.0, 174.0, 271.0, 424.0, 650.0, 1033.0, 1687.0, 2799.0, 4627.0, 7967.0, 13674.0, 24296.0, 43021.0, 78120.0, 132827.0, 193216.0, 200139.0, 144819.0, 86150.0, 48282.0, 26953.0, 15204.0, 8608.0, 5130.0, 3081.0, 1923.0, 1169.0, 674.0, 430.0, 291.0, 197.0, 123.0, 99.0, 57.0, 33.0, 27.0, 13.0, 9.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.625, -42.306640625, -40.98828125, -39.669921875, -38.3515625, -37.033203125, -35.71484375, -34.396484375, -33.078125, -31.759765625, -30.44140625, -29.123046875, -27.8046875, -26.486328125, -25.16796875, -23.849609375, -22.53125, -21.212890625, -19.89453125, -18.576171875, -17.2578125, -15.939453125, -14.62109375, -13.302734375, -11.984375, -10.666015625, -9.34765625, -8.029296875, -6.7109375, -5.392578125, -4.07421875, -2.755859375, -1.4375, -0.119140625, 1.19921875, 2.517578125, 3.8359375, 5.154296875, 6.47265625, 7.791015625, 9.109375, 10.427734375, 11.74609375, 13.064453125, 14.3828125, 15.701171875, 17.01953125, 18.337890625, 19.65625, 20.974609375, 22.29296875, 23.611328125, 24.9296875, 26.248046875, 27.56640625, 28.884765625, 30.203125, 31.521484375, 32.83984375, 34.158203125, 35.4765625, 36.794921875, 38.11328125, 39.431640625, 40.75]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 8.0, 3.0, 5.0, 8.0, 11.0, 14.0, 13.0, 10.0, 26.0, 24.0, 19.0, 27.0, 19.0, 37.0, 32.0, 35.0, 32.0, 37.0, 43.0, 47.0, 49.0, 47.0, 42.0, 42.0, 42.0, 36.0, 35.0, 29.0, 19.0, 34.0, 20.0, 14.0, 33.0, 18.0, 14.0, 17.0, 8.0, 10.0, 8.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.78125, -27.923095703125, -27.06494140625, -26.206787109375, -25.3486328125, -24.490478515625, -23.63232421875, -22.774169921875, -21.916015625, -21.057861328125, -20.19970703125, -19.341552734375, -18.4833984375, -17.625244140625, -16.76708984375, -15.908935546875, -15.05078125, -14.192626953125, -13.33447265625, -12.476318359375, -11.6181640625, -10.760009765625, -9.90185546875, -9.043701171875, -8.185546875, -7.327392578125, -6.46923828125, -5.611083984375, -4.7529296875, -3.894775390625, -3.03662109375, -2.178466796875, -1.3203125, -0.462158203125, 0.39599609375, 1.254150390625, 2.1123046875, 2.970458984375, 3.82861328125, 4.686767578125, 5.544921875, 6.403076171875, 7.26123046875, 8.119384765625, 8.9775390625, 9.835693359375, 10.69384765625, 11.552001953125, 12.41015625, 13.268310546875, 14.12646484375, 14.984619140625, 15.8427734375, 16.700927734375, 17.55908203125, 18.417236328125, 19.275390625, 20.133544921875, 20.99169921875, 21.849853515625, 22.7080078125, 23.566162109375, 24.42431640625, 25.282470703125, 26.140625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 9.0, 7.0, 7.0, 19.0, 23.0, 30.0, 50.0, 64.0, 77.0, 118.0, 212.0, 289.0, 406.0, 665.0, 984.0, 1595.0, 2476.0, 4155.0, 7073.0, 12803.0, 26875.0, 64776.0, 179128.0, 371929.0, 224769.0, 81384.0, 32810.0, 15212.0, 8128.0, 4619.0, 2745.0, 1728.0, 1146.0, 760.0, 508.0, 330.0, 198.0, 140.0, 92.0, 54.0, 56.0, 41.0, 23.0, 19.0, 12.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.6220703125, -69.119140625, -66.6162109375, -64.11328125, -61.6103515625, -59.107421875, -56.6044921875, -54.1015625, -51.5986328125, -49.095703125, -46.5927734375, -44.08984375, -41.5869140625, -39.083984375, -36.5810546875, -34.078125, -31.5751953125, -29.072265625, -26.5693359375, -24.06640625, -21.5634765625, -19.060546875, -16.5576171875, -14.0546875, -11.5517578125, -9.048828125, -6.5458984375, -4.04296875, -1.5400390625, 0.962890625, 3.4658203125, 5.96875, 8.4716796875, 10.974609375, 13.4775390625, 15.98046875, 18.4833984375, 20.986328125, 23.4892578125, 25.9921875, 28.4951171875, 30.998046875, 33.5009765625, 36.00390625, 38.5068359375, 41.009765625, 43.5126953125, 46.015625, 48.5185546875, 51.021484375, 53.5244140625, 56.02734375, 58.5302734375, 61.033203125, 63.5361328125, 66.0390625, 68.5419921875, 71.044921875, 73.5478515625, 76.05078125, 78.5537109375, 81.056640625, 83.5595703125, 86.0625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 1.0, 6.0, 12.0, 6.0, 11.0, 19.0, 9.0, 17.0, 28.0, 14.0, 17.0, 22.0, 30.0, 23.0, 31.0, 34.0, 35.0, 52.0, 37.0, 43.0, 38.0, 50.0, 42.0, 31.0, 36.0, 35.0, 40.0, 34.0, 27.0, 26.0, 35.0, 16.0, 22.0, 21.0, 23.0, 12.0, 14.0, 9.0, 9.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.296875, -15.7578125, -15.21875, -14.6796875, -14.140625, -13.6015625, -13.0625, -12.5234375, -11.984375, -11.4453125, -10.90625, -10.3671875, -9.828125, -9.2890625, -8.75, -8.2109375, -7.671875, -7.1328125, -6.59375, -6.0546875, -5.515625, -4.9765625, -4.4375, -3.8984375, -3.359375, -2.8203125, -2.28125, -1.7421875, -1.203125, -0.6640625, -0.125, 0.4140625, 0.953125, 1.4921875, 2.03125, 2.5703125, 3.109375, 3.6484375, 4.1875, 4.7265625, 5.265625, 5.8046875, 6.34375, 6.8828125, 7.421875, 7.9609375, 8.5, 9.0390625, 9.578125, 10.1171875, 10.65625, 11.1953125, 11.734375, 12.2734375, 12.8125, 13.3515625, 13.890625, 14.4296875, 14.96875, 15.5078125, 16.046875, 16.5859375, 17.125, 17.6640625, 18.203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 14.0, 15.0, 19.0, 29.0, 43.0, 65.0, 85.0, 112.0, 203.0, 280.0, 502.0, 789.0, 1327.0, 2336.0, 4495.0, 8823.0, 17827.0, 38093.0, 86998.0, 192638.0, 301301.0, 211659.0, 97833.0, 42709.0, 19481.0, 9641.0, 4896.0, 2642.0, 1488.0, 812.0, 478.0, 300.0, 196.0, 127.0, 94.0, 66.0, 31.0, 30.0, 19.0, 15.0, 16.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-30.65625, -29.76953125, -28.8828125, -27.99609375, -27.109375, -26.22265625, -25.3359375, -24.44921875, -23.5625, -22.67578125, -21.7890625, -20.90234375, -20.015625, -19.12890625, -18.2421875, -17.35546875, -16.46875, -15.58203125, -14.6953125, -13.80859375, -12.921875, -12.03515625, -11.1484375, -10.26171875, -9.375, -8.48828125, -7.6015625, -6.71484375, -5.828125, -4.94140625, -4.0546875, -3.16796875, -2.28125, -1.39453125, -0.5078125, 0.37890625, 1.265625, 2.15234375, 3.0390625, 3.92578125, 4.8125, 5.69921875, 6.5859375, 7.47265625, 8.359375, 9.24609375, 10.1328125, 11.01953125, 11.90625, 12.79296875, 13.6796875, 14.56640625, 15.453125, 16.33984375, 17.2265625, 18.11328125, 19.0, 19.88671875, 20.7734375, 21.66015625, 22.546875, 23.43359375, 24.3203125, 25.20703125, 26.09375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 10.0, 9.0, 14.0, 21.0, 30.0, 24.0, 34.0, 43.0, 66.0, 65.0, 73.0, 96.0, 94.0, 84.0, 54.0, 51.0, 39.0, 29.0, 23.0, 21.0, 19.0, 12.0, 11.0, 5.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0012836456298828125, -0.0012420117855072021, -0.0012003779411315918, -0.0011587440967559814, -0.001117110252380371, -0.0010754764080047607, -0.0010338425636291504, -0.00099220871925354, -0.0009505748748779297, -0.0009089410305023193, -0.000867307186126709, -0.0008256733417510986, -0.0007840394973754883, -0.0007424056529998779, -0.0007007718086242676, -0.0006591379642486572, -0.0006175041198730469, -0.0005758702754974365, -0.0005342364311218262, -0.0004926025867462158, -0.00045096874237060547, -0.0004093348979949951, -0.00036770105361938477, -0.0003260672092437744, -0.00028443336486816406, -0.0002427995204925537, -0.00020116567611694336, -0.000159531831741333, -0.00011789798736572266, -7.62641429901123e-05, -3.463029861450195e-05, 7.0035457611083984e-06, 4.863739013671875e-05, 9.02712345123291e-05, 0.00013190507888793945, 0.0001735389232635498, 0.00021517276763916016, 0.0002568066120147705, 0.00029844045639038086, 0.0003400743007659912, 0.00038170814514160156, 0.0004233419895172119, 0.00046497583389282227, 0.0005066096782684326, 0.000548243522644043, 0.0005898773670196533, 0.0006315112113952637, 0.000673145055770874, 0.0007147789001464844, 0.0007564127445220947, 0.0007980465888977051, 0.0008396804332733154, 0.0008813142776489258, 0.0009229481220245361, 0.0009645819664001465, 0.0010062158107757568, 0.0010478496551513672, 0.0010894834995269775, 0.0011311173439025879, 0.0011727511882781982, 0.0012143850326538086, 0.001256018877029419, 0.0012976527214050293, 0.0013392865657806396, 0.00138092041015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 5.0, 11.0, 7.0, 13.0, 27.0, 30.0, 48.0, 83.0, 102.0, 153.0, 256.0, 400.0, 646.0, 960.0, 1580.0, 2447.0, 3868.0, 5965.0, 9760.0, 15722.0, 25756.0, 41738.0, 66663.0, 100801.0, 138213.0, 159472.0, 148962.0, 114568.0, 78875.0, 50210.0, 30711.0, 18775.0, 11770.0, 7274.0, 4457.0, 2991.0, 1886.0, 1211.0, 788.0, 490.0, 298.0, 182.0, 139.0, 91.0, 48.0, 38.0, 33.0, 13.0, 13.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.114501953125, -12.60400390625, -12.093505859375, -11.5830078125, -11.072509765625, -10.56201171875, -10.051513671875, -9.541015625, -9.030517578125, -8.52001953125, -8.009521484375, -7.4990234375, -6.988525390625, -6.47802734375, -5.967529296875, -5.45703125, -4.946533203125, -4.43603515625, -3.925537109375, -3.4150390625, -2.904541015625, -2.39404296875, -1.883544921875, -1.373046875, -0.862548828125, -0.35205078125, 0.158447265625, 0.6689453125, 1.179443359375, 1.68994140625, 2.200439453125, 2.7109375, 3.221435546875, 3.73193359375, 4.242431640625, 4.7529296875, 5.263427734375, 5.77392578125, 6.284423828125, 6.794921875, 7.305419921875, 7.81591796875, 8.326416015625, 8.8369140625, 9.347412109375, 9.85791015625, 10.368408203125, 10.87890625, 11.389404296875, 11.89990234375, 12.410400390625, 12.9208984375, 13.431396484375, 13.94189453125, 14.452392578125, 14.962890625, 15.473388671875, 15.98388671875, 16.494384765625, 17.0048828125, 17.515380859375, 18.02587890625, 18.536376953125, 19.046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 6.0, 10.0, 12.0, 13.0, 20.0, 26.0, 34.0, 20.0, 40.0, 29.0, 43.0, 55.0, 53.0, 48.0, 58.0, 49.0, 53.0, 46.0, 45.0, 54.0, 40.0, 29.0, 26.0, 27.0, 25.0, 19.0, 23.0, 17.0, 20.0, 14.0, 7.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.515625, -5.32623291015625, -5.1368408203125, -4.94744873046875, -4.758056640625, -4.56866455078125, -4.3792724609375, -4.18988037109375, -4.00048828125, -3.81109619140625, -3.6217041015625, -3.43231201171875, -3.242919921875, -3.05352783203125, -2.8641357421875, -2.67474365234375, -2.4853515625, -2.29595947265625, -2.1065673828125, -1.91717529296875, -1.727783203125, -1.53839111328125, -1.3489990234375, -1.15960693359375, -0.97021484375, -0.78082275390625, -0.5914306640625, -0.40203857421875, -0.212646484375, -0.02325439453125, 0.1661376953125, 0.35552978515625, 0.544921875, 0.73431396484375, 0.9237060546875, 1.11309814453125, 1.302490234375, 1.49188232421875, 1.6812744140625, 1.87066650390625, 2.06005859375, 2.24945068359375, 2.4388427734375, 2.62823486328125, 2.817626953125, 3.00701904296875, 3.1964111328125, 3.38580322265625, 3.5751953125, 3.76458740234375, 3.9539794921875, 4.14337158203125, 4.332763671875, 4.52215576171875, 4.7115478515625, 4.90093994140625, 5.09033203125, 5.27972412109375, 5.4691162109375, 5.65850830078125, 5.847900390625, 6.03729248046875, 6.2266845703125, 6.41607666015625, 6.60546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 3.0, 10.0, 4.0, 4.0, 9.0, 10.0, 12.0, 12.0, 19.0, 15.0, 21.0, 23.0, 35.0, 41.0, 45.0, 60.0, 55.0, 40.0, 53.0, 54.0, 56.0, 47.0, 48.0, 43.0, 44.0, 38.0, 26.0, 26.0, 31.0, 23.0, 13.0, 11.0, 10.0, 8.0, 13.0, 3.0, 8.0, 8.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-35.86669921875, -34.82542419433594, -33.78415298461914, -32.74287796020508, -31.70160675048828, -30.66033172607422, -29.61905860900879, -28.57778549194336, -27.53651237487793, -26.4952392578125, -25.45396614074707, -24.41269302368164, -23.371417999267578, -22.33014678955078, -21.28887176513672, -20.24759864807129, -19.20632553100586, -18.16505241394043, -17.123779296875, -16.08250617980957, -15.041232109069824, -13.999958992004395, -12.958684921264648, -11.917411804199219, -10.876138687133789, -9.83486557006836, -8.79359245300293, -7.752318382263184, -6.711045265197754, -5.669772148132324, -4.628498554229736, -3.5872249603271484, -2.545949935913086, -1.5046765804290771, -0.46340322494506836, 0.5778701305389404, 1.6191434860229492, 2.660416603088379, 3.701690196990967, 4.742963790893555, 5.784236907958984, 6.825510025024414, 7.866783618927002, 8.90805721282959, 9.94933032989502, 10.99060344696045, 12.031877517700195, 13.073150634765625, 14.114423751831055, 15.155696868896484, 16.196969985961914, 17.238243103027344, 18.279518127441406, 19.320789337158203, 20.362064361572266, 21.403337478637695, 22.444610595703125, 23.485883712768555, 24.527156829833984, 25.568429946899414, 26.609703063964844, 27.650978088378906, 28.692251205444336, 29.733524322509766, 30.774797439575195]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 3.0, 9.0, 5.0, 4.0, 9.0, 9.0, 9.0, 6.0, 7.0, 19.0, 16.0, 22.0, 24.0, 29.0, 31.0, 31.0, 33.0, 33.0, 36.0, 37.0, 41.0, 45.0, 43.0, 43.0, 41.0, 40.0, 37.0, 43.0, 34.0, 36.0, 35.0, 28.0, 26.0, 20.0, 15.0, 21.0, 15.0, 18.0, 10.0, 9.0, 6.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-27.09512710571289, -26.266862869262695, -25.438600540161133, -24.610336303710938, -23.782072067260742, -22.953807830810547, -22.125545501708984, -21.29728126525879, -20.469017028808594, -19.6407527923584, -18.812490463256836, -17.98422622680664, -17.155961990356445, -16.32769775390625, -15.499435424804688, -14.671171188354492, -13.84290885925293, -13.01464557647705, -12.186381340026855, -11.358118057250977, -10.529853820800781, -9.701590538024902, -8.873327255249023, -8.045063018798828, -7.216799736022949, -6.388535976409912, -5.560272216796875, -4.732008934020996, -3.903745174407959, -3.075481414794922, -2.247218132019043, -1.4189543724060059, -0.5906925201416016, 0.237571120262146, 1.0658347606658936, 1.8940982818603516, 2.7223620414733887, 3.550625801086426, 4.378889083862305, 5.207152843475342, 6.035416603088379, 6.863680362701416, 7.691944122314453, 8.520207405090332, 9.348470687866211, 10.176734924316406, 11.004998207092285, 11.833261489868164, 12.66152572631836, 13.489789009094238, 14.318053245544434, 15.146316528320312, 15.974580764770508, 16.802845001220703, 17.631107330322266, 18.45937156677246, 19.287635803222656, 20.11590003967285, 20.944162368774414, 21.77242660522461, 22.600690841674805, 23.428955078125, 24.257217407226562, 25.085481643676758, 25.91374397277832]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 5.0, 8.0, 17.0, 21.0, 38.0, 67.0, 90.0, 106.0, 174.0, 261.0, 401.0, 574.0, 933.0, 1476.0, 2143.0, 3122.0, 4869.0, 7706.0, 11536.0, 17682.0, 26467.0, 39236.0, 57273.0, 78022.0, 101954.0, 119871.0, 126162.0, 117114.0, 97191.0, 74099.0, 52769.0, 36335.0, 24328.0, 16440.0, 10522.0, 6805.0, 4385.0, 2908.0, 1838.0, 1214.0, 808.0, 499.0, 346.0, 255.0, 157.0, 93.0, 82.0, 52.0, 41.0, 24.0, 18.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-24.65625, -23.844970703125, -23.03369140625, -22.222412109375, -21.4111328125, -20.599853515625, -19.78857421875, -18.977294921875, -18.166015625, -17.354736328125, -16.54345703125, -15.732177734375, -14.9208984375, -14.109619140625, -13.29833984375, -12.487060546875, -11.67578125, -10.864501953125, -10.05322265625, -9.241943359375, -8.4306640625, -7.619384765625, -6.80810546875, -5.996826171875, -5.185546875, -4.374267578125, -3.56298828125, -2.751708984375, -1.9404296875, -1.129150390625, -0.31787109375, 0.493408203125, 1.3046875, 2.115966796875, 2.92724609375, 3.738525390625, 4.5498046875, 5.361083984375, 6.17236328125, 6.983642578125, 7.794921875, 8.606201171875, 9.41748046875, 10.228759765625, 11.0400390625, 11.851318359375, 12.66259765625, 13.473876953125, 14.28515625, 15.096435546875, 15.90771484375, 16.718994140625, 17.5302734375, 18.341552734375, 19.15283203125, 19.964111328125, 20.775390625, 21.586669921875, 22.39794921875, 23.209228515625, 24.0205078125, 24.831787109375, 25.64306640625, 26.454345703125, 27.265625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 1.0, 7.0, 3.0, 9.0, 10.0, 11.0, 6.0, 10.0, 18.0, 20.0, 21.0, 17.0, 26.0, 31.0, 29.0, 36.0, 34.0, 32.0, 41.0, 43.0, 37.0, 38.0, 46.0, 49.0, 38.0, 40.0, 38.0, 46.0, 27.0, 33.0, 23.0, 24.0, 23.0, 16.0, 27.0, 10.0, 12.0, 16.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.53125, -25.72119140625, -24.9111328125, -24.10107421875, -23.291015625, -22.48095703125, -21.6708984375, -20.86083984375, -20.05078125, -19.24072265625, -18.4306640625, -17.62060546875, -16.810546875, -16.00048828125, -15.1904296875, -14.38037109375, -13.5703125, -12.76025390625, -11.9501953125, -11.14013671875, -10.330078125, -9.52001953125, -8.7099609375, -7.89990234375, -7.08984375, -6.27978515625, -5.4697265625, -4.65966796875, -3.849609375, -3.03955078125, -2.2294921875, -1.41943359375, -0.609375, 0.20068359375, 1.0107421875, 1.82080078125, 2.630859375, 3.44091796875, 4.2509765625, 5.06103515625, 5.87109375, 6.68115234375, 7.4912109375, 8.30126953125, 9.111328125, 9.92138671875, 10.7314453125, 11.54150390625, 12.3515625, 13.16162109375, 13.9716796875, 14.78173828125, 15.591796875, 16.40185546875, 17.2119140625, 18.02197265625, 18.83203125, 19.64208984375, 20.4521484375, 21.26220703125, 22.072265625, 22.88232421875, 23.6923828125, 24.50244140625, 25.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 7.0, 18.0, 29.0, 43.0, 78.0, 118.0, 165.0, 321.0, 520.0, 920.0, 1449.0, 2567.0, 4263.0, 7484.0, 12927.0, 22233.0, 37407.0, 61531.0, 94115.0, 131088.0, 156965.0, 154664.0, 127300.0, 89690.0, 57676.0, 35106.0, 20933.0, 11986.0, 7033.0, 4030.0, 2346.0, 1422.0, 811.0, 518.0, 324.0, 161.0, 115.0, 79.0, 42.0, 26.0, 14.0, 14.0, 5.0, 6.0, 2.0, 5.0, 3.0], "bins": [-35.4375, -34.50341796875, -33.5693359375, -32.63525390625, -31.701171875, -30.76708984375, -29.8330078125, -28.89892578125, -27.96484375, -27.03076171875, -26.0966796875, -25.16259765625, -24.228515625, -23.29443359375, -22.3603515625, -21.42626953125, -20.4921875, -19.55810546875, -18.6240234375, -17.68994140625, -16.755859375, -15.82177734375, -14.8876953125, -13.95361328125, -13.01953125, -12.08544921875, -11.1513671875, -10.21728515625, -9.283203125, -8.34912109375, -7.4150390625, -6.48095703125, -5.546875, -4.61279296875, -3.6787109375, -2.74462890625, -1.810546875, -0.87646484375, 0.0576171875, 0.99169921875, 1.92578125, 2.85986328125, 3.7939453125, 4.72802734375, 5.662109375, 6.59619140625, 7.5302734375, 8.46435546875, 9.3984375, 10.33251953125, 11.2666015625, 12.20068359375, 13.134765625, 14.06884765625, 15.0029296875, 15.93701171875, 16.87109375, 17.80517578125, 18.7392578125, 19.67333984375, 20.607421875, 21.54150390625, 22.4755859375, 23.40966796875, 24.34375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 2.0, 6.0, 8.0, 14.0, 9.0, 13.0, 11.0, 22.0, 16.0, 26.0, 32.0, 38.0, 38.0, 29.0, 33.0, 37.0, 54.0, 63.0, 52.0, 51.0, 43.0, 51.0, 33.0, 42.0, 43.0, 37.0, 22.0, 24.0, 29.0, 19.0, 19.0, 21.0, 11.0, 9.0, 11.0, 7.0, 4.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.335693359375, -19.74951171875, -19.163330078125, -18.5771484375, -17.990966796875, -17.40478515625, -16.818603515625, -16.232421875, -15.646240234375, -15.06005859375, -14.473876953125, -13.8876953125, -13.301513671875, -12.71533203125, -12.129150390625, -11.54296875, -10.956787109375, -10.37060546875, -9.784423828125, -9.1982421875, -8.612060546875, -8.02587890625, -7.439697265625, -6.853515625, -6.267333984375, -5.68115234375, -5.094970703125, -4.5087890625, -3.922607421875, -3.33642578125, -2.750244140625, -2.1640625, -1.577880859375, -0.99169921875, -0.405517578125, 0.1806640625, 0.766845703125, 1.35302734375, 1.939208984375, 2.525390625, 3.111572265625, 3.69775390625, 4.283935546875, 4.8701171875, 5.456298828125, 6.04248046875, 6.628662109375, 7.21484375, 7.801025390625, 8.38720703125, 8.973388671875, 9.5595703125, 10.145751953125, 10.73193359375, 11.318115234375, 11.904296875, 12.490478515625, 13.07666015625, 13.662841796875, 14.2490234375, 14.835205078125, 15.42138671875, 16.007568359375, 16.59375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 34.0, 30.0, 49.0, 52.0, 110.0, 143.0, 206.0, 283.0, 451.0, 665.0, 994.0, 1597.0, 2408.0, 3944.0, 6167.0, 10044.0, 16480.0, 27047.0, 44638.0, 70786.0, 108537.0, 147490.0, 166036.0, 147302.0, 107754.0, 70824.0, 44164.0, 26742.0, 16426.0, 9979.0, 6229.0, 3885.0, 2461.0, 1559.0, 1039.0, 639.0, 427.0, 285.0, 205.0, 128.0, 117.0, 48.0, 47.0, 31.0, 15.0, 13.0, 5.0, 10.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.43994140625, -16.8486328125, -16.25732421875, -15.666015625, -15.07470703125, -14.4833984375, -13.89208984375, -13.30078125, -12.70947265625, -12.1181640625, -11.52685546875, -10.935546875, -10.34423828125, -9.7529296875, -9.16162109375, -8.5703125, -7.97900390625, -7.3876953125, -6.79638671875, -6.205078125, -5.61376953125, -5.0224609375, -4.43115234375, -3.83984375, -3.24853515625, -2.6572265625, -2.06591796875, -1.474609375, -0.88330078125, -0.2919921875, 0.29931640625, 0.890625, 1.48193359375, 2.0732421875, 2.66455078125, 3.255859375, 3.84716796875, 4.4384765625, 5.02978515625, 5.62109375, 6.21240234375, 6.8037109375, 7.39501953125, 7.986328125, 8.57763671875, 9.1689453125, 9.76025390625, 10.3515625, 10.94287109375, 11.5341796875, 12.12548828125, 12.716796875, 13.30810546875, 13.8994140625, 14.49072265625, 15.08203125, 15.67333984375, 16.2646484375, 16.85595703125, 17.447265625, 18.03857421875, 18.6298828125, 19.22119140625, 19.8125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 5.0, 9.0, 12.0, 15.0, 16.0, 26.0, 28.0, 29.0, 34.0, 46.0, 47.0, 48.0, 60.0, 54.0, 55.0, 74.0, 69.0, 53.0, 41.0, 47.0, 42.0, 26.0, 20.0, 30.0, 19.0, 20.0, 11.0, 11.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001750946044921875, -0.0016855597496032715, -0.001620173454284668, -0.0015547871589660645, -0.001489400863647461, -0.0014240145683288574, -0.001358628273010254, -0.0012932419776916504, -0.0012278556823730469, -0.0011624693870544434, -0.0010970830917358398, -0.0010316967964172363, -0.0009663105010986328, -0.0009009242057800293, -0.0008355379104614258, -0.0007701516151428223, -0.0007047653198242188, -0.0006393790245056152, -0.0005739927291870117, -0.0005086064338684082, -0.0004432201385498047, -0.00037783384323120117, -0.00031244754791259766, -0.00024706125259399414, -0.00018167495727539062, -0.00011628866195678711, -5.0902366638183594e-05, 1.4483928680419922e-05, 7.987022399902344e-05, 0.00014525651931762695, 0.00021064281463623047, 0.000276029109954834, 0.0003414154052734375, 0.000406801700592041, 0.00047218799591064453, 0.000537574291229248, 0.0006029605865478516, 0.0006683468818664551, 0.0007337331771850586, 0.0007991194725036621, 0.0008645057678222656, 0.0009298920631408691, 0.0009952783584594727, 0.0010606646537780762, 0.0011260509490966797, 0.0011914372444152832, 0.0012568235397338867, 0.0013222098350524902, 0.0013875961303710938, 0.0014529824256896973, 0.0015183687210083008, 0.0015837550163269043, 0.0016491413116455078, 0.0017145276069641113, 0.0017799139022827148, 0.0018453001976013184, 0.0019106864929199219, 0.0019760727882385254, 0.002041459083557129, 0.0021068453788757324, 0.002172231674194336, 0.0022376179695129395, 0.002303004264831543, 0.0023683905601501465, 0.00243377685546875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 15.0, 16.0, 12.0, 26.0, 31.0, 53.0, 72.0, 103.0, 183.0, 242.0, 365.0, 590.0, 1011.0, 1546.0, 2629.0, 4405.0, 7418.0, 12127.0, 21011.0, 35351.0, 57625.0, 89821.0, 128291.0, 157968.0, 159453.0, 130251.0, 91224.0, 58536.0, 35638.0, 21352.0, 12477.0, 7357.0, 4421.0, 2571.0, 1614.0, 1011.0, 634.0, 384.0, 248.0, 156.0, 112.0, 64.0, 59.0, 23.0, 24.0, 13.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.438720703125, -15.90869140625, -15.378662109375, -14.8486328125, -14.318603515625, -13.78857421875, -13.258544921875, -12.728515625, -12.198486328125, -11.66845703125, -11.138427734375, -10.6083984375, -10.078369140625, -9.54833984375, -9.018310546875, -8.48828125, -7.958251953125, -7.42822265625, -6.898193359375, -6.3681640625, -5.838134765625, -5.30810546875, -4.778076171875, -4.248046875, -3.718017578125, -3.18798828125, -2.657958984375, -2.1279296875, -1.597900390625, -1.06787109375, -0.537841796875, -0.0078125, 0.522216796875, 1.05224609375, 1.582275390625, 2.1123046875, 2.642333984375, 3.17236328125, 3.702392578125, 4.232421875, 4.762451171875, 5.29248046875, 5.822509765625, 6.3525390625, 6.882568359375, 7.41259765625, 7.942626953125, 8.47265625, 9.002685546875, 9.53271484375, 10.062744140625, 10.5927734375, 11.122802734375, 11.65283203125, 12.182861328125, 12.712890625, 13.242919921875, 13.77294921875, 14.302978515625, 14.8330078125, 15.363037109375, 15.89306640625, 16.423095703125, 16.953125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 9.0, 13.0, 14.0, 16.0, 17.0, 14.0, 35.0, 28.0, 27.0, 35.0, 49.0, 33.0, 59.0, 47.0, 58.0, 66.0, 41.0, 45.0, 47.0, 33.0, 34.0, 35.0, 35.0, 28.0, 19.0, 27.0, 20.0, 15.0, 14.0, 8.0, 7.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.890625, -5.71954345703125, -5.5484619140625, -5.37738037109375, -5.206298828125, -5.03521728515625, -4.8641357421875, -4.69305419921875, -4.52197265625, -4.35089111328125, -4.1798095703125, -4.00872802734375, -3.837646484375, -3.66656494140625, -3.4954833984375, -3.32440185546875, -3.1533203125, -2.98223876953125, -2.8111572265625, -2.64007568359375, -2.468994140625, -2.29791259765625, -2.1268310546875, -1.95574951171875, -1.78466796875, -1.61358642578125, -1.4425048828125, -1.27142333984375, -1.100341796875, -0.92926025390625, -0.7581787109375, -0.58709716796875, -0.416015625, -0.24493408203125, -0.0738525390625, 0.09722900390625, 0.268310546875, 0.43939208984375, 0.6104736328125, 0.78155517578125, 0.95263671875, 1.12371826171875, 1.2947998046875, 1.46588134765625, 1.636962890625, 1.80804443359375, 1.9791259765625, 2.15020751953125, 2.3212890625, 2.49237060546875, 2.6634521484375, 2.83453369140625, 3.005615234375, 3.17669677734375, 3.3477783203125, 3.51885986328125, 3.68994140625, 3.86102294921875, 4.0321044921875, 4.20318603515625, 4.374267578125, 4.54534912109375, 4.7164306640625, 4.88751220703125, 5.05859375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 9.0, 5.0, 7.0, 10.0, 12.0, 16.0, 25.0, 22.0, 29.0, 26.0, 41.0, 55.0, 45.0, 60.0, 39.0, 67.0, 62.0, 71.0, 53.0, 51.0, 40.0, 38.0, 54.0, 22.0, 25.0, 24.0, 17.0, 11.0, 13.0, 12.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-38.23472595214844, -37.09128952026367, -35.94785690307617, -34.804420471191406, -33.66098403930664, -32.51755142211914, -31.374114990234375, -30.230680465698242, -29.08724594116211, -27.943811416625977, -26.80037498474121, -25.656940460205078, -24.513505935668945, -23.370071411132812, -22.226634979248047, -21.083200454711914, -19.93976402282715, -18.796329498291016, -17.65289306640625, -16.509458541870117, -15.366024017333984, -14.222588539123535, -13.079153060913086, -11.935718536376953, -10.792283058166504, -9.648847579956055, -8.505413055419922, -7.361977577209473, -6.218542575836182, -5.075107574462891, -3.9316720962524414, -2.7882375717163086, -1.6448020935058594, -0.5013669729232788, 0.6420681476593018, 1.7855033874511719, 2.928938388824463, 4.072373390197754, 5.215808868408203, 6.359243392944336, 7.502678871154785, 8.646114349365234, 9.789548873901367, 10.932984352111816, 12.076419830322266, 13.219854354858398, 14.363289833068848, 15.50672435760498, 16.65015983581543, 17.793594360351562, 18.937030792236328, 20.08046531677246, 21.223899841308594, 22.36733627319336, 23.510770797729492, 24.654205322265625, 25.79764175415039, 26.941076278686523, 28.08451271057129, 29.227947235107422, 30.371381759643555, 31.514816284179688, 32.65825271606445, 33.80168914794922, 34.94512176513672]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 9.0, 10.0, 13.0, 9.0, 9.0, 15.0, 16.0, 14.0, 22.0, 22.0, 26.0, 28.0, 35.0, 32.0, 33.0, 31.0, 37.0, 46.0, 40.0, 31.0, 32.0, 50.0, 51.0, 41.0, 35.0, 32.0, 36.0, 35.0, 31.0, 21.0, 20.0, 27.0, 17.0, 21.0, 10.0, 13.0, 7.0, 4.0, 9.0, 6.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.145259857177734, -25.346248626708984, -24.547239303588867, -23.748228073120117, -22.94921875, -22.15020751953125, -21.3511962890625, -20.552186965942383, -19.753177642822266, -18.954166412353516, -18.1551570892334, -17.35614585876465, -16.55713653564453, -15.758125305175781, -14.959115028381348, -14.160104751586914, -13.361093521118164, -12.56208324432373, -11.763072967529297, -10.964061737060547, -10.16505241394043, -9.36604118347168, -8.567030906677246, -7.7680206298828125, -6.969010353088379, -6.170000076293945, -5.370989799499512, -4.57197904586792, -3.7729687690734863, -2.9739584922790527, -2.174947738647461, -1.3759374618530273, -0.5769290924072266, 0.22208130359649658, 1.0210916996002197, 1.8201022148132324, 2.619112491607666, 3.4181227684020996, 4.217133522033691, 5.016143798828125, 5.815154075622559, 6.614164352416992, 7.413174629211426, 8.21218490600586, 9.01119613647461, 9.810205459594727, 10.609216690063477, 11.40822696685791, 12.207237243652344, 13.006247520446777, 13.805257797241211, 14.604269027709961, 15.403278350830078, 16.202289581298828, 17.001300811767578, 17.800310134887695, 18.599319458007812, 19.398330688476562, 20.19734001159668, 20.99635124206543, 21.795360565185547, 22.594371795654297, 23.393383026123047, 24.192392349243164, 24.991403579711914]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 12.0, 14.0, 23.0, 31.0, 58.0, 107.0, 147.0, 231.0, 387.0, 638.0, 1073.0, 1740.0, 2824.0, 4738.0, 8422.0, 14605.0, 26498.0, 48500.0, 94013.0, 186193.0, 373862.0, 682533.0, 926404.0, 808754.0, 489696.0, 250258.0, 126039.0, 65270.0, 35146.0, 19319.0, 10936.0, 6399.0, 3828.0, 2213.0, 1330.0, 804.0, 462.0, 298.0, 195.0, 117.0, 79.0, 31.0, 22.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.625, -27.75, -26.875, -26.0, -25.125, -24.25, -23.375, -22.5, -21.625, -20.75, -19.875, -19.0, -18.125, -17.25, -16.375, -15.5, -14.625, -13.75, -12.875, -12.0, -11.125, -10.25, -9.375, -8.5, -7.625, -6.75, -5.875, -5.0, -4.125, -3.25, -2.375, -1.5, -0.625, 0.25, 1.125, 2.0, 2.875, 3.75, 4.625, 5.5, 6.375, 7.25, 8.125, 9.0, 9.875, 10.75, 11.625, 12.5, 13.375, 14.25, 15.125, 16.0, 16.875, 17.75, 18.625, 19.5, 20.375, 21.25, 22.125, 23.0, 23.875, 24.75, 25.625, 26.5, 27.375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 5.0, 11.0, 9.0, 7.0, 20.0, 17.0, 15.0, 22.0, 23.0, 31.0, 27.0, 35.0, 46.0, 21.0, 38.0, 54.0, 36.0, 44.0, 42.0, 46.0, 46.0, 42.0, 32.0, 37.0, 34.0, 36.0, 28.0, 32.0, 21.0, 24.0, 14.0, 18.0, 16.0, 3.0, 10.0, 8.0, 13.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.046875, -19.459228515625, -18.87158203125, -18.283935546875, -17.6962890625, -17.108642578125, -16.52099609375, -15.933349609375, -15.345703125, -14.758056640625, -14.17041015625, -13.582763671875, -12.9951171875, -12.407470703125, -11.81982421875, -11.232177734375, -10.64453125, -10.056884765625, -9.46923828125, -8.881591796875, -8.2939453125, -7.706298828125, -7.11865234375, -6.531005859375, -5.943359375, -5.355712890625, -4.76806640625, -4.180419921875, -3.5927734375, -3.005126953125, -2.41748046875, -1.829833984375, -1.2421875, -0.654541015625, -0.06689453125, 0.520751953125, 1.1083984375, 1.696044921875, 2.28369140625, 2.871337890625, 3.458984375, 4.046630859375, 4.63427734375, 5.221923828125, 5.8095703125, 6.397216796875, 6.98486328125, 7.572509765625, 8.16015625, 8.747802734375, 9.33544921875, 9.923095703125, 10.5107421875, 11.098388671875, 11.68603515625, 12.273681640625, 12.861328125, 13.448974609375, 14.03662109375, 14.624267578125, 15.2119140625, 15.799560546875, 16.38720703125, 16.974853515625, 17.5625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 9.0, 15.0, 14.0, 30.0, 44.0, 68.0, 104.0, 136.0, 227.0, 380.0, 603.0, 928.0, 1490.0, 2511.0, 3920.0, 6602.0, 10990.0, 18038.0, 30446.0, 51085.0, 86409.0, 146994.0, 247335.0, 402288.0, 596026.0, 731272.0, 660557.0, 467094.0, 294986.0, 177286.0, 104770.0, 61044.0, 36241.0, 21470.0, 12802.0, 7831.0, 4640.0, 2825.0, 1767.0, 1088.0, 678.0, 450.0, 279.0, 177.0, 115.0, 81.0, 52.0, 32.0, 18.0, 15.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.5, -22.758056640625, -22.01611328125, -21.274169921875, -20.5322265625, -19.790283203125, -19.04833984375, -18.306396484375, -17.564453125, -16.822509765625, -16.08056640625, -15.338623046875, -14.5966796875, -13.854736328125, -13.11279296875, -12.370849609375, -11.62890625, -10.886962890625, -10.14501953125, -9.403076171875, -8.6611328125, -7.919189453125, -7.17724609375, -6.435302734375, -5.693359375, -4.951416015625, -4.20947265625, -3.467529296875, -2.7255859375, -1.983642578125, -1.24169921875, -0.499755859375, 0.2421875, 0.984130859375, 1.72607421875, 2.468017578125, 3.2099609375, 3.951904296875, 4.69384765625, 5.435791015625, 6.177734375, 6.919677734375, 7.66162109375, 8.403564453125, 9.1455078125, 9.887451171875, 10.62939453125, 11.371337890625, 12.11328125, 12.855224609375, 13.59716796875, 14.339111328125, 15.0810546875, 15.822998046875, 16.56494140625, 17.306884765625, 18.048828125, 18.790771484375, 19.53271484375, 20.274658203125, 21.0166015625, 21.758544921875, 22.50048828125, 23.242431640625, 23.984375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 6.0, 10.0, 15.0, 25.0, 34.0, 23.0, 37.0, 50.0, 50.0, 72.0, 83.0, 103.0, 100.0, 138.0, 155.0, 168.0, 192.0, 187.0, 223.0, 244.0, 222.0, 236.0, 248.0, 192.0, 173.0, 177.0, 143.0, 143.0, 126.0, 91.0, 75.0, 77.0, 55.0, 25.0, 33.0, 22.0, 24.0, 16.0, 7.0, 13.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-9.28125, -9.0115966796875, -8.741943359375, -8.4722900390625, -8.20263671875, -7.9329833984375, -7.663330078125, -7.3936767578125, -7.1240234375, -6.8543701171875, -6.584716796875, -6.3150634765625, -6.04541015625, -5.7757568359375, -5.506103515625, -5.2364501953125, -4.966796875, -4.6971435546875, -4.427490234375, -4.1578369140625, -3.88818359375, -3.6185302734375, -3.348876953125, -3.0792236328125, -2.8095703125, -2.5399169921875, -2.270263671875, -2.0006103515625, -1.73095703125, -1.4613037109375, -1.191650390625, -0.9219970703125, -0.65234375, -0.3826904296875, -0.113037109375, 0.1566162109375, 0.42626953125, 0.6959228515625, 0.965576171875, 1.2352294921875, 1.5048828125, 1.7745361328125, 2.044189453125, 2.3138427734375, 2.58349609375, 2.8531494140625, 3.122802734375, 3.3924560546875, 3.662109375, 3.9317626953125, 4.201416015625, 4.4710693359375, 4.74072265625, 5.0103759765625, 5.280029296875, 5.5496826171875, 5.8193359375, 6.0889892578125, 6.358642578125, 6.6282958984375, 6.89794921875, 7.1676025390625, 7.437255859375, 7.7069091796875, 7.9765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 15.0, 8.0, 18.0, 29.0, 36.0, 49.0, 45.0, 39.0, 47.0, 50.0, 55.0, 56.0, 61.0, 57.0, 44.0, 60.0, 50.0, 47.0, 36.0, 37.0, 20.0, 19.0, 14.0, 16.0, 13.0, 16.0, 7.0, 5.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-40.7682991027832, -39.72697448730469, -38.685646057128906, -37.644317626953125, -36.60299301147461, -35.561668395996094, -34.52033996582031, -33.47901153564453, -32.437686920166016, -31.396360397338867, -30.35503387451172, -29.31370735168457, -28.272380828857422, -27.231054306030273, -26.189727783203125, -25.148401260375977, -24.107074737548828, -23.06574821472168, -22.02442169189453, -20.983095169067383, -19.941768646240234, -18.900442123413086, -17.859115600585938, -16.81778907775879, -15.77646255493164, -14.735136032104492, -13.693809509277344, -12.652482986450195, -11.611156463623047, -10.569829940795898, -9.52850341796875, -8.487176895141602, -7.445850372314453, -6.404523849487305, -5.363197326660156, -4.321870803833008, -3.2805442810058594, -2.239217758178711, -1.1978912353515625, -0.15656471252441406, 0.8847618103027344, 1.9260883331298828, 2.9674148559570312, 4.00874137878418, 5.050067901611328, 6.091394424438477, 7.132720947265625, 8.174047470092773, 9.215373992919922, 10.25670051574707, 11.298027038574219, 12.339353561401367, 13.380680084228516, 14.422006607055664, 15.463333129882812, 16.50465965270996, 17.54598617553711, 18.587312698364258, 19.628639221191406, 20.669965744018555, 21.711292266845703, 22.75261878967285, 23.7939453125, 24.83527183532715, 25.876598358154297]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 12.0, 13.0, 10.0, 14.0, 14.0, 27.0, 23.0, 28.0, 29.0, 36.0, 43.0, 40.0, 35.0, 30.0, 48.0, 51.0, 41.0, 53.0, 55.0, 44.0, 48.0, 31.0, 30.0, 28.0, 29.0, 23.0, 28.0, 19.0, 24.0, 16.0, 13.0, 12.0, 5.0, 3.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.79245376586914, -22.08443832397461, -21.376422882080078, -20.668407440185547, -19.960390090942383, -19.25237464904785, -18.54435920715332, -17.83634376525879, -17.128328323364258, -16.420312881469727, -15.712296485900879, -15.004281044006348, -14.296265602111816, -13.588249206542969, -12.880233764648438, -12.172218322753906, -11.464201927185059, -10.756186485290527, -10.04817008972168, -9.340154647827148, -8.632139205932617, -7.924123287200928, -7.216107368469238, -6.508091926574707, -5.800076007843018, -5.092060089111328, -4.384044647216797, -3.6760287284851074, -2.968013048171997, -2.2599973678588867, -1.5519814491271973, -0.843966007232666, -0.13595008850097656, 0.5720656514167786, 1.2800813913345337, 1.9880971908569336, 2.696112871170044, 3.4041285514831543, 4.112144470214844, 4.820159912109375, 5.5281758308410645, 6.236191749572754, 6.944207191467285, 7.652223110198975, 8.360239028930664, 9.068254470825195, 9.776269912719727, 10.484285354614258, 11.192301750183105, 11.900317192077637, 12.608333587646484, 13.316349029541016, 14.024364471435547, 14.732379913330078, 15.440396308898926, 16.14841079711914, 16.856428146362305, 17.564443588256836, 18.272459030151367, 18.98047637939453, 19.688491821289062, 20.396507263183594, 21.104522705078125, 21.812538146972656, 22.520553588867188]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 7.0, 8.0, 5.0, 7.0, 9.0, 13.0, 29.0, 39.0, 43.0, 74.0, 111.0, 125.0, 165.0, 267.0, 374.0, 527.0, 760.0, 986.0, 1625.0, 2445.0, 4167.0, 7625.0, 15984.0, 36079.0, 87204.0, 191308.0, 285082.0, 220314.0, 106811.0, 44708.0, 19355.0, 9197.0, 4706.0, 2690.0, 1802.0, 1175.0, 781.0, 548.0, 411.0, 298.0, 218.0, 131.0, 85.0, 74.0, 56.0, 36.0, 28.0, 20.0, 13.0, 12.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.40625, -40.00830078125, -38.6103515625, -37.21240234375, -35.814453125, -34.41650390625, -33.0185546875, -31.62060546875, -30.22265625, -28.82470703125, -27.4267578125, -26.02880859375, -24.630859375, -23.23291015625, -21.8349609375, -20.43701171875, -19.0390625, -17.64111328125, -16.2431640625, -14.84521484375, -13.447265625, -12.04931640625, -10.6513671875, -9.25341796875, -7.85546875, -6.45751953125, -5.0595703125, -3.66162109375, -2.263671875, -0.86572265625, 0.5322265625, 1.93017578125, 3.328125, 4.72607421875, 6.1240234375, 7.52197265625, 8.919921875, 10.31787109375, 11.7158203125, 13.11376953125, 14.51171875, 15.90966796875, 17.3076171875, 18.70556640625, 20.103515625, 21.50146484375, 22.8994140625, 24.29736328125, 25.6953125, 27.09326171875, 28.4912109375, 29.88916015625, 31.287109375, 32.68505859375, 34.0830078125, 35.48095703125, 36.87890625, 38.27685546875, 39.6748046875, 41.07275390625, 42.470703125, 43.86865234375, 45.2666015625, 46.66455078125, 48.0625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 2.0, 5.0, 9.0, 13.0, 14.0, 8.0, 13.0, 13.0, 15.0, 18.0, 33.0, 18.0, 26.0, 32.0, 38.0, 38.0, 41.0, 54.0, 34.0, 38.0, 42.0, 49.0, 48.0, 44.0, 31.0, 42.0, 31.0, 32.0, 33.0, 28.0, 24.0, 22.0, 19.0, 18.0, 9.0, 8.0, 7.0, 14.0, 11.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.234375, -20.55615234375, -19.8779296875, -19.19970703125, -18.521484375, -17.84326171875, -17.1650390625, -16.48681640625, -15.80859375, -15.13037109375, -14.4521484375, -13.77392578125, -13.095703125, -12.41748046875, -11.7392578125, -11.06103515625, -10.3828125, -9.70458984375, -9.0263671875, -8.34814453125, -7.669921875, -6.99169921875, -6.3134765625, -5.63525390625, -4.95703125, -4.27880859375, -3.6005859375, -2.92236328125, -2.244140625, -1.56591796875, -0.8876953125, -0.20947265625, 0.46875, 1.14697265625, 1.8251953125, 2.50341796875, 3.181640625, 3.85986328125, 4.5380859375, 5.21630859375, 5.89453125, 6.57275390625, 7.2509765625, 7.92919921875, 8.607421875, 9.28564453125, 9.9638671875, 10.64208984375, 11.3203125, 11.99853515625, 12.6767578125, 13.35498046875, 14.033203125, 14.71142578125, 15.3896484375, 16.06787109375, 16.74609375, 17.42431640625, 18.1025390625, 18.78076171875, 19.458984375, 20.13720703125, 20.8154296875, 21.49365234375, 22.171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 8.0, 10.0, 27.0, 31.0, 39.0, 62.0, 70.0, 109.0, 177.0, 237.0, 334.0, 482.0, 691.0, 1078.0, 1587.0, 2517.0, 3916.0, 6572.0, 12241.0, 24950.0, 57287.0, 142684.0, 302616.0, 273765.0, 120022.0, 48105.0, 21764.0, 10714.0, 6037.0, 3517.0, 2268.0, 1478.0, 1027.0, 632.0, 449.0, 293.0, 199.0, 175.0, 119.0, 75.0, 51.0, 35.0, 24.0, 20.0, 12.0, 20.0, 9.0, 1.0, 2.0, 3.0, 5.0, 4.0], "bins": [-54.65625, -53.09033203125, -51.5244140625, -49.95849609375, -48.392578125, -46.82666015625, -45.2607421875, -43.69482421875, -42.12890625, -40.56298828125, -38.9970703125, -37.43115234375, -35.865234375, -34.29931640625, -32.7333984375, -31.16748046875, -29.6015625, -28.03564453125, -26.4697265625, -24.90380859375, -23.337890625, -21.77197265625, -20.2060546875, -18.64013671875, -17.07421875, -15.50830078125, -13.9423828125, -12.37646484375, -10.810546875, -9.24462890625, -7.6787109375, -6.11279296875, -4.546875, -2.98095703125, -1.4150390625, 0.15087890625, 1.716796875, 3.28271484375, 4.8486328125, 6.41455078125, 7.98046875, 9.54638671875, 11.1123046875, 12.67822265625, 14.244140625, 15.81005859375, 17.3759765625, 18.94189453125, 20.5078125, 22.07373046875, 23.6396484375, 25.20556640625, 26.771484375, 28.33740234375, 29.9033203125, 31.46923828125, 33.03515625, 34.60107421875, 36.1669921875, 37.73291015625, 39.298828125, 40.86474609375, 42.4306640625, 43.99658203125, 45.5625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 5.0, 6.0, 9.0, 14.0, 13.0, 17.0, 18.0, 22.0, 22.0, 31.0, 25.0, 29.0, 29.0, 28.0, 29.0, 32.0, 45.0, 56.0, 39.0, 34.0, 32.0, 36.0, 31.0, 32.0, 34.0, 32.0, 29.0, 30.0, 25.0, 31.0, 19.0, 23.0, 14.0, 21.0, 8.0, 17.0, 12.0, 13.0, 11.0, 5.0, 6.0, 7.0, 10.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-13.0546875, -12.6796875, -12.3046875, -11.9296875, -11.5546875, -11.1796875, -10.8046875, -10.4296875, -10.0546875, -9.6796875, -9.3046875, -8.9296875, -8.5546875, -8.1796875, -7.8046875, -7.4296875, -7.0546875, -6.6796875, -6.3046875, -5.9296875, -5.5546875, -5.1796875, -4.8046875, -4.4296875, -4.0546875, -3.6796875, -3.3046875, -2.9296875, -2.5546875, -2.1796875, -1.8046875, -1.4296875, -1.0546875, -0.6796875, -0.3046875, 0.0703125, 0.4453125, 0.8203125, 1.1953125, 1.5703125, 1.9453125, 2.3203125, 2.6953125, 3.0703125, 3.4453125, 3.8203125, 4.1953125, 4.5703125, 4.9453125, 5.3203125, 5.6953125, 6.0703125, 6.4453125, 6.8203125, 7.1953125, 7.5703125, 7.9453125, 8.3203125, 8.6953125, 9.0703125, 9.4453125, 9.8203125, 10.1953125, 10.5703125, 10.9453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 16.0, 31.0, 24.0, 39.0, 58.0, 78.0, 143.0, 205.0, 321.0, 432.0, 703.0, 1107.0, 1953.0, 3103.0, 5573.0, 9653.0, 17853.0, 34847.0, 70834.0, 149651.0, 262940.0, 238722.0, 125613.0, 59927.0, 29275.0, 15252.0, 8330.0, 4726.0, 2689.0, 1609.0, 1030.0, 634.0, 396.0, 252.0, 157.0, 105.0, 85.0, 48.0, 38.0, 22.0, 20.0, 13.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.0625, -20.421875, -19.78125, -19.140625, -18.5, -17.859375, -17.21875, -16.578125, -15.9375, -15.296875, -14.65625, -14.015625, -13.375, -12.734375, -12.09375, -11.453125, -10.8125, -10.171875, -9.53125, -8.890625, -8.25, -7.609375, -6.96875, -6.328125, -5.6875, -5.046875, -4.40625, -3.765625, -3.125, -2.484375, -1.84375, -1.203125, -0.5625, 0.078125, 0.71875, 1.359375, 2.0, 2.640625, 3.28125, 3.921875, 4.5625, 5.203125, 5.84375, 6.484375, 7.125, 7.765625, 8.40625, 9.046875, 9.6875, 10.328125, 10.96875, 11.609375, 12.25, 12.890625, 13.53125, 14.171875, 14.8125, 15.453125, 16.09375, 16.734375, 17.375, 18.015625, 18.65625, 19.296875, 19.9375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 7.0, 10.0, 10.0, 9.0, 16.0, 25.0, 50.0, 57.0, 82.0, 112.0, 121.0, 109.0, 125.0, 70.0, 52.0, 37.0, 32.0, 21.0, 10.0, 7.0, 9.0, 7.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0014095306396484375, -0.0013667196035385132, -0.0013239085674285889, -0.0012810975313186646, -0.0012382864952087402, -0.001195475459098816, -0.0011526644229888916, -0.0011098533868789673, -0.001067042350769043, -0.0010242313146591187, -0.0009814202785491943, -0.00093860924243927, -0.0008957982063293457, -0.0008529871702194214, -0.0008101761341094971, -0.0007673650979995728, -0.0007245540618896484, -0.0006817430257797241, -0.0006389319896697998, -0.0005961209535598755, -0.0005533099174499512, -0.0005104988813400269, -0.00046768784523010254, -0.0004248768091201782, -0.0003820657730102539, -0.0003392547369003296, -0.0002964437007904053, -0.00025363266468048096, -0.00021082162857055664, -0.00016801059246063232, -0.000125199556350708, -8.238852024078369e-05, -3.9577484130859375e-05, 3.2335519790649414e-06, 4.604458808898926e-05, 8.885562419891357e-05, 0.0001316666603088379, 0.0001744776964187622, 0.00021728873252868652, 0.00026009976863861084, 0.00030291080474853516, 0.00034572184085845947, 0.0003885328769683838, 0.0004313439130783081, 0.0004741549491882324, 0.0005169659852981567, 0.0005597770214080811, 0.0006025880575180054, 0.0006453990936279297, 0.000688210129737854, 0.0007310211658477783, 0.0007738322019577026, 0.000816643238067627, 0.0008594542741775513, 0.0009022653102874756, 0.0009450763463973999, 0.0009878873825073242, 0.0010306984186172485, 0.0010735094547271729, 0.0011163204908370972, 0.0011591315269470215, 0.0012019425630569458, 0.0012447535991668701, 0.0012875646352767944, 0.0013303756713867188]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 13.0, 26.0, 21.0, 34.0, 60.0, 65.0, 121.0, 189.0, 244.0, 377.0, 521.0, 862.0, 1385.0, 2165.0, 3383.0, 5693.0, 9110.0, 15594.0, 26905.0, 46359.0, 79305.0, 128325.0, 176929.0, 184791.0, 143344.0, 91472.0, 53960.0, 31248.0, 18001.0, 10778.0, 6510.0, 3864.0, 2398.0, 1493.0, 1010.0, 623.0, 438.0, 314.0, 199.0, 132.0, 86.0, 57.0, 35.0, 37.0, 16.0, 12.0, 15.0, 9.0, 7.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0], "bins": [-14.3984375, -13.950439453125, -13.50244140625, -13.054443359375, -12.6064453125, -12.158447265625, -11.71044921875, -11.262451171875, -10.814453125, -10.366455078125, -9.91845703125, -9.470458984375, -9.0224609375, -8.574462890625, -8.12646484375, -7.678466796875, -7.23046875, -6.782470703125, -6.33447265625, -5.886474609375, -5.4384765625, -4.990478515625, -4.54248046875, -4.094482421875, -3.646484375, -3.198486328125, -2.75048828125, -2.302490234375, -1.8544921875, -1.406494140625, -0.95849609375, -0.510498046875, -0.0625, 0.385498046875, 0.83349609375, 1.281494140625, 1.7294921875, 2.177490234375, 2.62548828125, 3.073486328125, 3.521484375, 3.969482421875, 4.41748046875, 4.865478515625, 5.3134765625, 5.761474609375, 6.20947265625, 6.657470703125, 7.10546875, 7.553466796875, 8.00146484375, 8.449462890625, 8.8974609375, 9.345458984375, 9.79345703125, 10.241455078125, 10.689453125, 11.137451171875, 11.58544921875, 12.033447265625, 12.4814453125, 12.929443359375, 13.37744140625, 13.825439453125, 14.2734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 8.0, 11.0, 11.0, 15.0, 24.0, 26.0, 26.0, 31.0, 42.0, 41.0, 56.0, 57.0, 66.0, 64.0, 64.0, 56.0, 49.0, 52.0, 44.0, 46.0, 35.0, 26.0, 26.0, 20.0, 18.0, 8.0, 12.0, 7.0, 2.0, 5.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.06640625, -4.90667724609375, -4.7469482421875, -4.58721923828125, -4.427490234375, -4.26776123046875, -4.1080322265625, -3.94830322265625, -3.78857421875, -3.62884521484375, -3.4691162109375, -3.30938720703125, -3.149658203125, -2.98992919921875, -2.8302001953125, -2.67047119140625, -2.5107421875, -2.35101318359375, -2.1912841796875, -2.03155517578125, -1.871826171875, -1.71209716796875, -1.5523681640625, -1.39263916015625, -1.23291015625, -1.07318115234375, -0.9134521484375, -0.75372314453125, -0.593994140625, -0.43426513671875, -0.2745361328125, -0.11480712890625, 0.044921875, 0.20465087890625, 0.3643798828125, 0.52410888671875, 0.683837890625, 0.84356689453125, 1.0032958984375, 1.16302490234375, 1.32275390625, 1.48248291015625, 1.6422119140625, 1.80194091796875, 1.961669921875, 2.12139892578125, 2.2811279296875, 2.44085693359375, 2.6005859375, 2.76031494140625, 2.9200439453125, 3.07977294921875, 3.239501953125, 3.39923095703125, 3.5589599609375, 3.71868896484375, 3.87841796875, 4.03814697265625, 4.1978759765625, 4.35760498046875, 4.517333984375, 4.67706298828125, 4.8367919921875, 4.99652099609375, 5.15625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 5.0, 8.0, 15.0, 15.0, 20.0, 29.0, 28.0, 37.0, 37.0, 50.0, 45.0, 53.0, 65.0, 50.0, 47.0, 53.0, 52.0, 52.0, 51.0, 34.0, 33.0, 40.0, 23.0, 25.0, 17.0, 14.0, 22.0, 16.0, 8.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-33.87684631347656, -32.922794342041016, -31.96874237060547, -31.014690399169922, -30.060638427734375, -29.106586456298828, -28.152536392211914, -27.198484420776367, -26.24443244934082, -25.290380477905273, -24.336328506469727, -23.38227653503418, -22.428226470947266, -21.47417449951172, -20.520122528076172, -19.566070556640625, -18.612018585205078, -17.65796661376953, -16.703914642333984, -15.749863624572754, -14.795811653137207, -13.84175968170166, -12.88770866394043, -11.933656692504883, -10.979604721069336, -10.025552749633789, -9.071500778198242, -8.117449760437012, -7.163397789001465, -6.209345817565918, -5.255294322967529, -4.301242828369141, -3.347188949584961, -2.393137216567993, -1.4390854835510254, -0.4850337505340576, 0.46901798248291016, 1.423069953918457, 2.3771214485168457, 3.3311729431152344, 4.285224914550781, 5.239276885986328, 6.193328380584717, 7.1473798751831055, 8.101431846618652, 9.0554838180542, 10.00953483581543, 10.963586807250977, 11.917638778686523, 12.87169075012207, 13.825742721557617, 14.779793739318848, 15.733845710754395, 16.687896728515625, 17.641948699951172, 18.59600067138672, 19.550052642822266, 20.504104614257812, 21.45815658569336, 22.412208557128906, 23.366260528564453, 24.3203125, 25.274362564086914, 26.22841453552246, 27.182466506958008]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 2.0, 3.0, 5.0, 9.0, 10.0, 10.0, 16.0, 15.0, 10.0, 21.0, 24.0, 19.0, 35.0, 26.0, 35.0, 45.0, 42.0, 38.0, 40.0, 48.0, 50.0, 48.0, 50.0, 47.0, 47.0, 36.0, 34.0, 31.0, 41.0, 18.0, 29.0, 22.0, 22.0, 18.0, 15.0, 11.0, 8.0, 5.0, 11.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.00705337524414, -22.3016414642334, -21.596229553222656, -20.890817642211914, -20.185405731201172, -19.47999382019043, -18.774581909179688, -18.069169998168945, -17.363758087158203, -16.65834617614746, -15.952934265136719, -15.247522354125977, -14.542110443115234, -13.836698532104492, -13.13128662109375, -12.425874710083008, -11.720462799072266, -11.015050888061523, -10.309638977050781, -9.604227066040039, -8.898815155029297, -8.193403244018555, -7.4879913330078125, -6.78257942199707, -6.077167510986328, -5.371755599975586, -4.666343688964844, -3.9609317779541016, -3.2555198669433594, -2.550107955932617, -1.844696044921875, -1.1392841339111328, -0.4338722229003906, 0.27153968811035156, 0.9769515991210938, 1.682363510131836, 2.387775421142578, 3.0931873321533203, 3.7985992431640625, 4.504011154174805, 5.209423065185547, 5.914834976196289, 6.620246887207031, 7.325658798217773, 8.031070709228516, 8.736482620239258, 9.44189453125, 10.147306442260742, 10.852718353271484, 11.558130264282227, 12.263542175292969, 12.968954086303711, 13.674365997314453, 14.379777908325195, 15.085189819335938, 15.79060173034668, 16.496013641357422, 17.201425552368164, 17.906837463378906, 18.61224937438965, 19.31766128540039, 20.023073196411133, 20.728485107421875, 21.433897018432617, 22.13930892944336]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 4.0, 9.0, 14.0, 28.0, 26.0, 41.0, 57.0, 94.0, 149.0, 246.0, 385.0, 562.0, 862.0, 1314.0, 2100.0, 3304.0, 5366.0, 8192.0, 13061.0, 20516.0, 32183.0, 48693.0, 71432.0, 98800.0, 123633.0, 137162.0, 130374.0, 108574.0, 81289.0, 56197.0, 37341.0, 24092.0, 15359.0, 9992.0, 6255.0, 3984.0, 2432.0, 1569.0, 1011.0, 665.0, 389.0, 295.0, 183.0, 119.0, 84.0, 59.0, 23.0, 9.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-25.53125, -24.75, -23.96875, -23.1875, -22.40625, -21.625, -20.84375, -20.0625, -19.28125, -18.5, -17.71875, -16.9375, -16.15625, -15.375, -14.59375, -13.8125, -13.03125, -12.25, -11.46875, -10.6875, -9.90625, -9.125, -8.34375, -7.5625, -6.78125, -6.0, -5.21875, -4.4375, -3.65625, -2.875, -2.09375, -1.3125, -0.53125, 0.25, 1.03125, 1.8125, 2.59375, 3.375, 4.15625, 4.9375, 5.71875, 6.5, 7.28125, 8.0625, 8.84375, 9.625, 10.40625, 11.1875, 11.96875, 12.75, 13.53125, 14.3125, 15.09375, 15.875, 16.65625, 17.4375, 18.21875, 19.0, 19.78125, 20.5625, 21.34375, 22.125, 22.90625, 23.6875, 24.46875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 11.0, 16.0, 8.0, 20.0, 19.0, 25.0, 14.0, 24.0, 25.0, 40.0, 26.0, 38.0, 40.0, 38.0, 35.0, 34.0, 39.0, 59.0, 36.0, 52.0, 21.0, 44.0, 57.0, 33.0, 31.0, 25.0, 31.0, 14.0, 23.0, 29.0, 7.0, 14.0, 10.0, 15.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.9580078125, -21.291015625, -20.6240234375, -19.95703125, -19.2900390625, -18.623046875, -17.9560546875, -17.2890625, -16.6220703125, -15.955078125, -15.2880859375, -14.62109375, -13.9541015625, -13.287109375, -12.6201171875, -11.953125, -11.2861328125, -10.619140625, -9.9521484375, -9.28515625, -8.6181640625, -7.951171875, -7.2841796875, -6.6171875, -5.9501953125, -5.283203125, -4.6162109375, -3.94921875, -3.2822265625, -2.615234375, -1.9482421875, -1.28125, -0.6142578125, 0.052734375, 0.7197265625, 1.38671875, 2.0537109375, 2.720703125, 3.3876953125, 4.0546875, 4.7216796875, 5.388671875, 6.0556640625, 6.72265625, 7.3896484375, 8.056640625, 8.7236328125, 9.390625, 10.0576171875, 10.724609375, 11.3916015625, 12.05859375, 12.7255859375, 13.392578125, 14.0595703125, 14.7265625, 15.3935546875, 16.060546875, 16.7275390625, 17.39453125, 18.0615234375, 18.728515625, 19.3955078125, 20.0625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 7.0, 7.0, 10.0, 10.0, 16.0, 28.0, 51.0, 67.0, 96.0, 145.0, 195.0, 292.0, 424.0, 648.0, 990.0, 1471.0, 2098.0, 3047.0, 4485.0, 6724.0, 9939.0, 14267.0, 21146.0, 30029.0, 42714.0, 58114.0, 77550.0, 96020.0, 110873.0, 115247.0, 107571.0, 91567.0, 72209.0, 54139.0, 38919.0, 27525.0, 19130.0, 13129.0, 8837.0, 6051.0, 4039.0, 2768.0, 1915.0, 1305.0, 860.0, 599.0, 414.0, 271.0, 197.0, 124.0, 94.0, 57.0, 42.0, 31.0, 26.0, 13.0, 13.0, 4.0, 4.0, 4.0, 3.0, 1.0], "bins": [-18.703125, -18.10693359375, -17.5107421875, -16.91455078125, -16.318359375, -15.72216796875, -15.1259765625, -14.52978515625, -13.93359375, -13.33740234375, -12.7412109375, -12.14501953125, -11.548828125, -10.95263671875, -10.3564453125, -9.76025390625, -9.1640625, -8.56787109375, -7.9716796875, -7.37548828125, -6.779296875, -6.18310546875, -5.5869140625, -4.99072265625, -4.39453125, -3.79833984375, -3.2021484375, -2.60595703125, -2.009765625, -1.41357421875, -0.8173828125, -0.22119140625, 0.375, 0.97119140625, 1.5673828125, 2.16357421875, 2.759765625, 3.35595703125, 3.9521484375, 4.54833984375, 5.14453125, 5.74072265625, 6.3369140625, 6.93310546875, 7.529296875, 8.12548828125, 8.7216796875, 9.31787109375, 9.9140625, 10.51025390625, 11.1064453125, 11.70263671875, 12.298828125, 12.89501953125, 13.4912109375, 14.08740234375, 14.68359375, 15.27978515625, 15.8759765625, 16.47216796875, 17.068359375, 17.66455078125, 18.2607421875, 18.85693359375, 19.453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 11.0, 8.0, 7.0, 15.0, 16.0, 15.0, 18.0, 23.0, 29.0, 23.0, 30.0, 39.0, 30.0, 38.0, 35.0, 49.0, 46.0, 32.0, 42.0, 36.0, 43.0, 39.0, 37.0, 41.0, 41.0, 29.0, 29.0, 29.0, 18.0, 20.0, 15.0, 22.0, 14.0, 12.0, 8.0, 10.0, 9.0, 4.0, 3.0, 2.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8671875, -14.431396484375, -13.99560546875, -13.559814453125, -13.1240234375, -12.688232421875, -12.25244140625, -11.816650390625, -11.380859375, -10.945068359375, -10.50927734375, -10.073486328125, -9.6376953125, -9.201904296875, -8.76611328125, -8.330322265625, -7.89453125, -7.458740234375, -7.02294921875, -6.587158203125, -6.1513671875, -5.715576171875, -5.27978515625, -4.843994140625, -4.408203125, -3.972412109375, -3.53662109375, -3.100830078125, -2.6650390625, -2.229248046875, -1.79345703125, -1.357666015625, -0.921875, -0.486083984375, -0.05029296875, 0.385498046875, 0.8212890625, 1.257080078125, 1.69287109375, 2.128662109375, 2.564453125, 3.000244140625, 3.43603515625, 3.871826171875, 4.3076171875, 4.743408203125, 5.17919921875, 5.614990234375, 6.05078125, 6.486572265625, 6.92236328125, 7.358154296875, 7.7939453125, 8.229736328125, 8.66552734375, 9.101318359375, 9.537109375, 9.972900390625, 10.40869140625, 10.844482421875, 11.2802734375, 11.716064453125, 12.15185546875, 12.587646484375, 13.0234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 10.0, 19.0, 14.0, 47.0, 55.0, 78.0, 154.0, 203.0, 347.0, 614.0, 959.0, 1581.0, 2669.0, 4686.0, 7927.0, 13739.0, 24533.0, 43465.0, 76888.0, 128276.0, 181770.0, 193883.0, 149005.0, 93865.0, 53679.0, 29865.0, 16946.0, 9617.0, 5550.0, 3213.0, 1887.0, 1133.0, 701.0, 401.0, 269.0, 174.0, 112.0, 75.0, 48.0, 24.0, 29.0, 12.0, 6.0, 8.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-21.4375, -20.810302734375, -20.18310546875, -19.555908203125, -18.9287109375, -18.301513671875, -17.67431640625, -17.047119140625, -16.419921875, -15.792724609375, -15.16552734375, -14.538330078125, -13.9111328125, -13.283935546875, -12.65673828125, -12.029541015625, -11.40234375, -10.775146484375, -10.14794921875, -9.520751953125, -8.8935546875, -8.266357421875, -7.63916015625, -7.011962890625, -6.384765625, -5.757568359375, -5.13037109375, -4.503173828125, -3.8759765625, -3.248779296875, -2.62158203125, -1.994384765625, -1.3671875, -0.739990234375, -0.11279296875, 0.514404296875, 1.1416015625, 1.768798828125, 2.39599609375, 3.023193359375, 3.650390625, 4.277587890625, 4.90478515625, 5.531982421875, 6.1591796875, 6.786376953125, 7.41357421875, 8.040771484375, 8.66796875, 9.295166015625, 9.92236328125, 10.549560546875, 11.1767578125, 11.803955078125, 12.43115234375, 13.058349609375, 13.685546875, 14.312744140625, 14.93994140625, 15.567138671875, 16.1943359375, 16.821533203125, 17.44873046875, 18.075927734375, 18.703125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 10.0, 8.0, 10.0, 14.0, 13.0, 23.0, 28.0, 41.0, 29.0, 31.0, 31.0, 42.0, 50.0, 40.0, 48.0, 62.0, 57.0, 53.0, 50.0, 49.0, 40.0, 44.0, 27.0, 35.0, 32.0, 13.0, 13.0, 12.0, 12.0, 11.0, 5.0, 6.0, 9.0, 6.0, 2.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0015411376953125, -0.0014872103929519653, -0.0014332830905914307, -0.001379355788230896, -0.0013254284858703613, -0.0012715011835098267, -0.001217573881149292, -0.0011636465787887573, -0.0011097192764282227, -0.001055791974067688, -0.0010018646717071533, -0.0009479373693466187, -0.000894010066986084, -0.0008400827646255493, -0.0007861554622650146, -0.00073222815990448, -0.0006783008575439453, -0.0006243735551834106, -0.000570446252822876, -0.0005165189504623413, -0.00046259164810180664, -0.00040866434574127197, -0.0003547370433807373, -0.00030080974102020264, -0.00024688243865966797, -0.0001929551362991333, -0.00013902783393859863, -8.510053157806396e-05, -3.11732292175293e-05, 2.275407314300537e-05, 7.668137550354004e-05, 0.0001306086778640747, 0.00018453598022460938, 0.00023846328258514404, 0.0002923905849456787, 0.0003463178873062134, 0.00040024518966674805, 0.0004541724920272827, 0.0005080997943878174, 0.000562027096748352, 0.0006159543991088867, 0.0006698817014694214, 0.0007238090038299561, 0.0007777363061904907, 0.0008316636085510254, 0.0008855909109115601, 0.0009395182132720947, 0.0009934455156326294, 0.001047372817993164, 0.0011013001203536987, 0.0011552274227142334, 0.001209154725074768, 0.0012630820274353027, 0.0013170093297958374, 0.001370936632156372, 0.0014248639345169067, 0.0014787912368774414, 0.001532718539237976, 0.0015866458415985107, 0.0016405731439590454, 0.00169450044631958, 0.0017484277486801147, 0.0018023550510406494, 0.001856282353401184, 0.0019102096557617188]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 10.0, 24.0, 37.0, 49.0, 61.0, 110.0, 182.0, 319.0, 535.0, 925.0, 1705.0, 3200.0, 5877.0, 10967.0, 20489.0, 38682.0, 71508.0, 123413.0, 182991.0, 203440.0, 161573.0, 101239.0, 56396.0, 29923.0, 16158.0, 8376.0, 4583.0, 2599.0, 1336.0, 757.0, 468.0, 227.0, 126.0, 72.0, 45.0, 40.0, 26.0, 14.0, 17.0, 11.0, 5.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.487548828125, -17.89697265625, -17.306396484375, -16.7158203125, -16.125244140625, -15.53466796875, -14.944091796875, -14.353515625, -13.762939453125, -13.17236328125, -12.581787109375, -11.9912109375, -11.400634765625, -10.81005859375, -10.219482421875, -9.62890625, -9.038330078125, -8.44775390625, -7.857177734375, -7.2666015625, -6.676025390625, -6.08544921875, -5.494873046875, -4.904296875, -4.313720703125, -3.72314453125, -3.132568359375, -2.5419921875, -1.951416015625, -1.36083984375, -0.770263671875, -0.1796875, 0.410888671875, 1.00146484375, 1.592041015625, 2.1826171875, 2.773193359375, 3.36376953125, 3.954345703125, 4.544921875, 5.135498046875, 5.72607421875, 6.316650390625, 6.9072265625, 7.497802734375, 8.08837890625, 8.678955078125, 9.26953125, 9.860107421875, 10.45068359375, 11.041259765625, 11.6318359375, 12.222412109375, 12.81298828125, 13.403564453125, 13.994140625, 14.584716796875, 15.17529296875, 15.765869140625, 16.3564453125, 16.947021484375, 17.53759765625, 18.128173828125, 18.71875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 8.0, 3.0, 6.0, 10.0, 8.0, 16.0, 20.0, 32.0, 18.0, 20.0, 26.0, 43.0, 36.0, 50.0, 53.0, 57.0, 64.0, 66.0, 54.0, 59.0, 57.0, 49.0, 35.0, 42.0, 30.0, 24.0, 25.0, 20.0, 13.0, 12.0, 15.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.46875, -6.296875, -6.125, -5.953125, -5.78125, -5.609375, -5.4375, -5.265625, -5.09375, -4.921875, -4.75, -4.578125, -4.40625, -4.234375, -4.0625, -3.890625, -3.71875, -3.546875, -3.375, -3.203125, -3.03125, -2.859375, -2.6875, -2.515625, -2.34375, -2.171875, -2.0, -1.828125, -1.65625, -1.484375, -1.3125, -1.140625, -0.96875, -0.796875, -0.625, -0.453125, -0.28125, -0.109375, 0.0625, 0.234375, 0.40625, 0.578125, 0.75, 0.921875, 1.09375, 1.265625, 1.4375, 1.609375, 1.78125, 1.953125, 2.125, 2.296875, 2.46875, 2.640625, 2.8125, 2.984375, 3.15625, 3.328125, 3.5, 3.671875, 3.84375, 4.015625, 4.1875, 4.359375, 4.53125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 13.0, 8.0, 14.0, 17.0, 23.0, 35.0, 41.0, 35.0, 37.0, 60.0, 63.0, 52.0, 63.0, 61.0, 46.0, 71.0, 56.0, 49.0, 51.0, 39.0, 37.0, 19.0, 30.0, 12.0, 14.0, 6.0, 11.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.52616882324219, -36.46769714355469, -35.40922546386719, -34.35075378417969, -33.29228210449219, -32.23381042480469, -31.175338745117188, -30.116867065429688, -29.058395385742188, -27.999923706054688, -26.941452026367188, -25.882980346679688, -24.824508666992188, -23.766036987304688, -22.707565307617188, -21.649093627929688, -20.590621948242188, -19.532150268554688, -18.473678588867188, -17.415206909179688, -16.356735229492188, -15.298263549804688, -14.239791870117188, -13.181320190429688, -12.122848510742188, -11.064376831054688, -10.005905151367188, -8.947433471679688, -7.8889617919921875, -6.8304901123046875, -5.7720184326171875, -4.7135467529296875, -3.655078887939453, -2.596607208251953, -1.5381355285644531, -0.4796638488769531, 0.5788078308105469, 1.6372795104980469, 2.695751190185547, 3.754222869873047, 4.812694549560547, 5.871166229248047, 6.929637908935547, 7.988109588623047, 9.046581268310547, 10.105052947998047, 11.163524627685547, 12.221996307373047, 13.280467987060547, 14.338939666748047, 15.397411346435547, 16.455883026123047, 17.514354705810547, 18.572826385498047, 19.631298065185547, 20.689769744873047, 21.748241424560547, 22.806713104248047, 23.865184783935547, 24.923656463623047, 25.982128143310547, 27.040599822998047, 28.099071502685547, 29.157543182373047, 30.216014862060547]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 9.0, 11.0, 10.0, 12.0, 10.0, 12.0, 16.0, 18.0, 28.0, 25.0, 23.0, 30.0, 36.0, 35.0, 21.0, 32.0, 28.0, 41.0, 64.0, 38.0, 39.0, 36.0, 39.0, 39.0, 40.0, 36.0, 29.0, 33.0, 27.0, 31.0, 24.0, 21.0, 11.0, 17.0, 17.0, 13.0, 11.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.468870162963867, -19.79831886291504, -19.12776756286621, -18.457216262817383, -17.786663055419922, -17.116111755371094, -16.445560455322266, -15.775009155273438, -15.10445785522461, -14.433906555175781, -13.763355255126953, -13.092803001403809, -12.42225170135498, -11.751700401306152, -11.081148147583008, -10.41059684753418, -9.740045547485352, -9.069494247436523, -8.398942947387695, -7.728390693664551, -7.057839393615723, -6.3872880935668945, -5.716736316680908, -5.046184539794922, -4.375633239746094, -3.7050817012786865, -3.0345301628112793, -2.363978624343872, -1.6934270858764648, -1.0228755474090576, -0.3523240089416504, 0.31822776794433594, 0.9887771606445312, 1.6593286991119385, 2.3298802375793457, 3.000431776046753, 3.67098331451416, 4.341534614562988, 5.012086391448975, 5.682638168334961, 6.353189468383789, 7.023740768432617, 7.6942925453186035, 8.36484432220459, 9.035395622253418, 9.705946922302246, 10.37649917602539, 11.047050476074219, 11.717601776123047, 12.388153076171875, 13.058704376220703, 13.729256629943848, 14.399807929992676, 15.070359230041504, 15.740911483764648, 16.411462783813477, 17.082014083862305, 17.752565383911133, 18.42311668395996, 19.09366798400879, 19.76422119140625, 20.434772491455078, 21.105323791503906, 21.775875091552734, 22.446426391601562]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 18.0, 32.0, 52.0, 73.0, 120.0, 154.0, 310.0, 503.0, 830.0, 1451.0, 2572.0, 4488.0, 8294.0, 15348.0, 29663.0, 59609.0, 127794.0, 284348.0, 631812.0, 1066958.0, 985485.0, 531654.0, 234427.0, 105595.0, 49829.0, 24729.0, 12691.0, 6735.0, 3591.0, 2138.0, 1192.0, 672.0, 426.0, 255.0, 157.0, 83.0, 65.0, 36.0, 22.0, 29.0, 12.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.890625, -31.02587890625, -30.1611328125, -29.29638671875, -28.431640625, -27.56689453125, -26.7021484375, -25.83740234375, -24.97265625, -24.10791015625, -23.2431640625, -22.37841796875, -21.513671875, -20.64892578125, -19.7841796875, -18.91943359375, -18.0546875, -17.18994140625, -16.3251953125, -15.46044921875, -14.595703125, -13.73095703125, -12.8662109375, -12.00146484375, -11.13671875, -10.27197265625, -9.4072265625, -8.54248046875, -7.677734375, -6.81298828125, -5.9482421875, -5.08349609375, -4.21875, -3.35400390625, -2.4892578125, -1.62451171875, -0.759765625, 0.10498046875, 0.9697265625, 1.83447265625, 2.69921875, 3.56396484375, 4.4287109375, 5.29345703125, 6.158203125, 7.02294921875, 7.8876953125, 8.75244140625, 9.6171875, 10.48193359375, 11.3466796875, 12.21142578125, 13.076171875, 13.94091796875, 14.8056640625, 15.67041015625, 16.53515625, 17.39990234375, 18.2646484375, 19.12939453125, 19.994140625, 20.85888671875, 21.7236328125, 22.58837890625, 23.453125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 5.0, 8.0, 12.0, 8.0, 5.0, 16.0, 14.0, 10.0, 17.0, 10.0, 12.0, 18.0, 14.0, 23.0, 25.0, 17.0, 29.0, 30.0, 35.0, 28.0, 32.0, 28.0, 34.0, 29.0, 43.0, 33.0, 39.0, 36.0, 26.0, 35.0, 30.0, 28.0, 29.0, 33.0, 19.0, 34.0, 22.0, 19.0, 18.0, 20.0, 7.0, 17.0, 8.0, 5.0, 5.0, 5.0, 4.0, 10.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-13.1015625, -12.6968994140625, -12.292236328125, -11.8875732421875, -11.48291015625, -11.0782470703125, -10.673583984375, -10.2689208984375, -9.8642578125, -9.4595947265625, -9.054931640625, -8.6502685546875, -8.24560546875, -7.8409423828125, -7.436279296875, -7.0316162109375, -6.626953125, -6.2222900390625, -5.817626953125, -5.4129638671875, -5.00830078125, -4.6036376953125, -4.198974609375, -3.7943115234375, -3.3896484375, -2.9849853515625, -2.580322265625, -2.1756591796875, -1.77099609375, -1.3663330078125, -0.961669921875, -0.5570068359375, -0.15234375, 0.2523193359375, 0.656982421875, 1.0616455078125, 1.46630859375, 1.8709716796875, 2.275634765625, 2.6802978515625, 3.0849609375, 3.4896240234375, 3.894287109375, 4.2989501953125, 4.70361328125, 5.1082763671875, 5.512939453125, 5.9176025390625, 6.322265625, 6.7269287109375, 7.131591796875, 7.5362548828125, 7.94091796875, 8.3455810546875, 8.750244140625, 9.1549072265625, 9.5595703125, 9.9642333984375, 10.368896484375, 10.7735595703125, 11.17822265625, 11.5828857421875, 11.987548828125, 12.3922119140625, 12.796875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 11.0, 20.0, 36.0, 43.0, 60.0, 87.0, 173.0, 260.0, 418.0, 722.0, 1056.0, 1704.0, 2847.0, 4682.0, 7793.0, 13422.0, 23310.0, 41282.0, 74234.0, 136741.0, 249543.0, 445873.0, 719056.0, 870437.0, 678937.0, 410138.0, 227983.0, 124342.0, 67820.0, 38299.0, 21771.0, 12446.0, 7230.0, 4457.0, 2623.0, 1608.0, 1035.0, 588.0, 412.0, 261.0, 180.0, 130.0, 59.0, 58.0, 29.0, 17.0, 9.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-22.703125, -21.980712890625, -21.25830078125, -20.535888671875, -19.8134765625, -19.091064453125, -18.36865234375, -17.646240234375, -16.923828125, -16.201416015625, -15.47900390625, -14.756591796875, -14.0341796875, -13.311767578125, -12.58935546875, -11.866943359375, -11.14453125, -10.422119140625, -9.69970703125, -8.977294921875, -8.2548828125, -7.532470703125, -6.81005859375, -6.087646484375, -5.365234375, -4.642822265625, -3.92041015625, -3.197998046875, -2.4755859375, -1.753173828125, -1.03076171875, -0.308349609375, 0.4140625, 1.136474609375, 1.85888671875, 2.581298828125, 3.3037109375, 4.026123046875, 4.74853515625, 5.470947265625, 6.193359375, 6.915771484375, 7.63818359375, 8.360595703125, 9.0830078125, 9.805419921875, 10.52783203125, 11.250244140625, 11.97265625, 12.695068359375, 13.41748046875, 14.139892578125, 14.8623046875, 15.584716796875, 16.30712890625, 17.029541015625, 17.751953125, 18.474365234375, 19.19677734375, 19.919189453125, 20.6416015625, 21.364013671875, 22.08642578125, 22.808837890625, 23.53125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 4.0, 10.0, 8.0, 12.0, 22.0, 26.0, 37.0, 48.0, 72.0, 74.0, 102.0, 121.0, 141.0, 192.0, 214.0, 261.0, 253.0, 299.0, 294.0, 275.0, 269.0, 246.0, 226.0, 160.0, 151.0, 120.0, 81.0, 92.0, 50.0, 58.0, 43.0, 31.0, 25.0, 19.0, 7.0, 9.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.228271484375, -7.94873046875, -7.669189453125, -7.3896484375, -7.110107421875, -6.83056640625, -6.551025390625, -6.271484375, -5.991943359375, -5.71240234375, -5.432861328125, -5.1533203125, -4.873779296875, -4.59423828125, -4.314697265625, -4.03515625, -3.755615234375, -3.47607421875, -3.196533203125, -2.9169921875, -2.637451171875, -2.35791015625, -2.078369140625, -1.798828125, -1.519287109375, -1.23974609375, -0.960205078125, -0.6806640625, -0.401123046875, -0.12158203125, 0.157958984375, 0.4375, 0.717041015625, 0.99658203125, 1.276123046875, 1.5556640625, 1.835205078125, 2.11474609375, 2.394287109375, 2.673828125, 2.953369140625, 3.23291015625, 3.512451171875, 3.7919921875, 4.071533203125, 4.35107421875, 4.630615234375, 4.91015625, 5.189697265625, 5.46923828125, 5.748779296875, 6.0283203125, 6.307861328125, 6.58740234375, 6.866943359375, 7.146484375, 7.426025390625, 7.70556640625, 7.985107421875, 8.2646484375, 8.544189453125, 8.82373046875, 9.103271484375, 9.3828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 9.0, 9.0, 8.0, 6.0, 17.0, 12.0, 20.0, 26.0, 32.0, 42.0, 50.0, 60.0, 62.0, 51.0, 85.0, 54.0, 61.0, 63.0, 59.0, 55.0, 41.0, 35.0, 30.0, 22.0, 20.0, 17.0, 17.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.959232330322266, -32.002872467041016, -31.0465087890625, -30.090147018432617, -29.133785247802734, -28.17742347717285, -27.22106170654297, -26.26470184326172, -25.308338165283203, -24.35197639465332, -23.395614624023438, -22.439252853393555, -21.482891082763672, -20.52652931213379, -19.570167541503906, -18.613807678222656, -17.657445907592773, -16.70108413696289, -15.744722366333008, -14.788360595703125, -13.831998825073242, -12.87563705444336, -11.919276237487793, -10.96291446685791, -10.006552696228027, -9.050190925598145, -8.093829154968262, -7.137467861175537, -6.181106090545654, -5.2247443199157715, -4.268383026123047, -3.312021255493164, -2.3556575775146484, -1.3992959260940552, -0.4429342746734619, 0.5134272575378418, 1.4697890281677246, 2.4261507987976074, 3.382512092590332, 4.338873863220215, 5.295235633850098, 6.2515974044799805, 7.207959175109863, 8.16431999206543, 9.120681762695312, 10.077043533325195, 11.033405303955078, 11.989767074584961, 12.946128845214844, 13.902490615844727, 14.85885238647461, 15.815214157104492, 16.771575927734375, 17.727937698364258, 18.68429946899414, 19.64065933227539, 20.597023010253906, 21.55338478088379, 22.509746551513672, 23.466108322143555, 24.422470092773438, 25.37883186340332, 26.335193634033203, 27.291553497314453, 28.247915267944336]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 12.0, 9.0, 14.0, 18.0, 13.0, 15.0, 17.0, 33.0, 33.0, 27.0, 40.0, 36.0, 32.0, 33.0, 45.0, 32.0, 37.0, 41.0, 48.0, 42.0, 35.0, 44.0, 45.0, 40.0, 33.0, 35.0, 29.0, 20.0, 19.0, 19.0, 17.0, 16.0, 14.0, 11.0, 7.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-19.292423248291016, -18.728939056396484, -18.16545295715332, -17.60196876525879, -17.038482666015625, -16.474998474121094, -15.911514282226562, -15.348029136657715, -14.784543991088867, -14.22105884552002, -13.657573699951172, -13.09408950805664, -12.530604362487793, -11.967119216918945, -11.403635025024414, -10.840149879455566, -10.276664733886719, -9.713179588317871, -9.149694442749023, -8.586210250854492, -8.022725105285645, -7.459239959716797, -6.895755290985107, -6.332270622253418, -5.76878547668457, -5.205300331115723, -4.641815662384033, -4.078330993652344, -3.514845848083496, -2.9513609409332275, -2.387876033782959, -1.8243911266326904, -1.2609062194824219, -0.6974213123321533, -0.13393640518188477, 0.4295485019683838, 0.9930334091186523, 1.556518316268921, 2.1200032234191895, 2.683488130569458, 3.2469730377197266, 3.810457944869995, 4.373942852020264, 4.937427520751953, 5.500912666320801, 6.064397811889648, 6.627882480621338, 7.191367149353027, 7.754852294921875, 8.318337440490723, 8.88182258605957, 9.445306777954102, 10.00879192352295, 10.572277069091797, 11.135761260986328, 11.699246406555176, 12.262731552124023, 12.826216697692871, 13.389701843261719, 13.95318603515625, 14.516671180725098, 15.080156326293945, 15.643640518188477, 16.20712661743164, 16.770610809326172]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 13.0, 21.0, 23.0, 38.0, 51.0, 87.0, 149.0, 198.0, 258.0, 416.0, 678.0, 1032.0, 1501.0, 2448.0, 3892.0, 6362.0, 10782.0, 18914.0, 33600.0, 61275.0, 109124.0, 172749.0, 208047.0, 170437.0, 107018.0, 59974.0, 33217.0, 18779.0, 10590.0, 6318.0, 3744.0, 2332.0, 1493.0, 1033.0, 675.0, 405.0, 267.0, 181.0, 144.0, 86.0, 68.0, 44.0, 26.0, 17.0, 12.0, 8.0, 13.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.390625, -22.623291015625, -21.85595703125, -21.088623046875, -20.3212890625, -19.553955078125, -18.78662109375, -18.019287109375, -17.251953125, -16.484619140625, -15.71728515625, -14.949951171875, -14.1826171875, -13.415283203125, -12.64794921875, -11.880615234375, -11.11328125, -10.345947265625, -9.57861328125, -8.811279296875, -8.0439453125, -7.276611328125, -6.50927734375, -5.741943359375, -4.974609375, -4.207275390625, -3.43994140625, -2.672607421875, -1.9052734375, -1.137939453125, -0.37060546875, 0.396728515625, 1.1640625, 1.931396484375, 2.69873046875, 3.466064453125, 4.2333984375, 5.000732421875, 5.76806640625, 6.535400390625, 7.302734375, 8.070068359375, 8.83740234375, 9.604736328125, 10.3720703125, 11.139404296875, 11.90673828125, 12.674072265625, 13.44140625, 14.208740234375, 14.97607421875, 15.743408203125, 16.5107421875, 17.278076171875, 18.04541015625, 18.812744140625, 19.580078125, 20.347412109375, 21.11474609375, 21.882080078125, 22.6494140625, 23.416748046875, 24.18408203125, 24.951416015625, 25.71875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 4.0, 10.0, 5.0, 7.0, 10.0, 15.0, 16.0, 15.0, 20.0, 27.0, 26.0, 33.0, 37.0, 31.0, 31.0, 36.0, 44.0, 39.0, 55.0, 36.0, 50.0, 30.0, 46.0, 46.0, 31.0, 40.0, 30.0, 33.0, 28.0, 29.0, 29.0, 21.0, 10.0, 10.0, 11.0, 9.0, 12.0, 8.0, 8.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.75, -20.166259765625, -19.58251953125, -18.998779296875, -18.4150390625, -17.831298828125, -17.24755859375, -16.663818359375, -16.080078125, -15.496337890625, -14.91259765625, -14.328857421875, -13.7451171875, -13.161376953125, -12.57763671875, -11.993896484375, -11.41015625, -10.826416015625, -10.24267578125, -9.658935546875, -9.0751953125, -8.491455078125, -7.90771484375, -7.323974609375, -6.740234375, -6.156494140625, -5.57275390625, -4.989013671875, -4.4052734375, -3.821533203125, -3.23779296875, -2.654052734375, -2.0703125, -1.486572265625, -0.90283203125, -0.319091796875, 0.2646484375, 0.848388671875, 1.43212890625, 2.015869140625, 2.599609375, 3.183349609375, 3.76708984375, 4.350830078125, 4.9345703125, 5.518310546875, 6.10205078125, 6.685791015625, 7.26953125, 7.853271484375, 8.43701171875, 9.020751953125, 9.6044921875, 10.188232421875, 10.77197265625, 11.355712890625, 11.939453125, 12.523193359375, 13.10693359375, 13.690673828125, 14.2744140625, 14.858154296875, 15.44189453125, 16.025634765625, 16.609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 8.0, 8.0, 10.0, 22.0, 29.0, 44.0, 80.0, 112.0, 152.0, 214.0, 362.0, 569.0, 820.0, 1457.0, 2630.0, 5186.0, 11282.0, 29827.0, 101025.0, 365164.0, 371429.0, 103709.0, 30946.0, 11532.0, 5281.0, 2727.0, 1406.0, 932.0, 568.0, 356.0, 192.0, 141.0, 103.0, 64.0, 54.0, 32.0, 20.0, 14.0, 13.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.0, -66.0576171875, -64.115234375, -62.1728515625, -60.23046875, -58.2880859375, -56.345703125, -54.4033203125, -52.4609375, -50.5185546875, -48.576171875, -46.6337890625, -44.69140625, -42.7490234375, -40.806640625, -38.8642578125, -36.921875, -34.9794921875, -33.037109375, -31.0947265625, -29.15234375, -27.2099609375, -25.267578125, -23.3251953125, -21.3828125, -19.4404296875, -17.498046875, -15.5556640625, -13.61328125, -11.6708984375, -9.728515625, -7.7861328125, -5.84375, -3.9013671875, -1.958984375, -0.0166015625, 1.92578125, 3.8681640625, 5.810546875, 7.7529296875, 9.6953125, 11.6376953125, 13.580078125, 15.5224609375, 17.46484375, 19.4072265625, 21.349609375, 23.2919921875, 25.234375, 27.1767578125, 29.119140625, 31.0615234375, 33.00390625, 34.9462890625, 36.888671875, 38.8310546875, 40.7734375, 42.7158203125, 44.658203125, 46.6005859375, 48.54296875, 50.4853515625, 52.427734375, 54.3701171875, 56.3125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 10.0, 12.0, 15.0, 12.0, 13.0, 17.0, 22.0, 22.0, 20.0, 35.0, 32.0, 44.0, 42.0, 34.0, 50.0, 45.0, 37.0, 46.0, 55.0, 44.0, 35.0, 39.0, 40.0, 41.0, 32.0, 29.0, 33.0, 16.0, 17.0, 23.0, 16.0, 9.0, 14.0, 6.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.522216796875, -11.13037109375, -10.738525390625, -10.3466796875, -9.954833984375, -9.56298828125, -9.171142578125, -8.779296875, -8.387451171875, -7.99560546875, -7.603759765625, -7.2119140625, -6.820068359375, -6.42822265625, -6.036376953125, -5.64453125, -5.252685546875, -4.86083984375, -4.468994140625, -4.0771484375, -3.685302734375, -3.29345703125, -2.901611328125, -2.509765625, -2.117919921875, -1.72607421875, -1.334228515625, -0.9423828125, -0.550537109375, -0.15869140625, 0.233154296875, 0.625, 1.016845703125, 1.40869140625, 1.800537109375, 2.1923828125, 2.584228515625, 2.97607421875, 3.367919921875, 3.759765625, 4.151611328125, 4.54345703125, 4.935302734375, 5.3271484375, 5.718994140625, 6.11083984375, 6.502685546875, 6.89453125, 7.286376953125, 7.67822265625, 8.070068359375, 8.4619140625, 8.853759765625, 9.24560546875, 9.637451171875, 10.029296875, 10.421142578125, 10.81298828125, 11.204833984375, 11.5966796875, 11.988525390625, 12.38037109375, 12.772216796875, 13.1640625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 6.0, 10.0, 10.0, 17.0, 24.0, 26.0, 42.0, 57.0, 57.0, 78.0, 114.0, 121.0, 166.0, 231.0, 343.0, 404.0, 679.0, 881.0, 1244.0, 1998.0, 3012.0, 5015.0, 8555.0, 15847.0, 32252.0, 73205.0, 173359.0, 318032.0, 225611.0, 97421.0, 42110.0, 20242.0, 10602.0, 5928.0, 3614.0, 2228.0, 1419.0, 961.0, 694.0, 486.0, 352.0, 272.0, 205.0, 134.0, 126.0, 90.0, 75.0, 46.0, 45.0, 39.0, 22.0, 17.0, 13.0, 13.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.21875, -18.592041015625, -17.96533203125, -17.338623046875, -16.7119140625, -16.085205078125, -15.45849609375, -14.831787109375, -14.205078125, -13.578369140625, -12.95166015625, -12.324951171875, -11.6982421875, -11.071533203125, -10.44482421875, -9.818115234375, -9.19140625, -8.564697265625, -7.93798828125, -7.311279296875, -6.6845703125, -6.057861328125, -5.43115234375, -4.804443359375, -4.177734375, -3.551025390625, -2.92431640625, -2.297607421875, -1.6708984375, -1.044189453125, -0.41748046875, 0.209228515625, 0.8359375, 1.462646484375, 2.08935546875, 2.716064453125, 3.3427734375, 3.969482421875, 4.59619140625, 5.222900390625, 5.849609375, 6.476318359375, 7.10302734375, 7.729736328125, 8.3564453125, 8.983154296875, 9.60986328125, 10.236572265625, 10.86328125, 11.489990234375, 12.11669921875, 12.743408203125, 13.3701171875, 13.996826171875, 14.62353515625, 15.250244140625, 15.876953125, 16.503662109375, 17.13037109375, 17.757080078125, 18.3837890625, 19.010498046875, 19.63720703125, 20.263916015625, 20.890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 15.0, 21.0, 40.0, 74.0, 152.0, 154.0, 189.0, 129.0, 81.0, 50.0, 26.0, 16.0, 7.0, 5.0, 6.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018215179443359375, -0.0017646849155426025, -0.0017078518867492676, -0.0016510188579559326, -0.0015941858291625977, -0.0015373528003692627, -0.0014805197715759277, -0.0014236867427825928, -0.0013668537139892578, -0.0013100206851959229, -0.0012531876564025879, -0.001196354627609253, -0.001139521598815918, -0.001082688570022583, -0.001025855541229248, -0.0009690225124359131, -0.0009121894836425781, -0.0008553564548492432, -0.0007985234260559082, -0.0007416903972625732, -0.0006848573684692383, -0.0006280243396759033, -0.0005711913108825684, -0.0005143582820892334, -0.00045752525329589844, -0.0004006922245025635, -0.0003438591957092285, -0.00028702616691589355, -0.0002301931381225586, -0.00017336010932922363, -0.00011652708053588867, -5.969405174255371e-05, -2.86102294921875e-06, 5.397200584411621e-05, 0.00011080503463745117, 0.00016763806343078613, 0.0002244710922241211, 0.00028130412101745605, 0.000338137149810791, 0.000394970178604126, 0.00045180320739746094, 0.0005086362361907959, 0.0005654692649841309, 0.0006223022937774658, 0.0006791353225708008, 0.0007359683513641357, 0.0007928013801574707, 0.0008496344089508057, 0.0009064674377441406, 0.0009633004665374756, 0.0010201334953308105, 0.0010769665241241455, 0.0011337995529174805, 0.0011906325817108154, 0.0012474656105041504, 0.0013042986392974854, 0.0013611316680908203, 0.0014179646968841553, 0.0014747977256774902, 0.0015316307544708252, 0.0015884637832641602, 0.0016452968120574951, 0.00170212984085083, 0.001758962869644165, 0.0018157958984375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 12.0, 17.0, 25.0, 35.0, 37.0, 55.0, 88.0, 108.0, 188.0, 273.0, 371.0, 556.0, 876.0, 1487.0, 2583.0, 4644.0, 9812.0, 22382.0, 58083.0, 158866.0, 315917.0, 275410.0, 118389.0, 43577.0, 17204.0, 7813.0, 3912.0, 2135.0, 1297.0, 801.0, 499.0, 329.0, 216.0, 167.0, 91.0, 77.0, 44.0, 37.0, 31.0, 18.0, 25.0, 14.0, 15.0, 6.0, 6.0, 2.0, 0.0, 3.0], "bins": [-23.859375, -23.2119140625, -22.564453125, -21.9169921875, -21.26953125, -20.6220703125, -19.974609375, -19.3271484375, -18.6796875, -18.0322265625, -17.384765625, -16.7373046875, -16.08984375, -15.4423828125, -14.794921875, -14.1474609375, -13.5, -12.8525390625, -12.205078125, -11.5576171875, -10.91015625, -10.2626953125, -9.615234375, -8.9677734375, -8.3203125, -7.6728515625, -7.025390625, -6.3779296875, -5.73046875, -5.0830078125, -4.435546875, -3.7880859375, -3.140625, -2.4931640625, -1.845703125, -1.1982421875, -0.55078125, 0.0966796875, 0.744140625, 1.3916015625, 2.0390625, 2.6865234375, 3.333984375, 3.9814453125, 4.62890625, 5.2763671875, 5.923828125, 6.5712890625, 7.21875, 7.8662109375, 8.513671875, 9.1611328125, 9.80859375, 10.4560546875, 11.103515625, 11.7509765625, 12.3984375, 13.0458984375, 13.693359375, 14.3408203125, 14.98828125, 15.6357421875, 16.283203125, 16.9306640625, 17.578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 8.0, 5.0, 7.0, 9.0, 8.0, 11.0, 11.0, 16.0, 32.0, 32.0, 41.0, 48.0, 58.0, 69.0, 82.0, 73.0, 68.0, 90.0, 67.0, 58.0, 39.0, 37.0, 22.0, 16.0, 18.0, 15.0, 9.0, 6.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.828857421875, -4.68505859375, -4.541259765625, -4.3974609375, -4.253662109375, -4.10986328125, -3.966064453125, -3.822265625, -3.678466796875, -3.53466796875, -3.390869140625, -3.2470703125, -3.103271484375, -2.95947265625, -2.815673828125, -2.671875, -2.528076171875, -2.38427734375, -2.240478515625, -2.0966796875, -1.952880859375, -1.80908203125, -1.665283203125, -1.521484375, -1.377685546875, -1.23388671875, -1.090087890625, -0.9462890625, -0.802490234375, -0.65869140625, -0.514892578125, -0.37109375, -0.227294921875, -0.08349609375, 0.060302734375, 0.2041015625, 0.347900390625, 0.49169921875, 0.635498046875, 0.779296875, 0.923095703125, 1.06689453125, 1.210693359375, 1.3544921875, 1.498291015625, 1.64208984375, 1.785888671875, 1.9296875, 2.073486328125, 2.21728515625, 2.361083984375, 2.5048828125, 2.648681640625, 2.79248046875, 2.936279296875, 3.080078125, 3.223876953125, 3.36767578125, 3.511474609375, 3.6552734375, 3.799072265625, 3.94287109375, 4.086669921875, 4.23046875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 9.0, 15.0, 24.0, 26.0, 25.0, 39.0, 29.0, 41.0, 45.0, 61.0, 66.0, 75.0, 61.0, 64.0, 65.0, 59.0, 45.0, 52.0, 27.0, 25.0, 27.0, 24.0, 11.0, 13.0, 14.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.970867156982422, -31.039974212646484, -30.109081268310547, -29.17818832397461, -28.247295379638672, -27.316402435302734, -26.385509490966797, -25.45461654663086, -24.523723602294922, -23.592830657958984, -22.661937713623047, -21.73104476928711, -20.800151824951172, -19.869258880615234, -18.938365936279297, -18.00747299194336, -17.076580047607422, -16.145687103271484, -15.214794158935547, -14.28390121459961, -13.353008270263672, -12.422115325927734, -11.491222381591797, -10.56032943725586, -9.629434585571289, -8.698541641235352, -7.767648696899414, -6.836755752563477, -5.905862808227539, -4.974969387054443, -4.044076442718506, -3.1131834983825684, -2.182291030883789, -1.2513980865478516, -0.3205050230026245, 0.6103880405426025, 1.54128098487854, 2.4721741676330566, 3.403067111968994, 4.333960056304932, 5.264853000640869, 6.195745944976807, 7.126638889312744, 8.05753231048584, 8.988425254821777, 9.919318199157715, 10.850211143493652, 11.78110408782959, 12.711997032165527, 13.642889976501465, 14.573782920837402, 15.50467586517334, 16.435569763183594, 17.36646270751953, 18.29735565185547, 19.228248596191406, 20.159141540527344, 21.09003448486328, 22.02092742919922, 22.951820373535156, 23.882713317871094, 24.81360626220703, 25.74449920654297, 26.675392150878906, 27.606285095214844]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 14.0, 11.0, 13.0, 10.0, 18.0, 11.0, 22.0, 26.0, 20.0, 45.0, 32.0, 39.0, 27.0, 42.0, 31.0, 41.0, 35.0, 35.0, 36.0, 46.0, 45.0, 36.0, 43.0, 49.0, 33.0, 38.0, 17.0, 25.0, 24.0, 25.0, 20.0, 16.0, 15.0, 14.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-18.145809173583984, -17.60721206665039, -17.068614959716797, -16.530019760131836, -15.991422653198242, -15.452825546264648, -14.914229393005371, -14.375633239746094, -13.8370361328125, -13.298439025878906, -12.759842872619629, -12.221246719360352, -11.682649612426758, -11.144052505493164, -10.605456352233887, -10.06686019897461, -9.528263092041016, -8.989665985107422, -8.451069831848145, -7.912473201751709, -7.373876571655273, -6.835279941558838, -6.296683311462402, -5.758086681365967, -5.219490051269531, -4.680893421173096, -4.14229679107666, -3.6037001609802246, -3.065103530883789, -2.5265069007873535, -1.987910270690918, -1.4493136405944824, -0.9107189178466797, -0.37212228775024414, 0.1664743423461914, 0.705070972442627, 1.2436676025390625, 1.782264232635498, 2.3208608627319336, 2.859457492828369, 3.3980541229248047, 3.9366507530212402, 4.475247383117676, 5.013844013214111, 5.552440643310547, 6.091037273406982, 6.629633903503418, 7.1682305335998535, 7.706827163696289, 8.245424270629883, 8.78402042388916, 9.322616577148438, 9.861213684082031, 10.399810791015625, 10.938406944274902, 11.47700309753418, 12.015600204467773, 12.554197311401367, 13.092793464660645, 13.631389617919922, 14.169986724853516, 14.70858383178711, 15.247179985046387, 15.785776138305664, 16.324373245239258]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 14.0, 16.0, 16.0, 25.0, 45.0, 58.0, 79.0, 108.0, 172.0, 266.0, 396.0, 596.0, 998.0, 1451.0, 2503.0, 3734.0, 6284.0, 10698.0, 17478.0, 29304.0, 48740.0, 77279.0, 116948.0, 154322.0, 167137.0, 141915.0, 100627.0, 65354.0, 40144.0, 24464.0, 14424.0, 8743.0, 5369.0, 3277.0, 2002.0, 1253.0, 838.0, 498.0, 329.0, 196.0, 130.0, 101.0, 77.0, 58.0, 31.0, 20.0, 18.0, 11.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.34375, -22.621337890625, -21.89892578125, -21.176513671875, -20.4541015625, -19.731689453125, -19.00927734375, -18.286865234375, -17.564453125, -16.842041015625, -16.11962890625, -15.397216796875, -14.6748046875, -13.952392578125, -13.22998046875, -12.507568359375, -11.78515625, -11.062744140625, -10.34033203125, -9.617919921875, -8.8955078125, -8.173095703125, -7.45068359375, -6.728271484375, -6.005859375, -5.283447265625, -4.56103515625, -3.838623046875, -3.1162109375, -2.393798828125, -1.67138671875, -0.948974609375, -0.2265625, 0.495849609375, 1.21826171875, 1.940673828125, 2.6630859375, 3.385498046875, 4.10791015625, 4.830322265625, 5.552734375, 6.275146484375, 6.99755859375, 7.719970703125, 8.4423828125, 9.164794921875, 9.88720703125, 10.609619140625, 11.33203125, 12.054443359375, 12.77685546875, 13.499267578125, 14.2216796875, 14.944091796875, 15.66650390625, 16.388916015625, 17.111328125, 17.833740234375, 18.55615234375, 19.278564453125, 20.0009765625, 20.723388671875, 21.44580078125, 22.168212890625, 22.890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 3.0, 3.0, 4.0, 8.0, 14.0, 14.0, 19.0, 18.0, 16.0, 25.0, 36.0, 40.0, 30.0, 37.0, 50.0, 51.0, 36.0, 45.0, 50.0, 60.0, 51.0, 37.0, 51.0, 45.0, 44.0, 28.0, 41.0, 31.0, 27.0, 26.0, 17.0, 9.0, 8.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.609375, -18.951171875, -18.29296875, -17.634765625, -16.9765625, -16.318359375, -15.66015625, -15.001953125, -14.34375, -13.685546875, -13.02734375, -12.369140625, -11.7109375, -11.052734375, -10.39453125, -9.736328125, -9.078125, -8.419921875, -7.76171875, -7.103515625, -6.4453125, -5.787109375, -5.12890625, -4.470703125, -3.8125, -3.154296875, -2.49609375, -1.837890625, -1.1796875, -0.521484375, 0.13671875, 0.794921875, 1.453125, 2.111328125, 2.76953125, 3.427734375, 4.0859375, 4.744140625, 5.40234375, 6.060546875, 6.71875, 7.376953125, 8.03515625, 8.693359375, 9.3515625, 10.009765625, 10.66796875, 11.326171875, 11.984375, 12.642578125, 13.30078125, 13.958984375, 14.6171875, 15.275390625, 15.93359375, 16.591796875, 17.25, 17.908203125, 18.56640625, 19.224609375, 19.8828125, 20.541015625, 21.19921875, 21.857421875, 22.515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 6.0, 19.0, 35.0, 43.0, 55.0, 108.0, 156.0, 241.0, 374.0, 593.0, 1005.0, 1577.0, 2650.0, 4147.0, 6965.0, 11021.0, 18442.0, 28703.0, 45381.0, 69061.0, 99694.0, 130789.0, 147207.0, 139926.0, 112702.0, 80903.0, 54508.0, 34617.0, 22066.0, 13531.0, 8324.0, 5238.0, 3180.0, 1981.0, 1296.0, 761.0, 448.0, 300.0, 160.0, 135.0, 86.0, 52.0, 25.0, 19.0, 13.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.65625, -17.099365234375, -16.54248046875, -15.985595703125, -15.4287109375, -14.871826171875, -14.31494140625, -13.758056640625, -13.201171875, -12.644287109375, -12.08740234375, -11.530517578125, -10.9736328125, -10.416748046875, -9.85986328125, -9.302978515625, -8.74609375, -8.189208984375, -7.63232421875, -7.075439453125, -6.5185546875, -5.961669921875, -5.40478515625, -4.847900390625, -4.291015625, -3.734130859375, -3.17724609375, -2.620361328125, -2.0634765625, -1.506591796875, -0.94970703125, -0.392822265625, 0.1640625, 0.720947265625, 1.27783203125, 1.834716796875, 2.3916015625, 2.948486328125, 3.50537109375, 4.062255859375, 4.619140625, 5.176025390625, 5.73291015625, 6.289794921875, 6.8466796875, 7.403564453125, 7.96044921875, 8.517333984375, 9.07421875, 9.631103515625, 10.18798828125, 10.744873046875, 11.3017578125, 11.858642578125, 12.41552734375, 12.972412109375, 13.529296875, 14.086181640625, 14.64306640625, 15.199951171875, 15.7568359375, 16.313720703125, 16.87060546875, 17.427490234375, 17.984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 17.0, 13.0, 17.0, 25.0, 25.0, 34.0, 36.0, 24.0, 39.0, 34.0, 34.0, 40.0, 45.0, 55.0, 50.0, 40.0, 48.0, 33.0, 41.0, 37.0, 39.0, 28.0, 29.0, 31.0, 21.0, 24.0, 18.0, 23.0, 18.0, 9.0, 13.0, 7.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.046875, -11.6805419921875, -11.314208984375, -10.9478759765625, -10.58154296875, -10.2152099609375, -9.848876953125, -9.4825439453125, -9.1162109375, -8.7498779296875, -8.383544921875, -8.0172119140625, -7.65087890625, -7.2845458984375, -6.918212890625, -6.5518798828125, -6.185546875, -5.8192138671875, -5.452880859375, -5.0865478515625, -4.72021484375, -4.3538818359375, -3.987548828125, -3.6212158203125, -3.2548828125, -2.8885498046875, -2.522216796875, -2.1558837890625, -1.78955078125, -1.4232177734375, -1.056884765625, -0.6905517578125, -0.32421875, 0.0421142578125, 0.408447265625, 0.7747802734375, 1.14111328125, 1.5074462890625, 1.873779296875, 2.2401123046875, 2.6064453125, 2.9727783203125, 3.339111328125, 3.7054443359375, 4.07177734375, 4.4381103515625, 4.804443359375, 5.1707763671875, 5.537109375, 5.9034423828125, 6.269775390625, 6.6361083984375, 7.00244140625, 7.3687744140625, 7.735107421875, 8.1014404296875, 8.4677734375, 8.8341064453125, 9.200439453125, 9.5667724609375, 9.93310546875, 10.2994384765625, 10.665771484375, 11.0321044921875, 11.3984375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 22.0, 31.0, 51.0, 66.0, 99.0, 113.0, 175.0, 275.0, 353.0, 531.0, 847.0, 1348.0, 2094.0, 3087.0, 4952.0, 7676.0, 12482.0, 19936.0, 32705.0, 54208.0, 88267.0, 135683.0, 177069.0, 171387.0, 125971.0, 80762.0, 49143.0, 29690.0, 18351.0, 11241.0, 7040.0, 4406.0, 2805.0, 1895.0, 1206.0, 795.0, 561.0, 364.0, 242.0, 158.0, 124.0, 95.0, 56.0, 48.0, 32.0, 16.0, 16.0, 14.0, 13.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0], "bins": [-14.3359375, -13.8865966796875, -13.437255859375, -12.9879150390625, -12.53857421875, -12.0892333984375, -11.639892578125, -11.1905517578125, -10.7412109375, -10.2918701171875, -9.842529296875, -9.3931884765625, -8.94384765625, -8.4945068359375, -8.045166015625, -7.5958251953125, -7.146484375, -6.6971435546875, -6.247802734375, -5.7984619140625, -5.34912109375, -4.8997802734375, -4.450439453125, -4.0010986328125, -3.5517578125, -3.1024169921875, -2.653076171875, -2.2037353515625, -1.75439453125, -1.3050537109375, -0.855712890625, -0.4063720703125, 0.04296875, 0.4923095703125, 0.941650390625, 1.3909912109375, 1.84033203125, 2.2896728515625, 2.739013671875, 3.1883544921875, 3.6376953125, 4.0870361328125, 4.536376953125, 4.9857177734375, 5.43505859375, 5.8843994140625, 6.333740234375, 6.7830810546875, 7.232421875, 7.6817626953125, 8.131103515625, 8.5804443359375, 9.02978515625, 9.4791259765625, 9.928466796875, 10.3778076171875, 10.8271484375, 11.2764892578125, 11.725830078125, 12.1751708984375, 12.62451171875, 13.0738525390625, 13.523193359375, 13.9725341796875, 14.421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 7.0, 9.0, 5.0, 11.0, 20.0, 26.0, 39.0, 71.0, 85.0, 106.0, 122.0, 120.0, 75.0, 91.0, 69.0, 43.0, 26.0, 20.0, 10.0, 10.0, 12.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020427703857421875, -0.001950383186340332, -0.0018579959869384766, -0.001765608787536621, -0.0016732215881347656, -0.0015808343887329102, -0.0014884471893310547, -0.0013960599899291992, -0.0013036727905273438, -0.0012112855911254883, -0.0011188983917236328, -0.0010265111923217773, -0.0009341239929199219, -0.0008417367935180664, -0.0007493495941162109, -0.0006569623947143555, -0.0005645751953125, -0.00047218799591064453, -0.00037980079650878906, -0.0002874135971069336, -0.00019502639770507812, -0.00010263919830322266, -1.0251998901367188e-05, 8.213520050048828e-05, 0.00017452239990234375, 0.0002669095993041992, 0.0003592967987060547, 0.00045168399810791016, 0.0005440711975097656, 0.0006364583969116211, 0.0007288455963134766, 0.000821232795715332, 0.0009136199951171875, 0.001006007194519043, 0.0010983943939208984, 0.001190781593322754, 0.0012831687927246094, 0.0013755559921264648, 0.0014679431915283203, 0.0015603303909301758, 0.0016527175903320312, 0.0017451047897338867, 0.0018374919891357422, 0.0019298791885375977, 0.002022266387939453, 0.0021146535873413086, 0.002207040786743164, 0.0022994279861450195, 0.002391815185546875, 0.0024842023849487305, 0.002576589584350586, 0.0026689767837524414, 0.002761363983154297, 0.0028537511825561523, 0.002946138381958008, 0.0030385255813598633, 0.0031309127807617188, 0.0032232999801635742, 0.0033156871795654297, 0.003408074378967285, 0.0035004615783691406, 0.003592848777770996, 0.0036852359771728516, 0.003777623176574707, 0.0038700103759765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 17.0, 13.0, 21.0, 26.0, 29.0, 47.0, 85.0, 99.0, 150.0, 202.0, 290.0, 428.0, 618.0, 843.0, 1318.0, 1760.0, 2532.0, 3865.0, 5603.0, 8622.0, 13282.0, 20747.0, 32771.0, 52461.0, 81896.0, 120894.0, 155094.0, 160105.0, 130547.0, 91537.0, 58735.0, 36745.0, 23081.0, 14776.0, 9434.0, 6273.0, 4285.0, 2869.0, 1903.0, 1338.0, 931.0, 687.0, 498.0, 338.0, 242.0, 162.0, 115.0, 89.0, 42.0, 35.0, 31.0, 12.0, 20.0, 7.0, 8.0, 1.0, 5.0, 0.0, 1.0], "bins": [-12.1484375, -11.770263671875, -11.39208984375, -11.013916015625, -10.6357421875, -10.257568359375, -9.87939453125, -9.501220703125, -9.123046875, -8.744873046875, -8.36669921875, -7.988525390625, -7.6103515625, -7.232177734375, -6.85400390625, -6.475830078125, -6.09765625, -5.719482421875, -5.34130859375, -4.963134765625, -4.5849609375, -4.206787109375, -3.82861328125, -3.450439453125, -3.072265625, -2.694091796875, -2.31591796875, -1.937744140625, -1.5595703125, -1.181396484375, -0.80322265625, -0.425048828125, -0.046875, 0.331298828125, 0.70947265625, 1.087646484375, 1.4658203125, 1.843994140625, 2.22216796875, 2.600341796875, 2.978515625, 3.356689453125, 3.73486328125, 4.113037109375, 4.4912109375, 4.869384765625, 5.24755859375, 5.625732421875, 6.00390625, 6.382080078125, 6.76025390625, 7.138427734375, 7.5166015625, 7.894775390625, 8.27294921875, 8.651123046875, 9.029296875, 9.407470703125, 9.78564453125, 10.163818359375, 10.5419921875, 10.920166015625, 11.29833984375, 11.676513671875, 12.0546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 20.0, 17.0, 26.0, 23.0, 34.0, 39.0, 44.0, 55.0, 63.0, 52.0, 59.0, 72.0, 41.0, 48.0, 47.0, 47.0, 32.0, 26.0, 43.0, 17.0, 29.0, 24.0, 14.0, 12.0, 15.0, 13.0, 8.0, 5.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 3.0, 3.0], "bins": [-5.84765625, -5.699462890625, -5.55126953125, -5.403076171875, -5.2548828125, -5.106689453125, -4.95849609375, -4.810302734375, -4.662109375, -4.513916015625, -4.36572265625, -4.217529296875, -4.0693359375, -3.921142578125, -3.77294921875, -3.624755859375, -3.4765625, -3.328369140625, -3.18017578125, -3.031982421875, -2.8837890625, -2.735595703125, -2.58740234375, -2.439208984375, -2.291015625, -2.142822265625, -1.99462890625, -1.846435546875, -1.6982421875, -1.550048828125, -1.40185546875, -1.253662109375, -1.10546875, -0.957275390625, -0.80908203125, -0.660888671875, -0.5126953125, -0.364501953125, -0.21630859375, -0.068115234375, 0.080078125, 0.228271484375, 0.37646484375, 0.524658203125, 0.6728515625, 0.821044921875, 0.96923828125, 1.117431640625, 1.265625, 1.413818359375, 1.56201171875, 1.710205078125, 1.8583984375, 2.006591796875, 2.15478515625, 2.302978515625, 2.451171875, 2.599365234375, 2.74755859375, 2.895751953125, 3.0439453125, 3.192138671875, 3.34033203125, 3.488525390625, 3.63671875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 12.0, 9.0, 18.0, 22.0, 21.0, 25.0, 21.0, 46.0, 45.0, 49.0, 49.0, 62.0, 58.0, 68.0, 76.0, 57.0, 59.0, 45.0, 63.0, 36.0, 34.0, 29.0, 29.0, 16.0, 8.0, 14.0, 8.0, 2.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.97602081298828, -30.03790283203125, -29.09978485107422, -28.161666870117188, -27.223548889160156, -26.285430908203125, -25.347312927246094, -24.409194946289062, -23.47107696533203, -22.532958984375, -21.59484100341797, -20.656723022460938, -19.718605041503906, -18.780487060546875, -17.842369079589844, -16.904251098632812, -15.966133117675781, -15.02801513671875, -14.089897155761719, -13.151779174804688, -12.213661193847656, -11.275543212890625, -10.337425231933594, -9.399307250976562, -8.461189270019531, -7.5230712890625, -6.584953308105469, -5.6468353271484375, -4.708717346191406, -3.770599365234375, -2.8324813842773438, -1.8943634033203125, -0.9562473297119141, -0.018129348754882812, 0.9199886322021484, 1.8581066131591797, 2.796224594116211, 3.734342575073242, 4.672460556030273, 5.610578536987305, 6.548696517944336, 7.486814498901367, 8.424932479858398, 9.36305046081543, 10.301168441772461, 11.239286422729492, 12.177404403686523, 13.115522384643555, 14.053640365600586, 14.991758346557617, 15.929876327514648, 16.86799430847168, 17.80611228942871, 18.744230270385742, 19.682348251342773, 20.620466232299805, 21.558584213256836, 22.496702194213867, 23.4348201751709, 24.37293815612793, 25.31105613708496, 26.249174118041992, 27.187292098999023, 28.125410079956055, 29.063528060913086]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0, 4.0, 5.0, 7.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 21.0, 24.0, 34.0, 20.0, 23.0, 31.0, 31.0, 45.0, 40.0, 33.0, 34.0, 45.0, 32.0, 37.0, 53.0, 50.0, 29.0, 44.0, 34.0, 33.0, 42.0, 18.0, 26.0, 27.0, 19.0, 20.0, 14.0, 13.0, 14.0, 2.0, 9.0, 9.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-17.848920822143555, -17.321720123291016, -16.79452133178711, -16.26732063293457, -15.740120887756348, -15.212921142578125, -14.685720443725586, -14.158520698547363, -13.63132095336914, -13.104121208190918, -12.576921463012695, -12.049720764160156, -11.522521018981934, -10.995321273803711, -10.468120574951172, -9.94092082977295, -9.413721084594727, -8.886521339416504, -8.359321594238281, -7.832120895385742, -7.3049211502075195, -6.777721405029297, -6.250521183013916, -5.723320960998535, -5.1961212158203125, -4.66892147064209, -4.141721248626709, -3.6145212650299072, -3.0873212814331055, -2.5601212978363037, -2.032921314239502, -1.5057213306427002, -0.9785223007202148, -0.4513223171234131, 0.07587766647338867, 0.6030776500701904, 1.1302776336669922, 1.657477617263794, 2.1846776008605957, 2.7118775844573975, 3.239077568054199, 3.766277551651001, 4.293477535247803, 4.820677757263184, 5.347877502441406, 5.875077247619629, 6.40227746963501, 6.929477691650391, 7.456677436828613, 7.983877182006836, 8.511077880859375, 9.038277626037598, 9.56547737121582, 10.092677116394043, 10.619876861572266, 11.147077560424805, 11.674277305603027, 12.20147705078125, 12.728677749633789, 13.255877494812012, 13.783077239990234, 14.310276985168457, 14.83747673034668, 15.364677429199219, 15.891877174377441]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 9.0, 22.0, 28.0, 38.0, 43.0, 98.0, 137.0, 217.0, 296.0, 468.0, 752.0, 1148.0, 1680.0, 2782.0, 4465.0, 7223.0, 11697.0, 20046.0, 34415.0, 61549.0, 111691.0, 211138.0, 403587.0, 699685.0, 898662.0, 747450.0, 447110.0, 237355.0, 125895.0, 68493.0, 38589.0, 22362.0, 13181.0, 8233.0, 5059.0, 3196.0, 1963.0, 1281.0, 795.0, 513.0, 335.0, 214.0, 131.0, 90.0, 62.0, 34.0, 24.0, 13.0, 10.0, 10.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-19.390625, -18.795654296875, -18.20068359375, -17.605712890625, -17.0107421875, -16.415771484375, -15.82080078125, -15.225830078125, -14.630859375, -14.035888671875, -13.44091796875, -12.845947265625, -12.2509765625, -11.656005859375, -11.06103515625, -10.466064453125, -9.87109375, -9.276123046875, -8.68115234375, -8.086181640625, -7.4912109375, -6.896240234375, -6.30126953125, -5.706298828125, -5.111328125, -4.516357421875, -3.92138671875, -3.326416015625, -2.7314453125, -2.136474609375, -1.54150390625, -0.946533203125, -0.3515625, 0.243408203125, 0.83837890625, 1.433349609375, 2.0283203125, 2.623291015625, 3.21826171875, 3.813232421875, 4.408203125, 5.003173828125, 5.59814453125, 6.193115234375, 6.7880859375, 7.383056640625, 7.97802734375, 8.572998046875, 9.16796875, 9.762939453125, 10.35791015625, 10.952880859375, 11.5478515625, 12.142822265625, 12.73779296875, 13.332763671875, 13.927734375, 14.522705078125, 15.11767578125, 15.712646484375, 16.3076171875, 16.902587890625, 17.49755859375, 18.092529296875, 18.6875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 8.0, 9.0, 7.0, 12.0, 12.0, 17.0, 18.0, 30.0, 22.0, 24.0, 31.0, 36.0, 40.0, 31.0, 40.0, 31.0, 43.0, 52.0, 34.0, 55.0, 41.0, 35.0, 35.0, 31.0, 38.0, 31.0, 33.0, 34.0, 29.0, 25.0, 19.0, 21.0, 14.0, 12.0, 11.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9088134765625, -10.528564453125, -10.1483154296875, -9.76806640625, -9.3878173828125, -9.007568359375, -8.6273193359375, -8.2470703125, -7.8668212890625, -7.486572265625, -7.1063232421875, -6.72607421875, -6.3458251953125, -5.965576171875, -5.5853271484375, -5.205078125, -4.8248291015625, -4.444580078125, -4.0643310546875, -3.68408203125, -3.3038330078125, -2.923583984375, -2.5433349609375, -2.1630859375, -1.7828369140625, -1.402587890625, -1.0223388671875, -0.64208984375, -0.2618408203125, 0.118408203125, 0.4986572265625, 0.87890625, 1.2591552734375, 1.639404296875, 2.0196533203125, 2.39990234375, 2.7801513671875, 3.160400390625, 3.5406494140625, 3.9208984375, 4.3011474609375, 4.681396484375, 5.0616455078125, 5.44189453125, 5.8221435546875, 6.202392578125, 6.5826416015625, 6.962890625, 7.3431396484375, 7.723388671875, 8.1036376953125, 8.48388671875, 8.8641357421875, 9.244384765625, 9.6246337890625, 10.0048828125, 10.3851318359375, 10.765380859375, 11.1456298828125, 11.52587890625, 11.9061279296875, 12.286376953125, 12.6666259765625, 13.046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 8.0, 25.0, 30.0, 42.0, 60.0, 101.0, 187.0, 292.0, 416.0, 651.0, 1018.0, 1564.0, 2576.0, 4263.0, 6923.0, 11905.0, 19841.0, 33560.0, 58908.0, 104026.0, 184420.0, 324443.0, 541175.0, 770886.0, 782593.0, 558549.0, 337277.0, 192609.0, 108068.0, 61466.0, 35211.0, 20470.0, 12014.0, 7128.0, 4374.0, 2712.0, 1628.0, 991.0, 682.0, 424.0, 270.0, 172.0, 100.0, 75.0, 53.0, 25.0, 25.0, 15.0, 16.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.08349609375, -16.4951171875, -15.90673828125, -15.318359375, -14.72998046875, -14.1416015625, -13.55322265625, -12.96484375, -12.37646484375, -11.7880859375, -11.19970703125, -10.611328125, -10.02294921875, -9.4345703125, -8.84619140625, -8.2578125, -7.66943359375, -7.0810546875, -6.49267578125, -5.904296875, -5.31591796875, -4.7275390625, -4.13916015625, -3.55078125, -2.96240234375, -2.3740234375, -1.78564453125, -1.197265625, -0.60888671875, -0.0205078125, 0.56787109375, 1.15625, 1.74462890625, 2.3330078125, 2.92138671875, 3.509765625, 4.09814453125, 4.6865234375, 5.27490234375, 5.86328125, 6.45166015625, 7.0400390625, 7.62841796875, 8.216796875, 8.80517578125, 9.3935546875, 9.98193359375, 10.5703125, 11.15869140625, 11.7470703125, 12.33544921875, 12.923828125, 13.51220703125, 14.1005859375, 14.68896484375, 15.27734375, 15.86572265625, 16.4541015625, 17.04248046875, 17.630859375, 18.21923828125, 18.8076171875, 19.39599609375, 19.984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 11.0, 14.0, 13.0, 19.0, 20.0, 28.0, 44.0, 48.0, 42.0, 61.0, 82.0, 94.0, 95.0, 120.0, 153.0, 162.0, 204.0, 194.0, 225.0, 236.0, 257.0, 215.0, 227.0, 192.0, 205.0, 181.0, 137.0, 133.0, 95.0, 92.0, 91.0, 76.0, 55.0, 55.0, 38.0, 23.0, 26.0, 13.0, 16.0, 14.0, 17.0, 7.0, 3.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0], "bins": [-5.875, -5.6947021484375, -5.514404296875, -5.3341064453125, -5.15380859375, -4.9735107421875, -4.793212890625, -4.6129150390625, -4.4326171875, -4.2523193359375, -4.072021484375, -3.8917236328125, -3.71142578125, -3.5311279296875, -3.350830078125, -3.1705322265625, -2.990234375, -2.8099365234375, -2.629638671875, -2.4493408203125, -2.26904296875, -2.0887451171875, -1.908447265625, -1.7281494140625, -1.5478515625, -1.3675537109375, -1.187255859375, -1.0069580078125, -0.82666015625, -0.6463623046875, -0.466064453125, -0.2857666015625, -0.10546875, 0.0748291015625, 0.255126953125, 0.4354248046875, 0.61572265625, 0.7960205078125, 0.976318359375, 1.1566162109375, 1.3369140625, 1.5172119140625, 1.697509765625, 1.8778076171875, 2.05810546875, 2.2384033203125, 2.418701171875, 2.5989990234375, 2.779296875, 2.9595947265625, 3.139892578125, 3.3201904296875, 3.50048828125, 3.6807861328125, 3.861083984375, 4.0413818359375, 4.2216796875, 4.4019775390625, 4.582275390625, 4.7625732421875, 4.94287109375, 5.1231689453125, 5.303466796875, 5.4837646484375, 5.6640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 7.0, 7.0, 6.0, 13.0, 15.0, 26.0, 28.0, 36.0, 41.0, 53.0, 51.0, 75.0, 86.0, 73.0, 88.0, 52.0, 74.0, 50.0, 48.0, 33.0, 32.0, 21.0, 26.0, 4.0, 16.0, 12.0, 7.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.978443145751953, -29.03729820251465, -28.09615135192871, -27.155006408691406, -26.2138614654541, -25.272716522216797, -24.33156967163086, -23.390424728393555, -22.44927978515625, -21.508134841918945, -20.566987991333008, -19.625843048095703, -18.6846981048584, -17.743553161621094, -16.802406311035156, -15.861261367797852, -14.920114517211914, -13.978968620300293, -13.037823677062988, -12.096677780151367, -11.155532836914062, -10.214386940002441, -9.27324104309082, -8.332096099853516, -7.3909502029418945, -6.449804782867432, -5.508659362792969, -4.567513465881348, -3.6263680458068848, -2.685222625732422, -1.7440767288208008, -0.8029313087463379, 0.1382160186767578, 1.0793615579605103, 2.0205070972442627, 2.9616527557373047, 3.9027981758117676, 4.8439435958862305, 5.785089492797852, 6.7262349128723145, 7.667380332946777, 8.608526229858398, 9.549671173095703, 10.490817070007324, 11.431962966918945, 12.37310791015625, 13.314253807067871, 14.255399703979492, 15.196544647216797, 16.1376895904541, 17.07883644104004, 18.019981384277344, 18.96112632751465, 19.902271270751953, 20.84341812133789, 21.784563064575195, 22.7257080078125, 23.666852951049805, 24.607999801635742, 25.549144744873047, 26.49028968811035, 27.431434631347656, 28.372581481933594, 29.3137264251709, 30.254873275756836]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 5.0, 14.0, 9.0, 20.0, 17.0, 22.0, 16.0, 32.0, 18.0, 24.0, 36.0, 31.0, 42.0, 38.0, 40.0, 41.0, 47.0, 47.0, 52.0, 50.0, 40.0, 38.0, 32.0, 40.0, 32.0, 29.0, 24.0, 23.0, 24.0, 16.0, 15.0, 16.0, 9.0, 9.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.447772026062012, -15.009613037109375, -14.571454048156738, -14.133295059204102, -13.695135116577148, -13.256977081298828, -12.818817138671875, -12.380658149719238, -11.942499160766602, -11.504340171813965, -11.066181182861328, -10.628022193908691, -10.189863204956055, -9.751703262329102, -9.313544273376465, -8.875385284423828, -8.437226295471191, -7.999067306518555, -7.560908317565918, -7.122748851776123, -6.684589862823486, -6.24643087387085, -5.808271408081055, -5.370112419128418, -4.931953430175781, -4.4937944412231445, -4.055635452270508, -3.617475986480713, -3.179316997528076, -2.7411580085754395, -2.3029987812042236, -1.8648395538330078, -1.426680564880371, -0.9885214567184448, -0.5503623485565186, -0.11220324039459229, 0.325955867767334, 0.7641148567199707, 1.2022740840911865, 1.6404333114624023, 2.078592300415039, 2.516751289367676, 2.9549105167388916, 3.3930697441101074, 3.831228733062744, 4.269387722015381, 4.707547187805176, 5.1457061767578125, 5.583865165710449, 6.022024154663086, 6.460183143615723, 6.898342609405518, 7.336501598358154, 7.774660587310791, 8.212820053100586, 8.650979042053223, 9.08913803100586, 9.527297019958496, 9.965456008911133, 10.40361499786377, 10.841773986816406, 11.27993392944336, 11.718092918395996, 12.156251907348633, 12.59441089630127]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 7.0, 9.0, 22.0, 30.0, 39.0, 68.0, 99.0, 138.0, 255.0, 418.0, 708.0, 1266.0, 2312.0, 4535.0, 9445.0, 19870.0, 42956.0, 88470.0, 161694.0, 228097.0, 212543.0, 137940.0, 71881.0, 34063.0, 15960.0, 7550.0, 3625.0, 2004.0, 1014.0, 584.0, 394.0, 186.0, 130.0, 71.0, 53.0, 25.0, 25.0, 23.0, 20.0, 6.0, 3.0, 7.0, 7.0, 3.0, 1.0], "bins": [-23.21875, -22.62109375, -22.0234375, -21.42578125, -20.828125, -20.23046875, -19.6328125, -19.03515625, -18.4375, -17.83984375, -17.2421875, -16.64453125, -16.046875, -15.44921875, -14.8515625, -14.25390625, -13.65625, -13.05859375, -12.4609375, -11.86328125, -11.265625, -10.66796875, -10.0703125, -9.47265625, -8.875, -8.27734375, -7.6796875, -7.08203125, -6.484375, -5.88671875, -5.2890625, -4.69140625, -4.09375, -3.49609375, -2.8984375, -2.30078125, -1.703125, -1.10546875, -0.5078125, 0.08984375, 0.6875, 1.28515625, 1.8828125, 2.48046875, 3.078125, 3.67578125, 4.2734375, 4.87109375, 5.46875, 6.06640625, 6.6640625, 7.26171875, 7.859375, 8.45703125, 9.0546875, 9.65234375, 10.25, 10.84765625, 11.4453125, 12.04296875, 12.640625, 13.23828125, 13.8359375, 14.43359375, 15.03125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 2.0, 9.0, 7.0, 10.0, 14.0, 17.0, 13.0, 24.0, 27.0, 23.0, 30.0, 25.0, 33.0, 34.0, 44.0, 32.0, 38.0, 46.0, 45.0, 48.0, 46.0, 40.0, 38.0, 40.0, 33.0, 32.0, 39.0, 24.0, 18.0, 31.0, 29.0, 20.0, 17.0, 17.0, 10.0, 4.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0], "bins": [-16.59375, -16.1480712890625, -15.702392578125, -15.2567138671875, -14.81103515625, -14.3653564453125, -13.919677734375, -13.4739990234375, -13.0283203125, -12.5826416015625, -12.136962890625, -11.6912841796875, -11.24560546875, -10.7999267578125, -10.354248046875, -9.9085693359375, -9.462890625, -9.0172119140625, -8.571533203125, -8.1258544921875, -7.68017578125, -7.2344970703125, -6.788818359375, -6.3431396484375, -5.8974609375, -5.4517822265625, -5.006103515625, -4.5604248046875, -4.11474609375, -3.6690673828125, -3.223388671875, -2.7777099609375, -2.33203125, -1.8863525390625, -1.440673828125, -0.9949951171875, -0.54931640625, -0.1036376953125, 0.342041015625, 0.7877197265625, 1.2333984375, 1.6790771484375, 2.124755859375, 2.5704345703125, 3.01611328125, 3.4617919921875, 3.907470703125, 4.3531494140625, 4.798828125, 5.2445068359375, 5.690185546875, 6.1358642578125, 6.58154296875, 7.0272216796875, 7.472900390625, 7.9185791015625, 8.3642578125, 8.8099365234375, 9.255615234375, 9.7012939453125, 10.14697265625, 10.5926513671875, 11.038330078125, 11.4840087890625, 11.9296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 2.0, 12.0, 12.0, 11.0, 27.0, 34.0, 51.0, 70.0, 120.0, 200.0, 327.0, 526.0, 982.0, 1755.0, 3346.0, 6190.0, 13110.0, 27371.0, 60249.0, 127837.0, 236837.0, 266083.0, 159365.0, 75566.0, 35308.0, 16326.0, 7895.0, 4046.0, 2102.0, 1132.0, 619.0, 373.0, 242.0, 169.0, 88.0, 48.0, 49.0, 19.0, 14.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.296875, -22.59423828125, -21.8916015625, -21.18896484375, -20.486328125, -19.78369140625, -19.0810546875, -18.37841796875, -17.67578125, -16.97314453125, -16.2705078125, -15.56787109375, -14.865234375, -14.16259765625, -13.4599609375, -12.75732421875, -12.0546875, -11.35205078125, -10.6494140625, -9.94677734375, -9.244140625, -8.54150390625, -7.8388671875, -7.13623046875, -6.43359375, -5.73095703125, -5.0283203125, -4.32568359375, -3.623046875, -2.92041015625, -2.2177734375, -1.51513671875, -0.8125, -0.10986328125, 0.5927734375, 1.29541015625, 1.998046875, 2.70068359375, 3.4033203125, 4.10595703125, 4.80859375, 5.51123046875, 6.2138671875, 6.91650390625, 7.619140625, 8.32177734375, 9.0244140625, 9.72705078125, 10.4296875, 11.13232421875, 11.8349609375, 12.53759765625, 13.240234375, 13.94287109375, 14.6455078125, 15.34814453125, 16.05078125, 16.75341796875, 17.4560546875, 18.15869140625, 18.861328125, 19.56396484375, 20.2666015625, 20.96923828125, 21.671875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 9.0, 8.0, 11.0, 12.0, 10.0, 19.0, 16.0, 17.0, 20.0, 20.0, 27.0, 27.0, 29.0, 29.0, 34.0, 32.0, 40.0, 38.0, 36.0, 42.0, 39.0, 32.0, 41.0, 34.0, 39.0, 37.0, 38.0, 37.0, 31.0, 27.0, 28.0, 20.0, 15.0, 14.0, 10.0, 8.0, 18.0, 8.0, 7.0, 3.0, 6.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.0711669921875, -6.829833984375, -6.5885009765625, -6.34716796875, -6.1058349609375, -5.864501953125, -5.6231689453125, -5.3818359375, -5.1405029296875, -4.899169921875, -4.6578369140625, -4.41650390625, -4.1751708984375, -3.933837890625, -3.6925048828125, -3.451171875, -3.2098388671875, -2.968505859375, -2.7271728515625, -2.48583984375, -2.2445068359375, -2.003173828125, -1.7618408203125, -1.5205078125, -1.2791748046875, -1.037841796875, -0.7965087890625, -0.55517578125, -0.3138427734375, -0.072509765625, 0.1688232421875, 0.41015625, 0.6514892578125, 0.892822265625, 1.1341552734375, 1.37548828125, 1.6168212890625, 1.858154296875, 2.0994873046875, 2.3408203125, 2.5821533203125, 2.823486328125, 3.0648193359375, 3.30615234375, 3.5474853515625, 3.788818359375, 4.0301513671875, 4.271484375, 4.5128173828125, 4.754150390625, 4.9954833984375, 5.23681640625, 5.4781494140625, 5.719482421875, 5.9608154296875, 6.2021484375, 6.4434814453125, 6.684814453125, 6.9261474609375, 7.16748046875, 7.4088134765625, 7.650146484375, 7.8914794921875, 8.1328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 14.0, 12.0, 26.0, 40.0, 70.0, 109.0, 170.0, 247.0, 388.0, 634.0, 1020.0, 1881.0, 3208.0, 5762.0, 10770.0, 21674.0, 45625.0, 100446.0, 214045.0, 293346.0, 185170.0, 84835.0, 38826.0, 18645.0, 9446.0, 5219.0, 2752.0, 1606.0, 964.0, 595.0, 354.0, 220.0, 155.0, 80.0, 60.0, 44.0, 23.0, 23.0, 7.0, 13.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.35302734375, -10.9794921875, -10.60595703125, -10.232421875, -9.85888671875, -9.4853515625, -9.11181640625, -8.73828125, -8.36474609375, -7.9912109375, -7.61767578125, -7.244140625, -6.87060546875, -6.4970703125, -6.12353515625, -5.75, -5.37646484375, -5.0029296875, -4.62939453125, -4.255859375, -3.88232421875, -3.5087890625, -3.13525390625, -2.76171875, -2.38818359375, -2.0146484375, -1.64111328125, -1.267578125, -0.89404296875, -0.5205078125, -0.14697265625, 0.2265625, 0.60009765625, 0.9736328125, 1.34716796875, 1.720703125, 2.09423828125, 2.4677734375, 2.84130859375, 3.21484375, 3.58837890625, 3.9619140625, 4.33544921875, 4.708984375, 5.08251953125, 5.4560546875, 5.82958984375, 6.203125, 6.57666015625, 6.9501953125, 7.32373046875, 7.697265625, 8.07080078125, 8.4443359375, 8.81787109375, 9.19140625, 9.56494140625, 9.9384765625, 10.31201171875, 10.685546875, 11.05908203125, 11.4326171875, 11.80615234375, 12.1796875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 5.0, 8.0, 11.0, 7.0, 15.0, 8.0, 31.0, 33.0, 50.0, 46.0, 44.0, 64.0, 53.0, 73.0, 64.0, 66.0, 63.0, 52.0, 62.0, 54.0, 36.0, 25.0, 28.0, 22.0, 23.0, 14.0, 9.0, 5.0, 6.0, 3.0, 6.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004525184631347656, -0.0004387795925140381, -0.00042504072189331055, -0.000411301851272583, -0.00039756298065185547, -0.00038382411003112793, -0.0003700852394104004, -0.00035634636878967285, -0.0003426074981689453, -0.0003288686275482178, -0.00031512975692749023, -0.0003013908863067627, -0.00028765201568603516, -0.0002739131450653076, -0.0002601742744445801, -0.00024643540382385254, -0.000232696533203125, -0.00021895766258239746, -0.00020521879196166992, -0.00019147992134094238, -0.00017774105072021484, -0.0001640021800994873, -0.00015026330947875977, -0.00013652443885803223, -0.0001227855682373047, -0.00010904669761657715, -9.530782699584961e-05, -8.156895637512207e-05, -6.783008575439453e-05, -5.409121513366699e-05, -4.035234451293945e-05, -2.6613473892211914e-05, -1.2874603271484375e-05, 8.642673492431641e-07, 1.4603137969970703e-05, 2.8342008590698242e-05, 4.208087921142578e-05, 5.581974983215332e-05, 6.955862045288086e-05, 8.32974910736084e-05, 9.703636169433594e-05, 0.00011077523231506348, 0.00012451410293579102, 0.00013825297355651855, 0.0001519918441772461, 0.00016573071479797363, 0.00017946958541870117, 0.0001932084560394287, 0.00020694732666015625, 0.0002206861972808838, 0.00023442506790161133, 0.00024816393852233887, 0.0002619028091430664, 0.00027564167976379395, 0.0002893805503845215, 0.000303119421005249, 0.00031685829162597656, 0.0003305971622467041, 0.00034433603286743164, 0.0003580749034881592, 0.0003718137741088867, 0.00038555264472961426, 0.0003992915153503418, 0.00041303038597106934, 0.0004267692565917969]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 15.0, 17.0, 21.0, 32.0, 51.0, 68.0, 109.0, 175.0, 263.0, 444.0, 729.0, 1176.0, 1987.0, 3424.0, 5740.0, 10252.0, 18431.0, 33547.0, 59727.0, 101245.0, 153565.0, 188641.0, 172928.0, 123220.0, 75111.0, 42843.0, 23817.0, 13081.0, 7376.0, 4215.0, 2496.0, 1510.0, 816.0, 550.0, 356.0, 202.0, 123.0, 93.0, 45.0, 36.0, 24.0, 16.0, 12.0, 6.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.97613525390625, -6.7413330078125, -6.50653076171875, -6.271728515625, -6.03692626953125, -5.8021240234375, -5.56732177734375, -5.33251953125, -5.09771728515625, -4.8629150390625, -4.62811279296875, -4.393310546875, -4.15850830078125, -3.9237060546875, -3.68890380859375, -3.4541015625, -3.21929931640625, -2.9844970703125, -2.74969482421875, -2.514892578125, -2.28009033203125, -2.0452880859375, -1.81048583984375, -1.57568359375, -1.34088134765625, -1.1060791015625, -0.87127685546875, -0.636474609375, -0.40167236328125, -0.1668701171875, 0.06793212890625, 0.302734375, 0.53753662109375, 0.7723388671875, 1.00714111328125, 1.241943359375, 1.47674560546875, 1.7115478515625, 1.94635009765625, 2.18115234375, 2.41595458984375, 2.6507568359375, 2.88555908203125, 3.120361328125, 3.35516357421875, 3.5899658203125, 3.82476806640625, 4.0595703125, 4.29437255859375, 4.5291748046875, 4.76397705078125, 4.998779296875, 5.23358154296875, 5.4683837890625, 5.70318603515625, 5.93798828125, 6.17279052734375, 6.4075927734375, 6.64239501953125, 6.877197265625, 7.11199951171875, 7.3468017578125, 7.58160400390625, 7.81640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 12.0, 15.0, 18.0, 18.0, 25.0, 35.0, 43.0, 33.0, 38.0, 53.0, 47.0, 51.0, 59.0, 56.0, 54.0, 54.0, 54.0, 46.0, 33.0, 42.0, 29.0, 22.0, 22.0, 17.0, 16.0, 14.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.125, -2.058868408203125, -1.99273681640625, -1.926605224609375, -1.8604736328125, -1.794342041015625, -1.72821044921875, -1.662078857421875, -1.595947265625, -1.529815673828125, -1.46368408203125, -1.397552490234375, -1.3314208984375, -1.265289306640625, -1.19915771484375, -1.133026123046875, -1.06689453125, -1.000762939453125, -0.93463134765625, -0.868499755859375, -0.8023681640625, -0.736236572265625, -0.67010498046875, -0.603973388671875, -0.537841796875, -0.471710205078125, -0.40557861328125, -0.339447021484375, -0.2733154296875, -0.207183837890625, -0.14105224609375, -0.074920654296875, -0.0087890625, 0.057342529296875, 0.12347412109375, 0.189605712890625, 0.2557373046875, 0.321868896484375, 0.38800048828125, 0.454132080078125, 0.520263671875, 0.586395263671875, 0.65252685546875, 0.718658447265625, 0.7847900390625, 0.850921630859375, 0.91705322265625, 0.983184814453125, 1.04931640625, 1.115447998046875, 1.18157958984375, 1.247711181640625, 1.3138427734375, 1.379974365234375, 1.44610595703125, 1.512237548828125, 1.578369140625, 1.644500732421875, 1.71063232421875, 1.776763916015625, 1.8428955078125, 1.909027099609375, 1.97515869140625, 2.041290283203125, 2.107421875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 10.0, 8.0, 21.0, 42.0, 39.0, 46.0, 51.0, 69.0, 77.0, 84.0, 83.0, 71.0, 71.0, 60.0, 55.0, 37.0, 38.0, 29.0, 19.0, 16.0, 14.0, 14.0, 7.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.729543685913086, -28.753942489624023, -27.778343200683594, -26.80274200439453, -25.82714080810547, -24.85154151916504, -23.875940322875977, -22.900341033935547, -21.924739837646484, -20.949138641357422, -19.973539352416992, -18.99793815612793, -18.0223388671875, -17.046737670898438, -16.071136474609375, -15.095536231994629, -14.119935989379883, -13.144335746765137, -12.16873550415039, -11.193134307861328, -10.217534065246582, -9.241933822631836, -8.266332626342773, -7.290732383728027, -6.315132141113281, -5.339531898498535, -4.363931179046631, -3.3883306980133057, -2.4127302169799805, -1.4371299743652344, -0.4615292549133301, 0.5140714645385742, 1.4896736145019531, 2.4652740955352783, 3.4408745765686035, 4.416475296020508, 5.392075538635254, 6.36767578125, 7.343276500701904, 8.318877220153809, 9.294477462768555, 10.2700777053833, 11.245677947998047, 12.22127914428711, 13.196879386901855, 14.172479629516602, 15.148080825805664, 16.123680114746094, 17.099281311035156, 18.07488250732422, 19.05048179626465, 20.02608299255371, 21.00168228149414, 21.977283477783203, 22.952884674072266, 23.928485870361328, 24.904085159301758, 25.87968635559082, 26.85528564453125, 27.830886840820312, 28.806488037109375, 29.782087326049805, 30.757688522338867, 31.733287811279297, 32.70888900756836]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 6.0, 7.0, 18.0, 11.0, 22.0, 14.0, 25.0, 24.0, 26.0, 25.0, 34.0, 36.0, 38.0, 35.0, 51.0, 45.0, 55.0, 44.0, 42.0, 57.0, 49.0, 33.0, 33.0, 39.0, 37.0, 24.0, 21.0, 27.0, 20.0, 21.0, 11.0, 13.0, 6.0, 7.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.315722465515137, -14.86660099029541, -14.417479515075684, -13.968358039855957, -13.51923656463623, -13.070115089416504, -12.620992660522461, -12.171871185302734, -11.722749710083008, -11.273628234863281, -10.824506759643555, -10.375385284423828, -9.926263809204102, -9.477142333984375, -9.028020858764648, -8.578899383544922, -8.129777908325195, -7.680656433105469, -7.231534957885742, -6.782413482666016, -6.333292007446289, -5.8841705322265625, -5.435048580169678, -4.985927104949951, -4.536805629730225, -4.087684154510498, -3.6385626792907715, -3.189440965652466, -2.7403194904327393, -2.2911980152130127, -1.842076301574707, -1.3929548263549805, -0.9438333511352539, -0.49471181631088257, -0.04559028148651123, 0.4035313129425049, 0.8526527881622314, 1.301774263381958, 1.7508959770202637, 2.2000174522399902, 2.649138927459717, 3.0982604026794434, 3.54738187789917, 3.9965035915374756, 4.445625305175781, 4.894746780395508, 5.343868255615234, 5.792989730834961, 6.2421112060546875, 6.691232681274414, 7.140354156494141, 7.589475631713867, 8.038597106933594, 8.48771858215332, 8.936840057373047, 9.385961532592773, 9.8350830078125, 10.284204483032227, 10.733325958251953, 11.18244743347168, 11.631568908691406, 12.080690383911133, 12.52981185913086, 12.978933334350586, 13.428055763244629]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 10.0, 15.0, 26.0, 48.0, 51.0, 80.0, 124.0, 193.0, 292.0, 456.0, 691.0, 1115.0, 1617.0, 2578.0, 4171.0, 6560.0, 10701.0, 17148.0, 27464.0, 42696.0, 65214.0, 93633.0, 122722.0, 140931.0, 138732.0, 117389.0, 87851.0, 59754.0, 39667.0, 24731.0, 15712.0, 9706.0, 6121.0, 3695.0, 2378.0, 1527.0, 931.0, 652.0, 403.0, 253.0, 176.0, 113.0, 82.0, 44.0, 31.0, 14.0, 15.0, 8.0, 11.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.015625, -13.546875, -13.078125, -12.609375, -12.140625, -11.671875, -11.203125, -10.734375, -10.265625, -9.796875, -9.328125, -8.859375, -8.390625, -7.921875, -7.453125, -6.984375, -6.515625, -6.046875, -5.578125, -5.109375, -4.640625, -4.171875, -3.703125, -3.234375, -2.765625, -2.296875, -1.828125, -1.359375, -0.890625, -0.421875, 0.046875, 0.515625, 0.984375, 1.453125, 1.921875, 2.390625, 2.859375, 3.328125, 3.796875, 4.265625, 4.734375, 5.203125, 5.671875, 6.140625, 6.609375, 7.078125, 7.546875, 8.015625, 8.484375, 8.953125, 9.421875, 9.890625, 10.359375, 10.828125, 11.296875, 11.765625, 12.234375, 12.703125, 13.171875, 13.640625, 14.109375, 14.578125, 15.046875, 15.515625, 15.984375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 5.0, 4.0, 3.0, 12.0, 8.0, 11.0, 13.0, 10.0, 20.0, 18.0, 31.0, 35.0, 28.0, 33.0, 45.0, 46.0, 33.0, 44.0, 43.0, 46.0, 50.0, 44.0, 41.0, 45.0, 29.0, 53.0, 38.0, 29.0, 36.0, 23.0, 24.0, 20.0, 11.0, 9.0, 15.0, 9.0, 10.0, 11.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.7265625, -15.252685546875, -14.77880859375, -14.304931640625, -13.8310546875, -13.357177734375, -12.88330078125, -12.409423828125, -11.935546875, -11.461669921875, -10.98779296875, -10.513916015625, -10.0400390625, -9.566162109375, -9.09228515625, -8.618408203125, -8.14453125, -7.670654296875, -7.19677734375, -6.722900390625, -6.2490234375, -5.775146484375, -5.30126953125, -4.827392578125, -4.353515625, -3.879638671875, -3.40576171875, -2.931884765625, -2.4580078125, -1.984130859375, -1.51025390625, -1.036376953125, -0.5625, -0.088623046875, 0.38525390625, 0.859130859375, 1.3330078125, 1.806884765625, 2.28076171875, 2.754638671875, 3.228515625, 3.702392578125, 4.17626953125, 4.650146484375, 5.1240234375, 5.597900390625, 6.07177734375, 6.545654296875, 7.01953125, 7.493408203125, 7.96728515625, 8.441162109375, 8.9150390625, 9.388916015625, 9.86279296875, 10.336669921875, 10.810546875, 11.284423828125, 11.75830078125, 12.232177734375, 12.7060546875, 13.179931640625, 13.65380859375, 14.127685546875, 14.6015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 14.0, 16.0, 23.0, 43.0, 52.0, 88.0, 123.0, 205.0, 302.0, 503.0, 800.0, 1264.0, 2087.0, 3510.0, 5626.0, 9451.0, 15523.0, 25340.0, 40597.0, 62940.0, 92275.0, 124003.0, 146159.0, 145156.0, 121007.0, 89633.0, 60298.0, 38837.0, 24407.0, 14975.0, 8894.0, 5638.0, 3381.0, 2025.0, 1204.0, 826.0, 498.0, 310.0, 187.0, 128.0, 79.0, 43.0, 33.0, 27.0, 7.0, 6.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.515625, -13.064453125, -12.61328125, -12.162109375, -11.7109375, -11.259765625, -10.80859375, -10.357421875, -9.90625, -9.455078125, -9.00390625, -8.552734375, -8.1015625, -7.650390625, -7.19921875, -6.748046875, -6.296875, -5.845703125, -5.39453125, -4.943359375, -4.4921875, -4.041015625, -3.58984375, -3.138671875, -2.6875, -2.236328125, -1.78515625, -1.333984375, -0.8828125, -0.431640625, 0.01953125, 0.470703125, 0.921875, 1.373046875, 1.82421875, 2.275390625, 2.7265625, 3.177734375, 3.62890625, 4.080078125, 4.53125, 4.982421875, 5.43359375, 5.884765625, 6.3359375, 6.787109375, 7.23828125, 7.689453125, 8.140625, 8.591796875, 9.04296875, 9.494140625, 9.9453125, 10.396484375, 10.84765625, 11.298828125, 11.75, 12.201171875, 12.65234375, 13.103515625, 13.5546875, 14.005859375, 14.45703125, 14.908203125, 15.359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 15.0, 10.0, 18.0, 16.0, 15.0, 18.0, 22.0, 29.0, 33.0, 16.0, 40.0, 41.0, 30.0, 34.0, 36.0, 37.0, 45.0, 41.0, 41.0, 39.0, 49.0, 39.0, 39.0, 39.0, 37.0, 29.0, 32.0, 20.0, 26.0, 18.0, 19.0, 9.0, 10.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.8173828125, -8.525390625, -8.2333984375, -7.94140625, -7.6494140625, -7.357421875, -7.0654296875, -6.7734375, -6.4814453125, -6.189453125, -5.8974609375, -5.60546875, -5.3134765625, -5.021484375, -4.7294921875, -4.4375, -4.1455078125, -3.853515625, -3.5615234375, -3.26953125, -2.9775390625, -2.685546875, -2.3935546875, -2.1015625, -1.8095703125, -1.517578125, -1.2255859375, -0.93359375, -0.6416015625, -0.349609375, -0.0576171875, 0.234375, 0.5263671875, 0.818359375, 1.1103515625, 1.40234375, 1.6943359375, 1.986328125, 2.2783203125, 2.5703125, 2.8623046875, 3.154296875, 3.4462890625, 3.73828125, 4.0302734375, 4.322265625, 4.6142578125, 4.90625, 5.1982421875, 5.490234375, 5.7822265625, 6.07421875, 6.3662109375, 6.658203125, 6.9501953125, 7.2421875, 7.5341796875, 7.826171875, 8.1181640625, 8.41015625, 8.7021484375, 8.994140625, 9.2861328125, 9.578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 12.0, 11.0, 19.0, 37.0, 54.0, 57.0, 109.0, 165.0, 291.0, 478.0, 902.0, 1643.0, 2913.0, 5765.0, 11628.0, 24338.0, 51876.0, 107984.0, 199469.0, 254920.0, 190259.0, 101953.0, 48566.0, 22503.0, 10823.0, 5396.0, 2775.0, 1572.0, 850.0, 466.0, 283.0, 172.0, 100.0, 54.0, 45.0, 27.0, 20.0, 11.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.1875, -14.7335205078125, -14.279541015625, -13.8255615234375, -13.37158203125, -12.9176025390625, -12.463623046875, -12.0096435546875, -11.5556640625, -11.1016845703125, -10.647705078125, -10.1937255859375, -9.73974609375, -9.2857666015625, -8.831787109375, -8.3778076171875, -7.923828125, -7.4698486328125, -7.015869140625, -6.5618896484375, -6.10791015625, -5.6539306640625, -5.199951171875, -4.7459716796875, -4.2919921875, -3.8380126953125, -3.384033203125, -2.9300537109375, -2.47607421875, -2.0220947265625, -1.568115234375, -1.1141357421875, -0.66015625, -0.2061767578125, 0.247802734375, 0.7017822265625, 1.15576171875, 1.6097412109375, 2.063720703125, 2.5177001953125, 2.9716796875, 3.4256591796875, 3.879638671875, 4.3336181640625, 4.78759765625, 5.2415771484375, 5.695556640625, 6.1495361328125, 6.603515625, 7.0574951171875, 7.511474609375, 7.9654541015625, 8.41943359375, 8.8734130859375, 9.327392578125, 9.7813720703125, 10.2353515625, 10.6893310546875, 11.143310546875, 11.5972900390625, 12.05126953125, 12.5052490234375, 12.959228515625, 13.4132080078125, 13.8671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 12.0, 7.0, 11.0, 25.0, 31.0, 37.0, 45.0, 40.0, 69.0, 69.0, 78.0, 82.0, 72.0, 83.0, 61.0, 57.0, 37.0, 32.0, 27.0, 27.0, 15.0, 10.0, 15.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015783309936523438, -0.0015366077423095703, -0.0014948844909667969, -0.0014531612396240234, -0.00141143798828125, -0.0013697147369384766, -0.0013279914855957031, -0.0012862682342529297, -0.0012445449829101562, -0.0012028217315673828, -0.0011610984802246094, -0.001119375228881836, -0.0010776519775390625, -0.001035928726196289, -0.0009942054748535156, -0.0009524822235107422, -0.0009107589721679688, -0.0008690357208251953, -0.0008273124694824219, -0.0007855892181396484, -0.000743865966796875, -0.0007021427154541016, -0.0006604194641113281, -0.0006186962127685547, -0.0005769729614257812, -0.0005352497100830078, -0.0004935264587402344, -0.00045180320739746094, -0.0004100799560546875, -0.00036835670471191406, -0.0003266334533691406, -0.0002849102020263672, -0.00024318695068359375, -0.0002014636993408203, -0.00015974044799804688, -0.00011801719665527344, -7.62939453125e-05, -3.457069396972656e-05, 7.152557373046875e-06, 4.887580871582031e-05, 9.059906005859375e-05, 0.0001323223114013672, 0.00017404556274414062, 0.00021576881408691406, 0.0002574920654296875, 0.00029921531677246094, 0.0003409385681152344, 0.0003826618194580078, 0.00042438507080078125, 0.0004661083221435547, 0.0005078315734863281, 0.0005495548248291016, 0.000591278076171875, 0.0006330013275146484, 0.0006747245788574219, 0.0007164478302001953, 0.0007581710815429688, 0.0007998943328857422, 0.0008416175842285156, 0.0008833408355712891, 0.0009250640869140625, 0.0009667873382568359, 0.0010085105895996094, 0.0010502338409423828, 0.0010919570922851562]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 4.0, 9.0, 16.0, 17.0, 25.0, 33.0, 61.0, 85.0, 128.0, 211.0, 284.0, 430.0, 688.0, 1051.0, 1741.0, 2922.0, 4852.0, 8167.0, 13799.0, 23679.0, 39870.0, 65667.0, 102419.0, 142858.0, 167724.0, 156435.0, 118234.0, 78251.0, 47995.0, 28806.0, 16846.0, 10083.0, 5976.0, 3456.0, 2083.0, 1318.0, 800.0, 512.0, 342.0, 202.0, 158.0, 92.0, 78.0, 40.0, 33.0, 22.0, 7.0, 11.0, 8.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8446044921875, -8.556396484375, -8.2681884765625, -7.97998046875, -7.6917724609375, -7.403564453125, -7.1153564453125, -6.8271484375, -6.5389404296875, -6.250732421875, -5.9625244140625, -5.67431640625, -5.3861083984375, -5.097900390625, -4.8096923828125, -4.521484375, -4.2332763671875, -3.945068359375, -3.6568603515625, -3.36865234375, -3.0804443359375, -2.792236328125, -2.5040283203125, -2.2158203125, -1.9276123046875, -1.639404296875, -1.3511962890625, -1.06298828125, -0.7747802734375, -0.486572265625, -0.1983642578125, 0.08984375, 0.3780517578125, 0.666259765625, 0.9544677734375, 1.24267578125, 1.5308837890625, 1.819091796875, 2.1072998046875, 2.3955078125, 2.6837158203125, 2.971923828125, 3.2601318359375, 3.54833984375, 3.8365478515625, 4.124755859375, 4.4129638671875, 4.701171875, 4.9893798828125, 5.277587890625, 5.5657958984375, 5.85400390625, 6.1422119140625, 6.430419921875, 6.7186279296875, 7.0068359375, 7.2950439453125, 7.583251953125, 7.8714599609375, 8.15966796875, 8.4478759765625, 8.736083984375, 9.0242919921875, 9.3125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 14.0, 10.0, 24.0, 29.0, 41.0, 42.0, 53.0, 67.0, 78.0, 88.0, 76.0, 73.0, 78.0, 65.0, 62.0, 56.0, 37.0, 27.0, 17.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.5491943359375, -4.395263671875, -4.2413330078125, -4.08740234375, -3.9334716796875, -3.779541015625, -3.6256103515625, -3.4716796875, -3.3177490234375, -3.163818359375, -3.0098876953125, -2.85595703125, -2.7020263671875, -2.548095703125, -2.3941650390625, -2.240234375, -2.0863037109375, -1.932373046875, -1.7784423828125, -1.62451171875, -1.4705810546875, -1.316650390625, -1.1627197265625, -1.0087890625, -0.8548583984375, -0.700927734375, -0.5469970703125, -0.39306640625, -0.2391357421875, -0.085205078125, 0.0687255859375, 0.22265625, 0.3765869140625, 0.530517578125, 0.6844482421875, 0.83837890625, 0.9923095703125, 1.146240234375, 1.3001708984375, 1.4541015625, 1.6080322265625, 1.761962890625, 1.9158935546875, 2.06982421875, 2.2237548828125, 2.377685546875, 2.5316162109375, 2.685546875, 2.8394775390625, 2.993408203125, 3.1473388671875, 3.30126953125, 3.4552001953125, 3.609130859375, 3.7630615234375, 3.9169921875, 4.0709228515625, 4.224853515625, 4.3787841796875, 4.53271484375, 4.6866455078125, 4.840576171875, 4.9945068359375, 5.1484375]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 10.0, 18.0, 23.0, 26.0, 40.0, 34.0, 41.0, 56.0, 60.0, 79.0, 94.0, 75.0, 80.0, 47.0, 49.0, 49.0, 49.0, 37.0, 21.0, 25.0, 18.0, 13.0, 11.0, 8.0, 8.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.850130081176758, -27.93405532836914, -27.017980575561523, -26.101905822753906, -25.18583106994629, -24.269756317138672, -23.353683471679688, -22.437606811523438, -21.521533966064453, -20.605459213256836, -19.68938446044922, -18.7733097076416, -17.857234954833984, -16.941160202026367, -16.02508544921875, -15.10901165008545, -14.192935943603516, -13.276861190795898, -12.360786437988281, -11.444711685180664, -10.528636932373047, -9.61256217956543, -8.696488380432129, -7.780413627624512, -6.8643388748168945, -5.948264122009277, -5.03218936920166, -4.116115093231201, -3.200040340423584, -2.283965587615967, -1.3678913116455078, -0.4518165588378906, 0.4642601013183594, 1.380334734916687, 2.2964093685150146, 3.2124838829040527, 4.12855863571167, 5.044633388519287, 5.960707664489746, 6.876782417297363, 7.7928571701049805, 8.708931922912598, 9.625006675720215, 10.541080474853516, 11.457155227661133, 12.37322998046875, 13.289304733276367, 14.205379486083984, 15.121454238891602, 16.03752899169922, 16.953603744506836, 17.869678497314453, 18.78575325012207, 19.701828002929688, 20.617900848388672, 21.533977508544922, 22.450050354003906, 23.366125106811523, 24.28219985961914, 25.198274612426758, 26.114349365234375, 27.030424118041992, 27.94649887084961, 28.862571716308594, 29.778648376464844]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 6.0, 8.0, 14.0, 11.0, 13.0, 25.0, 23.0, 25.0, 19.0, 35.0, 30.0, 29.0, 37.0, 40.0, 52.0, 42.0, 51.0, 45.0, 46.0, 38.0, 47.0, 34.0, 44.0, 49.0, 27.0, 31.0, 27.0, 26.0, 25.0, 11.0, 16.0, 15.0, 10.0, 9.0, 6.0, 9.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.063613891601562, -15.586197853088379, -15.108782768249512, -14.631366729736328, -14.153950691223145, -13.676534652709961, -13.199119567871094, -12.72170352935791, -12.244287490844727, -11.766871452331543, -11.289456367492676, -10.812040328979492, -10.334624290466309, -9.857208251953125, -9.379793167114258, -8.902377128601074, -8.42496109008789, -7.947545528411865, -7.470129489898682, -6.992713928222656, -6.515297889709473, -6.037882328033447, -5.560466766357422, -5.083050727844238, -4.605635643005371, -4.128220081329346, -3.650804042816162, -3.1733884811401367, -2.695972442626953, -2.2185568809509277, -1.7411410808563232, -1.2637252807617188, -0.7863092422485352, -0.30889347195625305, 0.16852229833602905, 0.6459380388259888, 1.1233538389205933, 1.6007695198059082, 2.0781853199005127, 2.555601119995117, 3.0330169200897217, 3.510432720184326, 3.9878485202789307, 4.465264320373535, 4.9426798820495605, 5.420095443725586, 5.8975114822387695, 6.374927520751953, 6.8523430824279785, 7.329758644104004, 7.8071746826171875, 8.284590721130371, 8.762005805969238, 9.239421844482422, 9.716837882995605, 10.194253921508789, 10.671669006347656, 11.14908504486084, 11.626500129699707, 12.10391616821289, 12.581332206726074, 13.058748245239258, 13.536163330078125, 14.013579368591309, 14.490995407104492]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 7.0, 4.0, 4.0, 10.0, 11.0, 22.0, 30.0, 41.0, 58.0, 84.0, 136.0, 178.0, 305.0, 460.0, 797.0, 1301.0, 2123.0, 3553.0, 6592.0, 12129.0, 22876.0, 45786.0, 96648.0, 215759.0, 501709.0, 1000826.0, 1121214.0, 640720.0, 278849.0, 122940.0, 57372.0, 28396.0, 14436.0, 7876.0, 4346.0, 2548.0, 1534.0, 897.0, 587.0, 373.0, 243.0, 185.0, 115.0, 64.0, 52.0, 31.0, 17.0, 20.0, 4.0, 10.0, 2.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -19.072509765625, -18.39501953125, -17.717529296875, -17.0400390625, -16.362548828125, -15.68505859375, -15.007568359375, -14.330078125, -13.652587890625, -12.97509765625, -12.297607421875, -11.6201171875, -10.942626953125, -10.26513671875, -9.587646484375, -8.91015625, -8.232666015625, -7.55517578125, -6.877685546875, -6.2001953125, -5.522705078125, -4.84521484375, -4.167724609375, -3.490234375, -2.812744140625, -2.13525390625, -1.457763671875, -0.7802734375, -0.102783203125, 0.57470703125, 1.252197265625, 1.9296875, 2.607177734375, 3.28466796875, 3.962158203125, 4.6396484375, 5.317138671875, 5.99462890625, 6.672119140625, 7.349609375, 8.027099609375, 8.70458984375, 9.382080078125, 10.0595703125, 10.737060546875, 11.41455078125, 12.092041015625, 12.76953125, 13.447021484375, 14.12451171875, 14.802001953125, 15.4794921875, 16.156982421875, 16.83447265625, 17.511962890625, 18.189453125, 18.866943359375, 19.54443359375, 20.221923828125, 20.8994140625, 21.576904296875, 22.25439453125, 22.931884765625, 23.609375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 4.0, 9.0, 5.0, 7.0, 12.0, 15.0, 22.0, 20.0, 26.0, 24.0, 24.0, 30.0, 31.0, 28.0, 30.0, 45.0, 43.0, 41.0, 42.0, 40.0, 37.0, 44.0, 47.0, 39.0, 35.0, 29.0, 31.0, 30.0, 30.0, 31.0, 25.0, 16.0, 16.0, 16.0, 10.0, 11.0, 7.0, 10.0, 9.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.3125, -11.003173828125, -10.69384765625, -10.384521484375, -10.0751953125, -9.765869140625, -9.45654296875, -9.147216796875, -8.837890625, -8.528564453125, -8.21923828125, -7.909912109375, -7.6005859375, -7.291259765625, -6.98193359375, -6.672607421875, -6.36328125, -6.053955078125, -5.74462890625, -5.435302734375, -5.1259765625, -4.816650390625, -4.50732421875, -4.197998046875, -3.888671875, -3.579345703125, -3.27001953125, -2.960693359375, -2.6513671875, -2.342041015625, -2.03271484375, -1.723388671875, -1.4140625, -1.104736328125, -0.79541015625, -0.486083984375, -0.1767578125, 0.132568359375, 0.44189453125, 0.751220703125, 1.060546875, 1.369873046875, 1.67919921875, 1.988525390625, 2.2978515625, 2.607177734375, 2.91650390625, 3.225830078125, 3.53515625, 3.844482421875, 4.15380859375, 4.463134765625, 4.7724609375, 5.081787109375, 5.39111328125, 5.700439453125, 6.009765625, 6.319091796875, 6.62841796875, 6.937744140625, 7.2470703125, 7.556396484375, 7.86572265625, 8.175048828125, 8.484375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 10.0, 7.0, 12.0, 37.0, 31.0, 63.0, 82.0, 129.0, 230.0, 305.0, 533.0, 819.0, 1419.0, 2346.0, 4012.0, 7208.0, 13144.0, 25066.0, 49075.0, 97280.0, 198694.0, 403904.0, 759442.0, 1038040.0, 770654.0, 412691.0, 202435.0, 99913.0, 49822.0, 25820.0, 13598.0, 7268.0, 4167.0, 2378.0, 1389.0, 887.0, 492.0, 309.0, 196.0, 126.0, 86.0, 59.0, 37.0, 29.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.551025390625, -19.89892578125, -19.246826171875, -18.5947265625, -17.942626953125, -17.29052734375, -16.638427734375, -15.986328125, -15.334228515625, -14.68212890625, -14.030029296875, -13.3779296875, -12.725830078125, -12.07373046875, -11.421630859375, -10.76953125, -10.117431640625, -9.46533203125, -8.813232421875, -8.1611328125, -7.509033203125, -6.85693359375, -6.204833984375, -5.552734375, -4.900634765625, -4.24853515625, -3.596435546875, -2.9443359375, -2.292236328125, -1.64013671875, -0.988037109375, -0.3359375, 0.316162109375, 0.96826171875, 1.620361328125, 2.2724609375, 2.924560546875, 3.57666015625, 4.228759765625, 4.880859375, 5.532958984375, 6.18505859375, 6.837158203125, 7.4892578125, 8.141357421875, 8.79345703125, 9.445556640625, 10.09765625, 10.749755859375, 11.40185546875, 12.053955078125, 12.7060546875, 13.358154296875, 14.01025390625, 14.662353515625, 15.314453125, 15.966552734375, 16.61865234375, 17.270751953125, 17.9228515625, 18.574951171875, 19.22705078125, 19.879150390625, 20.53125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 4.0, 7.0, 9.0, 17.0, 24.0, 28.0, 31.0, 40.0, 62.0, 83.0, 110.0, 119.0, 157.0, 189.0, 231.0, 270.0, 283.0, 307.0, 290.0, 315.0, 272.0, 226.0, 188.0, 183.0, 127.0, 126.0, 76.0, 67.0, 56.0, 47.0, 30.0, 23.0, 23.0, 13.0, 22.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.7421875, -6.53192138671875, -6.3216552734375, -6.11138916015625, -5.901123046875, -5.69085693359375, -5.4805908203125, -5.27032470703125, -5.06005859375, -4.84979248046875, -4.6395263671875, -4.42926025390625, -4.218994140625, -4.00872802734375, -3.7984619140625, -3.58819580078125, -3.3779296875, -3.16766357421875, -2.9573974609375, -2.74713134765625, -2.536865234375, -2.32659912109375, -2.1163330078125, -1.90606689453125, -1.69580078125, -1.48553466796875, -1.2752685546875, -1.06500244140625, -0.854736328125, -0.64447021484375, -0.4342041015625, -0.22393798828125, -0.013671875, 0.19659423828125, 0.4068603515625, 0.61712646484375, 0.827392578125, 1.03765869140625, 1.2479248046875, 1.45819091796875, 1.66845703125, 1.87872314453125, 2.0889892578125, 2.29925537109375, 2.509521484375, 2.71978759765625, 2.9300537109375, 3.14031982421875, 3.3505859375, 3.56085205078125, 3.7711181640625, 3.98138427734375, 4.191650390625, 4.40191650390625, 4.6121826171875, 4.82244873046875, 5.03271484375, 5.24298095703125, 5.4532470703125, 5.66351318359375, 5.873779296875, 6.08404541015625, 6.2943115234375, 6.50457763671875, 6.71484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 4.0, 7.0, 9.0, 6.0, 31.0, 25.0, 33.0, 33.0, 39.0, 45.0, 38.0, 45.0, 56.0, 72.0, 48.0, 56.0, 53.0, 54.0, 38.0, 47.0, 37.0, 42.0, 28.0, 31.0, 16.0, 16.0, 15.0, 12.0, 6.0, 11.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.8176326751709, -19.158353805541992, -18.499074935913086, -17.839797973632812, -17.180519104003906, -16.521240234375, -15.861961364746094, -15.202682495117188, -14.543403625488281, -13.884124755859375, -13.224846839904785, -12.565567970275879, -11.906289100646973, -11.247011184692383, -10.587732315063477, -9.92845344543457, -9.26917552947998, -8.609896659851074, -7.950618267059326, -7.291339874267578, -6.632061004638672, -5.972782611846924, -5.313504219055176, -4.6542253494262695, -3.9949469566345215, -3.3356683254241943, -2.676389694213867, -2.017111301422119, -1.357832670211792, -0.6985540390014648, -0.0392756462097168, 0.6200032234191895, 1.2792816162109375, 1.9385602474212646, 2.597838878631592, 3.25711727142334, 3.916395902633667, 4.575674533843994, 5.234952926635742, 5.894231796264648, 6.5535101890563965, 7.2127885818481445, 7.872067451477051, 8.53134536743164, 9.190624237060547, 9.849903106689453, 10.50918197631836, 11.168460845947266, 11.827738761901855, 12.487017631530762, 13.146295547485352, 13.805574417114258, 14.464853286743164, 15.12413215637207, 15.78341007232666, 16.44268798828125, 17.101966857910156, 17.761245727539062, 18.42052459716797, 19.079803466796875, 19.73908042907715, 20.398359298706055, 21.05763816833496, 21.716917037963867, 22.376195907592773]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 10.0, 9.0, 9.0, 13.0, 24.0, 17.0, 25.0, 31.0, 27.0, 38.0, 39.0, 32.0, 40.0, 50.0, 44.0, 50.0, 53.0, 44.0, 47.0, 51.0, 39.0, 37.0, 46.0, 43.0, 37.0, 25.0, 22.0, 13.0, 19.0, 18.0, 10.0, 10.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.765066146850586, -14.335415840148926, -13.905765533447266, -13.476116180419922, -13.046465873718262, -12.616815567016602, -12.187166213989258, -11.757515907287598, -11.327865600585938, -10.898215293884277, -10.468564987182617, -10.038915634155273, -9.609265327453613, -9.179615020751953, -8.74996566772461, -8.32031536102295, -7.890665054321289, -7.461014747619629, -7.031364917755127, -6.601715087890625, -6.172064781188965, -5.742414474487305, -5.312764644622803, -4.883114814758301, -4.453464508056641, -4.0238142013549805, -3.5941643714904785, -3.1645143032073975, -2.7348642349243164, -2.3052141666412354, -1.8755640983581543, -1.4459140300750732, -1.0162630081176758, -0.5866129398345947, -0.15696287155151367, 0.2726871967315674, 0.7023372650146484, 1.1319873332977295, 1.5616374015808105, 1.9912874698638916, 2.4209375381469727, 2.8505876064300537, 3.2802376747131348, 3.709887742996216, 4.139537811279297, 4.569188117980957, 4.998837947845459, 5.428487777709961, 5.858138084411621, 6.287788391113281, 6.717438220977783, 7.147088050842285, 7.576738357543945, 8.006388664245605, 8.436038970947266, 8.86568832397461, 9.29533863067627, 9.72498893737793, 10.154638290405273, 10.584288597106934, 11.013938903808594, 11.443589210510254, 11.873239517211914, 12.302888870239258, 12.732539176940918]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 16.0, 10.0, 23.0, 43.0, 56.0, 80.0, 107.0, 202.0, 307.0, 489.0, 860.0, 1445.0, 2606.0, 4678.0, 8738.0, 16421.0, 31892.0, 59183.0, 106245.0, 167913.0, 205160.0, 179278.0, 118160.0, 67541.0, 35649.0, 18966.0, 9910.0, 5389.0, 2977.0, 1691.0, 946.0, 580.0, 358.0, 201.0, 140.0, 94.0, 58.0, 42.0, 29.0, 20.0, 13.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.6875, -13.240234375, -12.79296875, -12.345703125, -11.8984375, -11.451171875, -11.00390625, -10.556640625, -10.109375, -9.662109375, -9.21484375, -8.767578125, -8.3203125, -7.873046875, -7.42578125, -6.978515625, -6.53125, -6.083984375, -5.63671875, -5.189453125, -4.7421875, -4.294921875, -3.84765625, -3.400390625, -2.953125, -2.505859375, -2.05859375, -1.611328125, -1.1640625, -0.716796875, -0.26953125, 0.177734375, 0.625, 1.072265625, 1.51953125, 1.966796875, 2.4140625, 2.861328125, 3.30859375, 3.755859375, 4.203125, 4.650390625, 5.09765625, 5.544921875, 5.9921875, 6.439453125, 6.88671875, 7.333984375, 7.78125, 8.228515625, 8.67578125, 9.123046875, 9.5703125, 10.017578125, 10.46484375, 10.912109375, 11.359375, 11.806640625, 12.25390625, 12.701171875, 13.1484375, 13.595703125, 14.04296875, 14.490234375, 14.9375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 9.0, 9.0, 9.0, 9.0, 10.0, 19.0, 19.0, 24.0, 29.0, 37.0, 26.0, 40.0, 41.0, 50.0, 36.0, 50.0, 61.0, 47.0, 56.0, 49.0, 51.0, 49.0, 43.0, 37.0, 43.0, 21.0, 32.0, 15.0, 20.0, 11.0, 11.0, 7.0, 6.0, 10.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.3125, -15.835205078125, -15.35791015625, -14.880615234375, -14.4033203125, -13.926025390625, -13.44873046875, -12.971435546875, -12.494140625, -12.016845703125, -11.53955078125, -11.062255859375, -10.5849609375, -10.107666015625, -9.63037109375, -9.153076171875, -8.67578125, -8.198486328125, -7.72119140625, -7.243896484375, -6.7666015625, -6.289306640625, -5.81201171875, -5.334716796875, -4.857421875, -4.380126953125, -3.90283203125, -3.425537109375, -2.9482421875, -2.470947265625, -1.99365234375, -1.516357421875, -1.0390625, -0.561767578125, -0.08447265625, 0.392822265625, 0.8701171875, 1.347412109375, 1.82470703125, 2.302001953125, 2.779296875, 3.256591796875, 3.73388671875, 4.211181640625, 4.6884765625, 5.165771484375, 5.64306640625, 6.120361328125, 6.59765625, 7.074951171875, 7.55224609375, 8.029541015625, 8.5068359375, 8.984130859375, 9.46142578125, 9.938720703125, 10.416015625, 10.893310546875, 11.37060546875, 11.847900390625, 12.3251953125, 12.802490234375, 13.27978515625, 13.757080078125, 14.234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 10.0, 17.0, 17.0, 20.0, 28.0, 49.0, 70.0, 111.0, 120.0, 200.0, 309.0, 519.0, 837.0, 1475.0, 2773.0, 5725.0, 12010.0, 27608.0, 64747.0, 148930.0, 282196.0, 265796.0, 132195.0, 56813.0, 24288.0, 10680.0, 4986.0, 2560.0, 1391.0, 753.0, 462.0, 280.0, 175.0, 116.0, 87.0, 63.0, 45.0, 23.0, 14.0, 21.0, 12.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.796875, -23.095458984375, -22.39404296875, -21.692626953125, -20.9912109375, -20.289794921875, -19.58837890625, -18.886962890625, -18.185546875, -17.484130859375, -16.78271484375, -16.081298828125, -15.3798828125, -14.678466796875, -13.97705078125, -13.275634765625, -12.57421875, -11.872802734375, -11.17138671875, -10.469970703125, -9.7685546875, -9.067138671875, -8.36572265625, -7.664306640625, -6.962890625, -6.261474609375, -5.56005859375, -4.858642578125, -4.1572265625, -3.455810546875, -2.75439453125, -2.052978515625, -1.3515625, -0.650146484375, 0.05126953125, 0.752685546875, 1.4541015625, 2.155517578125, 2.85693359375, 3.558349609375, 4.259765625, 4.961181640625, 5.66259765625, 6.364013671875, 7.0654296875, 7.766845703125, 8.46826171875, 9.169677734375, 9.87109375, 10.572509765625, 11.27392578125, 11.975341796875, 12.6767578125, 13.378173828125, 14.07958984375, 14.781005859375, 15.482421875, 16.183837890625, 16.88525390625, 17.586669921875, 18.2880859375, 18.989501953125, 19.69091796875, 20.392333984375, 21.09375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 7.0, 6.0, 9.0, 16.0, 11.0, 12.0, 22.0, 20.0, 32.0, 31.0, 33.0, 34.0, 32.0, 43.0, 39.0, 43.0, 54.0, 37.0, 40.0, 29.0, 46.0, 39.0, 34.0, 47.0, 33.0, 39.0, 32.0, 32.0, 19.0, 23.0, 15.0, 13.0, 15.0, 14.0, 12.0, 5.0, 8.0, 7.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.59375, -7.348388671875, -7.10302734375, -6.857666015625, -6.6123046875, -6.366943359375, -6.12158203125, -5.876220703125, -5.630859375, -5.385498046875, -5.14013671875, -4.894775390625, -4.6494140625, -4.404052734375, -4.15869140625, -3.913330078125, -3.66796875, -3.422607421875, -3.17724609375, -2.931884765625, -2.6865234375, -2.441162109375, -2.19580078125, -1.950439453125, -1.705078125, -1.459716796875, -1.21435546875, -0.968994140625, -0.7236328125, -0.478271484375, -0.23291015625, 0.012451171875, 0.2578125, 0.503173828125, 0.74853515625, 0.993896484375, 1.2392578125, 1.484619140625, 1.72998046875, 1.975341796875, 2.220703125, 2.466064453125, 2.71142578125, 2.956787109375, 3.2021484375, 3.447509765625, 3.69287109375, 3.938232421875, 4.18359375, 4.428955078125, 4.67431640625, 4.919677734375, 5.1650390625, 5.410400390625, 5.65576171875, 5.901123046875, 6.146484375, 6.391845703125, 6.63720703125, 6.882568359375, 7.1279296875, 7.373291015625, 7.61865234375, 7.864013671875, 8.109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 22.0, 25.0, 32.0, 63.0, 103.0, 143.0, 214.0, 279.0, 469.0, 742.0, 1140.0, 1861.0, 3040.0, 5050.0, 8580.0, 14966.0, 27423.0, 50385.0, 94088.0, 166886.0, 233633.0, 190601.0, 111753.0, 60696.0, 32906.0, 17959.0, 10080.0, 5884.0, 3526.0, 2117.0, 1414.0, 862.0, 534.0, 368.0, 234.0, 154.0, 114.0, 59.0, 44.0, 26.0, 27.0, 8.0, 20.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.34136962890625, -7.0850830078125, -6.82879638671875, -6.572509765625, -6.31622314453125, -6.0599365234375, -5.80364990234375, -5.54736328125, -5.29107666015625, -5.0347900390625, -4.77850341796875, -4.522216796875, -4.26593017578125, -4.0096435546875, -3.75335693359375, -3.4970703125, -3.24078369140625, -2.9844970703125, -2.72821044921875, -2.471923828125, -2.21563720703125, -1.9593505859375, -1.70306396484375, -1.44677734375, -1.19049072265625, -0.9342041015625, -0.67791748046875, -0.421630859375, -0.16534423828125, 0.0909423828125, 0.34722900390625, 0.603515625, 0.85980224609375, 1.1160888671875, 1.37237548828125, 1.628662109375, 1.88494873046875, 2.1412353515625, 2.39752197265625, 2.65380859375, 2.91009521484375, 3.1663818359375, 3.42266845703125, 3.678955078125, 3.93524169921875, 4.1915283203125, 4.44781494140625, 4.7041015625, 4.96038818359375, 5.2166748046875, 5.47296142578125, 5.729248046875, 5.98553466796875, 6.2418212890625, 6.49810791015625, 6.75439453125, 7.01068115234375, 7.2669677734375, 7.52325439453125, 7.779541015625, 8.03582763671875, 8.2921142578125, 8.54840087890625, 8.8046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 2.0, 9.0, 5.0, 8.0, 10.0, 12.0, 12.0, 23.0, 22.0, 31.0, 41.0, 49.0, 62.0, 80.0, 91.0, 85.0, 96.0, 74.0, 65.0, 48.0, 41.0, 34.0, 20.0, 24.0, 13.0, 10.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048279762268066406, -0.00046736374497413635, -0.00045192986726760864, -0.00043649598956108093, -0.0004210621118545532, -0.0004056282341480255, -0.0003901943564414978, -0.0003747604787349701, -0.0003593266010284424, -0.00034389272332191467, -0.00032845884561538696, -0.00031302496790885925, -0.00029759109020233154, -0.00028215721249580383, -0.0002667233347892761, -0.0002512894570827484, -0.0002358555793762207, -0.000220421701669693, -0.00020498782396316528, -0.00018955394625663757, -0.00017412006855010986, -0.00015868619084358215, -0.00014325231313705444, -0.00012781843543052673, -0.00011238455772399902, -9.695068001747131e-05, -8.15168023109436e-05, -6.60829246044159e-05, -5.0649046897888184e-05, -3.5215169191360474e-05, -1.9781291484832764e-05, -4.347413778305054e-06, 1.1086463928222656e-05, 2.6520341634750366e-05, 4.1954219341278076e-05, 5.7388097047805786e-05, 7.28219747543335e-05, 8.82558524608612e-05, 0.00010368973016738892, 0.00011912360787391663, 0.00013455748558044434, 0.00014999136328697205, 0.00016542524099349976, 0.00018085911870002747, 0.00019629299640655518, 0.00021172687411308289, 0.0002271607518196106, 0.0002425946295261383, 0.000258028507232666, 0.0002734623849391937, 0.00028889626264572144, 0.00030433014035224915, 0.00031976401805877686, 0.00033519789576530457, 0.0003506317734718323, 0.00036606565117836, 0.0003814995288848877, 0.0003969334065914154, 0.0004123672842979431, 0.0004278011620044708, 0.00044323503971099854, 0.00045866891741752625, 0.00047410279512405396, 0.0004895366728305817, 0.0005049705505371094]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 10.0, 17.0, 22.0, 26.0, 24.0, 52.0, 78.0, 101.0, 143.0, 212.0, 326.0, 494.0, 795.0, 1240.0, 1974.0, 3337.0, 5595.0, 8871.0, 15128.0, 25301.0, 42102.0, 68101.0, 104243.0, 144099.0, 165275.0, 152108.0, 113730.0, 76015.0, 47455.0, 28386.0, 17089.0, 10076.0, 6109.0, 3594.0, 2316.0, 1395.0, 898.0, 599.0, 391.0, 240.0, 189.0, 120.0, 87.0, 50.0, 37.0, 24.0, 24.0, 15.0, 16.0, 10.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.671875, -5.49249267578125, -5.3131103515625, -5.13372802734375, -4.954345703125, -4.77496337890625, -4.5955810546875, -4.41619873046875, -4.23681640625, -4.05743408203125, -3.8780517578125, -3.69866943359375, -3.519287109375, -3.33990478515625, -3.1605224609375, -2.98114013671875, -2.8017578125, -2.62237548828125, -2.4429931640625, -2.26361083984375, -2.084228515625, -1.90484619140625, -1.7254638671875, -1.54608154296875, -1.36669921875, -1.18731689453125, -1.0079345703125, -0.82855224609375, -0.649169921875, -0.46978759765625, -0.2904052734375, -0.11102294921875, 0.068359375, 0.24774169921875, 0.4271240234375, 0.60650634765625, 0.785888671875, 0.96527099609375, 1.1446533203125, 1.32403564453125, 1.50341796875, 1.68280029296875, 1.8621826171875, 2.04156494140625, 2.220947265625, 2.40032958984375, 2.5797119140625, 2.75909423828125, 2.9384765625, 3.11785888671875, 3.2972412109375, 3.47662353515625, 3.656005859375, 3.83538818359375, 4.0147705078125, 4.19415283203125, 4.37353515625, 4.55291748046875, 4.7322998046875, 4.91168212890625, 5.091064453125, 5.27044677734375, 5.4498291015625, 5.62921142578125, 5.80859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 1.0, 5.0, 8.0, 5.0, 6.0, 14.0, 6.0, 11.0, 25.0, 21.0, 19.0, 22.0, 35.0, 44.0, 30.0, 40.0, 45.0, 45.0, 41.0, 47.0, 51.0, 37.0, 54.0, 48.0, 45.0, 40.0, 39.0, 34.0, 30.0, 25.0, 21.0, 11.0, 23.0, 13.0, 8.0, 7.0, 7.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6396484375, -1.592010498046875, -1.54437255859375, -1.496734619140625, -1.4490966796875, -1.401458740234375, -1.35382080078125, -1.306182861328125, -1.258544921875, -1.210906982421875, -1.16326904296875, -1.115631103515625, -1.0679931640625, -1.020355224609375, -0.97271728515625, -0.925079345703125, -0.87744140625, -0.829803466796875, -0.78216552734375, -0.734527587890625, -0.6868896484375, -0.639251708984375, -0.59161376953125, -0.543975830078125, -0.496337890625, -0.448699951171875, -0.40106201171875, -0.353424072265625, -0.3057861328125, -0.258148193359375, -0.21051025390625, -0.162872314453125, -0.115234375, -0.067596435546875, -0.01995849609375, 0.027679443359375, 0.0753173828125, 0.122955322265625, 0.17059326171875, 0.218231201171875, 0.265869140625, 0.313507080078125, 0.36114501953125, 0.408782958984375, 0.4564208984375, 0.504058837890625, 0.55169677734375, 0.599334716796875, 0.64697265625, 0.694610595703125, 0.74224853515625, 0.789886474609375, 0.8375244140625, 0.885162353515625, 0.93280029296875, 0.980438232421875, 1.028076171875, 1.075714111328125, 1.12335205078125, 1.170989990234375, 1.2186279296875, 1.266265869140625, 1.31390380859375, 1.361541748046875, 1.4091796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 7.0, 3.0, 4.0, 7.0, 12.0, 9.0, 12.0, 19.0, 21.0, 32.0, 34.0, 35.0, 39.0, 44.0, 62.0, 54.0, 54.0, 58.0, 58.0, 59.0, 43.0, 38.0, 46.0, 48.0, 30.0, 39.0, 21.0, 24.0, 17.0, 11.0, 14.0, 9.0, 6.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.617773056030273, -18.964508056640625, -18.311241149902344, -17.657976150512695, -17.004711151123047, -16.351444244384766, -15.698179244995117, -15.044913291931152, -14.391647338867188, -13.738381385803223, -13.085115432739258, -12.43185043334961, -11.778584480285645, -11.12531852722168, -10.472053527832031, -9.818787574768066, -9.165521621704102, -8.512255668640137, -7.85899019241333, -7.205724716186523, -6.552458763122559, -5.899192810058594, -5.245927333831787, -4.5926618576049805, -3.9393959045410156, -3.28613018989563, -2.632864475250244, -1.9795987606048584, -1.3263330459594727, -0.6730673313140869, -0.019801616668701172, 0.6334638595581055, 1.2867317199707031, 1.9399974346160889, 2.5932631492614746, 3.2465288639068604, 3.899794578552246, 4.553060531616211, 5.206326007843018, 5.859591484069824, 6.512857437133789, 7.166123390197754, 7.8193888664245605, 8.472654342651367, 9.125920295715332, 9.779186248779297, 10.432451248168945, 11.08571720123291, 11.738983154296875, 12.39224910736084, 13.045515060424805, 13.698780059814453, 14.352046012878418, 15.005311965942383, 15.658576965332031, 16.311843872070312, 16.96510887145996, 17.61837387084961, 18.27164077758789, 18.92490577697754, 19.578170776367188, 20.23143768310547, 20.884702682495117, 21.537967681884766, 22.191234588623047]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 10.0, 6.0, 12.0, 10.0, 12.0, 19.0, 29.0, 24.0, 27.0, 37.0, 42.0, 34.0, 37.0, 39.0, 49.0, 49.0, 50.0, 54.0, 51.0, 46.0, 40.0, 43.0, 40.0, 45.0, 39.0, 31.0, 25.0, 18.0, 13.0, 22.0, 8.0, 5.0, 14.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.852544784545898, -14.425804138183594, -13.999063491821289, -13.572322845458984, -13.145581245422363, -12.718840599060059, -12.292099952697754, -11.86535930633545, -11.438618659973145, -11.01187801361084, -10.585137367248535, -10.158395767211914, -9.73165512084961, -9.304914474487305, -8.878173828125, -8.451433181762695, -8.02469253540039, -7.597951889038086, -7.171210765838623, -6.744470119476318, -6.317729473114014, -5.890988349914551, -5.464247703552246, -5.037507057189941, -4.61076545715332, -4.184024810791016, -3.757283926010132, -3.330543041229248, -2.9038023948669434, -2.4770615100860596, -2.050320625305176, -1.623579978942871, -1.1968393325805664, -0.7700985670089722, -0.34335774183273315, 0.08338308334350586, 0.5101238489151001, 0.9368646144866943, 1.3636054992675781, 1.7903461456298828, 2.2170870304107666, 2.6438279151916504, 3.070568561553955, 3.497309446334839, 3.9240503311157227, 4.350790977478027, 4.777531623840332, 5.204272270202637, 5.6310133934021, 6.057754039764404, 6.484495162963867, 6.911235809326172, 7.337976455688477, 7.764717102050781, 8.191457748413086, 8.61819839477539, 9.044939994812012, 9.471680641174316, 9.898421287536621, 10.325162887573242, 10.751903533935547, 11.178644180297852, 11.605384826660156, 12.032125473022461, 12.458866119384766]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 11.0, 6.0, 14.0, 21.0, 22.0, 42.0, 38.0, 61.0, 113.0, 123.0, 156.0, 248.0, 399.0, 626.0, 946.0, 1732.0, 2895.0, 5159.0, 9289.0, 17290.0, 31734.0, 56799.0, 96975.0, 147487.0, 182704.0, 175094.0, 131211.0, 82357.0, 46890.0, 25607.0, 14271.0, 7652.0, 4170.0, 2471.0, 1436.0, 862.0, 561.0, 352.0, 219.0, 146.0, 116.0, 73.0, 44.0, 33.0, 33.0, 17.0, 16.0, 11.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.703125, -16.178466796875, -15.65380859375, -15.129150390625, -14.6044921875, -14.079833984375, -13.55517578125, -13.030517578125, -12.505859375, -11.981201171875, -11.45654296875, -10.931884765625, -10.4072265625, -9.882568359375, -9.35791015625, -8.833251953125, -8.30859375, -7.783935546875, -7.25927734375, -6.734619140625, -6.2099609375, -5.685302734375, -5.16064453125, -4.635986328125, -4.111328125, -3.586669921875, -3.06201171875, -2.537353515625, -2.0126953125, -1.488037109375, -0.96337890625, -0.438720703125, 0.0859375, 0.610595703125, 1.13525390625, 1.659912109375, 2.1845703125, 2.709228515625, 3.23388671875, 3.758544921875, 4.283203125, 4.807861328125, 5.33251953125, 5.857177734375, 6.3818359375, 6.906494140625, 7.43115234375, 7.955810546875, 8.48046875, 9.005126953125, 9.52978515625, 10.054443359375, 10.5791015625, 11.103759765625, 11.62841796875, 12.153076171875, 12.677734375, 13.202392578125, 13.72705078125, 14.251708984375, 14.7763671875, 15.301025390625, 15.82568359375, 16.350341796875, 16.875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 9.0, 7.0, 13.0, 23.0, 23.0, 33.0, 35.0, 46.0, 64.0, 46.0, 40.0, 49.0, 49.0, 63.0, 48.0, 52.0, 60.0, 59.0, 37.0, 32.0, 36.0, 32.0, 28.0, 17.0, 12.0, 9.0, 13.0, 13.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.296875, -14.80712890625, -14.3173828125, -13.82763671875, -13.337890625, -12.84814453125, -12.3583984375, -11.86865234375, -11.37890625, -10.88916015625, -10.3994140625, -9.90966796875, -9.419921875, -8.93017578125, -8.4404296875, -7.95068359375, -7.4609375, -6.97119140625, -6.4814453125, -5.99169921875, -5.501953125, -5.01220703125, -4.5224609375, -4.03271484375, -3.54296875, -3.05322265625, -2.5634765625, -2.07373046875, -1.583984375, -1.09423828125, -0.6044921875, -0.11474609375, 0.375, 0.86474609375, 1.3544921875, 1.84423828125, 2.333984375, 2.82373046875, 3.3134765625, 3.80322265625, 4.29296875, 4.78271484375, 5.2724609375, 5.76220703125, 6.251953125, 6.74169921875, 7.2314453125, 7.72119140625, 8.2109375, 8.70068359375, 9.1904296875, 9.68017578125, 10.169921875, 10.65966796875, 11.1494140625, 11.63916015625, 12.12890625, 12.61865234375, 13.1083984375, 13.59814453125, 14.087890625, 14.57763671875, 15.0673828125, 15.55712890625, 16.046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 16.0, 19.0, 36.0, 44.0, 78.0, 108.0, 142.0, 250.0, 398.0, 697.0, 1073.0, 1875.0, 3167.0, 5568.0, 9994.0, 17554.0, 30909.0, 53229.0, 85670.0, 126711.0, 159577.0, 165628.0, 138669.0, 98334.0, 62301.0, 37481.0, 21139.0, 11958.0, 6654.0, 3865.0, 2167.0, 1278.0, 756.0, 475.0, 269.0, 148.0, 113.0, 72.0, 50.0, 33.0, 16.0, 10.0, 10.0, 6.0, 6.0, 2.0, 1.0, 0.0, 4.0], "bins": [-15.5859375, -15.1549072265625, -14.723876953125, -14.2928466796875, -13.86181640625, -13.4307861328125, -12.999755859375, -12.5687255859375, -12.1376953125, -11.7066650390625, -11.275634765625, -10.8446044921875, -10.41357421875, -9.9825439453125, -9.551513671875, -9.1204833984375, -8.689453125, -8.2584228515625, -7.827392578125, -7.3963623046875, -6.96533203125, -6.5343017578125, -6.103271484375, -5.6722412109375, -5.2412109375, -4.8101806640625, -4.379150390625, -3.9481201171875, -3.51708984375, -3.0860595703125, -2.655029296875, -2.2239990234375, -1.79296875, -1.3619384765625, -0.930908203125, -0.4998779296875, -0.06884765625, 0.3621826171875, 0.793212890625, 1.2242431640625, 1.6552734375, 2.0863037109375, 2.517333984375, 2.9483642578125, 3.37939453125, 3.8104248046875, 4.241455078125, 4.6724853515625, 5.103515625, 5.5345458984375, 5.965576171875, 6.3966064453125, 6.82763671875, 7.2586669921875, 7.689697265625, 8.1207275390625, 8.5517578125, 8.9827880859375, 9.413818359375, 9.8448486328125, 10.27587890625, 10.7069091796875, 11.137939453125, 11.5689697265625, 12.0]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 4.0, 6.0, 3.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 14.0, 25.0, 24.0, 21.0, 27.0, 27.0, 34.0, 30.0, 33.0, 48.0, 38.0, 43.0, 40.0, 32.0, 36.0, 41.0, 31.0, 33.0, 32.0, 34.0, 31.0, 25.0, 36.0, 26.0, 27.0, 27.0, 22.0, 18.0, 11.0, 11.0, 13.0, 7.0, 8.0, 4.0, 7.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.875, -6.6630859375, -6.451171875, -6.2392578125, -6.02734375, -5.8154296875, -5.603515625, -5.3916015625, -5.1796875, -4.9677734375, -4.755859375, -4.5439453125, -4.33203125, -4.1201171875, -3.908203125, -3.6962890625, -3.484375, -3.2724609375, -3.060546875, -2.8486328125, -2.63671875, -2.4248046875, -2.212890625, -2.0009765625, -1.7890625, -1.5771484375, -1.365234375, -1.1533203125, -0.94140625, -0.7294921875, -0.517578125, -0.3056640625, -0.09375, 0.1181640625, 0.330078125, 0.5419921875, 0.75390625, 0.9658203125, 1.177734375, 1.3896484375, 1.6015625, 1.8134765625, 2.025390625, 2.2373046875, 2.44921875, 2.6611328125, 2.873046875, 3.0849609375, 3.296875, 3.5087890625, 3.720703125, 3.9326171875, 4.14453125, 4.3564453125, 4.568359375, 4.7802734375, 4.9921875, 5.2041015625, 5.416015625, 5.6279296875, 5.83984375, 6.0517578125, 6.263671875, 6.4755859375, 6.6875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 7.0, 6.0, 13.0, 13.0, 21.0, 37.0, 37.0, 72.0, 66.0, 98.0, 164.0, 223.0, 333.0, 512.0, 780.0, 1298.0, 2012.0, 3446.0, 6031.0, 10538.0, 19480.0, 35885.0, 65926.0, 113589.0, 171128.0, 199419.0, 167229.0, 109885.0, 62614.0, 34367.0, 18497.0, 10352.0, 5750.0, 3323.0, 1885.0, 1225.0, 738.0, 488.0, 319.0, 237.0, 159.0, 92.0, 84.0, 57.0, 29.0, 28.0, 16.0, 15.0, 14.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-9.046875, -8.7681884765625, -8.489501953125, -8.2108154296875, -7.93212890625, -7.6534423828125, -7.374755859375, -7.0960693359375, -6.8173828125, -6.5386962890625, -6.260009765625, -5.9813232421875, -5.70263671875, -5.4239501953125, -5.145263671875, -4.8665771484375, -4.587890625, -4.3092041015625, -4.030517578125, -3.7518310546875, -3.47314453125, -3.1944580078125, -2.915771484375, -2.6370849609375, -2.3583984375, -2.0797119140625, -1.801025390625, -1.5223388671875, -1.24365234375, -0.9649658203125, -0.686279296875, -0.4075927734375, -0.12890625, 0.1497802734375, 0.428466796875, 0.7071533203125, 0.98583984375, 1.2645263671875, 1.543212890625, 1.8218994140625, 2.1005859375, 2.3792724609375, 2.657958984375, 2.9366455078125, 3.21533203125, 3.4940185546875, 3.772705078125, 4.0513916015625, 4.330078125, 4.6087646484375, 4.887451171875, 5.1661376953125, 5.44482421875, 5.7235107421875, 6.002197265625, 6.2808837890625, 6.5595703125, 6.8382568359375, 7.116943359375, 7.3956298828125, 7.67431640625, 7.9530029296875, 8.231689453125, 8.5103759765625, 8.7890625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 9.0, 16.0, 8.0, 15.0, 18.0, 19.0, 25.0, 40.0, 32.0, 42.0, 63.0, 39.0, 48.0, 53.0, 60.0, 56.0, 67.0, 51.0, 46.0, 50.0, 36.0, 33.0, 26.0, 23.0, 27.0, 18.0, 20.0, 12.0, 9.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008192062377929688, -0.0007928088307380676, -0.0007664114236831665, -0.0007400140166282654, -0.0007136166095733643, -0.0006872192025184631, -0.000660821795463562, -0.0006344243884086609, -0.0006080269813537598, -0.0005816295742988586, -0.0005552321672439575, -0.0005288347601890564, -0.0005024373531341553, -0.00047603994607925415, -0.00044964253902435303, -0.0004232451319694519, -0.0003968477249145508, -0.00037045031785964966, -0.00034405291080474854, -0.0003176555037498474, -0.0002912580966949463, -0.00026486068964004517, -0.00023846328258514404, -0.00021206587553024292, -0.0001856684684753418, -0.00015927106142044067, -0.00013287365436553955, -0.00010647624731063843, -8.00788402557373e-05, -5.368143320083618e-05, -2.728402614593506e-05, -8.866190910339355e-07, 2.5510787963867188e-05, 5.190819501876831e-05, 7.830560207366943e-05, 0.00010470300912857056, 0.00013110041618347168, 0.0001574978232383728, 0.00018389523029327393, 0.00021029263734817505, 0.00023669004440307617, 0.0002630874514579773, 0.0002894848585128784, 0.00031588226556777954, 0.00034227967262268066, 0.0003686770796775818, 0.0003950744867324829, 0.00042147189378738403, 0.00044786930084228516, 0.0004742667078971863, 0.0005006641149520874, 0.0005270615220069885, 0.0005534589290618896, 0.0005798563361167908, 0.0006062537431716919, 0.000632651150226593, 0.0006590485572814941, 0.0006854459643363953, 0.0007118433713912964, 0.0007382407784461975, 0.0007646381855010986, 0.0007910355925559998, 0.0008174329996109009, 0.000843830406665802, 0.0008702278137207031]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 15.0, 24.0, 32.0, 34.0, 59.0, 95.0, 159.0, 231.0, 386.0, 602.0, 971.0, 1608.0, 2722.0, 4543.0, 7668.0, 13634.0, 23915.0, 41913.0, 72201.0, 117297.0, 164632.0, 182693.0, 154980.0, 106081.0, 64356.0, 37463.0, 21145.0, 12076.0, 6894.0, 3939.0, 2354.0, 1471.0, 842.0, 538.0, 342.0, 219.0, 143.0, 96.0, 62.0, 30.0, 26.0, 18.0, 8.0, 8.0, 6.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.03125, -7.775390625, -7.51953125, -7.263671875, -7.0078125, -6.751953125, -6.49609375, -6.240234375, -5.984375, -5.728515625, -5.47265625, -5.216796875, -4.9609375, -4.705078125, -4.44921875, -4.193359375, -3.9375, -3.681640625, -3.42578125, -3.169921875, -2.9140625, -2.658203125, -2.40234375, -2.146484375, -1.890625, -1.634765625, -1.37890625, -1.123046875, -0.8671875, -0.611328125, -0.35546875, -0.099609375, 0.15625, 0.412109375, 0.66796875, 0.923828125, 1.1796875, 1.435546875, 1.69140625, 1.947265625, 2.203125, 2.458984375, 2.71484375, 2.970703125, 3.2265625, 3.482421875, 3.73828125, 3.994140625, 4.25, 4.505859375, 4.76171875, 5.017578125, 5.2734375, 5.529296875, 5.78515625, 6.041015625, 6.296875, 6.552734375, 6.80859375, 7.064453125, 7.3203125, 7.576171875, 7.83203125, 8.087890625, 8.34375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 6.0, 15.0, 11.0, 14.0, 12.0, 17.0, 22.0, 27.0, 47.0, 35.0, 45.0, 53.0, 54.0, 55.0, 61.0, 75.0, 66.0, 49.0, 49.0, 40.0, 48.0, 29.0, 27.0, 25.0, 21.0, 13.0, 16.0, 12.0, 11.0, 3.0, 8.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.47100830078125, -2.3834228515625, -2.29583740234375, -2.208251953125, -2.12066650390625, -2.0330810546875, -1.94549560546875, -1.85791015625, -1.77032470703125, -1.6827392578125, -1.59515380859375, -1.507568359375, -1.41998291015625, -1.3323974609375, -1.24481201171875, -1.1572265625, -1.06964111328125, -0.9820556640625, -0.89447021484375, -0.806884765625, -0.71929931640625, -0.6317138671875, -0.54412841796875, -0.45654296875, -0.36895751953125, -0.2813720703125, -0.19378662109375, -0.106201171875, -0.01861572265625, 0.0689697265625, 0.15655517578125, 0.244140625, 0.33172607421875, 0.4193115234375, 0.50689697265625, 0.594482421875, 0.68206787109375, 0.7696533203125, 0.85723876953125, 0.94482421875, 1.03240966796875, 1.1199951171875, 1.20758056640625, 1.295166015625, 1.38275146484375, 1.4703369140625, 1.55792236328125, 1.6455078125, 1.73309326171875, 1.8206787109375, 1.90826416015625, 1.995849609375, 2.08343505859375, 2.1710205078125, 2.25860595703125, 2.34619140625, 2.43377685546875, 2.5213623046875, 2.60894775390625, 2.696533203125, 2.78411865234375, 2.8717041015625, 2.95928955078125, 3.046875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 9.0, 12.0, 18.0, 18.0, 22.0, 41.0, 37.0, 37.0, 54.0, 51.0, 82.0, 52.0, 77.0, 56.0, 68.0, 58.0, 50.0, 38.0, 37.0, 30.0, 27.0, 17.0, 19.0, 17.0, 11.0, 6.0, 8.0, 2.0, 12.0, 4.0, 0.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.460142135620117, -18.730737686157227, -18.001331329345703, -17.271926879882812, -16.542522430419922, -15.813116073608398, -15.083711624145508, -14.3543062210083, -13.624900817871094, -12.895495414733887, -12.16609001159668, -11.436685562133789, -10.707280158996582, -9.977874755859375, -9.248470306396484, -8.519064903259277, -7.78965950012207, -7.060254096984863, -6.3308491706848145, -5.601444244384766, -4.872038841247559, -4.142633438110352, -3.4132285118103027, -2.683823585510254, -1.9544181823730469, -1.225013017654419, -0.495607852935791, 0.23379731178283691, 0.9632024765014648, 1.6926076412200928, 2.4220128059387207, 3.1514177322387695, 3.8808231353759766, 4.610228538513184, 5.339633464813232, 6.069038391113281, 6.798443794250488, 7.527849197387695, 8.257253646850586, 8.986659049987793, 9.716064453125, 10.445469856262207, 11.174875259399414, 11.904279708862305, 12.633685111999512, 13.363090515136719, 14.09249496459961, 14.821900367736816, 15.551305770874023, 16.280710220336914, 17.010116577148438, 17.739521026611328, 18.46892547607422, 19.198331832885742, 19.927736282348633, 20.657142639160156, 21.386547088623047, 22.115951538085938, 22.84535789489746, 23.57476234436035, 24.304168701171875, 25.033573150634766, 25.762977600097656, 26.492382049560547, 27.22178840637207]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 4.0, 4.0, 8.0, 7.0, 13.0, 13.0, 11.0, 15.0, 8.0, 14.0, 26.0, 26.0, 24.0, 34.0, 44.0, 29.0, 25.0, 52.0, 43.0, 42.0, 51.0, 42.0, 49.0, 41.0, 39.0, 52.0, 37.0, 16.0, 30.0, 29.0, 27.0, 21.0, 24.0, 20.0, 13.0, 14.0, 14.0, 9.0, 7.0, 7.0, 12.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.368841171264648, -10.982305526733398, -10.595768928527832, -10.209233283996582, -9.822696685791016, -9.436161041259766, -9.049625396728516, -8.66308879852295, -8.2765531539917, -7.890017032623291, -7.503480911254883, -7.116945266723633, -6.730409145355225, -6.343873023986816, -5.957336902618408, -5.57080078125, -5.184264659881592, -4.797728538513184, -4.411192417144775, -4.024656295776367, -3.638120651245117, -3.251584529876709, -2.865048408508301, -2.4785125255584717, -2.0919764041900635, -1.7054404020309448, -1.3189043998718262, -0.932368278503418, -0.5458322763442993, -0.15929627418518066, 0.22723984718322754, 0.6137757301330566, 1.0003118515014648, 1.3868478536605835, 1.7733838558197021, 2.1599199771881104, 2.5464558601379395, 2.9329919815063477, 3.319528102874756, 3.706063985824585, 4.092599868774414, 4.479135990142822, 4.8656721115112305, 5.2522077560424805, 5.638743877410889, 6.025279998779297, 6.411816120147705, 6.798352241516113, 7.1848883628845215, 7.57142448425293, 7.957960605621338, 8.344496726989746, 8.731032371520996, 9.117568969726562, 9.504104614257812, 9.890640258789062, 10.277176856994629, 10.663712501525879, 11.050249099731445, 11.436784744262695, 11.823321342468262, 12.209856986999512, 12.596393585205078, 12.982929229736328, 13.369464874267578]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 13.0, 16.0, 26.0, 32.0, 51.0, 75.0, 89.0, 146.0, 202.0, 338.0, 479.0, 703.0, 1128.0, 1687.0, 2632.0, 4415.0, 7187.0, 12117.0, 21513.0, 37874.0, 69756.0, 133270.0, 262834.0, 522323.0, 881499.0, 946883.0, 620571.0, 317167.0, 159035.0, 83116.0, 44393.0, 24837.0, 14659.0, 8566.0, 5215.0, 3308.0, 1999.0, 1354.0, 933.0, 597.0, 387.0, 242.0, 192.0, 118.0, 100.0, 55.0, 39.0, 32.0, 17.0, 16.0, 9.0, 12.0, 7.0, 5.0, 3.0, 2.0], "bins": [-16.84375, -16.3355712890625, -15.827392578125, -15.3192138671875, -14.81103515625, -14.3028564453125, -13.794677734375, -13.2864990234375, -12.7783203125, -12.2701416015625, -11.761962890625, -11.2537841796875, -10.74560546875, -10.2374267578125, -9.729248046875, -9.2210693359375, -8.712890625, -8.2047119140625, -7.696533203125, -7.1883544921875, -6.68017578125, -6.1719970703125, -5.663818359375, -5.1556396484375, -4.6474609375, -4.1392822265625, -3.631103515625, -3.1229248046875, -2.61474609375, -2.1065673828125, -1.598388671875, -1.0902099609375, -0.58203125, -0.0738525390625, 0.434326171875, 0.9425048828125, 1.45068359375, 1.9588623046875, 2.467041015625, 2.9752197265625, 3.4833984375, 3.9915771484375, 4.499755859375, 5.0079345703125, 5.51611328125, 6.0242919921875, 6.532470703125, 7.0406494140625, 7.548828125, 8.0570068359375, 8.565185546875, 9.0733642578125, 9.58154296875, 10.0897216796875, 10.597900390625, 11.1060791015625, 11.6142578125, 12.1224365234375, 12.630615234375, 13.1387939453125, 13.64697265625, 14.1551513671875, 14.663330078125, 15.1715087890625, 15.6796875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 5.0, 5.0, 2.0, 5.0, 11.0, 13.0, 13.0, 10.0, 10.0, 17.0, 15.0, 28.0, 25.0, 32.0, 33.0, 29.0, 32.0, 38.0, 39.0, 41.0, 42.0, 44.0, 35.0, 61.0, 50.0, 46.0, 42.0, 40.0, 38.0, 39.0, 27.0, 23.0, 21.0, 17.0, 17.0, 12.0, 6.0, 12.0, 11.0, 4.0, 3.0, 1.0, 5.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.1640625, -8.87841796875, -8.5927734375, -8.30712890625, -8.021484375, -7.73583984375, -7.4501953125, -7.16455078125, -6.87890625, -6.59326171875, -6.3076171875, -6.02197265625, -5.736328125, -5.45068359375, -5.1650390625, -4.87939453125, -4.59375, -4.30810546875, -4.0224609375, -3.73681640625, -3.451171875, -3.16552734375, -2.8798828125, -2.59423828125, -2.30859375, -2.02294921875, -1.7373046875, -1.45166015625, -1.166015625, -0.88037109375, -0.5947265625, -0.30908203125, -0.0234375, 0.26220703125, 0.5478515625, 0.83349609375, 1.119140625, 1.40478515625, 1.6904296875, 1.97607421875, 2.26171875, 2.54736328125, 2.8330078125, 3.11865234375, 3.404296875, 3.68994140625, 3.9755859375, 4.26123046875, 4.546875, 4.83251953125, 5.1181640625, 5.40380859375, 5.689453125, 5.97509765625, 6.2607421875, 6.54638671875, 6.83203125, 7.11767578125, 7.4033203125, 7.68896484375, 7.974609375, 8.26025390625, 8.5458984375, 8.83154296875, 9.1171875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 15.0, 23.0, 45.0, 51.0, 77.0, 131.0, 160.0, 273.0, 401.0, 673.0, 1060.0, 1697.0, 2688.0, 4383.0, 7276.0, 12377.0, 21725.0, 38595.0, 69415.0, 128998.0, 237706.0, 434658.0, 720980.0, 896821.0, 696263.0, 413971.0, 226675.0, 121935.0, 66786.0, 37166.0, 20911.0, 12091.0, 6993.0, 4306.0, 2563.0, 1576.0, 1036.0, 623.0, 373.0, 269.0, 178.0, 112.0, 69.0, 45.0, 39.0, 22.0, 14.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0], "bins": [-17.78125, -17.2652587890625, -16.749267578125, -16.2332763671875, -15.71728515625, -15.2012939453125, -14.685302734375, -14.1693115234375, -13.6533203125, -13.1373291015625, -12.621337890625, -12.1053466796875, -11.58935546875, -11.0733642578125, -10.557373046875, -10.0413818359375, -9.525390625, -9.0093994140625, -8.493408203125, -7.9774169921875, -7.46142578125, -6.9454345703125, -6.429443359375, -5.9134521484375, -5.3974609375, -4.8814697265625, -4.365478515625, -3.8494873046875, -3.33349609375, -2.8175048828125, -2.301513671875, -1.7855224609375, -1.26953125, -0.7535400390625, -0.237548828125, 0.2784423828125, 0.79443359375, 1.3104248046875, 1.826416015625, 2.3424072265625, 2.8583984375, 3.3743896484375, 3.890380859375, 4.4063720703125, 4.92236328125, 5.4383544921875, 5.954345703125, 6.4703369140625, 6.986328125, 7.5023193359375, 8.018310546875, 8.5343017578125, 9.05029296875, 9.5662841796875, 10.082275390625, 10.5982666015625, 11.1142578125, 11.6302490234375, 12.146240234375, 12.6622314453125, 13.17822265625, 13.6942138671875, 14.210205078125, 14.7261962890625, 15.2421875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 16.0, 30.0, 26.0, 35.0, 43.0, 60.0, 88.0, 117.0, 147.0, 176.0, 215.0, 262.0, 278.0, 303.0, 321.0, 310.0, 280.0, 275.0, 222.0, 159.0, 165.0, 128.0, 109.0, 65.0, 61.0, 38.0, 33.0, 32.0, 20.0, 11.0, 5.0, 11.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -4.99627685546875, -4.8011474609375, -4.60601806640625, -4.410888671875, -4.21575927734375, -4.0206298828125, -3.82550048828125, -3.63037109375, -3.43524169921875, -3.2401123046875, -3.04498291015625, -2.849853515625, -2.65472412109375, -2.4595947265625, -2.26446533203125, -2.0693359375, -1.87420654296875, -1.6790771484375, -1.48394775390625, -1.288818359375, -1.09368896484375, -0.8985595703125, -0.70343017578125, -0.50830078125, -0.31317138671875, -0.1180419921875, 0.07708740234375, 0.272216796875, 0.46734619140625, 0.6624755859375, 0.85760498046875, 1.052734375, 1.24786376953125, 1.4429931640625, 1.63812255859375, 1.833251953125, 2.02838134765625, 2.2235107421875, 2.41864013671875, 2.61376953125, 2.80889892578125, 3.0040283203125, 3.19915771484375, 3.394287109375, 3.58941650390625, 3.7845458984375, 3.97967529296875, 4.1748046875, 4.36993408203125, 4.5650634765625, 4.76019287109375, 4.955322265625, 5.15045166015625, 5.3455810546875, 5.54071044921875, 5.73583984375, 5.93096923828125, 6.1260986328125, 6.32122802734375, 6.516357421875, 6.71148681640625, 6.9066162109375, 7.10174560546875, 7.296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 9.0, 9.0, 19.0, 15.0, 22.0, 23.0, 20.0, 45.0, 34.0, 48.0, 43.0, 66.0, 74.0, 67.0, 69.0, 62.0, 60.0, 46.0, 51.0, 34.0, 19.0, 18.0, 28.0, 16.0, 18.0, 12.0, 9.0, 7.0, 10.0, 6.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.273786544799805, -18.626934051513672, -17.98008155822754, -17.333229064941406, -16.686378479003906, -16.039525985717773, -15.39267349243164, -14.745820999145508, -14.098968505859375, -13.452116012573242, -12.80526351928711, -12.158411979675293, -11.51155948638916, -10.864706993103027, -10.217855453491211, -9.571002960205078, -8.924150466918945, -8.277297973632812, -7.630445957183838, -6.983593940734863, -6.3367414474487305, -5.689888954162598, -5.043036937713623, -4.396184921264648, -3.7493324279785156, -3.102480173110962, -2.455627918243408, -1.8087756633758545, -1.1619234085083008, -0.5150711536407471, 0.13178110122680664, 0.7786331176757812, 1.425485610961914, 2.0723378658294678, 2.7191901206970215, 3.366042375564575, 4.012894630432129, 4.659747123718262, 5.306599140167236, 5.953451156616211, 6.600303649902344, 7.247156143188477, 7.894008159637451, 8.540860176086426, 9.187712669372559, 9.834565162658691, 10.481416702270508, 11.12826919555664, 11.775121688842773, 12.421974182128906, 13.068826675415039, 13.715678215026855, 14.362530708312988, 15.009383201599121, 15.656234741210938, 16.30308723449707, 16.949939727783203, 17.596792221069336, 18.24364471435547, 18.8904972076416, 19.537349700927734, 20.184200286865234, 20.831052780151367, 21.4779052734375, 22.124757766723633]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 6.0, 18.0, 12.0, 18.0, 12.0, 24.0, 24.0, 29.0, 25.0, 32.0, 33.0, 40.0, 43.0, 43.0, 49.0, 45.0, 41.0, 63.0, 44.0, 39.0, 37.0, 38.0, 42.0, 25.0, 25.0, 31.0, 30.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.629175186157227, -10.27098560333252, -9.912796020507812, -9.554606437683105, -9.196416854858398, -8.838227272033691, -8.480037689208984, -8.121848106384277, -7.76365852355957, -7.405468940734863, -7.047279357910156, -6.689089775085449, -6.330900192260742, -5.972710609436035, -5.614521026611328, -5.256331443786621, -4.898141860961914, -4.539952278137207, -4.1817626953125, -3.823573112487793, -3.465383529663086, -3.107193946838379, -2.749004364013672, -2.390814781188965, -2.032625198364258, -1.6744356155395508, -1.3162460327148438, -0.9580564498901367, -0.5998668670654297, -0.24167728424072266, 0.11651229858398438, 0.4747018814086914, 0.832890510559082, 1.191080093383789, 1.549269676208496, 1.9074592590332031, 2.26564884185791, 2.623838424682617, 2.982028007507324, 3.3402175903320312, 3.6984071731567383, 4.056596755981445, 4.414786338806152, 4.772975921630859, 5.131165504455566, 5.489355087280273, 5.8475446701049805, 6.2057342529296875, 6.5639238357543945, 6.922113418579102, 7.280303001403809, 7.638492584228516, 7.996682167053223, 8.35487174987793, 8.713061332702637, 9.071250915527344, 9.42944049835205, 9.787630081176758, 10.145819664001465, 10.504009246826172, 10.862198829650879, 11.220388412475586, 11.578577995300293, 11.936767578125, 12.294957160949707]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 12.0, 21.0, 34.0, 51.0, 65.0, 85.0, 112.0, 186.0, 279.0, 393.0, 526.0, 833.0, 1343.0, 2006.0, 3336.0, 5647.0, 9537.0, 16024.0, 28479.0, 49858.0, 87495.0, 140043.0, 185596.0, 183389.0, 135696.0, 83814.0, 48099.0, 27109.0, 15159.0, 9010.0, 5357.0, 3180.0, 1947.0, 1261.0, 834.0, 589.0, 333.0, 219.0, 172.0, 125.0, 67.0, 58.0, 46.0, 24.0, 34.0, 12.0, 5.0, 11.0, 8.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-11.265625, -10.9017333984375, -10.537841796875, -10.1739501953125, -9.81005859375, -9.4461669921875, -9.082275390625, -8.7183837890625, -8.3544921875, -7.9906005859375, -7.626708984375, -7.2628173828125, -6.89892578125, -6.5350341796875, -6.171142578125, -5.8072509765625, -5.443359375, -5.0794677734375, -4.715576171875, -4.3516845703125, -3.98779296875, -3.6239013671875, -3.260009765625, -2.8961181640625, -2.5322265625, -2.1683349609375, -1.804443359375, -1.4405517578125, -1.07666015625, -0.7127685546875, -0.348876953125, 0.0150146484375, 0.37890625, 0.7427978515625, 1.106689453125, 1.4705810546875, 1.83447265625, 2.1983642578125, 2.562255859375, 2.9261474609375, 3.2900390625, 3.6539306640625, 4.017822265625, 4.3817138671875, 4.74560546875, 5.1094970703125, 5.473388671875, 5.8372802734375, 6.201171875, 6.5650634765625, 6.928955078125, 7.2928466796875, 7.65673828125, 8.0206298828125, 8.384521484375, 8.7484130859375, 9.1123046875, 9.4761962890625, 9.840087890625, 10.2039794921875, 10.56787109375, 10.9317626953125, 11.295654296875, 11.6595458984375, 12.0234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 6.0, 11.0, 7.0, 17.0, 10.0, 17.0, 17.0, 25.0, 22.0, 34.0, 37.0, 32.0, 21.0, 41.0, 50.0, 58.0, 43.0, 43.0, 60.0, 45.0, 47.0, 49.0, 34.0, 30.0, 27.0, 26.0, 36.0, 30.0, 20.0, 20.0, 13.0, 15.0, 12.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1796875, -11.789306640625, -11.39892578125, -11.008544921875, -10.6181640625, -10.227783203125, -9.83740234375, -9.447021484375, -9.056640625, -8.666259765625, -8.27587890625, -7.885498046875, -7.4951171875, -7.104736328125, -6.71435546875, -6.323974609375, -5.93359375, -5.543212890625, -5.15283203125, -4.762451171875, -4.3720703125, -3.981689453125, -3.59130859375, -3.200927734375, -2.810546875, -2.420166015625, -2.02978515625, -1.639404296875, -1.2490234375, -0.858642578125, -0.46826171875, -0.077880859375, 0.3125, 0.702880859375, 1.09326171875, 1.483642578125, 1.8740234375, 2.264404296875, 2.65478515625, 3.045166015625, 3.435546875, 3.825927734375, 4.21630859375, 4.606689453125, 4.9970703125, 5.387451171875, 5.77783203125, 6.168212890625, 6.55859375, 6.948974609375, 7.33935546875, 7.729736328125, 8.1201171875, 8.510498046875, 8.90087890625, 9.291259765625, 9.681640625, 10.072021484375, 10.46240234375, 10.852783203125, 11.2431640625, 11.633544921875, 12.02392578125, 12.414306640625, 12.8046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 28.0, 35.0, 56.0, 80.0, 158.0, 203.0, 324.0, 658.0, 1134.0, 2046.0, 3939.0, 8433.0, 19049.0, 45334.0, 110973.0, 245685.0, 310000.0, 172985.0, 72177.0, 29856.0, 12864.0, 5904.0, 2912.0, 1556.0, 849.0, 499.0, 282.0, 159.0, 114.0, 83.0, 54.0, 23.0, 24.0, 20.0, 9.0, 3.0, 9.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.8115234375, -15.185546875, -14.5595703125, -13.93359375, -13.3076171875, -12.681640625, -12.0556640625, -11.4296875, -10.8037109375, -10.177734375, -9.5517578125, -8.92578125, -8.2998046875, -7.673828125, -7.0478515625, -6.421875, -5.7958984375, -5.169921875, -4.5439453125, -3.91796875, -3.2919921875, -2.666015625, -2.0400390625, -1.4140625, -0.7880859375, -0.162109375, 0.4638671875, 1.08984375, 1.7158203125, 2.341796875, 2.9677734375, 3.59375, 4.2197265625, 4.845703125, 5.4716796875, 6.09765625, 6.7236328125, 7.349609375, 7.9755859375, 8.6015625, 9.2275390625, 9.853515625, 10.4794921875, 11.10546875, 11.7314453125, 12.357421875, 12.9833984375, 13.609375, 14.2353515625, 14.861328125, 15.4873046875, 16.11328125, 16.7392578125, 17.365234375, 17.9912109375, 18.6171875, 19.2431640625, 19.869140625, 20.4951171875, 21.12109375, 21.7470703125, 22.373046875, 22.9990234375, 23.625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 18.0, 22.0, 20.0, 32.0, 29.0, 22.0, 39.0, 46.0, 41.0, 42.0, 47.0, 41.0, 44.0, 47.0, 46.0, 39.0, 41.0, 36.0, 40.0, 36.0, 41.0, 39.0, 27.0, 25.0, 28.0, 20.0, 17.0, 7.0, 9.0, 13.0, 11.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.7958984375, -6.560546875, -6.3251953125, -6.08984375, -5.8544921875, -5.619140625, -5.3837890625, -5.1484375, -4.9130859375, -4.677734375, -4.4423828125, -4.20703125, -3.9716796875, -3.736328125, -3.5009765625, -3.265625, -3.0302734375, -2.794921875, -2.5595703125, -2.32421875, -2.0888671875, -1.853515625, -1.6181640625, -1.3828125, -1.1474609375, -0.912109375, -0.6767578125, -0.44140625, -0.2060546875, 0.029296875, 0.2646484375, 0.5, 0.7353515625, 0.970703125, 1.2060546875, 1.44140625, 1.6767578125, 1.912109375, 2.1474609375, 2.3828125, 2.6181640625, 2.853515625, 3.0888671875, 3.32421875, 3.5595703125, 3.794921875, 4.0302734375, 4.265625, 4.5009765625, 4.736328125, 4.9716796875, 5.20703125, 5.4423828125, 5.677734375, 5.9130859375, 6.1484375, 6.3837890625, 6.619140625, 6.8544921875, 7.08984375, 7.3251953125, 7.560546875, 7.7958984375, 8.03125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 16.0, 13.0, 21.0, 44.0, 42.0, 60.0, 107.0, 180.0, 249.0, 393.0, 737.0, 1275.0, 2319.0, 4479.0, 9404.0, 20295.0, 45979.0, 109466.0, 240736.0, 309134.0, 171005.0, 73401.0, 31187.0, 13983.0, 6570.0, 3225.0, 1701.0, 964.0, 586.0, 319.0, 248.0, 119.0, 99.0, 55.0, 34.0, 29.0, 18.0, 17.0, 7.0, 12.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.1015625, -8.8280029296875, -8.554443359375, -8.2808837890625, -8.00732421875, -7.7337646484375, -7.460205078125, -7.1866455078125, -6.9130859375, -6.6395263671875, -6.365966796875, -6.0924072265625, -5.81884765625, -5.5452880859375, -5.271728515625, -4.9981689453125, -4.724609375, -4.4510498046875, -4.177490234375, -3.9039306640625, -3.63037109375, -3.3568115234375, -3.083251953125, -2.8096923828125, -2.5361328125, -2.2625732421875, -1.989013671875, -1.7154541015625, -1.44189453125, -1.1683349609375, -0.894775390625, -0.6212158203125, -0.34765625, -0.0740966796875, 0.199462890625, 0.4730224609375, 0.74658203125, 1.0201416015625, 1.293701171875, 1.5672607421875, 1.8408203125, 2.1143798828125, 2.387939453125, 2.6614990234375, 2.93505859375, 3.2086181640625, 3.482177734375, 3.7557373046875, 4.029296875, 4.3028564453125, 4.576416015625, 4.8499755859375, 5.12353515625, 5.3970947265625, 5.670654296875, 5.9442138671875, 6.2177734375, 6.4913330078125, 6.764892578125, 7.0384521484375, 7.31201171875, 7.5855712890625, 7.859130859375, 8.1326904296875, 8.40625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 6.0, 6.0, 17.0, 14.0, 17.0, 15.0, 20.0, 24.0, 38.0, 51.0, 54.0, 58.0, 79.0, 68.0, 64.0, 56.0, 79.0, 52.0, 62.0, 34.0, 40.0, 22.0, 20.0, 19.0, 12.0, 9.0, 17.0, 6.0, 4.0, 3.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002980232238769531, -0.0002882517874240875, -0.0002784803509712219, -0.0002687089145183563, -0.0002589374780654907, -0.0002491660416126251, -0.00023939460515975952, -0.00022962316870689392, -0.00021985173225402832, -0.00021008029580116272, -0.00020030885934829712, -0.00019053742289543152, -0.00018076598644256592, -0.00017099454998970032, -0.00016122311353683472, -0.00015145167708396912, -0.00014168024063110352, -0.00013190880417823792, -0.00012213736772537231, -0.00011236593127250671, -0.00010259449481964111, -9.282305836677551e-05, -8.305162191390991e-05, -7.328018546104431e-05, -6.350874900817871e-05, -5.373731255531311e-05, -4.396587610244751e-05, -3.419443964958191e-05, -2.442300319671631e-05, -1.4651566743850708e-05, -4.880130290985107e-06, 4.891306161880493e-06, 1.4662742614746094e-05, 2.4434179067611694e-05, 3.4205615520477295e-05, 4.3977051973342896e-05, 5.3748488426208496e-05, 6.35199248790741e-05, 7.32913613319397e-05, 8.30627977848053e-05, 9.28342342376709e-05, 0.0001026056706905365, 0.0001123771071434021, 0.0001221485435962677, 0.0001319199800491333, 0.0001416914165019989, 0.0001514628529548645, 0.0001612342894077301, 0.0001710057258605957, 0.0001807771623134613, 0.0001905485987663269, 0.0002003200352191925, 0.0002100914716720581, 0.0002198629081249237, 0.0002296343445777893, 0.0002394057810306549, 0.0002491772174835205, 0.0002589486539363861, 0.0002687200903892517, 0.0002784915268421173, 0.0002882629632949829, 0.0002980343997478485, 0.0003078058362007141, 0.0003175772726535797, 0.0003273487091064453]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 3.0, 11.0, 18.0, 13.0, 29.0, 34.0, 57.0, 91.0, 128.0, 191.0, 319.0, 387.0, 600.0, 947.0, 1563.0, 2632.0, 4654.0, 8422.0, 15615.0, 31224.0, 60140.0, 112702.0, 182010.0, 216921.0, 177022.0, 109268.0, 58458.0, 30101.0, 15393.0, 8206.0, 4475.0, 2617.0, 1478.0, 960.0, 634.0, 388.0, 273.0, 187.0, 121.0, 81.0, 60.0, 44.0, 20.0, 19.0, 16.0, 4.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.735107421875, -5.54052734375, -5.345947265625, -5.1513671875, -4.956787109375, -4.76220703125, -4.567626953125, -4.373046875, -4.178466796875, -3.98388671875, -3.789306640625, -3.5947265625, -3.400146484375, -3.20556640625, -3.010986328125, -2.81640625, -2.621826171875, -2.42724609375, -2.232666015625, -2.0380859375, -1.843505859375, -1.64892578125, -1.454345703125, -1.259765625, -1.065185546875, -0.87060546875, -0.676025390625, -0.4814453125, -0.286865234375, -0.09228515625, 0.102294921875, 0.296875, 0.491455078125, 0.68603515625, 0.880615234375, 1.0751953125, 1.269775390625, 1.46435546875, 1.658935546875, 1.853515625, 2.048095703125, 2.24267578125, 2.437255859375, 2.6318359375, 2.826416015625, 3.02099609375, 3.215576171875, 3.41015625, 3.604736328125, 3.79931640625, 3.993896484375, 4.1884765625, 4.383056640625, 4.57763671875, 4.772216796875, 4.966796875, 5.161376953125, 5.35595703125, 5.550537109375, 5.7451171875, 5.939697265625, 6.13427734375, 6.328857421875, 6.5234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 7.0, 2.0, 7.0, 3.0, 9.0, 15.0, 19.0, 16.0, 28.0, 32.0, 29.0, 32.0, 35.0, 45.0, 58.0, 53.0, 55.0, 54.0, 65.0, 57.0, 57.0, 59.0, 51.0, 51.0, 28.0, 30.0, 22.0, 19.0, 9.0, 7.0, 12.0, 9.0, 1.0, 9.0, 8.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.736328125, -1.67657470703125, -1.6168212890625, -1.55706787109375, -1.497314453125, -1.43756103515625, -1.3778076171875, -1.31805419921875, -1.25830078125, -1.19854736328125, -1.1387939453125, -1.07904052734375, -1.019287109375, -0.95953369140625, -0.8997802734375, -0.84002685546875, -0.7802734375, -0.72052001953125, -0.6607666015625, -0.60101318359375, -0.541259765625, -0.48150634765625, -0.4217529296875, -0.36199951171875, -0.30224609375, -0.24249267578125, -0.1827392578125, -0.12298583984375, -0.063232421875, -0.00347900390625, 0.0562744140625, 0.11602783203125, 0.17578125, 0.23553466796875, 0.2952880859375, 0.35504150390625, 0.414794921875, 0.47454833984375, 0.5343017578125, 0.59405517578125, 0.65380859375, 0.71356201171875, 0.7733154296875, 0.83306884765625, 0.892822265625, 0.95257568359375, 1.0123291015625, 1.07208251953125, 1.1318359375, 1.19158935546875, 1.2513427734375, 1.31109619140625, 1.370849609375, 1.43060302734375, 1.4903564453125, 1.55010986328125, 1.60986328125, 1.66961669921875, 1.7293701171875, 1.78912353515625, 1.848876953125, 1.90863037109375, 1.9683837890625, 2.02813720703125, 2.087890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 3.0, 4.0, 11.0, 15.0, 11.0, 17.0, 22.0, 19.0, 43.0, 32.0, 35.0, 52.0, 63.0, 63.0, 72.0, 69.0, 71.0, 61.0, 57.0, 46.0, 50.0, 22.0, 18.0, 27.0, 23.0, 17.0, 8.0, 10.0, 11.0, 9.0, 6.0, 0.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.129344940185547, -19.466495513916016, -18.803647994995117, -18.140798568725586, -17.477951049804688, -16.815101623535156, -16.152254104614258, -15.489404678344727, -14.826556205749512, -14.163707733154297, -13.500859260559082, -12.838010787963867, -12.175161361694336, -11.512313842773438, -10.849464416503906, -10.186615943908691, -9.523767471313477, -8.860918998718262, -8.198070526123047, -7.535221576690674, -6.872373104095459, -6.209524631500244, -5.546675682067871, -4.883827209472656, -4.220978736877441, -3.5581302642822266, -2.8952815532684326, -2.2324328422546387, -1.5695843696594238, -0.906735897064209, -0.24388718605041504, 0.4189615249633789, 1.081808090209961, 1.7446566820144653, 2.4075052738189697, 3.0703539848327637, 3.7332024574279785, 4.396050930023193, 5.058899879455566, 5.721748352050781, 6.384596824645996, 7.047445297241211, 7.710293769836426, 8.37314224243164, 9.035991668701172, 9.69883918762207, 10.361688613891602, 11.024537086486816, 11.687385559082031, 12.350234031677246, 13.013082504272461, 13.675930976867676, 14.33877944946289, 15.001628875732422, 15.664477348327637, 16.32732582092285, 16.99017333984375, 17.65302276611328, 18.31587028503418, 18.97871971130371, 19.64156723022461, 20.30441665649414, 20.96726417541504, 21.63011360168457, 22.2929630279541]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 13.0, 14.0, 10.0, 15.0, 18.0, 25.0, 23.0, 25.0, 25.0, 26.0, 34.0, 38.0, 38.0, 34.0, 48.0, 40.0, 48.0, 48.0, 41.0, 37.0, 44.0, 37.0, 32.0, 38.0, 29.0, 25.0, 19.0, 33.0, 20.0, 25.0, 14.0, 14.0, 17.0, 8.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.874702453613281, -9.548356056213379, -9.22200870513916, -8.895662307739258, -8.569314956665039, -8.242968559265137, -7.916621208190918, -7.590274810791016, -7.263927459716797, -6.937580585479736, -6.611233711242676, -6.284886837005615, -5.958539962768555, -5.632193088531494, -5.305846214294434, -4.979499816894531, -4.653152942657471, -4.32680606842041, -4.00045919418335, -3.674112319946289, -3.3477654457092285, -3.021418571472168, -2.6950719356536865, -2.368725061416626, -2.0423781871795654, -1.7160313129425049, -1.3896844387054443, -1.0633376836776733, -0.7369908094406128, -0.41064393520355225, -0.08429718017578125, 0.2420496940612793, 0.5683965682983398, 0.8947434425354004, 1.221090316772461, 1.547437071800232, 1.8737839460372925, 2.2001309394836426, 2.526477575302124, 2.8528244495391846, 3.179171323776245, 3.5055181980133057, 3.831865072250366, 4.158211708068848, 4.484558582305908, 4.810905456542969, 5.137252330780029, 5.46359920501709, 5.78994607925415, 6.116292953491211, 6.4426398277282715, 6.768986701965332, 7.095333576202393, 7.421680450439453, 7.7480268478393555, 8.074374198913574, 8.400720596313477, 8.727066993713379, 9.053414344787598, 9.3797607421875, 9.706108093261719, 10.032454490661621, 10.35880184173584, 10.685148239135742, 11.011495590209961]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 16.0, 26.0, 30.0, 55.0, 87.0, 135.0, 208.0, 371.0, 628.0, 1163.0, 2228.0, 4489.0, 8944.0, 18498.0, 37723.0, 73628.0, 129921.0, 191645.0, 208267.0, 163324.0, 100287.0, 53934.0, 26745.0, 13099.0, 6321.0, 3101.0, 1570.0, 860.0, 517.0, 272.0, 150.0, 107.0, 63.0, 43.0, 27.0, 22.0, 13.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.40625, -15.88134765625, -15.3564453125, -14.83154296875, -14.306640625, -13.78173828125, -13.2568359375, -12.73193359375, -12.20703125, -11.68212890625, -11.1572265625, -10.63232421875, -10.107421875, -9.58251953125, -9.0576171875, -8.53271484375, -8.0078125, -7.48291015625, -6.9580078125, -6.43310546875, -5.908203125, -5.38330078125, -4.8583984375, -4.33349609375, -3.80859375, -3.28369140625, -2.7587890625, -2.23388671875, -1.708984375, -1.18408203125, -0.6591796875, -0.13427734375, 0.390625, 0.91552734375, 1.4404296875, 1.96533203125, 2.490234375, 3.01513671875, 3.5400390625, 4.06494140625, 4.58984375, 5.11474609375, 5.6396484375, 6.16455078125, 6.689453125, 7.21435546875, 7.7392578125, 8.26416015625, 8.7890625, 9.31396484375, 9.8388671875, 10.36376953125, 10.888671875, 11.41357421875, 11.9384765625, 12.46337890625, 12.98828125, 13.51318359375, 14.0380859375, 14.56298828125, 15.087890625, 15.61279296875, 16.1376953125, 16.66259765625, 17.1875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 7.0, 10.0, 12.0, 16.0, 21.0, 19.0, 27.0, 29.0, 22.0, 19.0, 27.0, 33.0, 28.0, 39.0, 43.0, 42.0, 45.0, 50.0, 33.0, 34.0, 36.0, 40.0, 39.0, 27.0, 31.0, 28.0, 26.0, 27.0, 25.0, 24.0, 25.0, 18.0, 8.0, 19.0, 12.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.953125, -9.6209716796875, -9.288818359375, -8.9566650390625, -8.62451171875, -8.2923583984375, -7.960205078125, -7.6280517578125, -7.2958984375, -6.9637451171875, -6.631591796875, -6.2994384765625, -5.96728515625, -5.6351318359375, -5.302978515625, -4.9708251953125, -4.638671875, -4.3065185546875, -3.974365234375, -3.6422119140625, -3.31005859375, -2.9779052734375, -2.645751953125, -2.3135986328125, -1.9814453125, -1.6492919921875, -1.317138671875, -0.9849853515625, -0.65283203125, -0.3206787109375, 0.011474609375, 0.3436279296875, 0.67578125, 1.0079345703125, 1.340087890625, 1.6722412109375, 2.00439453125, 2.3365478515625, 2.668701171875, 3.0008544921875, 3.3330078125, 3.6651611328125, 3.997314453125, 4.3294677734375, 4.66162109375, 4.9937744140625, 5.325927734375, 5.6580810546875, 5.990234375, 6.3223876953125, 6.654541015625, 6.9866943359375, 7.31884765625, 7.6510009765625, 7.983154296875, 8.3153076171875, 8.6474609375, 8.9796142578125, 9.311767578125, 9.6439208984375, 9.97607421875, 10.3082275390625, 10.640380859375, 10.9725341796875, 11.3046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 13.0, 26.0, 38.0, 48.0, 57.0, 69.0, 119.0, 165.0, 246.0, 446.0, 746.0, 1339.0, 2816.0, 6710.0, 17135.0, 44537.0, 109220.0, 216825.0, 278653.0, 203763.0, 98627.0, 39959.0, 15401.0, 5980.0, 2592.0, 1230.0, 678.0, 410.0, 239.0, 145.0, 105.0, 64.0, 41.0, 24.0, 17.0, 21.0, 14.0, 9.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.09375, -18.42236328125, -17.7509765625, -17.07958984375, -16.408203125, -15.73681640625, -15.0654296875, -14.39404296875, -13.72265625, -13.05126953125, -12.3798828125, -11.70849609375, -11.037109375, -10.36572265625, -9.6943359375, -9.02294921875, -8.3515625, -7.68017578125, -7.0087890625, -6.33740234375, -5.666015625, -4.99462890625, -4.3232421875, -3.65185546875, -2.98046875, -2.30908203125, -1.6376953125, -0.96630859375, -0.294921875, 0.37646484375, 1.0478515625, 1.71923828125, 2.390625, 3.06201171875, 3.7333984375, 4.40478515625, 5.076171875, 5.74755859375, 6.4189453125, 7.09033203125, 7.76171875, 8.43310546875, 9.1044921875, 9.77587890625, 10.447265625, 11.11865234375, 11.7900390625, 12.46142578125, 13.1328125, 13.80419921875, 14.4755859375, 15.14697265625, 15.818359375, 16.48974609375, 17.1611328125, 17.83251953125, 18.50390625, 19.17529296875, 19.8466796875, 20.51806640625, 21.189453125, 21.86083984375, 22.5322265625, 23.20361328125, 23.875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 11.0, 9.0, 10.0, 29.0, 7.0, 14.0, 17.0, 29.0, 18.0, 28.0, 28.0, 32.0, 31.0, 34.0, 38.0, 31.0, 35.0, 31.0, 38.0, 40.0, 31.0, 41.0, 20.0, 29.0, 37.0, 31.0, 29.0, 23.0, 18.0, 33.0, 24.0, 26.0, 13.0, 19.0, 18.0, 17.0, 12.0, 4.0, 17.0, 3.0, 2.0, 5.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.84765625, -5.6590576171875, -5.470458984375, -5.2818603515625, -5.09326171875, -4.9046630859375, -4.716064453125, -4.5274658203125, -4.3388671875, -4.1502685546875, -3.961669921875, -3.7730712890625, -3.58447265625, -3.3958740234375, -3.207275390625, -3.0186767578125, -2.830078125, -2.6414794921875, -2.452880859375, -2.2642822265625, -2.07568359375, -1.8870849609375, -1.698486328125, -1.5098876953125, -1.3212890625, -1.1326904296875, -0.944091796875, -0.7554931640625, -0.56689453125, -0.3782958984375, -0.189697265625, -0.0010986328125, 0.1875, 0.3760986328125, 0.564697265625, 0.7532958984375, 0.94189453125, 1.1304931640625, 1.319091796875, 1.5076904296875, 1.6962890625, 1.8848876953125, 2.073486328125, 2.2620849609375, 2.45068359375, 2.6392822265625, 2.827880859375, 3.0164794921875, 3.205078125, 3.3936767578125, 3.582275390625, 3.7708740234375, 3.95947265625, 4.1480712890625, 4.336669921875, 4.5252685546875, 4.7138671875, 4.9024658203125, 5.091064453125, 5.2796630859375, 5.46826171875, 5.6568603515625, 5.845458984375, 6.0340576171875, 6.22265625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 34.0, 34.0, 72.0, 105.0, 162.0, 234.0, 380.0, 559.0, 812.0, 1227.0, 1916.0, 3071.0, 4616.0, 7441.0, 11793.0, 19078.0, 30929.0, 50086.0, 78853.0, 117520.0, 151793.0, 161875.0, 137070.0, 98691.0, 63892.0, 39782.0, 24915.0, 15192.0, 9467.0, 5995.0, 3804.0, 2477.0, 1651.0, 1011.0, 647.0, 462.0, 297.0, 198.0, 129.0, 82.0, 45.0, 37.0, 31.0, 16.0, 6.0, 7.0, 10.0, 1.0, 4.0, 4.0], "bins": [-6.22265625, -6.04620361328125, -5.8697509765625, -5.69329833984375, -5.516845703125, -5.34039306640625, -5.1639404296875, -4.98748779296875, -4.81103515625, -4.63458251953125, -4.4581298828125, -4.28167724609375, -4.105224609375, -3.92877197265625, -3.7523193359375, -3.57586669921875, -3.3994140625, -3.22296142578125, -3.0465087890625, -2.87005615234375, -2.693603515625, -2.51715087890625, -2.3406982421875, -2.16424560546875, -1.98779296875, -1.81134033203125, -1.6348876953125, -1.45843505859375, -1.281982421875, -1.10552978515625, -0.9290771484375, -0.75262451171875, -0.576171875, -0.39971923828125, -0.2232666015625, -0.04681396484375, 0.129638671875, 0.30609130859375, 0.4825439453125, 0.65899658203125, 0.83544921875, 1.01190185546875, 1.1883544921875, 1.36480712890625, 1.541259765625, 1.71771240234375, 1.8941650390625, 2.07061767578125, 2.2470703125, 2.42352294921875, 2.5999755859375, 2.77642822265625, 2.952880859375, 3.12933349609375, 3.3057861328125, 3.48223876953125, 3.65869140625, 3.83514404296875, 4.0115966796875, 4.18804931640625, 4.364501953125, 4.54095458984375, 4.7174072265625, 4.89385986328125, 5.0703125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 15.0, 24.0, 21.0, 32.0, 53.0, 48.0, 62.0, 77.0, 78.0, 91.0, 81.0, 89.0, 65.0, 45.0, 41.0, 29.0, 30.0, 24.0, 11.0, 11.0, 11.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006399154663085938, -0.0006174445152282715, -0.0005949735641479492, -0.000572502613067627, -0.0005500316619873047, -0.0005275607109069824, -0.0005050897598266602, -0.0004826188087463379, -0.0004601478576660156, -0.00043767690658569336, -0.0004152059555053711, -0.00039273500442504883, -0.00037026405334472656, -0.0003477931022644043, -0.00032532215118408203, -0.00030285120010375977, -0.0002803802490234375, -0.00025790929794311523, -0.00023543834686279297, -0.0002129673957824707, -0.00019049644470214844, -0.00016802549362182617, -0.0001455545425415039, -0.00012308359146118164, -0.00010061264038085938, -7.814168930053711e-05, -5.5670738220214844e-05, -3.319978713989258e-05, -1.0728836059570312e-05, 1.1742115020751953e-05, 3.421306610107422e-05, 5.6684017181396484e-05, 7.915496826171875e-05, 0.00010162591934204102, 0.00012409687042236328, 0.00014656782150268555, 0.0001690387725830078, 0.00019150972366333008, 0.00021398067474365234, 0.0002364516258239746, 0.0002589225769042969, 0.00028139352798461914, 0.0003038644790649414, 0.00032633543014526367, 0.00034880638122558594, 0.0003712773323059082, 0.00039374828338623047, 0.00041621923446655273, 0.000438690185546875, 0.00046116113662719727, 0.00048363208770751953, 0.0005061030387878418, 0.0005285739898681641, 0.0005510449409484863, 0.0005735158920288086, 0.0005959868431091309, 0.0006184577941894531, 0.0006409287452697754, 0.0006633996963500977, 0.0006858706474304199, 0.0007083415985107422, 0.0007308125495910645, 0.0007532835006713867, 0.000775754451751709, 0.0007982254028320312]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 14.0, 23.0, 43.0, 40.0, 72.0, 103.0, 144.0, 214.0, 329.0, 519.0, 773.0, 1227.0, 1827.0, 2921.0, 4758.0, 7813.0, 12918.0, 21635.0, 36179.0, 59153.0, 92919.0, 134716.0, 163554.0, 159542.0, 125429.0, 85667.0, 53640.0, 32240.0, 19526.0, 11549.0, 7157.0, 4279.0, 2658.0, 1743.0, 1075.0, 728.0, 434.0, 325.0, 183.0, 144.0, 106.0, 57.0, 46.0, 40.0, 23.0, 11.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0], "bins": [-5.80859375, -5.63201904296875, -5.4554443359375, -5.27886962890625, -5.102294921875, -4.92572021484375, -4.7491455078125, -4.57257080078125, -4.39599609375, -4.21942138671875, -4.0428466796875, -3.86627197265625, -3.689697265625, -3.51312255859375, -3.3365478515625, -3.15997314453125, -2.9833984375, -2.80682373046875, -2.6302490234375, -2.45367431640625, -2.277099609375, -2.10052490234375, -1.9239501953125, -1.74737548828125, -1.57080078125, -1.39422607421875, -1.2176513671875, -1.04107666015625, -0.864501953125, -0.68792724609375, -0.5113525390625, -0.33477783203125, -0.158203125, 0.01837158203125, 0.1949462890625, 0.37152099609375, 0.548095703125, 0.72467041015625, 0.9012451171875, 1.07781982421875, 1.25439453125, 1.43096923828125, 1.6075439453125, 1.78411865234375, 1.960693359375, 2.13726806640625, 2.3138427734375, 2.49041748046875, 2.6669921875, 2.84356689453125, 3.0201416015625, 3.19671630859375, 3.373291015625, 3.54986572265625, 3.7264404296875, 3.90301513671875, 4.07958984375, 4.25616455078125, 4.4327392578125, 4.60931396484375, 4.785888671875, 4.96246337890625, 5.1390380859375, 5.31561279296875, 5.4921875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 7.0, 18.0, 13.0, 11.0, 21.0, 23.0, 21.0, 23.0, 30.0, 49.0, 46.0, 46.0, 50.0, 69.0, 53.0, 56.0, 54.0, 35.0, 70.0, 45.0, 41.0, 29.0, 35.0, 14.0, 27.0, 21.0, 18.0, 21.0, 10.0, 10.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.81781005859375, -1.7586669921875, -1.69952392578125, -1.640380859375, -1.58123779296875, -1.5220947265625, -1.46295166015625, -1.40380859375, -1.34466552734375, -1.2855224609375, -1.22637939453125, -1.167236328125, -1.10809326171875, -1.0489501953125, -0.98980712890625, -0.9306640625, -0.87152099609375, -0.8123779296875, -0.75323486328125, -0.694091796875, -0.63494873046875, -0.5758056640625, -0.51666259765625, -0.45751953125, -0.39837646484375, -0.3392333984375, -0.28009033203125, -0.220947265625, -0.16180419921875, -0.1026611328125, -0.04351806640625, 0.015625, 0.07476806640625, 0.1339111328125, 0.19305419921875, 0.252197265625, 0.31134033203125, 0.3704833984375, 0.42962646484375, 0.48876953125, 0.54791259765625, 0.6070556640625, 0.66619873046875, 0.725341796875, 0.78448486328125, 0.8436279296875, 0.90277099609375, 0.9619140625, 1.02105712890625, 1.0802001953125, 1.13934326171875, 1.198486328125, 1.25762939453125, 1.3167724609375, 1.37591552734375, 1.43505859375, 1.49420166015625, 1.5533447265625, 1.61248779296875, 1.671630859375, 1.73077392578125, 1.7899169921875, 1.84906005859375, 1.908203125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 7.0, 9.0, 10.0, 19.0, 18.0, 26.0, 30.0, 41.0, 50.0, 50.0, 61.0, 75.0, 57.0, 72.0, 81.0, 71.0, 59.0, 55.0, 46.0, 25.0, 18.0, 21.0, 15.0, 17.0, 12.0, 10.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.58266830444336, -21.86414337158203, -21.145618438720703, -20.427093505859375, -19.708568572998047, -18.99004364013672, -18.27151870727539, -17.552993774414062, -16.834468841552734, -16.115943908691406, -15.397418975830078, -14.67889404296875, -13.960369110107422, -13.241844177246094, -12.523320198059082, -11.804795265197754, -11.086271286010742, -10.367746353149414, -9.649221420288086, -8.930696487426758, -8.21217155456543, -7.49364709854126, -6.77512264251709, -6.056597709655762, -5.338072776794434, -4.6195478439331055, -3.9010231494903564, -3.1824984550476074, -2.4639735221862793, -1.7454485893249512, -1.0269241333007812, -0.3083992004394531, 0.410125732421875, 1.1286505460739136, 1.8471753597259521, 2.565700054168701, 3.2842249870300293, 4.002749919891357, 4.721274375915527, 5.4397993087768555, 6.158324241638184, 6.876849174499512, 7.59537410736084, 8.313898086547852, 9.03242301940918, 9.750947952270508, 10.469472885131836, 11.187997817993164, 11.906522750854492, 12.62504768371582, 13.343572616577148, 14.062097549438477, 14.780622482299805, 15.499147415161133, 16.217670440673828, 16.936195373535156, 17.654720306396484, 18.373245239257812, 19.09177017211914, 19.81029510498047, 20.528820037841797, 21.247344970703125, 21.965869903564453, 22.68439483642578, 23.40291976928711]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 11.0, 7.0, 7.0, 4.0, 9.0, 11.0, 15.0, 18.0, 24.0, 23.0, 18.0, 26.0, 32.0, 29.0, 44.0, 46.0, 47.0, 37.0, 27.0, 45.0, 37.0, 38.0, 45.0, 45.0, 39.0, 28.0, 44.0, 27.0, 25.0, 23.0, 20.0, 18.0, 21.0, 21.0, 19.0, 13.0, 9.0, 11.0, 12.0, 4.0, 2.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.802571296691895, -8.481050491333008, -8.159530639648438, -7.838009834289551, -7.516489505767822, -7.194969177246094, -6.873448371887207, -6.5519280433654785, -6.23040771484375, -5.9088873863220215, -5.587367057800293, -5.265846252441406, -4.944325923919678, -4.622805595397949, -4.3012847900390625, -3.979764461517334, -3.6582441329956055, -3.336723804473877, -3.0152032375335693, -2.6936826705932617, -2.372162342071533, -2.0506420135498047, -1.729121446609497, -1.4076008796691895, -1.086080551147461, -0.7645601034164429, -0.4430396556854248, -0.12151920795440674, 0.20000123977661133, 0.5215216875076294, 0.8430421352386475, 1.164562702178955, 1.4860830307006836, 1.8076034784317017, 2.1291239261627197, 2.4506444931030273, 2.772164821624756, 3.0936851501464844, 3.415205717086792, 3.7367262840270996, 4.058246612548828, 4.379766941070557, 4.701287269592285, 5.022808074951172, 5.3443284034729, 5.665848731994629, 5.987369537353516, 6.308889865875244, 6.630410194396973, 6.951930522918701, 7.27345085144043, 7.594971656799316, 7.916491985321045, 8.238012313842773, 8.55953311920166, 8.881053924560547, 9.202573776245117, 9.524094581604004, 9.845614433288574, 10.167135238647461, 10.488655090332031, 10.810175895690918, 11.131696701049805, 11.453216552734375, 11.774737358093262]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 11.0, 12.0, 16.0, 25.0, 23.0, 50.0, 72.0, 113.0, 171.0, 284.0, 417.0, 785.0, 1408.0, 2520.0, 5214.0, 10711.0, 22889.0, 51782.0, 124898.0, 331470.0, 902695.0, 1436223.0, 808525.0, 293911.0, 111810.0, 46490.0, 20726.0, 9949.0, 5024.0, 2524.0, 1424.0, 796.0, 474.0, 299.0, 169.0, 126.0, 78.0, 44.0, 37.0, 27.0, 14.0, 20.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-23.953125, -23.23681640625, -22.5205078125, -21.80419921875, -21.087890625, -20.37158203125, -19.6552734375, -18.93896484375, -18.22265625, -17.50634765625, -16.7900390625, -16.07373046875, -15.357421875, -14.64111328125, -13.9248046875, -13.20849609375, -12.4921875, -11.77587890625, -11.0595703125, -10.34326171875, -9.626953125, -8.91064453125, -8.1943359375, -7.47802734375, -6.76171875, -6.04541015625, -5.3291015625, -4.61279296875, -3.896484375, -3.18017578125, -2.4638671875, -1.74755859375, -1.03125, -0.31494140625, 0.4013671875, 1.11767578125, 1.833984375, 2.55029296875, 3.2666015625, 3.98291015625, 4.69921875, 5.41552734375, 6.1318359375, 6.84814453125, 7.564453125, 8.28076171875, 8.9970703125, 9.71337890625, 10.4296875, 11.14599609375, 11.8623046875, 12.57861328125, 13.294921875, 14.01123046875, 14.7275390625, 15.44384765625, 16.16015625, 16.87646484375, 17.5927734375, 18.30908203125, 19.025390625, 19.74169921875, 20.4580078125, 21.17431640625, 21.890625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 12.0, 18.0, 13.0, 23.0, 10.0, 27.0, 19.0, 33.0, 37.0, 39.0, 45.0, 37.0, 48.0, 55.0, 51.0, 59.0, 43.0, 47.0, 40.0, 46.0, 38.0, 39.0, 33.0, 30.0, 26.0, 22.0, 23.0, 15.0, 14.0, 8.0, 11.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.4146728515625, -7.134033203125, -6.8533935546875, -6.57275390625, -6.2921142578125, -6.011474609375, -5.7308349609375, -5.4501953125, -5.1695556640625, -4.888916015625, -4.6082763671875, -4.32763671875, -4.0469970703125, -3.766357421875, -3.4857177734375, -3.205078125, -2.9244384765625, -2.643798828125, -2.3631591796875, -2.08251953125, -1.8018798828125, -1.521240234375, -1.2406005859375, -0.9599609375, -0.6793212890625, -0.398681640625, -0.1180419921875, 0.16259765625, 0.4432373046875, 0.723876953125, 1.0045166015625, 1.28515625, 1.5657958984375, 1.846435546875, 2.1270751953125, 2.40771484375, 2.6883544921875, 2.968994140625, 3.2496337890625, 3.5302734375, 3.8109130859375, 4.091552734375, 4.3721923828125, 4.65283203125, 4.9334716796875, 5.214111328125, 5.4947509765625, 5.775390625, 6.0560302734375, 6.336669921875, 6.6173095703125, 6.89794921875, 7.1785888671875, 7.459228515625, 7.7398681640625, 8.0205078125, 8.3011474609375, 8.581787109375, 8.8624267578125, 9.14306640625, 9.4237060546875, 9.704345703125, 9.9849853515625, 10.265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 8.0, 15.0, 9.0, 11.0, 28.0, 37.0, 57.0, 84.0, 129.0, 183.0, 321.0, 526.0, 856.0, 1400.0, 2266.0, 4026.0, 6829.0, 12496.0, 22174.0, 41410.0, 78777.0, 152526.0, 294826.0, 557030.0, 893641.0, 906856.0, 575189.0, 306470.0, 156697.0, 82111.0, 43095.0, 23434.0, 12884.0, 7114.0, 4230.0, 2509.0, 1529.0, 923.0, 601.0, 339.0, 211.0, 120.0, 98.0, 63.0, 56.0, 30.0, 22.0, 14.0, 10.0, 2.0, 6.0, 2.0, 4.0, 4.0], "bins": [-18.609375, -18.078125, -17.546875, -17.015625, -16.484375, -15.953125, -15.421875, -14.890625, -14.359375, -13.828125, -13.296875, -12.765625, -12.234375, -11.703125, -11.171875, -10.640625, -10.109375, -9.578125, -9.046875, -8.515625, -7.984375, -7.453125, -6.921875, -6.390625, -5.859375, -5.328125, -4.796875, -4.265625, -3.734375, -3.203125, -2.671875, -2.140625, -1.609375, -1.078125, -0.546875, -0.015625, 0.515625, 1.046875, 1.578125, 2.109375, 2.640625, 3.171875, 3.703125, 4.234375, 4.765625, 5.296875, 5.828125, 6.359375, 6.890625, 7.421875, 7.953125, 8.484375, 9.015625, 9.546875, 10.078125, 10.609375, 11.140625, 11.671875, 12.203125, 12.734375, 13.265625, 13.796875, 14.328125, 14.859375, 15.390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 18.0, 14.0, 16.0, 34.0, 35.0, 71.0, 64.0, 104.0, 150.0, 164.0, 195.0, 274.0, 272.0, 351.0, 322.0, 342.0, 308.0, 259.0, 253.0, 203.0, 177.0, 123.0, 91.0, 67.0, 51.0, 34.0, 20.0, 18.0, 13.0, 5.0, 4.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7525634765625, -5.552001953125, -5.3514404296875, -5.15087890625, -4.9503173828125, -4.749755859375, -4.5491943359375, -4.3486328125, -4.1480712890625, -3.947509765625, -3.7469482421875, -3.54638671875, -3.3458251953125, -3.145263671875, -2.9447021484375, -2.744140625, -2.5435791015625, -2.343017578125, -2.1424560546875, -1.94189453125, -1.7413330078125, -1.540771484375, -1.3402099609375, -1.1396484375, -0.9390869140625, -0.738525390625, -0.5379638671875, -0.33740234375, -0.1368408203125, 0.063720703125, 0.2642822265625, 0.46484375, 0.6654052734375, 0.865966796875, 1.0665283203125, 1.26708984375, 1.4676513671875, 1.668212890625, 1.8687744140625, 2.0693359375, 2.2698974609375, 2.470458984375, 2.6710205078125, 2.87158203125, 3.0721435546875, 3.272705078125, 3.4732666015625, 3.673828125, 3.8743896484375, 4.074951171875, 4.2755126953125, 4.47607421875, 4.6766357421875, 4.877197265625, 5.0777587890625, 5.2783203125, 5.4788818359375, 5.679443359375, 5.8800048828125, 6.08056640625, 6.2811279296875, 6.481689453125, 6.6822509765625, 6.8828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 16.0, 15.0, 14.0, 26.0, 34.0, 43.0, 52.0, 71.0, 57.0, 71.0, 90.0, 86.0, 78.0, 67.0, 59.0, 45.0, 35.0, 30.0, 26.0, 17.0, 15.0, 9.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.007352828979492, -24.204038619995117, -23.400724411010742, -22.597408294677734, -21.79409408569336, -20.990779876708984, -20.18746566772461, -19.384151458740234, -18.58083724975586, -17.777523040771484, -16.97420883178711, -16.170894622802734, -15.367578506469727, -14.564264297485352, -13.760950088500977, -12.957635879516602, -12.154319763183594, -11.351005554199219, -10.547690391540527, -9.744376182556152, -8.941061019897461, -8.137746810913086, -7.334432601928711, -6.531117916107178, -5.7278032302856445, -4.924488544464111, -4.121173858642578, -3.317859649658203, -2.51454496383667, -1.7112302780151367, -0.9079160690307617, -0.10460138320922852, 0.6987133026123047, 1.5020278692245483, 2.305342435836792, 3.108656883239746, 3.9119715690612793, 4.7152862548828125, 5.5186004638671875, 6.321915149688721, 7.125229835510254, 7.928544521331787, 8.73185920715332, 9.535173416137695, 10.33848762512207, 11.141802787780762, 11.945116996765137, 12.748432159423828, 13.551746368408203, 14.355060577392578, 15.15837574005127, 15.961689949035645, 16.765005111694336, 17.56831932067871, 18.371633529663086, 19.17494773864746, 19.97826385498047, 20.781578063964844, 21.58489227294922, 22.388206481933594, 23.1915225982666, 23.994836807250977, 24.79815101623535, 25.601465225219727, 26.4047794342041]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 5.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 12.0, 18.0, 11.0, 18.0, 21.0, 23.0, 17.0, 23.0, 27.0, 33.0, 29.0, 41.0, 36.0, 37.0, 38.0, 36.0, 47.0, 46.0, 40.0, 29.0, 34.0, 39.0, 34.0, 34.0, 33.0, 26.0, 28.0, 22.0, 24.0, 14.0, 21.0, 16.0, 13.0, 8.0, 6.0, 7.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.131150245666504, -7.8515729904174805, -7.571995258331299, -7.292417526245117, -7.012840270996094, -6.73326301574707, -6.453685283660889, -6.174107551574707, -5.894530296325684, -5.61495304107666, -5.3353753089904785, -5.055797576904297, -4.776220321655273, -4.49664306640625, -4.217065334320068, -3.937487840652466, -3.6579103469848633, -3.3783328533172607, -3.098755359649658, -2.8191778659820557, -2.539600372314453, -2.2600228786468506, -1.980445384979248, -1.7008678913116455, -1.421290397644043, -1.1417129039764404, -0.8621354103088379, -0.5825579166412354, -0.3029804229736328, -0.023402929306030273, 0.25617456436157227, 0.5357520580291748, 0.8153285980224609, 1.0949060916900635, 1.374483585357666, 1.6540610790252686, 1.933638572692871, 2.2132160663604736, 2.492793560028076, 2.7723710536956787, 3.0519485473632812, 3.331526041030884, 3.6111035346984863, 3.890681028366089, 4.170258522033691, 4.449835777282715, 4.7294135093688965, 5.008991241455078, 5.288568496704102, 5.568145751953125, 5.847723484039307, 6.127301216125488, 6.406878471374512, 6.686455726623535, 6.966033458709717, 7.245611190795898, 7.525188446044922, 7.804765701293945, 8.084342956542969, 8.363921165466309, 8.643498420715332, 8.923075675964355, 9.202653884887695, 9.482231140136719, 9.761808395385742]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 16.0, 15.0, 25.0, 37.0, 66.0, 85.0, 136.0, 185.0, 298.0, 443.0, 734.0, 1094.0, 1830.0, 2947.0, 5176.0, 8993.0, 16064.0, 28659.0, 51849.0, 91063.0, 146598.0, 193830.0, 183685.0, 132459.0, 79369.0, 44749.0, 24849.0, 13913.0, 7709.0, 4474.0, 2701.0, 1610.0, 1045.0, 631.0, 410.0, 273.0, 166.0, 129.0, 83.0, 50.0, 36.0, 20.0, 17.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-11.4453125, -11.09716796875, -10.7490234375, -10.40087890625, -10.052734375, -9.70458984375, -9.3564453125, -9.00830078125, -8.66015625, -8.31201171875, -7.9638671875, -7.61572265625, -7.267578125, -6.91943359375, -6.5712890625, -6.22314453125, -5.875, -5.52685546875, -5.1787109375, -4.83056640625, -4.482421875, -4.13427734375, -3.7861328125, -3.43798828125, -3.08984375, -2.74169921875, -2.3935546875, -2.04541015625, -1.697265625, -1.34912109375, -1.0009765625, -0.65283203125, -0.3046875, 0.04345703125, 0.3916015625, 0.73974609375, 1.087890625, 1.43603515625, 1.7841796875, 2.13232421875, 2.48046875, 2.82861328125, 3.1767578125, 3.52490234375, 3.873046875, 4.22119140625, 4.5693359375, 4.91748046875, 5.265625, 5.61376953125, 5.9619140625, 6.31005859375, 6.658203125, 7.00634765625, 7.3544921875, 7.70263671875, 8.05078125, 8.39892578125, 8.7470703125, 9.09521484375, 9.443359375, 9.79150390625, 10.1396484375, 10.48779296875, 10.8359375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 7.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 15.0, 17.0, 18.0, 20.0, 30.0, 28.0, 45.0, 36.0, 39.0, 52.0, 38.0, 48.0, 46.0, 53.0, 45.0, 33.0, 42.0, 51.0, 42.0, 34.0, 33.0, 29.0, 24.0, 27.0, 25.0, 16.0, 20.0, 15.0, 5.0, 4.0, 3.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.74853515625, -10.3876953125, -10.02685546875, -9.666015625, -9.30517578125, -8.9443359375, -8.58349609375, -8.22265625, -7.86181640625, -7.5009765625, -7.14013671875, -6.779296875, -6.41845703125, -6.0576171875, -5.69677734375, -5.3359375, -4.97509765625, -4.6142578125, -4.25341796875, -3.892578125, -3.53173828125, -3.1708984375, -2.81005859375, -2.44921875, -2.08837890625, -1.7275390625, -1.36669921875, -1.005859375, -0.64501953125, -0.2841796875, 0.07666015625, 0.4375, 0.79833984375, 1.1591796875, 1.52001953125, 1.880859375, 2.24169921875, 2.6025390625, 2.96337890625, 3.32421875, 3.68505859375, 4.0458984375, 4.40673828125, 4.767578125, 5.12841796875, 5.4892578125, 5.85009765625, 6.2109375, 6.57177734375, 6.9326171875, 7.29345703125, 7.654296875, 8.01513671875, 8.3759765625, 8.73681640625, 9.09765625, 9.45849609375, 9.8193359375, 10.18017578125, 10.541015625, 10.90185546875, 11.2626953125, 11.62353515625, 11.984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 5.0, 13.0, 17.0, 22.0, 34.0, 40.0, 71.0, 98.0, 150.0, 233.0, 329.0, 523.0, 770.0, 1208.0, 2249.0, 3675.0, 6694.0, 12547.0, 24503.0, 49178.0, 99288.0, 189977.0, 259609.0, 192228.0, 101399.0, 49804.0, 24625.0, 12881.0, 6754.0, 3843.0, 2170.0, 1291.0, 820.0, 492.0, 330.0, 224.0, 147.0, 92.0, 67.0, 41.0, 35.0, 19.0, 19.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.4375, -14.976806640625, -14.51611328125, -14.055419921875, -13.5947265625, -13.134033203125, -12.67333984375, -12.212646484375, -11.751953125, -11.291259765625, -10.83056640625, -10.369873046875, -9.9091796875, -9.448486328125, -8.98779296875, -8.527099609375, -8.06640625, -7.605712890625, -7.14501953125, -6.684326171875, -6.2236328125, -5.762939453125, -5.30224609375, -4.841552734375, -4.380859375, -3.920166015625, -3.45947265625, -2.998779296875, -2.5380859375, -2.077392578125, -1.61669921875, -1.156005859375, -0.6953125, -0.234619140625, 0.22607421875, 0.686767578125, 1.1474609375, 1.608154296875, 2.06884765625, 2.529541015625, 2.990234375, 3.450927734375, 3.91162109375, 4.372314453125, 4.8330078125, 5.293701171875, 5.75439453125, 6.215087890625, 6.67578125, 7.136474609375, 7.59716796875, 8.057861328125, 8.5185546875, 8.979248046875, 9.43994140625, 9.900634765625, 10.361328125, 10.822021484375, 11.28271484375, 11.743408203125, 12.2041015625, 12.664794921875, 13.12548828125, 13.586181640625, 14.046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 3.0, 8.0, 11.0, 8.0, 14.0, 8.0, 15.0, 20.0, 28.0, 35.0, 22.0, 28.0, 29.0, 31.0, 37.0, 43.0, 47.0, 43.0, 52.0, 48.0, 53.0, 44.0, 33.0, 40.0, 43.0, 38.0, 32.0, 28.0, 29.0, 28.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 10.0, 4.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-8.046875, -7.83538818359375, -7.6239013671875, -7.41241455078125, -7.200927734375, -6.98944091796875, -6.7779541015625, -6.56646728515625, -6.35498046875, -6.14349365234375, -5.9320068359375, -5.72052001953125, -5.509033203125, -5.29754638671875, -5.0860595703125, -4.87457275390625, -4.6630859375, -4.45159912109375, -4.2401123046875, -4.02862548828125, -3.817138671875, -3.60565185546875, -3.3941650390625, -3.18267822265625, -2.97119140625, -2.75970458984375, -2.5482177734375, -2.33673095703125, -2.125244140625, -1.91375732421875, -1.7022705078125, -1.49078369140625, -1.279296875, -1.06781005859375, -0.8563232421875, -0.64483642578125, -0.433349609375, -0.22186279296875, -0.0103759765625, 0.20111083984375, 0.41259765625, 0.62408447265625, 0.8355712890625, 1.04705810546875, 1.258544921875, 1.47003173828125, 1.6815185546875, 1.89300537109375, 2.1044921875, 2.31597900390625, 2.5274658203125, 2.73895263671875, 2.950439453125, 3.16192626953125, 3.3734130859375, 3.58489990234375, 3.79638671875, 4.00787353515625, 4.2193603515625, 4.43084716796875, 4.642333984375, 4.85382080078125, 5.0653076171875, 5.27679443359375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 9.0, 16.0, 14.0, 19.0, 31.0, 39.0, 64.0, 72.0, 129.0, 167.0, 235.0, 389.0, 581.0, 937.0, 1626.0, 3160.0, 7230.0, 20510.0, 70277.0, 269987.0, 451755.0, 156382.0, 40970.0, 13134.0, 4986.0, 2328.0, 1243.0, 739.0, 457.0, 347.0, 223.0, 135.0, 105.0, 67.0, 59.0, 32.0, 26.0, 18.0, 13.0, 12.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.4375, -13.0213623046875, -12.605224609375, -12.1890869140625, -11.77294921875, -11.3568115234375, -10.940673828125, -10.5245361328125, -10.1083984375, -9.6922607421875, -9.276123046875, -8.8599853515625, -8.44384765625, -8.0277099609375, -7.611572265625, -7.1954345703125, -6.779296875, -6.3631591796875, -5.947021484375, -5.5308837890625, -5.11474609375, -4.6986083984375, -4.282470703125, -3.8663330078125, -3.4501953125, -3.0340576171875, -2.617919921875, -2.2017822265625, -1.78564453125, -1.3695068359375, -0.953369140625, -0.5372314453125, -0.12109375, 0.2950439453125, 0.711181640625, 1.1273193359375, 1.54345703125, 1.9595947265625, 2.375732421875, 2.7918701171875, 3.2080078125, 3.6241455078125, 4.040283203125, 4.4564208984375, 4.87255859375, 5.2886962890625, 5.704833984375, 6.1209716796875, 6.537109375, 6.9532470703125, 7.369384765625, 7.7855224609375, 8.20166015625, 8.6177978515625, 9.033935546875, 9.4500732421875, 9.8662109375, 10.2823486328125, 10.698486328125, 11.1146240234375, 11.53076171875, 11.9468994140625, 12.363037109375, 12.7791748046875, 13.1953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 16.0, 12.0, 16.0, 20.0, 27.0, 37.0, 54.0, 70.0, 75.0, 84.0, 74.0, 77.0, 77.0, 65.0, 69.0, 57.0, 39.0, 36.0, 22.0, 20.0, 5.0, 12.0, 8.0, 9.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003781318664550781, -0.00036704540252685547, -0.0003559589385986328, -0.00034487247467041016, -0.0003337860107421875, -0.00032269954681396484, -0.0003116130828857422, -0.00030052661895751953, -0.0002894401550292969, -0.0002783536911010742, -0.00026726722717285156, -0.0002561807632446289, -0.00024509429931640625, -0.0002340078353881836, -0.00022292137145996094, -0.00021183490753173828, -0.00020074844360351562, -0.00018966197967529297, -0.0001785755157470703, -0.00016748905181884766, -0.000156402587890625, -0.00014531612396240234, -0.0001342296600341797, -0.00012314319610595703, -0.00011205673217773438, -0.00010097026824951172, -8.988380432128906e-05, -7.87973403930664e-05, -6.771087646484375e-05, -5.6624412536621094e-05, -4.553794860839844e-05, -3.445148468017578e-05, -2.3365020751953125e-05, -1.2278556823730469e-05, -1.1920928955078125e-06, 9.894371032714844e-06, 2.09808349609375e-05, 3.2067298889160156e-05, 4.315376281738281e-05, 5.424022674560547e-05, 6.532669067382812e-05, 7.641315460205078e-05, 8.749961853027344e-05, 9.85860824584961e-05, 0.00010967254638671875, 0.0001207590103149414, 0.00013184547424316406, 0.00014293193817138672, 0.00015401840209960938, 0.00016510486602783203, 0.0001761913299560547, 0.00018727779388427734, 0.0001983642578125, 0.00020945072174072266, 0.0002205371856689453, 0.00023162364959716797, 0.00024271011352539062, 0.0002537965774536133, 0.00026488304138183594, 0.0002759695053100586, 0.00028705596923828125, 0.0002981424331665039, 0.00030922889709472656, 0.0003203153610229492, 0.0003314018249511719]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 17.0, 14.0, 18.0, 24.0, 41.0, 46.0, 74.0, 96.0, 142.0, 191.0, 241.0, 385.0, 494.0, 774.0, 1179.0, 1901.0, 3252.0, 6626.0, 16370.0, 50743.0, 168097.0, 367367.0, 281941.0, 96675.0, 29704.0, 10269.0, 4659.0, 2524.0, 1528.0, 987.0, 640.0, 452.0, 315.0, 217.0, 151.0, 98.0, 87.0, 53.0, 46.0, 39.0, 20.0, 13.0, 15.0, 8.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.125, -10.7955322265625, -10.466064453125, -10.1365966796875, -9.80712890625, -9.4776611328125, -9.148193359375, -8.8187255859375, -8.4892578125, -8.1597900390625, -7.830322265625, -7.5008544921875, -7.17138671875, -6.8419189453125, -6.512451171875, -6.1829833984375, -5.853515625, -5.5240478515625, -5.194580078125, -4.8651123046875, -4.53564453125, -4.2061767578125, -3.876708984375, -3.5472412109375, -3.2177734375, -2.8883056640625, -2.558837890625, -2.2293701171875, -1.89990234375, -1.5704345703125, -1.240966796875, -0.9114990234375, -0.58203125, -0.2525634765625, 0.076904296875, 0.4063720703125, 0.73583984375, 1.0653076171875, 1.394775390625, 1.7242431640625, 2.0537109375, 2.3831787109375, 2.712646484375, 3.0421142578125, 3.37158203125, 3.7010498046875, 4.030517578125, 4.3599853515625, 4.689453125, 5.0189208984375, 5.348388671875, 5.6778564453125, 6.00732421875, 6.3367919921875, 6.666259765625, 6.9957275390625, 7.3251953125, 7.6546630859375, 7.984130859375, 8.3135986328125, 8.64306640625, 8.9725341796875, 9.302001953125, 9.6314697265625, 9.9609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 19.0, 32.0, 31.0, 37.0, 52.0, 62.0, 62.0, 74.0, 85.0, 83.0, 83.0, 79.0, 59.0, 63.0, 69.0, 24.0, 21.0, 20.0, 7.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.171875, -2.101959228515625, -2.03204345703125, -1.962127685546875, -1.8922119140625, -1.822296142578125, -1.75238037109375, -1.682464599609375, -1.612548828125, -1.542633056640625, -1.47271728515625, -1.402801513671875, -1.3328857421875, -1.262969970703125, -1.19305419921875, -1.123138427734375, -1.05322265625, -0.983306884765625, -0.91339111328125, -0.843475341796875, -0.7735595703125, -0.703643798828125, -0.63372802734375, -0.563812255859375, -0.493896484375, -0.423980712890625, -0.35406494140625, -0.284149169921875, -0.2142333984375, -0.144317626953125, -0.07440185546875, -0.004486083984375, 0.0654296875, 0.135345458984375, 0.20526123046875, 0.275177001953125, 0.3450927734375, 0.415008544921875, 0.48492431640625, 0.554840087890625, 0.624755859375, 0.694671630859375, 0.76458740234375, 0.834503173828125, 0.9044189453125, 0.974334716796875, 1.04425048828125, 1.114166259765625, 1.18408203125, 1.253997802734375, 1.32391357421875, 1.393829345703125, 1.4637451171875, 1.533660888671875, 1.60357666015625, 1.673492431640625, 1.743408203125, 1.813323974609375, 1.88323974609375, 1.953155517578125, 2.0230712890625, 2.092987060546875, 2.16290283203125, 2.232818603515625, 2.302734375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 8.0, 7.0, 11.0, 18.0, 13.0, 24.0, 38.0, 52.0, 45.0, 65.0, 73.0, 74.0, 67.0, 95.0, 81.0, 66.0, 51.0, 50.0, 37.0, 29.0, 17.0, 20.0, 11.0, 10.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.588699340820312, -22.803377151489258, -22.018054962158203, -21.23273468017578, -20.447412490844727, -19.662090301513672, -18.87677001953125, -18.091447830200195, -17.30612564086914, -16.520803451538086, -15.735482215881348, -14.95016098022461, -14.164838790893555, -13.3795166015625, -12.594195365905762, -11.808874130249023, -11.023551940917969, -10.238229751586914, -9.452908515930176, -8.667587280273438, -7.882265090942383, -7.096943378448486, -6.31162166595459, -5.526299953460693, -4.740978240966797, -3.9556565284729004, -3.170334815979004, -2.3850131034851074, -1.599691390991211, -0.8143696784973145, -0.02904796600341797, 0.7562737464904785, 1.5415935516357422, 2.3269152641296387, 3.112236976623535, 3.8975586891174316, 4.682880401611328, 5.468202114105225, 6.253523826599121, 7.038845539093018, 7.824167251586914, 8.609489440917969, 9.394810676574707, 10.180131912231445, 10.9654541015625, 11.750776290893555, 12.536097526550293, 13.321418762207031, 14.106740951538086, 14.89206314086914, 15.677384376525879, 16.462705612182617, 17.248027801513672, 18.033349990844727, 18.81867218017578, 19.603992462158203, 20.389314651489258, 21.174636840820312, 21.959957122802734, 22.74527931213379, 23.530601501464844, 24.3159236907959, 25.101245880126953, 25.886566162109375, 26.67188835144043]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 11.0, 11.0, 10.0, 15.0, 21.0, 16.0, 26.0, 22.0, 16.0, 21.0, 31.0, 39.0, 28.0, 32.0, 36.0, 42.0, 48.0, 44.0, 43.0, 35.0, 28.0, 35.0, 33.0, 45.0, 38.0, 28.0, 27.0, 26.0, 23.0, 28.0, 13.0, 25.0, 14.0, 10.0, 16.0, 7.0, 3.0, 7.0, 12.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.110013008117676, -7.8352484703063965, -7.560483932495117, -7.285719394683838, -7.010954856872559, -6.736190319061279, -6.46142578125, -6.186661243438721, -5.911896705627441, -5.637132167816162, -5.362367630004883, -5.0876030921936035, -4.812838554382324, -4.538074016571045, -4.263309478759766, -3.9885449409484863, -3.713780403137207, -3.4390158653259277, -3.1642513275146484, -2.889486789703369, -2.61472225189209, -2.3399577140808105, -2.0651931762695312, -1.790428638458252, -1.5156641006469727, -1.2408995628356934, -0.9661350250244141, -0.6913704872131348, -0.41660594940185547, -0.14184141159057617, 0.13292312622070312, 0.4076876640319824, 0.6824531555175781, 0.9572176933288574, 1.2319822311401367, 1.506746768951416, 1.7815113067626953, 2.0562758445739746, 2.331040382385254, 2.605804920196533, 2.8805694580078125, 3.155333995819092, 3.430098533630371, 3.7048630714416504, 3.9796276092529297, 4.254392147064209, 4.529156684875488, 4.803921222686768, 5.078685760498047, 5.353450298309326, 5.6282148361206055, 5.902979373931885, 6.177743911743164, 6.452508449554443, 6.727272987365723, 7.002037525177002, 7.276802062988281, 7.5515666007995605, 7.82633113861084, 8.101095199584961, 8.375860214233398, 8.650625228881836, 8.925389289855957, 9.200153350830078, 9.474918365478516]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 15.0, 19.0, 33.0, 37.0, 73.0, 111.0, 131.0, 224.0, 384.0, 580.0, 983.0, 1653.0, 2765.0, 4598.0, 7844.0, 13847.0, 23744.0, 39975.0, 66761.0, 101297.0, 137819.0, 160017.0, 152763.0, 121325.0, 83439.0, 52792.0, 31319.0, 18258.0, 10496.0, 6038.0, 3546.0, 2153.0, 1324.0, 822.0, 523.0, 311.0, 179.0, 110.0, 85.0, 57.0, 26.0, 21.0, 20.0, 14.0, 4.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.1221923828125, -11.752197265625, -11.3822021484375, -11.01220703125, -10.6422119140625, -10.272216796875, -9.9022216796875, -9.5322265625, -9.1622314453125, -8.792236328125, -8.4222412109375, -8.05224609375, -7.6822509765625, -7.312255859375, -6.9422607421875, -6.572265625, -6.2022705078125, -5.832275390625, -5.4622802734375, -5.09228515625, -4.7222900390625, -4.352294921875, -3.9822998046875, -3.6123046875, -3.2423095703125, -2.872314453125, -2.5023193359375, -2.13232421875, -1.7623291015625, -1.392333984375, -1.0223388671875, -0.65234375, -0.2823486328125, 0.087646484375, 0.4576416015625, 0.82763671875, 1.1976318359375, 1.567626953125, 1.9376220703125, 2.3076171875, 2.6776123046875, 3.047607421875, 3.4176025390625, 3.78759765625, 4.1575927734375, 4.527587890625, 4.8975830078125, 5.267578125, 5.6375732421875, 6.007568359375, 6.3775634765625, 6.74755859375, 7.1175537109375, 7.487548828125, 7.8575439453125, 8.2275390625, 8.5975341796875, 8.967529296875, 9.3375244140625, 9.70751953125, 10.0775146484375, 10.447509765625, 10.8175048828125, 11.1875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 2.0, 10.0, 10.0, 15.0, 28.0, 23.0, 25.0, 27.0, 40.0, 44.0, 48.0, 49.0, 57.0, 42.0, 58.0, 54.0, 49.0, 56.0, 37.0, 40.0, 32.0, 44.0, 36.0, 37.0, 29.0, 19.0, 21.0, 11.0, 13.0, 2.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.0234375, -12.6182861328125, -12.213134765625, -11.8079833984375, -11.40283203125, -10.9976806640625, -10.592529296875, -10.1873779296875, -9.7822265625, -9.3770751953125, -8.971923828125, -8.5667724609375, -8.16162109375, -7.7564697265625, -7.351318359375, -6.9461669921875, -6.541015625, -6.1358642578125, -5.730712890625, -5.3255615234375, -4.92041015625, -4.5152587890625, -4.110107421875, -3.7049560546875, -3.2998046875, -2.8946533203125, -2.489501953125, -2.0843505859375, -1.67919921875, -1.2740478515625, -0.868896484375, -0.4637451171875, -0.05859375, 0.3465576171875, 0.751708984375, 1.1568603515625, 1.56201171875, 1.9671630859375, 2.372314453125, 2.7774658203125, 3.1826171875, 3.5877685546875, 3.992919921875, 4.3980712890625, 4.80322265625, 5.2083740234375, 5.613525390625, 6.0186767578125, 6.423828125, 6.8289794921875, 7.234130859375, 7.6392822265625, 8.04443359375, 8.4495849609375, 8.854736328125, 9.2598876953125, 9.6650390625, 10.0701904296875, 10.475341796875, 10.8804931640625, 11.28564453125, 11.6907958984375, 12.095947265625, 12.5010986328125, 12.90625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 12.0, 24.0, 25.0, 38.0, 52.0, 77.0, 128.0, 181.0, 233.0, 386.0, 568.0, 888.0, 1432.0, 2244.0, 3577.0, 5687.0, 9287.0, 14842.0, 23793.0, 37284.0, 57228.0, 83603.0, 113339.0, 135869.0, 140900.0, 125851.0, 97651.0, 68953.0, 45581.0, 29354.0, 18476.0, 11506.0, 7128.0, 4450.0, 2873.0, 1736.0, 1082.0, 804.0, 473.0, 313.0, 203.0, 135.0, 93.0, 61.0, 48.0, 35.0, 15.0, 18.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1953125, -9.868896484375, -9.54248046875, -9.216064453125, -8.8896484375, -8.563232421875, -8.23681640625, -7.910400390625, -7.583984375, -7.257568359375, -6.93115234375, -6.604736328125, -6.2783203125, -5.951904296875, -5.62548828125, -5.299072265625, -4.97265625, -4.646240234375, -4.31982421875, -3.993408203125, -3.6669921875, -3.340576171875, -3.01416015625, -2.687744140625, -2.361328125, -2.034912109375, -1.70849609375, -1.382080078125, -1.0556640625, -0.729248046875, -0.40283203125, -0.076416015625, 0.25, 0.576416015625, 0.90283203125, 1.229248046875, 1.5556640625, 1.882080078125, 2.20849609375, 2.534912109375, 2.861328125, 3.187744140625, 3.51416015625, 3.840576171875, 4.1669921875, 4.493408203125, 4.81982421875, 5.146240234375, 5.47265625, 5.799072265625, 6.12548828125, 6.451904296875, 6.7783203125, 7.104736328125, 7.43115234375, 7.757568359375, 8.083984375, 8.410400390625, 8.73681640625, 9.063232421875, 9.3896484375, 9.716064453125, 10.04248046875, 10.368896484375, 10.6953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 11.0, 17.0, 15.0, 15.0, 12.0, 25.0, 30.0, 25.0, 17.0, 41.0, 34.0, 34.0, 31.0, 44.0, 36.0, 37.0, 50.0, 52.0, 45.0, 35.0, 38.0, 35.0, 32.0, 32.0, 30.0, 23.0, 34.0, 27.0, 30.0, 19.0, 8.0, 7.0, 12.0, 9.0, 12.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9434814453125, -5.746337890625, -5.5491943359375, -5.35205078125, -5.1549072265625, -4.957763671875, -4.7606201171875, -4.5634765625, -4.3663330078125, -4.169189453125, -3.9720458984375, -3.77490234375, -3.5777587890625, -3.380615234375, -3.1834716796875, -2.986328125, -2.7891845703125, -2.592041015625, -2.3948974609375, -2.19775390625, -2.0006103515625, -1.803466796875, -1.6063232421875, -1.4091796875, -1.2120361328125, -1.014892578125, -0.8177490234375, -0.62060546875, -0.4234619140625, -0.226318359375, -0.0291748046875, 0.16796875, 0.3651123046875, 0.562255859375, 0.7593994140625, 0.95654296875, 1.1536865234375, 1.350830078125, 1.5479736328125, 1.7451171875, 1.9422607421875, 2.139404296875, 2.3365478515625, 2.53369140625, 2.7308349609375, 2.927978515625, 3.1251220703125, 3.322265625, 3.5194091796875, 3.716552734375, 3.9136962890625, 4.11083984375, 4.3079833984375, 4.505126953125, 4.7022705078125, 4.8994140625, 5.0965576171875, 5.293701171875, 5.4908447265625, 5.68798828125, 5.8851318359375, 6.082275390625, 6.2794189453125, 6.4765625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 16.0, 22.0, 38.0, 67.0, 99.0, 114.0, 194.0, 298.0, 434.0, 687.0, 1191.0, 1947.0, 3256.0, 5255.0, 9074.0, 15267.0, 25542.0, 43012.0, 70742.0, 107777.0, 148180.0, 168641.0, 151307.0, 111548.0, 72578.0, 45162.0, 26746.0, 16000.0, 9287.0, 5417.0, 3335.0, 2074.0, 1172.0, 777.0, 470.0, 258.0, 177.0, 145.0, 69.0, 46.0, 32.0, 22.0, 25.0, 15.0, 12.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.3125, -5.14923095703125, -4.9859619140625, -4.82269287109375, -4.659423828125, -4.49615478515625, -4.3328857421875, -4.16961669921875, -4.00634765625, -3.84307861328125, -3.6798095703125, -3.51654052734375, -3.353271484375, -3.19000244140625, -3.0267333984375, -2.86346435546875, -2.7001953125, -2.53692626953125, -2.3736572265625, -2.21038818359375, -2.047119140625, -1.88385009765625, -1.7205810546875, -1.55731201171875, -1.39404296875, -1.23077392578125, -1.0675048828125, -0.90423583984375, -0.740966796875, -0.57769775390625, -0.4144287109375, -0.25115966796875, -0.087890625, 0.07537841796875, 0.2386474609375, 0.40191650390625, 0.565185546875, 0.72845458984375, 0.8917236328125, 1.05499267578125, 1.21826171875, 1.38153076171875, 1.5447998046875, 1.70806884765625, 1.871337890625, 2.03460693359375, 2.1978759765625, 2.36114501953125, 2.5244140625, 2.68768310546875, 2.8509521484375, 3.01422119140625, 3.177490234375, 3.34075927734375, 3.5040283203125, 3.66729736328125, 3.83056640625, 3.99383544921875, 4.1571044921875, 4.32037353515625, 4.483642578125, 4.64691162109375, 4.8101806640625, 4.97344970703125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 9.0, 7.0, 4.0, 23.0, 21.0, 19.0, 30.0, 36.0, 44.0, 53.0, 56.0, 76.0, 57.0, 71.0, 97.0, 62.0, 60.0, 57.0, 43.0, 37.0, 34.0, 25.0, 14.0, 20.0, 9.0, 10.0, 7.0, 8.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006604194641113281, -0.0006402879953384399, -0.0006201565265655518, -0.0006000250577926636, -0.0005798935890197754, -0.0005597621202468872, -0.000539630651473999, -0.0005194991827011108, -0.0004993677139282227, -0.00047923624515533447, -0.0004591047763824463, -0.0004389733076095581, -0.0004188418388366699, -0.00039871037006378174, -0.00037857890129089355, -0.00035844743251800537, -0.0003383159637451172, -0.000318184494972229, -0.0002980530261993408, -0.00027792155742645264, -0.00025779008865356445, -0.00023765861988067627, -0.00021752715110778809, -0.0001973956823348999, -0.00017726421356201172, -0.00015713274478912354, -0.00013700127601623535, -0.00011686980724334717, -9.673833847045898e-05, -7.66068696975708e-05, -5.647540092468262e-05, -3.6343932151794434e-05, -1.621246337890625e-05, 3.919005393981934e-06, 2.4050474166870117e-05, 4.41819429397583e-05, 6.431341171264648e-05, 8.444488048553467e-05, 0.00010457634925842285, 0.00012470781803131104, 0.00014483928680419922, 0.0001649707555770874, 0.00018510222434997559, 0.00020523369312286377, 0.00022536516189575195, 0.00024549663066864014, 0.0002656280994415283, 0.0002857595682144165, 0.0003058910369873047, 0.00032602250576019287, 0.00034615397453308105, 0.00036628544330596924, 0.0003864169120788574, 0.0004065483808517456, 0.0004266798496246338, 0.00044681131839752197, 0.00046694278717041016, 0.00048707425594329834, 0.0005072057247161865, 0.0005273371934890747, 0.0005474686622619629, 0.0005676001310348511, 0.0005877315998077393, 0.0006078630685806274, 0.0006279945373535156]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 5.0, 12.0, 17.0, 23.0, 39.0, 65.0, 103.0, 146.0, 220.0, 291.0, 505.0, 752.0, 1237.0, 1900.0, 2871.0, 4689.0, 7381.0, 11864.0, 19064.0, 30574.0, 48749.0, 74657.0, 108463.0, 140144.0, 154320.0, 137424.0, 105297.0, 72148.0, 47053.0, 29239.0, 18348.0, 11282.0, 7231.0, 4439.0, 2866.0, 1821.0, 1135.0, 725.0, 505.0, 341.0, 211.0, 147.0, 77.0, 63.0, 36.0, 23.0, 17.0, 11.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-4.84375, -4.69451904296875, -4.5452880859375, -4.39605712890625, -4.246826171875, -4.09759521484375, -3.9483642578125, -3.79913330078125, -3.64990234375, -3.50067138671875, -3.3514404296875, -3.20220947265625, -3.052978515625, -2.90374755859375, -2.7545166015625, -2.60528564453125, -2.4560546875, -2.30682373046875, -2.1575927734375, -2.00836181640625, -1.859130859375, -1.70989990234375, -1.5606689453125, -1.41143798828125, -1.26220703125, -1.11297607421875, -0.9637451171875, -0.81451416015625, -0.665283203125, -0.51605224609375, -0.3668212890625, -0.21759033203125, -0.068359375, 0.08087158203125, 0.2301025390625, 0.37933349609375, 0.528564453125, 0.67779541015625, 0.8270263671875, 0.97625732421875, 1.12548828125, 1.27471923828125, 1.4239501953125, 1.57318115234375, 1.722412109375, 1.87164306640625, 2.0208740234375, 2.17010498046875, 2.3193359375, 2.46856689453125, 2.6177978515625, 2.76702880859375, 2.916259765625, 3.06549072265625, 3.2147216796875, 3.36395263671875, 3.51318359375, 3.66241455078125, 3.8116455078125, 3.96087646484375, 4.110107421875, 4.25933837890625, 4.4085693359375, 4.55780029296875, 4.70703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 7.0, 12.0, 19.0, 24.0, 28.0, 34.0, 46.0, 64.0, 52.0, 62.0, 66.0, 75.0, 67.0, 56.0, 62.0, 48.0, 54.0, 55.0, 32.0, 20.0, 17.0, 19.0, 10.0, 10.0, 12.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7018890380859375, -1.639129638671875, -1.5763702392578125, -1.51361083984375, -1.4508514404296875, -1.388092041015625, -1.3253326416015625, -1.2625732421875, -1.1998138427734375, -1.137054443359375, -1.0742950439453125, -1.01153564453125, -0.9487762451171875, -0.886016845703125, -0.8232574462890625, -0.760498046875, -0.6977386474609375, -0.634979248046875, -0.5722198486328125, -0.50946044921875, -0.4467010498046875, -0.383941650390625, -0.3211822509765625, -0.2584228515625, -0.1956634521484375, -0.132904052734375, -0.0701446533203125, -0.00738525390625, 0.0553741455078125, 0.118133544921875, 0.1808929443359375, 0.24365234375, 0.3064117431640625, 0.369171142578125, 0.4319305419921875, 0.49468994140625, 0.5574493408203125, 0.620208740234375, 0.6829681396484375, 0.7457275390625, 0.8084869384765625, 0.871246337890625, 0.9340057373046875, 0.99676513671875, 1.0595245361328125, 1.122283935546875, 1.1850433349609375, 1.247802734375, 1.3105621337890625, 1.373321533203125, 1.4360809326171875, 1.49884033203125, 1.5615997314453125, 1.624359130859375, 1.6871185302734375, 1.7498779296875, 1.8126373291015625, 1.875396728515625, 1.9381561279296875, 2.00091552734375, 2.0636749267578125, 2.126434326171875, 2.1891937255859375, 2.251953125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 11.0, 11.0, 9.0, 27.0, 23.0, 41.0, 51.0, 62.0, 48.0, 68.0, 84.0, 70.0, 75.0, 73.0, 70.0, 57.0, 40.0, 35.0, 19.0, 28.0, 13.0, 18.0, 10.0, 6.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.393449783325195, -21.668926239013672, -20.94440269470215, -20.219879150390625, -19.49535369873047, -18.770830154418945, -18.046306610107422, -17.3217830657959, -16.597259521484375, -15.872735977172852, -15.148212432861328, -14.423687934875488, -13.699164390563965, -12.974640846252441, -12.250116348266602, -11.525592803955078, -10.801069259643555, -10.076545715332031, -9.352022171020508, -8.627497673034668, -7.9029741287231445, -7.178450584411621, -6.4539265632629395, -5.729402542114258, -5.004878997802734, -4.280355453491211, -3.5558314323425293, -2.8313076496124268, -2.106783866882324, -1.3822600841522217, -0.6577363014221191, 0.0667877197265625, 0.7913093566894531, 1.5158331394195557, 2.240356922149658, 2.9648807048797607, 3.6894044876098633, 4.413928031921387, 5.138452053070068, 5.86297607421875, 6.587499618530273, 7.312023162841797, 8.03654670715332, 8.76107120513916, 9.485594749450684, 10.210118293762207, 10.934642791748047, 11.65916633605957, 12.383689880371094, 13.108213424682617, 13.83273696899414, 14.55726146697998, 15.281785011291504, 16.006309509277344, 16.730833053588867, 17.45535659790039, 18.179880142211914, 18.904403686523438, 19.62892723083496, 20.353450775146484, 21.07797622680664, 21.802499771118164, 22.527023315429688, 23.25154685974121, 23.976070404052734]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 5.0, 5.0, 14.0, 17.0, 13.0, 14.0, 16.0, 20.0, 30.0, 24.0, 33.0, 31.0, 26.0, 43.0, 38.0, 38.0, 42.0, 52.0, 50.0, 44.0, 43.0, 54.0, 32.0, 40.0, 38.0, 34.0, 30.0, 20.0, 25.0, 24.0, 15.0, 23.0, 15.0, 9.0, 5.0, 13.0, 3.0, 8.0, 2.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620841979980469, -9.307011604309082, -8.993182182312012, -8.679351806640625, -8.365522384643555, -8.051692008972168, -7.7378621101379395, -7.424032211303711, -7.110201835632324, -6.796371936798096, -6.482542037963867, -6.1687116622924805, -5.854881763458252, -5.541051864624023, -5.227221965789795, -4.913392066955566, -4.599562168121338, -4.285732269287109, -3.9719021320343018, -3.6580722332000732, -3.3442420959472656, -3.030412197113037, -2.7165822982788086, -2.402752161026001, -2.0889222621917725, -1.7750922441482544, -1.4612622261047363, -1.1474323272705078, -0.8336023092269897, -0.5197722911834717, -0.20594239234924316, 0.10788774490356445, 0.42171764373779297, 0.735547661781311, 1.049377679824829, 1.3632075786590576, 1.6770375967025757, 1.9908676147460938, 2.3046975135803223, 2.61852765083313, 2.9323575496673584, 3.246187448501587, 3.5600175857543945, 3.873847484588623, 4.187677383422852, 4.501507759094238, 4.815337181091309, 5.129167556762695, 5.442997455596924, 5.756827354431152, 6.070657253265381, 6.384487152099609, 6.698317527770996, 7.012147426605225, 7.325977325439453, 7.63980770111084, 7.95363712310791, 8.267467498779297, 8.581296920776367, 8.895127296447754, 9.208956718444824, 9.522787094116211, 9.836616516113281, 10.150446891784668, 10.464277267456055]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 12.0, 16.0, 36.0, 41.0, 41.0, 82.0, 119.0, 181.0, 329.0, 454.0, 760.0, 1269.0, 2154.0, 3628.0, 6808.0, 12233.0, 23108.0, 44323.0, 89697.0, 193065.0, 433588.0, 920256.0, 1160130.0, 707608.0, 313208.0, 140803.0, 67147.0, 33407.0, 17384.0, 9324.0, 5243.0, 2997.0, 1785.0, 1110.0, 671.0, 403.0, 288.0, 180.0, 119.0, 89.0, 51.0, 38.0, 30.0, 22.0, 9.0, 8.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-17.5, -16.958251953125, -16.41650390625, -15.874755859375, -15.3330078125, -14.791259765625, -14.24951171875, -13.707763671875, -13.166015625, -12.624267578125, -12.08251953125, -11.540771484375, -10.9990234375, -10.457275390625, -9.91552734375, -9.373779296875, -8.83203125, -8.290283203125, -7.74853515625, -7.206787109375, -6.6650390625, -6.123291015625, -5.58154296875, -5.039794921875, -4.498046875, -3.956298828125, -3.41455078125, -2.872802734375, -2.3310546875, -1.789306640625, -1.24755859375, -0.705810546875, -0.1640625, 0.377685546875, 0.91943359375, 1.461181640625, 2.0029296875, 2.544677734375, 3.08642578125, 3.628173828125, 4.169921875, 4.711669921875, 5.25341796875, 5.795166015625, 6.3369140625, 6.878662109375, 7.42041015625, 7.962158203125, 8.50390625, 9.045654296875, 9.58740234375, 10.129150390625, 10.6708984375, 11.212646484375, 11.75439453125, 12.296142578125, 12.837890625, 13.379638671875, 13.92138671875, 14.463134765625, 15.0048828125, 15.546630859375, 16.08837890625, 16.630126953125, 17.171875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 15.0, 11.0, 20.0, 21.0, 16.0, 26.0, 37.0, 28.0, 34.0, 38.0, 45.0, 51.0, 39.0, 54.0, 41.0, 50.0, 49.0, 52.0, 50.0, 47.0, 28.0, 33.0, 26.0, 31.0, 17.0, 24.0, 18.0, 15.0, 23.0, 6.0, 9.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.31622314453125, -8.0621337890625, -7.80804443359375, -7.553955078125, -7.29986572265625, -7.0457763671875, -6.79168701171875, -6.53759765625, -6.28350830078125, -6.0294189453125, -5.77532958984375, -5.521240234375, -5.26715087890625, -5.0130615234375, -4.75897216796875, -4.5048828125, -4.25079345703125, -3.9967041015625, -3.74261474609375, -3.488525390625, -3.23443603515625, -2.9803466796875, -2.72625732421875, -2.47216796875, -2.21807861328125, -1.9639892578125, -1.70989990234375, -1.455810546875, -1.20172119140625, -0.9476318359375, -0.69354248046875, -0.439453125, -0.18536376953125, 0.0687255859375, 0.32281494140625, 0.576904296875, 0.83099365234375, 1.0850830078125, 1.33917236328125, 1.59326171875, 1.84735107421875, 2.1014404296875, 2.35552978515625, 2.609619140625, 2.86370849609375, 3.1177978515625, 3.37188720703125, 3.6259765625, 3.88006591796875, 4.1341552734375, 4.38824462890625, 4.642333984375, 4.89642333984375, 5.1505126953125, 5.40460205078125, 5.65869140625, 5.91278076171875, 6.1668701171875, 6.42095947265625, 6.675048828125, 6.92913818359375, 7.1832275390625, 7.43731689453125, 7.69140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 15.0, 10.0, 18.0, 30.0, 38.0, 59.0, 101.0, 151.0, 191.0, 324.0, 529.0, 782.0, 1214.0, 1908.0, 3068.0, 5120.0, 8803.0, 15161.0, 26720.0, 48072.0, 88251.0, 163854.0, 303449.0, 546089.0, 846154.0, 864364.0, 569016.0, 318537.0, 171116.0, 92318.0, 50896.0, 28279.0, 15863.0, 9467.0, 5469.0, 3299.0, 1935.0, 1324.0, 792.0, 520.0, 343.0, 216.0, 119.0, 107.0, 81.0, 32.0, 29.0, 14.0, 14.0, 8.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.453125, -14.9708251953125, -14.488525390625, -14.0062255859375, -13.52392578125, -13.0416259765625, -12.559326171875, -12.0770263671875, -11.5947265625, -11.1124267578125, -10.630126953125, -10.1478271484375, -9.66552734375, -9.1832275390625, -8.700927734375, -8.2186279296875, -7.736328125, -7.2540283203125, -6.771728515625, -6.2894287109375, -5.80712890625, -5.3248291015625, -4.842529296875, -4.3602294921875, -3.8779296875, -3.3956298828125, -2.913330078125, -2.4310302734375, -1.94873046875, -1.4664306640625, -0.984130859375, -0.5018310546875, -0.01953125, 0.4627685546875, 0.945068359375, 1.4273681640625, 1.90966796875, 2.3919677734375, 2.874267578125, 3.3565673828125, 3.8388671875, 4.3211669921875, 4.803466796875, 5.2857666015625, 5.76806640625, 6.2503662109375, 6.732666015625, 7.2149658203125, 7.697265625, 8.1795654296875, 8.661865234375, 9.1441650390625, 9.62646484375, 10.1087646484375, 10.591064453125, 11.0733642578125, 11.5556640625, 12.0379638671875, 12.520263671875, 13.0025634765625, 13.48486328125, 13.9671630859375, 14.449462890625, 14.9317626953125, 15.4140625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 10.0, 11.0, 23.0, 22.0, 23.0, 26.0, 31.0, 40.0, 60.0, 101.0, 105.0, 125.0, 150.0, 203.0, 244.0, 260.0, 281.0, 287.0, 295.0, 267.0, 289.0, 233.0, 195.0, 156.0, 145.0, 112.0, 70.0, 75.0, 54.0, 53.0, 34.0, 23.0, 14.0, 13.0, 13.0, 8.0, 3.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.875, -4.7135009765625, -4.552001953125, -4.3905029296875, -4.22900390625, -4.0675048828125, -3.906005859375, -3.7445068359375, -3.5830078125, -3.4215087890625, -3.260009765625, -3.0985107421875, -2.93701171875, -2.7755126953125, -2.614013671875, -2.4525146484375, -2.291015625, -2.1295166015625, -1.968017578125, -1.8065185546875, -1.64501953125, -1.4835205078125, -1.322021484375, -1.1605224609375, -0.9990234375, -0.8375244140625, -0.676025390625, -0.5145263671875, -0.35302734375, -0.1915283203125, -0.030029296875, 0.1314697265625, 0.29296875, 0.4544677734375, 0.615966796875, 0.7774658203125, 0.93896484375, 1.1004638671875, 1.261962890625, 1.4234619140625, 1.5849609375, 1.7464599609375, 1.907958984375, 2.0694580078125, 2.23095703125, 2.3924560546875, 2.553955078125, 2.7154541015625, 2.876953125, 3.0384521484375, 3.199951171875, 3.3614501953125, 3.52294921875, 3.6844482421875, 3.845947265625, 4.0074462890625, 4.1689453125, 4.3304443359375, 4.491943359375, 4.6534423828125, 4.81494140625, 4.9764404296875, 5.137939453125, 5.2994384765625, 5.4609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 11.0, 5.0, 11.0, 15.0, 23.0, 22.0, 29.0, 39.0, 45.0, 60.0, 71.0, 75.0, 82.0, 71.0, 70.0, 70.0, 57.0, 53.0, 30.0, 26.0, 33.0, 21.0, 16.0, 12.0, 10.0, 8.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.947229385375977, -22.237016677856445, -21.526803970336914, -20.816591262817383, -20.10637855529785, -19.39616584777832, -18.685951232910156, -17.975738525390625, -17.265525817871094, -16.555313110351562, -15.845100402832031, -15.1348876953125, -14.424674987792969, -13.714462280273438, -13.00424861907959, -12.294035911560059, -11.583824157714844, -10.873611450195312, -10.163398742675781, -9.45318603515625, -8.742973327636719, -8.032760620117188, -7.32254695892334, -6.612334251403809, -5.902121543884277, -5.191908836364746, -4.481696128845215, -3.7714829444885254, -3.061270236968994, -2.351057529449463, -1.6408443450927734, -0.9306316375732422, -0.22041893005371094, 0.48979389667510986, 1.2000067234039307, 1.910219669342041, 2.6204323768615723, 3.3306450843811035, 4.040858268737793, 4.751070976257324, 5.4612836837768555, 6.171496391296387, 6.881709098815918, 7.591922283172607, 8.302135467529297, 9.012348175048828, 9.72256088256836, 10.43277359008789, 11.142986297607422, 11.853199005126953, 12.563411712646484, 13.273624420166016, 13.983837127685547, 14.694049835205078, 15.404263496398926, 16.11447525024414, 16.824687957763672, 17.534900665283203, 18.245113372802734, 18.955326080322266, 19.665538787841797, 20.375751495361328, 21.08596420288086, 21.79617691040039, 22.506391525268555]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 16.0, 8.0, 14.0, 15.0, 17.0, 16.0, 28.0, 34.0, 37.0, 31.0, 47.0, 38.0, 35.0, 49.0, 43.0, 38.0, 50.0, 48.0, 56.0, 43.0, 36.0, 41.0, 30.0, 31.0, 27.0, 21.0, 21.0, 13.0, 17.0, 18.0, 16.0, 12.0, 7.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6331353187561035, -7.344013214111328, -7.054891109466553, -6.765769004821777, -6.476646900177002, -6.187524795532227, -5.898402214050293, -5.609280586242676, -5.320158004760742, -5.031035900115967, -4.741913795471191, -4.452791690826416, -4.163669586181641, -3.8745474815368652, -3.5854251384735107, -3.2963030338287354, -3.007181167602539, -2.7180590629577637, -2.4289369583129883, -2.139814853668213, -1.850692629814148, -1.5615705251693726, -1.2724483013153076, -0.9833261966705322, -0.6942040920257568, -0.40508195757865906, -0.11595982313156128, 0.1731623411178589, 0.4622844457626343, 0.7514065504074097, 1.0405287742614746, 1.32965087890625, 1.6187725067138672, 1.9078946113586426, 2.197016716003418, 2.4861388206481934, 2.7752609252929688, 3.064383029937744, 3.3535053730010986, 3.642627477645874, 3.9317495822906494, 4.220871925354004, 4.509994029998779, 4.799116134643555, 5.08823823928833, 5.3773603439331055, 5.666482448577881, 5.955604553222656, 6.244726657867432, 6.533848762512207, 6.822970867156982, 7.112092971801758, 7.401215076446533, 7.690337181091309, 7.979459762573242, 8.26858139038086, 8.557703971862793, 8.846826553344727, 9.135948181152344, 9.425070762634277, 9.714192390441895, 10.003314971923828, 10.292436599731445, 10.581559181213379, 10.870680809020996]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 11.0, 7.0, 17.0, 28.0, 53.0, 84.0, 121.0, 193.0, 248.0, 485.0, 780.0, 1408.0, 2515.0, 4650.0, 8796.0, 18493.0, 40494.0, 90993.0, 192971.0, 280828.0, 211845.0, 104424.0, 46298.0, 21047.0, 10101.0, 5193.0, 2635.0, 1558.0, 855.0, 527.0, 328.0, 181.0, 127.0, 99.0, 41.0, 29.0, 29.0, 18.0, 12.0, 10.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.6751708984375, -15.194091796875, -14.7130126953125, -14.23193359375, -13.7508544921875, -13.269775390625, -12.7886962890625, -12.3076171875, -11.8265380859375, -11.345458984375, -10.8643798828125, -10.38330078125, -9.9022216796875, -9.421142578125, -8.9400634765625, -8.458984375, -7.9779052734375, -7.496826171875, -7.0157470703125, -6.53466796875, -6.0535888671875, -5.572509765625, -5.0914306640625, -4.6103515625, -4.1292724609375, -3.648193359375, -3.1671142578125, -2.68603515625, -2.2049560546875, -1.723876953125, -1.2427978515625, -0.76171875, -0.2806396484375, 0.200439453125, 0.6815185546875, 1.16259765625, 1.6436767578125, 2.124755859375, 2.6058349609375, 3.0869140625, 3.5679931640625, 4.049072265625, 4.5301513671875, 5.01123046875, 5.4923095703125, 5.973388671875, 6.4544677734375, 6.935546875, 7.4166259765625, 7.897705078125, 8.3787841796875, 8.85986328125, 9.3409423828125, 9.822021484375, 10.3031005859375, 10.7841796875, 11.2652587890625, 11.746337890625, 12.2274169921875, 12.70849609375, 13.1895751953125, 13.670654296875, 14.1517333984375, 14.6328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 3.0, 10.0, 13.0, 12.0, 27.0, 19.0, 30.0, 28.0, 27.0, 38.0, 48.0, 49.0, 56.0, 50.0, 57.0, 44.0, 52.0, 47.0, 48.0, 42.0, 39.0, 40.0, 34.0, 28.0, 22.0, 28.0, 16.0, 22.0, 14.0, 14.0, 3.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.4588623046875, -10.097412109375, -9.7359619140625, -9.37451171875, -9.0130615234375, -8.651611328125, -8.2901611328125, -7.9287109375, -7.5672607421875, -7.205810546875, -6.8443603515625, -6.48291015625, -6.1214599609375, -5.760009765625, -5.3985595703125, -5.037109375, -4.6756591796875, -4.314208984375, -3.9527587890625, -3.59130859375, -3.2298583984375, -2.868408203125, -2.5069580078125, -2.1455078125, -1.7840576171875, -1.422607421875, -1.0611572265625, -0.69970703125, -0.3382568359375, 0.023193359375, 0.3846435546875, 0.74609375, 1.1075439453125, 1.468994140625, 1.8304443359375, 2.19189453125, 2.5533447265625, 2.914794921875, 3.2762451171875, 3.6376953125, 3.9991455078125, 4.360595703125, 4.7220458984375, 5.08349609375, 5.4449462890625, 5.806396484375, 6.1678466796875, 6.529296875, 6.8907470703125, 7.252197265625, 7.6136474609375, 7.97509765625, 8.3365478515625, 8.697998046875, 9.0594482421875, 9.4208984375, 9.7823486328125, 10.143798828125, 10.5052490234375, 10.86669921875, 11.2281494140625, 11.589599609375, 11.9510498046875, 12.3125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 11.0, 9.0, 17.0, 31.0, 31.0, 45.0, 71.0, 105.0, 174.0, 265.0, 446.0, 769.0, 1541.0, 3168.0, 7548.0, 19885.0, 61183.0, 204820.0, 430399.0, 217958.0, 64272.0, 21012.0, 7792.0, 3391.0, 1564.0, 811.0, 466.0, 269.0, 174.0, 100.0, 67.0, 37.0, 41.0, 25.0, 16.0, 6.0, 9.0, 10.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.703125, -26.92333984375, -26.1435546875, -25.36376953125, -24.583984375, -23.80419921875, -23.0244140625, -22.24462890625, -21.46484375, -20.68505859375, -19.9052734375, -19.12548828125, -18.345703125, -17.56591796875, -16.7861328125, -16.00634765625, -15.2265625, -14.44677734375, -13.6669921875, -12.88720703125, -12.107421875, -11.32763671875, -10.5478515625, -9.76806640625, -8.98828125, -8.20849609375, -7.4287109375, -6.64892578125, -5.869140625, -5.08935546875, -4.3095703125, -3.52978515625, -2.75, -1.97021484375, -1.1904296875, -0.41064453125, 0.369140625, 1.14892578125, 1.9287109375, 2.70849609375, 3.48828125, 4.26806640625, 5.0478515625, 5.82763671875, 6.607421875, 7.38720703125, 8.1669921875, 8.94677734375, 9.7265625, 10.50634765625, 11.2861328125, 12.06591796875, 12.845703125, 13.62548828125, 14.4052734375, 15.18505859375, 15.96484375, 16.74462890625, 17.5244140625, 18.30419921875, 19.083984375, 19.86376953125, 20.6435546875, 21.42333984375, 22.203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 10.0, 13.0, 12.0, 21.0, 22.0, 16.0, 15.0, 28.0, 24.0, 35.0, 29.0, 35.0, 43.0, 34.0, 52.0, 38.0, 45.0, 37.0, 44.0, 41.0, 45.0, 49.0, 45.0, 28.0, 27.0, 29.0, 22.0, 14.0, 19.0, 18.0, 19.0, 11.0, 12.0, 11.0, 8.0, 9.0, 6.0, 7.0, 4.0, 0.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.79559326171875, -5.6107177734375, -5.42584228515625, -5.240966796875, -5.05609130859375, -4.8712158203125, -4.68634033203125, -4.50146484375, -4.31658935546875, -4.1317138671875, -3.94683837890625, -3.761962890625, -3.57708740234375, -3.3922119140625, -3.20733642578125, -3.0224609375, -2.83758544921875, -2.6527099609375, -2.46783447265625, -2.282958984375, -2.09808349609375, -1.9132080078125, -1.72833251953125, -1.54345703125, -1.35858154296875, -1.1737060546875, -0.98883056640625, -0.803955078125, -0.61907958984375, -0.4342041015625, -0.24932861328125, -0.064453125, 0.12042236328125, 0.3052978515625, 0.49017333984375, 0.675048828125, 0.85992431640625, 1.0447998046875, 1.22967529296875, 1.41455078125, 1.59942626953125, 1.7843017578125, 1.96917724609375, 2.154052734375, 2.33892822265625, 2.5238037109375, 2.70867919921875, 2.8935546875, 3.07843017578125, 3.2633056640625, 3.44818115234375, 3.633056640625, 3.81793212890625, 4.0028076171875, 4.18768310546875, 4.37255859375, 4.55743408203125, 4.7423095703125, 4.92718505859375, 5.112060546875, 5.29693603515625, 5.4818115234375, 5.66668701171875, 5.8515625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 8.0, 3.0, 2.0, 4.0, 3.0, 12.0, 11.0, 13.0, 24.0, 21.0, 44.0, 57.0, 76.0, 111.0, 129.0, 212.0, 254.0, 399.0, 614.0, 900.0, 1261.0, 1837.0, 2755.0, 4360.0, 6861.0, 11031.0, 19325.0, 35062.0, 67905.0, 134879.0, 240356.0, 237161.0, 132465.0, 66318.0, 34541.0, 19108.0, 10954.0, 6591.0, 4291.0, 2729.0, 1797.0, 1224.0, 841.0, 583.0, 387.0, 277.0, 218.0, 165.0, 121.0, 66.0, 60.0, 39.0, 32.0, 18.0, 17.0, 14.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-6.671875, -6.4632568359375, -6.254638671875, -6.0460205078125, -5.83740234375, -5.6287841796875, -5.420166015625, -5.2115478515625, -5.0029296875, -4.7943115234375, -4.585693359375, -4.3770751953125, -4.16845703125, -3.9598388671875, -3.751220703125, -3.5426025390625, -3.333984375, -3.1253662109375, -2.916748046875, -2.7081298828125, -2.49951171875, -2.2908935546875, -2.082275390625, -1.8736572265625, -1.6650390625, -1.4564208984375, -1.247802734375, -1.0391845703125, -0.83056640625, -0.6219482421875, -0.413330078125, -0.2047119140625, 0.00390625, 0.2125244140625, 0.421142578125, 0.6297607421875, 0.83837890625, 1.0469970703125, 1.255615234375, 1.4642333984375, 1.6728515625, 1.8814697265625, 2.090087890625, 2.2987060546875, 2.50732421875, 2.7159423828125, 2.924560546875, 3.1331787109375, 3.341796875, 3.5504150390625, 3.759033203125, 3.9676513671875, 4.17626953125, 4.3848876953125, 4.593505859375, 4.8021240234375, 5.0107421875, 5.2193603515625, 5.427978515625, 5.6365966796875, 5.84521484375, 6.0538330078125, 6.262451171875, 6.4710693359375, 6.6796875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 6.0, 8.0, 11.0, 14.0, 20.0, 22.0, 30.0, 43.0, 75.0, 92.0, 93.0, 98.0, 115.0, 71.0, 69.0, 55.0, 47.0, 33.0, 19.0, 13.0, 13.0, 9.0, 6.0, 10.0, 4.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044727325439453125, -0.00043395906686782837, -0.0004206448793411255, -0.0004073306918144226, -0.0003940165042877197, -0.00038070231676101685, -0.00036738812923431396, -0.0003540739417076111, -0.0003407597541809082, -0.0003274455666542053, -0.00031413137912750244, -0.00030081719160079956, -0.0002875030040740967, -0.0002741888165473938, -0.0002608746290206909, -0.00024756044149398804, -0.00023424625396728516, -0.00022093206644058228, -0.0002076178789138794, -0.00019430369138717651, -0.00018098950386047363, -0.00016767531633377075, -0.00015436112880706787, -0.000141046941280365, -0.0001277327537536621, -0.00011441856622695923, -0.00010110437870025635, -8.779019117355347e-05, -7.447600364685059e-05, -6.11618161201477e-05, -4.7847628593444824e-05, -3.453344106674194e-05, -2.1219253540039062e-05, -7.905066013336182e-06, 5.409121513366699e-06, 1.872330904006958e-05, 3.203749656677246e-05, 4.535168409347534e-05, 5.866587162017822e-05, 7.19800591468811e-05, 8.529424667358398e-05, 9.860843420028687e-05, 0.00011192262172698975, 0.00012523680925369263, 0.0001385509967803955, 0.0001518651843070984, 0.00016517937183380127, 0.00017849355936050415, 0.00019180774688720703, 0.0002051219344139099, 0.0002184361219406128, 0.00023175030946731567, 0.00024506449699401855, 0.00025837868452072144, 0.0002716928720474243, 0.0002850070595741272, 0.0002983212471008301, 0.00031163543462753296, 0.00032494962215423584, 0.0003382638096809387, 0.0003515779972076416, 0.0003648921847343445, 0.00037820637226104736, 0.00039152055978775024, 0.0004048347473144531]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 19.0, 10.0, 21.0, 37.0, 48.0, 68.0, 98.0, 138.0, 249.0, 422.0, 649.0, 1106.0, 1869.0, 3178.0, 5576.0, 10281.0, 19984.0, 40492.0, 85818.0, 173048.0, 260451.0, 217306.0, 116015.0, 54510.0, 26711.0, 13590.0, 7106.0, 3923.0, 2201.0, 1383.0, 847.0, 505.0, 340.0, 194.0, 123.0, 80.0, 49.0, 38.0, 22.0, 16.0, 6.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9296875, -6.71112060546875, -6.4925537109375, -6.27398681640625, -6.055419921875, -5.83685302734375, -5.6182861328125, -5.39971923828125, -5.18115234375, -4.96258544921875, -4.7440185546875, -4.52545166015625, -4.306884765625, -4.08831787109375, -3.8697509765625, -3.65118408203125, -3.4326171875, -3.21405029296875, -2.9954833984375, -2.77691650390625, -2.558349609375, -2.33978271484375, -2.1212158203125, -1.90264892578125, -1.68408203125, -1.46551513671875, -1.2469482421875, -1.02838134765625, -0.809814453125, -0.59124755859375, -0.3726806640625, -0.15411376953125, 0.064453125, 0.28302001953125, 0.5015869140625, 0.72015380859375, 0.938720703125, 1.15728759765625, 1.3758544921875, 1.59442138671875, 1.81298828125, 2.03155517578125, 2.2501220703125, 2.46868896484375, 2.687255859375, 2.90582275390625, 3.1243896484375, 3.34295654296875, 3.5615234375, 3.78009033203125, 3.9986572265625, 4.21722412109375, 4.435791015625, 4.65435791015625, 4.8729248046875, 5.09149169921875, 5.31005859375, 5.52862548828125, 5.7471923828125, 5.96575927734375, 6.184326171875, 6.40289306640625, 6.6214599609375, 6.84002685546875, 7.05859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 6.0, 13.0, 4.0, 8.0, 5.0, 18.0, 19.0, 22.0, 21.0, 31.0, 38.0, 34.0, 67.0, 66.0, 62.0, 46.0, 64.0, 52.0, 47.0, 56.0, 42.0, 48.0, 32.0, 45.0, 27.0, 20.0, 10.0, 17.0, 16.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.384765625, -1.3418731689453125, -1.298980712890625, -1.2560882568359375, -1.21319580078125, -1.1703033447265625, -1.127410888671875, -1.0845184326171875, -1.0416259765625, -0.9987335205078125, -0.955841064453125, -0.9129486083984375, -0.87005615234375, -0.8271636962890625, -0.784271240234375, -0.7413787841796875, -0.698486328125, -0.6555938720703125, -0.612701416015625, -0.5698089599609375, -0.52691650390625, -0.4840240478515625, -0.441131591796875, -0.3982391357421875, -0.3553466796875, -0.3124542236328125, -0.269561767578125, -0.2266693115234375, -0.18377685546875, -0.1408843994140625, -0.097991943359375, -0.0550994873046875, -0.01220703125, 0.0306854248046875, 0.073577880859375, 0.1164703369140625, 0.15936279296875, 0.2022552490234375, 0.245147705078125, 0.2880401611328125, 0.3309326171875, 0.3738250732421875, 0.416717529296875, 0.4596099853515625, 0.50250244140625, 0.5453948974609375, 0.588287353515625, 0.6311798095703125, 0.674072265625, 0.7169647216796875, 0.759857177734375, 0.8027496337890625, 0.84564208984375, 0.8885345458984375, 0.931427001953125, 0.9743194580078125, 1.0172119140625, 1.0601043701171875, 1.102996826171875, 1.1458892822265625, 1.18878173828125, 1.2316741943359375, 1.274566650390625, 1.3174591064453125, 1.3603515625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 3.0, 13.0, 8.0, 10.0, 14.0, 21.0, 29.0, 37.0, 45.0, 51.0, 58.0, 81.0, 83.0, 77.0, 62.0, 71.0, 69.0, 53.0, 49.0, 36.0, 22.0, 23.0, 14.0, 11.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-25.621694564819336, -24.904603958129883, -24.18751335144043, -23.470422744750977, -22.753334045410156, -22.036243438720703, -21.31915283203125, -20.602062225341797, -19.884971618652344, -19.16788101196289, -18.450790405273438, -17.733699798583984, -17.01660919189453, -16.29952049255371, -15.582429885864258, -14.865339279174805, -14.148248672485352, -13.431158065795898, -12.714067459106445, -11.996977806091309, -11.279887199401855, -10.562796592712402, -9.845706939697266, -9.128616333007812, -8.41152572631836, -7.694435119628906, -6.977344989776611, -6.260254859924316, -5.543164253234863, -4.82607364654541, -4.108983516693115, -3.3918933868408203, -2.6748046875, -1.957714319229126, -1.240623950958252, -0.5235335826873779, 0.1935567855834961, 0.9106471538543701, 1.6277375221252441, 2.344827651977539, 3.061918258666992, 3.779008626937866, 4.49609899520874, 5.213189125061035, 5.930279731750488, 6.647370338439941, 7.364460468292236, 8.081550598144531, 8.798641204833984, 9.515731811523438, 10.23282241821289, 10.949912071228027, 11.66700267791748, 12.384093284606934, 13.10118293762207, 13.818273544311523, 14.535364151000977, 15.25245475769043, 15.969545364379883, 16.686635971069336, 17.403724670410156, 18.12081527709961, 18.837905883789062, 19.554996490478516, 20.27208709716797]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 6.0, 10.0, 8.0, 7.0, 12.0, 7.0, 24.0, 13.0, 13.0, 27.0, 31.0, 37.0, 38.0, 33.0, 36.0, 48.0, 36.0, 32.0, 40.0, 53.0, 46.0, 46.0, 46.0, 47.0, 36.0, 36.0, 31.0, 28.0, 25.0, 16.0, 22.0, 9.0, 20.0, 16.0, 18.0, 10.0, 9.0, 10.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.047958850860596, -6.774683952331543, -6.501409530639648, -6.228134632110596, -5.954859733581543, -5.68158483505249, -5.4083099365234375, -5.135035514831543, -4.86176061630249, -4.5884857177734375, -4.315211296081543, -4.04193639755249, -3.7686614990234375, -3.4953866004943848, -3.222111940383911, -2.9488372802734375, -2.6755623817443848, -2.402287483215332, -2.1290128231048584, -1.8557380437850952, -1.582463264465332, -1.3091884851455688, -1.0359137058258057, -0.7626389265060425, -0.4893641471862793, -0.2160893678665161, 0.05718541145324707, 0.33046019077301025, 0.6037349700927734, 0.8770097494125366, 1.1502845287322998, 1.423559308052063, 1.6968345642089844, 1.9701093435287476, 2.2433841228485107, 2.5166587829589844, 2.789933681488037, 3.06320858001709, 3.3364832401275635, 3.609757900238037, 3.88303279876709, 4.156307697296143, 4.429582595825195, 4.70285701751709, 4.976131916046143, 5.249406814575195, 5.52268123626709, 5.795956134796143, 6.069231033325195, 6.342505931854248, 6.615780830383301, 6.889055252075195, 7.162330150604248, 7.435605049133301, 7.708879470825195, 7.982154369354248, 8.2554292678833, 8.528703689575195, 8.801979064941406, 9.0752534866333, 9.348527908325195, 9.621803283691406, 9.8950777053833, 10.168353080749512, 10.441627502441406]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 12.0, 18.0, 22.0, 23.0, 42.0, 61.0, 94.0, 154.0, 230.0, 380.0, 624.0, 896.0, 1578.0, 2601.0, 4664.0, 7887.0, 14002.0, 24700.0, 43223.0, 72982.0, 115304.0, 158621.0, 175972.0, 153260.0, 109188.0, 68729.0, 39911.0, 22630.0, 12879.0, 7380.0, 4261.0, 2460.0, 1419.0, 868.0, 546.0, 321.0, 186.0, 123.0, 113.0, 54.0, 34.0, 27.0, 25.0, 12.0, 10.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.890625, -12.48046875, -12.0703125, -11.66015625, -11.25, -10.83984375, -10.4296875, -10.01953125, -9.609375, -9.19921875, -8.7890625, -8.37890625, -7.96875, -7.55859375, -7.1484375, -6.73828125, -6.328125, -5.91796875, -5.5078125, -5.09765625, -4.6875, -4.27734375, -3.8671875, -3.45703125, -3.046875, -2.63671875, -2.2265625, -1.81640625, -1.40625, -0.99609375, -0.5859375, -0.17578125, 0.234375, 0.64453125, 1.0546875, 1.46484375, 1.875, 2.28515625, 2.6953125, 3.10546875, 3.515625, 3.92578125, 4.3359375, 4.74609375, 5.15625, 5.56640625, 5.9765625, 6.38671875, 6.796875, 7.20703125, 7.6171875, 8.02734375, 8.4375, 8.84765625, 9.2578125, 9.66796875, 10.078125, 10.48828125, 10.8984375, 11.30859375, 11.71875, 12.12890625, 12.5390625, 12.94921875, 13.359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 1.0, 9.0, 10.0, 9.0, 7.0, 14.0, 16.0, 23.0, 25.0, 17.0, 36.0, 44.0, 40.0, 35.0, 36.0, 52.0, 39.0, 47.0, 49.0, 39.0, 39.0, 45.0, 47.0, 34.0, 43.0, 27.0, 34.0, 20.0, 25.0, 18.0, 16.0, 19.0, 13.0, 11.0, 13.0, 6.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0859375, -9.7691650390625, -9.452392578125, -9.1356201171875, -8.81884765625, -8.5020751953125, -8.185302734375, -7.8685302734375, -7.5517578125, -7.2349853515625, -6.918212890625, -6.6014404296875, -6.28466796875, -5.9678955078125, -5.651123046875, -5.3343505859375, -5.017578125, -4.7008056640625, -4.384033203125, -4.0672607421875, -3.75048828125, -3.4337158203125, -3.116943359375, -2.8001708984375, -2.4833984375, -2.1666259765625, -1.849853515625, -1.5330810546875, -1.21630859375, -0.8995361328125, -0.582763671875, -0.2659912109375, 0.05078125, 0.3675537109375, 0.684326171875, 1.0010986328125, 1.31787109375, 1.6346435546875, 1.951416015625, 2.2681884765625, 2.5849609375, 2.9017333984375, 3.218505859375, 3.5352783203125, 3.85205078125, 4.1688232421875, 4.485595703125, 4.8023681640625, 5.119140625, 5.4359130859375, 5.752685546875, 6.0694580078125, 6.38623046875, 6.7030029296875, 7.019775390625, 7.3365478515625, 7.6533203125, 7.9700927734375, 8.286865234375, 8.6036376953125, 8.92041015625, 9.2371826171875, 9.553955078125, 9.8707275390625, 10.1875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 12.0, 13.0, 36.0, 36.0, 62.0, 89.0, 152.0, 237.0, 419.0, 803.0, 1493.0, 2840.0, 5695.0, 11663.0, 24566.0, 49306.0, 95149.0, 159970.0, 210294.0, 197395.0, 135392.0, 76441.0, 39094.0, 18982.0, 8997.0, 4539.0, 2218.0, 1095.0, 614.0, 350.0, 199.0, 123.0, 99.0, 46.0, 36.0, 22.0, 25.0, 9.0, 14.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.6640625, -15.1558837890625, -14.647705078125, -14.1395263671875, -13.63134765625, -13.1231689453125, -12.614990234375, -12.1068115234375, -11.5986328125, -11.0904541015625, -10.582275390625, -10.0740966796875, -9.56591796875, -9.0577392578125, -8.549560546875, -8.0413818359375, -7.533203125, -7.0250244140625, -6.516845703125, -6.0086669921875, -5.50048828125, -4.9923095703125, -4.484130859375, -3.9759521484375, -3.4677734375, -2.9595947265625, -2.451416015625, -1.9432373046875, -1.43505859375, -0.9268798828125, -0.418701171875, 0.0894775390625, 0.59765625, 1.1058349609375, 1.614013671875, 2.1221923828125, 2.63037109375, 3.1385498046875, 3.646728515625, 4.1549072265625, 4.6630859375, 5.1712646484375, 5.679443359375, 6.1876220703125, 6.69580078125, 7.2039794921875, 7.712158203125, 8.2203369140625, 8.728515625, 9.2366943359375, 9.744873046875, 10.2530517578125, 10.76123046875, 11.2694091796875, 11.777587890625, 12.2857666015625, 12.7939453125, 13.3021240234375, 13.810302734375, 14.3184814453125, 14.82666015625, 15.3348388671875, 15.843017578125, 16.3511962890625, 16.859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 12.0, 6.0, 23.0, 17.0, 24.0, 13.0, 20.0, 31.0, 35.0, 31.0, 33.0, 25.0, 38.0, 28.0, 39.0, 40.0, 38.0, 36.0, 41.0, 38.0, 40.0, 45.0, 44.0, 37.0, 28.0, 35.0, 31.0, 19.0, 21.0, 12.0, 14.0, 13.0, 9.0, 6.0, 15.0, 7.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.4765625, -4.296875, -4.1171875, -3.9375, -3.7578125, -3.578125, -3.3984375, -3.21875, -3.0390625, -2.859375, -2.6796875, -2.5, -2.3203125, -2.140625, -1.9609375, -1.78125, -1.6015625, -1.421875, -1.2421875, -1.0625, -0.8828125, -0.703125, -0.5234375, -0.34375, -0.1640625, 0.015625, 0.1953125, 0.375, 0.5546875, 0.734375, 0.9140625, 1.09375, 1.2734375, 1.453125, 1.6328125, 1.8125, 1.9921875, 2.171875, 2.3515625, 2.53125, 2.7109375, 2.890625, 3.0703125, 3.25, 3.4296875, 3.609375, 3.7890625, 3.96875, 4.1484375, 4.328125, 4.5078125, 4.6875, 4.8671875, 5.046875, 5.2265625, 5.40625, 5.5859375, 5.765625, 5.9453125, 6.125, 6.3046875, 6.484375, 6.6640625, 6.84375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 9.0, 23.0, 16.0, 26.0, 53.0, 58.0, 81.0, 95.0, 165.0, 220.0, 318.0, 510.0, 890.0, 1581.0, 2897.0, 5876.0, 13263.0, 31685.0, 80812.0, 186615.0, 295145.0, 236329.0, 112411.0, 44919.0, 18025.0, 7713.0, 3820.0, 2031.0, 1094.0, 626.0, 373.0, 273.0, 151.0, 129.0, 88.0, 61.0, 39.0, 27.0, 21.0, 14.0, 13.0, 14.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-10.15625, -9.854736328125, -9.55322265625, -9.251708984375, -8.9501953125, -8.648681640625, -8.34716796875, -8.045654296875, -7.744140625, -7.442626953125, -7.14111328125, -6.839599609375, -6.5380859375, -6.236572265625, -5.93505859375, -5.633544921875, -5.33203125, -5.030517578125, -4.72900390625, -4.427490234375, -4.1259765625, -3.824462890625, -3.52294921875, -3.221435546875, -2.919921875, -2.618408203125, -2.31689453125, -2.015380859375, -1.7138671875, -1.412353515625, -1.11083984375, -0.809326171875, -0.5078125, -0.206298828125, 0.09521484375, 0.396728515625, 0.6982421875, 0.999755859375, 1.30126953125, 1.602783203125, 1.904296875, 2.205810546875, 2.50732421875, 2.808837890625, 3.1103515625, 3.411865234375, 3.71337890625, 4.014892578125, 4.31640625, 4.617919921875, 4.91943359375, 5.220947265625, 5.5224609375, 5.823974609375, 6.12548828125, 6.427001953125, 6.728515625, 7.030029296875, 7.33154296875, 7.633056640625, 7.9345703125, 8.236083984375, 8.53759765625, 8.839111328125, 9.140625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 7.0, 7.0, 12.0, 12.0, 29.0, 23.0, 29.0, 29.0, 36.0, 37.0, 45.0, 54.0, 60.0, 57.0, 62.0, 49.0, 55.0, 52.0, 56.0, 44.0, 43.0, 31.0, 33.0, 22.0, 20.0, 16.0, 10.0, 15.0, 14.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004963874816894531, -0.00047941505908966064, -0.00046244263648986816, -0.0004454702138900757, -0.0004284977912902832, -0.0004115253686904907, -0.00039455294609069824, -0.00037758052349090576, -0.0003606081008911133, -0.0003436356782913208, -0.0003266632556915283, -0.00030969083309173584, -0.00029271841049194336, -0.0002757459878921509, -0.0002587735652923584, -0.00024180114269256592, -0.00022482872009277344, -0.00020785629749298096, -0.00019088387489318848, -0.000173911452293396, -0.00015693902969360352, -0.00013996660709381104, -0.00012299418449401855, -0.00010602176189422607, -8.90493392944336e-05, -7.207691669464111e-05, -5.510449409484863e-05, -3.813207149505615e-05, -2.1159648895263672e-05, -4.187226295471191e-06, 1.2785196304321289e-05, 2.975761890411377e-05, 4.673004150390625e-05, 6.370246410369873e-05, 8.067488670349121e-05, 9.764730930328369e-05, 0.00011461973190307617, 0.00013159215450286865, 0.00014856457710266113, 0.0001655369997024536, 0.0001825094223022461, 0.00019948184490203857, 0.00021645426750183105, 0.00023342669010162354, 0.000250399112701416, 0.0002673715353012085, 0.000284343957901001, 0.00030131638050079346, 0.00031828880310058594, 0.0003352612257003784, 0.0003522336483001709, 0.0003692060708999634, 0.00038617849349975586, 0.00040315091609954834, 0.0004201233386993408, 0.0004370957612991333, 0.0004540681838989258, 0.00047104060649871826, 0.00048801302909851074, 0.0005049854516983032, 0.0005219578742980957, 0.0005389302968978882, 0.0005559027194976807, 0.0005728751420974731, 0.0005898475646972656]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 9.0, 2.0, 7.0, 8.0, 9.0, 16.0, 13.0, 18.0, 38.0, 49.0, 75.0, 107.0, 140.0, 211.0, 309.0, 510.0, 748.0, 1178.0, 1964.0, 3369.0, 6126.0, 10828.0, 20216.0, 37614.0, 67563.0, 114816.0, 168142.0, 193541.0, 165033.0, 110730.0, 65062.0, 35953.0, 19425.0, 10432.0, 5773.0, 3281.0, 1995.0, 1130.0, 725.0, 448.0, 294.0, 199.0, 139.0, 92.0, 66.0, 40.0, 29.0, 31.0, 18.0, 11.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.734375, -5.5521240234375, -5.369873046875, -5.1876220703125, -5.00537109375, -4.8231201171875, -4.640869140625, -4.4586181640625, -4.2763671875, -4.0941162109375, -3.911865234375, -3.7296142578125, -3.54736328125, -3.3651123046875, -3.182861328125, -3.0006103515625, -2.818359375, -2.6361083984375, -2.453857421875, -2.2716064453125, -2.08935546875, -1.9071044921875, -1.724853515625, -1.5426025390625, -1.3603515625, -1.1781005859375, -0.995849609375, -0.8135986328125, -0.63134765625, -0.4490966796875, -0.266845703125, -0.0845947265625, 0.09765625, 0.2799072265625, 0.462158203125, 0.6444091796875, 0.82666015625, 1.0089111328125, 1.191162109375, 1.3734130859375, 1.5556640625, 1.7379150390625, 1.920166015625, 2.1024169921875, 2.28466796875, 2.4669189453125, 2.649169921875, 2.8314208984375, 3.013671875, 3.1959228515625, 3.378173828125, 3.5604248046875, 3.74267578125, 3.9249267578125, 4.107177734375, 4.2894287109375, 4.4716796875, 4.6539306640625, 4.836181640625, 5.0184326171875, 5.20068359375, 5.3829345703125, 5.565185546875, 5.7474365234375, 5.9296875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 14.0, 9.0, 19.0, 20.0, 23.0, 33.0, 42.0, 40.0, 56.0, 69.0, 60.0, 79.0, 70.0, 76.0, 55.0, 46.0, 57.0, 43.0, 43.0, 37.0, 21.0, 18.0, 5.0, 15.0, 10.0, 3.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8626861572265625, -1.800567626953125, -1.7384490966796875, -1.67633056640625, -1.6142120361328125, -1.552093505859375, -1.4899749755859375, -1.4278564453125, -1.3657379150390625, -1.303619384765625, -1.2415008544921875, -1.17938232421875, -1.1172637939453125, -1.055145263671875, -0.9930267333984375, -0.930908203125, -0.8687896728515625, -0.806671142578125, -0.7445526123046875, -0.68243408203125, -0.6203155517578125, -0.558197021484375, -0.4960784912109375, -0.4339599609375, -0.3718414306640625, -0.309722900390625, -0.2476043701171875, -0.18548583984375, -0.1233673095703125, -0.061248779296875, 0.0008697509765625, 0.06298828125, 0.1251068115234375, 0.187225341796875, 0.2493438720703125, 0.31146240234375, 0.3735809326171875, 0.435699462890625, 0.4978179931640625, 0.5599365234375, 0.6220550537109375, 0.684173583984375, 0.7462921142578125, 0.80841064453125, 0.8705291748046875, 0.932647705078125, 0.9947662353515625, 1.056884765625, 1.1190032958984375, 1.181121826171875, 1.2432403564453125, 1.30535888671875, 1.3674774169921875, 1.429595947265625, 1.4917144775390625, 1.5538330078125, 1.6159515380859375, 1.678070068359375, 1.7401885986328125, 1.80230712890625, 1.8644256591796875, 1.926544189453125, 1.9886627197265625, 2.05078125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 9.0, 3.0, 10.0, 10.0, 16.0, 16.0, 21.0, 28.0, 46.0, 50.0, 63.0, 74.0, 93.0, 79.0, 96.0, 64.0, 71.0, 66.0, 31.0, 36.0, 31.0, 27.0, 9.0, 12.0, 13.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.34234046936035, -26.557292938232422, -25.772245407104492, -24.987197875976562, -24.202150344848633, -23.417102813720703, -22.63205337524414, -21.847007751464844, -21.06195831298828, -20.27691078186035, -19.491863250732422, -18.706815719604492, -17.921768188476562, -17.136720657348633, -16.351673126220703, -15.566624641418457, -14.781578063964844, -13.996530532836914, -13.211483001708984, -12.426435470581055, -11.641387939453125, -10.856340408325195, -10.07129192352295, -9.28624439239502, -8.50119686126709, -7.71614933013916, -6.9311017990112305, -6.146053791046143, -5.361006259918213, -4.575958728790283, -3.7909107208251953, -3.0058631896972656, -2.220815658569336, -1.4357680082321167, -0.6507203578948975, 0.13432741165161133, 0.919374942779541, 1.7044224739074707, 2.4894704818725586, 3.2745180130004883, 4.059565544128418, 4.844613075256348, 5.629660606384277, 6.414708614349365, 7.199756145477295, 7.984803676605225, 8.769851684570312, 9.554899215698242, 10.339946746826172, 11.124994277954102, 11.910041809082031, 12.695089340209961, 13.48013687133789, 14.26518440246582, 15.050232887268066, 15.835280418395996, 16.62032699584961, 17.40537452697754, 18.19042205810547, 18.9754695892334, 19.760517120361328, 20.545564651489258, 21.330612182617188, 22.11566162109375, 22.90070915222168]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 11.0, 12.0, 13.0, 13.0, 8.0, 23.0, 20.0, 20.0, 25.0, 23.0, 29.0, 40.0, 32.0, 52.0, 43.0, 38.0, 32.0, 46.0, 63.0, 42.0, 36.0, 40.0, 41.0, 46.0, 32.0, 34.0, 26.0, 28.0, 18.0, 22.0, 10.0, 6.0, 14.0, 15.0, 14.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.717850208282471, -7.419209957122803, -7.120569705963135, -6.821929454803467, -6.523289203643799, -6.224648952484131, -5.926008701324463, -5.627368450164795, -5.328728199005127, -5.030087947845459, -4.731447696685791, -4.432807445526123, -4.134167194366455, -3.835526943206787, -3.536886692047119, -3.238246440887451, -2.939606189727783, -2.6409659385681152, -2.3423256874084473, -2.0436854362487793, -1.7450451850891113, -1.4464049339294434, -1.1477646827697754, -0.8491244316101074, -0.5504841804504395, -0.2518439292907715, 0.046796321868896484, 0.34543657302856445, 0.6440768241882324, 0.9427170753479004, 1.2413573265075684, 1.5399975776672363, 1.838637351989746, 2.137277603149414, 2.435917854309082, 2.73455810546875, 3.033198356628418, 3.331838607788086, 3.630478858947754, 3.929119110107422, 4.22775936126709, 4.526399612426758, 4.825039863586426, 5.123680114746094, 5.422320365905762, 5.72096061706543, 6.019600868225098, 6.318241119384766, 6.616881370544434, 6.915521621704102, 7.2141618728637695, 7.5128021240234375, 7.8114423751831055, 8.110082626342773, 8.408722877502441, 8.70736312866211, 9.006003379821777, 9.304643630981445, 9.603283882141113, 9.901924133300781, 10.20056438446045, 10.499204635620117, 10.797844886779785, 11.096485137939453, 11.395125389099121]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 10.0, 10.0, 19.0, 26.0, 40.0, 60.0, 95.0, 155.0, 223.0, 413.0, 637.0, 1182.0, 1927.0, 3337.0, 6259.0, 12609.0, 25167.0, 52574.0, 117310.0, 278734.0, 690717.0, 1276717.0, 981621.0, 420102.0, 173308.0, 77183.0, 35898.0, 17722.0, 9130.0, 4725.0, 2657.0, 1511.0, 859.0, 499.0, 319.0, 184.0, 131.0, 69.0, 50.0, 30.0, 19.0, 13.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.671875, -18.064208984375, -17.45654296875, -16.848876953125, -16.2412109375, -15.633544921875, -15.02587890625, -14.418212890625, -13.810546875, -13.202880859375, -12.59521484375, -11.987548828125, -11.3798828125, -10.772216796875, -10.16455078125, -9.556884765625, -8.94921875, -8.341552734375, -7.73388671875, -7.126220703125, -6.5185546875, -5.910888671875, -5.30322265625, -4.695556640625, -4.087890625, -3.480224609375, -2.87255859375, -2.264892578125, -1.6572265625, -1.049560546875, -0.44189453125, 0.165771484375, 0.7734375, 1.381103515625, 1.98876953125, 2.596435546875, 3.2041015625, 3.811767578125, 4.41943359375, 5.027099609375, 5.634765625, 6.242431640625, 6.85009765625, 7.457763671875, 8.0654296875, 8.673095703125, 9.28076171875, 9.888427734375, 10.49609375, 11.103759765625, 11.71142578125, 12.319091796875, 12.9267578125, 13.534423828125, 14.14208984375, 14.749755859375, 15.357421875, 15.965087890625, 16.57275390625, 17.180419921875, 17.7880859375, 18.395751953125, 19.00341796875, 19.611083984375, 20.21875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 12.0, 7.0, 13.0, 7.0, 13.0, 20.0, 17.0, 21.0, 27.0, 30.0, 24.0, 27.0, 37.0, 29.0, 41.0, 44.0, 48.0, 50.0, 41.0, 35.0, 52.0, 46.0, 33.0, 43.0, 48.0, 32.0, 33.0, 25.0, 20.0, 21.0, 21.0, 12.0, 13.0, 16.0, 11.0, 9.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.9002685546875, -5.675537109375, -5.4508056640625, -5.22607421875, -5.0013427734375, -4.776611328125, -4.5518798828125, -4.3271484375, -4.1024169921875, -3.877685546875, -3.6529541015625, -3.42822265625, -3.2034912109375, -2.978759765625, -2.7540283203125, -2.529296875, -2.3045654296875, -2.079833984375, -1.8551025390625, -1.63037109375, -1.4056396484375, -1.180908203125, -0.9561767578125, -0.7314453125, -0.5067138671875, -0.281982421875, -0.0572509765625, 0.16748046875, 0.3922119140625, 0.616943359375, 0.8416748046875, 1.06640625, 1.2911376953125, 1.515869140625, 1.7406005859375, 1.96533203125, 2.1900634765625, 2.414794921875, 2.6395263671875, 2.8642578125, 3.0889892578125, 3.313720703125, 3.5384521484375, 3.76318359375, 3.9879150390625, 4.212646484375, 4.4373779296875, 4.662109375, 4.8868408203125, 5.111572265625, 5.3363037109375, 5.56103515625, 5.7857666015625, 6.010498046875, 6.2352294921875, 6.4599609375, 6.6846923828125, 6.909423828125, 7.1341552734375, 7.35888671875, 7.5836181640625, 7.808349609375, 8.0330810546875, 8.2578125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 14.0, 16.0, 19.0, 50.0, 73.0, 98.0, 178.0, 226.0, 390.0, 611.0, 1036.0, 1723.0, 2951.0, 5233.0, 9068.0, 15928.0, 28858.0, 53743.0, 102391.0, 197687.0, 382617.0, 694030.0, 959245.0, 785904.0, 453863.0, 235495.0, 121026.0, 63869.0, 33960.0, 18675.0, 10674.0, 6126.0, 3440.0, 1995.0, 1168.0, 722.0, 428.0, 270.0, 188.0, 100.0, 66.0, 43.0, 29.0, 13.0, 14.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.024658203125, -15.51806640625, -15.011474609375, -14.5048828125, -13.998291015625, -13.49169921875, -12.985107421875, -12.478515625, -11.971923828125, -11.46533203125, -10.958740234375, -10.4521484375, -9.945556640625, -9.43896484375, -8.932373046875, -8.42578125, -7.919189453125, -7.41259765625, -6.906005859375, -6.3994140625, -5.892822265625, -5.38623046875, -4.879638671875, -4.373046875, -3.866455078125, -3.35986328125, -2.853271484375, -2.3466796875, -1.840087890625, -1.33349609375, -0.826904296875, -0.3203125, 0.186279296875, 0.69287109375, 1.199462890625, 1.7060546875, 2.212646484375, 2.71923828125, 3.225830078125, 3.732421875, 4.239013671875, 4.74560546875, 5.252197265625, 5.7587890625, 6.265380859375, 6.77197265625, 7.278564453125, 7.78515625, 8.291748046875, 8.79833984375, 9.304931640625, 9.8115234375, 10.318115234375, 10.82470703125, 11.331298828125, 11.837890625, 12.344482421875, 12.85107421875, 13.357666015625, 13.8642578125, 14.370849609375, 14.87744140625, 15.384033203125, 15.890625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 23.0, 25.0, 33.0, 52.0, 62.0, 62.0, 87.0, 112.0, 127.0, 186.0, 206.0, 241.0, 265.0, 297.0, 274.0, 304.0, 276.0, 242.0, 215.0, 196.0, 161.0, 137.0, 127.0, 75.0, 69.0, 55.0, 31.0, 25.0, 21.0, 21.0, 10.0, 13.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.82391357421875, -4.6673583984375, -4.51080322265625, -4.354248046875, -4.19769287109375, -4.0411376953125, -3.88458251953125, -3.72802734375, -3.57147216796875, -3.4149169921875, -3.25836181640625, -3.101806640625, -2.94525146484375, -2.7886962890625, -2.63214111328125, -2.4755859375, -2.31903076171875, -2.1624755859375, -2.00592041015625, -1.849365234375, -1.69281005859375, -1.5362548828125, -1.37969970703125, -1.22314453125, -1.06658935546875, -0.9100341796875, -0.75347900390625, -0.596923828125, -0.44036865234375, -0.2838134765625, -0.12725830078125, 0.029296875, 0.18585205078125, 0.3424072265625, 0.49896240234375, 0.655517578125, 0.81207275390625, 0.9686279296875, 1.12518310546875, 1.28173828125, 1.43829345703125, 1.5948486328125, 1.75140380859375, 1.907958984375, 2.06451416015625, 2.2210693359375, 2.37762451171875, 2.5341796875, 2.69073486328125, 2.8472900390625, 3.00384521484375, 3.160400390625, 3.31695556640625, 3.4735107421875, 3.63006591796875, 3.78662109375, 3.94317626953125, 4.0997314453125, 4.25628662109375, 4.412841796875, 4.56939697265625, 4.7259521484375, 4.88250732421875, 5.0390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 13.0, 12.0, 23.0, 42.0, 46.0, 49.0, 63.0, 70.0, 68.0, 75.0, 87.0, 92.0, 64.0, 46.0, 46.0, 46.0, 34.0, 18.0, 20.0, 12.0, 15.0, 10.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.599149703979492, -23.857467651367188, -23.11578369140625, -22.374101638793945, -21.63241958618164, -20.890735626220703, -20.1490535736084, -19.407371520996094, -18.665687561035156, -17.92400550842285, -17.182321548461914, -16.44063949584961, -15.698956489562988, -14.957273483276367, -14.215591430664062, -13.473908424377441, -12.73222541809082, -11.9905424118042, -11.248859405517578, -10.507177352905273, -9.765494346618652, -9.023811340332031, -8.282129287719727, -7.5404462814331055, -6.798763275146484, -6.057080268859863, -5.3153977394104, -4.5737152099609375, -3.8320322036743164, -3.0903494358062744, -2.3486666679382324, -1.6069841384887695, -0.8652992248535156, -0.12361645698547363, 0.6180663108825684, 1.3597490787506104, 2.1014318466186523, 2.8431146144866943, 3.5847973823547363, 4.326479911804199, 5.06816291809082, 5.809845924377441, 6.551528453826904, 7.293210983276367, 8.034893989562988, 8.77657699584961, 9.518259048461914, 10.259942054748535, 11.001625061035156, 11.743308067321777, 12.484991073608398, 13.226673126220703, 13.968356132507324, 14.710039138793945, 15.45172119140625, 16.193405151367188, 16.935087203979492, 17.676769256591797, 18.418453216552734, 19.16013526916504, 19.901817321777344, 20.64350128173828, 21.385183334350586, 22.12686538696289, 22.868549346923828]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 12.0, 14.0, 11.0, 23.0, 19.0, 24.0, 31.0, 33.0, 30.0, 36.0, 32.0, 36.0, 45.0, 43.0, 49.0, 41.0, 38.0, 43.0, 38.0, 35.0, 46.0, 35.0, 25.0, 39.0, 28.0, 29.0, 28.0, 13.0, 14.0, 12.0, 15.0, 14.0, 10.0, 7.0, 6.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.250918388366699, -6.986877918243408, -6.722837924957275, -6.458797454833984, -6.194757461547852, -5.9307169914245605, -5.6666765213012695, -5.402636528015137, -5.138596057891846, -4.874555587768555, -4.610515594482422, -4.346475124359131, -4.08243465423584, -3.818394660949707, -3.554354190826416, -3.290313959121704, -3.026273727416992, -2.7622334957122803, -2.4981932640075684, -2.2341527938842773, -1.9701125621795654, -1.7060723304748535, -1.442031979560852, -1.1779916286468506, -0.9139513969421387, -0.649911105632782, -0.3858708143234253, -0.1218305230140686, 0.14220976829528809, 0.40625, 0.6702903509140015, 0.9343307018280029, 1.1983709335327148, 1.4624111652374268, 1.7264515161514282, 1.9904918670654297, 2.2545320987701416, 2.5185723304748535, 2.7826128005981445, 3.0466530323028564, 3.3106932640075684, 3.5747334957122803, 3.838773727416992, 4.102814197540283, 4.366854667663574, 4.630894660949707, 4.894935131072998, 5.158975601196289, 5.423015594482422, 5.687056064605713, 5.951096057891846, 6.215136528015137, 6.4791765213012695, 6.7432169914245605, 7.007257461547852, 7.271297454833984, 7.535337924957275, 7.799378395080566, 8.0634183883667, 8.327458381652832, 8.591499328613281, 8.855539321899414, 9.119579315185547, 9.383620262145996, 9.647660255432129]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 12.0, 23.0, 35.0, 33.0, 71.0, 100.0, 156.0, 265.0, 398.0, 658.0, 1006.0, 1662.0, 2859.0, 4652.0, 7814.0, 13232.0, 22623.0, 38257.0, 63084.0, 99364.0, 138930.0, 164313.0, 156854.0, 122564.0, 82549.0, 51940.0, 30649.0, 18110.0, 10438.0, 6334.0, 3639.0, 2228.0, 1350.0, 845.0, 539.0, 308.0, 216.0, 159.0, 85.0, 69.0, 46.0, 26.0, 32.0, 5.0, 9.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.560791015625, -6.32470703125, -6.088623046875, -5.8525390625, -5.616455078125, -5.38037109375, -5.144287109375, -4.908203125, -4.672119140625, -4.43603515625, -4.199951171875, -3.9638671875, -3.727783203125, -3.49169921875, -3.255615234375, -3.01953125, -2.783447265625, -2.54736328125, -2.311279296875, -2.0751953125, -1.839111328125, -1.60302734375, -1.366943359375, -1.130859375, -0.894775390625, -0.65869140625, -0.422607421875, -0.1865234375, 0.049560546875, 0.28564453125, 0.521728515625, 0.7578125, 0.993896484375, 1.22998046875, 1.466064453125, 1.7021484375, 1.938232421875, 2.17431640625, 2.410400390625, 2.646484375, 2.882568359375, 3.11865234375, 3.354736328125, 3.5908203125, 3.826904296875, 4.06298828125, 4.299072265625, 4.53515625, 4.771240234375, 5.00732421875, 5.243408203125, 5.4794921875, 5.715576171875, 5.95166015625, 6.187744140625, 6.423828125, 6.659912109375, 6.89599609375, 7.132080078125, 7.3681640625, 7.604248046875, 7.84033203125, 8.076416015625, 8.3125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 11.0, 14.0, 21.0, 26.0, 22.0, 26.0, 28.0, 32.0, 49.0, 34.0, 44.0, 48.0, 48.0, 47.0, 34.0, 58.0, 57.0, 46.0, 46.0, 39.0, 34.0, 34.0, 22.0, 28.0, 21.0, 17.0, 17.0, 20.0, 11.0, 5.0, 6.0, 11.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.9765625, -8.6484375, -8.3203125, -7.9921875, -7.6640625, -7.3359375, -7.0078125, -6.6796875, -6.3515625, -6.0234375, -5.6953125, -5.3671875, -5.0390625, -4.7109375, -4.3828125, -4.0546875, -3.7265625, -3.3984375, -3.0703125, -2.7421875, -2.4140625, -2.0859375, -1.7578125, -1.4296875, -1.1015625, -0.7734375, -0.4453125, -0.1171875, 0.2109375, 0.5390625, 0.8671875, 1.1953125, 1.5234375, 1.8515625, 2.1796875, 2.5078125, 2.8359375, 3.1640625, 3.4921875, 3.8203125, 4.1484375, 4.4765625, 4.8046875, 5.1328125, 5.4609375, 5.7890625, 6.1171875, 6.4453125, 6.7734375, 7.1015625, 7.4296875, 7.7578125, 8.0859375, 8.4140625, 8.7421875, 9.0703125, 9.3984375, 9.7265625, 10.0546875, 10.3828125, 10.7109375, 11.0390625, 11.3671875, 11.6953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 9.0, 22.0, 18.0, 30.0, 58.0, 79.0, 116.0, 172.0, 261.0, 363.0, 522.0, 853.0, 1271.0, 2013.0, 3348.0, 5513.0, 9028.0, 15156.0, 25262.0, 43311.0, 72413.0, 116794.0, 168501.0, 187242.0, 149228.0, 98188.0, 60020.0, 35883.0, 20650.0, 12379.0, 7545.0, 4644.0, 2745.0, 1803.0, 1110.0, 663.0, 412.0, 285.0, 215.0, 120.0, 92.0, 69.0, 41.0, 32.0, 22.0, 13.0, 15.0, 6.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-8.9140625, -8.63818359375, -8.3623046875, -8.08642578125, -7.810546875, -7.53466796875, -7.2587890625, -6.98291015625, -6.70703125, -6.43115234375, -6.1552734375, -5.87939453125, -5.603515625, -5.32763671875, -5.0517578125, -4.77587890625, -4.5, -4.22412109375, -3.9482421875, -3.67236328125, -3.396484375, -3.12060546875, -2.8447265625, -2.56884765625, -2.29296875, -2.01708984375, -1.7412109375, -1.46533203125, -1.189453125, -0.91357421875, -0.6376953125, -0.36181640625, -0.0859375, 0.18994140625, 0.4658203125, 0.74169921875, 1.017578125, 1.29345703125, 1.5693359375, 1.84521484375, 2.12109375, 2.39697265625, 2.6728515625, 2.94873046875, 3.224609375, 3.50048828125, 3.7763671875, 4.05224609375, 4.328125, 4.60400390625, 4.8798828125, 5.15576171875, 5.431640625, 5.70751953125, 5.9833984375, 6.25927734375, 6.53515625, 6.81103515625, 7.0869140625, 7.36279296875, 7.638671875, 7.91455078125, 8.1904296875, 8.46630859375, 8.7421875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 4.0, 11.0, 14.0, 14.0, 15.0, 18.0, 20.0, 21.0, 27.0, 29.0, 28.0, 41.0, 26.0, 38.0, 45.0, 45.0, 38.0, 38.0, 49.0, 44.0, 41.0, 39.0, 46.0, 42.0, 32.0, 35.0, 24.0, 25.0, 21.0, 25.0, 17.0, 12.0, 12.0, 13.0, 9.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.74652099609375, -4.5711669921875, -4.39581298828125, -4.220458984375, -4.04510498046875, -3.8697509765625, -3.69439697265625, -3.51904296875, -3.34368896484375, -3.1683349609375, -2.99298095703125, -2.817626953125, -2.64227294921875, -2.4669189453125, -2.29156494140625, -2.1162109375, -1.94085693359375, -1.7655029296875, -1.59014892578125, -1.414794921875, -1.23944091796875, -1.0640869140625, -0.88873291015625, -0.71337890625, -0.53802490234375, -0.3626708984375, -0.18731689453125, -0.011962890625, 0.16339111328125, 0.3387451171875, 0.51409912109375, 0.689453125, 0.86480712890625, 1.0401611328125, 1.21551513671875, 1.390869140625, 1.56622314453125, 1.7415771484375, 1.91693115234375, 2.09228515625, 2.26763916015625, 2.4429931640625, 2.61834716796875, 2.793701171875, 2.96905517578125, 3.1444091796875, 3.31976318359375, 3.4951171875, 3.67047119140625, 3.8458251953125, 4.02117919921875, 4.196533203125, 4.37188720703125, 4.5472412109375, 4.72259521484375, 4.89794921875, 5.07330322265625, 5.2486572265625, 5.42401123046875, 5.599365234375, 5.77471923828125, 5.9500732421875, 6.12542724609375, 6.30078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 16.0, 15.0, 22.0, 39.0, 77.0, 113.0, 161.0, 275.0, 406.0, 678.0, 1121.0, 1847.0, 2928.0, 4989.0, 8315.0, 14539.0, 25520.0, 45036.0, 79193.0, 137057.0, 202794.0, 202844.0, 136084.0, 79425.0, 44611.0, 25176.0, 14539.0, 8236.0, 4978.0, 2923.0, 1711.0, 1126.0, 629.0, 408.0, 253.0, 153.0, 100.0, 82.0, 46.0, 29.0, 25.0, 18.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9140625, -4.76513671875, -4.6162109375, -4.46728515625, -4.318359375, -4.16943359375, -4.0205078125, -3.87158203125, -3.72265625, -3.57373046875, -3.4248046875, -3.27587890625, -3.126953125, -2.97802734375, -2.8291015625, -2.68017578125, -2.53125, -2.38232421875, -2.2333984375, -2.08447265625, -1.935546875, -1.78662109375, -1.6376953125, -1.48876953125, -1.33984375, -1.19091796875, -1.0419921875, -0.89306640625, -0.744140625, -0.59521484375, -0.4462890625, -0.29736328125, -0.1484375, 0.00048828125, 0.1494140625, 0.29833984375, 0.447265625, 0.59619140625, 0.7451171875, 0.89404296875, 1.04296875, 1.19189453125, 1.3408203125, 1.48974609375, 1.638671875, 1.78759765625, 1.9365234375, 2.08544921875, 2.234375, 2.38330078125, 2.5322265625, 2.68115234375, 2.830078125, 2.97900390625, 3.1279296875, 3.27685546875, 3.42578125, 3.57470703125, 3.7236328125, 3.87255859375, 4.021484375, 4.17041015625, 4.3193359375, 4.46826171875, 4.6171875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 11.0, 5.0, 16.0, 11.0, 25.0, 25.0, 31.0, 41.0, 42.0, 53.0, 58.0, 64.0, 54.0, 65.0, 70.0, 50.0, 68.0, 54.0, 36.0, 37.0, 45.0, 21.0, 22.0, 15.0, 23.0, 14.0, 7.0, 10.0, 5.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002429485321044922, -0.00023453310132026672, -0.00022611767053604126, -0.0002177022397518158, -0.00020928680896759033, -0.00020087137818336487, -0.0001924559473991394, -0.00018404051661491394, -0.00017562508583068848, -0.000167209655046463, -0.00015879422426223755, -0.00015037879347801208, -0.00014196336269378662, -0.00013354793190956116, -0.0001251325011253357, -0.00011671707034111023, -0.00010830163955688477, -9.98862087726593e-05, -9.147077798843384e-05, -8.305534720420837e-05, -7.463991641998291e-05, -6.622448563575745e-05, -5.780905485153198e-05, -4.939362406730652e-05, -4.0978193283081055e-05, -3.256276249885559e-05, -2.4147331714630127e-05, -1.5731900930404663e-05, -7.316470146179199e-06, 1.0989606380462646e-06, 9.514391422271729e-06, 1.7929822206497192e-05, 2.6345252990722656e-05, 3.476068377494812e-05, 4.3176114559173584e-05, 5.159154534339905e-05, 6.000697612762451e-05, 6.842240691184998e-05, 7.683783769607544e-05, 8.52532684803009e-05, 9.366869926452637e-05, 0.00010208413004875183, 0.0001104995608329773, 0.00011891499161720276, 0.00012733042240142822, 0.0001357458531856537, 0.00014416128396987915, 0.00015257671475410461, 0.00016099214553833008, 0.00016940757632255554, 0.000177823007106781, 0.00018623843789100647, 0.00019465386867523193, 0.0002030692994594574, 0.00021148473024368286, 0.00021990016102790833, 0.0002283155918121338, 0.00023673102259635925, 0.0002451464533805847, 0.0002535618841648102, 0.00026197731494903564, 0.0002703927457332611, 0.00027880817651748657, 0.00028722360730171204, 0.0002956390380859375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 16.0, 24.0, 40.0, 53.0, 75.0, 110.0, 159.0, 231.0, 354.0, 624.0, 865.0, 1396.0, 2068.0, 3336.0, 5329.0, 8479.0, 13566.0, 20736.0, 32973.0, 51534.0, 77120.0, 107484.0, 136071.0, 146233.0, 131985.0, 102713.0, 72381.0, 48189.0, 30708.0, 19558.0, 12439.0, 7856.0, 4987.0, 3111.0, 2002.0, 1314.0, 851.0, 510.0, 361.0, 265.0, 135.0, 98.0, 65.0, 41.0, 20.0, 23.0, 16.0, 16.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-3.458984375, -3.352294921875, -3.24560546875, -3.138916015625, -3.0322265625, -2.925537109375, -2.81884765625, -2.712158203125, -2.60546875, -2.498779296875, -2.39208984375, -2.285400390625, -2.1787109375, -2.072021484375, -1.96533203125, -1.858642578125, -1.751953125, -1.645263671875, -1.53857421875, -1.431884765625, -1.3251953125, -1.218505859375, -1.11181640625, -1.005126953125, -0.8984375, -0.791748046875, -0.68505859375, -0.578369140625, -0.4716796875, -0.364990234375, -0.25830078125, -0.151611328125, -0.044921875, 0.061767578125, 0.16845703125, 0.275146484375, 0.3818359375, 0.488525390625, 0.59521484375, 0.701904296875, 0.80859375, 0.915283203125, 1.02197265625, 1.128662109375, 1.2353515625, 1.342041015625, 1.44873046875, 1.555419921875, 1.662109375, 1.768798828125, 1.87548828125, 1.982177734375, 2.0888671875, 2.195556640625, 2.30224609375, 2.408935546875, 2.515625, 2.622314453125, 2.72900390625, 2.835693359375, 2.9423828125, 3.049072265625, 3.15576171875, 3.262451171875, 3.369140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 10.0, 5.0, 12.0, 19.0, 10.0, 16.0, 26.0, 20.0, 27.0, 27.0, 34.0, 29.0, 55.0, 37.0, 34.0, 46.0, 48.0, 49.0, 46.0, 42.0, 37.0, 41.0, 46.0, 32.0, 33.0, 29.0, 34.0, 22.0, 20.0, 13.0, 12.0, 11.0, 16.0, 13.0, 7.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.96728515625, -0.93695068359375, -0.9066162109375, -0.87628173828125, -0.845947265625, -0.81561279296875, -0.7852783203125, -0.75494384765625, -0.724609375, -0.69427490234375, -0.6639404296875, -0.63360595703125, -0.603271484375, -0.57293701171875, -0.5426025390625, -0.51226806640625, -0.48193359375, -0.45159912109375, -0.4212646484375, -0.39093017578125, -0.360595703125, -0.33026123046875, -0.2999267578125, -0.26959228515625, -0.2392578125, -0.20892333984375, -0.1785888671875, -0.14825439453125, -0.117919921875, -0.08758544921875, -0.0572509765625, -0.02691650390625, 0.00341796875, 0.03375244140625, 0.0640869140625, 0.09442138671875, 0.124755859375, 0.15509033203125, 0.1854248046875, 0.21575927734375, 0.24609375, 0.27642822265625, 0.3067626953125, 0.33709716796875, 0.367431640625, 0.39776611328125, 0.4281005859375, 0.45843505859375, 0.48876953125, 0.51910400390625, 0.5494384765625, 0.57977294921875, 0.610107421875, 0.64044189453125, 0.6707763671875, 0.70111083984375, 0.7314453125, 0.76177978515625, 0.7921142578125, 0.82244873046875, 0.852783203125, 0.88311767578125, 0.9134521484375, 0.94378662109375, 0.97412109375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 23.0, 16.0, 39.0, 46.0, 48.0, 59.0, 80.0, 50.0, 85.0, 87.0, 92.0, 64.0, 48.0, 43.0, 43.0, 30.0, 25.0, 19.0, 14.0, 12.0, 15.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.877593994140625, -23.158777236938477, -22.439960479736328, -21.721141815185547, -21.0023250579834, -20.28350830078125, -19.5646915435791, -18.845874786376953, -18.127058029174805, -17.408241271972656, -16.689424514770508, -15.970606803894043, -15.251790046691895, -14.53297233581543, -13.814155578613281, -13.095338821411133, -12.376521110534668, -11.65770435333252, -10.938886642456055, -10.220069885253906, -9.501253128051758, -8.78243637084961, -8.063618659973145, -7.344801902770996, -6.6259846687316895, -5.907167434692383, -5.188350677490234, -4.469533443450928, -3.7507164478302, -3.0318994522094727, -2.313082218170166, -1.5942654609680176, -0.8754482269287109, -0.15663117170333862, 0.5621858835220337, 1.2810029983520508, 1.9998199939727783, 2.718636989593506, 3.4374542236328125, 4.156270980834961, 4.875088214874268, 5.593905448913574, 6.312722206115723, 7.031539440155029, 7.750356674194336, 8.469173431396484, 9.187990188598633, 9.906806945800781, 10.625624656677246, 11.344441413879395, 12.06325912475586, 12.782075881958008, 13.500892639160156, 14.219709396362305, 14.93852710723877, 15.657343864440918, 16.376161575317383, 17.09497833251953, 17.81379508972168, 18.532611846923828, 19.25143051147461, 19.970247268676758, 20.689064025878906, 21.407880783081055, 22.126697540283203]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 14.0, 13.0, 12.0, 14.0, 20.0, 25.0, 24.0, 23.0, 41.0, 26.0, 40.0, 30.0, 39.0, 43.0, 54.0, 48.0, 45.0, 37.0, 34.0, 55.0, 29.0, 38.0, 31.0, 33.0, 23.0, 42.0, 26.0, 19.0, 17.0, 16.0, 11.0, 17.0, 12.0, 10.0, 9.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34538459777832, -7.082252025604248, -6.819119453430176, -6.555986404418945, -6.292853832244873, -6.029721260070801, -5.76658821105957, -5.503455638885498, -5.240323066711426, -4.9771904945373535, -4.714057922363281, -4.450924873352051, -4.1877923011779785, -3.9246597290039062, -3.661526918411255, -3.3983941078186035, -3.1352615356445312, -2.872128963470459, -2.6089961528778076, -2.3458633422851562, -2.082730770111084, -1.8195980787277222, -1.5564653873443604, -1.2933326959609985, -1.0302000045776367, -0.7670673131942749, -0.5039346218109131, -0.24080193042755127, 0.022330760955810547, 0.28546345233917236, 0.5485961437225342, 0.811728835105896, 1.0748615264892578, 1.3379942178726196, 1.6011269092559814, 1.8642596006393433, 2.127392292022705, 2.3905248641967773, 2.6536576747894287, 2.91679048538208, 3.1799230575561523, 3.4430556297302246, 3.706188440322876, 3.9693212509155273, 4.2324538230896, 4.495586395263672, 4.758719444274902, 5.021852016448975, 5.284984588623047, 5.548117160797119, 5.811249732971191, 6.074382781982422, 6.337515354156494, 6.600647926330566, 6.863780975341797, 7.126913547515869, 7.390046119689941, 7.653178691864014, 7.916311264038086, 8.179444313049316, 8.442577362060547, 8.705709457397461, 8.968842506408691, 9.231974601745605, 9.495107650756836]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 5.0, 10.0, 22.0, 30.0, 54.0, 74.0, 112.0, 199.0, 247.0, 409.0, 625.0, 994.0, 1522.0, 2279.0, 3680.0, 5735.0, 9338.0, 14549.0, 22630.0, 34685.0, 51624.0, 73368.0, 98198.0, 119614.0, 129898.0, 123666.0, 105216.0, 80975.0, 57704.0, 39409.0, 25789.0, 16776.0, 10669.0, 6813.0, 4224.0, 2660.0, 1695.0, 1038.0, 703.0, 438.0, 289.0, 198.0, 123.0, 82.0, 61.0, 38.0, 18.0, 21.0, 16.0, 7.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.4921875, -8.223876953125, -7.95556640625, -7.687255859375, -7.4189453125, -7.150634765625, -6.88232421875, -6.614013671875, -6.345703125, -6.077392578125, -5.80908203125, -5.540771484375, -5.2724609375, -5.004150390625, -4.73583984375, -4.467529296875, -4.19921875, -3.930908203125, -3.66259765625, -3.394287109375, -3.1259765625, -2.857666015625, -2.58935546875, -2.321044921875, -2.052734375, -1.784423828125, -1.51611328125, -1.247802734375, -0.9794921875, -0.711181640625, -0.44287109375, -0.174560546875, 0.09375, 0.362060546875, 0.63037109375, 0.898681640625, 1.1669921875, 1.435302734375, 1.70361328125, 1.971923828125, 2.240234375, 2.508544921875, 2.77685546875, 3.045166015625, 3.3134765625, 3.581787109375, 3.85009765625, 4.118408203125, 4.38671875, 4.655029296875, 4.92333984375, 5.191650390625, 5.4599609375, 5.728271484375, 5.99658203125, 6.264892578125, 6.533203125, 6.801513671875, 7.06982421875, 7.338134765625, 7.6064453125, 7.874755859375, 8.14306640625, 8.411376953125, 8.6796875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 3.0, 6.0, 6.0, 6.0, 13.0, 17.0, 18.0, 19.0, 26.0, 25.0, 19.0, 30.0, 29.0, 37.0, 34.0, 42.0, 45.0, 38.0, 51.0, 48.0, 42.0, 37.0, 41.0, 40.0, 38.0, 32.0, 32.0, 26.0, 30.0, 26.0, 19.0, 20.0, 18.0, 22.0, 9.0, 17.0, 8.0, 8.0, 4.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2734375, -8.98095703125, -8.6884765625, -8.39599609375, -8.103515625, -7.81103515625, -7.5185546875, -7.22607421875, -6.93359375, -6.64111328125, -6.3486328125, -6.05615234375, -5.763671875, -5.47119140625, -5.1787109375, -4.88623046875, -4.59375, -4.30126953125, -4.0087890625, -3.71630859375, -3.423828125, -3.13134765625, -2.8388671875, -2.54638671875, -2.25390625, -1.96142578125, -1.6689453125, -1.37646484375, -1.083984375, -0.79150390625, -0.4990234375, -0.20654296875, 0.0859375, 0.37841796875, 0.6708984375, 0.96337890625, 1.255859375, 1.54833984375, 1.8408203125, 2.13330078125, 2.42578125, 2.71826171875, 3.0107421875, 3.30322265625, 3.595703125, 3.88818359375, 4.1806640625, 4.47314453125, 4.765625, 5.05810546875, 5.3505859375, 5.64306640625, 5.935546875, 6.22802734375, 6.5205078125, 6.81298828125, 7.10546875, 7.39794921875, 7.6904296875, 7.98291015625, 8.275390625, 8.56787109375, 8.8603515625, 9.15283203125, 9.4453125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 20.0, 28.0, 40.0, 42.0, 77.0, 152.0, 240.0, 330.0, 626.0, 1063.0, 1812.0, 3182.0, 5370.0, 9127.0, 15484.0, 25758.0, 41363.0, 64579.0, 94519.0, 125005.0, 146018.0, 142799.0, 121592.0, 90267.0, 60896.0, 39372.0, 23786.0, 14295.0, 8634.0, 4927.0, 2900.0, 1739.0, 977.0, 571.0, 347.0, 201.0, 142.0, 98.0, 54.0, 32.0, 19.0, 17.0, 5.0, 16.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-10.703125, -10.3876953125, -10.072265625, -9.7568359375, -9.44140625, -9.1259765625, -8.810546875, -8.4951171875, -8.1796875, -7.8642578125, -7.548828125, -7.2333984375, -6.91796875, -6.6025390625, -6.287109375, -5.9716796875, -5.65625, -5.3408203125, -5.025390625, -4.7099609375, -4.39453125, -4.0791015625, -3.763671875, -3.4482421875, -3.1328125, -2.8173828125, -2.501953125, -2.1865234375, -1.87109375, -1.5556640625, -1.240234375, -0.9248046875, -0.609375, -0.2939453125, 0.021484375, 0.3369140625, 0.65234375, 0.9677734375, 1.283203125, 1.5986328125, 1.9140625, 2.2294921875, 2.544921875, 2.8603515625, 3.17578125, 3.4912109375, 3.806640625, 4.1220703125, 4.4375, 4.7529296875, 5.068359375, 5.3837890625, 5.69921875, 6.0146484375, 6.330078125, 6.6455078125, 6.9609375, 7.2763671875, 7.591796875, 7.9072265625, 8.22265625, 8.5380859375, 8.853515625, 9.1689453125, 9.484375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 6.0, 5.0, 0.0, 8.0, 9.0, 7.0, 12.0, 12.0, 21.0, 21.0, 18.0, 25.0, 29.0, 31.0, 25.0, 36.0, 37.0, 38.0, 37.0, 44.0, 47.0, 42.0, 47.0, 45.0, 60.0, 37.0, 29.0, 41.0, 33.0, 35.0, 27.0, 25.0, 15.0, 19.0, 19.0, 11.0, 8.0, 13.0, 11.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.15234375, -5.9656982421875, -5.779052734375, -5.5924072265625, -5.40576171875, -5.2191162109375, -5.032470703125, -4.8458251953125, -4.6591796875, -4.4725341796875, -4.285888671875, -4.0992431640625, -3.91259765625, -3.7259521484375, -3.539306640625, -3.3526611328125, -3.166015625, -2.9793701171875, -2.792724609375, -2.6060791015625, -2.41943359375, -2.2327880859375, -2.046142578125, -1.8594970703125, -1.6728515625, -1.4862060546875, -1.299560546875, -1.1129150390625, -0.92626953125, -0.7396240234375, -0.552978515625, -0.3663330078125, -0.1796875, 0.0069580078125, 0.193603515625, 0.3802490234375, 0.56689453125, 0.7535400390625, 0.940185546875, 1.1268310546875, 1.3134765625, 1.5001220703125, 1.686767578125, 1.8734130859375, 2.06005859375, 2.2467041015625, 2.433349609375, 2.6199951171875, 2.806640625, 2.9932861328125, 3.179931640625, 3.3665771484375, 3.55322265625, 3.7398681640625, 3.926513671875, 4.1131591796875, 4.2998046875, 4.4864501953125, 4.673095703125, 4.8597412109375, 5.04638671875, 5.2330322265625, 5.419677734375, 5.6063232421875, 5.79296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 11.0, 16.0, 26.0, 36.0, 85.0, 101.0, 176.0, 256.0, 407.0, 671.0, 1035.0, 1745.0, 2885.0, 4683.0, 7473.0, 12163.0, 19602.0, 31126.0, 48066.0, 71451.0, 99613.0, 127535.0, 141185.0, 134357.0, 110737.0, 80653.0, 55881.0, 36157.0, 22990.0, 14427.0, 8830.0, 5346.0, 3220.0, 2142.0, 1302.0, 844.0, 493.0, 303.0, 184.0, 128.0, 83.0, 40.0, 31.0, 12.0, 15.0, 11.0, 9.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.02734375, -3.904083251953125, -3.78082275390625, -3.657562255859375, -3.5343017578125, -3.411041259765625, -3.28778076171875, -3.164520263671875, -3.041259765625, -2.917999267578125, -2.79473876953125, -2.671478271484375, -2.5482177734375, -2.424957275390625, -2.30169677734375, -2.178436279296875, -2.05517578125, -1.931915283203125, -1.80865478515625, -1.685394287109375, -1.5621337890625, -1.438873291015625, -1.31561279296875, -1.192352294921875, -1.069091796875, -0.945831298828125, -0.82257080078125, -0.699310302734375, -0.5760498046875, -0.452789306640625, -0.32952880859375, -0.206268310546875, -0.0830078125, 0.040252685546875, 0.16351318359375, 0.286773681640625, 0.4100341796875, 0.533294677734375, 0.65655517578125, 0.779815673828125, 0.903076171875, 1.026336669921875, 1.14959716796875, 1.272857666015625, 1.3961181640625, 1.519378662109375, 1.64263916015625, 1.765899658203125, 1.88916015625, 2.012420654296875, 2.13568115234375, 2.258941650390625, 2.3822021484375, 2.505462646484375, 2.62872314453125, 2.751983642578125, 2.875244140625, 2.998504638671875, 3.12176513671875, 3.245025634765625, 3.3682861328125, 3.491546630859375, 3.61480712890625, 3.738067626953125, 3.861328125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 9.0, 10.0, 6.0, 11.0, 18.0, 32.0, 36.0, 37.0, 53.0, 60.0, 59.0, 81.0, 87.0, 69.0, 66.0, 70.0, 51.0, 47.0, 36.0, 36.0, 33.0, 27.0, 19.0, 11.0, 11.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005793571472167969, -0.0005607008934020996, -0.0005420446395874023, -0.0005233883857727051, -0.0005047321319580078, -0.00048607587814331055, -0.0004674196243286133, -0.000448763370513916, -0.00043010711669921875, -0.0004114508628845215, -0.0003927946090698242, -0.00037413835525512695, -0.0003554821014404297, -0.0003368258476257324, -0.00031816959381103516, -0.0002995133399963379, -0.0002808570861816406, -0.00026220083236694336, -0.0002435445785522461, -0.00022488832473754883, -0.00020623207092285156, -0.0001875758171081543, -0.00016891956329345703, -0.00015026330947875977, -0.0001316070556640625, -0.00011295080184936523, -9.429454803466797e-05, -7.56382942199707e-05, -5.698204040527344e-05, -3.832578659057617e-05, -1.9669532775878906e-05, -1.0132789611816406e-06, 1.7642974853515625e-05, 3.629922866821289e-05, 5.4955482482910156e-05, 7.361173629760742e-05, 9.226799011230469e-05, 0.00011092424392700195, 0.00012958049774169922, 0.00014823675155639648, 0.00016689300537109375, 0.00018554925918579102, 0.00020420551300048828, 0.00022286176681518555, 0.0002415180206298828, 0.0002601742744445801, 0.00027883052825927734, 0.0002974867820739746, 0.0003161430358886719, 0.00033479928970336914, 0.0003534555435180664, 0.00037211179733276367, 0.00039076805114746094, 0.0004094243049621582, 0.00042808055877685547, 0.00044673681259155273, 0.00046539306640625, 0.00048404932022094727, 0.0005027055740356445, 0.0005213618278503418, 0.0005400180816650391, 0.0005586743354797363, 0.0005773305892944336, 0.0005959868431091309, 0.0006146430969238281]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 13.0, 21.0, 33.0, 49.0, 69.0, 119.0, 161.0, 248.0, 386.0, 572.0, 892.0, 1328.0, 2153.0, 3243.0, 5030.0, 7392.0, 11436.0, 17523.0, 25975.0, 38533.0, 55562.0, 74980.0, 97310.0, 115445.0, 124092.0, 116973.0, 98997.0, 76793.0, 55767.0, 39222.0, 26252.0, 17850.0, 11809.0, 7772.0, 4915.0, 3418.0, 2237.0, 1398.0, 916.0, 547.0, 338.0, 274.0, 169.0, 112.0, 76.0, 57.0, 25.0, 17.0, 21.0, 13.0, 6.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.5390625, -3.433502197265625, -3.32794189453125, -3.222381591796875, -3.1168212890625, -3.011260986328125, -2.90570068359375, -2.800140380859375, -2.694580078125, -2.589019775390625, -2.48345947265625, -2.377899169921875, -2.2723388671875, -2.166778564453125, -2.06121826171875, -1.955657958984375, -1.85009765625, -1.744537353515625, -1.63897705078125, -1.533416748046875, -1.4278564453125, -1.322296142578125, -1.21673583984375, -1.111175537109375, -1.005615234375, -0.900054931640625, -0.79449462890625, -0.688934326171875, -0.5833740234375, -0.477813720703125, -0.37225341796875, -0.266693115234375, -0.1611328125, -0.055572509765625, 0.04998779296875, 0.155548095703125, 0.2611083984375, 0.366668701171875, 0.47222900390625, 0.577789306640625, 0.683349609375, 0.788909912109375, 0.89447021484375, 1.000030517578125, 1.1055908203125, 1.211151123046875, 1.31671142578125, 1.422271728515625, 1.52783203125, 1.633392333984375, 1.73895263671875, 1.844512939453125, 1.9500732421875, 2.055633544921875, 2.16119384765625, 2.266754150390625, 2.372314453125, 2.477874755859375, 2.58343505859375, 2.688995361328125, 2.7945556640625, 2.900115966796875, 3.00567626953125, 3.111236572265625, 3.216796875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 5.0, 6.0, 8.0, 11.0, 13.0, 11.0, 15.0, 13.0, 32.0, 24.0, 20.0, 27.0, 26.0, 34.0, 45.0, 38.0, 39.0, 35.0, 47.0, 44.0, 50.0, 40.0, 47.0, 36.0, 34.0, 33.0, 27.0, 38.0, 27.0, 24.0, 21.0, 18.0, 13.0, 12.0, 13.0, 12.0, 10.0, 13.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1240234375, -1.089202880859375, -1.05438232421875, -1.019561767578125, -0.9847412109375, -0.949920654296875, -0.91510009765625, -0.880279541015625, -0.845458984375, -0.810638427734375, -0.77581787109375, -0.740997314453125, -0.7061767578125, -0.671356201171875, -0.63653564453125, -0.601715087890625, -0.56689453125, -0.532073974609375, -0.49725341796875, -0.462432861328125, -0.4276123046875, -0.392791748046875, -0.35797119140625, -0.323150634765625, -0.288330078125, -0.253509521484375, -0.21868896484375, -0.183868408203125, -0.1490478515625, -0.114227294921875, -0.07940673828125, -0.044586181640625, -0.009765625, 0.025054931640625, 0.05987548828125, 0.094696044921875, 0.1295166015625, 0.164337158203125, 0.19915771484375, 0.233978271484375, 0.268798828125, 0.303619384765625, 0.33843994140625, 0.373260498046875, 0.4080810546875, 0.442901611328125, 0.47772216796875, 0.512542724609375, 0.54736328125, 0.582183837890625, 0.61700439453125, 0.651824951171875, 0.6866455078125, 0.721466064453125, 0.75628662109375, 0.791107177734375, 0.825927734375, 0.860748291015625, 0.89556884765625, 0.930389404296875, 0.9652099609375, 1.000030517578125, 1.03485107421875, 1.069671630859375, 1.1044921875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 3.0, 5.0, 10.0, 15.0, 21.0, 27.0, 31.0, 43.0, 41.0, 66.0, 74.0, 83.0, 78.0, 77.0, 81.0, 65.0, 52.0, 51.0, 40.0, 32.0, 22.0, 12.0, 16.0, 15.0, 10.0, 7.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.025188446044922, -24.291629791259766, -23.558069229125977, -22.82451057434082, -22.09095001220703, -21.357391357421875, -20.62383270263672, -19.89027214050293, -19.15671157836914, -18.423152923583984, -17.689592361450195, -16.95603370666504, -16.22247314453125, -15.488914489746094, -14.755354881286621, -14.021795272827148, -13.288236618041992, -12.55467700958252, -11.821117401123047, -11.08755874633789, -10.353998184204102, -9.620439529418945, -8.886879920959473, -8.1533203125, -7.419760704040527, -6.686201095581055, -5.952641487121582, -5.219082355499268, -4.485522747039795, -3.7519631385803223, -3.018404006958008, -2.284844398498535, -1.5512828826904297, -0.8177233934402466, -0.08416390419006348, 0.6493954658508301, 1.3829550743103027, 2.1165146827697754, 2.85007381439209, 3.5836334228515625, 4.317193031311035, 5.050752639770508, 5.7843122482299805, 6.517871379852295, 7.251430988311768, 7.98499059677124, 8.718549728393555, 9.452109336853027, 10.1856689453125, 10.919228553771973, 11.652788162231445, 12.386346817016602, 13.11990737915039, 13.853466033935547, 14.58702564239502, 15.320585250854492, 16.05414581298828, 16.787704467773438, 17.521265029907227, 18.254823684692383, 18.988384246826172, 19.721942901611328, 20.455501556396484, 21.189062118530273, 21.92262077331543]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 14.0, 19.0, 19.0, 14.0, 28.0, 17.0, 27.0, 29.0, 51.0, 36.0, 36.0, 40.0, 49.0, 51.0, 50.0, 41.0, 50.0, 33.0, 36.0, 36.0, 40.0, 24.0, 36.0, 32.0, 18.0, 17.0, 23.0, 16.0, 18.0, 5.0, 13.0, 15.0, 7.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.810589790344238, -8.527017593383789, -8.243444442749023, -7.959872245788574, -7.676299571990967, -7.392726898193359, -7.10915470123291, -6.825582027435303, -6.542009353637695, -6.258436679840088, -5.9748640060424805, -5.691291809082031, -5.407719135284424, -5.124146461486816, -4.840574264526367, -4.55700159072876, -4.273428916931152, -3.989856243133545, -3.7062838077545166, -3.4227113723754883, -3.139138698577881, -2.8555660247802734, -2.571993589401245, -2.288421154022217, -2.0048484802246094, -1.7212759256362915, -1.4377033710479736, -1.1541308164596558, -0.8705582618713379, -0.58698570728302, -0.30341315269470215, -0.019840598106384277, 0.2637319564819336, 0.5473045110702515, 0.8308770656585693, 1.1144496202468872, 1.398022174835205, 1.681594729423523, 1.9651672840118408, 2.248739719390869, 2.5323123931884766, 2.815885066986084, 3.0994575023651123, 3.3830299377441406, 3.666602611541748, 3.9501752853393555, 4.233747482299805, 4.517320156097412, 4.8008928298950195, 5.084465503692627, 5.368038177490234, 5.651610374450684, 5.935183048248291, 6.218755722045898, 6.502327919006348, 6.785900592803955, 7.0694732666015625, 7.35304594039917, 7.636618614196777, 7.920190811157227, 8.203763961791992, 8.487336158752441, 8.77090835571289, 9.054481506347656, 9.338053703308105]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 15.0, 18.0, 26.0, 37.0, 56.0, 76.0, 95.0, 140.0, 246.0, 385.0, 582.0, 976.0, 1832.0, 3084.0, 5583.0, 10401.0, 20757.0, 42792.0, 93038.0, 215440.0, 529385.0, 1138360.0, 1166090.0, 551700.0, 224289.0, 95870.0, 44702.0, 22163.0, 11593.0, 6191.0, 3370.0, 1922.0, 1154.0, 723.0, 433.0, 243.0, 178.0, 99.0, 75.0, 45.0, 32.0, 29.0, 18.0, 15.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.578125, -17.998046875, -17.41796875, -16.837890625, -16.2578125, -15.677734375, -15.09765625, -14.517578125, -13.9375, -13.357421875, -12.77734375, -12.197265625, -11.6171875, -11.037109375, -10.45703125, -9.876953125, -9.296875, -8.716796875, -8.13671875, -7.556640625, -6.9765625, -6.396484375, -5.81640625, -5.236328125, -4.65625, -4.076171875, -3.49609375, -2.916015625, -2.3359375, -1.755859375, -1.17578125, -0.595703125, -0.015625, 0.564453125, 1.14453125, 1.724609375, 2.3046875, 2.884765625, 3.46484375, 4.044921875, 4.625, 5.205078125, 5.78515625, 6.365234375, 6.9453125, 7.525390625, 8.10546875, 8.685546875, 9.265625, 9.845703125, 10.42578125, 11.005859375, 11.5859375, 12.166015625, 12.74609375, 13.326171875, 13.90625, 14.486328125, 15.06640625, 15.646484375, 16.2265625, 16.806640625, 17.38671875, 17.966796875, 18.546875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 14.0, 16.0, 19.0, 18.0, 12.0, 26.0, 39.0, 28.0, 23.0, 37.0, 37.0, 32.0, 38.0, 34.0, 42.0, 41.0, 57.0, 43.0, 51.0, 48.0, 35.0, 33.0, 27.0, 35.0, 35.0, 31.0, 18.0, 16.0, 17.0, 10.0, 10.0, 12.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1015625, -6.87933349609375, -6.6571044921875, -6.43487548828125, -6.212646484375, -5.99041748046875, -5.7681884765625, -5.54595947265625, -5.32373046875, -5.10150146484375, -4.8792724609375, -4.65704345703125, -4.434814453125, -4.21258544921875, -3.9903564453125, -3.76812744140625, -3.5458984375, -3.32366943359375, -3.1014404296875, -2.87921142578125, -2.656982421875, -2.43475341796875, -2.2125244140625, -1.99029541015625, -1.76806640625, -1.54583740234375, -1.3236083984375, -1.10137939453125, -0.879150390625, -0.65692138671875, -0.4346923828125, -0.21246337890625, 0.009765625, 0.23199462890625, 0.4542236328125, 0.67645263671875, 0.898681640625, 1.12091064453125, 1.3431396484375, 1.56536865234375, 1.78759765625, 2.00982666015625, 2.2320556640625, 2.45428466796875, 2.676513671875, 2.89874267578125, 3.1209716796875, 3.34320068359375, 3.5654296875, 3.78765869140625, 4.0098876953125, 4.23211669921875, 4.454345703125, 4.67657470703125, 4.8988037109375, 5.12103271484375, 5.34326171875, 5.56549072265625, 5.7877197265625, 6.00994873046875, 6.232177734375, 6.45440673828125, 6.6766357421875, 6.89886474609375, 7.12109375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 13.0, 21.0, 42.0, 65.0, 91.0, 146.0, 236.0, 333.0, 566.0, 902.0, 1471.0, 2358.0, 3987.0, 6940.0, 11424.0, 20366.0, 36080.0, 65018.0, 120805.0, 226193.0, 421760.0, 721622.0, 920162.0, 718435.0, 420285.0, 224840.0, 119826.0, 64875.0, 36088.0, 20102.0, 11835.0, 6865.0, 4089.0, 2491.0, 1479.0, 880.0, 606.0, 368.0, 222.0, 132.0, 88.0, 57.0, 41.0, 26.0, 12.0, 14.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-16.40625, -15.9306640625, -15.455078125, -14.9794921875, -14.50390625, -14.0283203125, -13.552734375, -13.0771484375, -12.6015625, -12.1259765625, -11.650390625, -11.1748046875, -10.69921875, -10.2236328125, -9.748046875, -9.2724609375, -8.796875, -8.3212890625, -7.845703125, -7.3701171875, -6.89453125, -6.4189453125, -5.943359375, -5.4677734375, -4.9921875, -4.5166015625, -4.041015625, -3.5654296875, -3.08984375, -2.6142578125, -2.138671875, -1.6630859375, -1.1875, -0.7119140625, -0.236328125, 0.2392578125, 0.71484375, 1.1904296875, 1.666015625, 2.1416015625, 2.6171875, 3.0927734375, 3.568359375, 4.0439453125, 4.51953125, 4.9951171875, 5.470703125, 5.9462890625, 6.421875, 6.8974609375, 7.373046875, 7.8486328125, 8.32421875, 8.7998046875, 9.275390625, 9.7509765625, 10.2265625, 10.7021484375, 11.177734375, 11.6533203125, 12.12890625, 12.6044921875, 13.080078125, 13.5556640625, 14.03125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 6.0, 10.0, 7.0, 10.0, 15.0, 25.0, 18.0, 38.0, 45.0, 65.0, 92.0, 119.0, 166.0, 174.0, 234.0, 269.0, 287.0, 311.0, 293.0, 301.0, 281.0, 259.0, 232.0, 178.0, 133.0, 111.0, 74.0, 86.0, 66.0, 36.0, 32.0, 30.0, 15.0, 13.0, 13.0, 8.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.74609375, -5.5792236328125, -5.412353515625, -5.2454833984375, -5.07861328125, -4.9117431640625, -4.744873046875, -4.5780029296875, -4.4111328125, -4.2442626953125, -4.077392578125, -3.9105224609375, -3.74365234375, -3.5767822265625, -3.409912109375, -3.2430419921875, -3.076171875, -2.9093017578125, -2.742431640625, -2.5755615234375, -2.40869140625, -2.2418212890625, -2.074951171875, -1.9080810546875, -1.7412109375, -1.5743408203125, -1.407470703125, -1.2406005859375, -1.07373046875, -0.9068603515625, -0.739990234375, -0.5731201171875, -0.40625, -0.2393798828125, -0.072509765625, 0.0943603515625, 0.26123046875, 0.4281005859375, 0.594970703125, 0.7618408203125, 0.9287109375, 1.0955810546875, 1.262451171875, 1.4293212890625, 1.59619140625, 1.7630615234375, 1.929931640625, 2.0968017578125, 2.263671875, 2.4305419921875, 2.597412109375, 2.7642822265625, 2.93115234375, 3.0980224609375, 3.264892578125, 3.4317626953125, 3.5986328125, 3.7655029296875, 3.932373046875, 4.0992431640625, 4.26611328125, 4.4329833984375, 4.599853515625, 4.7667236328125, 4.93359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 8.0, 6.0, 12.0, 14.0, 33.0, 33.0, 22.0, 41.0, 54.0, 54.0, 68.0, 71.0, 61.0, 77.0, 73.0, 56.0, 53.0, 42.0, 35.0, 32.0, 32.0, 15.0, 20.0, 10.0, 4.0, 12.0, 11.0, 4.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.09366798400879, -18.480443954467773, -17.867218017578125, -17.25399398803711, -16.64076805114746, -16.027544021606445, -15.414319038391113, -14.801094055175781, -14.18786907196045, -13.574644088745117, -12.961419105529785, -12.348194122314453, -11.734970092773438, -11.121744155883789, -10.508520126342773, -9.895295143127441, -9.28207015991211, -8.668845176696777, -8.055620193481445, -7.4423956871032715, -6.8291707038879395, -6.215945720672607, -5.602721214294434, -4.989496231079102, -4.3762712478637695, -3.7630462646484375, -3.1498215198516846, -2.5365967750549316, -1.9233717918395996, -1.3101468086242676, -0.6969220638275146, -0.08369731903076172, 0.5295276641845703, 1.1427525281906128, 1.7559773921966553, 2.369202136993408, 2.9824271202087402, 3.5956521034240723, 4.208876609802246, 4.822101593017578, 5.43532657623291, 6.048551559448242, 6.661776542663574, 7.275001049041748, 7.88822603225708, 8.50145149230957, 9.114675521850586, 9.727900505065918, 10.34112548828125, 10.954350471496582, 11.567575454711914, 12.180800437927246, 12.794025421142578, 13.407249450683594, 14.020474433898926, 14.633699417114258, 15.24692440032959, 15.860149383544922, 16.473373413085938, 17.086599349975586, 17.6998233795166, 18.31304931640625, 18.926273345947266, 19.53949737548828, 20.15272331237793]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 7.0, 3.0, 5.0, 9.0, 13.0, 13.0, 14.0, 11.0, 22.0, 30.0, 32.0, 19.0, 33.0, 37.0, 35.0, 44.0, 45.0, 39.0, 45.0, 45.0, 59.0, 56.0, 41.0, 36.0, 37.0, 42.0, 24.0, 24.0, 24.0, 17.0, 19.0, 28.0, 18.0, 10.0, 14.0, 5.0, 11.0, 9.0, 5.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.348005294799805, -8.07004165649414, -7.792078018188477, -7.5141143798828125, -7.236151218414307, -6.958187580108643, -6.6802239418029785, -6.4022603034973145, -6.124297142028809, -5.8463335037231445, -5.5683698654174805, -5.290406227111816, -5.0124430656433105, -4.7344794273376465, -4.456515789031982, -4.178552150726318, -3.9005885124206543, -3.6226248741149902, -3.3446614742279053, -3.066697835922241, -2.7887344360351562, -2.510770797729492, -2.232807159423828, -1.9548436403274536, -1.676880121231079, -1.3989166021347046, -1.12095308303833, -0.842989444732666, -0.5650259256362915, -0.287062406539917, -0.00909876823425293, 0.2688647508621216, 0.5468282699584961, 0.8247917890548706, 1.1027553081512451, 1.3807189464569092, 1.6586824655532837, 1.9366459846496582, 2.2146096229553223, 2.4925732612609863, 2.7705366611480713, 3.0485002994537354, 3.3264636993408203, 3.6044273376464844, 3.8823909759521484, 4.1603546142578125, 4.438318252563477, 4.716281414031982, 4.9942450523376465, 5.2722086906433105, 5.550172328948975, 5.8281354904174805, 6.1060991287231445, 6.384062767028809, 6.662026405334473, 6.939990043640137, 7.217953681945801, 7.495917320251465, 7.773880958557129, 8.051844596862793, 8.329808235168457, 8.607770919799805, 8.885734558105469, 9.163698196411133, 9.441661834716797]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 9.0, 11.0, 22.0, 28.0, 54.0, 79.0, 132.0, 206.0, 329.0, 567.0, 920.0, 1618.0, 3055.0, 5831.0, 11472.0, 22080.0, 42717.0, 80288.0, 136228.0, 192485.0, 199576.0, 152880.0, 93059.0, 50670.0, 25750.0, 13353.0, 6939.0, 3566.0, 1928.0, 1112.0, 625.0, 332.0, 210.0, 137.0, 92.0, 53.0, 35.0, 25.0, 16.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0], "bins": [-9.296875, -9.0162353515625, -8.735595703125, -8.4549560546875, -8.17431640625, -7.8936767578125, -7.613037109375, -7.3323974609375, -7.0517578125, -6.7711181640625, -6.490478515625, -6.2098388671875, -5.92919921875, -5.6485595703125, -5.367919921875, -5.0872802734375, -4.806640625, -4.5260009765625, -4.245361328125, -3.9647216796875, -3.68408203125, -3.4034423828125, -3.122802734375, -2.8421630859375, -2.5615234375, -2.2808837890625, -2.000244140625, -1.7196044921875, -1.43896484375, -1.1583251953125, -0.877685546875, -0.5970458984375, -0.31640625, -0.0357666015625, 0.244873046875, 0.5255126953125, 0.80615234375, 1.0867919921875, 1.367431640625, 1.6480712890625, 1.9287109375, 2.2093505859375, 2.489990234375, 2.7706298828125, 3.05126953125, 3.3319091796875, 3.612548828125, 3.8931884765625, 4.173828125, 4.4544677734375, 4.735107421875, 5.0157470703125, 5.29638671875, 5.5770263671875, 5.857666015625, 6.1383056640625, 6.4189453125, 6.6995849609375, 6.980224609375, 7.2608642578125, 7.54150390625, 7.8221435546875, 8.102783203125, 8.3834228515625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 13.0, 15.0, 11.0, 24.0, 19.0, 27.0, 25.0, 33.0, 27.0, 33.0, 32.0, 48.0, 34.0, 37.0, 54.0, 36.0, 50.0, 49.0, 40.0, 34.0, 36.0, 40.0, 32.0, 29.0, 27.0, 26.0, 20.0, 14.0, 17.0, 24.0, 5.0, 14.0, 18.0, 6.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1484375, -7.850830078125, -7.55322265625, -7.255615234375, -6.9580078125, -6.660400390625, -6.36279296875, -6.065185546875, -5.767578125, -5.469970703125, -5.17236328125, -4.874755859375, -4.5771484375, -4.279541015625, -3.98193359375, -3.684326171875, -3.38671875, -3.089111328125, -2.79150390625, -2.493896484375, -2.1962890625, -1.898681640625, -1.60107421875, -1.303466796875, -1.005859375, -0.708251953125, -0.41064453125, -0.113037109375, 0.1845703125, 0.482177734375, 0.77978515625, 1.077392578125, 1.375, 1.672607421875, 1.97021484375, 2.267822265625, 2.5654296875, 2.863037109375, 3.16064453125, 3.458251953125, 3.755859375, 4.053466796875, 4.35107421875, 4.648681640625, 4.9462890625, 5.243896484375, 5.54150390625, 5.839111328125, 6.13671875, 6.434326171875, 6.73193359375, 7.029541015625, 7.3271484375, 7.624755859375, 7.92236328125, 8.219970703125, 8.517578125, 8.815185546875, 9.11279296875, 9.410400390625, 9.7080078125, 10.005615234375, 10.30322265625, 10.600830078125, 10.8984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 8.0, 14.0, 23.0, 32.0, 47.0, 100.0, 118.0, 187.0, 311.0, 587.0, 953.0, 1695.0, 3265.0, 6600.0, 13247.0, 28096.0, 60577.0, 127494.0, 228609.0, 258409.0, 164087.0, 80825.0, 38001.0, 17462.0, 8398.0, 4197.0, 2226.0, 1193.0, 718.0, 413.0, 259.0, 140.0, 90.0, 56.0, 43.0, 19.0, 18.0, 9.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.88720703125, -10.5009765625, -10.11474609375, -9.728515625, -9.34228515625, -8.9560546875, -8.56982421875, -8.18359375, -7.79736328125, -7.4111328125, -7.02490234375, -6.638671875, -6.25244140625, -5.8662109375, -5.47998046875, -5.09375, -4.70751953125, -4.3212890625, -3.93505859375, -3.548828125, -3.16259765625, -2.7763671875, -2.39013671875, -2.00390625, -1.61767578125, -1.2314453125, -0.84521484375, -0.458984375, -0.07275390625, 0.3134765625, 0.69970703125, 1.0859375, 1.47216796875, 1.8583984375, 2.24462890625, 2.630859375, 3.01708984375, 3.4033203125, 3.78955078125, 4.17578125, 4.56201171875, 4.9482421875, 5.33447265625, 5.720703125, 6.10693359375, 6.4931640625, 6.87939453125, 7.265625, 7.65185546875, 8.0380859375, 8.42431640625, 8.810546875, 9.19677734375, 9.5830078125, 9.96923828125, 10.35546875, 10.74169921875, 11.1279296875, 11.51416015625, 11.900390625, 12.28662109375, 12.6728515625, 13.05908203125, 13.4453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 4.0, 8.0, 17.0, 12.0, 7.0, 14.0, 22.0, 13.0, 21.0, 18.0, 17.0, 33.0, 33.0, 30.0, 28.0, 40.0, 35.0, 32.0, 32.0, 31.0, 38.0, 45.0, 42.0, 39.0, 40.0, 44.0, 39.0, 27.0, 32.0, 30.0, 23.0, 26.0, 16.0, 21.0, 16.0, 16.0, 15.0, 13.0, 4.0, 5.0, 4.0, 0.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-5.390625, -5.22869873046875, -5.0667724609375, -4.90484619140625, -4.742919921875, -4.58099365234375, -4.4190673828125, -4.25714111328125, -4.09521484375, -3.93328857421875, -3.7713623046875, -3.60943603515625, -3.447509765625, -3.28558349609375, -3.1236572265625, -2.96173095703125, -2.7998046875, -2.63787841796875, -2.4759521484375, -2.31402587890625, -2.152099609375, -1.99017333984375, -1.8282470703125, -1.66632080078125, -1.50439453125, -1.34246826171875, -1.1805419921875, -1.01861572265625, -0.856689453125, -0.69476318359375, -0.5328369140625, -0.37091064453125, -0.208984375, -0.04705810546875, 0.1148681640625, 0.27679443359375, 0.438720703125, 0.60064697265625, 0.7625732421875, 0.92449951171875, 1.08642578125, 1.24835205078125, 1.4102783203125, 1.57220458984375, 1.734130859375, 1.89605712890625, 2.0579833984375, 2.21990966796875, 2.3818359375, 2.54376220703125, 2.7056884765625, 2.86761474609375, 3.029541015625, 3.19146728515625, 3.3533935546875, 3.51531982421875, 3.67724609375, 3.83917236328125, 4.0010986328125, 4.16302490234375, 4.324951171875, 4.48687744140625, 4.6488037109375, 4.81072998046875, 4.97265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 9.0, 15.0, 10.0, 21.0, 28.0, 41.0, 58.0, 72.0, 104.0, 178.0, 251.0, 452.0, 666.0, 1256.0, 2184.0, 4515.0, 9895.0, 23368.0, 60254.0, 159746.0, 335123.0, 267527.0, 109246.0, 41607.0, 16828.0, 7162.0, 3492.0, 1843.0, 991.0, 556.0, 320.0, 231.0, 154.0, 103.0, 59.0, 44.0, 47.0, 26.0, 18.0, 8.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.6328125, -8.36962890625, -8.1064453125, -7.84326171875, -7.580078125, -7.31689453125, -7.0537109375, -6.79052734375, -6.52734375, -6.26416015625, -6.0009765625, -5.73779296875, -5.474609375, -5.21142578125, -4.9482421875, -4.68505859375, -4.421875, -4.15869140625, -3.8955078125, -3.63232421875, -3.369140625, -3.10595703125, -2.8427734375, -2.57958984375, -2.31640625, -2.05322265625, -1.7900390625, -1.52685546875, -1.263671875, -1.00048828125, -0.7373046875, -0.47412109375, -0.2109375, 0.05224609375, 0.3154296875, 0.57861328125, 0.841796875, 1.10498046875, 1.3681640625, 1.63134765625, 1.89453125, 2.15771484375, 2.4208984375, 2.68408203125, 2.947265625, 3.21044921875, 3.4736328125, 3.73681640625, 4.0, 4.26318359375, 4.5263671875, 4.78955078125, 5.052734375, 5.31591796875, 5.5791015625, 5.84228515625, 6.10546875, 6.36865234375, 6.6318359375, 6.89501953125, 7.158203125, 7.42138671875, 7.6845703125, 7.94775390625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 7.0, 4.0, 7.0, 14.0, 25.0, 29.0, 25.0, 39.0, 50.0, 47.0, 72.0, 91.0, 79.0, 90.0, 83.0, 56.0, 53.0, 48.0, 42.0, 38.0, 24.0, 25.0, 13.0, 6.0, 6.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331878662109375, -0.000321120023727417, -0.000310361385345459, -0.000299602746963501, -0.00028884410858154297, -0.00027808547019958496, -0.00026732683181762695, -0.00025656819343566895, -0.00024580955505371094, -0.00023505091667175293, -0.00022429227828979492, -0.00021353363990783691, -0.0002027750015258789, -0.0001920163631439209, -0.0001812577247619629, -0.00017049908638000488, -0.00015974044799804688, -0.00014898180961608887, -0.00013822317123413086, -0.00012746453285217285, -0.00011670589447021484, -0.00010594725608825684, -9.518861770629883e-05, -8.442997932434082e-05, -7.367134094238281e-05, -6.29127025604248e-05, -5.21540641784668e-05, -4.139542579650879e-05, -3.063678741455078e-05, -1.9878149032592773e-05, -9.119510650634766e-06, 1.6391277313232422e-06, 1.239776611328125e-05, 2.3156404495239258e-05, 3.3915042877197266e-05, 4.4673681259155273e-05, 5.543231964111328e-05, 6.619095802307129e-05, 7.69495964050293e-05, 8.77082347869873e-05, 9.846687316894531e-05, 0.00010922551155090332, 0.00011998414993286133, 0.00013074278831481934, 0.00014150142669677734, 0.00015226006507873535, 0.00016301870346069336, 0.00017377734184265137, 0.00018453598022460938, 0.00019529461860656738, 0.0002060532569885254, 0.0002168118953704834, 0.0002275705337524414, 0.00023832917213439941, 0.0002490878105163574, 0.00025984644889831543, 0.00027060508728027344, 0.00028136372566223145, 0.00029212236404418945, 0.00030288100242614746, 0.00031363964080810547, 0.0003243982791900635, 0.0003351569175720215, 0.0003459155559539795, 0.0003566741943359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 9.0, 12.0, 16.0, 25.0, 32.0, 54.0, 88.0, 130.0, 192.0, 279.0, 508.0, 790.0, 1422.0, 2519.0, 4805.0, 9615.0, 20909.0, 47211.0, 104500.0, 202442.0, 264023.0, 199587.0, 102411.0, 46173.0, 20671.0, 9493.0, 4655.0, 2431.0, 1387.0, 798.0, 509.0, 313.0, 177.0, 122.0, 72.0, 58.0, 51.0, 21.0, 12.0, 14.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.63671875, -6.43243408203125, -6.2281494140625, -6.02386474609375, -5.819580078125, -5.61529541015625, -5.4110107421875, -5.20672607421875, -5.00244140625, -4.79815673828125, -4.5938720703125, -4.38958740234375, -4.185302734375, -3.98101806640625, -3.7767333984375, -3.57244873046875, -3.3681640625, -3.16387939453125, -2.9595947265625, -2.75531005859375, -2.551025390625, -2.34674072265625, -2.1424560546875, -1.93817138671875, -1.73388671875, -1.52960205078125, -1.3253173828125, -1.12103271484375, -0.916748046875, -0.71246337890625, -0.5081787109375, -0.30389404296875, -0.099609375, 0.10467529296875, 0.3089599609375, 0.51324462890625, 0.717529296875, 0.92181396484375, 1.1260986328125, 1.33038330078125, 1.53466796875, 1.73895263671875, 1.9432373046875, 2.14752197265625, 2.351806640625, 2.55609130859375, 2.7603759765625, 2.96466064453125, 3.1689453125, 3.37322998046875, 3.5775146484375, 3.78179931640625, 3.986083984375, 4.19036865234375, 4.3946533203125, 4.59893798828125, 4.80322265625, 5.00750732421875, 5.2117919921875, 5.41607666015625, 5.620361328125, 5.82464599609375, 6.0289306640625, 6.23321533203125, 6.4375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 8.0, 6.0, 9.0, 8.0, 26.0, 31.0, 40.0, 37.0, 46.0, 53.0, 51.0, 53.0, 62.0, 64.0, 83.0, 57.0, 71.0, 49.0, 49.0, 32.0, 35.0, 33.0, 18.0, 23.0, 8.0, 12.0, 11.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.339019775390625, -1.29034423828125, -1.241668701171875, -1.1929931640625, -1.144317626953125, -1.09564208984375, -1.046966552734375, -0.998291015625, -0.949615478515625, -0.90093994140625, -0.852264404296875, -0.8035888671875, -0.754913330078125, -0.70623779296875, -0.657562255859375, -0.60888671875, -0.560211181640625, -0.51153564453125, -0.462860107421875, -0.4141845703125, -0.365509033203125, -0.31683349609375, -0.268157958984375, -0.219482421875, -0.170806884765625, -0.12213134765625, -0.073455810546875, -0.0247802734375, 0.023895263671875, 0.07257080078125, 0.121246337890625, 0.169921875, 0.218597412109375, 0.26727294921875, 0.315948486328125, 0.3646240234375, 0.413299560546875, 0.46197509765625, 0.510650634765625, 0.559326171875, 0.608001708984375, 0.65667724609375, 0.705352783203125, 0.7540283203125, 0.802703857421875, 0.85137939453125, 0.900054931640625, 0.94873046875, 0.997406005859375, 1.04608154296875, 1.094757080078125, 1.1434326171875, 1.192108154296875, 1.24078369140625, 1.289459228515625, 1.338134765625, 1.386810302734375, 1.43548583984375, 1.484161376953125, 1.5328369140625, 1.581512451171875, 1.63018798828125, 1.678863525390625, 1.7275390625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 5.0, 8.0, 9.0, 20.0, 24.0, 30.0, 32.0, 27.0, 43.0, 55.0, 54.0, 54.0, 64.0, 71.0, 65.0, 72.0, 54.0, 49.0, 37.0, 35.0, 25.0, 32.0, 20.0, 18.0, 15.0, 9.0, 11.0, 9.0, 3.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.752038955688477, -17.176942825317383, -16.601844787597656, -16.026748657226562, -15.451651573181152, -14.876554489135742, -14.301458358764648, -13.726361274719238, -13.151264190673828, -12.576167106628418, -12.001070022583008, -11.425973892211914, -10.850876808166504, -10.275779724121094, -9.70068359375, -9.12558650970459, -8.55048942565918, -7.9753923416137695, -7.400295734405518, -6.825199127197266, -6.2501020431518555, -5.675004959106445, -5.099908351898193, -4.524811744689941, -3.9497146606445312, -3.3746178150177, -2.799520969390869, -2.224424123764038, -1.649327278137207, -1.074230432510376, -0.4991335868835449, 0.07596302032470703, 0.6510601043701172, 1.2261569499969482, 1.8012537956237793, 2.3763506412506104, 2.9514474868774414, 3.5265443325042725, 4.1016411781311035, 4.6767377853393555, 5.251834869384766, 5.826931953430176, 6.402028560638428, 6.97712516784668, 7.55222225189209, 8.1273193359375, 8.702415466308594, 9.277512550354004, 9.852609634399414, 10.427706718444824, 11.002803802490234, 11.577899932861328, 12.152997016906738, 12.728094100952148, 13.303190231323242, 13.878287315368652, 14.453384399414062, 15.028481483459473, 15.603578567504883, 16.178674697875977, 16.753772735595703, 17.328868865966797, 17.90396499633789, 18.479061126708984, 19.05415916442871]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 4.0, 11.0, 13.0, 15.0, 14.0, 16.0, 24.0, 31.0, 31.0, 25.0, 33.0, 43.0, 40.0, 48.0, 30.0, 63.0, 52.0, 48.0, 50.0, 50.0, 34.0, 40.0, 46.0, 28.0, 18.0, 23.0, 25.0, 25.0, 20.0, 15.0, 14.0, 9.0, 12.0, 9.0, 8.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.358636856079102, -8.073909759521484, -7.789182186126709, -7.504454612731934, -7.219727516174316, -6.934999942779541, -6.650272369384766, -6.365545272827148, -6.080817699432373, -5.796090126037598, -5.5113630294799805, -5.226635456085205, -4.94190788269043, -4.6571807861328125, -4.372453212738037, -4.087725639343262, -3.8029985427856445, -3.5182712078094482, -3.233543872833252, -2.9488162994384766, -2.6640889644622803, -2.379361629486084, -2.0946340560913086, -1.8099067211151123, -1.525179386138916, -1.2404520511627197, -0.9557245969772339, -0.6709972023963928, -0.38626980781555176, -0.10154247283935547, 0.18318498134613037, 0.4679124355316162, 0.7526388168334961, 1.0373661518096924, 1.3220936059951782, 1.606821060180664, 1.8915483951568604, 2.1762757301330566, 2.461003303527832, 2.7457306385040283, 3.0304579734802246, 3.315185308456421, 3.599912643432617, 3.8846402168273926, 4.169367790222168, 4.454094886779785, 4.7388224601745605, 5.023550033569336, 5.308277130126953, 5.5930047035217285, 5.877731800079346, 6.162459373474121, 6.447186470031738, 6.731914043426514, 7.016641616821289, 7.301368713378906, 7.586096286773682, 7.870823860168457, 8.155550956726074, 8.440278053283691, 8.725006103515625, 9.009733200073242, 9.29446029663086, 9.579188346862793, 9.86391544342041]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 9.0, 10.0, 18.0, 46.0, 72.0, 104.0, 147.0, 250.0, 407.0, 675.0, 1110.0, 1880.0, 2968.0, 5178.0, 8590.0, 14277.0, 24333.0, 39856.0, 63910.0, 97137.0, 133156.0, 157221.0, 151091.0, 121782.0, 85174.0, 54654.0, 33784.0, 20256.0, 12248.0, 7147.0, 4426.0, 2543.0, 1499.0, 979.0, 597.0, 375.0, 246.0, 134.0, 110.0, 54.0, 35.0, 31.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.5880126953125, -9.230712890625, -8.8734130859375, -8.51611328125, -8.1588134765625, -7.801513671875, -7.4442138671875, -7.0869140625, -6.7296142578125, -6.372314453125, -6.0150146484375, -5.65771484375, -5.3004150390625, -4.943115234375, -4.5858154296875, -4.228515625, -3.8712158203125, -3.513916015625, -3.1566162109375, -2.79931640625, -2.4420166015625, -2.084716796875, -1.7274169921875, -1.3701171875, -1.0128173828125, -0.655517578125, -0.2982177734375, 0.05908203125, 0.4163818359375, 0.773681640625, 1.1309814453125, 1.48828125, 1.8455810546875, 2.202880859375, 2.5601806640625, 2.91748046875, 3.2747802734375, 3.632080078125, 3.9893798828125, 4.3466796875, 4.7039794921875, 5.061279296875, 5.4185791015625, 5.77587890625, 6.1331787109375, 6.490478515625, 6.8477783203125, 7.205078125, 7.5623779296875, 7.919677734375, 8.2769775390625, 8.63427734375, 8.9915771484375, 9.348876953125, 9.7061767578125, 10.0634765625, 10.4207763671875, 10.778076171875, 11.1353759765625, 11.49267578125, 11.8499755859375, 12.207275390625, 12.5645751953125, 12.921875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 5.0, 7.0, 9.0, 10.0, 20.0, 8.0, 13.0, 11.0, 16.0, 23.0, 29.0, 33.0, 24.0, 29.0, 44.0, 42.0, 25.0, 50.0, 46.0, 38.0, 50.0, 51.0, 50.0, 41.0, 36.0, 29.0, 28.0, 32.0, 38.0, 24.0, 26.0, 18.0, 16.0, 13.0, 10.0, 12.0, 7.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.7265625, -9.42431640625, -9.1220703125, -8.81982421875, -8.517578125, -8.21533203125, -7.9130859375, -7.61083984375, -7.30859375, -7.00634765625, -6.7041015625, -6.40185546875, -6.099609375, -5.79736328125, -5.4951171875, -5.19287109375, -4.890625, -4.58837890625, -4.2861328125, -3.98388671875, -3.681640625, -3.37939453125, -3.0771484375, -2.77490234375, -2.47265625, -2.17041015625, -1.8681640625, -1.56591796875, -1.263671875, -0.96142578125, -0.6591796875, -0.35693359375, -0.0546875, 0.24755859375, 0.5498046875, 0.85205078125, 1.154296875, 1.45654296875, 1.7587890625, 2.06103515625, 2.36328125, 2.66552734375, 2.9677734375, 3.27001953125, 3.572265625, 3.87451171875, 4.1767578125, 4.47900390625, 4.78125, 5.08349609375, 5.3857421875, 5.68798828125, 5.990234375, 6.29248046875, 6.5947265625, 6.89697265625, 7.19921875, 7.50146484375, 7.8037109375, 8.10595703125, 8.408203125, 8.71044921875, 9.0126953125, 9.31494140625, 9.6171875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 15.0, 15.0, 24.0, 45.0, 80.0, 104.0, 160.0, 265.0, 366.0, 588.0, 911.0, 1521.0, 2493.0, 3915.0, 6168.0, 10112.0, 16608.0, 26311.0, 40850.0, 62254.0, 89542.0, 117350.0, 136074.0, 137422.0, 119894.0, 93086.0, 65860.0, 43190.0, 27601.0, 17217.0, 10762.0, 6602.0, 4207.0, 2543.0, 1591.0, 1021.0, 626.0, 400.0, 258.0, 187.0, 105.0, 70.0, 43.0, 36.0, 20.0, 11.0, 10.0, 11.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1422119140625, -9.815673828125, -9.4891357421875, -9.16259765625, -8.8360595703125, -8.509521484375, -8.1829833984375, -7.8564453125, -7.5299072265625, -7.203369140625, -6.8768310546875, -6.55029296875, -6.2237548828125, -5.897216796875, -5.5706787109375, -5.244140625, -4.9176025390625, -4.591064453125, -4.2645263671875, -3.93798828125, -3.6114501953125, -3.284912109375, -2.9583740234375, -2.6318359375, -2.3052978515625, -1.978759765625, -1.6522216796875, -1.32568359375, -0.9991455078125, -0.672607421875, -0.3460693359375, -0.01953125, 0.3070068359375, 0.633544921875, 0.9600830078125, 1.28662109375, 1.6131591796875, 1.939697265625, 2.2662353515625, 2.5927734375, 2.9193115234375, 3.245849609375, 3.5723876953125, 3.89892578125, 4.2254638671875, 4.552001953125, 4.8785400390625, 5.205078125, 5.5316162109375, 5.858154296875, 6.1846923828125, 6.51123046875, 6.8377685546875, 7.164306640625, 7.4908447265625, 7.8173828125, 8.1439208984375, 8.470458984375, 8.7969970703125, 9.12353515625, 9.4500732421875, 9.776611328125, 10.1031494140625, 10.4296875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 7.0, 10.0, 14.0, 10.0, 8.0, 17.0, 28.0, 24.0, 37.0, 40.0, 36.0, 39.0, 36.0, 35.0, 43.0, 44.0, 36.0, 49.0, 50.0, 50.0, 38.0, 43.0, 28.0, 30.0, 30.0, 32.0, 25.0, 14.0, 22.0, 20.0, 14.0, 13.0, 9.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.35546875, -5.1781005859375, -5.000732421875, -4.8233642578125, -4.64599609375, -4.4686279296875, -4.291259765625, -4.1138916015625, -3.9365234375, -3.7591552734375, -3.581787109375, -3.4044189453125, -3.22705078125, -3.0496826171875, -2.872314453125, -2.6949462890625, -2.517578125, -2.3402099609375, -2.162841796875, -1.9854736328125, -1.80810546875, -1.6307373046875, -1.453369140625, -1.2760009765625, -1.0986328125, -0.9212646484375, -0.743896484375, -0.5665283203125, -0.38916015625, -0.2117919921875, -0.034423828125, 0.1429443359375, 0.3203125, 0.4976806640625, 0.675048828125, 0.8524169921875, 1.02978515625, 1.2071533203125, 1.384521484375, 1.5618896484375, 1.7392578125, 1.9166259765625, 2.093994140625, 2.2713623046875, 2.44873046875, 2.6260986328125, 2.803466796875, 2.9808349609375, 3.158203125, 3.3355712890625, 3.512939453125, 3.6903076171875, 3.86767578125, 4.0450439453125, 4.222412109375, 4.3997802734375, 4.5771484375, 4.7545166015625, 4.931884765625, 5.1092529296875, 5.28662109375, 5.4639892578125, 5.641357421875, 5.8187255859375, 5.99609375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 6.0, 14.0, 10.0, 16.0, 21.0, 26.0, 48.0, 80.0, 103.0, 150.0, 225.0, 360.0, 504.0, 778.0, 1300.0, 2085.0, 3508.0, 6243.0, 10815.0, 20394.0, 37239.0, 66385.0, 112221.0, 165778.0, 192223.0, 165537.0, 112497.0, 66268.0, 37090.0, 20220.0, 11113.0, 6165.0, 3539.0, 2070.0, 1246.0, 775.0, 512.0, 315.0, 208.0, 147.0, 94.0, 63.0, 47.0, 27.0, 22.0, 23.0, 15.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-6.23046875, -6.04986572265625, -5.8692626953125, -5.68865966796875, -5.508056640625, -5.32745361328125, -5.1468505859375, -4.96624755859375, -4.78564453125, -4.60504150390625, -4.4244384765625, -4.24383544921875, -4.063232421875, -3.88262939453125, -3.7020263671875, -3.52142333984375, -3.3408203125, -3.16021728515625, -2.9796142578125, -2.79901123046875, -2.618408203125, -2.43780517578125, -2.2572021484375, -2.07659912109375, -1.89599609375, -1.71539306640625, -1.5347900390625, -1.35418701171875, -1.173583984375, -0.99298095703125, -0.8123779296875, -0.63177490234375, -0.451171875, -0.27056884765625, -0.0899658203125, 0.09063720703125, 0.271240234375, 0.45184326171875, 0.6324462890625, 0.81304931640625, 0.99365234375, 1.17425537109375, 1.3548583984375, 1.53546142578125, 1.716064453125, 1.89666748046875, 2.0772705078125, 2.25787353515625, 2.4384765625, 2.61907958984375, 2.7996826171875, 2.98028564453125, 3.160888671875, 3.34149169921875, 3.5220947265625, 3.70269775390625, 3.88330078125, 4.06390380859375, 4.2445068359375, 4.42510986328125, 4.605712890625, 4.78631591796875, 4.9669189453125, 5.14752197265625, 5.328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 9.0, 8.0, 4.0, 8.0, 10.0, 19.0, 14.0, 25.0, 44.0, 42.0, 49.0, 56.0, 67.0, 65.0, 88.0, 70.0, 62.0, 59.0, 57.0, 48.0, 43.0, 42.0, 20.0, 24.0, 18.0, 18.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006918907165527344, -0.0006720125675201416, -0.0006521344184875488, -0.0006322562694549561, -0.0006123781204223633, -0.0005924999713897705, -0.0005726218223571777, -0.000552743673324585, -0.0005328655242919922, -0.0005129873752593994, -0.0004931092262268066, -0.00047323107719421387, -0.0004533529281616211, -0.0004334747791290283, -0.00041359663009643555, -0.0003937184810638428, -0.00037384033203125, -0.0003539621829986572, -0.00033408403396606445, -0.0003142058849334717, -0.0002943277359008789, -0.00027444958686828613, -0.00025457143783569336, -0.00023469328880310059, -0.0002148151397705078, -0.00019493699073791504, -0.00017505884170532227, -0.0001551806926727295, -0.00013530254364013672, -0.00011542439460754395, -9.554624557495117e-05, -7.56680965423584e-05, -5.5789947509765625e-05, -3.591179847717285e-05, -1.6033649444580078e-05, 3.844499588012695e-06, 2.372264862060547e-05, 4.360079765319824e-05, 6.347894668579102e-05, 8.335709571838379e-05, 0.00010323524475097656, 0.00012311339378356934, 0.0001429915428161621, 0.00016286969184875488, 0.00018274784088134766, 0.00020262598991394043, 0.0002225041389465332, 0.00024238228797912598, 0.00026226043701171875, 0.0002821385860443115, 0.0003020167350769043, 0.00032189488410949707, 0.00034177303314208984, 0.0003616511821746826, 0.0003815293312072754, 0.00040140748023986816, 0.00042128562927246094, 0.0004411637783050537, 0.0004610419273376465, 0.00048092007637023926, 0.000500798225402832, 0.0005206763744354248, 0.0005405545234680176, 0.0005604326725006104, 0.0005803108215332031]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 8.0, 18.0, 20.0, 29.0, 41.0, 83.0, 130.0, 142.0, 245.0, 341.0, 620.0, 939.0, 1552.0, 2508.0, 4238.0, 7322.0, 12581.0, 22236.0, 39696.0, 69184.0, 113847.0, 164196.0, 186134.0, 159360.0, 108949.0, 66204.0, 37799.0, 21000.0, 11887.0, 6825.0, 4002.0, 2391.0, 1454.0, 918.0, 565.0, 374.0, 230.0, 155.0, 106.0, 79.0, 39.0, 24.0, 23.0, 14.0, 15.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.625, -5.45684814453125, -5.2886962890625, -5.12054443359375, -4.952392578125, -4.78424072265625, -4.6160888671875, -4.44793701171875, -4.27978515625, -4.11163330078125, -3.9434814453125, -3.77532958984375, -3.607177734375, -3.43902587890625, -3.2708740234375, -3.10272216796875, -2.9345703125, -2.76641845703125, -2.5982666015625, -2.43011474609375, -2.261962890625, -2.09381103515625, -1.9256591796875, -1.75750732421875, -1.58935546875, -1.42120361328125, -1.2530517578125, -1.08489990234375, -0.916748046875, -0.74859619140625, -0.5804443359375, -0.41229248046875, -0.244140625, -0.07598876953125, 0.0921630859375, 0.26031494140625, 0.428466796875, 0.59661865234375, 0.7647705078125, 0.93292236328125, 1.10107421875, 1.26922607421875, 1.4373779296875, 1.60552978515625, 1.773681640625, 1.94183349609375, 2.1099853515625, 2.27813720703125, 2.4462890625, 2.61444091796875, 2.7825927734375, 2.95074462890625, 3.118896484375, 3.28704833984375, 3.4552001953125, 3.62335205078125, 3.79150390625, 3.95965576171875, 4.1278076171875, 4.29595947265625, 4.464111328125, 4.63226318359375, 4.8004150390625, 4.96856689453125, 5.13671875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 13.0, 7.0, 13.0, 13.0, 17.0, 22.0, 27.0, 25.0, 31.0, 37.0, 42.0, 55.0, 64.0, 45.0, 73.0, 64.0, 64.0, 48.0, 55.0, 41.0, 40.0, 30.0, 48.0, 26.0, 15.0, 17.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.374725341796875, -1.32659912109375, -1.278472900390625, -1.2303466796875, -1.182220458984375, -1.13409423828125, -1.085968017578125, -1.037841796875, -0.989715576171875, -0.94158935546875, -0.893463134765625, -0.8453369140625, -0.797210693359375, -0.74908447265625, -0.700958251953125, -0.65283203125, -0.604705810546875, -0.55657958984375, -0.508453369140625, -0.4603271484375, -0.412200927734375, -0.36407470703125, -0.315948486328125, -0.267822265625, -0.219696044921875, -0.17156982421875, -0.123443603515625, -0.0753173828125, -0.027191162109375, 0.02093505859375, 0.069061279296875, 0.1171875, 0.165313720703125, 0.21343994140625, 0.261566162109375, 0.3096923828125, 0.357818603515625, 0.40594482421875, 0.454071044921875, 0.502197265625, 0.550323486328125, 0.59844970703125, 0.646575927734375, 0.6947021484375, 0.742828369140625, 0.79095458984375, 0.839080810546875, 0.88720703125, 0.935333251953125, 0.98345947265625, 1.031585693359375, 1.0797119140625, 1.127838134765625, 1.17596435546875, 1.224090576171875, 1.272216796875, 1.320343017578125, 1.36846923828125, 1.416595458984375, 1.4647216796875, 1.512847900390625, 1.56097412109375, 1.609100341796875, 1.6572265625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 12.0, 12.0, 23.0, 25.0, 28.0, 26.0, 48.0, 44.0, 53.0, 57.0, 75.0, 63.0, 72.0, 77.0, 64.0, 60.0, 40.0, 32.0, 26.0, 27.0, 26.0, 14.0, 12.0, 11.0, 8.0, 14.0, 1.0, 3.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.33849334716797, -17.729873657226562, -17.121252059936523, -16.512632369995117, -15.904010772705078, -15.295391082763672, -14.68677043914795, -14.078149795532227, -13.469529151916504, -12.860908508300781, -12.252287864685059, -11.643667221069336, -11.03504753112793, -10.42642593383789, -9.817806243896484, -9.209185600280762, -8.600564956665039, -7.991944313049316, -7.383323669433594, -6.774703502655029, -6.166082859039307, -5.557462215423584, -4.9488420486450195, -4.340221405029297, -3.731600761413574, -3.1229801177978516, -2.514359712600708, -1.905739188194275, -1.2971186637878418, -0.6884980201721191, -0.07987761497497559, 0.528742790222168, 1.1373653411865234, 1.7459858655929565, 2.3546063899993896, 2.963226795196533, 3.571847438812256, 4.1804680824279785, 4.789088249206543, 5.397708892822266, 6.006329536437988, 6.614950180053711, 7.223570823669434, 7.832190990447998, 8.440811157226562, 9.049432754516602, 9.658052444458008, 10.26667308807373, 10.875293731689453, 11.483914375305176, 12.092535018920898, 12.701155662536621, 13.309776306152344, 13.91839599609375, 14.527016639709473, 15.135637283325195, 15.744257926940918, 16.35287857055664, 16.961498260498047, 17.570119857788086, 18.178739547729492, 18.78736114501953, 19.395980834960938, 20.004600524902344, 20.613222122192383]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 13.0, 12.0, 16.0, 13.0, 18.0, 28.0, 29.0, 23.0, 36.0, 31.0, 41.0, 51.0, 40.0, 52.0, 43.0, 54.0, 36.0, 45.0, 43.0, 50.0, 41.0, 36.0, 23.0, 22.0, 22.0, 20.0, 25.0, 18.0, 21.0, 11.0, 14.0, 7.0, 13.0, 10.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.433783531188965, -8.144537925720215, -7.855292797088623, -7.566047668457031, -7.276802062988281, -6.987556457519531, -6.6983113288879395, -6.409066200256348, -6.119820594787598, -5.830574989318848, -5.541329860687256, -5.252084732055664, -4.962839126586914, -4.673593521118164, -4.384348392486572, -4.0951032638549805, -3.8058576583862305, -3.5166122913360596, -3.2273669242858887, -2.9381215572357178, -2.648876190185547, -2.359630823135376, -2.070385456085205, -1.7811400890350342, -1.4918947219848633, -1.2026493549346924, -0.9134039878845215, -0.6241586208343506, -0.3349132537841797, -0.04566788673400879, 0.2435774803161621, 0.532822847366333, 0.8220691680908203, 1.1113145351409912, 1.400559902191162, 1.689805269241333, 1.979050636291504, 2.268296003341675, 2.5575413703918457, 2.8467867374420166, 3.1360321044921875, 3.4252774715423584, 3.7145228385925293, 4.003767967224121, 4.293013572692871, 4.582259178161621, 4.871504306793213, 5.160749435424805, 5.449995040893555, 5.739240646362305, 6.0284857749938965, 6.317730903625488, 6.606976509094238, 6.896222114562988, 7.18546724319458, 7.474712371826172, 7.763957977294922, 8.053203582763672, 8.342449188232422, 8.631693840026855, 8.920939445495605, 9.210185050964355, 9.499429702758789, 9.788675308227539, 10.077920913696289]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 18.0, 19.0, 27.0, 49.0, 96.0, 138.0, 215.0, 333.0, 599.0, 1103.0, 2050.0, 4011.0, 8126.0, 17486.0, 39255.0, 95415.0, 249939.0, 696532.0, 1447838.0, 1024094.0, 368907.0, 135293.0, 54827.0, 24062.0, 11402.0, 5603.0, 2924.0, 1630.0, 882.0, 535.0, 291.0, 188.0, 117.0, 84.0, 58.0, 43.0, 29.0, 19.0, 12.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.536376953125, -16.85400390625, -16.171630859375, -15.4892578125, -14.806884765625, -14.12451171875, -13.442138671875, -12.759765625, -12.077392578125, -11.39501953125, -10.712646484375, -10.0302734375, -9.347900390625, -8.66552734375, -7.983154296875, -7.30078125, -6.618408203125, -5.93603515625, -5.253662109375, -4.5712890625, -3.888916015625, -3.20654296875, -2.524169921875, -1.841796875, -1.159423828125, -0.47705078125, 0.205322265625, 0.8876953125, 1.570068359375, 2.25244140625, 2.934814453125, 3.6171875, 4.299560546875, 4.98193359375, 5.664306640625, 6.3466796875, 7.029052734375, 7.71142578125, 8.393798828125, 9.076171875, 9.758544921875, 10.44091796875, 11.123291015625, 11.8056640625, 12.488037109375, 13.17041015625, 13.852783203125, 14.53515625, 15.217529296875, 15.89990234375, 16.582275390625, 17.2646484375, 17.947021484375, 18.62939453125, 19.311767578125, 19.994140625, 20.676513671875, 21.35888671875, 22.041259765625, 22.7236328125, 23.406005859375, 24.08837890625, 24.770751953125, 25.453125]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 12.0, 12.0, 5.0, 10.0, 15.0, 21.0, 23.0, 30.0, 37.0, 36.0, 41.0, 46.0, 54.0, 43.0, 52.0, 37.0, 38.0, 53.0, 45.0, 56.0, 39.0, 38.0, 35.0, 29.0, 29.0, 26.0, 27.0, 18.0, 11.0, 20.0, 9.0, 6.0, 15.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.52386474609375, -6.2781982421875, -6.03253173828125, -5.786865234375, -5.54119873046875, -5.2955322265625, -5.04986572265625, -4.80419921875, -4.55853271484375, -4.3128662109375, -4.06719970703125, -3.821533203125, -3.57586669921875, -3.3302001953125, -3.08453369140625, -2.8388671875, -2.59320068359375, -2.3475341796875, -2.10186767578125, -1.856201171875, -1.61053466796875, -1.3648681640625, -1.11920166015625, -0.87353515625, -0.62786865234375, -0.3822021484375, -0.13653564453125, 0.109130859375, 0.35479736328125, 0.6004638671875, 0.84613037109375, 1.091796875, 1.33746337890625, 1.5831298828125, 1.82879638671875, 2.074462890625, 2.32012939453125, 2.5657958984375, 2.81146240234375, 3.05712890625, 3.30279541015625, 3.5484619140625, 3.79412841796875, 4.039794921875, 4.28546142578125, 4.5311279296875, 4.77679443359375, 5.0224609375, 5.26812744140625, 5.5137939453125, 5.75946044921875, 6.005126953125, 6.25079345703125, 6.4964599609375, 6.74212646484375, 6.98779296875, 7.23345947265625, 7.4791259765625, 7.72479248046875, 7.970458984375, 8.21612548828125, 8.4617919921875, 8.70745849609375, 8.953125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 7.0, 14.0, 24.0, 32.0, 46.0, 56.0, 93.0, 161.0, 252.0, 447.0, 723.0, 1250.0, 2294.0, 4227.0, 8081.0, 15567.0, 32151.0, 66691.0, 144174.0, 317426.0, 678610.0, 1111245.0, 928393.0, 473193.0, 216063.0, 98877.0, 46489.0, 22643.0, 11554.0, 6057.0, 3197.0, 1752.0, 998.0, 576.0, 338.0, 221.0, 132.0, 72.0, 53.0, 35.0, 16.0, 17.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.859375, -20.241455078125, -19.62353515625, -19.005615234375, -18.3876953125, -17.769775390625, -17.15185546875, -16.533935546875, -15.916015625, -15.298095703125, -14.68017578125, -14.062255859375, -13.4443359375, -12.826416015625, -12.20849609375, -11.590576171875, -10.97265625, -10.354736328125, -9.73681640625, -9.118896484375, -8.5009765625, -7.883056640625, -7.26513671875, -6.647216796875, -6.029296875, -5.411376953125, -4.79345703125, -4.175537109375, -3.5576171875, -2.939697265625, -2.32177734375, -1.703857421875, -1.0859375, -0.468017578125, 0.14990234375, 0.767822265625, 1.3857421875, 2.003662109375, 2.62158203125, 3.239501953125, 3.857421875, 4.475341796875, 5.09326171875, 5.711181640625, 6.3291015625, 6.947021484375, 7.56494140625, 8.182861328125, 8.80078125, 9.418701171875, 10.03662109375, 10.654541015625, 11.2724609375, 11.890380859375, 12.50830078125, 13.126220703125, 13.744140625, 14.362060546875, 14.97998046875, 15.597900390625, 16.2158203125, 16.833740234375, 17.45166015625, 18.069580078125, 18.6875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 7.0, 12.0, 15.0, 28.0, 36.0, 60.0, 64.0, 94.0, 132.0, 179.0, 239.0, 300.0, 323.0, 384.0, 397.0, 315.0, 327.0, 276.0, 215.0, 174.0, 144.0, 97.0, 78.0, 48.0, 33.0, 34.0, 20.0, 10.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1171875, -7.91162109375, -7.7060546875, -7.50048828125, -7.294921875, -7.08935546875, -6.8837890625, -6.67822265625, -6.47265625, -6.26708984375, -6.0615234375, -5.85595703125, -5.650390625, -5.44482421875, -5.2392578125, -5.03369140625, -4.828125, -4.62255859375, -4.4169921875, -4.21142578125, -4.005859375, -3.80029296875, -3.5947265625, -3.38916015625, -3.18359375, -2.97802734375, -2.7724609375, -2.56689453125, -2.361328125, -2.15576171875, -1.9501953125, -1.74462890625, -1.5390625, -1.33349609375, -1.1279296875, -0.92236328125, -0.716796875, -0.51123046875, -0.3056640625, -0.10009765625, 0.10546875, 0.31103515625, 0.5166015625, 0.72216796875, 0.927734375, 1.13330078125, 1.3388671875, 1.54443359375, 1.75, 1.95556640625, 2.1611328125, 2.36669921875, 2.572265625, 2.77783203125, 2.9833984375, 3.18896484375, 3.39453125, 3.60009765625, 3.8056640625, 4.01123046875, 4.216796875, 4.42236328125, 4.6279296875, 4.83349609375, 5.0390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 10.0, 14.0, 18.0, 21.0, 26.0, 28.0, 48.0, 52.0, 48.0, 75.0, 81.0, 68.0, 88.0, 65.0, 61.0, 58.0, 49.0, 33.0, 40.0, 20.0, 15.0, 17.0, 7.0, 12.0, 8.0, 7.0, 4.0, 0.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.16599464416504, -20.458349227905273, -19.750701904296875, -19.04305648803711, -18.335411071777344, -17.627765655517578, -16.92011833190918, -16.212472915649414, -15.504826545715332, -14.79718017578125, -14.089534759521484, -13.381888389587402, -12.67424201965332, -11.966596603393555, -11.258950233459473, -10.55130386352539, -9.843658447265625, -9.136012077331543, -8.428366661071777, -7.720720291137695, -7.0130743980407715, -6.305428504943848, -5.597782135009766, -4.890136241912842, -4.182490348815918, -3.474844455718994, -2.767198324203491, -2.0595521926879883, -1.3519062995910645, -0.6442604064941406, 0.0633859634399414, 0.7710318565368652, 1.4786758422851562, 2.18632173538208, 2.893967866897583, 3.601613998413086, 4.30925989151001, 5.016905784606934, 5.724552154541016, 6.4321980476379395, 7.139843940734863, 7.847489833831787, 8.555135726928711, 9.262782096862793, 9.970428466796875, 10.67807388305664, 11.385720252990723, 12.093366622924805, 12.80101203918457, 13.508658409118652, 14.216303825378418, 14.9239501953125, 15.631595611572266, 16.33924102783203, 17.04688835144043, 17.754533767700195, 18.462181091308594, 19.16982650756836, 19.877473831176758, 20.585119247436523, 21.29276466369629, 22.000411987304688, 22.708057403564453, 23.41570281982422, 24.123348236083984]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 7.0, 9.0, 14.0, 22.0, 23.0, 17.0, 28.0, 32.0, 31.0, 37.0, 26.0, 48.0, 37.0, 35.0, 46.0, 32.0, 46.0, 44.0, 46.0, 45.0, 49.0, 35.0, 35.0, 31.0, 35.0, 24.0, 22.0, 28.0, 18.0, 16.0, 9.0, 15.0, 3.0, 9.0, 5.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.962663173675537, -7.675048351287842, -7.387433052062988, -7.099818229675293, -6.812203407287598, -6.524588584899902, -6.236973285675049, -5.9493584632873535, -5.6617431640625, -5.374128341674805, -5.086513042449951, -4.798898220062256, -4.5112833976745605, -4.223668098449707, -3.9360532760620117, -3.6484384536743164, -3.360823631286621, -3.0732085704803467, -2.7855937480926514, -2.497978687286377, -2.2103638648986816, -1.9227488040924072, -1.6351337432861328, -1.3475189208984375, -1.059903860092163, -0.7722889184951782, -0.4846739172935486, -0.19705891609191895, 0.09055602550506592, 0.3781709671020508, 0.6657860279083252, 0.9534008502960205, 1.2410163879394531, 1.528631329536438, 1.8162462711334229, 2.1038613319396973, 2.3914761543273926, 2.679091215133667, 2.9667062759399414, 3.2543210983276367, 3.541936159133911, 3.8295512199401855, 4.117166042327881, 4.404781341552734, 4.69239616394043, 4.980010986328125, 5.26762580871582, 5.555240631103516, 5.842855930328369, 6.1304707527160645, 6.418086051940918, 6.705700874328613, 6.993315696716309, 7.280930519104004, 7.568545818328857, 7.856160640716553, 8.143775939941406, 8.431390762329102, 8.719005584716797, 9.006620407104492, 9.294236183166504, 9.5818510055542, 9.869465827941895, 10.15708065032959, 10.444695472717285]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 6.0, 10.0, 18.0, 24.0, 38.0, 35.0, 51.0, 76.0, 101.0, 145.0, 205.0, 267.0, 391.0, 601.0, 868.0, 1552.0, 2615.0, 4570.0, 8702.0, 17252.0, 37218.0, 81199.0, 164321.0, 251651.0, 227007.0, 130291.0, 61070.0, 28257.0, 13407.0, 6895.0, 3723.0, 2100.0, 1288.0, 840.0, 546.0, 380.0, 225.0, 181.0, 121.0, 78.0, 66.0, 44.0, 39.0, 18.0, 13.0, 14.0, 7.0, 4.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0], "bins": [-14.578125, -14.1470947265625, -13.716064453125, -13.2850341796875, -12.85400390625, -12.4229736328125, -11.991943359375, -11.5609130859375, -11.1298828125, -10.6988525390625, -10.267822265625, -9.8367919921875, -9.40576171875, -8.9747314453125, -8.543701171875, -8.1126708984375, -7.681640625, -7.2506103515625, -6.819580078125, -6.3885498046875, -5.95751953125, -5.5264892578125, -5.095458984375, -4.6644287109375, -4.2333984375, -3.8023681640625, -3.371337890625, -2.9403076171875, -2.50927734375, -2.0782470703125, -1.647216796875, -1.2161865234375, -0.78515625, -0.3541259765625, 0.076904296875, 0.5079345703125, 0.93896484375, 1.3699951171875, 1.801025390625, 2.2320556640625, 2.6630859375, 3.0941162109375, 3.525146484375, 3.9561767578125, 4.38720703125, 4.8182373046875, 5.249267578125, 5.6802978515625, 6.111328125, 6.5423583984375, 6.973388671875, 7.4044189453125, 7.83544921875, 8.2664794921875, 8.697509765625, 9.1285400390625, 9.5595703125, 9.9906005859375, 10.421630859375, 10.8526611328125, 11.28369140625, 11.7147216796875, 12.145751953125, 12.5767822265625, 13.0078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 7.0, 3.0, 5.0, 8.0, 10.0, 11.0, 20.0, 19.0, 17.0, 16.0, 25.0, 25.0, 24.0, 33.0, 26.0, 35.0, 34.0, 37.0, 36.0, 37.0, 35.0, 37.0, 42.0, 40.0, 47.0, 44.0, 30.0, 34.0, 32.0, 29.0, 24.0, 27.0, 20.0, 12.0, 19.0, 15.0, 11.0, 11.0, 8.0, 7.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.5390625, -8.2655029296875, -7.991943359375, -7.7183837890625, -7.44482421875, -7.1712646484375, -6.897705078125, -6.6241455078125, -6.3505859375, -6.0770263671875, -5.803466796875, -5.5299072265625, -5.25634765625, -4.9827880859375, -4.709228515625, -4.4356689453125, -4.162109375, -3.8885498046875, -3.614990234375, -3.3414306640625, -3.06787109375, -2.7943115234375, -2.520751953125, -2.2471923828125, -1.9736328125, -1.7000732421875, -1.426513671875, -1.1529541015625, -0.87939453125, -0.6058349609375, -0.332275390625, -0.0587158203125, 0.21484375, 0.4884033203125, 0.761962890625, 1.0355224609375, 1.30908203125, 1.5826416015625, 1.856201171875, 2.1297607421875, 2.4033203125, 2.6768798828125, 2.950439453125, 3.2239990234375, 3.49755859375, 3.7711181640625, 4.044677734375, 4.3182373046875, 4.591796875, 4.8653564453125, 5.138916015625, 5.4124755859375, 5.68603515625, 5.9595947265625, 6.233154296875, 6.5067138671875, 6.7802734375, 7.0538330078125, 7.327392578125, 7.6009521484375, 7.87451171875, 8.1480712890625, 8.421630859375, 8.6951904296875, 8.96875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 9.0, 18.0, 17.0, 23.0, 39.0, 31.0, 56.0, 79.0, 106.0, 172.0, 209.0, 298.0, 419.0, 690.0, 1065.0, 1839.0, 3412.0, 7570.0, 19542.0, 59221.0, 191086.0, 404617.0, 238431.0, 76038.0, 24595.0, 9176.0, 4168.0, 2101.0, 1271.0, 717.0, 472.0, 312.0, 215.0, 139.0, 110.0, 67.0, 55.0, 48.0, 35.0, 27.0, 12.0, 7.0, 9.0, 9.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.84375, -20.1396484375, -19.435546875, -18.7314453125, -18.02734375, -17.3232421875, -16.619140625, -15.9150390625, -15.2109375, -14.5068359375, -13.802734375, -13.0986328125, -12.39453125, -11.6904296875, -10.986328125, -10.2822265625, -9.578125, -8.8740234375, -8.169921875, -7.4658203125, -6.76171875, -6.0576171875, -5.353515625, -4.6494140625, -3.9453125, -3.2412109375, -2.537109375, -1.8330078125, -1.12890625, -0.4248046875, 0.279296875, 0.9833984375, 1.6875, 2.3916015625, 3.095703125, 3.7998046875, 4.50390625, 5.2080078125, 5.912109375, 6.6162109375, 7.3203125, 8.0244140625, 8.728515625, 9.4326171875, 10.13671875, 10.8408203125, 11.544921875, 12.2490234375, 12.953125, 13.6572265625, 14.361328125, 15.0654296875, 15.76953125, 16.4736328125, 17.177734375, 17.8818359375, 18.5859375, 19.2900390625, 19.994140625, 20.6982421875, 21.40234375, 22.1064453125, 22.810546875, 23.5146484375, 24.21875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 11.0, 15.0, 13.0, 12.0, 25.0, 24.0, 29.0, 37.0, 37.0, 41.0, 42.0, 43.0, 38.0, 36.0, 47.0, 47.0, 39.0, 42.0, 40.0, 49.0, 48.0, 25.0, 31.0, 25.0, 28.0, 23.0, 16.0, 16.0, 16.0, 16.0, 15.0, 12.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5859375, -5.40032958984375, -5.2147216796875, -5.02911376953125, -4.843505859375, -4.65789794921875, -4.4722900390625, -4.28668212890625, -4.10107421875, -3.91546630859375, -3.7298583984375, -3.54425048828125, -3.358642578125, -3.17303466796875, -2.9874267578125, -2.80181884765625, -2.6162109375, -2.43060302734375, -2.2449951171875, -2.05938720703125, -1.873779296875, -1.68817138671875, -1.5025634765625, -1.31695556640625, -1.13134765625, -0.94573974609375, -0.7601318359375, -0.57452392578125, -0.388916015625, -0.20330810546875, -0.0177001953125, 0.16790771484375, 0.353515625, 0.53912353515625, 0.7247314453125, 0.91033935546875, 1.095947265625, 1.28155517578125, 1.4671630859375, 1.65277099609375, 1.83837890625, 2.02398681640625, 2.2095947265625, 2.39520263671875, 2.580810546875, 2.76641845703125, 2.9520263671875, 3.13763427734375, 3.3232421875, 3.50885009765625, 3.6944580078125, 3.88006591796875, 4.065673828125, 4.25128173828125, 4.4368896484375, 4.62249755859375, 4.80810546875, 4.99371337890625, 5.1793212890625, 5.36492919921875, 5.550537109375, 5.73614501953125, 5.9217529296875, 6.10736083984375, 6.29296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 2.0, 7.0, 7.0, 22.0, 18.0, 20.0, 38.0, 45.0, 70.0, 83.0, 120.0, 166.0, 227.0, 266.0, 397.0, 549.0, 797.0, 1115.0, 1570.0, 2308.0, 3639.0, 6298.0, 13909.0, 48610.0, 243899.0, 528143.0, 139653.0, 30719.0, 10421.0, 5185.0, 3069.0, 2059.0, 1429.0, 1043.0, 730.0, 536.0, 362.0, 301.0, 189.0, 140.0, 111.0, 81.0, 68.0, 38.0, 29.0, 23.0, 13.0, 11.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0], "bins": [-17.140625, -16.655517578125, -16.17041015625, -15.685302734375, -15.2001953125, -14.715087890625, -14.22998046875, -13.744873046875, -13.259765625, -12.774658203125, -12.28955078125, -11.804443359375, -11.3193359375, -10.834228515625, -10.34912109375, -9.864013671875, -9.37890625, -8.893798828125, -8.40869140625, -7.923583984375, -7.4384765625, -6.953369140625, -6.46826171875, -5.983154296875, -5.498046875, -5.012939453125, -4.52783203125, -4.042724609375, -3.5576171875, -3.072509765625, -2.58740234375, -2.102294921875, -1.6171875, -1.132080078125, -0.64697265625, -0.161865234375, 0.3232421875, 0.808349609375, 1.29345703125, 1.778564453125, 2.263671875, 2.748779296875, 3.23388671875, 3.718994140625, 4.2041015625, 4.689208984375, 5.17431640625, 5.659423828125, 6.14453125, 6.629638671875, 7.11474609375, 7.599853515625, 8.0849609375, 8.570068359375, 9.05517578125, 9.540283203125, 10.025390625, 10.510498046875, 10.99560546875, 11.480712890625, 11.9658203125, 12.450927734375, 12.93603515625, 13.421142578125, 13.90625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 15.0, 33.0, 49.0, 119.0, 195.0, 243.0, 162.0, 78.0, 41.0, 18.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00164794921875, -0.0016115084290504456, -0.0015750676393508911, -0.0015386268496513367, -0.0015021860599517822, -0.0014657452702522278, -0.0014293044805526733, -0.001392863690853119, -0.0013564229011535645, -0.00131998211145401, -0.0012835413217544556, -0.0012471005320549011, -0.0012106597423553467, -0.0011742189526557922, -0.0011377781629562378, -0.0011013373732566833, -0.001064896583557129, -0.0010284557938575745, -0.00099201500415802, -0.0009555742144584656, -0.0009191334247589111, -0.0008826926350593567, -0.0008462518453598022, -0.0008098110556602478, -0.0007733702659606934, -0.0007369294762611389, -0.0007004886865615845, -0.00066404789686203, -0.0006276071071624756, -0.0005911663174629211, -0.0005547255277633667, -0.0005182847380638123, -0.0004818439483642578, -0.00044540315866470337, -0.0004089623689651489, -0.0003725215792655945, -0.00033608078956604004, -0.0002996399998664856, -0.00026319921016693115, -0.0002267584204673767, -0.00019031763076782227, -0.00015387684106826782, -0.00011743605136871338, -8.099526166915894e-05, -4.455447196960449e-05, -8.113682270050049e-06, 2.8327107429504395e-05, 6.476789712905884e-05, 0.00010120868682861328, 0.00013764947652816772, 0.00017409026622772217, 0.0002105310559272766, 0.00024697184562683105, 0.0002834126353263855, 0.00031985342502593994, 0.0003562942147254944, 0.00039273500442504883, 0.00042917579412460327, 0.0004656165838241577, 0.0005020573735237122, 0.0005384981632232666, 0.000574938952922821, 0.0006113797426223755, 0.0006478205323219299, 0.0006842613220214844]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 11.0, 9.0, 22.0, 19.0, 41.0, 46.0, 66.0, 96.0, 126.0, 164.0, 177.0, 284.0, 353.0, 448.0, 617.0, 867.0, 1123.0, 1411.0, 1849.0, 2648.0, 3688.0, 6422.0, 19218.0, 112551.0, 505271.0, 313304.0, 49546.0, 11120.0, 4871.0, 3067.0, 2219.0, 1654.0, 1254.0, 974.0, 734.0, 550.0, 427.0, 344.0, 272.0, 174.0, 143.0, 81.0, 79.0, 58.0, 34.0, 30.0, 24.0, 16.0, 14.0, 10.0, 6.0, 10.0, 3.0, 2.0, 0.0, 1.0, 5.0], "bins": [-16.171875, -15.6630859375, -15.154296875, -14.6455078125, -14.13671875, -13.6279296875, -13.119140625, -12.6103515625, -12.1015625, -11.5927734375, -11.083984375, -10.5751953125, -10.06640625, -9.5576171875, -9.048828125, -8.5400390625, -8.03125, -7.5224609375, -7.013671875, -6.5048828125, -5.99609375, -5.4873046875, -4.978515625, -4.4697265625, -3.9609375, -3.4521484375, -2.943359375, -2.4345703125, -1.92578125, -1.4169921875, -0.908203125, -0.3994140625, 0.109375, 0.6181640625, 1.126953125, 1.6357421875, 2.14453125, 2.6533203125, 3.162109375, 3.6708984375, 4.1796875, 4.6884765625, 5.197265625, 5.7060546875, 6.21484375, 6.7236328125, 7.232421875, 7.7412109375, 8.25, 8.7587890625, 9.267578125, 9.7763671875, 10.28515625, 10.7939453125, 11.302734375, 11.8115234375, 12.3203125, 12.8291015625, 13.337890625, 13.8466796875, 14.35546875, 14.8642578125, 15.373046875, 15.8818359375, 16.390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 10.0, 23.0, 55.0, 97.0, 144.0, 189.0, 195.0, 120.0, 71.0, 31.0, 19.0, 9.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.57171630859375, -3.4324951171875, -3.29327392578125, -3.154052734375, -3.01483154296875, -2.8756103515625, -2.73638916015625, -2.59716796875, -2.45794677734375, -2.3187255859375, -2.17950439453125, -2.040283203125, -1.90106201171875, -1.7618408203125, -1.62261962890625, -1.4833984375, -1.34417724609375, -1.2049560546875, -1.06573486328125, -0.926513671875, -0.78729248046875, -0.6480712890625, -0.50885009765625, -0.36962890625, -0.23040771484375, -0.0911865234375, 0.04803466796875, 0.187255859375, 0.32647705078125, 0.4656982421875, 0.60491943359375, 0.744140625, 0.88336181640625, 1.0225830078125, 1.16180419921875, 1.301025390625, 1.44024658203125, 1.5794677734375, 1.71868896484375, 1.85791015625, 1.99713134765625, 2.1363525390625, 2.27557373046875, 2.414794921875, 2.55401611328125, 2.6932373046875, 2.83245849609375, 2.9716796875, 3.11090087890625, 3.2501220703125, 3.38934326171875, 3.528564453125, 3.66778564453125, 3.8070068359375, 3.94622802734375, 4.08544921875, 4.22467041015625, 4.3638916015625, 4.50311279296875, 4.642333984375, 4.78155517578125, 4.9207763671875, 5.05999755859375, 5.19921875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 3.0, 15.0, 19.0, 18.0, 23.0, 22.0, 38.0, 30.0, 47.0, 70.0, 69.0, 72.0, 73.0, 86.0, 66.0, 59.0, 63.0, 52.0, 32.0, 26.0, 21.0, 18.0, 15.0, 14.0, 4.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.578258514404297, -19.88836097717285, -19.198463439941406, -18.50856590270996, -17.818668365478516, -17.12877082824707, -16.438873291015625, -15.74897575378418, -15.059078216552734, -14.369180679321289, -13.679283142089844, -12.989385604858398, -12.299488067626953, -11.609590530395508, -10.919692993164062, -10.229795455932617, -9.539897918701172, -8.850000381469727, -8.160102844238281, -7.470205307006836, -6.780307769775391, -6.090410232543945, -5.4005126953125, -4.710615158081055, -4.020717620849609, -3.330820083618164, -2.6409225463867188, -1.9510250091552734, -1.2611274719238281, -0.5712299346923828, 0.1186676025390625, 0.8085651397705078, 1.4984607696533203, 2.1883583068847656, 2.878255844116211, 3.5681533813476562, 4.258050918579102, 4.947948455810547, 5.637845993041992, 6.3277435302734375, 7.017641067504883, 7.707538604736328, 8.397436141967773, 9.087333679199219, 9.777231216430664, 10.46712875366211, 11.157026290893555, 11.846923828125, 12.536821365356445, 13.22671890258789, 13.916616439819336, 14.606513977050781, 15.296411514282227, 15.986309051513672, 16.676206588745117, 17.366104125976562, 18.056001663208008, 18.745899200439453, 19.4357967376709, 20.125694274902344, 20.81559181213379, 21.505489349365234, 22.19538688659668, 22.885284423828125, 23.57518196105957]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 5.0, 10.0, 17.0, 11.0, 22.0, 31.0, 19.0, 37.0, 31.0, 33.0, 26.0, 43.0, 43.0, 41.0, 47.0, 41.0, 40.0, 52.0, 44.0, 35.0, 52.0, 40.0, 33.0, 31.0, 31.0, 28.0, 25.0, 21.0, 15.0, 18.0, 12.0, 5.0, 12.0, 8.0, 5.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.086185455322266, -7.793124675750732, -7.500064373016357, -7.207003593444824, -6.913943290710449, -6.620882511138916, -6.327821731567383, -6.034761428833008, -5.741701126098633, -5.4486403465271, -5.155580043792725, -4.862519264221191, -4.569458961486816, -4.276398181915283, -3.983337640762329, -3.690277099609375, -3.397216320037842, -3.1041557788848877, -2.8110952377319336, -2.5180344581604004, -2.2249741554260254, -1.9319134950637817, -1.638852834701538, -1.345792293548584, -1.0527317523956299, -0.7596712112426758, -0.4666106104850769, -0.17355000972747803, 0.11951053142547607, 0.4125710725784302, 0.7056317329406738, 0.9986922740936279, 1.291752815246582, 1.5848133563995361, 1.8778738975524902, 2.1709346771240234, 2.4639949798583984, 2.7570557594299316, 3.0501163005828857, 3.34317684173584, 3.636237382888794, 3.929297924041748, 4.222358703613281, 4.515419006347656, 4.8084797859191895, 5.1015400886535645, 5.394600868225098, 5.687661170959473, 5.980721950531006, 6.273782730102539, 6.566843032836914, 6.859903812408447, 7.152964115142822, 7.4460248947143555, 7.7390851974487305, 8.032146453857422, 8.325206756591797, 8.618267059326172, 8.911328315734863, 9.204388618469238, 9.497448921203613, 9.790509223937988, 10.08357048034668, 10.376630783081055, 10.66969108581543]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 18.0, 8.0, 28.0, 34.0, 58.0, 79.0, 133.0, 186.0, 339.0, 510.0, 825.0, 1373.0, 2397.0, 4175.0, 7255.0, 13002.0, 23031.0, 40163.0, 68985.0, 108627.0, 149823.0, 172127.0, 157698.0, 117596.0, 75396.0, 44996.0, 25755.0, 14300.0, 8271.0, 4616.0, 2678.0, 1574.0, 942.0, 565.0, 328.0, 245.0, 142.0, 106.0, 62.0, 28.0, 24.0, 12.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6171875, -13.199462890625, -12.78173828125, -12.364013671875, -11.9462890625, -11.528564453125, -11.11083984375, -10.693115234375, -10.275390625, -9.857666015625, -9.43994140625, -9.022216796875, -8.6044921875, -8.186767578125, -7.76904296875, -7.351318359375, -6.93359375, -6.515869140625, -6.09814453125, -5.680419921875, -5.2626953125, -4.844970703125, -4.42724609375, -4.009521484375, -3.591796875, -3.174072265625, -2.75634765625, -2.338623046875, -1.9208984375, -1.503173828125, -1.08544921875, -0.667724609375, -0.25, 0.167724609375, 0.58544921875, 1.003173828125, 1.4208984375, 1.838623046875, 2.25634765625, 2.674072265625, 3.091796875, 3.509521484375, 3.92724609375, 4.344970703125, 4.7626953125, 5.180419921875, 5.59814453125, 6.015869140625, 6.43359375, 6.851318359375, 7.26904296875, 7.686767578125, 8.1044921875, 8.522216796875, 8.93994140625, 9.357666015625, 9.775390625, 10.193115234375, 10.61083984375, 11.028564453125, 11.4462890625, 11.864013671875, 12.28173828125, 12.699462890625, 13.1171875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 17.0, 11.0, 19.0, 15.0, 19.0, 20.0, 35.0, 25.0, 27.0, 38.0, 37.0, 43.0, 52.0, 52.0, 55.0, 45.0, 46.0, 43.0, 50.0, 50.0, 37.0, 34.0, 36.0, 28.0, 17.0, 27.0, 9.0, 23.0, 12.0, 24.0, 11.0, 6.0, 8.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.5906982421875, -9.243896484375, -8.8970947265625, -8.55029296875, -8.2034912109375, -7.856689453125, -7.5098876953125, -7.1630859375, -6.8162841796875, -6.469482421875, -6.1226806640625, -5.77587890625, -5.4290771484375, -5.082275390625, -4.7354736328125, -4.388671875, -4.0418701171875, -3.695068359375, -3.3482666015625, -3.00146484375, -2.6546630859375, -2.307861328125, -1.9610595703125, -1.6142578125, -1.2674560546875, -0.920654296875, -0.5738525390625, -0.22705078125, 0.1197509765625, 0.466552734375, 0.8133544921875, 1.16015625, 1.5069580078125, 1.853759765625, 2.2005615234375, 2.54736328125, 2.8941650390625, 3.240966796875, 3.5877685546875, 3.9345703125, 4.2813720703125, 4.628173828125, 4.9749755859375, 5.32177734375, 5.6685791015625, 6.015380859375, 6.3621826171875, 6.708984375, 7.0557861328125, 7.402587890625, 7.7493896484375, 8.09619140625, 8.4429931640625, 8.789794921875, 9.1365966796875, 9.4833984375, 9.8302001953125, 10.177001953125, 10.5238037109375, 10.87060546875, 11.2174072265625, 11.564208984375, 11.9110107421875, 12.2578125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 10.0, 7.0, 23.0, 28.0, 38.0, 53.0, 97.0, 121.0, 192.0, 340.0, 584.0, 956.0, 1619.0, 2750.0, 4834.0, 8322.0, 14699.0, 25574.0, 43380.0, 71347.0, 108012.0, 144377.0, 162831.0, 150217.0, 115359.0, 77824.0, 48045.0, 28700.0, 16232.0, 9292.0, 5325.0, 3064.0, 1690.0, 1004.0, 605.0, 380.0, 221.0, 129.0, 98.0, 56.0, 33.0, 28.0, 19.0, 13.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-14.53125, -14.1112060546875, -13.691162109375, -13.2711181640625, -12.85107421875, -12.4310302734375, -12.010986328125, -11.5909423828125, -11.1708984375, -10.7508544921875, -10.330810546875, -9.9107666015625, -9.49072265625, -9.0706787109375, -8.650634765625, -8.2305908203125, -7.810546875, -7.3905029296875, -6.970458984375, -6.5504150390625, -6.13037109375, -5.7103271484375, -5.290283203125, -4.8702392578125, -4.4501953125, -4.0301513671875, -3.610107421875, -3.1900634765625, -2.77001953125, -2.3499755859375, -1.929931640625, -1.5098876953125, -1.08984375, -0.6697998046875, -0.249755859375, 0.1702880859375, 0.59033203125, 1.0103759765625, 1.430419921875, 1.8504638671875, 2.2705078125, 2.6905517578125, 3.110595703125, 3.5306396484375, 3.95068359375, 4.3707275390625, 4.790771484375, 5.2108154296875, 5.630859375, 6.0509033203125, 6.470947265625, 6.8909912109375, 7.31103515625, 7.7310791015625, 8.151123046875, 8.5711669921875, 8.9912109375, 9.4112548828125, 9.831298828125, 10.2513427734375, 10.67138671875, 11.0914306640625, 11.511474609375, 11.9315185546875, 12.3515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 5.0, 15.0, 9.0, 9.0, 11.0, 14.0, 12.0, 15.0, 24.0, 25.0, 36.0, 20.0, 19.0, 32.0, 29.0, 29.0, 39.0, 37.0, 39.0, 35.0, 35.0, 46.0, 37.0, 50.0, 40.0, 27.0, 35.0, 34.0, 29.0, 33.0, 25.0, 20.0, 14.0, 16.0, 22.0, 16.0, 11.0, 11.0, 11.0, 4.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2890625, -5.10894775390625, -4.9288330078125, -4.74871826171875, -4.568603515625, -4.38848876953125, -4.2083740234375, -4.02825927734375, -3.84814453125, -3.66802978515625, -3.4879150390625, -3.30780029296875, -3.127685546875, -2.94757080078125, -2.7674560546875, -2.58734130859375, -2.4072265625, -2.22711181640625, -2.0469970703125, -1.86688232421875, -1.686767578125, -1.50665283203125, -1.3265380859375, -1.14642333984375, -0.96630859375, -0.78619384765625, -0.6060791015625, -0.42596435546875, -0.245849609375, -0.06573486328125, 0.1143798828125, 0.29449462890625, 0.474609375, 0.65472412109375, 0.8348388671875, 1.01495361328125, 1.195068359375, 1.37518310546875, 1.5552978515625, 1.73541259765625, 1.91552734375, 2.09564208984375, 2.2757568359375, 2.45587158203125, 2.635986328125, 2.81610107421875, 2.9962158203125, 3.17633056640625, 3.3564453125, 3.53656005859375, 3.7166748046875, 3.89678955078125, 4.076904296875, 4.25701904296875, 4.4371337890625, 4.61724853515625, 4.79736328125, 4.97747802734375, 5.1575927734375, 5.33770751953125, 5.517822265625, 5.69793701171875, 5.8780517578125, 6.05816650390625, 6.23828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 8.0, 8.0, 14.0, 19.0, 17.0, 48.0, 48.0, 72.0, 146.0, 194.0, 276.0, 416.0, 607.0, 1026.0, 1534.0, 2422.0, 4004.0, 6872.0, 12709.0, 23837.0, 49500.0, 101850.0, 188921.0, 245067.0, 194109.0, 106702.0, 51856.0, 25261.0, 12975.0, 7019.0, 4059.0, 2438.0, 1545.0, 935.0, 680.0, 455.0, 269.0, 195.0, 148.0, 87.0, 65.0, 54.0, 28.0, 24.0, 10.0, 13.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.3741455078125, -8.099853515625, -7.8255615234375, -7.55126953125, -7.2769775390625, -7.002685546875, -6.7283935546875, -6.4541015625, -6.1798095703125, -5.905517578125, -5.6312255859375, -5.35693359375, -5.0826416015625, -4.808349609375, -4.5340576171875, -4.259765625, -3.9854736328125, -3.711181640625, -3.4368896484375, -3.16259765625, -2.8883056640625, -2.614013671875, -2.3397216796875, -2.0654296875, -1.7911376953125, -1.516845703125, -1.2425537109375, -0.96826171875, -0.6939697265625, -0.419677734375, -0.1453857421875, 0.12890625, 0.4031982421875, 0.677490234375, 0.9517822265625, 1.22607421875, 1.5003662109375, 1.774658203125, 2.0489501953125, 2.3232421875, 2.5975341796875, 2.871826171875, 3.1461181640625, 3.42041015625, 3.6947021484375, 3.968994140625, 4.2432861328125, 4.517578125, 4.7918701171875, 5.066162109375, 5.3404541015625, 5.61474609375, 5.8890380859375, 6.163330078125, 6.4376220703125, 6.7119140625, 6.9862060546875, 7.260498046875, 7.5347900390625, 7.80908203125, 8.0833740234375, 8.357666015625, 8.6319580078125, 8.90625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 9.0, 6.0, 12.0, 16.0, 12.0, 34.0, 31.0, 38.0, 64.0, 77.0, 80.0, 73.0, 84.0, 99.0, 77.0, 65.0, 52.0, 47.0, 35.0, 19.0, 17.0, 16.0, 5.0, 5.0, 10.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008287429809570312, -0.0007984191179275513, -0.0007680952548980713, -0.0007377713918685913, -0.0007074475288391113, -0.0006771236658096313, -0.0006467998027801514, -0.0006164759397506714, -0.0005861520767211914, -0.0005558282136917114, -0.0005255043506622314, -0.0004951804876327515, -0.0004648566246032715, -0.0004345327615737915, -0.0004042088985443115, -0.00037388503551483154, -0.00034356117248535156, -0.0003132373094558716, -0.0002829134464263916, -0.0002525895833969116, -0.00022226572036743164, -0.00019194185733795166, -0.00016161799430847168, -0.0001312941312789917, -0.00010097026824951172, -7.064640522003174e-05, -4.032254219055176e-05, -9.998679161071777e-06, 2.0325183868408203e-05, 5.0649046897888184e-05, 8.097290992736816e-05, 0.00011129677295684814, 0.00014162063598632812, 0.0001719444990158081, 0.00020226836204528809, 0.00023259222507476807, 0.00026291608810424805, 0.00029323995113372803, 0.000323563814163208, 0.000353887677192688, 0.00038421154022216797, 0.00041453540325164795, 0.00044485926628112793, 0.0004751831293106079, 0.0005055069923400879, 0.0005358308553695679, 0.0005661547183990479, 0.0005964785814285278, 0.0006268024444580078, 0.0006571263074874878, 0.0006874501705169678, 0.0007177740335464478, 0.0007480978965759277, 0.0007784217596054077, 0.0008087456226348877, 0.0008390694856643677, 0.0008693933486938477, 0.0008997172117233276, 0.0009300410747528076, 0.0009603649377822876, 0.0009906888008117676, 0.0010210126638412476, 0.0010513365268707275, 0.0010816603899002075, 0.0011119842529296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 8.0, 13.0, 10.0, 22.0, 34.0, 43.0, 64.0, 98.0, 144.0, 217.0, 327.0, 496.0, 691.0, 1053.0, 1561.0, 2398.0, 3625.0, 5863.0, 9362.0, 15890.0, 26395.0, 45224.0, 76144.0, 120523.0, 164908.0, 178663.0, 146301.0, 98728.0, 59872.0, 35353.0, 20957.0, 12422.0, 7598.0, 4688.0, 3029.0, 1918.0, 1243.0, 866.0, 582.0, 403.0, 270.0, 182.0, 92.0, 98.0, 51.0, 48.0, 27.0, 16.0, 22.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.9049072265625, -5.716064453125, -5.5272216796875, -5.33837890625, -5.1495361328125, -4.960693359375, -4.7718505859375, -4.5830078125, -4.3941650390625, -4.205322265625, -4.0164794921875, -3.82763671875, -3.6387939453125, -3.449951171875, -3.2611083984375, -3.072265625, -2.8834228515625, -2.694580078125, -2.5057373046875, -2.31689453125, -2.1280517578125, -1.939208984375, -1.7503662109375, -1.5615234375, -1.3726806640625, -1.183837890625, -0.9949951171875, -0.80615234375, -0.6173095703125, -0.428466796875, -0.2396240234375, -0.05078125, 0.1380615234375, 0.326904296875, 0.5157470703125, 0.70458984375, 0.8934326171875, 1.082275390625, 1.2711181640625, 1.4599609375, 1.6488037109375, 1.837646484375, 2.0264892578125, 2.21533203125, 2.4041748046875, 2.593017578125, 2.7818603515625, 2.970703125, 3.1595458984375, 3.348388671875, 3.5372314453125, 3.72607421875, 3.9149169921875, 4.103759765625, 4.2926025390625, 4.4814453125, 4.6702880859375, 4.859130859375, 5.0479736328125, 5.23681640625, 5.4256591796875, 5.614501953125, 5.8033447265625, 5.9921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 6.0, 6.0, 4.0, 11.0, 9.0, 15.0, 17.0, 22.0, 19.0, 23.0, 30.0, 42.0, 49.0, 44.0, 43.0, 69.0, 65.0, 67.0, 70.0, 54.0, 48.0, 57.0, 30.0, 22.0, 33.0, 31.0, 31.0, 19.0, 14.0, 13.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.103515625, -2.042724609375, -1.98193359375, -1.921142578125, -1.8603515625, -1.799560546875, -1.73876953125, -1.677978515625, -1.6171875, -1.556396484375, -1.49560546875, -1.434814453125, -1.3740234375, -1.313232421875, -1.25244140625, -1.191650390625, -1.130859375, -1.070068359375, -1.00927734375, -0.948486328125, -0.8876953125, -0.826904296875, -0.76611328125, -0.705322265625, -0.64453125, -0.583740234375, -0.52294921875, -0.462158203125, -0.4013671875, -0.340576171875, -0.27978515625, -0.218994140625, -0.158203125, -0.097412109375, -0.03662109375, 0.024169921875, 0.0849609375, 0.145751953125, 0.20654296875, 0.267333984375, 0.328125, 0.388916015625, 0.44970703125, 0.510498046875, 0.5712890625, 0.632080078125, 0.69287109375, 0.753662109375, 0.814453125, 0.875244140625, 0.93603515625, 0.996826171875, 1.0576171875, 1.118408203125, 1.17919921875, 1.239990234375, 1.30078125, 1.361572265625, 1.42236328125, 1.483154296875, 1.5439453125, 1.604736328125, 1.66552734375, 1.726318359375, 1.787109375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 12.0, 10.0, 14.0, 18.0, 17.0, 20.0, 23.0, 30.0, 42.0, 48.0, 65.0, 65.0, 73.0, 62.0, 80.0, 78.0, 65.0, 54.0, 39.0, 38.0, 22.0, 25.0, 21.0, 14.0, 13.0, 14.0, 6.0, 11.0, 1.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.22071647644043, -18.55204963684082, -17.883380889892578, -17.21471405029297, -16.54604721069336, -15.877379417419434, -15.208711624145508, -14.540044784545898, -13.871376991271973, -13.202709197998047, -12.534042358398438, -11.865374565124512, -11.196706771850586, -10.528039932250977, -9.85937213897705, -9.190704345703125, -8.522037506103516, -7.853370189666748, -7.1847028732299805, -6.516035079956055, -5.847367763519287, -5.1787004470825195, -4.510032653808594, -3.841365337371826, -3.1726980209350586, -2.504030704498291, -1.8353631496429443, -1.1666955947875977, -0.4980282783508301, 0.1706390380859375, 0.8393068313598633, 1.5079741477966309, 2.1766414642333984, 2.845308780670166, 3.5139763355255127, 4.182643890380859, 4.851311206817627, 5.5199785232543945, 6.18864631652832, 6.857313632965088, 7.5259809494018555, 8.194648742675781, 8.86331558227539, 9.531983375549316, 10.200651168823242, 10.869318008422852, 11.537985801696777, 12.206653594970703, 12.875320434570312, 13.543988227844238, 14.212655067443848, 14.881322860717773, 15.549989700317383, 16.218658447265625, 16.887325286865234, 17.555992126464844, 18.224658966064453, 18.893325805664062, 19.561994552612305, 20.230661392211914, 20.899328231811523, 21.567996978759766, 22.236663818359375, 22.905330657958984, 23.573999404907227]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 11.0, 10.0, 10.0, 11.0, 5.0, 22.0, 15.0, 14.0, 20.0, 15.0, 28.0, 28.0, 31.0, 23.0, 43.0, 36.0, 20.0, 40.0, 38.0, 32.0, 37.0, 51.0, 37.0, 36.0, 27.0, 31.0, 36.0, 38.0, 31.0, 34.0, 20.0, 19.0, 23.0, 24.0, 9.0, 18.0, 17.0, 2.0, 10.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.744450569152832, -7.483931541442871, -7.22341251373291, -6.962893962860107, -6.7023749351501465, -6.4418559074401855, -6.181337356567383, -5.920818328857422, -5.660299301147461, -5.3997802734375, -5.139261245727539, -4.878742694854736, -4.618223667144775, -4.3577046394348145, -4.097186088562012, -3.836667060852051, -3.57614803314209, -3.315629005432129, -3.055110216140747, -2.7945914268493652, -2.5340723991394043, -2.2735533714294434, -2.0130345821380615, -1.7525156736373901, -1.4919967651367188, -1.2314778566360474, -0.970958948135376, -0.7104400396347046, -0.4499211311340332, -0.18940222263336182, 0.07111668586730957, 0.33163559436798096, 0.5921535491943359, 0.8526724576950073, 1.1131913661956787, 1.37371027469635, 1.6342291831970215, 1.8947480916976929, 2.1552670001983643, 2.415785789489746, 2.676304817199707, 2.936823844909668, 3.19734263420105, 3.4578614234924316, 3.7183804512023926, 3.9788994789123535, 4.239418029785156, 4.499937057495117, 4.760456085205078, 5.020975112915039, 5.281494140625, 5.542012691497803, 5.802531719207764, 6.063050746917725, 6.323569297790527, 6.584088325500488, 6.844607353210449, 7.10512638092041, 7.365645408630371, 7.626163959503174, 7.886682987213135, 8.147201538085938, 8.407720565795898, 8.66823959350586, 8.92875862121582]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 8.0, 27.0, 34.0, 60.0, 96.0, 154.0, 237.0, 307.0, 541.0, 903.0, 1395.0, 2593.0, 4367.0, 7605.0, 14153.0, 27345.0, 54478.0, 114518.0, 254984.0, 585474.0, 1133987.0, 1063404.0, 510661.0, 217767.0, 97877.0, 47018.0, 23839.0, 12736.0, 7205.0, 4109.0, 2406.0, 1399.0, 887.0, 548.0, 373.0, 245.0, 171.0, 97.0, 85.0, 42.0, 40.0, 20.0, 21.0, 15.0, 13.0, 6.0, 13.0, 8.0, 3.0, 4.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.7421875, -13.1676025390625, -12.593017578125, -12.0184326171875, -11.44384765625, -10.8692626953125, -10.294677734375, -9.7200927734375, -9.1455078125, -8.5709228515625, -7.996337890625, -7.4217529296875, -6.84716796875, -6.2725830078125, -5.697998046875, -5.1234130859375, -4.548828125, -3.9742431640625, -3.399658203125, -2.8250732421875, -2.25048828125, -1.6759033203125, -1.101318359375, -0.5267333984375, 0.0478515625, 0.6224365234375, 1.197021484375, 1.7716064453125, 2.34619140625, 2.9207763671875, 3.495361328125, 4.0699462890625, 4.64453125, 5.2191162109375, 5.793701171875, 6.3682861328125, 6.94287109375, 7.5174560546875, 8.092041015625, 8.6666259765625, 9.2412109375, 9.8157958984375, 10.390380859375, 10.9649658203125, 11.53955078125, 12.1141357421875, 12.688720703125, 13.2633056640625, 13.837890625, 14.4124755859375, 14.987060546875, 15.5616455078125, 16.13623046875, 16.7108154296875, 17.285400390625, 17.8599853515625, 18.4345703125, 19.0091552734375, 19.583740234375, 20.1583251953125, 20.73291015625, 21.3074951171875, 21.882080078125, 22.4566650390625, 23.03125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 10.0, 12.0, 16.0, 14.0, 15.0, 24.0, 21.0, 18.0, 18.0, 37.0, 42.0, 33.0, 38.0, 50.0, 49.0, 39.0, 47.0, 48.0, 43.0, 45.0, 56.0, 47.0, 37.0, 36.0, 34.0, 19.0, 23.0, 17.0, 22.0, 20.0, 8.0, 14.0, 9.0, 9.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.2803955078125, -7.021728515625, -6.7630615234375, -6.50439453125, -6.2457275390625, -5.987060546875, -5.7283935546875, -5.4697265625, -5.2110595703125, -4.952392578125, -4.6937255859375, -4.43505859375, -4.1763916015625, -3.917724609375, -3.6590576171875, -3.400390625, -3.1417236328125, -2.883056640625, -2.6243896484375, -2.36572265625, -2.1070556640625, -1.848388671875, -1.5897216796875, -1.3310546875, -1.0723876953125, -0.813720703125, -0.5550537109375, -0.29638671875, -0.0377197265625, 0.220947265625, 0.4796142578125, 0.73828125, 0.9969482421875, 1.255615234375, 1.5142822265625, 1.77294921875, 2.0316162109375, 2.290283203125, 2.5489501953125, 2.8076171875, 3.0662841796875, 3.324951171875, 3.5836181640625, 3.84228515625, 4.1009521484375, 4.359619140625, 4.6182861328125, 4.876953125, 5.1356201171875, 5.394287109375, 5.6529541015625, 5.91162109375, 6.1702880859375, 6.428955078125, 6.6876220703125, 6.9462890625, 7.2049560546875, 7.463623046875, 7.7222900390625, 7.98095703125, 8.2396240234375, 8.498291015625, 8.7569580078125, 9.015625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 1.0, 9.0, 21.0, 27.0, 32.0, 46.0, 65.0, 103.0, 171.0, 225.0, 370.0, 614.0, 973.0, 1569.0, 2681.0, 4457.0, 7570.0, 13582.0, 24706.0, 46361.0, 88545.0, 173028.0, 334746.0, 623080.0, 942603.0, 856483.0, 510840.0, 267856.0, 137360.0, 70748.0, 37817.0, 20372.0, 11242.0, 6387.0, 3732.0, 2171.0, 1378.0, 837.0, 530.0, 334.0, 213.0, 134.0, 74.0, 58.0, 46.0, 23.0, 17.0, 15.0, 11.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0], "bins": [-18.328125, -17.786376953125, -17.24462890625, -16.702880859375, -16.1611328125, -15.619384765625, -15.07763671875, -14.535888671875, -13.994140625, -13.452392578125, -12.91064453125, -12.368896484375, -11.8271484375, -11.285400390625, -10.74365234375, -10.201904296875, -9.66015625, -9.118408203125, -8.57666015625, -8.034912109375, -7.4931640625, -6.951416015625, -6.40966796875, -5.867919921875, -5.326171875, -4.784423828125, -4.24267578125, -3.700927734375, -3.1591796875, -2.617431640625, -2.07568359375, -1.533935546875, -0.9921875, -0.450439453125, 0.09130859375, 0.633056640625, 1.1748046875, 1.716552734375, 2.25830078125, 2.800048828125, 3.341796875, 3.883544921875, 4.42529296875, 4.967041015625, 5.5087890625, 6.050537109375, 6.59228515625, 7.134033203125, 7.67578125, 8.217529296875, 8.75927734375, 9.301025390625, 9.8427734375, 10.384521484375, 10.92626953125, 11.468017578125, 12.009765625, 12.551513671875, 13.09326171875, 13.635009765625, 14.1767578125, 14.718505859375, 15.26025390625, 15.802001953125, 16.34375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 15.0, 20.0, 18.0, 24.0, 37.0, 39.0, 39.0, 73.0, 78.0, 106.0, 97.0, 111.0, 152.0, 201.0, 188.0, 234.0, 253.0, 268.0, 247.0, 258.0, 220.0, 240.0, 205.0, 183.0, 144.0, 115.0, 108.0, 84.0, 73.0, 48.0, 42.0, 18.0, 26.0, 26.0, 14.0, 12.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.49609375, -4.3480224609375, -4.199951171875, -4.0518798828125, -3.90380859375, -3.7557373046875, -3.607666015625, -3.4595947265625, -3.3115234375, -3.1634521484375, -3.015380859375, -2.8673095703125, -2.71923828125, -2.5711669921875, -2.423095703125, -2.2750244140625, -2.126953125, -1.9788818359375, -1.830810546875, -1.6827392578125, -1.53466796875, -1.3865966796875, -1.238525390625, -1.0904541015625, -0.9423828125, -0.7943115234375, -0.646240234375, -0.4981689453125, -0.35009765625, -0.2020263671875, -0.053955078125, 0.0941162109375, 0.2421875, 0.3902587890625, 0.538330078125, 0.6864013671875, 0.83447265625, 0.9825439453125, 1.130615234375, 1.2786865234375, 1.4267578125, 1.5748291015625, 1.722900390625, 1.8709716796875, 2.01904296875, 2.1671142578125, 2.315185546875, 2.4632568359375, 2.611328125, 2.7593994140625, 2.907470703125, 3.0555419921875, 3.20361328125, 3.3516845703125, 3.499755859375, 3.6478271484375, 3.7958984375, 3.9439697265625, 4.092041015625, 4.2401123046875, 4.38818359375, 4.5362548828125, 4.684326171875, 4.8323974609375, 4.98046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 8.0, 4.0, 13.0, 11.0, 12.0, 15.0, 16.0, 27.0, 32.0, 37.0, 39.0, 51.0, 72.0, 71.0, 61.0, 86.0, 68.0, 62.0, 58.0, 49.0, 37.0, 28.0, 26.0, 23.0, 20.0, 12.0, 9.0, 12.0, 8.0, 6.0, 3.0, 1.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71157455444336, -19.039499282836914, -18.36742401123047, -17.695348739624023, -17.023273468017578, -16.351198196411133, -15.679121971130371, -15.007046699523926, -14.33497142791748, -13.662896156311035, -12.99082088470459, -12.318744659423828, -11.646669387817383, -10.974594116210938, -10.302518844604492, -9.630443572998047, -8.958368301391602, -8.286293029785156, -7.614217758178711, -6.942142009735107, -6.270066738128662, -5.597991466522217, -4.925915718078613, -4.253840446472168, -3.5817651748657227, -2.9096899032592773, -2.237614393234253, -1.5655388832092285, -0.8934636116027832, -0.2213883399963379, 0.4506874084472656, 1.122762680053711, 1.794839859008789, 2.4669151306152344, 3.138990640640259, 3.811066150665283, 4.4831414222717285, 5.155216693878174, 5.827292442321777, 6.499367713928223, 7.171442985534668, 7.843518257141113, 8.515593528747559, 9.18766975402832, 9.859745025634766, 10.531820297241211, 11.203895568847656, 11.875970840454102, 12.548046112060547, 13.220121383666992, 13.892196655273438, 14.564271926879883, 15.236347198486328, 15.908422470092773, 16.58049774169922, 17.252574920654297, 17.92464828491211, 18.596723556518555, 19.268798828125, 19.940874099731445, 20.61294937133789, 21.285024642944336, 21.95709991455078, 22.62917709350586, 23.301252365112305]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 14.0, 19.0, 18.0, 16.0, 19.0, 28.0, 29.0, 21.0, 40.0, 41.0, 31.0, 43.0, 42.0, 44.0, 41.0, 58.0, 54.0, 42.0, 35.0, 33.0, 37.0, 39.0, 27.0, 29.0, 30.0, 24.0, 19.0, 22.0, 16.0, 13.0, 9.0, 11.0, 5.0, 6.0, 7.0, 0.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.642413139343262, -9.33700942993164, -9.03160572052002, -8.726202011108398, -8.420797348022461, -8.11539363861084, -7.809989929199219, -7.504586219787598, -7.199182510375977, -6.8937788009643555, -6.588375091552734, -6.282970905303955, -5.977567195892334, -5.672163486480713, -5.366759300231934, -5.0613555908203125, -4.755951881408691, -4.45054817199707, -4.145144462585449, -3.83974027633667, -3.534336566925049, -3.2289328575134277, -2.9235289096832275, -2.6181249618530273, -2.3127212524414062, -2.007317543029785, -1.701913595199585, -1.3965097665786743, -1.0911059379577637, -0.785702109336853, -0.4802982807159424, -0.1748943328857422, 0.1305093765258789, 0.43591320514678955, 0.7413170337677002, 1.0467208623886108, 1.3521246910095215, 1.6575285196304321, 1.9629323482513428, 2.268336296081543, 2.573740005493164, 2.879143714904785, 3.1845476627349854, 3.4899516105651855, 3.7953553199768066, 4.100759029388428, 4.406163215637207, 4.711566925048828, 5.016970634460449, 5.32237434387207, 5.627778053283691, 5.933182239532471, 6.238585948944092, 6.543989658355713, 6.849393844604492, 7.154797554016113, 7.460201263427734, 7.7656049728393555, 8.071008682250977, 8.376412391662598, 8.681816101074219, 8.987220764160156, 9.292624473571777, 9.598028182983398, 9.90343189239502]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 9.0, 11.0, 7.0, 9.0, 23.0, 37.0, 42.0, 60.0, 81.0, 144.0, 210.0, 299.0, 461.0, 822.0, 1302.0, 2210.0, 4300.0, 8350.0, 17642.0, 38591.0, 84483.0, 168683.0, 250725.0, 224094.0, 129689.0, 61331.0, 27650.0, 12988.0, 6362.0, 3262.0, 1849.0, 1035.0, 590.0, 389.0, 265.0, 170.0, 127.0, 85.0, 44.0, 41.0, 25.0, 22.0, 10.0, 11.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.546875, -12.139404296875, -11.73193359375, -11.324462890625, -10.9169921875, -10.509521484375, -10.10205078125, -9.694580078125, -9.287109375, -8.879638671875, -8.47216796875, -8.064697265625, -7.6572265625, -7.249755859375, -6.84228515625, -6.434814453125, -6.02734375, -5.619873046875, -5.21240234375, -4.804931640625, -4.3974609375, -3.989990234375, -3.58251953125, -3.175048828125, -2.767578125, -2.360107421875, -1.95263671875, -1.545166015625, -1.1376953125, -0.730224609375, -0.32275390625, 0.084716796875, 0.4921875, 0.899658203125, 1.30712890625, 1.714599609375, 2.1220703125, 2.529541015625, 2.93701171875, 3.344482421875, 3.751953125, 4.159423828125, 4.56689453125, 4.974365234375, 5.3818359375, 5.789306640625, 6.19677734375, 6.604248046875, 7.01171875, 7.419189453125, 7.82666015625, 8.234130859375, 8.6416015625, 9.049072265625, 9.45654296875, 9.864013671875, 10.271484375, 10.678955078125, 11.08642578125, 11.493896484375, 11.9013671875, 12.308837890625, 12.71630859375, 13.123779296875, 13.53125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 9.0, 5.0, 4.0, 12.0, 10.0, 15.0, 17.0, 16.0, 18.0, 27.0, 30.0, 23.0, 32.0, 37.0, 47.0, 49.0, 40.0, 40.0, 52.0, 49.0, 46.0, 51.0, 43.0, 41.0, 46.0, 31.0, 21.0, 26.0, 26.0, 25.0, 18.0, 14.0, 18.0, 19.0, 12.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.94677734375, -9.5966796875, -9.24658203125, -8.896484375, -8.54638671875, -8.1962890625, -7.84619140625, -7.49609375, -7.14599609375, -6.7958984375, -6.44580078125, -6.095703125, -5.74560546875, -5.3955078125, -5.04541015625, -4.6953125, -4.34521484375, -3.9951171875, -3.64501953125, -3.294921875, -2.94482421875, -2.5947265625, -2.24462890625, -1.89453125, -1.54443359375, -1.1943359375, -0.84423828125, -0.494140625, -0.14404296875, 0.2060546875, 0.55615234375, 0.90625, 1.25634765625, 1.6064453125, 1.95654296875, 2.306640625, 2.65673828125, 3.0068359375, 3.35693359375, 3.70703125, 4.05712890625, 4.4072265625, 4.75732421875, 5.107421875, 5.45751953125, 5.8076171875, 6.15771484375, 6.5078125, 6.85791015625, 7.2080078125, 7.55810546875, 7.908203125, 8.25830078125, 8.6083984375, 8.95849609375, 9.30859375, 9.65869140625, 10.0087890625, 10.35888671875, 10.708984375, 11.05908203125, 11.4091796875, 11.75927734375, 12.109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 11.0, 12.0, 23.0, 33.0, 41.0, 49.0, 100.0, 150.0, 231.0, 334.0, 468.0, 781.0, 1279.0, 2125.0, 3800.0, 6989.0, 13311.0, 26638.0, 55028.0, 113970.0, 213836.0, 262710.0, 173486.0, 87292.0, 41804.0, 20388.0, 10171.0, 5562.0, 3166.0, 1749.0, 1071.0, 661.0, 420.0, 263.0, 194.0, 122.0, 85.0, 60.0, 37.0, 34.0, 20.0, 11.0, 15.0, 9.0, 4.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1015625, -13.67822265625, -13.2548828125, -12.83154296875, -12.408203125, -11.98486328125, -11.5615234375, -11.13818359375, -10.71484375, -10.29150390625, -9.8681640625, -9.44482421875, -9.021484375, -8.59814453125, -8.1748046875, -7.75146484375, -7.328125, -6.90478515625, -6.4814453125, -6.05810546875, -5.634765625, -5.21142578125, -4.7880859375, -4.36474609375, -3.94140625, -3.51806640625, -3.0947265625, -2.67138671875, -2.248046875, -1.82470703125, -1.4013671875, -0.97802734375, -0.5546875, -0.13134765625, 0.2919921875, 0.71533203125, 1.138671875, 1.56201171875, 1.9853515625, 2.40869140625, 2.83203125, 3.25537109375, 3.6787109375, 4.10205078125, 4.525390625, 4.94873046875, 5.3720703125, 5.79541015625, 6.21875, 6.64208984375, 7.0654296875, 7.48876953125, 7.912109375, 8.33544921875, 8.7587890625, 9.18212890625, 9.60546875, 10.02880859375, 10.4521484375, 10.87548828125, 11.298828125, 11.72216796875, 12.1455078125, 12.56884765625, 12.9921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 9.0, 14.0, 15.0, 10.0, 27.0, 24.0, 19.0, 28.0, 47.0, 50.0, 50.0, 40.0, 51.0, 53.0, 55.0, 54.0, 47.0, 39.0, 53.0, 38.0, 40.0, 47.0, 25.0, 28.0, 33.0, 19.0, 13.0, 7.0, 7.0, 12.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.01171875, -5.78448486328125, -5.5572509765625, -5.33001708984375, -5.102783203125, -4.87554931640625, -4.6483154296875, -4.42108154296875, -4.19384765625, -3.96661376953125, -3.7393798828125, -3.51214599609375, -3.284912109375, -3.05767822265625, -2.8304443359375, -2.60321044921875, -2.3759765625, -2.14874267578125, -1.9215087890625, -1.69427490234375, -1.467041015625, -1.23980712890625, -1.0125732421875, -0.78533935546875, -0.55810546875, -0.33087158203125, -0.1036376953125, 0.12359619140625, 0.350830078125, 0.57806396484375, 0.8052978515625, 1.03253173828125, 1.259765625, 1.48699951171875, 1.7142333984375, 1.94146728515625, 2.168701171875, 2.39593505859375, 2.6231689453125, 2.85040283203125, 3.07763671875, 3.30487060546875, 3.5321044921875, 3.75933837890625, 3.986572265625, 4.21380615234375, 4.4410400390625, 4.66827392578125, 4.8955078125, 5.12274169921875, 5.3499755859375, 5.57720947265625, 5.804443359375, 6.03167724609375, 6.2589111328125, 6.48614501953125, 6.71337890625, 6.94061279296875, 7.1678466796875, 7.39508056640625, 7.622314453125, 7.84954833984375, 8.0767822265625, 8.30401611328125, 8.53125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 13.0, 26.0, 14.0, 26.0, 32.0, 51.0, 71.0, 99.0, 145.0, 245.0, 352.0, 564.0, 920.0, 1430.0, 2515.0, 4468.0, 8459.0, 17344.0, 37362.0, 85058.0, 189990.0, 305712.0, 212550.0, 97515.0, 42626.0, 19561.0, 9549.0, 4982.0, 2627.0, 1593.0, 917.0, 591.0, 359.0, 269.0, 167.0, 88.0, 71.0, 58.0, 31.0, 27.0, 16.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.68359375, -7.44775390625, -7.2119140625, -6.97607421875, -6.740234375, -6.50439453125, -6.2685546875, -6.03271484375, -5.796875, -5.56103515625, -5.3251953125, -5.08935546875, -4.853515625, -4.61767578125, -4.3818359375, -4.14599609375, -3.91015625, -3.67431640625, -3.4384765625, -3.20263671875, -2.966796875, -2.73095703125, -2.4951171875, -2.25927734375, -2.0234375, -1.78759765625, -1.5517578125, -1.31591796875, -1.080078125, -0.84423828125, -0.6083984375, -0.37255859375, -0.13671875, 0.09912109375, 0.3349609375, 0.57080078125, 0.806640625, 1.04248046875, 1.2783203125, 1.51416015625, 1.75, 1.98583984375, 2.2216796875, 2.45751953125, 2.693359375, 2.92919921875, 3.1650390625, 3.40087890625, 3.63671875, 3.87255859375, 4.1083984375, 4.34423828125, 4.580078125, 4.81591796875, 5.0517578125, 5.28759765625, 5.5234375, 5.75927734375, 5.9951171875, 6.23095703125, 6.466796875, 6.70263671875, 6.9384765625, 7.17431640625, 7.41015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 9.0, 9.0, 11.0, 11.0, 17.0, 18.0, 26.0, 35.0, 55.0, 51.0, 67.0, 80.0, 60.0, 73.0, 84.0, 72.0, 67.0, 48.0, 54.0, 40.0, 23.0, 18.0, 15.0, 11.0, 7.0, 4.0, 5.0, 8.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000423431396484375, -0.0004111379384994507, -0.00039884448051452637, -0.00038655102252960205, -0.00037425756454467773, -0.0003619641065597534, -0.0003496706485748291, -0.0003373771905899048, -0.00032508373260498047, -0.00031279027462005615, -0.00030049681663513184, -0.0002882033586502075, -0.0002759099006652832, -0.0002636164426803589, -0.00025132298469543457, -0.00023902952671051025, -0.00022673606872558594, -0.00021444261074066162, -0.0002021491527557373, -0.000189855694770813, -0.00017756223678588867, -0.00016526877880096436, -0.00015297532081604004, -0.00014068186283111572, -0.0001283884048461914, -0.00011609494686126709, -0.00010380148887634277, -9.150803089141846e-05, -7.921457290649414e-05, -6.692111492156982e-05, -5.462765693664551e-05, -4.233419895172119e-05, -3.0040740966796875e-05, -1.774728298187256e-05, -5.453824996948242e-06, 6.839632987976074e-06, 1.913309097290039e-05, 3.142654895782471e-05, 4.3720006942749023e-05, 5.601346492767334e-05, 6.830692291259766e-05, 8.060038089752197e-05, 9.289383888244629e-05, 0.0001051872968673706, 0.00011748075485229492, 0.00012977421283721924, 0.00014206767082214355, 0.00015436112880706787, 0.0001666545867919922, 0.0001789480447769165, 0.00019124150276184082, 0.00020353496074676514, 0.00021582841873168945, 0.00022812187671661377, 0.00024041533470153809, 0.0002527087926864624, 0.0002650022506713867, 0.00027729570865631104, 0.00028958916664123535, 0.00030188262462615967, 0.000314176082611084, 0.0003264695405960083, 0.0003387629985809326, 0.00035105645656585693, 0.00036334991455078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 8.0, 5.0, 9.0, 16.0, 22.0, 31.0, 39.0, 67.0, 62.0, 128.0, 189.0, 277.0, 483.0, 730.0, 1246.0, 2268.0, 4791.0, 10893.0, 29134.0, 83362.0, 212005.0, 327488.0, 227316.0, 92763.0, 32154.0, 11986.0, 5106.0, 2472.0, 1313.0, 780.0, 496.0, 339.0, 164.0, 130.0, 88.0, 63.0, 26.0, 24.0, 23.0, 14.0, 19.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.47265625, -8.1953125, -7.91796875, -7.640625, -7.36328125, -7.0859375, -6.80859375, -6.53125, -6.25390625, -5.9765625, -5.69921875, -5.421875, -5.14453125, -4.8671875, -4.58984375, -4.3125, -4.03515625, -3.7578125, -3.48046875, -3.203125, -2.92578125, -2.6484375, -2.37109375, -2.09375, -1.81640625, -1.5390625, -1.26171875, -0.984375, -0.70703125, -0.4296875, -0.15234375, 0.125, 0.40234375, 0.6796875, 0.95703125, 1.234375, 1.51171875, 1.7890625, 2.06640625, 2.34375, 2.62109375, 2.8984375, 3.17578125, 3.453125, 3.73046875, 4.0078125, 4.28515625, 4.5625, 4.83984375, 5.1171875, 5.39453125, 5.671875, 5.94921875, 6.2265625, 6.50390625, 6.78125, 7.05859375, 7.3359375, 7.61328125, 7.890625, 8.16796875, 8.4453125, 8.72265625, 9.0]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 4.0, 4.0, 9.0, 17.0, 15.0, 45.0, 35.0, 26.0, 54.0, 63.0, 70.0, 79.0, 92.0, 90.0, 67.0, 70.0, 58.0, 46.0, 31.0, 21.0, 31.0, 14.0, 11.0, 6.0, 6.0, 12.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6171875, -1.56268310546875, -1.5081787109375, -1.45367431640625, -1.399169921875, -1.34466552734375, -1.2901611328125, -1.23565673828125, -1.18115234375, -1.12664794921875, -1.0721435546875, -1.01763916015625, -0.963134765625, -0.90863037109375, -0.8541259765625, -0.79962158203125, -0.7451171875, -0.69061279296875, -0.6361083984375, -0.58160400390625, -0.527099609375, -0.47259521484375, -0.4180908203125, -0.36358642578125, -0.30908203125, -0.25457763671875, -0.2000732421875, -0.14556884765625, -0.091064453125, -0.03656005859375, 0.0179443359375, 0.07244873046875, 0.126953125, 0.18145751953125, 0.2359619140625, 0.29046630859375, 0.344970703125, 0.39947509765625, 0.4539794921875, 0.50848388671875, 0.56298828125, 0.61749267578125, 0.6719970703125, 0.72650146484375, 0.781005859375, 0.83551025390625, 0.8900146484375, 0.94451904296875, 0.9990234375, 1.05352783203125, 1.1080322265625, 1.16253662109375, 1.217041015625, 1.27154541015625, 1.3260498046875, 1.38055419921875, 1.43505859375, 1.48956298828125, 1.5440673828125, 1.59857177734375, 1.653076171875, 1.70758056640625, 1.7620849609375, 1.81658935546875, 1.87109375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 9.0, 5.0, 11.0, 19.0, 16.0, 31.0, 23.0, 25.0, 43.0, 51.0, 54.0, 74.0, 73.0, 89.0, 65.0, 69.0, 52.0, 58.0, 47.0, 25.0, 32.0, 20.0, 29.0, 7.0, 15.0, 14.0, 5.0, 3.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.77476692199707, -19.087709426879883, -18.400651931762695, -17.71359634399414, -17.026538848876953, -16.339481353759766, -15.652423858642578, -14.96536636352539, -14.27830982208252, -13.591252326965332, -12.904195785522461, -12.217138290405273, -11.530080795288086, -10.843024253845215, -10.155966758728027, -9.468910217285156, -8.781852722167969, -8.094795227050781, -7.40773868560791, -6.720681190490723, -6.033624172210693, -5.346567153930664, -4.659509658813477, -3.9724526405334473, -3.285395622253418, -2.5983386039733887, -1.9112813472747803, -1.2242240905761719, -0.5371670722961426, 0.14988994598388672, 0.8369474411010742, 1.5240044593811035, 2.2110595703125, 2.8981165885925293, 3.5851738452911377, 4.272231101989746, 4.959288120269775, 5.646345138549805, 6.333402633666992, 7.0204596519470215, 7.707516670227051, 8.394574165344238, 9.08163070678711, 9.768688201904297, 10.455745697021484, 11.142802238464355, 11.829859733581543, 12.516916275024414, 13.203973770141602, 13.891031265258789, 14.57808780670166, 15.265145301818848, 15.952201843261719, 16.639259338378906, 17.326316833496094, 18.01337432861328, 18.70043182373047, 19.387489318847656, 20.074546813964844, 20.76160430908203, 21.448659896850586, 22.135717391967773, 22.82277488708496, 23.50983238220215, 24.196887969970703]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 2.0, 6.0, 3.0, 12.0, 12.0, 19.0, 15.0, 18.0, 17.0, 22.0, 27.0, 30.0, 35.0, 38.0, 37.0, 34.0, 45.0, 44.0, 47.0, 54.0, 53.0, 47.0, 41.0, 28.0, 34.0, 33.0, 35.0, 29.0, 30.0, 30.0, 15.0, 25.0, 13.0, 17.0, 11.0, 6.0, 11.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.260191917419434, -8.958500862121582, -8.65680980682373, -8.355118751525879, -8.053426742553711, -7.751736164093018, -7.450044631958008, -7.148353576660156, -6.846662521362305, -6.544971466064453, -6.243280410766602, -5.941588878631592, -5.63989782333374, -5.338206768035889, -5.036515235900879, -4.734824180603027, -4.433133125305176, -4.131442070007324, -3.8297507762908936, -3.528059482574463, -3.2263684272766113, -2.9246773719787598, -2.622986078262329, -2.3212947845458984, -2.019603729248047, -1.7179125547409058, -1.4162213802337646, -1.1145302057266235, -0.8128390312194824, -0.5111478567123413, -0.2094566822052002, 0.09223461151123047, 0.39392662048339844, 0.6956177949905396, 0.9973089694976807, 1.2990001440048218, 1.600691318511963, 1.902382493019104, 2.204073667526245, 2.505764961242676, 2.8074560165405273, 3.109147071838379, 3.4108383655548096, 3.7125296592712402, 4.014220714569092, 4.315911769866943, 4.617603302001953, 4.919294357299805, 5.220985412597656, 5.522676467895508, 5.824367523193359, 6.126059055328369, 6.427750110626221, 6.729441165924072, 7.031132698059082, 7.332823753356934, 7.634514808654785, 7.936205863952637, 8.237896919250488, 8.53958797454834, 8.841279983520508, 9.14297103881836, 9.444662094116211, 9.746353149414062, 10.048044204711914]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 12.0, 29.0, 37.0, 66.0, 124.0, 198.0, 328.0, 601.0, 1189.0, 2226.0, 4381.0, 8619.0, 17752.0, 35645.0, 71264.0, 129424.0, 195040.0, 213724.0, 165721.0, 99137.0, 51979.0, 25428.0, 12583.0, 6075.0, 3207.0, 1677.0, 880.0, 487.0, 274.0, 173.0, 98.0, 48.0, 35.0, 23.0, 14.0, 8.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.765625, -16.150634765625, -15.53564453125, -14.920654296875, -14.3056640625, -13.690673828125, -13.07568359375, -12.460693359375, -11.845703125, -11.230712890625, -10.61572265625, -10.000732421875, -9.3857421875, -8.770751953125, -8.15576171875, -7.540771484375, -6.92578125, -6.310791015625, -5.69580078125, -5.080810546875, -4.4658203125, -3.850830078125, -3.23583984375, -2.620849609375, -2.005859375, -1.390869140625, -0.77587890625, -0.160888671875, 0.4541015625, 1.069091796875, 1.68408203125, 2.299072265625, 2.9140625, 3.529052734375, 4.14404296875, 4.759033203125, 5.3740234375, 5.989013671875, 6.60400390625, 7.218994140625, 7.833984375, 8.448974609375, 9.06396484375, 9.678955078125, 10.2939453125, 10.908935546875, 11.52392578125, 12.138916015625, 12.75390625, 13.368896484375, 13.98388671875, 14.598876953125, 15.2138671875, 15.828857421875, 16.44384765625, 17.058837890625, 17.673828125, 18.288818359375, 18.90380859375, 19.518798828125, 20.1337890625, 20.748779296875, 21.36376953125, 21.978759765625, 22.59375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 3.0, 9.0, 9.0, 13.0, 14.0, 15.0, 18.0, 22.0, 22.0, 21.0, 25.0, 32.0, 33.0, 35.0, 37.0, 41.0, 38.0, 34.0, 41.0, 44.0, 39.0, 48.0, 38.0, 41.0, 21.0, 38.0, 40.0, 26.0, 26.0, 25.0, 22.0, 22.0, 12.0, 9.0, 18.0, 10.0, 10.0, 7.0, 9.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-10.34375, -10.0341796875, -9.724609375, -9.4150390625, -9.10546875, -8.7958984375, -8.486328125, -8.1767578125, -7.8671875, -7.5576171875, -7.248046875, -6.9384765625, -6.62890625, -6.3193359375, -6.009765625, -5.7001953125, -5.390625, -5.0810546875, -4.771484375, -4.4619140625, -4.15234375, -3.8427734375, -3.533203125, -3.2236328125, -2.9140625, -2.6044921875, -2.294921875, -1.9853515625, -1.67578125, -1.3662109375, -1.056640625, -0.7470703125, -0.4375, -0.1279296875, 0.181640625, 0.4912109375, 0.80078125, 1.1103515625, 1.419921875, 1.7294921875, 2.0390625, 2.3486328125, 2.658203125, 2.9677734375, 3.27734375, 3.5869140625, 3.896484375, 4.2060546875, 4.515625, 4.8251953125, 5.134765625, 5.4443359375, 5.75390625, 6.0634765625, 6.373046875, 6.6826171875, 6.9921875, 7.3017578125, 7.611328125, 7.9208984375, 8.23046875, 8.5400390625, 8.849609375, 9.1591796875, 9.46875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 14.0, 18.0, 36.0, 44.0, 70.0, 125.0, 169.0, 247.0, 361.0, 601.0, 889.0, 1309.0, 2035.0, 3097.0, 4656.0, 7360.0, 11432.0, 17372.0, 26151.0, 38887.0, 56408.0, 77272.0, 99693.0, 118358.0, 125136.0, 117054.0, 98301.0, 75418.0, 54502.0, 37540.0, 25676.0, 16774.0, 11025.0, 7130.0, 4587.0, 3062.0, 1974.0, 1294.0, 833.0, 567.0, 361.0, 248.0, 163.0, 95.0, 68.0, 50.0, 27.0, 24.0, 15.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.359375, -11.9786376953125, -11.597900390625, -11.2171630859375, -10.83642578125, -10.4556884765625, -10.074951171875, -9.6942138671875, -9.3134765625, -8.9327392578125, -8.552001953125, -8.1712646484375, -7.79052734375, -7.4097900390625, -7.029052734375, -6.6483154296875, -6.267578125, -5.8868408203125, -5.506103515625, -5.1253662109375, -4.74462890625, -4.3638916015625, -3.983154296875, -3.6024169921875, -3.2216796875, -2.8409423828125, -2.460205078125, -2.0794677734375, -1.69873046875, -1.3179931640625, -0.937255859375, -0.5565185546875, -0.17578125, 0.2049560546875, 0.585693359375, 0.9664306640625, 1.34716796875, 1.7279052734375, 2.108642578125, 2.4893798828125, 2.8701171875, 3.2508544921875, 3.631591796875, 4.0123291015625, 4.39306640625, 4.7738037109375, 5.154541015625, 5.5352783203125, 5.916015625, 6.2967529296875, 6.677490234375, 7.0582275390625, 7.43896484375, 7.8197021484375, 8.200439453125, 8.5811767578125, 8.9619140625, 9.3426513671875, 9.723388671875, 10.1041259765625, 10.48486328125, 10.8656005859375, 11.246337890625, 11.6270751953125, 12.0078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 11.0, 10.0, 11.0, 12.0, 19.0, 13.0, 11.0, 13.0, 25.0, 23.0, 28.0, 25.0, 37.0, 27.0, 41.0, 45.0, 43.0, 43.0, 43.0, 43.0, 31.0, 45.0, 51.0, 31.0, 42.0, 30.0, 32.0, 37.0, 34.0, 17.0, 20.0, 18.0, 16.0, 12.0, 14.0, 10.0, 9.0, 2.0, 7.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4453125, -6.244140625, -6.04296875, -5.841796875, -5.640625, -5.439453125, -5.23828125, -5.037109375, -4.8359375, -4.634765625, -4.43359375, -4.232421875, -4.03125, -3.830078125, -3.62890625, -3.427734375, -3.2265625, -3.025390625, -2.82421875, -2.623046875, -2.421875, -2.220703125, -2.01953125, -1.818359375, -1.6171875, -1.416015625, -1.21484375, -1.013671875, -0.8125, -0.611328125, -0.41015625, -0.208984375, -0.0078125, 0.193359375, 0.39453125, 0.595703125, 0.796875, 0.998046875, 1.19921875, 1.400390625, 1.6015625, 1.802734375, 2.00390625, 2.205078125, 2.40625, 2.607421875, 2.80859375, 3.009765625, 3.2109375, 3.412109375, 3.61328125, 3.814453125, 4.015625, 4.216796875, 4.41796875, 4.619140625, 4.8203125, 5.021484375, 5.22265625, 5.423828125, 5.625, 5.826171875, 6.02734375, 6.228515625, 6.4296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 18.0, 22.0, 31.0, 30.0, 49.0, 65.0, 87.0, 147.0, 222.0, 366.0, 548.0, 885.0, 1530.0, 2667.0, 4613.0, 8132.0, 15203.0, 29253.0, 57656.0, 110582.0, 186015.0, 227365.0, 180950.0, 106214.0, 54970.0, 27779.0, 14420.0, 7801.0, 4525.0, 2487.0, 1518.0, 871.0, 536.0, 335.0, 206.0, 157.0, 101.0, 56.0, 47.0, 36.0, 30.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3729248046875, -11.011474609375, -10.6500244140625, -10.28857421875, -9.9271240234375, -9.565673828125, -9.2042236328125, -8.8427734375, -8.4813232421875, -8.119873046875, -7.7584228515625, -7.39697265625, -7.0355224609375, -6.674072265625, -6.3126220703125, -5.951171875, -5.5897216796875, -5.228271484375, -4.8668212890625, -4.50537109375, -4.1439208984375, -3.782470703125, -3.4210205078125, -3.0595703125, -2.6981201171875, -2.336669921875, -1.9752197265625, -1.61376953125, -1.2523193359375, -0.890869140625, -0.5294189453125, -0.16796875, 0.1934814453125, 0.554931640625, 0.9163818359375, 1.27783203125, 1.6392822265625, 2.000732421875, 2.3621826171875, 2.7236328125, 3.0850830078125, 3.446533203125, 3.8079833984375, 4.16943359375, 4.5308837890625, 4.892333984375, 5.2537841796875, 5.615234375, 5.9766845703125, 6.338134765625, 6.6995849609375, 7.06103515625, 7.4224853515625, 7.783935546875, 8.1453857421875, 8.5068359375, 8.8682861328125, 9.229736328125, 9.5911865234375, 9.95263671875, 10.3140869140625, 10.675537109375, 11.0369873046875, 11.3984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 15.0, 9.0, 6.0, 12.0, 11.0, 29.0, 30.0, 35.0, 60.0, 42.0, 57.0, 69.0, 75.0, 65.0, 75.0, 74.0, 45.0, 56.0, 40.0, 37.0, 33.0, 21.0, 20.0, 11.0, 10.0, 16.0, 8.0, 7.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011281967163085938, -0.0010912269353866577, -0.0010542571544647217, -0.0010172873735427856, -0.0009803175926208496, -0.0009433478116989136, -0.0009063780307769775, -0.0008694082498550415, -0.0008324384689331055, -0.0007954686880111694, -0.0007584989070892334, -0.0007215291261672974, -0.0006845593452453613, -0.0006475895643234253, -0.0006106197834014893, -0.0005736500024795532, -0.0005366802215576172, -0.0004997104406356812, -0.0004627406597137451, -0.0004257708787918091, -0.00038880109786987305, -0.000351831316947937, -0.000314861536026001, -0.00027789175510406494, -0.0002409219741821289, -0.00020395219326019287, -0.00016698241233825684, -0.0001300126314163208, -9.304285049438477e-05, -5.607306957244873e-05, -1.9103288650512695e-05, 1.786649227142334e-05, 5.4836273193359375e-05, 9.180605411529541e-05, 0.00012877583503723145, 0.00016574561595916748, 0.00020271539688110352, 0.00023968517780303955, 0.0002766549587249756, 0.0003136247396469116, 0.00035059452056884766, 0.0003875643014907837, 0.0004245340824127197, 0.00046150386333465576, 0.0004984736442565918, 0.0005354434251785278, 0.0005724132061004639, 0.0006093829870223999, 0.0006463527679443359, 0.000683322548866272, 0.000720292329788208, 0.000757262110710144, 0.0007942318916320801, 0.0008312016725540161, 0.0008681714534759521, 0.0009051412343978882, 0.0009421110153198242, 0.0009790807962417603, 0.0010160505771636963, 0.0010530203580856323, 0.0010899901390075684, 0.0011269599199295044, 0.0011639297008514404, 0.0012008994817733765, 0.0012378692626953125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 8.0, 20.0, 23.0, 32.0, 50.0, 56.0, 83.0, 116.0, 199.0, 311.0, 458.0, 716.0, 1145.0, 1884.0, 3169.0, 5289.0, 9035.0, 15929.0, 28232.0, 49698.0, 84454.0, 131496.0, 172771.0, 177100.0, 141466.0, 93614.0, 55985.0, 31840.0, 18341.0, 10076.0, 5875.0, 3441.0, 2090.0, 1288.0, 780.0, 484.0, 314.0, 218.0, 126.0, 101.0, 72.0, 60.0, 28.0, 24.0, 15.0, 15.0, 7.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.015625, -7.7579345703125, -7.500244140625, -7.2425537109375, -6.98486328125, -6.7271728515625, -6.469482421875, -6.2117919921875, -5.9541015625, -5.6964111328125, -5.438720703125, -5.1810302734375, -4.92333984375, -4.6656494140625, -4.407958984375, -4.1502685546875, -3.892578125, -3.6348876953125, -3.377197265625, -3.1195068359375, -2.86181640625, -2.6041259765625, -2.346435546875, -2.0887451171875, -1.8310546875, -1.5733642578125, -1.315673828125, -1.0579833984375, -0.80029296875, -0.5426025390625, -0.284912109375, -0.0272216796875, 0.23046875, 0.4881591796875, 0.745849609375, 1.0035400390625, 1.26123046875, 1.5189208984375, 1.776611328125, 2.0343017578125, 2.2919921875, 2.5496826171875, 2.807373046875, 3.0650634765625, 3.32275390625, 3.5804443359375, 3.838134765625, 4.0958251953125, 4.353515625, 4.6112060546875, 4.868896484375, 5.1265869140625, 5.38427734375, 5.6419677734375, 5.899658203125, 6.1573486328125, 6.4150390625, 6.6727294921875, 6.930419921875, 7.1881103515625, 7.44580078125, 7.7034912109375, 7.961181640625, 8.2188720703125, 8.4765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 5.0, 9.0, 5.0, 12.0, 14.0, 13.0, 14.0, 22.0, 21.0, 39.0, 37.0, 43.0, 42.0, 49.0, 52.0, 60.0, 47.0, 54.0, 61.0, 61.0, 45.0, 35.0, 41.0, 41.0, 33.0, 34.0, 27.0, 17.0, 18.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.42578125, -2.35546875, -2.28515625, -2.21484375, -2.14453125, -2.07421875, -2.00390625, -1.93359375, -1.86328125, -1.79296875, -1.72265625, -1.65234375, -1.58203125, -1.51171875, -1.44140625, -1.37109375, -1.30078125, -1.23046875, -1.16015625, -1.08984375, -1.01953125, -0.94921875, -0.87890625, -0.80859375, -0.73828125, -0.66796875, -0.59765625, -0.52734375, -0.45703125, -0.38671875, -0.31640625, -0.24609375, -0.17578125, -0.10546875, -0.03515625, 0.03515625, 0.10546875, 0.17578125, 0.24609375, 0.31640625, 0.38671875, 0.45703125, 0.52734375, 0.59765625, 0.66796875, 0.73828125, 0.80859375, 0.87890625, 0.94921875, 1.01953125, 1.08984375, 1.16015625, 1.23046875, 1.30078125, 1.37109375, 1.44140625, 1.51171875, 1.58203125, 1.65234375, 1.72265625, 1.79296875, 1.86328125, 1.93359375, 2.00390625, 2.07421875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 15.0, 18.0, 15.0, 30.0, 38.0, 35.0, 59.0, 64.0, 58.0, 77.0, 69.0, 75.0, 76.0, 68.0, 53.0, 43.0, 35.0, 29.0, 22.0, 20.0, 13.0, 15.0, 5.0, 9.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27089500427246, -18.551015853881836, -17.83113670349121, -17.11125946044922, -16.391380310058594, -15.671501159667969, -14.951622009277344, -14.231742858886719, -13.51186466217041, -12.791985511779785, -12.072107315063477, -11.352228164672852, -10.632349014282227, -9.912470817565918, -9.192591667175293, -8.472713470458984, -7.752834320068359, -7.032955646514893, -6.313076972961426, -5.593197822570801, -4.873319149017334, -4.153440475463867, -3.433561325073242, -2.7136826515197754, -1.9938039779663086, -1.2739251852035522, -0.5540463924407959, 0.16583251953125, 0.8857111930847168, 1.6055898666381836, 2.3254690170288086, 3.0453476905822754, 3.765228271484375, 4.485106945037842, 5.204985618591309, 5.924864768981934, 6.6447434425354, 7.364622116088867, 8.084501266479492, 8.804380416870117, 9.524258613586426, 10.24413776397705, 10.96401596069336, 11.683895111083984, 12.40377426147461, 13.123652458190918, 13.843531608581543, 14.563409805297852, 15.283288955688477, 16.0031681060791, 16.723047256469727, 17.44292449951172, 18.162803649902344, 18.88268280029297, 19.602561950683594, 20.32244110107422, 21.042320251464844, 21.76219940185547, 22.482078552246094, 23.20195770263672, 23.92183494567871, 24.641714096069336, 25.36159324645996, 26.081472396850586, 26.801349639892578]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 4.0, 9.0, 8.0, 12.0, 17.0, 15.0, 23.0, 24.0, 24.0, 31.0, 21.0, 36.0, 42.0, 45.0, 32.0, 42.0, 43.0, 47.0, 44.0, 40.0, 45.0, 35.0, 39.0, 38.0, 29.0, 24.0, 35.0, 19.0, 23.0, 22.0, 15.0, 23.0, 11.0, 16.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.428163528442383, -9.131139755249023, -8.834115982055664, -8.537092208862305, -8.240068435668945, -7.943045139312744, -7.646021366119385, -7.348998069763184, -7.051974296569824, -6.754950523376465, -6.4579267501831055, -6.160902976989746, -5.863879680633545, -5.5668559074401855, -5.269832134246826, -4.972808837890625, -4.675784587860107, -4.378760814666748, -4.081737041473389, -3.7847135066986084, -3.487689971923828, -3.1906661987304688, -2.8936424255371094, -2.596618890762329, -2.2995951175689697, -2.0025713443756104, -1.70554780960083, -1.4085240364074707, -1.1115003824234009, -0.814476728439331, -0.5174529552459717, -0.2204294204711914, 0.07659435272216797, 0.3736180365085602, 0.6706417202949524, 0.967665433883667, 1.2646890878677368, 1.5617127418518066, 1.858736515045166, 2.1557600498199463, 2.4527838230133057, 2.749807596206665, 3.0468311309814453, 3.3438549041748047, 3.640878677368164, 3.9379022121429443, 4.234926223754883, 4.531949520111084, 4.828973293304443, 5.125997066497803, 5.423020839691162, 5.720044136047363, 6.017067909240723, 6.314091682434082, 6.611115455627441, 6.908139228820801, 7.20516300201416, 7.5021867752075195, 7.799210548400879, 8.096234321594238, 8.393258094787598, 8.69028091430664, 8.9873046875, 9.28432846069336, 9.581352233886719]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 12.0, 12.0, 19.0, 48.0, 62.0, 92.0, 142.0, 250.0, 468.0, 812.0, 1442.0, 2578.0, 4815.0, 9495.0, 19446.0, 40661.0, 91648.0, 218491.0, 562537.0, 1221540.0, 1159082.0, 507554.0, 197779.0, 82172.0, 36799.0, 17538.0, 8674.0, 4359.0, 2430.0, 1369.0, 748.0, 477.0, 274.0, 150.0, 85.0, 62.0, 37.0, 21.0, 22.0, 22.0, 18.0, 9.0, 14.0, 9.0, 5.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6328125, -14.9515380859375, -14.270263671875, -13.5889892578125, -12.90771484375, -12.2264404296875, -11.545166015625, -10.8638916015625, -10.1826171875, -9.5013427734375, -8.820068359375, -8.1387939453125, -7.45751953125, -6.7762451171875, -6.094970703125, -5.4136962890625, -4.732421875, -4.0511474609375, -3.369873046875, -2.6885986328125, -2.00732421875, -1.3260498046875, -0.644775390625, 0.0364990234375, 0.7177734375, 1.3990478515625, 2.080322265625, 2.7615966796875, 3.44287109375, 4.1241455078125, 4.805419921875, 5.4866943359375, 6.16796875, 6.8492431640625, 7.530517578125, 8.2117919921875, 8.89306640625, 9.5743408203125, 10.255615234375, 10.9368896484375, 11.6181640625, 12.2994384765625, 12.980712890625, 13.6619873046875, 14.34326171875, 15.0245361328125, 15.705810546875, 16.3870849609375, 17.068359375, 17.7496337890625, 18.430908203125, 19.1121826171875, 19.79345703125, 20.4747314453125, 21.156005859375, 21.8372802734375, 22.5185546875, 23.1998291015625, 23.881103515625, 24.5623779296875, 25.24365234375, 25.9249267578125, 26.606201171875, 27.2874755859375, 27.96875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 7.0, 12.0, 13.0, 12.0, 21.0, 24.0, 23.0, 27.0, 40.0, 29.0, 35.0, 36.0, 41.0, 62.0, 57.0, 47.0, 50.0, 39.0, 46.0, 35.0, 49.0, 40.0, 45.0, 29.0, 23.0, 18.0, 23.0, 14.0, 13.0, 14.0, 14.0, 7.0, 8.0, 8.0, 7.0, 9.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.174560546875, -7.90380859375, -7.633056640625, -7.3623046875, -7.091552734375, -6.82080078125, -6.550048828125, -6.279296875, -6.008544921875, -5.73779296875, -5.467041015625, -5.1962890625, -4.925537109375, -4.65478515625, -4.384033203125, -4.11328125, -3.842529296875, -3.57177734375, -3.301025390625, -3.0302734375, -2.759521484375, -2.48876953125, -2.218017578125, -1.947265625, -1.676513671875, -1.40576171875, -1.135009765625, -0.8642578125, -0.593505859375, -0.32275390625, -0.052001953125, 0.21875, 0.489501953125, 0.76025390625, 1.031005859375, 1.3017578125, 1.572509765625, 1.84326171875, 2.114013671875, 2.384765625, 2.655517578125, 2.92626953125, 3.197021484375, 3.4677734375, 3.738525390625, 4.00927734375, 4.280029296875, 4.55078125, 4.821533203125, 5.09228515625, 5.363037109375, 5.6337890625, 5.904541015625, 6.17529296875, 6.446044921875, 6.716796875, 6.987548828125, 7.25830078125, 7.529052734375, 7.7998046875, 8.070556640625, 8.34130859375, 8.612060546875, 8.8828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 17.0, 18.0, 28.0, 37.0, 66.0, 98.0, 142.0, 239.0, 341.0, 509.0, 852.0, 1360.0, 2239.0, 3479.0, 5997.0, 10244.0, 17611.0, 32275.0, 60352.0, 113445.0, 215016.0, 405964.0, 701669.0, 922602.0, 745870.0, 442421.0, 238656.0, 124413.0, 65861.0, 35293.0, 19535.0, 11051.0, 6508.0, 3704.0, 2295.0, 1378.0, 938.0, 590.0, 395.0, 273.0, 166.0, 115.0, 73.0, 46.0, 27.0, 23.0, 13.0, 11.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.75, -17.205078125, -16.66015625, -16.115234375, -15.5703125, -15.025390625, -14.48046875, -13.935546875, -13.390625, -12.845703125, -12.30078125, -11.755859375, -11.2109375, -10.666015625, -10.12109375, -9.576171875, -9.03125, -8.486328125, -7.94140625, -7.396484375, -6.8515625, -6.306640625, -5.76171875, -5.216796875, -4.671875, -4.126953125, -3.58203125, -3.037109375, -2.4921875, -1.947265625, -1.40234375, -0.857421875, -0.3125, 0.232421875, 0.77734375, 1.322265625, 1.8671875, 2.412109375, 2.95703125, 3.501953125, 4.046875, 4.591796875, 5.13671875, 5.681640625, 6.2265625, 6.771484375, 7.31640625, 7.861328125, 8.40625, 8.951171875, 9.49609375, 10.041015625, 10.5859375, 11.130859375, 11.67578125, 12.220703125, 12.765625, 13.310546875, 13.85546875, 14.400390625, 14.9453125, 15.490234375, 16.03515625, 16.580078125, 17.125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 11.0, 19.0, 16.0, 23.0, 35.0, 52.0, 59.0, 56.0, 99.0, 135.0, 125.0, 173.0, 239.0, 285.0, 303.0, 324.0, 273.0, 286.0, 281.0, 251.0, 210.0, 184.0, 131.0, 126.0, 80.0, 68.0, 48.0, 42.0, 27.0, 29.0, 20.0, 11.0, 11.0, 12.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.1473388671875, -5.962646484375, -5.7779541015625, -5.59326171875, -5.4085693359375, -5.223876953125, -5.0391845703125, -4.8544921875, -4.6697998046875, -4.485107421875, -4.3004150390625, -4.11572265625, -3.9310302734375, -3.746337890625, -3.5616455078125, -3.376953125, -3.1922607421875, -3.007568359375, -2.8228759765625, -2.63818359375, -2.4534912109375, -2.268798828125, -2.0841064453125, -1.8994140625, -1.7147216796875, -1.530029296875, -1.3453369140625, -1.16064453125, -0.9759521484375, -0.791259765625, -0.6065673828125, -0.421875, -0.2371826171875, -0.052490234375, 0.1322021484375, 0.31689453125, 0.5015869140625, 0.686279296875, 0.8709716796875, 1.0556640625, 1.2403564453125, 1.425048828125, 1.6097412109375, 1.79443359375, 1.9791259765625, 2.163818359375, 2.3485107421875, 2.533203125, 2.7178955078125, 2.902587890625, 3.0872802734375, 3.27197265625, 3.4566650390625, 3.641357421875, 3.8260498046875, 4.0107421875, 4.1954345703125, 4.380126953125, 4.5648193359375, 4.74951171875, 4.9342041015625, 5.118896484375, 5.3035888671875, 5.48828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 8.0, 5.0, 9.0, 13.0, 17.0, 14.0, 19.0, 28.0, 27.0, 41.0, 49.0, 48.0, 63.0, 56.0, 68.0, 82.0, 60.0, 52.0, 67.0, 47.0, 38.0, 36.0, 35.0, 19.0, 21.0, 17.0, 13.0, 5.0, 9.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.768938064575195, -20.087682723999023, -19.406429290771484, -18.725173950195312, -18.04391860961914, -17.36266326904297, -16.68140983581543, -16.000154495239258, -15.318899154663086, -14.63764476776123, -13.956389427185059, -13.275135040283203, -12.593879699707031, -11.912625312805176, -11.23137092590332, -10.550115585327148, -9.868861198425293, -9.187606811523438, -8.506351470947266, -7.82509708404541, -7.143841743469238, -6.462587356567383, -5.781332492828369, -5.1000776290893555, -4.418822765350342, -3.737567901611328, -3.0563130378723145, -2.37505841255188, -1.6938035488128662, -1.0125486850738525, -0.33129405975341797, 0.3499608039855957, 1.0312156677246094, 1.712470531463623, 2.3937253952026367, 3.0749800205230713, 3.756234884262085, 4.4374895095825195, 5.118744373321533, 5.799999237060547, 6.4812541007995605, 7.162508964538574, 7.843763828277588, 8.525018692016602, 9.206273078918457, 9.887528419494629, 10.568782806396484, 11.250038146972656, 11.931292533874512, 12.612546920776367, 13.293802261352539, 13.975056648254395, 14.656311988830566, 15.337566375732422, 16.018821716308594, 16.700077056884766, 17.381330490112305, 18.062585830688477, 18.743839263916016, 19.425094604492188, 20.10634994506836, 20.78760528564453, 21.46885871887207, 22.150114059448242, 22.831369400024414]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 8.0, 3.0, 4.0, 11.0, 10.0, 6.0, 13.0, 13.0, 15.0, 14.0, 27.0, 21.0, 20.0, 28.0, 23.0, 31.0, 39.0, 35.0, 41.0, 25.0, 48.0, 41.0, 41.0, 42.0, 34.0, 37.0, 40.0, 29.0, 34.0, 27.0, 27.0, 27.0, 19.0, 35.0, 18.0, 15.0, 16.0, 17.0, 14.0, 10.0, 14.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9055757522583, -8.616514205932617, -8.327452659606934, -8.03839111328125, -7.749330043792725, -7.460268497467041, -7.171207427978516, -6.882145881652832, -6.593084335327148, -6.304022789001465, -6.014961242675781, -5.725900173187256, -5.436838626861572, -5.147777080535889, -4.858716011047363, -4.56965446472168, -4.280592918395996, -3.9915313720703125, -3.702470064163208, -3.4134087562561035, -3.12434720993042, -2.8352856636047363, -2.546224355697632, -2.2571630477905273, -1.9681015014648438, -1.6790400743484497, -1.3899786472320557, -1.1009172201156616, -0.8118557929992676, -0.5227943658828735, -0.2337329387664795, 0.055328369140625, 0.3443889617919922, 0.6334503889083862, 0.9225118160247803, 1.2115732431411743, 1.5006346702575684, 1.7896960973739624, 2.0787575244903564, 2.367818832397461, 2.6568803787231445, 2.945941925048828, 3.2350032329559326, 3.524064540863037, 3.8131260871887207, 4.102187633514404, 4.39124870300293, 4.680310249328613, 4.969371795654297, 5.2584333419799805, 5.547494888305664, 5.8365559577941895, 6.125617504119873, 6.414679050445557, 6.703740119934082, 6.992801666259766, 7.281863212585449, 7.570924758911133, 7.859986305236816, 8.1490478515625, 8.438108444213867, 8.72716999053955, 9.016231536865234, 9.305293083190918, 9.594354629516602]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 20.0, 35.0, 43.0, 69.0, 89.0, 128.0, 183.0, 255.0, 385.0, 543.0, 759.0, 1159.0, 1733.0, 2870.0, 4818.0, 8386.0, 15661.0, 29984.0, 58548.0, 107101.0, 172408.0, 210186.0, 180176.0, 115927.0, 63809.0, 32901.0, 17255.0, 9319.0, 5015.0, 3064.0, 1860.0, 1196.0, 803.0, 568.0, 346.0, 287.0, 179.0, 146.0, 98.0, 70.0, 45.0, 27.0, 21.0, 11.0, 14.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.1868896484375, -9.803466796875, -9.4200439453125, -9.03662109375, -8.6531982421875, -8.269775390625, -7.8863525390625, -7.5029296875, -7.1195068359375, -6.736083984375, -6.3526611328125, -5.96923828125, -5.5858154296875, -5.202392578125, -4.8189697265625, -4.435546875, -4.0521240234375, -3.668701171875, -3.2852783203125, -2.90185546875, -2.5184326171875, -2.135009765625, -1.7515869140625, -1.3681640625, -0.9847412109375, -0.601318359375, -0.2178955078125, 0.16552734375, 0.5489501953125, 0.932373046875, 1.3157958984375, 1.69921875, 2.0826416015625, 2.466064453125, 2.8494873046875, 3.23291015625, 3.6163330078125, 3.999755859375, 4.3831787109375, 4.7666015625, 5.1500244140625, 5.533447265625, 5.9168701171875, 6.30029296875, 6.6837158203125, 7.067138671875, 7.4505615234375, 7.833984375, 8.2174072265625, 8.600830078125, 8.9842529296875, 9.36767578125, 9.7510986328125, 10.134521484375, 10.5179443359375, 10.9013671875, 11.2847900390625, 11.668212890625, 12.0516357421875, 12.43505859375, 12.8184814453125, 13.201904296875, 13.5853271484375, 13.96875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 17.0, 16.0, 8.0, 17.0, 18.0, 20.0, 24.0, 36.0, 34.0, 34.0, 48.0, 44.0, 41.0, 50.0, 35.0, 46.0, 41.0, 43.0, 37.0, 44.0, 32.0, 35.0, 30.0, 34.0, 24.0, 32.0, 26.0, 14.0, 21.0, 15.0, 10.0, 8.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7578125, -10.3970947265625, -10.036376953125, -9.6756591796875, -9.31494140625, -8.9542236328125, -8.593505859375, -8.2327880859375, -7.8720703125, -7.5113525390625, -7.150634765625, -6.7899169921875, -6.42919921875, -6.0684814453125, -5.707763671875, -5.3470458984375, -4.986328125, -4.6256103515625, -4.264892578125, -3.9041748046875, -3.54345703125, -3.1827392578125, -2.822021484375, -2.4613037109375, -2.1005859375, -1.7398681640625, -1.379150390625, -1.0184326171875, -0.65771484375, -0.2969970703125, 0.063720703125, 0.4244384765625, 0.78515625, 1.1458740234375, 1.506591796875, 1.8673095703125, 2.22802734375, 2.5887451171875, 2.949462890625, 3.3101806640625, 3.6708984375, 4.0316162109375, 4.392333984375, 4.7530517578125, 5.11376953125, 5.4744873046875, 5.835205078125, 6.1959228515625, 6.556640625, 6.9173583984375, 7.278076171875, 7.6387939453125, 7.99951171875, 8.3602294921875, 8.720947265625, 9.0816650390625, 9.4423828125, 9.8031005859375, 10.163818359375, 10.5245361328125, 10.88525390625, 11.2459716796875, 11.606689453125, 11.9674072265625, 12.328125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 14.0, 12.0, 12.0, 14.0, 28.0, 37.0, 47.0, 53.0, 62.0, 101.0, 135.0, 182.0, 234.0, 339.0, 513.0, 963.0, 1924.0, 5046.0, 16143.0, 64834.0, 286758.0, 475723.0, 146123.0, 33000.0, 9274.0, 3259.0, 1488.0, 718.0, 386.0, 303.0, 222.0, 149.0, 112.0, 100.0, 58.0, 49.0, 41.0, 25.0, 11.0, 26.0, 4.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.205322265625, -27.20751953125, -26.209716796875, -25.2119140625, -24.214111328125, -23.21630859375, -22.218505859375, -21.220703125, -20.222900390625, -19.22509765625, -18.227294921875, -17.2294921875, -16.231689453125, -15.23388671875, -14.236083984375, -13.23828125, -12.240478515625, -11.24267578125, -10.244873046875, -9.2470703125, -8.249267578125, -7.25146484375, -6.253662109375, -5.255859375, -4.258056640625, -3.26025390625, -2.262451171875, -1.2646484375, -0.266845703125, 0.73095703125, 1.728759765625, 2.7265625, 3.724365234375, 4.72216796875, 5.719970703125, 6.7177734375, 7.715576171875, 8.71337890625, 9.711181640625, 10.708984375, 11.706787109375, 12.70458984375, 13.702392578125, 14.7001953125, 15.697998046875, 16.69580078125, 17.693603515625, 18.69140625, 19.689208984375, 20.68701171875, 21.684814453125, 22.6826171875, 23.680419921875, 24.67822265625, 25.676025390625, 26.673828125, 27.671630859375, 28.66943359375, 29.667236328125, 30.6650390625, 31.662841796875, 32.66064453125, 33.658447265625, 34.65625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 13.0, 8.0, 15.0, 18.0, 20.0, 28.0, 22.0, 24.0, 25.0, 27.0, 30.0, 46.0, 32.0, 39.0, 40.0, 39.0, 48.0, 45.0, 49.0, 36.0, 29.0, 40.0, 24.0, 41.0, 26.0, 28.0, 23.0, 22.0, 19.0, 18.0, 13.0, 12.0, 14.0, 13.0, 8.0, 14.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.492919921875, -5.30224609375, -5.111572265625, -4.9208984375, -4.730224609375, -4.53955078125, -4.348876953125, -4.158203125, -3.967529296875, -3.77685546875, -3.586181640625, -3.3955078125, -3.204833984375, -3.01416015625, -2.823486328125, -2.6328125, -2.442138671875, -2.25146484375, -2.060791015625, -1.8701171875, -1.679443359375, -1.48876953125, -1.298095703125, -1.107421875, -0.916748046875, -0.72607421875, -0.535400390625, -0.3447265625, -0.154052734375, 0.03662109375, 0.227294921875, 0.41796875, 0.608642578125, 0.79931640625, 0.989990234375, 1.1806640625, 1.371337890625, 1.56201171875, 1.752685546875, 1.943359375, 2.134033203125, 2.32470703125, 2.515380859375, 2.7060546875, 2.896728515625, 3.08740234375, 3.278076171875, 3.46875, 3.659423828125, 3.85009765625, 4.040771484375, 4.2314453125, 4.422119140625, 4.61279296875, 4.803466796875, 4.994140625, 5.184814453125, 5.37548828125, 5.566162109375, 5.7568359375, 5.947509765625, 6.13818359375, 6.328857421875, 6.51953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 18.0, 17.0, 23.0, 45.0, 55.0, 86.0, 119.0, 162.0, 226.0, 320.0, 458.0, 730.0, 1018.0, 1481.0, 2234.0, 3656.0, 6863.0, 19218.0, 81617.0, 399956.0, 408475.0, 84306.0, 19959.0, 7002.0, 3571.0, 2224.0, 1458.0, 1026.0, 686.0, 469.0, 315.0, 240.0, 155.0, 103.0, 76.0, 56.0, 46.0, 29.0, 12.0, 13.0, 14.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-20.09375, -19.519775390625, -18.94580078125, -18.371826171875, -17.7978515625, -17.223876953125, -16.64990234375, -16.075927734375, -15.501953125, -14.927978515625, -14.35400390625, -13.780029296875, -13.2060546875, -12.632080078125, -12.05810546875, -11.484130859375, -10.91015625, -10.336181640625, -9.76220703125, -9.188232421875, -8.6142578125, -8.040283203125, -7.46630859375, -6.892333984375, -6.318359375, -5.744384765625, -5.17041015625, -4.596435546875, -4.0224609375, -3.448486328125, -2.87451171875, -2.300537109375, -1.7265625, -1.152587890625, -0.57861328125, -0.004638671875, 0.5693359375, 1.143310546875, 1.71728515625, 2.291259765625, 2.865234375, 3.439208984375, 4.01318359375, 4.587158203125, 5.1611328125, 5.735107421875, 6.30908203125, 6.883056640625, 7.45703125, 8.031005859375, 8.60498046875, 9.178955078125, 9.7529296875, 10.326904296875, 10.90087890625, 11.474853515625, 12.048828125, 12.622802734375, 13.19677734375, 13.770751953125, 14.3447265625, 14.918701171875, 15.49267578125, 16.066650390625, 16.640625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 14.0, 14.0, 10.0, 22.0, 55.0, 78.0, 120.0, 151.0, 142.0, 136.0, 97.0, 64.0, 38.0, 22.0, 10.0, 9.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011377334594726562, -0.0011100620031356812, -0.001082390546798706, -0.001054719090461731, -0.0010270476341247559, -0.0009993761777877808, -0.0009717047214508057, -0.0009440332651138306, -0.0009163618087768555, -0.0008886903524398804, -0.0008610188961029053, -0.0008333474397659302, -0.0008056759834289551, -0.00077800452709198, -0.0007503330707550049, -0.0007226616144180298, -0.0006949901580810547, -0.0006673187017440796, -0.0006396472454071045, -0.0006119757890701294, -0.0005843043327331543, -0.0005566328763961792, -0.0005289614200592041, -0.000501289963722229, -0.0004736185073852539, -0.0004459470510482788, -0.0004182755947113037, -0.0003906041383743286, -0.0003629326820373535, -0.0003352612257003784, -0.0003075897693634033, -0.0002799183130264282, -0.0002522468566894531, -0.00022457540035247803, -0.00019690394401550293, -0.00016923248767852783, -0.00014156103134155273, -0.00011388957500457764, -8.621811866760254e-05, -5.854666233062744e-05, -3.0875205993652344e-05, -3.203749656677246e-06, 2.446770668029785e-05, 5.213916301727295e-05, 7.981061935424805e-05, 0.00010748207569122314, 0.00013515353202819824, 0.00016282498836517334, 0.00019049644470214844, 0.00021816790103912354, 0.00024583935737609863, 0.00027351081371307373, 0.00030118227005004883, 0.0003288537263870239, 0.000356525182723999, 0.0003841966390609741, 0.0004118680953979492, 0.0004395395517349243, 0.0004672110080718994, 0.0004948824644088745, 0.0005225539207458496, 0.0005502253770828247, 0.0005778968334197998, 0.0006055682897567749, 0.00063323974609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 9.0, 21.0, 16.0, 21.0, 35.0, 55.0, 64.0, 100.0, 166.0, 196.0, 274.0, 363.0, 514.0, 721.0, 951.0, 1327.0, 1801.0, 2541.0, 3843.0, 7418.0, 24394.0, 125070.0, 452066.0, 326521.0, 68192.0, 14916.0, 5541.0, 3286.0, 2219.0, 1556.0, 1219.0, 858.0, 617.0, 445.0, 323.0, 254.0, 156.0, 133.0, 103.0, 74.0, 41.0, 43.0, 28.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.140625, -15.599365234375, -15.05810546875, -14.516845703125, -13.9755859375, -13.434326171875, -12.89306640625, -12.351806640625, -11.810546875, -11.269287109375, -10.72802734375, -10.186767578125, -9.6455078125, -9.104248046875, -8.56298828125, -8.021728515625, -7.48046875, -6.939208984375, -6.39794921875, -5.856689453125, -5.3154296875, -4.774169921875, -4.23291015625, -3.691650390625, -3.150390625, -2.609130859375, -2.06787109375, -1.526611328125, -0.9853515625, -0.444091796875, 0.09716796875, 0.638427734375, 1.1796875, 1.720947265625, 2.26220703125, 2.803466796875, 3.3447265625, 3.885986328125, 4.42724609375, 4.968505859375, 5.509765625, 6.051025390625, 6.59228515625, 7.133544921875, 7.6748046875, 8.216064453125, 8.75732421875, 9.298583984375, 9.83984375, 10.381103515625, 10.92236328125, 11.463623046875, 12.0048828125, 12.546142578125, 13.08740234375, 13.628662109375, 14.169921875, 14.711181640625, 15.25244140625, 15.793701171875, 16.3349609375, 16.876220703125, 17.41748046875, 17.958740234375, 18.5]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 22.0, 30.0, 47.0, 101.0, 127.0, 134.0, 151.0, 126.0, 89.0, 51.0, 37.0, 20.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.44140625, -4.314208984375, -4.18701171875, -4.059814453125, -3.9326171875, -3.805419921875, -3.67822265625, -3.551025390625, -3.423828125, -3.296630859375, -3.16943359375, -3.042236328125, -2.9150390625, -2.787841796875, -2.66064453125, -2.533447265625, -2.40625, -2.279052734375, -2.15185546875, -2.024658203125, -1.8974609375, -1.770263671875, -1.64306640625, -1.515869140625, -1.388671875, -1.261474609375, -1.13427734375, -1.007080078125, -0.8798828125, -0.752685546875, -0.62548828125, -0.498291015625, -0.37109375, -0.243896484375, -0.11669921875, 0.010498046875, 0.1376953125, 0.264892578125, 0.39208984375, 0.519287109375, 0.646484375, 0.773681640625, 0.90087890625, 1.028076171875, 1.1552734375, 1.282470703125, 1.40966796875, 1.536865234375, 1.6640625, 1.791259765625, 1.91845703125, 2.045654296875, 2.1728515625, 2.300048828125, 2.42724609375, 2.554443359375, 2.681640625, 2.808837890625, 2.93603515625, 3.063232421875, 3.1904296875, 3.317626953125, 3.44482421875, 3.572021484375, 3.69921875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 19.0, 14.0, 24.0, 28.0, 24.0, 41.0, 33.0, 47.0, 63.0, 63.0, 66.0, 82.0, 65.0, 59.0, 43.0, 51.0, 43.0, 35.0, 25.0, 32.0, 24.0, 11.0, 11.0, 15.0, 11.0, 3.0, 8.0, 9.0, 0.0, 7.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.522510528564453, -16.86768341064453, -16.212858200073242, -15.558032035827637, -14.903205871582031, -14.248379707336426, -13.59355354309082, -12.938727378845215, -12.28390121459961, -11.629075050354004, -10.974248886108398, -10.319422721862793, -9.664596557617188, -9.009770393371582, -8.354944229125977, -7.700118064880371, -7.045291900634766, -6.39046573638916, -5.735639572143555, -5.080813407897949, -4.425987243652344, -3.7711610794067383, -3.116334915161133, -2.4615087509155273, -1.8066825866699219, -1.1518564224243164, -0.49703025817871094, 0.15779590606689453, 0.8126220703125, 1.4674482345581055, 2.122274398803711, 2.7771005630493164, 3.4319286346435547, 4.08675479888916, 4.741580963134766, 5.396407127380371, 6.051233291625977, 6.706059455871582, 7.3608856201171875, 8.015711784362793, 8.670537948608398, 9.325364112854004, 9.98019027709961, 10.635016441345215, 11.28984260559082, 11.944668769836426, 12.599494934082031, 13.254321098327637, 13.909147262573242, 14.563973426818848, 15.218799591064453, 15.873625755310059, 16.528451919555664, 17.183277130126953, 17.838104248046875, 18.492931365966797, 19.147756576538086, 19.802581787109375, 20.457408905029297, 21.11223602294922, 21.767061233520508, 22.421886444091797, 23.07671356201172, 23.73154067993164, 24.38636589050293]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 12.0, 8.0, 7.0, 19.0, 12.0, 12.0, 18.0, 23.0, 18.0, 23.0, 23.0, 31.0, 26.0, 32.0, 37.0, 39.0, 33.0, 44.0, 45.0, 34.0, 38.0, 48.0, 34.0, 35.0, 40.0, 29.0, 36.0, 27.0, 22.0, 25.0, 14.0, 26.0, 15.0, 15.0, 17.0, 14.0, 22.0, 8.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.298133850097656, -8.011815071105957, -7.725496292114258, -7.439177513122559, -7.152858734130859, -6.86653995513916, -6.580220699310303, -6.2939019203186035, -6.007583141326904, -5.721264362335205, -5.434945583343506, -5.148626804351807, -4.862307548522949, -4.57598876953125, -4.289669990539551, -4.003351211547852, -3.7170324325561523, -3.430713653564453, -3.144394874572754, -2.8580758571624756, -2.5717570781707764, -2.285438299179077, -1.9991194009780884, -1.7128005027770996, -1.4264817237854004, -1.1401629447937012, -0.8538440465927124, -0.5675252079963684, -0.2812063694000244, 0.005112409591674805, 0.2914313077926636, 0.5777502059936523, 0.8640689849853516, 1.1503877639770508, 1.4367066621780396, 1.7230255603790283, 2.0093443393707275, 2.2956631183624268, 2.581982135772705, 2.8683009147644043, 3.1546196937561035, 3.4409384727478027, 3.727257251739502, 4.013576030731201, 4.299895286560059, 4.586214065551758, 4.872532844543457, 5.158851623535156, 5.4451704025268555, 5.731489181518555, 6.017807960510254, 6.304126739501953, 6.590445518493652, 6.876764297485352, 7.163083553314209, 7.449402332305908, 7.735721111297607, 8.022040367126465, 8.308359146118164, 8.594677925109863, 8.880996704101562, 9.167315483093262, 9.453634262084961, 9.73995304107666, 10.02627182006836]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 5.0, 5.0, 6.0, 8.0, 11.0, 21.0, 28.0, 50.0, 97.0, 179.0, 314.0, 478.0, 1031.0, 2023.0, 4468.0, 9856.0, 22085.0, 49816.0, 106576.0, 191657.0, 243619.0, 200656.0, 115732.0, 55214.0, 24283.0, 10727.0, 4857.0, 2348.0, 1082.0, 572.0, 347.0, 167.0, 91.0, 51.0, 35.0, 18.0, 16.0, 14.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.76123046875, -21.9912109375, -21.22119140625, -20.451171875, -19.68115234375, -18.9111328125, -18.14111328125, -17.37109375, -16.60107421875, -15.8310546875, -15.06103515625, -14.291015625, -13.52099609375, -12.7509765625, -11.98095703125, -11.2109375, -10.44091796875, -9.6708984375, -8.90087890625, -8.130859375, -7.36083984375, -6.5908203125, -5.82080078125, -5.05078125, -4.28076171875, -3.5107421875, -2.74072265625, -1.970703125, -1.20068359375, -0.4306640625, 0.33935546875, 1.109375, 1.87939453125, 2.6494140625, 3.41943359375, 4.189453125, 4.95947265625, 5.7294921875, 6.49951171875, 7.26953125, 8.03955078125, 8.8095703125, 9.57958984375, 10.349609375, 11.11962890625, 11.8896484375, 12.65966796875, 13.4296875, 14.19970703125, 14.9697265625, 15.73974609375, 16.509765625, 17.27978515625, 18.0498046875, 18.81982421875, 19.58984375, 20.35986328125, 21.1298828125, 21.89990234375, 22.669921875, 23.43994140625, 24.2099609375, 24.97998046875, 25.75]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 16.0, 13.0, 25.0, 25.0, 15.0, 18.0, 37.0, 25.0, 37.0, 47.0, 44.0, 59.0, 56.0, 54.0, 58.0, 49.0, 53.0, 50.0, 31.0, 34.0, 31.0, 37.0, 34.0, 24.0, 24.0, 17.0, 24.0, 10.0, 9.0, 7.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.5062255859375, -9.098388671875, -8.6905517578125, -8.28271484375, -7.8748779296875, -7.467041015625, -7.0592041015625, -6.6513671875, -6.2435302734375, -5.835693359375, -5.4278564453125, -5.02001953125, -4.6121826171875, -4.204345703125, -3.7965087890625, -3.388671875, -2.9808349609375, -2.572998046875, -2.1651611328125, -1.75732421875, -1.3494873046875, -0.941650390625, -0.5338134765625, -0.1259765625, 0.2818603515625, 0.689697265625, 1.0975341796875, 1.50537109375, 1.9132080078125, 2.321044921875, 2.7288818359375, 3.13671875, 3.5445556640625, 3.952392578125, 4.3602294921875, 4.76806640625, 5.1759033203125, 5.583740234375, 5.9915771484375, 6.3994140625, 6.8072509765625, 7.215087890625, 7.6229248046875, 8.03076171875, 8.4385986328125, 8.846435546875, 9.2542724609375, 9.662109375, 10.0699462890625, 10.477783203125, 10.8856201171875, 11.29345703125, 11.7012939453125, 12.109130859375, 12.5169677734375, 12.9248046875, 13.3326416015625, 13.740478515625, 14.1483154296875, 14.55615234375, 14.9639892578125, 15.371826171875, 15.7796630859375, 16.1875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 9.0, 4.0, 22.0, 21.0, 29.0, 32.0, 52.0, 96.0, 137.0, 216.0, 302.0, 526.0, 731.0, 1140.0, 1783.0, 2701.0, 4409.0, 6682.0, 10563.0, 16257.0, 25016.0, 37983.0, 55527.0, 76937.0, 99498.0, 118346.0, 126291.0, 118813.0, 100309.0, 77414.0, 56051.0, 38819.0, 25400.0, 16689.0, 10635.0, 6780.0, 4314.0, 2770.0, 1868.0, 1176.0, 715.0, 472.0, 345.0, 214.0, 151.0, 105.0, 75.0, 41.0, 27.0, 23.0, 11.0, 9.0, 8.0, 7.0, 6.0, 1.0, 0.0, 5.0], "bins": [-13.0078125, -12.6077880859375, -12.207763671875, -11.8077392578125, -11.40771484375, -11.0076904296875, -10.607666015625, -10.2076416015625, -9.8076171875, -9.4075927734375, -9.007568359375, -8.6075439453125, -8.20751953125, -7.8074951171875, -7.407470703125, -7.0074462890625, -6.607421875, -6.2073974609375, -5.807373046875, -5.4073486328125, -5.00732421875, -4.6072998046875, -4.207275390625, -3.8072509765625, -3.4072265625, -3.0072021484375, -2.607177734375, -2.2071533203125, -1.80712890625, -1.4071044921875, -1.007080078125, -0.6070556640625, -0.20703125, 0.1929931640625, 0.593017578125, 0.9930419921875, 1.39306640625, 1.7930908203125, 2.193115234375, 2.5931396484375, 2.9931640625, 3.3931884765625, 3.793212890625, 4.1932373046875, 4.59326171875, 4.9932861328125, 5.393310546875, 5.7933349609375, 6.193359375, 6.5933837890625, 6.993408203125, 7.3934326171875, 7.79345703125, 8.1934814453125, 8.593505859375, 8.9935302734375, 9.3935546875, 9.7935791015625, 10.193603515625, 10.5936279296875, 10.99365234375, 11.3936767578125, 11.793701171875, 12.1937255859375, 12.59375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 5.0, 8.0, 2.0, 8.0, 12.0, 14.0, 17.0, 9.0, 19.0, 19.0, 27.0, 21.0, 35.0, 29.0, 28.0, 29.0, 39.0, 43.0, 54.0, 42.0, 40.0, 42.0, 34.0, 38.0, 45.0, 45.0, 40.0, 31.0, 22.0, 29.0, 29.0, 29.0, 18.0, 21.0, 16.0, 9.0, 7.0, 7.0, 6.0, 6.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.2720947265625, -6.071533203125, -5.8709716796875, -5.67041015625, -5.4698486328125, -5.269287109375, -5.0687255859375, -4.8681640625, -4.6676025390625, -4.467041015625, -4.2664794921875, -4.06591796875, -3.8653564453125, -3.664794921875, -3.4642333984375, -3.263671875, -3.0631103515625, -2.862548828125, -2.6619873046875, -2.46142578125, -2.2608642578125, -2.060302734375, -1.8597412109375, -1.6591796875, -1.4586181640625, -1.258056640625, -1.0574951171875, -0.85693359375, -0.6563720703125, -0.455810546875, -0.2552490234375, -0.0546875, 0.1458740234375, 0.346435546875, 0.5469970703125, 0.74755859375, 0.9481201171875, 1.148681640625, 1.3492431640625, 1.5498046875, 1.7503662109375, 1.950927734375, 2.1514892578125, 2.35205078125, 2.5526123046875, 2.753173828125, 2.9537353515625, 3.154296875, 3.3548583984375, 3.555419921875, 3.7559814453125, 3.95654296875, 4.1571044921875, 4.357666015625, 4.5582275390625, 4.7587890625, 4.9593505859375, 5.159912109375, 5.3604736328125, 5.56103515625, 5.7615966796875, 5.962158203125, 6.1627197265625, 6.36328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 12.0, 21.0, 17.0, 17.0, 30.0, 58.0, 63.0, 121.0, 163.0, 248.0, 339.0, 449.0, 642.0, 964.0, 1292.0, 1971.0, 2881.0, 4419.0, 6555.0, 10464.0, 16818.0, 28832.0, 51259.0, 93271.0, 163058.0, 218812.0, 184976.0, 111549.0, 60731.0, 33922.0, 19858.0, 12051.0, 7425.0, 4889.0, 3290.0, 2127.0, 1514.0, 1062.0, 734.0, 501.0, 343.0, 257.0, 177.0, 120.0, 78.0, 60.0, 29.0, 31.0, 25.0, 8.0, 10.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0], "bins": [-10.828125, -10.4859619140625, -10.143798828125, -9.8016357421875, -9.45947265625, -9.1173095703125, -8.775146484375, -8.4329833984375, -8.0908203125, -7.7486572265625, -7.406494140625, -7.0643310546875, -6.72216796875, -6.3800048828125, -6.037841796875, -5.6956787109375, -5.353515625, -5.0113525390625, -4.669189453125, -4.3270263671875, -3.98486328125, -3.6427001953125, -3.300537109375, -2.9583740234375, -2.6162109375, -2.2740478515625, -1.931884765625, -1.5897216796875, -1.24755859375, -0.9053955078125, -0.563232421875, -0.2210693359375, 0.12109375, 0.4632568359375, 0.805419921875, 1.1475830078125, 1.48974609375, 1.8319091796875, 2.174072265625, 2.5162353515625, 2.8583984375, 3.2005615234375, 3.542724609375, 3.8848876953125, 4.22705078125, 4.5692138671875, 4.911376953125, 5.2535400390625, 5.595703125, 5.9378662109375, 6.280029296875, 6.6221923828125, 6.96435546875, 7.3065185546875, 7.648681640625, 7.9908447265625, 8.3330078125, 8.6751708984375, 9.017333984375, 9.3594970703125, 9.70166015625, 10.0438232421875, 10.385986328125, 10.7281494140625, 11.0703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 6.0, 7.0, 11.0, 8.0, 12.0, 22.0, 14.0, 29.0, 28.0, 57.0, 50.0, 56.0, 57.0, 71.0, 77.0, 100.0, 73.0, 55.0, 44.0, 44.0, 27.0, 22.0, 17.0, 24.0, 15.0, 8.0, 13.0, 10.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00109100341796875, -0.0010495781898498535, -0.001008152961730957, -0.0009667277336120605, -0.0009253025054931641, -0.0008838772773742676, -0.0008424520492553711, -0.0008010268211364746, -0.0007596015930175781, -0.0007181763648986816, -0.0006767511367797852, -0.0006353259086608887, -0.0005939006805419922, -0.0005524754524230957, -0.0005110502243041992, -0.00046962499618530273, -0.00042819976806640625, -0.00038677453994750977, -0.0003453493118286133, -0.0003039240837097168, -0.0002624988555908203, -0.00022107362747192383, -0.00017964839935302734, -0.00013822317123413086, -9.679794311523438e-05, -5.537271499633789e-05, -1.3947486877441406e-05, 2.7477741241455078e-05, 6.890296936035156e-05, 0.00011032819747924805, 0.00015175342559814453, 0.00019317865371704102, 0.0002346038818359375, 0.000276029109954834, 0.00031745433807373047, 0.00035887956619262695, 0.00040030479431152344, 0.0004417300224304199, 0.0004831552505493164, 0.0005245804786682129, 0.0005660057067871094, 0.0006074309349060059, 0.0006488561630249023, 0.0006902813911437988, 0.0007317066192626953, 0.0007731318473815918, 0.0008145570755004883, 0.0008559823036193848, 0.0008974075317382812, 0.0009388327598571777, 0.0009802579879760742, 0.0010216832160949707, 0.0010631084442138672, 0.0011045336723327637, 0.0011459589004516602, 0.0011873841285705566, 0.0012288093566894531, 0.0012702345848083496, 0.001311659812927246, 0.0013530850410461426, 0.001394510269165039, 0.0014359354972839355, 0.001477360725402832, 0.0015187859535217285, 0.001560211181640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 10.0, 16.0, 5.0, 29.0, 39.0, 52.0, 86.0, 112.0, 176.0, 278.0, 392.0, 575.0, 912.0, 1446.0, 2186.0, 3577.0, 5569.0, 9457.0, 16076.0, 28420.0, 51911.0, 95075.0, 160080.0, 210813.0, 187389.0, 119923.0, 66760.0, 36362.0, 20359.0, 11595.0, 6928.0, 4250.0, 2686.0, 1730.0, 1117.0, 745.0, 489.0, 306.0, 205.0, 148.0, 87.0, 55.0, 41.0, 37.0, 15.0, 16.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.2734375, -8.971435546875, -8.66943359375, -8.367431640625, -8.0654296875, -7.763427734375, -7.46142578125, -7.159423828125, -6.857421875, -6.555419921875, -6.25341796875, -5.951416015625, -5.6494140625, -5.347412109375, -5.04541015625, -4.743408203125, -4.44140625, -4.139404296875, -3.83740234375, -3.535400390625, -3.2333984375, -2.931396484375, -2.62939453125, -2.327392578125, -2.025390625, -1.723388671875, -1.42138671875, -1.119384765625, -0.8173828125, -0.515380859375, -0.21337890625, 0.088623046875, 0.390625, 0.692626953125, 0.99462890625, 1.296630859375, 1.5986328125, 1.900634765625, 2.20263671875, 2.504638671875, 2.806640625, 3.108642578125, 3.41064453125, 3.712646484375, 4.0146484375, 4.316650390625, 4.61865234375, 4.920654296875, 5.22265625, 5.524658203125, 5.82666015625, 6.128662109375, 6.4306640625, 6.732666015625, 7.03466796875, 7.336669921875, 7.638671875, 7.940673828125, 8.24267578125, 8.544677734375, 8.8466796875, 9.148681640625, 9.45068359375, 9.752685546875, 10.0546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 10.0, 10.0, 16.0, 13.0, 22.0, 25.0, 25.0, 36.0, 45.0, 60.0, 73.0, 70.0, 77.0, 84.0, 72.0, 68.0, 46.0, 53.0, 35.0, 26.0, 24.0, 25.0, 11.0, 9.0, 9.0, 13.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.20703125, -3.10699462890625, -3.0069580078125, -2.90692138671875, -2.806884765625, -2.70684814453125, -2.6068115234375, -2.50677490234375, -2.40673828125, -2.30670166015625, -2.2066650390625, -2.10662841796875, -2.006591796875, -1.90655517578125, -1.8065185546875, -1.70648193359375, -1.6064453125, -1.50640869140625, -1.4063720703125, -1.30633544921875, -1.206298828125, -1.10626220703125, -1.0062255859375, -0.90618896484375, -0.80615234375, -0.70611572265625, -0.6060791015625, -0.50604248046875, -0.406005859375, -0.30596923828125, -0.2059326171875, -0.10589599609375, -0.005859375, 0.09417724609375, 0.1942138671875, 0.29425048828125, 0.394287109375, 0.49432373046875, 0.5943603515625, 0.69439697265625, 0.79443359375, 0.89447021484375, 0.9945068359375, 1.09454345703125, 1.194580078125, 1.29461669921875, 1.3946533203125, 1.49468994140625, 1.5947265625, 1.69476318359375, 1.7947998046875, 1.89483642578125, 1.994873046875, 2.09490966796875, 2.1949462890625, 2.29498291015625, 2.39501953125, 2.49505615234375, 2.5950927734375, 2.69512939453125, 2.795166015625, 2.89520263671875, 2.9952392578125, 3.09527587890625, 3.1953125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 5.0, 12.0, 17.0, 16.0, 20.0, 22.0, 27.0, 35.0, 48.0, 41.0, 58.0, 56.0, 64.0, 77.0, 77.0, 58.0, 48.0, 51.0, 45.0, 44.0, 31.0, 30.0, 23.0, 18.0, 12.0, 7.0, 8.0, 6.0, 9.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.015472412109375, -20.329940795898438, -19.644407272338867, -18.958873748779297, -18.27334213256836, -17.587810516357422, -16.90227699279785, -16.21674346923828, -15.531211853027344, -14.84567928314209, -14.160146713256836, -13.474614143371582, -12.789081573486328, -12.103549003601074, -11.41801643371582, -10.732483863830566, -10.046951293945312, -9.361418724060059, -8.675886154174805, -7.990353584289551, -7.304821014404297, -6.619288444519043, -5.933755874633789, -5.248223304748535, -4.562690734863281, -3.8771581649780273, -3.1916255950927734, -2.5060930252075195, -1.8205604553222656, -1.1350278854370117, -0.4494953155517578, 0.2360372543334961, 0.92156982421875, 1.607102394104004, 2.292634963989258, 2.9781675338745117, 3.6637001037597656, 4.3492326736450195, 5.034765243530273, 5.720297813415527, 6.405830383300781, 7.091362953186035, 7.776895523071289, 8.462428092956543, 9.147960662841797, 9.83349323272705, 10.519025802612305, 11.204558372497559, 11.890090942382812, 12.575623512268066, 13.26115608215332, 13.946688652038574, 14.632221221923828, 15.317753791809082, 16.003286361694336, 16.688819885253906, 17.374351501464844, 18.05988311767578, 18.74541664123535, 19.430950164794922, 20.11648178100586, 20.802013397216797, 21.487546920776367, 22.173080444335938, 22.858612060546875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 3.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 11.0, 17.0, 21.0, 23.0, 18.0, 30.0, 30.0, 17.0, 25.0, 37.0, 39.0, 41.0, 33.0, 36.0, 43.0, 37.0, 41.0, 36.0, 44.0, 40.0, 34.0, 26.0, 34.0, 31.0, 24.0, 25.0, 25.0, 18.0, 16.0, 14.0, 15.0, 13.0, 17.0, 5.0, 8.0, 7.0, 3.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-10.551229476928711, -10.25379467010498, -9.956360816955566, -9.658926010131836, -9.361491203308105, -9.064057350158691, -8.766622543334961, -8.469188690185547, -8.171753883361816, -7.874319553375244, -7.576884746551514, -7.279450416564941, -6.982016086578369, -6.684581756591797, -6.387146949768066, -6.089712619781494, -5.792277812957764, -5.494843482971191, -5.197408676147461, -4.899974346160889, -4.602540016174316, -4.305105209350586, -4.007670879364014, -3.7102365493774414, -3.41280198097229, -3.1153674125671387, -2.8179330825805664, -2.520498514175415, -2.2230639457702637, -1.9256296157836914, -1.62819504737854, -1.3307607173919678, -1.0333261489868164, -0.7358916997909546, -0.438457190990448, -0.1410226821899414, 0.1564117670059204, 0.4538462162017822, 0.7512807846069336, 1.0487151145935059, 1.3461496829986572, 1.643584132194519, 1.9410185813903809, 2.2384531497955322, 2.5358877182006836, 2.833322048187256, 3.1307566165924072, 3.4281909465789795, 3.725625514984131, 4.023059844970703, 4.320494651794434, 4.617928981781006, 4.915363311767578, 5.212798118591309, 5.510232448577881, 5.807666778564453, 6.105101585388184, 6.402535915374756, 6.699970722198486, 6.997405052185059, 7.294839382171631, 7.592273712158203, 7.889708518981934, 8.187143325805664, 8.484577178955078]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 10.0, 15.0, 22.0, 31.0, 47.0, 60.0, 84.0, 137.0, 221.0, 340.0, 558.0, 964.0, 1584.0, 3008.0, 5452.0, 10598.0, 22913.0, 50169.0, 118510.0, 298956.0, 761194.0, 1316778.0, 942052.0, 390717.0, 152590.0, 62293.0, 27534.0, 12859.0, 6501.0, 3307.0, 1939.0, 1072.0, 631.0, 393.0, 250.0, 140.0, 126.0, 60.0, 50.0, 31.0, 22.0, 17.0, 13.0, 10.0, 3.0, 3.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-19.90625, -19.18603515625, -18.4658203125, -17.74560546875, -17.025390625, -16.30517578125, -15.5849609375, -14.86474609375, -14.14453125, -13.42431640625, -12.7041015625, -11.98388671875, -11.263671875, -10.54345703125, -9.8232421875, -9.10302734375, -8.3828125, -7.66259765625, -6.9423828125, -6.22216796875, -5.501953125, -4.78173828125, -4.0615234375, -3.34130859375, -2.62109375, -1.90087890625, -1.1806640625, -0.46044921875, 0.259765625, 0.97998046875, 1.7001953125, 2.42041015625, 3.140625, 3.86083984375, 4.5810546875, 5.30126953125, 6.021484375, 6.74169921875, 7.4619140625, 8.18212890625, 8.90234375, 9.62255859375, 10.3427734375, 11.06298828125, 11.783203125, 12.50341796875, 13.2236328125, 13.94384765625, 14.6640625, 15.38427734375, 16.1044921875, 16.82470703125, 17.544921875, 18.26513671875, 18.9853515625, 19.70556640625, 20.42578125, 21.14599609375, 21.8662109375, 22.58642578125, 23.306640625, 24.02685546875, 24.7470703125, 25.46728515625, 26.1875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 8.0, 6.0, 5.0, 11.0, 12.0, 26.0, 16.0, 30.0, 29.0, 37.0, 38.0, 41.0, 55.0, 56.0, 49.0, 54.0, 58.0, 58.0, 63.0, 61.0, 43.0, 34.0, 44.0, 34.0, 25.0, 22.0, 31.0, 18.0, 10.0, 9.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.399169921875, -9.04052734375, -8.681884765625, -8.3232421875, -7.964599609375, -7.60595703125, -7.247314453125, -6.888671875, -6.530029296875, -6.17138671875, -5.812744140625, -5.4541015625, -5.095458984375, -4.73681640625, -4.378173828125, -4.01953125, -3.660888671875, -3.30224609375, -2.943603515625, -2.5849609375, -2.226318359375, -1.86767578125, -1.509033203125, -1.150390625, -0.791748046875, -0.43310546875, -0.074462890625, 0.2841796875, 0.642822265625, 1.00146484375, 1.360107421875, 1.71875, 2.077392578125, 2.43603515625, 2.794677734375, 3.1533203125, 3.511962890625, 3.87060546875, 4.229248046875, 4.587890625, 4.946533203125, 5.30517578125, 5.663818359375, 6.0224609375, 6.381103515625, 6.73974609375, 7.098388671875, 7.45703125, 7.815673828125, 8.17431640625, 8.532958984375, 8.8916015625, 9.250244140625, 9.60888671875, 9.967529296875, 10.326171875, 10.684814453125, 11.04345703125, 11.402099609375, 11.7607421875, 12.119384765625, 12.47802734375, 12.836669921875, 13.1953125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 11.0, 20.0, 21.0, 36.0, 79.0, 98.0, 160.0, 259.0, 435.0, 809.0, 1465.0, 2569.0, 4827.0, 9538.0, 19315.0, 42011.0, 93380.0, 215331.0, 485968.0, 952529.0, 1123965.0, 678551.0, 311800.0, 136639.0, 59593.0, 27360.0, 13170.0, 6606.0, 3385.0, 1905.0, 948.0, 639.0, 321.0, 204.0, 128.0, 77.0, 49.0, 33.0, 25.0, 8.0, 6.0, 6.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.625, -25.869140625, -25.11328125, -24.357421875, -23.6015625, -22.845703125, -22.08984375, -21.333984375, -20.578125, -19.822265625, -19.06640625, -18.310546875, -17.5546875, -16.798828125, -16.04296875, -15.287109375, -14.53125, -13.775390625, -13.01953125, -12.263671875, -11.5078125, -10.751953125, -9.99609375, -9.240234375, -8.484375, -7.728515625, -6.97265625, -6.216796875, -5.4609375, -4.705078125, -3.94921875, -3.193359375, -2.4375, -1.681640625, -0.92578125, -0.169921875, 0.5859375, 1.341796875, 2.09765625, 2.853515625, 3.609375, 4.365234375, 5.12109375, 5.876953125, 6.6328125, 7.388671875, 8.14453125, 8.900390625, 9.65625, 10.412109375, 11.16796875, 11.923828125, 12.6796875, 13.435546875, 14.19140625, 14.947265625, 15.703125, 16.458984375, 17.21484375, 17.970703125, 18.7265625, 19.482421875, 20.23828125, 20.994140625, 21.75]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 14.0, 20.0, 15.0, 28.0, 39.0, 60.0, 70.0, 112.0, 146.0, 182.0, 246.0, 273.0, 278.0, 326.0, 312.0, 364.0, 308.0, 283.0, 212.0, 180.0, 159.0, 121.0, 80.0, 58.0, 49.0, 48.0, 25.0, 10.0, 12.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.38525390625, -8.1611328125, -7.93701171875, -7.712890625, -7.48876953125, -7.2646484375, -7.04052734375, -6.81640625, -6.59228515625, -6.3681640625, -6.14404296875, -5.919921875, -5.69580078125, -5.4716796875, -5.24755859375, -5.0234375, -4.79931640625, -4.5751953125, -4.35107421875, -4.126953125, -3.90283203125, -3.6787109375, -3.45458984375, -3.23046875, -3.00634765625, -2.7822265625, -2.55810546875, -2.333984375, -2.10986328125, -1.8857421875, -1.66162109375, -1.4375, -1.21337890625, -0.9892578125, -0.76513671875, -0.541015625, -0.31689453125, -0.0927734375, 0.13134765625, 0.35546875, 0.57958984375, 0.8037109375, 1.02783203125, 1.251953125, 1.47607421875, 1.7001953125, 1.92431640625, 2.1484375, 2.37255859375, 2.5966796875, 2.82080078125, 3.044921875, 3.26904296875, 3.4931640625, 3.71728515625, 3.94140625, 4.16552734375, 4.3896484375, 4.61376953125, 4.837890625, 5.06201171875, 5.2861328125, 5.51025390625, 5.734375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 14.0, 13.0, 14.0, 18.0, 29.0, 38.0, 46.0, 52.0, 75.0, 66.0, 73.0, 90.0, 73.0, 77.0, 63.0, 62.0, 33.0, 45.0, 23.0, 22.0, 16.0, 16.0, 6.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.674388885498047, -23.811080932617188, -22.947772979736328, -22.08446502685547, -21.22115707397461, -20.35784912109375, -19.494543075561523, -18.631235122680664, -17.767927169799805, -16.904619216918945, -16.041311264038086, -15.178004264831543, -14.314696311950684, -13.451388359069824, -12.588081359863281, -11.724773406982422, -10.861465454101562, -9.998157501220703, -9.134849548339844, -8.2715425491333, -7.408234596252441, -6.544926643371582, -5.681619167327881, -4.81831169128418, -3.9550037384033203, -3.09169602394104, -2.2283883094787598, -1.3650805950164795, -0.5017728805541992, 0.36153507232666016, 1.2248425483703613, 2.0881500244140625, 2.951457977294922, 3.814765691757202, 4.678073406219482, 5.541380882263184, 6.404688835144043, 7.267996788024902, 8.131303787231445, 8.994611740112305, 9.857919692993164, 10.721227645874023, 11.584535598754883, 12.447842597961426, 13.311150550842285, 14.174458503723145, 15.037765502929688, 15.901073455810547, 16.764381408691406, 17.627689361572266, 18.490997314453125, 19.354305267333984, 20.217613220214844, 21.080921173095703, 21.94422721862793, 22.80753517150879, 23.67084312438965, 24.534151077270508, 25.397459030151367, 26.260766983032227, 27.124073028564453, 27.987380981445312, 28.850688934326172, 29.71399688720703, 30.57730484008789]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 6.0, 3.0, 8.0, 5.0, 12.0, 5.0, 8.0, 14.0, 22.0, 18.0, 12.0, 11.0, 30.0, 30.0, 30.0, 29.0, 33.0, 31.0, 36.0, 40.0, 40.0, 43.0, 43.0, 37.0, 41.0, 40.0, 33.0, 33.0, 38.0, 18.0, 37.0, 22.0, 22.0, 22.0, 21.0, 18.0, 17.0, 12.0, 11.0, 15.0, 15.0, 7.0, 10.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.755313873291016, -10.445636749267578, -10.13595962524414, -9.826282501220703, -9.516605377197266, -9.206928253173828, -8.89725112915039, -8.587574005126953, -8.277896881103516, -7.968219757080078, -7.658542633056641, -7.348865509033203, -7.039188385009766, -6.729511260986328, -6.419834613800049, -6.110157489776611, -5.800480842590332, -5.4908037185668945, -5.181126594543457, -4.8714494705200195, -4.561772346496582, -4.2520952224731445, -3.9424185752868652, -3.6327414512634277, -3.3230643272399902, -3.0133872032165527, -2.7037100791931152, -2.394033193588257, -2.0843560695648193, -1.7746789455413818, -1.4650019407272339, -1.155324935913086, -0.8456487655639648, -0.5359717011451721, -0.2262946367263794, 0.08338242769241333, 0.39305949211120605, 0.7027366161346436, 1.0124136209487915, 1.3220906257629395, 1.631767749786377, 1.9414448738098145, 2.251121997833252, 2.5607988834381104, 2.870476007461548, 3.1801531314849854, 3.4898300170898438, 3.7995071411132812, 4.109184265136719, 4.418861389160156, 4.728538513183594, 5.038215637207031, 5.347892761230469, 5.657569885253906, 5.9672465324401855, 6.276923656463623, 6.5866007804870605, 6.896277904510498, 7.2059550285339355, 7.515632152557373, 7.825308799743652, 8.13498592376709, 8.444663047790527, 8.754340171813965, 9.064017295837402]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 9.0, 6.0, 8.0, 9.0, 11.0, 18.0, 27.0, 47.0, 70.0, 88.0, 118.0, 247.0, 319.0, 512.0, 858.0, 1682.0, 2787.0, 5615.0, 11143.0, 23089.0, 48031.0, 96707.0, 170518.0, 228127.0, 201876.0, 127258.0, 65861.0, 31815.0, 15205.0, 7600.0, 3853.0, 2070.0, 1155.0, 673.0, 388.0, 230.0, 154.0, 101.0, 81.0, 49.0, 46.0, 36.0, 18.0, 17.0, 10.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7265625, -12.312255859375, -11.89794921875, -11.483642578125, -11.0693359375, -10.655029296875, -10.24072265625, -9.826416015625, -9.412109375, -8.997802734375, -8.58349609375, -8.169189453125, -7.7548828125, -7.340576171875, -6.92626953125, -6.511962890625, -6.09765625, -5.683349609375, -5.26904296875, -4.854736328125, -4.4404296875, -4.026123046875, -3.61181640625, -3.197509765625, -2.783203125, -2.368896484375, -1.95458984375, -1.540283203125, -1.1259765625, -0.711669921875, -0.29736328125, 0.116943359375, 0.53125, 0.945556640625, 1.35986328125, 1.774169921875, 2.1884765625, 2.602783203125, 3.01708984375, 3.431396484375, 3.845703125, 4.260009765625, 4.67431640625, 5.088623046875, 5.5029296875, 5.917236328125, 6.33154296875, 6.745849609375, 7.16015625, 7.574462890625, 7.98876953125, 8.403076171875, 8.8173828125, 9.231689453125, 9.64599609375, 10.060302734375, 10.474609375, 10.888916015625, 11.30322265625, 11.717529296875, 12.1318359375, 12.546142578125, 12.96044921875, 13.374755859375, 13.7890625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 10.0, 8.0, 12.0, 10.0, 21.0, 16.0, 13.0, 22.0, 26.0, 37.0, 29.0, 35.0, 41.0, 37.0, 38.0, 32.0, 50.0, 52.0, 48.0, 48.0, 37.0, 41.0, 43.0, 42.0, 30.0, 31.0, 21.0, 21.0, 23.0, 23.0, 18.0, 17.0, 15.0, 9.0, 4.0, 8.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.796875, -12.4193115234375, -12.041748046875, -11.6641845703125, -11.28662109375, -10.9090576171875, -10.531494140625, -10.1539306640625, -9.7763671875, -9.3988037109375, -9.021240234375, -8.6436767578125, -8.26611328125, -7.8885498046875, -7.510986328125, -7.1334228515625, -6.755859375, -6.3782958984375, -6.000732421875, -5.6231689453125, -5.24560546875, -4.8680419921875, -4.490478515625, -4.1129150390625, -3.7353515625, -3.3577880859375, -2.980224609375, -2.6026611328125, -2.22509765625, -1.8475341796875, -1.469970703125, -1.0924072265625, -0.71484375, -0.3372802734375, 0.040283203125, 0.4178466796875, 0.79541015625, 1.1729736328125, 1.550537109375, 1.9281005859375, 2.3056640625, 2.6832275390625, 3.060791015625, 3.4383544921875, 3.81591796875, 4.1934814453125, 4.571044921875, 4.9486083984375, 5.326171875, 5.7037353515625, 6.081298828125, 6.4588623046875, 6.83642578125, 7.2139892578125, 7.591552734375, 7.9691162109375, 8.3466796875, 8.7242431640625, 9.101806640625, 9.4793701171875, 9.85693359375, 10.2344970703125, 10.612060546875, 10.9896240234375, 11.3671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 10.0, 14.0, 11.0, 16.0, 27.0, 45.0, 75.0, 119.0, 224.0, 342.0, 631.0, 1079.0, 1912.0, 3746.0, 7298.0, 15415.0, 33274.0, 72425.0, 150772.0, 256561.0, 243005.0, 137768.0, 65079.0, 30360.0, 13942.0, 6786.0, 3515.0, 1741.0, 970.0, 544.0, 312.0, 201.0, 132.0, 66.0, 41.0, 37.0, 23.0, 12.0, 8.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.359375, -15.862548828125, -15.36572265625, -14.868896484375, -14.3720703125, -13.875244140625, -13.37841796875, -12.881591796875, -12.384765625, -11.887939453125, -11.39111328125, -10.894287109375, -10.3974609375, -9.900634765625, -9.40380859375, -8.906982421875, -8.41015625, -7.913330078125, -7.41650390625, -6.919677734375, -6.4228515625, -5.926025390625, -5.42919921875, -4.932373046875, -4.435546875, -3.938720703125, -3.44189453125, -2.945068359375, -2.4482421875, -1.951416015625, -1.45458984375, -0.957763671875, -0.4609375, 0.035888671875, 0.53271484375, 1.029541015625, 1.5263671875, 2.023193359375, 2.52001953125, 3.016845703125, 3.513671875, 4.010498046875, 4.50732421875, 5.004150390625, 5.5009765625, 5.997802734375, 6.49462890625, 6.991455078125, 7.48828125, 7.985107421875, 8.48193359375, 8.978759765625, 9.4755859375, 9.972412109375, 10.46923828125, 10.966064453125, 11.462890625, 11.959716796875, 12.45654296875, 12.953369140625, 13.4501953125, 13.947021484375, 14.44384765625, 14.940673828125, 15.4375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 19.0, 8.0, 13.0, 13.0, 14.0, 19.0, 15.0, 28.0, 28.0, 20.0, 30.0, 39.0, 34.0, 41.0, 41.0, 38.0, 38.0, 35.0, 44.0, 39.0, 44.0, 41.0, 33.0, 36.0, 35.0, 35.0, 27.0, 23.0, 19.0, 21.0, 15.0, 19.0, 13.0, 18.0, 11.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6953125, -5.4979248046875, -5.300537109375, -5.1031494140625, -4.90576171875, -4.7083740234375, -4.510986328125, -4.3135986328125, -4.1162109375, -3.9188232421875, -3.721435546875, -3.5240478515625, -3.32666015625, -3.1292724609375, -2.931884765625, -2.7344970703125, -2.537109375, -2.3397216796875, -2.142333984375, -1.9449462890625, -1.74755859375, -1.5501708984375, -1.352783203125, -1.1553955078125, -0.9580078125, -0.7606201171875, -0.563232421875, -0.3658447265625, -0.16845703125, 0.0289306640625, 0.226318359375, 0.4237060546875, 0.62109375, 0.8184814453125, 1.015869140625, 1.2132568359375, 1.41064453125, 1.6080322265625, 1.805419921875, 2.0028076171875, 2.2001953125, 2.3975830078125, 2.594970703125, 2.7923583984375, 2.98974609375, 3.1871337890625, 3.384521484375, 3.5819091796875, 3.779296875, 3.9766845703125, 4.174072265625, 4.3714599609375, 4.56884765625, 4.7662353515625, 4.963623046875, 5.1610107421875, 5.3583984375, 5.5557861328125, 5.753173828125, 5.9505615234375, 6.14794921875, 6.3453369140625, 6.542724609375, 6.7401123046875, 6.9375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 13.0, 18.0, 27.0, 41.0, 61.0, 91.0, 121.0, 193.0, 263.0, 369.0, 596.0, 832.0, 1158.0, 1761.0, 2609.0, 3890.0, 5881.0, 9023.0, 13436.0, 20784.0, 32354.0, 50246.0, 77524.0, 115310.0, 155103.0, 164577.0, 131786.0, 90966.0, 59402.0, 38364.0, 24656.0, 15910.0, 10437.0, 6907.0, 4517.0, 3028.0, 2004.0, 1347.0, 938.0, 627.0, 411.0, 283.0, 205.0, 148.0, 95.0, 83.0, 59.0, 31.0, 14.0, 16.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-4.796875, -4.64788818359375, -4.4989013671875, -4.34991455078125, -4.200927734375, -4.05194091796875, -3.9029541015625, -3.75396728515625, -3.60498046875, -3.45599365234375, -3.3070068359375, -3.15802001953125, -3.009033203125, -2.86004638671875, -2.7110595703125, -2.56207275390625, -2.4130859375, -2.26409912109375, -2.1151123046875, -1.96612548828125, -1.817138671875, -1.66815185546875, -1.5191650390625, -1.37017822265625, -1.22119140625, -1.07220458984375, -0.9232177734375, -0.77423095703125, -0.625244140625, -0.47625732421875, -0.3272705078125, -0.17828369140625, -0.029296875, 0.11968994140625, 0.2686767578125, 0.41766357421875, 0.566650390625, 0.71563720703125, 0.8646240234375, 1.01361083984375, 1.16259765625, 1.31158447265625, 1.4605712890625, 1.60955810546875, 1.758544921875, 1.90753173828125, 2.0565185546875, 2.20550537109375, 2.3544921875, 2.50347900390625, 2.6524658203125, 2.80145263671875, 2.950439453125, 3.09942626953125, 3.2484130859375, 3.39739990234375, 3.54638671875, 3.69537353515625, 3.8443603515625, 3.99334716796875, 4.142333984375, 4.29132080078125, 4.4403076171875, 4.58929443359375, 4.73828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 10.0, 10.0, 9.0, 20.0, 26.0, 24.0, 28.0, 24.0, 42.0, 52.0, 61.0, 65.0, 57.0, 62.0, 51.0, 55.0, 71.0, 52.0, 53.0, 41.0, 39.0, 23.0, 19.0, 17.0, 14.0, 16.0, 9.0, 9.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00033473968505859375, -0.00032487884163856506, -0.0003150179982185364, -0.0003051571547985077, -0.000295296311378479, -0.0002854354679584503, -0.00027557462453842163, -0.00026571378111839294, -0.00025585293769836426, -0.00024599209427833557, -0.00023613125085830688, -0.0002262704074382782, -0.0002164095640182495, -0.00020654872059822083, -0.00019668787717819214, -0.00018682703375816345, -0.00017696619033813477, -0.00016710534691810608, -0.0001572445034980774, -0.0001473836600780487, -0.00013752281665802002, -0.00012766197323799133, -0.00011780112981796265, -0.00010794028639793396, -9.807944297790527e-05, -8.821859955787659e-05, -7.83577561378479e-05, -6.849691271781921e-05, -5.863606929779053e-05, -4.877522587776184e-05, -3.8914382457733154e-05, -2.9053539037704468e-05, -1.919269561767578e-05, -9.331852197647095e-06, 5.289912223815918e-07, 1.0389834642410278e-05, 2.0250678062438965e-05, 3.011152148246765e-05, 3.997236490249634e-05, 4.9833208322525024e-05, 5.969405174255371e-05, 6.95548951625824e-05, 7.941573858261108e-05, 8.927658200263977e-05, 9.913742542266846e-05, 0.00010899826884269714, 0.00011885911226272583, 0.00012871995568275452, 0.0001385807991027832, 0.0001484416425228119, 0.00015830248594284058, 0.00016816332936286926, 0.00017802417278289795, 0.00018788501620292664, 0.00019774585962295532, 0.000207606703042984, 0.0002174675464630127, 0.00022732838988304138, 0.00023718923330307007, 0.00024705007672309875, 0.00025691092014312744, 0.00026677176356315613, 0.0002766326069831848, 0.0002864934504032135, 0.0002963542938232422]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 26.0, 37.0, 48.0, 70.0, 94.0, 124.0, 228.0, 321.0, 447.0, 752.0, 1101.0, 1756.0, 2736.0, 4284.0, 6593.0, 10535.0, 16142.0, 25430.0, 38980.0, 59299.0, 85086.0, 114902.0, 135758.0, 138299.0, 121389.0, 93390.0, 66255.0, 44093.0, 28831.0, 18630.0, 11784.0, 7607.0, 4683.0, 3090.0, 1965.0, 1259.0, 878.0, 517.0, 351.0, 287.0, 157.0, 103.0, 78.0, 50.0, 31.0, 27.0, 15.0, 10.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.4296875, -4.2918701171875, -4.154052734375, -4.0162353515625, -3.87841796875, -3.7406005859375, -3.602783203125, -3.4649658203125, -3.3271484375, -3.1893310546875, -3.051513671875, -2.9136962890625, -2.77587890625, -2.6380615234375, -2.500244140625, -2.3624267578125, -2.224609375, -2.0867919921875, -1.948974609375, -1.8111572265625, -1.67333984375, -1.5355224609375, -1.397705078125, -1.2598876953125, -1.1220703125, -0.9842529296875, -0.846435546875, -0.7086181640625, -0.57080078125, -0.4329833984375, -0.295166015625, -0.1573486328125, -0.01953125, 0.1182861328125, 0.256103515625, 0.3939208984375, 0.53173828125, 0.6695556640625, 0.807373046875, 0.9451904296875, 1.0830078125, 1.2208251953125, 1.358642578125, 1.4964599609375, 1.63427734375, 1.7720947265625, 1.909912109375, 2.0477294921875, 2.185546875, 2.3233642578125, 2.461181640625, 2.5989990234375, 2.73681640625, 2.8746337890625, 3.012451171875, 3.1502685546875, 3.2880859375, 3.4259033203125, 3.563720703125, 3.7015380859375, 3.83935546875, 3.9771728515625, 4.114990234375, 4.2528076171875, 4.390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 7.0, 10.0, 6.0, 12.0, 22.0, 22.0, 22.0, 29.0, 36.0, 32.0, 35.0, 49.0, 41.0, 50.0, 43.0, 59.0, 59.0, 53.0, 61.0, 51.0, 29.0, 43.0, 40.0, 33.0, 33.0, 19.0, 18.0, 17.0, 13.0, 6.0, 11.0, 8.0, 11.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.5604705810546875, -1.511566162109375, -1.4626617431640625, -1.41375732421875, -1.3648529052734375, -1.315948486328125, -1.2670440673828125, -1.2181396484375, -1.1692352294921875, -1.120330810546875, -1.0714263916015625, -1.02252197265625, -0.9736175537109375, -0.924713134765625, -0.8758087158203125, -0.826904296875, -0.7779998779296875, -0.729095458984375, -0.6801910400390625, -0.63128662109375, -0.5823822021484375, -0.533477783203125, -0.4845733642578125, -0.4356689453125, -0.3867645263671875, -0.337860107421875, -0.2889556884765625, -0.24005126953125, -0.1911468505859375, -0.142242431640625, -0.0933380126953125, -0.04443359375, 0.0044708251953125, 0.053375244140625, 0.1022796630859375, 0.15118408203125, 0.2000885009765625, 0.248992919921875, 0.2978973388671875, 0.3468017578125, 0.3957061767578125, 0.444610595703125, 0.4935150146484375, 0.54241943359375, 0.5913238525390625, 0.640228271484375, 0.6891326904296875, 0.738037109375, 0.7869415283203125, 0.835845947265625, 0.8847503662109375, 0.93365478515625, 0.9825592041015625, 1.031463623046875, 1.0803680419921875, 1.1292724609375, 1.1781768798828125, 1.227081298828125, 1.2759857177734375, 1.32489013671875, 1.3737945556640625, 1.422698974609375, 1.4716033935546875, 1.5205078125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 17.0, 14.0, 11.0, 14.0, 26.0, 35.0, 38.0, 57.0, 68.0, 66.0, 85.0, 80.0, 68.0, 74.0, 76.0, 61.0, 42.0, 36.0, 27.0, 29.0, 14.0, 20.0, 9.0, 6.0, 5.0, 4.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.879331588745117, -22.02912139892578, -21.178913116455078, -20.328702926635742, -19.478492736816406, -18.628284454345703, -17.778074264526367, -16.92786407470703, -16.077655792236328, -15.227446556091309, -14.377236366271973, -13.527027130126953, -12.676817893981934, -11.826608657836914, -10.976398468017578, -10.126189231872559, -9.275979042053223, -8.425769805908203, -7.575560092926025, -6.725350379943848, -5.875141143798828, -5.02493143081665, -4.174721717834473, -3.324512481689453, -2.4743027687072754, -1.6240932941436768, -0.7738837003707886, 0.07632589340209961, 0.9265353679656982, 1.7767448425292969, 2.6269545555114746, 3.477163791656494, 4.327373504638672, 5.17758321762085, 6.027792453765869, 6.878002166748047, 7.728211402893066, 8.578420639038086, 9.428630828857422, 10.278840065002441, 11.129049301147461, 11.97925853729248, 12.829468727111816, 13.679677963256836, 14.529887199401855, 15.380096435546875, 16.23030662536621, 17.080516815185547, 17.93072509765625, 18.780935287475586, 19.63114356994629, 20.481353759765625, 21.33156394958496, 22.181772232055664, 23.031982421875, 23.882190704345703, 24.732402801513672, 25.582612991333008, 26.43282127380371, 27.283031463623047, 28.133241653442383, 28.983449935913086, 29.833660125732422, 30.683868408203125, 31.53407859802246]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 2.0, 8.0, 7.0, 3.0, 7.0, 10.0, 12.0, 16.0, 22.0, 15.0, 10.0, 24.0, 21.0, 26.0, 29.0, 33.0, 40.0, 33.0, 33.0, 39.0, 42.0, 37.0, 38.0, 37.0, 47.0, 36.0, 36.0, 32.0, 24.0, 27.0, 31.0, 22.0, 24.0, 24.0, 18.0, 18.0, 18.0, 10.0, 20.0, 8.0, 15.0, 10.0, 5.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-10.28503704071045, -9.988395690917969, -9.691754341125488, -9.395112991333008, -9.098471641540527, -8.801830291748047, -8.505188941955566, -8.208547592163086, -7.911906719207764, -7.615265369415283, -7.318624019622803, -7.021982669830322, -6.725341796875, -6.4287004470825195, -6.132059097290039, -5.835417747497559, -5.538776397705078, -5.242135047912598, -4.945493698120117, -4.648852348327637, -4.352210998535156, -4.055569648742676, -3.7589287757873535, -3.462287425994873, -3.1656460762023926, -2.869004726409912, -2.5723633766174316, -2.2757222652435303, -1.9790809154510498, -1.6824395656585693, -1.3857983350753784, -1.0891571044921875, -0.7925148010253906, -0.49587351083755493, -0.19923222064971924, 0.09740906953811646, 0.39405035972595215, 0.6906917095184326, 0.9873329401016235, 1.2839741706848145, 1.580615520477295, 1.8772568702697754, 2.173898220062256, 2.4705393314361572, 2.7671806812286377, 3.063822031021118, 3.3604631423950195, 3.6571044921875, 3.9537458419799805, 4.250387191772461, 4.547028541564941, 4.843669891357422, 5.140311241149902, 5.436952590942383, 5.733593463897705, 6.0302348136901855, 6.326876163482666, 6.6235175132751465, 6.920158863067627, 7.216800212860107, 7.51344108581543, 7.81008243560791, 8.10672378540039, 8.403365135192871, 8.700006484985352]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 9.0, 15.0, 12.0, 26.0, 34.0, 33.0, 41.0, 81.0, 131.0, 166.0, 236.0, 348.0, 525.0, 904.0, 1701.0, 3280.0, 6861.0, 15148.0, 34465.0, 75735.0, 150797.0, 231406.0, 232204.0, 152055.0, 77147.0, 35027.0, 15627.0, 6860.0, 3429.0, 1682.0, 932.0, 539.0, 354.0, 221.0, 158.0, 105.0, 68.0, 43.0, 36.0, 31.0, 19.0, 11.0, 17.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-24.234375, -23.477294921875, -22.72021484375, -21.963134765625, -21.2060546875, -20.448974609375, -19.69189453125, -18.934814453125, -18.177734375, -17.420654296875, -16.66357421875, -15.906494140625, -15.1494140625, -14.392333984375, -13.63525390625, -12.878173828125, -12.12109375, -11.364013671875, -10.60693359375, -9.849853515625, -9.0927734375, -8.335693359375, -7.57861328125, -6.821533203125, -6.064453125, -5.307373046875, -4.55029296875, -3.793212890625, -3.0361328125, -2.279052734375, -1.52197265625, -0.764892578125, -0.0078125, 0.749267578125, 1.50634765625, 2.263427734375, 3.0205078125, 3.777587890625, 4.53466796875, 5.291748046875, 6.048828125, 6.805908203125, 7.56298828125, 8.320068359375, 9.0771484375, 9.834228515625, 10.59130859375, 11.348388671875, 12.10546875, 12.862548828125, 13.61962890625, 14.376708984375, 15.1337890625, 15.890869140625, 16.64794921875, 17.405029296875, 18.162109375, 18.919189453125, 19.67626953125, 20.433349609375, 21.1904296875, 21.947509765625, 22.70458984375, 23.461669921875, 24.21875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 11.0, 6.0, 9.0, 17.0, 16.0, 27.0, 30.0, 22.0, 29.0, 45.0, 34.0, 44.0, 45.0, 35.0, 41.0, 36.0, 43.0, 49.0, 42.0, 39.0, 40.0, 39.0, 26.0, 28.0, 31.0, 18.0, 28.0, 21.0, 20.0, 20.0, 13.0, 17.0, 13.0, 8.0, 7.0, 12.0, 3.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.296875, -11.950927734375, -11.60498046875, -11.259033203125, -10.9130859375, -10.567138671875, -10.22119140625, -9.875244140625, -9.529296875, -9.183349609375, -8.83740234375, -8.491455078125, -8.1455078125, -7.799560546875, -7.45361328125, -7.107666015625, -6.76171875, -6.415771484375, -6.06982421875, -5.723876953125, -5.3779296875, -5.031982421875, -4.68603515625, -4.340087890625, -3.994140625, -3.648193359375, -3.30224609375, -2.956298828125, -2.6103515625, -2.264404296875, -1.91845703125, -1.572509765625, -1.2265625, -0.880615234375, -0.53466796875, -0.188720703125, 0.1572265625, 0.503173828125, 0.84912109375, 1.195068359375, 1.541015625, 1.886962890625, 2.23291015625, 2.578857421875, 2.9248046875, 3.270751953125, 3.61669921875, 3.962646484375, 4.30859375, 4.654541015625, 5.00048828125, 5.346435546875, 5.6923828125, 6.038330078125, 6.38427734375, 6.730224609375, 7.076171875, 7.422119140625, 7.76806640625, 8.114013671875, 8.4599609375, 8.805908203125, 9.15185546875, 9.497802734375, 9.84375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 11.0, 10.0, 20.0, 38.0, 57.0, 77.0, 126.0, 165.0, 234.0, 432.0, 598.0, 958.0, 1528.0, 2402.0, 3898.0, 6609.0, 10872.0, 18862.0, 31501.0, 50961.0, 79491.0, 114062.0, 143272.0, 154409.0, 137340.0, 104526.0, 71617.0, 45212.0, 27703.0, 16384.0, 9840.0, 5827.0, 3590.0, 2107.0, 1364.0, 831.0, 533.0, 358.0, 261.0, 163.0, 88.0, 73.0, 53.0, 29.0, 17.0, 18.0, 10.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-15.4453125, -14.9825439453125, -14.519775390625, -14.0570068359375, -13.59423828125, -13.1314697265625, -12.668701171875, -12.2059326171875, -11.7431640625, -11.2803955078125, -10.817626953125, -10.3548583984375, -9.89208984375, -9.4293212890625, -8.966552734375, -8.5037841796875, -8.041015625, -7.5782470703125, -7.115478515625, -6.6527099609375, -6.18994140625, -5.7271728515625, -5.264404296875, -4.8016357421875, -4.3388671875, -3.8760986328125, -3.413330078125, -2.9505615234375, -2.48779296875, -2.0250244140625, -1.562255859375, -1.0994873046875, -0.63671875, -0.1739501953125, 0.288818359375, 0.7515869140625, 1.21435546875, 1.6771240234375, 2.139892578125, 2.6026611328125, 3.0654296875, 3.5281982421875, 3.990966796875, 4.4537353515625, 4.91650390625, 5.3792724609375, 5.842041015625, 6.3048095703125, 6.767578125, 7.2303466796875, 7.693115234375, 8.1558837890625, 8.61865234375, 9.0814208984375, 9.544189453125, 10.0069580078125, 10.4697265625, 10.9324951171875, 11.395263671875, 11.8580322265625, 12.32080078125, 12.7835693359375, 13.246337890625, 13.7091064453125, 14.171875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 7.0, 15.0, 11.0, 4.0, 15.0, 17.0, 18.0, 22.0, 25.0, 26.0, 18.0, 40.0, 31.0, 30.0, 30.0, 31.0, 32.0, 44.0, 41.0, 33.0, 29.0, 53.0, 35.0, 40.0, 27.0, 39.0, 43.0, 33.0, 33.0, 23.0, 27.0, 24.0, 19.0, 7.0, 12.0, 11.0, 7.0, 6.0, 13.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.41015625, -6.21337890625, -6.0166015625, -5.81982421875, -5.623046875, -5.42626953125, -5.2294921875, -5.03271484375, -4.8359375, -4.63916015625, -4.4423828125, -4.24560546875, -4.048828125, -3.85205078125, -3.6552734375, -3.45849609375, -3.26171875, -3.06494140625, -2.8681640625, -2.67138671875, -2.474609375, -2.27783203125, -2.0810546875, -1.88427734375, -1.6875, -1.49072265625, -1.2939453125, -1.09716796875, -0.900390625, -0.70361328125, -0.5068359375, -0.31005859375, -0.11328125, 0.08349609375, 0.2802734375, 0.47705078125, 0.673828125, 0.87060546875, 1.0673828125, 1.26416015625, 1.4609375, 1.65771484375, 1.8544921875, 2.05126953125, 2.248046875, 2.44482421875, 2.6416015625, 2.83837890625, 3.03515625, 3.23193359375, 3.4287109375, 3.62548828125, 3.822265625, 4.01904296875, 4.2158203125, 4.41259765625, 4.609375, 4.80615234375, 5.0029296875, 5.19970703125, 5.396484375, 5.59326171875, 5.7900390625, 5.98681640625, 6.18359375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 20.0, 28.0, 34.0, 35.0, 67.0, 91.0, 141.0, 166.0, 235.0, 313.0, 482.0, 715.0, 1040.0, 1544.0, 2416.0, 3725.0, 6363.0, 11653.0, 22204.0, 43493.0, 89521.0, 177935.0, 260854.0, 206159.0, 107882.0, 52146.0, 25618.0, 13772.0, 7535.0, 4327.0, 2605.0, 1677.0, 1171.0, 743.0, 523.0, 365.0, 310.0, 189.0, 148.0, 94.0, 57.0, 44.0, 25.0, 20.0, 14.0, 17.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8551025390625, -11.468017578125, -11.0809326171875, -10.69384765625, -10.3067626953125, -9.919677734375, -9.5325927734375, -9.1455078125, -8.7584228515625, -8.371337890625, -7.9842529296875, -7.59716796875, -7.2100830078125, -6.822998046875, -6.4359130859375, -6.048828125, -5.6617431640625, -5.274658203125, -4.8875732421875, -4.50048828125, -4.1134033203125, -3.726318359375, -3.3392333984375, -2.9521484375, -2.5650634765625, -2.177978515625, -1.7908935546875, -1.40380859375, -1.0167236328125, -0.629638671875, -0.2425537109375, 0.14453125, 0.5316162109375, 0.918701171875, 1.3057861328125, 1.69287109375, 2.0799560546875, 2.467041015625, 2.8541259765625, 3.2412109375, 3.6282958984375, 4.015380859375, 4.4024658203125, 4.78955078125, 5.1766357421875, 5.563720703125, 5.9508056640625, 6.337890625, 6.7249755859375, 7.112060546875, 7.4991455078125, 7.88623046875, 8.2733154296875, 8.660400390625, 9.0474853515625, 9.4345703125, 9.8216552734375, 10.208740234375, 10.5958251953125, 10.98291015625, 11.3699951171875, 11.757080078125, 12.1441650390625, 12.53125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 16.0, 14.0, 18.0, 22.0, 44.0, 32.0, 79.0, 83.0, 116.0, 128.0, 93.0, 89.0, 78.0, 38.0, 37.0, 17.0, 19.0, 13.0, 6.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017423629760742188, -0.001691579818725586, -0.0016407966613769531, -0.0015900135040283203, -0.0015392303466796875, -0.0014884471893310547, -0.0014376640319824219, -0.001386880874633789, -0.0013360977172851562, -0.0012853145599365234, -0.0012345314025878906, -0.0011837482452392578, -0.001132965087890625, -0.0010821819305419922, -0.0010313987731933594, -0.0009806156158447266, -0.0009298324584960938, -0.0008790493011474609, -0.0008282661437988281, -0.0007774829864501953, -0.0007266998291015625, -0.0006759166717529297, -0.0006251335144042969, -0.0005743503570556641, -0.0005235671997070312, -0.00047278404235839844, -0.0004220008850097656, -0.0003712177276611328, -0.0003204345703125, -0.0002696514129638672, -0.00021886825561523438, -0.00016808509826660156, -0.00011730194091796875, -6.651878356933594e-05, -1.5735626220703125e-05, 3.504753112792969e-05, 8.58306884765625e-05, 0.0001366138458251953, 0.00018739700317382812, 0.00023818016052246094, 0.00028896331787109375, 0.00033974647521972656, 0.0003905296325683594, 0.0004413127899169922, 0.000492095947265625, 0.0005428791046142578, 0.0005936622619628906, 0.0006444454193115234, 0.0006952285766601562, 0.0007460117340087891, 0.0007967948913574219, 0.0008475780487060547, 0.0008983612060546875, 0.0009491443634033203, 0.0009999275207519531, 0.001050710678100586, 0.0011014938354492188, 0.0011522769927978516, 0.0012030601501464844, 0.0012538433074951172, 0.00130462646484375, 0.0013554096221923828, 0.0014061927795410156, 0.0014569759368896484, 0.0015077590942382812]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 11.0, 1.0, 7.0, 12.0, 14.0, 34.0, 60.0, 48.0, 72.0, 116.0, 166.0, 235.0, 304.0, 442.0, 660.0, 972.0, 1549.0, 2572.0, 4522.0, 8827.0, 19355.0, 45028.0, 111724.0, 243822.0, 301712.0, 174452.0, 72739.0, 30012.0, 13330.0, 6479.0, 3387.0, 1984.0, 1280.0, 832.0, 528.0, 352.0, 247.0, 195.0, 131.0, 102.0, 66.0, 50.0, 38.0, 31.0, 19.0, 14.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-15.2578125, -14.8125, -14.3671875, -13.921875, -13.4765625, -13.03125, -12.5859375, -12.140625, -11.6953125, -11.25, -10.8046875, -10.359375, -9.9140625, -9.46875, -9.0234375, -8.578125, -8.1328125, -7.6875, -7.2421875, -6.796875, -6.3515625, -5.90625, -5.4609375, -5.015625, -4.5703125, -4.125, -3.6796875, -3.234375, -2.7890625, -2.34375, -1.8984375, -1.453125, -1.0078125, -0.5625, -0.1171875, 0.328125, 0.7734375, 1.21875, 1.6640625, 2.109375, 2.5546875, 3.0, 3.4453125, 3.890625, 4.3359375, 4.78125, 5.2265625, 5.671875, 6.1171875, 6.5625, 7.0078125, 7.453125, 7.8984375, 8.34375, 8.7890625, 9.234375, 9.6796875, 10.125, 10.5703125, 11.015625, 11.4609375, 11.90625, 12.3515625, 12.796875, 13.2421875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 9.0, 13.0, 6.0, 15.0, 17.0, 19.0, 24.0, 36.0, 39.0, 52.0, 48.0, 58.0, 61.0, 59.0, 57.0, 74.0, 60.0, 56.0, 57.0, 41.0, 33.0, 32.0, 21.0, 14.0, 16.0, 11.0, 10.0, 8.0, 7.0, 8.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.125, -3.034820556640625, -2.94464111328125, -2.854461669921875, -2.7642822265625, -2.674102783203125, -2.58392333984375, -2.493743896484375, -2.403564453125, -2.313385009765625, -2.22320556640625, -2.133026123046875, -2.0428466796875, -1.952667236328125, -1.86248779296875, -1.772308349609375, -1.68212890625, -1.591949462890625, -1.50177001953125, -1.411590576171875, -1.3214111328125, -1.231231689453125, -1.14105224609375, -1.050872802734375, -0.960693359375, -0.870513916015625, -0.78033447265625, -0.690155029296875, -0.5999755859375, -0.509796142578125, -0.41961669921875, -0.329437255859375, -0.2392578125, -0.149078369140625, -0.05889892578125, 0.031280517578125, 0.1214599609375, 0.211639404296875, 0.30181884765625, 0.391998291015625, 0.482177734375, 0.572357177734375, 0.66253662109375, 0.752716064453125, 0.8428955078125, 0.933074951171875, 1.02325439453125, 1.113433837890625, 1.20361328125, 1.293792724609375, 1.38397216796875, 1.474151611328125, 1.5643310546875, 1.654510498046875, 1.74468994140625, 1.834869384765625, 1.925048828125, 2.015228271484375, 2.10540771484375, 2.195587158203125, 2.2857666015625, 2.375946044921875, 2.46612548828125, 2.556304931640625, 2.646484375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 9.0, 5.0, 11.0, 15.0, 10.0, 15.0, 26.0, 32.0, 36.0, 40.0, 36.0, 49.0, 49.0, 66.0, 61.0, 60.0, 80.0, 77.0, 49.0, 42.0, 37.0, 41.0, 27.0, 26.0, 23.0, 25.0, 18.0, 11.0, 6.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.293867111206055, -18.58577537536621, -17.877683639526367, -17.169593811035156, -16.461502075195312, -15.753410339355469, -15.045318603515625, -14.337226867675781, -13.629136085510254, -12.92104434967041, -12.212953567504883, -11.504861831665039, -10.796770095825195, -10.088679313659668, -9.380587577819824, -8.672496795654297, -7.964405059814453, -7.256313800811768, -6.548222541809082, -5.840130805969238, -5.132039546966553, -4.423948287963867, -3.7158565521240234, -3.007765293121338, -2.2996740341186523, -1.5915826559066772, -0.8834912776947021, -0.1753997802734375, 0.532691478729248, 1.2407827377319336, 1.9488744735717773, 2.656965732574463, 3.3650550842285156, 4.073146343231201, 4.781237602233887, 5.4893293380737305, 6.197420597076416, 6.905511856079102, 7.613603591918945, 8.321695327758789, 9.029786109924316, 9.73787784576416, 10.445968627929688, 11.154060363769531, 11.862152099609375, 12.570242881774902, 13.278334617614746, 13.986425399780273, 14.694517135620117, 15.402608871459961, 16.110700607299805, 16.818790435791016, 17.52688217163086, 18.234973907470703, 18.943065643310547, 19.65115737915039, 20.359249114990234, 21.067340850830078, 21.775432586669922, 22.483524322509766, 23.191614151000977, 23.89970588684082, 24.607797622680664, 25.315889358520508, 26.02397918701172]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 6.0, 7.0, 10.0, 5.0, 4.0, 14.0, 10.0, 15.0, 24.0, 22.0, 24.0, 27.0, 19.0, 40.0, 33.0, 36.0, 33.0, 46.0, 37.0, 46.0, 28.0, 35.0, 56.0, 53.0, 43.0, 42.0, 36.0, 31.0, 29.0, 21.0, 26.0, 22.0, 26.0, 14.0, 19.0, 13.0, 9.0, 7.0, 4.0, 8.0, 5.0, 4.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.718064308166504, -9.37883186340332, -9.03959846496582, -8.700366020202637, -8.361133575439453, -8.02190113067627, -7.682668209075928, -7.343435287475586, -7.004202842712402, -6.664970397949219, -6.325737476348877, -5.986504554748535, -5.647272109985352, -5.308039665222168, -4.968806743621826, -4.629573822021484, -4.290341377258301, -3.951108694076538, -3.6118760108947754, -3.2726433277130127, -2.93341064453125, -2.5941779613494873, -2.2549452781677246, -1.915712594985962, -1.5764799118041992, -1.2372472286224365, -0.8980145454406738, -0.5587818622589111, -0.21954917907714844, 0.11968350410461426, 0.45891618728637695, 0.7981488704681396, 1.1373815536499023, 1.476614236831665, 1.8158469200134277, 2.1550796031951904, 2.494312286376953, 2.833544969558716, 3.1727776527404785, 3.512010335922241, 3.851243019104004, 4.1904754638671875, 4.529708385467529, 4.868941307067871, 5.208173751831055, 5.547406196594238, 5.88663911819458, 6.225872039794922, 6.5651044845581055, 6.904336929321289, 7.243569850921631, 7.582802772521973, 7.922035217285156, 8.26126766204834, 8.600500106811523, 8.939733505249023, 9.278965950012207, 9.61819839477539, 9.95743179321289, 10.296664237976074, 10.635896682739258, 10.975129127502441, 11.314361572265625, 11.653594970703125, 11.992827415466309]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 9.0, 10.0, 16.0, 24.0, 27.0, 33.0, 51.0, 66.0, 112.0, 146.0, 217.0, 344.0, 482.0, 836.0, 1163.0, 1852.0, 3073.0, 5224.0, 8874.0, 16601.0, 31389.0, 62480.0, 130923.0, 286982.0, 622053.0, 1053119.0, 970843.0, 528769.0, 242456.0, 110747.0, 53930.0, 27261.0, 14248.0, 8149.0, 4549.0, 2568.0, 1665.0, 1001.0, 665.0, 426.0, 264.0, 215.0, 122.0, 83.0, 70.0, 34.0, 36.0, 24.0, 18.0, 16.0, 9.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.6875, -19.02880859375, -18.3701171875, -17.71142578125, -17.052734375, -16.39404296875, -15.7353515625, -15.07666015625, -14.41796875, -13.75927734375, -13.1005859375, -12.44189453125, -11.783203125, -11.12451171875, -10.4658203125, -9.80712890625, -9.1484375, -8.48974609375, -7.8310546875, -7.17236328125, -6.513671875, -5.85498046875, -5.1962890625, -4.53759765625, -3.87890625, -3.22021484375, -2.5615234375, -1.90283203125, -1.244140625, -0.58544921875, 0.0732421875, 0.73193359375, 1.390625, 2.04931640625, 2.7080078125, 3.36669921875, 4.025390625, 4.68408203125, 5.3427734375, 6.00146484375, 6.66015625, 7.31884765625, 7.9775390625, 8.63623046875, 9.294921875, 9.95361328125, 10.6123046875, 11.27099609375, 11.9296875, 12.58837890625, 13.2470703125, 13.90576171875, 14.564453125, 15.22314453125, 15.8818359375, 16.54052734375, 17.19921875, 17.85791015625, 18.5166015625, 19.17529296875, 19.833984375, 20.49267578125, 21.1513671875, 21.81005859375, 22.46875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0, 8.0, 9.0, 12.0, 10.0, 15.0, 17.0, 21.0, 27.0, 31.0, 32.0, 30.0, 33.0, 38.0, 39.0, 48.0, 50.0, 48.0, 53.0, 49.0, 49.0, 39.0, 38.0, 50.0, 33.0, 29.0, 26.0, 32.0, 22.0, 15.0, 9.0, 14.0, 12.0, 10.0, 14.0, 6.0, 7.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0272216796875, -8.718505859375, -8.4097900390625, -8.10107421875, -7.7923583984375, -7.483642578125, -7.1749267578125, -6.8662109375, -6.5574951171875, -6.248779296875, -5.9400634765625, -5.63134765625, -5.3226318359375, -5.013916015625, -4.7052001953125, -4.396484375, -4.0877685546875, -3.779052734375, -3.4703369140625, -3.16162109375, -2.8529052734375, -2.544189453125, -2.2354736328125, -1.9267578125, -1.6180419921875, -1.309326171875, -1.0006103515625, -0.69189453125, -0.3831787109375, -0.074462890625, 0.2342529296875, 0.54296875, 0.8516845703125, 1.160400390625, 1.4691162109375, 1.77783203125, 2.0865478515625, 2.395263671875, 2.7039794921875, 3.0126953125, 3.3214111328125, 3.630126953125, 3.9388427734375, 4.24755859375, 4.5562744140625, 4.864990234375, 5.1737060546875, 5.482421875, 5.7911376953125, 6.099853515625, 6.4085693359375, 6.71728515625, 7.0260009765625, 7.334716796875, 7.6434326171875, 7.9521484375, 8.2608642578125, 8.569580078125, 8.8782958984375, 9.18701171875, 9.4957275390625, 9.804443359375, 10.1131591796875, 10.421875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 6.0, 9.0, 12.0, 6.0, 19.0, 21.0, 40.0, 60.0, 60.0, 90.0, 146.0, 221.0, 348.0, 536.0, 879.0, 1406.0, 2259.0, 3802.0, 6575.0, 11286.0, 19651.0, 34508.0, 62868.0, 114539.0, 212807.0, 382621.0, 634483.0, 841551.0, 752811.0, 490491.0, 277905.0, 152857.0, 83064.0, 45143.0, 25451.0, 14633.0, 8431.0, 4835.0, 2924.0, 1811.0, 1130.0, 678.0, 449.0, 303.0, 192.0, 119.0, 95.0, 44.0, 38.0, 22.0, 12.0, 13.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.25, -18.643310546875, -18.03662109375, -17.429931640625, -16.8232421875, -16.216552734375, -15.60986328125, -15.003173828125, -14.396484375, -13.789794921875, -13.18310546875, -12.576416015625, -11.9697265625, -11.363037109375, -10.75634765625, -10.149658203125, -9.54296875, -8.936279296875, -8.32958984375, -7.722900390625, -7.1162109375, -6.509521484375, -5.90283203125, -5.296142578125, -4.689453125, -4.082763671875, -3.47607421875, -2.869384765625, -2.2626953125, -1.656005859375, -1.04931640625, -0.442626953125, 0.1640625, 0.770751953125, 1.37744140625, 1.984130859375, 2.5908203125, 3.197509765625, 3.80419921875, 4.410888671875, 5.017578125, 5.624267578125, 6.23095703125, 6.837646484375, 7.4443359375, 8.051025390625, 8.65771484375, 9.264404296875, 9.87109375, 10.477783203125, 11.08447265625, 11.691162109375, 12.2978515625, 12.904541015625, 13.51123046875, 14.117919921875, 14.724609375, 15.331298828125, 15.93798828125, 16.544677734375, 17.1513671875, 17.758056640625, 18.36474609375, 18.971435546875, 19.578125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 13.0, 13.0, 30.0, 22.0, 38.0, 32.0, 52.0, 84.0, 91.0, 119.0, 143.0, 188.0, 235.0, 248.0, 301.0, 269.0, 302.0, 320.0, 264.0, 262.0, 228.0, 177.0, 122.0, 112.0, 116.0, 67.0, 69.0, 30.0, 27.0, 26.0, 21.0, 9.0, 10.0, 8.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.0078125, -7.7862548828125, -7.564697265625, -7.3431396484375, -7.12158203125, -6.9000244140625, -6.678466796875, -6.4569091796875, -6.2353515625, -6.0137939453125, -5.792236328125, -5.5706787109375, -5.34912109375, -5.1275634765625, -4.906005859375, -4.6844482421875, -4.462890625, -4.2413330078125, -4.019775390625, -3.7982177734375, -3.57666015625, -3.3551025390625, -3.133544921875, -2.9119873046875, -2.6904296875, -2.4688720703125, -2.247314453125, -2.0257568359375, -1.80419921875, -1.5826416015625, -1.361083984375, -1.1395263671875, -0.91796875, -0.6964111328125, -0.474853515625, -0.2532958984375, -0.03173828125, 0.1898193359375, 0.411376953125, 0.6329345703125, 0.8544921875, 1.0760498046875, 1.297607421875, 1.5191650390625, 1.74072265625, 1.9622802734375, 2.183837890625, 2.4053955078125, 2.626953125, 2.8485107421875, 3.070068359375, 3.2916259765625, 3.51318359375, 3.7347412109375, 3.956298828125, 4.1778564453125, 4.3994140625, 4.6209716796875, 4.842529296875, 5.0640869140625, 5.28564453125, 5.5072021484375, 5.728759765625, 5.9503173828125, 6.171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 12.0, 9.0, 19.0, 14.0, 17.0, 20.0, 28.0, 18.0, 40.0, 44.0, 51.0, 55.0, 43.0, 46.0, 55.0, 47.0, 56.0, 52.0, 52.0, 48.0, 44.0, 41.0, 24.0, 21.0, 21.0, 25.0, 16.0, 13.0, 8.0, 6.0, 9.0, 4.0, 11.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.998210906982422, -16.371292114257812, -15.744372367858887, -15.117452621459961, -14.490533828735352, -13.863615036010742, -13.236695289611816, -12.60977554321289, -11.982856750488281, -11.355937957763672, -10.729018211364746, -10.10209846496582, -9.475179672241211, -8.848260879516602, -8.221341133117676, -7.594421863555908, -6.967502593994141, -6.340583324432373, -5.7136640548706055, -5.086744785308838, -4.45982551574707, -3.8329062461853027, -3.205986976623535, -2.5790677070617676, -1.9521484375, -1.3252291679382324, -0.6983098983764648, -0.07139062881469727, 0.5555286407470703, 1.182447910308838, 1.8093671798706055, 2.436286449432373, 3.063203811645508, 3.6901230812072754, 4.317042350769043, 4.9439616203308105, 5.570880889892578, 6.197800159454346, 6.824719429016113, 7.451638698577881, 8.078557968139648, 8.705476760864258, 9.332396507263184, 9.95931625366211, 10.586235046386719, 11.213153839111328, 11.840073585510254, 12.46699333190918, 13.093912124633789, 13.720830917358398, 14.347750663757324, 14.97467041015625, 15.60158920288086, 16.22850799560547, 16.855426788330078, 17.48234748840332, 18.10926628112793, 18.73618507385254, 19.36310577392578, 19.99002456665039, 20.616943359375, 21.24386215209961, 21.87078094482422, 22.49770164489746, 23.12462043762207]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 5.0, 6.0, 11.0, 12.0, 11.0, 20.0, 13.0, 16.0, 24.0, 25.0, 20.0, 33.0, 33.0, 46.0, 42.0, 34.0, 42.0, 35.0, 48.0, 45.0, 41.0, 38.0, 36.0, 34.0, 37.0, 38.0, 32.0, 35.0, 24.0, 27.0, 26.0, 17.0, 15.0, 12.0, 15.0, 7.0, 11.0, 10.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6232271194458, -12.234650611877441, -11.846074104309082, -11.457497596740723, -11.06892204284668, -10.68034553527832, -10.291769027709961, -9.903192520141602, -9.514616012573242, -9.126039505004883, -8.737462997436523, -8.348886489868164, -7.960310459136963, -7.5717339515686035, -7.183157920837402, -6.794581413269043, -6.406004905700684, -6.017428398132324, -5.628851890563965, -5.240275859832764, -4.851699352264404, -4.463122844696045, -4.074546813964844, -3.6859703063964844, -3.297393798828125, -2.9088172912597656, -2.5202410221099854, -2.131664752960205, -1.7430882453918457, -1.3545118570327759, -0.965935468673706, -0.5773591995239258, -0.1887836456298828, 0.199792742729187, 0.5883691310882568, 0.9769455194473267, 1.3655219078063965, 1.7540982961654663, 2.142674684524536, 2.5312509536743164, 2.919827461242676, 3.308403968811035, 3.6969802379608154, 4.085556507110596, 4.474133014678955, 4.8627095222473145, 5.251285552978516, 5.639862060546875, 6.028438568115234, 6.417015075683594, 6.805591583251953, 7.194167613983154, 7.582744121551514, 7.971320629119873, 8.359896659851074, 8.748473167419434, 9.137049674987793, 9.525626182556152, 9.914202690124512, 10.302779197692871, 10.691354751586914, 11.079931259155273, 11.468507766723633, 11.857084274291992, 12.245660781860352]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 8.0, 18.0, 44.0, 44.0, 67.0, 84.0, 148.0, 202.0, 306.0, 535.0, 818.0, 1342.0, 2163.0, 3814.0, 6910.0, 13635.0, 30306.0, 76403.0, 188641.0, 310426.0, 234222.0, 101651.0, 40063.0, 17178.0, 8418.0, 4409.0, 2652.0, 1519.0, 870.0, 528.0, 372.0, 237.0, 145.0, 119.0, 66.0, 38.0, 41.0, 27.0, 15.0, 20.0, 5.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.515625, -21.729736328125, -20.94384765625, -20.157958984375, -19.3720703125, -18.586181640625, -17.80029296875, -17.014404296875, -16.228515625, -15.442626953125, -14.65673828125, -13.870849609375, -13.0849609375, -12.299072265625, -11.51318359375, -10.727294921875, -9.94140625, -9.155517578125, -8.36962890625, -7.583740234375, -6.7978515625, -6.011962890625, -5.22607421875, -4.440185546875, -3.654296875, -2.868408203125, -2.08251953125, -1.296630859375, -0.5107421875, 0.275146484375, 1.06103515625, 1.846923828125, 2.6328125, 3.418701171875, 4.20458984375, 4.990478515625, 5.7763671875, 6.562255859375, 7.34814453125, 8.134033203125, 8.919921875, 9.705810546875, 10.49169921875, 11.277587890625, 12.0634765625, 12.849365234375, 13.63525390625, 14.421142578125, 15.20703125, 15.992919921875, 16.77880859375, 17.564697265625, 18.3505859375, 19.136474609375, 19.92236328125, 20.708251953125, 21.494140625, 22.280029296875, 23.06591796875, 23.851806640625, 24.6376953125, 25.423583984375, 26.20947265625, 26.995361328125, 27.78125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 4.0, 13.0, 19.0, 13.0, 21.0, 16.0, 24.0, 23.0, 32.0, 37.0, 33.0, 38.0, 41.0, 44.0, 40.0, 41.0, 32.0, 43.0, 44.0, 42.0, 36.0, 41.0, 39.0, 32.0, 27.0, 25.0, 26.0, 26.0, 23.0, 16.0, 15.0, 10.0, 10.0, 12.0, 11.0, 6.0, 5.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-14.453125, -14.03759765625, -13.6220703125, -13.20654296875, -12.791015625, -12.37548828125, -11.9599609375, -11.54443359375, -11.12890625, -10.71337890625, -10.2978515625, -9.88232421875, -9.466796875, -9.05126953125, -8.6357421875, -8.22021484375, -7.8046875, -7.38916015625, -6.9736328125, -6.55810546875, -6.142578125, -5.72705078125, -5.3115234375, -4.89599609375, -4.48046875, -4.06494140625, -3.6494140625, -3.23388671875, -2.818359375, -2.40283203125, -1.9873046875, -1.57177734375, -1.15625, -0.74072265625, -0.3251953125, 0.09033203125, 0.505859375, 0.92138671875, 1.3369140625, 1.75244140625, 2.16796875, 2.58349609375, 2.9990234375, 3.41455078125, 3.830078125, 4.24560546875, 4.6611328125, 5.07666015625, 5.4921875, 5.90771484375, 6.3232421875, 6.73876953125, 7.154296875, 7.56982421875, 7.9853515625, 8.40087890625, 8.81640625, 9.23193359375, 9.6474609375, 10.06298828125, 10.478515625, 10.89404296875, 11.3095703125, 11.72509765625, 12.140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 9.0, 7.0, 16.0, 18.0, 27.0, 32.0, 54.0, 59.0, 93.0, 116.0, 157.0, 226.0, 333.0, 422.0, 630.0, 928.0, 1436.0, 2473.0, 4365.0, 8644.0, 20467.0, 61866.0, 232867.0, 451484.0, 178812.0, 48238.0, 16795.0, 7581.0, 3820.0, 2255.0, 1423.0, 868.0, 590.0, 416.0, 284.0, 218.0, 125.0, 91.0, 88.0, 50.0, 49.0, 39.0, 24.0, 15.0, 12.0, 7.0, 3.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.40625, -36.21484375, -35.0234375, -33.83203125, -32.640625, -31.44921875, -30.2578125, -29.06640625, -27.875, -26.68359375, -25.4921875, -24.30078125, -23.109375, -21.91796875, -20.7265625, -19.53515625, -18.34375, -17.15234375, -15.9609375, -14.76953125, -13.578125, -12.38671875, -11.1953125, -10.00390625, -8.8125, -7.62109375, -6.4296875, -5.23828125, -4.046875, -2.85546875, -1.6640625, -0.47265625, 0.71875, 1.91015625, 3.1015625, 4.29296875, 5.484375, 6.67578125, 7.8671875, 9.05859375, 10.25, 11.44140625, 12.6328125, 13.82421875, 15.015625, 16.20703125, 17.3984375, 18.58984375, 19.78125, 20.97265625, 22.1640625, 23.35546875, 24.546875, 25.73828125, 26.9296875, 28.12109375, 29.3125, 30.50390625, 31.6953125, 32.88671875, 34.078125, 35.26953125, 36.4609375, 37.65234375, 38.84375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 6.0, 14.0, 12.0, 16.0, 19.0, 19.0, 20.0, 23.0, 35.0, 26.0, 26.0, 40.0, 28.0, 38.0, 38.0, 45.0, 35.0, 47.0, 27.0, 44.0, 41.0, 38.0, 35.0, 35.0, 36.0, 30.0, 31.0, 25.0, 21.0, 17.0, 17.0, 15.0, 8.0, 14.0, 8.0, 5.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-7.62890625, -7.397216796875, -7.16552734375, -6.933837890625, -6.7021484375, -6.470458984375, -6.23876953125, -6.007080078125, -5.775390625, -5.543701171875, -5.31201171875, -5.080322265625, -4.8486328125, -4.616943359375, -4.38525390625, -4.153564453125, -3.921875, -3.690185546875, -3.45849609375, -3.226806640625, -2.9951171875, -2.763427734375, -2.53173828125, -2.300048828125, -2.068359375, -1.836669921875, -1.60498046875, -1.373291015625, -1.1416015625, -0.909912109375, -0.67822265625, -0.446533203125, -0.21484375, 0.016845703125, 0.24853515625, 0.480224609375, 0.7119140625, 0.943603515625, 1.17529296875, 1.406982421875, 1.638671875, 1.870361328125, 2.10205078125, 2.333740234375, 2.5654296875, 2.797119140625, 3.02880859375, 3.260498046875, 3.4921875, 3.723876953125, 3.95556640625, 4.187255859375, 4.4189453125, 4.650634765625, 4.88232421875, 5.114013671875, 5.345703125, 5.577392578125, 5.80908203125, 6.040771484375, 6.2724609375, 6.504150390625, 6.73583984375, 6.967529296875, 7.19921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 12.0, 10.0, 14.0, 21.0, 34.0, 51.0, 59.0, 84.0, 126.0, 180.0, 292.0, 399.0, 584.0, 853.0, 1227.0, 1850.0, 2689.0, 4400.0, 7232.0, 13801.0, 31358.0, 92852.0, 299693.0, 377313.0, 131713.0, 41387.0, 16993.0, 8624.0, 5015.0, 3120.0, 2081.0, 1416.0, 952.0, 625.0, 476.0, 321.0, 209.0, 147.0, 114.0, 81.0, 47.0, 31.0, 20.0, 8.0, 16.0, 10.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.0, -16.487060546875, -15.97412109375, -15.461181640625, -14.9482421875, -14.435302734375, -13.92236328125, -13.409423828125, -12.896484375, -12.383544921875, -11.87060546875, -11.357666015625, -10.8447265625, -10.331787109375, -9.81884765625, -9.305908203125, -8.79296875, -8.280029296875, -7.76708984375, -7.254150390625, -6.7412109375, -6.228271484375, -5.71533203125, -5.202392578125, -4.689453125, -4.176513671875, -3.66357421875, -3.150634765625, -2.6376953125, -2.124755859375, -1.61181640625, -1.098876953125, -0.5859375, -0.072998046875, 0.43994140625, 0.952880859375, 1.4658203125, 1.978759765625, 2.49169921875, 3.004638671875, 3.517578125, 4.030517578125, 4.54345703125, 5.056396484375, 5.5693359375, 6.082275390625, 6.59521484375, 7.108154296875, 7.62109375, 8.134033203125, 8.64697265625, 9.159912109375, 9.6728515625, 10.185791015625, 10.69873046875, 11.211669921875, 11.724609375, 12.237548828125, 12.75048828125, 13.263427734375, 13.7763671875, 14.289306640625, 14.80224609375, 15.315185546875, 15.828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 7.0, 3.0, 2.0, 12.0, 13.0, 18.0, 26.0, 55.0, 76.0, 122.0, 143.0, 142.0, 120.0, 82.0, 55.0, 30.0, 19.0, 16.0, 9.0, 12.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008711814880371094, -0.0008402243256568909, -0.0008092671632766724, -0.0007783100008964539, -0.0007473528385162354, -0.0007163956761360168, -0.0006854385137557983, -0.0006544813513755798, -0.0006235241889953613, -0.0005925670266151428, -0.0005616098642349243, -0.0005306527018547058, -0.0004996955394744873, -0.0004687383770942688, -0.0004377812147140503, -0.0004068240523338318, -0.0003758668899536133, -0.0003449097275733948, -0.00031395256519317627, -0.00028299540281295776, -0.00025203824043273926, -0.00022108107805252075, -0.00019012391567230225, -0.00015916675329208374, -0.00012820959091186523, -9.725242853164673e-05, -6.629526615142822e-05, -3.533810377120972e-05, -4.380941390991211e-06, 2.6576220989227295e-05, 5.75333833694458e-05, 8.84905457496643e-05, 0.00011944770812988281, 0.00015040487051010132, 0.00018136203289031982, 0.00021231919527053833, 0.00024327635765075684, 0.00027423352003097534, 0.00030519068241119385, 0.00033614784479141235, 0.00036710500717163086, 0.00039806216955184937, 0.00042901933193206787, 0.0004599764943122864, 0.0004909336566925049, 0.0005218908190727234, 0.0005528479814529419, 0.0005838051438331604, 0.0006147623062133789, 0.0006457194685935974, 0.0006766766309738159, 0.0007076337933540344, 0.0007385909557342529, 0.0007695481181144714, 0.0008005052804946899, 0.0008314624428749084, 0.000862419605255127, 0.0008933767676353455, 0.000924333930015564, 0.0009552910923957825, 0.000986248254776001, 0.0010172054171562195, 0.001048162579536438, 0.0010791197419166565, 0.001110076904296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 15.0, 31.0, 29.0, 60.0, 97.0, 90.0, 135.0, 179.0, 266.0, 326.0, 498.0, 676.0, 1000.0, 1314.0, 1765.0, 2334.0, 3454.0, 4993.0, 7652.0, 13254.0, 29506.0, 85327.0, 242484.0, 351801.0, 184129.0, 60911.0, 22694.0, 11171.0, 6525.0, 4509.0, 3119.0, 2280.0, 1541.0, 1168.0, 889.0, 676.0, 458.0, 349.0, 230.0, 159.0, 121.0, 86.0, 64.0, 52.0, 37.0, 18.0, 16.0, 9.0, 10.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0], "bins": [-15.1171875, -14.635009765625, -14.15283203125, -13.670654296875, -13.1884765625, -12.706298828125, -12.22412109375, -11.741943359375, -11.259765625, -10.777587890625, -10.29541015625, -9.813232421875, -9.3310546875, -8.848876953125, -8.36669921875, -7.884521484375, -7.40234375, -6.920166015625, -6.43798828125, -5.955810546875, -5.4736328125, -4.991455078125, -4.50927734375, -4.027099609375, -3.544921875, -3.062744140625, -2.58056640625, -2.098388671875, -1.6162109375, -1.134033203125, -0.65185546875, -0.169677734375, 0.3125, 0.794677734375, 1.27685546875, 1.759033203125, 2.2412109375, 2.723388671875, 3.20556640625, 3.687744140625, 4.169921875, 4.652099609375, 5.13427734375, 5.616455078125, 6.0986328125, 6.580810546875, 7.06298828125, 7.545166015625, 8.02734375, 8.509521484375, 8.99169921875, 9.473876953125, 9.9560546875, 10.438232421875, 10.92041015625, 11.402587890625, 11.884765625, 12.366943359375, 12.84912109375, 13.331298828125, 13.8134765625, 14.295654296875, 14.77783203125, 15.260009765625, 15.7421875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 10.0, 18.0, 20.0, 33.0, 61.0, 108.0, 126.0, 135.0, 143.0, 120.0, 60.0, 44.0, 22.0, 17.0, 9.0, 10.0, 3.0, 4.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.8157958984375, -4.635498046875, -4.4552001953125, -4.27490234375, -4.0946044921875, -3.914306640625, -3.7340087890625, -3.5537109375, -3.3734130859375, -3.193115234375, -3.0128173828125, -2.83251953125, -2.6522216796875, -2.471923828125, -2.2916259765625, -2.111328125, -1.9310302734375, -1.750732421875, -1.5704345703125, -1.39013671875, -1.2098388671875, -1.029541015625, -0.8492431640625, -0.6689453125, -0.4886474609375, -0.308349609375, -0.1280517578125, 0.05224609375, 0.2325439453125, 0.412841796875, 0.5931396484375, 0.7734375, 0.9537353515625, 1.134033203125, 1.3143310546875, 1.49462890625, 1.6749267578125, 1.855224609375, 2.0355224609375, 2.2158203125, 2.3961181640625, 2.576416015625, 2.7567138671875, 2.93701171875, 3.1173095703125, 3.297607421875, 3.4779052734375, 3.658203125, 3.8385009765625, 4.018798828125, 4.1990966796875, 4.37939453125, 4.5596923828125, 4.739990234375, 4.9202880859375, 5.1005859375, 5.2808837890625, 5.461181640625, 5.6414794921875, 5.82177734375, 6.0020751953125, 6.182373046875, 6.3626708984375, 6.54296875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 2.0, 13.0, 11.0, 12.0, 16.0, 18.0, 15.0, 24.0, 23.0, 35.0, 39.0, 46.0, 58.0, 59.0, 54.0, 64.0, 48.0, 69.0, 62.0, 57.0, 43.0, 45.0, 29.0, 27.0, 40.0, 22.0, 17.0, 3.0, 8.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.16149139404297, -19.467941284179688, -18.774391174316406, -18.080839157104492, -17.38728904724121, -16.69373893737793, -16.000186920166016, -15.306636810302734, -14.613086700439453, -13.919536590576172, -13.225985527038574, -12.532434463500977, -11.838884353637695, -11.145334243774414, -10.451783180236816, -9.758232116699219, -9.064682006835938, -8.371131896972656, -7.677580833435059, -6.984030246734619, -6.29047966003418, -5.59692907333374, -4.903378486633301, -4.209827899932861, -3.516277313232422, -2.8227267265319824, -2.129176139831543, -1.4356255531311035, -0.7420749664306641, -0.04852437973022461, 0.6450262069702148, 1.3385767936706543, 2.0321273803710938, 2.725677967071533, 3.4192285537719727, 4.112779140472412, 4.806329727172852, 5.499880313873291, 6.1934309005737305, 6.88698148727417, 7.580532073974609, 8.27408218383789, 8.967633247375488, 9.661184310913086, 10.354734420776367, 11.048284530639648, 11.741835594177246, 12.435386657714844, 13.128936767578125, 13.822486877441406, 14.516037940979004, 15.209589004516602, 15.903139114379883, 16.596689224243164, 17.290241241455078, 17.98379135131836, 18.67734146118164, 19.370891571044922, 20.064441680908203, 20.757993698120117, 21.4515438079834, 22.14509391784668, 22.838645935058594, 23.532196044921875, 24.225746154785156]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 6.0, 5.0, 8.0, 13.0, 9.0, 12.0, 12.0, 15.0, 22.0, 24.0, 19.0, 33.0, 27.0, 32.0, 38.0, 46.0, 34.0, 41.0, 42.0, 37.0, 39.0, 32.0, 47.0, 34.0, 38.0, 34.0, 43.0, 37.0, 30.0, 25.0, 28.0, 17.0, 26.0, 12.0, 17.0, 13.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.440733909606934, -12.069839477539062, -11.698945045471191, -11.32805061340332, -10.957157135009766, -10.586262702941895, -10.215368270874023, -9.844473838806152, -9.473579406738281, -9.10268497467041, -8.731790542602539, -8.360896110534668, -7.990002155303955, -7.619107723236084, -7.248213768005371, -6.8773193359375, -6.506424903869629, -6.135530471801758, -5.764636039733887, -5.393742084503174, -5.022847652435303, -4.651953220367432, -4.281059265136719, -3.9101648330688477, -3.5392704010009766, -3.1683759689331055, -2.7974817752838135, -2.4265875816345215, -2.0556931495666504, -1.6847988367080688, -1.3139045238494873, -0.9430103302001953, -0.5721149444580078, -0.20122063159942627, 0.16967368125915527, 0.5405679941177368, 0.9114623069763184, 1.2823566198349, 1.6532509326934814, 2.0241451263427734, 2.3950395584106445, 2.7659339904785156, 3.1368281841278076, 3.5077223777770996, 3.8786168098449707, 4.249511241912842, 4.620405197143555, 4.991299629211426, 5.362194061279297, 5.733088493347168, 6.103982925415039, 6.474876880645752, 6.845771312713623, 7.216665744781494, 7.587559700012207, 7.958454132080078, 8.32934856414795, 8.70024299621582, 9.071137428283691, 9.442031860351562, 9.812925338745117, 10.183819770812988, 10.55471420288086, 10.92560863494873, 11.296503067016602]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 12.0, 20.0, 22.0, 24.0, 52.0, 70.0, 119.0, 172.0, 288.0, 394.0, 654.0, 998.0, 1620.0, 2649.0, 4147.0, 6606.0, 10747.0, 16956.0, 26570.0, 40557.0, 61366.0, 85718.0, 112100.0, 130219.0, 133303.0, 119228.0, 94835.0, 68534.0, 46980.0, 30792.0, 19592.0, 12397.0, 7808.0, 4811.0, 3105.0, 1956.0, 1155.0, 717.0, 449.0, 265.0, 174.0, 123.0, 88.0, 45.0, 38.0, 26.0, 16.0, 9.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-12.296875, -11.91455078125, -11.5322265625, -11.14990234375, -10.767578125, -10.38525390625, -10.0029296875, -9.62060546875, -9.23828125, -8.85595703125, -8.4736328125, -8.09130859375, -7.708984375, -7.32666015625, -6.9443359375, -6.56201171875, -6.1796875, -5.79736328125, -5.4150390625, -5.03271484375, -4.650390625, -4.26806640625, -3.8857421875, -3.50341796875, -3.12109375, -2.73876953125, -2.3564453125, -1.97412109375, -1.591796875, -1.20947265625, -0.8271484375, -0.44482421875, -0.0625, 0.31982421875, 0.7021484375, 1.08447265625, 1.466796875, 1.84912109375, 2.2314453125, 2.61376953125, 2.99609375, 3.37841796875, 3.7607421875, 4.14306640625, 4.525390625, 4.90771484375, 5.2900390625, 5.67236328125, 6.0546875, 6.43701171875, 6.8193359375, 7.20166015625, 7.583984375, 7.96630859375, 8.3486328125, 8.73095703125, 9.11328125, 9.49560546875, 9.8779296875, 10.26025390625, 10.642578125, 11.02490234375, 11.4072265625, 11.78955078125, 12.171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 11.0, 6.0, 10.0, 14.0, 14.0, 14.0, 27.0, 19.0, 28.0, 26.0, 29.0, 41.0, 30.0, 32.0, 39.0, 35.0, 51.0, 46.0, 53.0, 40.0, 42.0, 37.0, 41.0, 44.0, 37.0, 38.0, 33.0, 14.0, 23.0, 15.0, 24.0, 16.0, 12.0, 19.0, 1.0, 4.0, 9.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.5404052734375, -12.127685546875, -11.7149658203125, -11.30224609375, -10.8895263671875, -10.476806640625, -10.0640869140625, -9.6513671875, -9.2386474609375, -8.825927734375, -8.4132080078125, -8.00048828125, -7.5877685546875, -7.175048828125, -6.7623291015625, -6.349609375, -5.9368896484375, -5.524169921875, -5.1114501953125, -4.69873046875, -4.2860107421875, -3.873291015625, -3.4605712890625, -3.0478515625, -2.6351318359375, -2.222412109375, -1.8096923828125, -1.39697265625, -0.9842529296875, -0.571533203125, -0.1588134765625, 0.25390625, 0.6666259765625, 1.079345703125, 1.4920654296875, 1.90478515625, 2.3175048828125, 2.730224609375, 3.1429443359375, 3.5556640625, 3.9683837890625, 4.381103515625, 4.7938232421875, 5.20654296875, 5.6192626953125, 6.031982421875, 6.4447021484375, 6.857421875, 7.2701416015625, 7.682861328125, 8.0955810546875, 8.50830078125, 8.9210205078125, 9.333740234375, 9.7464599609375, 10.1591796875, 10.5718994140625, 10.984619140625, 11.3973388671875, 11.81005859375, 12.2227783203125, 12.635498046875, 13.0482177734375, 13.4609375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 12.0, 11.0, 17.0, 36.0, 45.0, 78.0, 96.0, 136.0, 222.0, 303.0, 490.0, 722.0, 1178.0, 1883.0, 2842.0, 4403.0, 7068.0, 10501.0, 16721.0, 26065.0, 38732.0, 57043.0, 79537.0, 101494.0, 120792.0, 127239.0, 118298.0, 99168.0, 75310.0, 53637.0, 36821.0, 23955.0, 15437.0, 10225.0, 6396.0, 4224.0, 2662.0, 1617.0, 1108.0, 700.0, 489.0, 259.0, 190.0, 134.0, 85.0, 60.0, 40.0, 20.0, 16.0, 10.0, 12.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.984375, -10.634765625, -10.28515625, -9.935546875, -9.5859375, -9.236328125, -8.88671875, -8.537109375, -8.1875, -7.837890625, -7.48828125, -7.138671875, -6.7890625, -6.439453125, -6.08984375, -5.740234375, -5.390625, -5.041015625, -4.69140625, -4.341796875, -3.9921875, -3.642578125, -3.29296875, -2.943359375, -2.59375, -2.244140625, -1.89453125, -1.544921875, -1.1953125, -0.845703125, -0.49609375, -0.146484375, 0.203125, 0.552734375, 0.90234375, 1.251953125, 1.6015625, 1.951171875, 2.30078125, 2.650390625, 3.0, 3.349609375, 3.69921875, 4.048828125, 4.3984375, 4.748046875, 5.09765625, 5.447265625, 5.796875, 6.146484375, 6.49609375, 6.845703125, 7.1953125, 7.544921875, 7.89453125, 8.244140625, 8.59375, 8.943359375, 9.29296875, 9.642578125, 9.9921875, 10.341796875, 10.69140625, 11.041015625, 11.390625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 5.0, 7.0, 5.0, 11.0, 13.0, 21.0, 15.0, 22.0, 26.0, 37.0, 33.0, 24.0, 37.0, 46.0, 38.0, 46.0, 32.0, 30.0, 37.0, 32.0, 49.0, 29.0, 41.0, 30.0, 31.0, 32.0, 42.0, 24.0, 29.0, 26.0, 20.0, 17.0, 13.0, 8.0, 20.0, 11.0, 7.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.4921875, -7.26995849609375, -7.0477294921875, -6.82550048828125, -6.603271484375, -6.38104248046875, -6.1588134765625, -5.93658447265625, -5.71435546875, -5.49212646484375, -5.2698974609375, -5.04766845703125, -4.825439453125, -4.60321044921875, -4.3809814453125, -4.15875244140625, -3.9365234375, -3.71429443359375, -3.4920654296875, -3.26983642578125, -3.047607421875, -2.82537841796875, -2.6031494140625, -2.38092041015625, -2.15869140625, -1.93646240234375, -1.7142333984375, -1.49200439453125, -1.269775390625, -1.04754638671875, -0.8253173828125, -0.60308837890625, -0.380859375, -0.15863037109375, 0.0635986328125, 0.28582763671875, 0.508056640625, 0.73028564453125, 0.9525146484375, 1.17474365234375, 1.39697265625, 1.61920166015625, 1.8414306640625, 2.06365966796875, 2.285888671875, 2.50811767578125, 2.7303466796875, 2.95257568359375, 3.1748046875, 3.39703369140625, 3.6192626953125, 3.84149169921875, 4.063720703125, 4.28594970703125, 4.5081787109375, 4.73040771484375, 4.95263671875, 5.17486572265625, 5.3970947265625, 5.61932373046875, 5.841552734375, 6.06378173828125, 6.2860107421875, 6.50823974609375, 6.73046875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 9.0, 12.0, 10.0, 17.0, 31.0, 38.0, 78.0, 97.0, 139.0, 224.0, 294.0, 411.0, 683.0, 1012.0, 1532.0, 2437.0, 3805.0, 6075.0, 9750.0, 15544.0, 25139.0, 39473.0, 60272.0, 88270.0, 117255.0, 139236.0, 141343.0, 122371.0, 92680.0, 64914.0, 42664.0, 27100.0, 16959.0, 10397.0, 6417.0, 4220.0, 2743.0, 1734.0, 1074.0, 687.0, 445.0, 327.0, 201.0, 133.0, 104.0, 63.0, 41.0, 25.0, 13.0, 17.0, 10.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0], "bins": [-6.19921875, -6.0118408203125, -5.824462890625, -5.6370849609375, -5.44970703125, -5.2623291015625, -5.074951171875, -4.8875732421875, -4.7001953125, -4.5128173828125, -4.325439453125, -4.1380615234375, -3.95068359375, -3.7633056640625, -3.575927734375, -3.3885498046875, -3.201171875, -3.0137939453125, -2.826416015625, -2.6390380859375, -2.45166015625, -2.2642822265625, -2.076904296875, -1.8895263671875, -1.7021484375, -1.5147705078125, -1.327392578125, -1.1400146484375, -0.95263671875, -0.7652587890625, -0.577880859375, -0.3905029296875, -0.203125, -0.0157470703125, 0.171630859375, 0.3590087890625, 0.54638671875, 0.7337646484375, 0.921142578125, 1.1085205078125, 1.2958984375, 1.4832763671875, 1.670654296875, 1.8580322265625, 2.04541015625, 2.2327880859375, 2.420166015625, 2.6075439453125, 2.794921875, 2.9822998046875, 3.169677734375, 3.3570556640625, 3.54443359375, 3.7318115234375, 3.919189453125, 4.1065673828125, 4.2939453125, 4.4813232421875, 4.668701171875, 4.8560791015625, 5.04345703125, 5.2308349609375, 5.418212890625, 5.6055908203125, 5.79296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 3.0, 14.0, 10.0, 15.0, 19.0, 15.0, 30.0, 35.0, 44.0, 49.0, 58.0, 62.0, 71.0, 82.0, 76.0, 77.0, 57.0, 48.0, 42.0, 36.0, 40.0, 26.0, 21.0, 15.0, 15.0, 9.0, 8.0, 6.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008788108825683594, -0.0008503124117851257, -0.0008218139410018921, -0.0007933154702186584, -0.0007648169994354248, -0.0007363185286521912, -0.0007078200578689575, -0.0006793215870857239, -0.0006508231163024902, -0.0006223246455192566, -0.000593826174736023, -0.0005653277039527893, -0.0005368292331695557, -0.000508330762386322, -0.0004798322916030884, -0.00045133382081985474, -0.0004228353500366211, -0.00039433687925338745, -0.0003658384084701538, -0.00033733993768692017, -0.0003088414669036865, -0.0002803429961204529, -0.00025184452533721924, -0.0002233460545539856, -0.00019484758377075195, -0.0001663491129875183, -0.00013785064220428467, -0.00010935217142105103, -8.085370063781738e-05, -5.235522985458374e-05, -2.3856759071350098e-05, 4.641711711883545e-06, 3.314018249511719e-05, 6.163865327835083e-05, 9.013712406158447e-05, 0.00011863559484481812, 0.00014713406562805176, 0.0001756325364112854, 0.00020413100719451904, 0.00023262947797775269, 0.00026112794876098633, 0.00028962641954421997, 0.0003181248903274536, 0.00034662336111068726, 0.0003751218318939209, 0.00040362030267715454, 0.0004321187734603882, 0.0004606172442436218, 0.0004891157150268555, 0.0005176141858100891, 0.0005461126565933228, 0.0005746111273765564, 0.00060310959815979, 0.0006316080689430237, 0.0006601065397262573, 0.000688605010509491, 0.0007171034812927246, 0.0007456019520759583, 0.0007741004228591919, 0.0008025988936424255, 0.0008310973644256592, 0.0008595958352088928, 0.0008880943059921265, 0.0009165927767753601, 0.0009450912475585938]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 11.0, 18.0, 26.0, 27.0, 52.0, 70.0, 112.0, 194.0, 313.0, 452.0, 713.0, 1133.0, 1801.0, 2911.0, 5053.0, 7676.0, 13016.0, 20967.0, 33646.0, 52131.0, 77653.0, 106268.0, 131775.0, 141052.0, 130608.0, 105571.0, 77126.0, 51866.0, 32834.0, 20423.0, 12657.0, 7724.0, 4749.0, 2900.0, 1864.0, 1172.0, 705.0, 472.0, 302.0, 194.0, 131.0, 73.0, 49.0, 25.0, 9.0, 13.0, 5.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-6.5625, -6.3721923828125, -6.181884765625, -5.9915771484375, -5.80126953125, -5.6109619140625, -5.420654296875, -5.2303466796875, -5.0400390625, -4.8497314453125, -4.659423828125, -4.4691162109375, -4.27880859375, -4.0885009765625, -3.898193359375, -3.7078857421875, -3.517578125, -3.3272705078125, -3.136962890625, -2.9466552734375, -2.75634765625, -2.5660400390625, -2.375732421875, -2.1854248046875, -1.9951171875, -1.8048095703125, -1.614501953125, -1.4241943359375, -1.23388671875, -1.0435791015625, -0.853271484375, -0.6629638671875, -0.47265625, -0.2823486328125, -0.092041015625, 0.0982666015625, 0.28857421875, 0.4788818359375, 0.669189453125, 0.8594970703125, 1.0498046875, 1.2401123046875, 1.430419921875, 1.6207275390625, 1.81103515625, 2.0013427734375, 2.191650390625, 2.3819580078125, 2.572265625, 2.7625732421875, 2.952880859375, 3.1431884765625, 3.33349609375, 3.5238037109375, 3.714111328125, 3.9044189453125, 4.0947265625, 4.2850341796875, 4.475341796875, 4.6656494140625, 4.85595703125, 5.0462646484375, 5.236572265625, 5.4268798828125, 5.6171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 11.0, 11.0, 12.0, 7.0, 16.0, 14.0, 15.0, 16.0, 18.0, 27.0, 22.0, 38.0, 30.0, 39.0, 33.0, 54.0, 35.0, 44.0, 41.0, 44.0, 39.0, 50.0, 52.0, 36.0, 29.0, 30.0, 25.0, 29.0, 35.0, 23.0, 12.0, 19.0, 16.0, 16.0, 10.0, 8.0, 7.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.5979766845703125, -1.546539306640625, -1.4951019287109375, -1.44366455078125, -1.3922271728515625, -1.340789794921875, -1.2893524169921875, -1.2379150390625, -1.1864776611328125, -1.135040283203125, -1.0836029052734375, -1.03216552734375, -0.9807281494140625, -0.929290771484375, -0.8778533935546875, -0.826416015625, -0.7749786376953125, -0.723541259765625, -0.6721038818359375, -0.62066650390625, -0.5692291259765625, -0.517791748046875, -0.4663543701171875, -0.4149169921875, -0.3634796142578125, -0.312042236328125, -0.2606048583984375, -0.20916748046875, -0.1577301025390625, -0.106292724609375, -0.0548553466796875, -0.00341796875, 0.0480194091796875, 0.099456787109375, 0.1508941650390625, 0.20233154296875, 0.2537689208984375, 0.305206298828125, 0.3566436767578125, 0.4080810546875, 0.4595184326171875, 0.510955810546875, 0.5623931884765625, 0.61383056640625, 0.6652679443359375, 0.716705322265625, 0.7681427001953125, 0.819580078125, 0.8710174560546875, 0.922454833984375, 0.9738922119140625, 1.02532958984375, 1.0767669677734375, 1.128204345703125, 1.1796417236328125, 1.2310791015625, 1.2825164794921875, 1.333953857421875, 1.3853912353515625, 1.43682861328125, 1.4882659912109375, 1.539703369140625, 1.5911407470703125, 1.642578125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 12.0, 10.0, 15.0, 13.0, 16.0, 26.0, 21.0, 34.0, 31.0, 48.0, 46.0, 57.0, 50.0, 60.0, 52.0, 60.0, 56.0, 59.0, 39.0, 40.0, 39.0, 44.0, 28.0, 21.0, 22.0, 16.0, 16.0, 12.0, 11.0, 4.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.861387252807617, -18.211864471435547, -17.562341690063477, -16.912818908691406, -16.263296127319336, -15.613773345947266, -14.964249610900879, -14.314726829528809, -13.665204048156738, -13.015681266784668, -12.366158485412598, -11.716635704040527, -11.06711196899414, -10.41758918762207, -9.76806640625, -9.11854362487793, -8.46902084350586, -7.819498062133789, -7.169975280761719, -6.52045202255249, -5.87092924118042, -5.22140645980835, -4.571883201599121, -3.922360420227051, -3.2728376388549805, -2.62331485748291, -1.9737918376922607, -1.3242689371109009, -0.674746036529541, -0.025223255157470703, 0.6242997646331787, 1.2738227844238281, 1.9233474731445312, 2.5728702545166016, 3.222393274307251, 3.8719162940979004, 4.521439075469971, 5.170961856842041, 5.8204851150512695, 6.47000789642334, 7.11953067779541, 7.7690534591674805, 8.41857624053955, 9.068099021911621, 9.717622756958008, 10.367145538330078, 11.016668319702148, 11.666191101074219, 12.315713882446289, 12.96523666381836, 13.61475944519043, 14.2642822265625, 14.91380500793457, 15.56332778930664, 16.21285057067871, 16.86237335205078, 17.511898040771484, 18.161420822143555, 18.810943603515625, 19.460466384887695, 20.109989166259766, 20.759511947631836, 21.409034729003906, 22.05855941772461, 22.708080291748047]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 10.0, 7.0, 5.0, 6.0, 3.0, 12.0, 9.0, 4.0, 10.0, 19.0, 17.0, 16.0, 27.0, 23.0, 22.0, 24.0, 27.0, 33.0, 37.0, 39.0, 33.0, 39.0, 44.0, 40.0, 33.0, 40.0, 29.0, 31.0, 37.0, 37.0, 27.0, 36.0, 37.0, 26.0, 29.0, 18.0, 17.0, 18.0, 12.0, 5.0, 14.0, 17.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.427643775939941, -10.08294677734375, -9.738249778747559, -9.393552780151367, -9.048856735229492, -8.7041597366333, -8.35946273803711, -8.014765739440918, -7.670069217681885, -7.325372219085693, -6.98067569732666, -6.635978698730469, -6.291281700134277, -5.946585178375244, -5.601888179779053, -5.2571916580200195, -4.912494659423828, -4.567797660827637, -4.2231011390686035, -3.878404140472412, -3.5337073802948, -3.1890106201171875, -2.844313621520996, -2.499616861343384, -2.1549201011657715, -1.8102233409881592, -1.4655264616012573, -1.1208295822143555, -0.7761328220367432, -0.43143606185913086, -0.08673906326293945, 0.25795769691467285, 0.6026544570922852, 0.9473512768745422, 1.2920480966567993, 1.6367449760437012, 1.9814417362213135, 2.326138496398926, 2.670835494995117, 3.0155322551727295, 3.360229015350342, 3.704925775527954, 4.049622535705566, 4.394319534301758, 4.739016532897949, 5.083713054656982, 5.428410053253174, 5.773106575012207, 6.117803573608398, 6.46250057220459, 6.807197093963623, 7.1518940925598145, 7.496590614318848, 7.841287612915039, 8.18598461151123, 8.530681610107422, 8.875377655029297, 9.220074653625488, 9.56477165222168, 9.909467697143555, 10.254164695739746, 10.598861694335938, 10.943558692932129, 11.28825569152832, 11.632952690124512]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 8.0, 17.0, 22.0, 29.0, 54.0, 72.0, 138.0, 171.0, 280.0, 478.0, 658.0, 1117.0, 1729.0, 2736.0, 4569.0, 7500.0, 13447.0, 25143.0, 49314.0, 101181.0, 219686.0, 475639.0, 882281.0, 1043729.0, 701520.0, 346834.0, 159304.0, 74740.0, 37003.0, 19018.0, 10308.0, 5939.0, 3506.0, 2097.0, 1371.0, 869.0, 555.0, 377.0, 249.0, 164.0, 118.0, 95.0, 64.0, 47.0, 28.0, 22.0, 20.0, 11.0, 7.0, 2.0, 1.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.935791015625, -19.23095703125, -18.526123046875, -17.8212890625, -17.116455078125, -16.41162109375, -15.706787109375, -15.001953125, -14.297119140625, -13.59228515625, -12.887451171875, -12.1826171875, -11.477783203125, -10.77294921875, -10.068115234375, -9.36328125, -8.658447265625, -7.95361328125, -7.248779296875, -6.5439453125, -5.839111328125, -5.13427734375, -4.429443359375, -3.724609375, -3.019775390625, -2.31494140625, -1.610107421875, -0.9052734375, -0.200439453125, 0.50439453125, 1.209228515625, 1.9140625, 2.618896484375, 3.32373046875, 4.028564453125, 4.7333984375, 5.438232421875, 6.14306640625, 6.847900390625, 7.552734375, 8.257568359375, 8.96240234375, 9.667236328125, 10.3720703125, 11.076904296875, 11.78173828125, 12.486572265625, 13.19140625, 13.896240234375, 14.60107421875, 15.305908203125, 16.0107421875, 16.715576171875, 17.42041015625, 18.125244140625, 18.830078125, 19.534912109375, 20.23974609375, 20.944580078125, 21.6494140625, 22.354248046875, 23.05908203125, 23.763916015625, 24.46875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 10.0, 8.0, 8.0, 11.0, 12.0, 11.0, 14.0, 28.0, 20.0, 23.0, 25.0, 28.0, 30.0, 31.0, 43.0, 29.0, 37.0, 44.0, 49.0, 49.0, 35.0, 34.0, 38.0, 44.0, 42.0, 45.0, 25.0, 31.0, 36.0, 23.0, 22.0, 15.0, 18.0, 16.0, 12.0, 13.0, 8.0, 6.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.359375, -9.0513916015625, -8.743408203125, -8.4354248046875, -8.12744140625, -7.8194580078125, -7.511474609375, -7.2034912109375, -6.8955078125, -6.5875244140625, -6.279541015625, -5.9715576171875, -5.66357421875, -5.3555908203125, -5.047607421875, -4.7396240234375, -4.431640625, -4.1236572265625, -3.815673828125, -3.5076904296875, -3.19970703125, -2.8917236328125, -2.583740234375, -2.2757568359375, -1.9677734375, -1.6597900390625, -1.351806640625, -1.0438232421875, -0.73583984375, -0.4278564453125, -0.119873046875, 0.1881103515625, 0.49609375, 0.8040771484375, 1.112060546875, 1.4200439453125, 1.72802734375, 2.0360107421875, 2.343994140625, 2.6519775390625, 2.9599609375, 3.2679443359375, 3.575927734375, 3.8839111328125, 4.19189453125, 4.4998779296875, 4.807861328125, 5.1158447265625, 5.423828125, 5.7318115234375, 6.039794921875, 6.3477783203125, 6.65576171875, 6.9637451171875, 7.271728515625, 7.5797119140625, 7.8876953125, 8.1956787109375, 8.503662109375, 8.8116455078125, 9.11962890625, 9.4276123046875, 9.735595703125, 10.0435791015625, 10.3515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 12.0, 17.0, 21.0, 48.0, 45.0, 61.0, 109.0, 150.0, 251.0, 354.0, 563.0, 898.0, 1407.0, 2147.0, 3647.0, 6040.0, 9870.0, 16943.0, 29287.0, 51554.0, 92424.0, 166679.0, 297522.0, 501227.0, 728089.0, 790793.0, 611937.0, 382971.0, 218117.0, 121613.0, 67545.0, 37791.0, 21606.0, 12694.0, 7507.0, 4521.0, 2772.0, 1826.0, 1176.0, 660.0, 459.0, 307.0, 184.0, 144.0, 95.0, 68.0, 44.0, 25.0, 26.0, 18.0, 13.0, 3.0, 5.0, 1.0, 2.0, 2.0], "bins": [-21.09375, -20.458984375, -19.82421875, -19.189453125, -18.5546875, -17.919921875, -17.28515625, -16.650390625, -16.015625, -15.380859375, -14.74609375, -14.111328125, -13.4765625, -12.841796875, -12.20703125, -11.572265625, -10.9375, -10.302734375, -9.66796875, -9.033203125, -8.3984375, -7.763671875, -7.12890625, -6.494140625, -5.859375, -5.224609375, -4.58984375, -3.955078125, -3.3203125, -2.685546875, -2.05078125, -1.416015625, -0.78125, -0.146484375, 0.48828125, 1.123046875, 1.7578125, 2.392578125, 3.02734375, 3.662109375, 4.296875, 4.931640625, 5.56640625, 6.201171875, 6.8359375, 7.470703125, 8.10546875, 8.740234375, 9.375, 10.009765625, 10.64453125, 11.279296875, 11.9140625, 12.548828125, 13.18359375, 13.818359375, 14.453125, 15.087890625, 15.72265625, 16.357421875, 16.9921875, 17.626953125, 18.26171875, 18.896484375, 19.53125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 11.0, 19.0, 21.0, 29.0, 37.0, 39.0, 66.0, 75.0, 97.0, 119.0, 163.0, 215.0, 242.0, 275.0, 314.0, 314.0, 311.0, 309.0, 278.0, 243.0, 184.0, 175.0, 124.0, 106.0, 88.0, 62.0, 38.0, 32.0, 20.0, 10.0, 11.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.3125, -9.05865478515625, -8.8048095703125, -8.55096435546875, -8.297119140625, -8.04327392578125, -7.7894287109375, -7.53558349609375, -7.28173828125, -7.02789306640625, -6.7740478515625, -6.52020263671875, -6.266357421875, -6.01251220703125, -5.7586669921875, -5.50482177734375, -5.2509765625, -4.99713134765625, -4.7432861328125, -4.48944091796875, -4.235595703125, -3.98175048828125, -3.7279052734375, -3.47406005859375, -3.22021484375, -2.96636962890625, -2.7125244140625, -2.45867919921875, -2.204833984375, -1.95098876953125, -1.6971435546875, -1.44329833984375, -1.189453125, -0.93560791015625, -0.6817626953125, -0.42791748046875, -0.174072265625, 0.07977294921875, 0.3336181640625, 0.58746337890625, 0.84130859375, 1.09515380859375, 1.3489990234375, 1.60284423828125, 1.856689453125, 2.11053466796875, 2.3643798828125, 2.61822509765625, 2.8720703125, 3.12591552734375, 3.3797607421875, 3.63360595703125, 3.887451171875, 4.14129638671875, 4.3951416015625, 4.64898681640625, 4.90283203125, 5.15667724609375, 5.4105224609375, 5.66436767578125, 5.918212890625, 6.17205810546875, 6.4259033203125, 6.67974853515625, 6.93359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 6.0, 14.0, 13.0, 18.0, 29.0, 24.0, 33.0, 31.0, 48.0, 54.0, 64.0, 49.0, 80.0, 69.0, 72.0, 69.0, 61.0, 52.0, 39.0, 36.0, 29.0, 15.0, 15.0, 13.0, 6.0, 10.0, 7.0, 12.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.033483505249023, -23.233503341674805, -22.433523178100586, -21.633543014526367, -20.83356285095215, -20.03358268737793, -19.233600616455078, -18.43362045288086, -17.63364028930664, -16.833660125732422, -16.033679962158203, -15.233699798583984, -14.433719635009766, -13.633739471435547, -12.833758354187012, -12.033778190612793, -11.23379898071289, -10.433818817138672, -9.633838653564453, -8.833858489990234, -8.033878326416016, -7.233897686004639, -6.433917045593262, -5.633936882019043, -4.833956718444824, -4.0339765548706055, -3.2339961528778076, -2.4340157508850098, -1.634035587310791, -0.8340554237365723, -0.03407478332519531, 0.7659053802490234, 1.5658836364746094, 2.365863800048828, 3.165844202041626, 3.965824604034424, 4.765804767608643, 5.565784931182861, 6.365765571594238, 7.165745735168457, 7.965725898742676, 8.765706062316895, 9.565686225891113, 10.365667343139648, 11.165647506713867, 11.965627670288086, 12.765607833862305, 13.565587997436523, 14.365568161010742, 15.165548324584961, 15.96552848815918, 16.7655086517334, 17.565488815307617, 18.365468978881836, 19.165451049804688, 19.965431213378906, 20.765411376953125, 21.565391540527344, 22.365371704101562, 23.16535186767578, 23.96533203125, 24.76531219482422, 25.565292358398438, 26.365272521972656, 27.165252685546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 10.0, 8.0, 9.0, 15.0, 20.0, 22.0, 26.0, 25.0, 24.0, 30.0, 27.0, 31.0, 36.0, 37.0, 39.0, 45.0, 47.0, 50.0, 41.0, 48.0, 37.0, 32.0, 35.0, 39.0, 40.0, 32.0, 30.0, 28.0, 13.0, 19.0, 19.0, 19.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.314404487609863, -13.856593132019043, -13.398782730102539, -12.940971374511719, -12.483160018920898, -12.025349617004395, -11.567538261413574, -11.10972785949707, -10.65191650390625, -10.19410514831543, -9.736294746398926, -9.278483390808105, -8.820672988891602, -8.362861633300781, -7.905050277709961, -7.447239398956299, -6.989428520202637, -6.531617641448975, -6.0738067626953125, -5.615995407104492, -5.15818452835083, -4.700373649597168, -4.242562294006348, -3.7847514152526855, -3.3269405364990234, -2.8691296577453613, -2.41131854057312, -1.9535075426101685, -1.4956965446472168, -1.0378856658935547, -0.5800745487213135, -0.12226343154907227, 0.33554840087890625, 0.7933593988418579, 1.2511703968048096, 1.7089813947677612, 2.166792392730713, 2.624603271484375, 3.082414388656616, 3.5402255058288574, 3.9980363845825195, 4.455847263336182, 4.913658142089844, 5.371469497680664, 5.829280376434326, 6.287091255187988, 6.744902610778809, 7.202713489532471, 7.660524368286133, 8.118335723876953, 8.576146125793457, 9.033957481384277, 9.491767883300781, 9.949579238891602, 10.407390594482422, 10.865201950073242, 11.323012351989746, 11.780823707580566, 12.23863410949707, 12.69644546508789, 13.154256820678711, 13.612067222595215, 14.069878578186035, 14.527688980102539, 14.98550033569336]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 17.0, 12.0, 24.0, 33.0, 59.0, 71.0, 119.0, 187.0, 269.0, 383.0, 587.0, 929.0, 1441.0, 2291.0, 3521.0, 5814.0, 9684.0, 15611.0, 26221.0, 42874.0, 68183.0, 102067.0, 138034.0, 158214.0, 148092.0, 114778.0, 79270.0, 50507.0, 30747.0, 18664.0, 11373.0, 6786.0, 4245.0, 2665.0, 1654.0, 1062.0, 649.0, 444.0, 327.0, 212.0, 131.0, 93.0, 53.0, 46.0, 42.0, 17.0, 14.0, 8.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.25, -10.894775390625, -10.53955078125, -10.184326171875, -9.8291015625, -9.473876953125, -9.11865234375, -8.763427734375, -8.408203125, -8.052978515625, -7.69775390625, -7.342529296875, -6.9873046875, -6.632080078125, -6.27685546875, -5.921630859375, -5.56640625, -5.211181640625, -4.85595703125, -4.500732421875, -4.1455078125, -3.790283203125, -3.43505859375, -3.079833984375, -2.724609375, -2.369384765625, -2.01416015625, -1.658935546875, -1.3037109375, -0.948486328125, -0.59326171875, -0.238037109375, 0.1171875, 0.472412109375, 0.82763671875, 1.182861328125, 1.5380859375, 1.893310546875, 2.24853515625, 2.603759765625, 2.958984375, 3.314208984375, 3.66943359375, 4.024658203125, 4.3798828125, 4.735107421875, 5.09033203125, 5.445556640625, 5.80078125, 6.156005859375, 6.51123046875, 6.866455078125, 7.2216796875, 7.576904296875, 7.93212890625, 8.287353515625, 8.642578125, 8.997802734375, 9.35302734375, 9.708251953125, 10.0634765625, 10.418701171875, 10.77392578125, 11.129150390625, 11.484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 7.0, 9.0, 4.0, 10.0, 19.0, 14.0, 14.0, 26.0, 24.0, 26.0, 35.0, 32.0, 45.0, 34.0, 36.0, 35.0, 52.0, 40.0, 51.0, 44.0, 44.0, 34.0, 34.0, 40.0, 32.0, 31.0, 30.0, 32.0, 29.0, 19.0, 24.0, 14.0, 13.0, 12.0, 10.0, 12.0, 5.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.75, -15.252197265625, -14.75439453125, -14.256591796875, -13.7587890625, -13.260986328125, -12.76318359375, -12.265380859375, -11.767578125, -11.269775390625, -10.77197265625, -10.274169921875, -9.7763671875, -9.278564453125, -8.78076171875, -8.282958984375, -7.78515625, -7.287353515625, -6.78955078125, -6.291748046875, -5.7939453125, -5.296142578125, -4.79833984375, -4.300537109375, -3.802734375, -3.304931640625, -2.80712890625, -2.309326171875, -1.8115234375, -1.313720703125, -0.81591796875, -0.318115234375, 0.1796875, 0.677490234375, 1.17529296875, 1.673095703125, 2.1708984375, 2.668701171875, 3.16650390625, 3.664306640625, 4.162109375, 4.659912109375, 5.15771484375, 5.655517578125, 6.1533203125, 6.651123046875, 7.14892578125, 7.646728515625, 8.14453125, 8.642333984375, 9.14013671875, 9.637939453125, 10.1357421875, 10.633544921875, 11.13134765625, 11.629150390625, 12.126953125, 12.624755859375, 13.12255859375, 13.620361328125, 14.1181640625, 14.615966796875, 15.11376953125, 15.611572265625, 16.109375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 15.0, 13.0, 25.0, 38.0, 55.0, 105.0, 151.0, 265.0, 424.0, 735.0, 1323.0, 2383.0, 4437.0, 9008.0, 18910.0, 41919.0, 95740.0, 200285.0, 288946.0, 203566.0, 97799.0, 43096.0, 19712.0, 9283.0, 4698.0, 2367.0, 1321.0, 751.0, 478.0, 256.0, 159.0, 105.0, 55.0, 37.0, 26.0, 27.0, 12.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.734375, -22.03515625, -21.3359375, -20.63671875, -19.9375, -19.23828125, -18.5390625, -17.83984375, -17.140625, -16.44140625, -15.7421875, -15.04296875, -14.34375, -13.64453125, -12.9453125, -12.24609375, -11.546875, -10.84765625, -10.1484375, -9.44921875, -8.75, -8.05078125, -7.3515625, -6.65234375, -5.953125, -5.25390625, -4.5546875, -3.85546875, -3.15625, -2.45703125, -1.7578125, -1.05859375, -0.359375, 0.33984375, 1.0390625, 1.73828125, 2.4375, 3.13671875, 3.8359375, 4.53515625, 5.234375, 5.93359375, 6.6328125, 7.33203125, 8.03125, 8.73046875, 9.4296875, 10.12890625, 10.828125, 11.52734375, 12.2265625, 12.92578125, 13.625, 14.32421875, 15.0234375, 15.72265625, 16.421875, 17.12109375, 17.8203125, 18.51953125, 19.21875, 19.91796875, 20.6171875, 21.31640625, 22.015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 6.0, 17.0, 14.0, 19.0, 18.0, 19.0, 24.0, 21.0, 23.0, 29.0, 36.0, 35.0, 48.0, 36.0, 42.0, 36.0, 38.0, 38.0, 39.0, 42.0, 43.0, 37.0, 41.0, 36.0, 30.0, 29.0, 22.0, 20.0, 14.0, 18.0, 21.0, 22.0, 8.0, 12.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.63134765625, -6.3564453125, -6.08154296875, -5.806640625, -5.53173828125, -5.2568359375, -4.98193359375, -4.70703125, -4.43212890625, -4.1572265625, -3.88232421875, -3.607421875, -3.33251953125, -3.0576171875, -2.78271484375, -2.5078125, -2.23291015625, -1.9580078125, -1.68310546875, -1.408203125, -1.13330078125, -0.8583984375, -0.58349609375, -0.30859375, -0.03369140625, 0.2412109375, 0.51611328125, 0.791015625, 1.06591796875, 1.3408203125, 1.61572265625, 1.890625, 2.16552734375, 2.4404296875, 2.71533203125, 2.990234375, 3.26513671875, 3.5400390625, 3.81494140625, 4.08984375, 4.36474609375, 4.6396484375, 4.91455078125, 5.189453125, 5.46435546875, 5.7392578125, 6.01416015625, 6.2890625, 6.56396484375, 6.8388671875, 7.11376953125, 7.388671875, 7.66357421875, 7.9384765625, 8.21337890625, 8.48828125, 8.76318359375, 9.0380859375, 9.31298828125, 9.587890625, 9.86279296875, 10.1376953125, 10.41259765625, 10.6875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 11.0, 20.0, 17.0, 26.0, 46.0, 57.0, 81.0, 94.0, 179.0, 249.0, 412.0, 590.0, 969.0, 1542.0, 2621.0, 4288.0, 7244.0, 12904.0, 23481.0, 43300.0, 80662.0, 145764.0, 222260.0, 210114.0, 131359.0, 72307.0, 38517.0, 20865.0, 11636.0, 6619.0, 3966.0, 2421.0, 1444.0, 831.0, 525.0, 366.0, 263.0, 155.0, 123.0, 63.0, 54.0, 23.0, 25.0, 14.0, 9.0, 13.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.890625, -9.6072998046875, -9.323974609375, -9.0406494140625, -8.75732421875, -8.4739990234375, -8.190673828125, -7.9073486328125, -7.6240234375, -7.3406982421875, -7.057373046875, -6.7740478515625, -6.49072265625, -6.2073974609375, -5.924072265625, -5.6407470703125, -5.357421875, -5.0740966796875, -4.790771484375, -4.5074462890625, -4.22412109375, -3.9407958984375, -3.657470703125, -3.3741455078125, -3.0908203125, -2.8074951171875, -2.524169921875, -2.2408447265625, -1.95751953125, -1.6741943359375, -1.390869140625, -1.1075439453125, -0.82421875, -0.5408935546875, -0.257568359375, 0.0257568359375, 0.30908203125, 0.5924072265625, 0.875732421875, 1.1590576171875, 1.4423828125, 1.7257080078125, 2.009033203125, 2.2923583984375, 2.57568359375, 2.8590087890625, 3.142333984375, 3.4256591796875, 3.708984375, 3.9923095703125, 4.275634765625, 4.5589599609375, 4.84228515625, 5.1256103515625, 5.408935546875, 5.6922607421875, 5.9755859375, 6.2589111328125, 6.542236328125, 6.8255615234375, 7.10888671875, 7.3922119140625, 7.675537109375, 7.9588623046875, 8.2421875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 8.0, 9.0, 12.0, 28.0, 31.0, 43.0, 54.0, 73.0, 69.0, 91.0, 73.0, 108.0, 74.0, 82.0, 53.0, 43.0, 34.0, 34.0, 17.0, 10.0, 11.0, 7.0, 8.0, 5.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006556510925292969, -0.0006361603736877441, -0.0006166696548461914, -0.0005971789360046387, -0.0005776882171630859, -0.0005581974983215332, -0.0005387067794799805, -0.0005192160606384277, -0.000499725341796875, -0.00048023462295532227, -0.00046074390411376953, -0.0004412531852722168, -0.00042176246643066406, -0.00040227174758911133, -0.0003827810287475586, -0.00036329030990600586, -0.0003437995910644531, -0.0003243088722229004, -0.00030481815338134766, -0.0002853274345397949, -0.0002658367156982422, -0.00024634599685668945, -0.00022685527801513672, -0.00020736455917358398, -0.00018787384033203125, -0.00016838312149047852, -0.00014889240264892578, -0.00012940168380737305, -0.00010991096496582031, -9.042024612426758e-05, -7.092952728271484e-05, -5.143880844116211e-05, -3.1948089599609375e-05, -1.245737075805664e-05, 7.033348083496094e-06, 2.6524066925048828e-05, 4.601478576660156e-05, 6.55055046081543e-05, 8.499622344970703e-05, 0.00010448694229125977, 0.0001239776611328125, 0.00014346837997436523, 0.00016295909881591797, 0.0001824498176574707, 0.00020194053649902344, 0.00022143125534057617, 0.0002409219741821289, 0.00026041269302368164, 0.0002799034118652344, 0.0002993941307067871, 0.00031888484954833984, 0.0003383755683898926, 0.0003578662872314453, 0.00037735700607299805, 0.0003968477249145508, 0.0004163384437561035, 0.00043582916259765625, 0.000455319881439209, 0.0004748106002807617, 0.0004943013191223145, 0.0005137920379638672, 0.0005332827568054199, 0.0005527734756469727, 0.0005722641944885254, 0.0005917549133300781]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 11.0, 15.0, 25.0, 28.0, 44.0, 67.0, 99.0, 141.0, 240.0, 279.0, 519.0, 747.0, 1142.0, 1747.0, 2606.0, 4151.0, 6194.0, 9608.0, 14765.0, 22736.0, 35416.0, 52876.0, 77548.0, 106870.0, 131283.0, 140603.0, 127000.0, 100057.0, 71941.0, 48654.0, 32040.0, 20709.0, 13321.0, 8531.0, 5666.0, 3667.0, 2419.0, 1620.0, 1103.0, 667.0, 488.0, 279.0, 230.0, 140.0, 87.0, 75.0, 37.0, 20.0, 9.0, 11.0, 14.0, 2.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0], "bins": [-6.33203125, -6.13031005859375, -5.9285888671875, -5.72686767578125, -5.525146484375, -5.32342529296875, -5.1217041015625, -4.91998291015625, -4.71826171875, -4.51654052734375, -4.3148193359375, -4.11309814453125, -3.911376953125, -3.70965576171875, -3.5079345703125, -3.30621337890625, -3.1044921875, -2.90277099609375, -2.7010498046875, -2.49932861328125, -2.297607421875, -2.09588623046875, -1.8941650390625, -1.69244384765625, -1.49072265625, -1.28900146484375, -1.0872802734375, -0.88555908203125, -0.683837890625, -0.48211669921875, -0.2803955078125, -0.07867431640625, 0.123046875, 0.32476806640625, 0.5264892578125, 0.72821044921875, 0.929931640625, 1.13165283203125, 1.3333740234375, 1.53509521484375, 1.73681640625, 1.93853759765625, 2.1402587890625, 2.34197998046875, 2.543701171875, 2.74542236328125, 2.9471435546875, 3.14886474609375, 3.3505859375, 3.55230712890625, 3.7540283203125, 3.95574951171875, 4.157470703125, 4.35919189453125, 4.5609130859375, 4.76263427734375, 4.96435546875, 5.16607666015625, 5.3677978515625, 5.56951904296875, 5.771240234375, 5.97296142578125, 6.1746826171875, 6.37640380859375, 6.578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 10.0, 5.0, 5.0, 8.0, 10.0, 7.0, 13.0, 10.0, 22.0, 15.0, 20.0, 19.0, 21.0, 28.0, 37.0, 39.0, 39.0, 45.0, 43.0, 45.0, 37.0, 53.0, 55.0, 47.0, 41.0, 40.0, 36.0, 33.0, 37.0, 26.0, 24.0, 19.0, 19.0, 19.0, 17.0, 12.0, 10.0, 3.0, 7.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.8759765625, -1.8157958984375, -1.755615234375, -1.6954345703125, -1.63525390625, -1.5750732421875, -1.514892578125, -1.4547119140625, -1.39453125, -1.3343505859375, -1.274169921875, -1.2139892578125, -1.15380859375, -1.0936279296875, -1.033447265625, -0.9732666015625, -0.9130859375, -0.8529052734375, -0.792724609375, -0.7325439453125, -0.67236328125, -0.6121826171875, -0.552001953125, -0.4918212890625, -0.431640625, -0.3714599609375, -0.311279296875, -0.2510986328125, -0.19091796875, -0.1307373046875, -0.070556640625, -0.0103759765625, 0.0498046875, 0.1099853515625, 0.170166015625, 0.2303466796875, 0.29052734375, 0.3507080078125, 0.410888671875, 0.4710693359375, 0.53125, 0.5914306640625, 0.651611328125, 0.7117919921875, 0.77197265625, 0.8321533203125, 0.892333984375, 0.9525146484375, 1.0126953125, 1.0728759765625, 1.133056640625, 1.1932373046875, 1.25341796875, 1.3135986328125, 1.373779296875, 1.4339599609375, 1.494140625, 1.5543212890625, 1.614501953125, 1.6746826171875, 1.73486328125, 1.7950439453125, 1.855224609375, 1.9154052734375, 1.9755859375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 12.0, 22.0, 22.0, 24.0, 29.0, 27.0, 35.0, 37.0, 58.0, 65.0, 53.0, 77.0, 76.0, 69.0, 66.0, 58.0, 43.0, 43.0, 37.0, 25.0, 20.0, 16.0, 10.0, 6.0, 7.0, 9.0, 13.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.444873809814453, -22.66288185119629, -21.880887985229492, -21.098896026611328, -20.31690216064453, -19.534910202026367, -18.752918243408203, -17.970924377441406, -17.188932418823242, -16.406940460205078, -15.624946594238281, -14.842954635620117, -14.060961723327637, -13.278968811035156, -12.496976852416992, -11.714983940124512, -10.932991027832031, -10.15099811553955, -9.36900520324707, -8.587013244628906, -7.805020332336426, -7.023027420043945, -6.241034984588623, -5.459042549133301, -4.67704963684082, -3.895056962966919, -3.1130642890930176, -2.331071615219116, -1.5490789413452148, -0.7670862674713135, 0.01490640640258789, 0.7968988418579102, 1.5788917541503906, 2.360884428024292, 3.1428771018981934, 3.9248697757720947, 4.706862449645996, 5.488855361938477, 6.270847797393799, 7.052840232849121, 7.834833145141602, 8.616826057434082, 9.398818969726562, 10.180810928344727, 10.962803840637207, 11.744796752929688, 12.526788711547852, 13.308781623840332, 14.090774536132812, 14.872767448425293, 15.654760360717773, 16.436752319335938, 17.218746185302734, 18.0007381439209, 18.782730102539062, 19.56472396850586, 20.346715927124023, 21.128707885742188, 21.910701751708984, 22.69269371032715, 23.474685668945312, 24.25667953491211, 25.038671493530273, 25.820663452148438, 26.602657318115234]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 5.0, 7.0, 6.0, 12.0, 18.0, 12.0, 16.0, 27.0, 26.0, 27.0, 20.0, 23.0, 26.0, 35.0, 33.0, 47.0, 35.0, 39.0, 56.0, 41.0, 48.0, 39.0, 43.0, 33.0, 32.0, 37.0, 39.0, 28.0, 32.0, 24.0, 23.0, 19.0, 15.0, 17.0, 5.0, 13.0, 6.0, 6.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.84384536743164, -13.400592803955078, -12.957340240478516, -12.514087677001953, -12.07083511352539, -11.627582550048828, -11.184329986572266, -10.741076469421387, -10.297823905944824, -9.854571342468262, -9.4113187789917, -8.968066215515137, -8.524813652038574, -8.081560134887695, -7.638308048248291, -7.19505500793457, -6.751802921295166, -6.3085503578186035, -5.865297794342041, -5.42204475402832, -4.978792190551758, -4.535539627075195, -4.092287063598633, -3.649034261703491, -3.2057816982269287, -2.762529134750366, -2.3192763328552246, -1.876023769378662, -1.43277108669281, -0.989518404006958, -0.5462658405303955, -0.1030130386352539, 0.3402395248413086, 0.7834922075271606, 1.2267448902130127, 1.6699974536895752, 2.113250255584717, 2.5565028190612793, 2.999755382537842, 3.4430081844329834, 3.886260747909546, 4.3295135498046875, 4.77276611328125, 5.2160186767578125, 5.659271240234375, 6.1025238037109375, 6.5457763671875, 6.989029407501221, 7.432281970977783, 7.875534534454346, 8.318787574768066, 8.762040138244629, 9.205292701721191, 9.648545265197754, 10.091797828674316, 10.535050392150879, 10.978302955627441, 11.421555519104004, 11.864808082580566, 12.308060646057129, 12.751313209533691, 13.19456672668457, 13.637819290161133, 14.081071853637695, 14.524324417114258]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 14.0, 16.0, 26.0, 31.0, 59.0, 67.0, 127.0, 176.0, 309.0, 445.0, 717.0, 1136.0, 1675.0, 2701.0, 4162.0, 6395.0, 9588.0, 14736.0, 22470.0, 32949.0, 47720.0, 65845.0, 86206.0, 104971.0, 117713.0, 117800.0, 107628.0, 88046.0, 66700.0, 48415.0, 33718.0, 22594.0, 15037.0, 9936.0, 6496.0, 4184.0, 2790.0, 1756.0, 1146.0, 732.0, 459.0, 311.0, 189.0, 145.0, 80.0, 47.0, 30.0, 19.0, 23.0, 6.0, 8.0, 5.0, 5.0, 1.0, 2.0, 5.0], "bins": [-12.15625, -11.7882080078125, -11.420166015625, -11.0521240234375, -10.68408203125, -10.3160400390625, -9.947998046875, -9.5799560546875, -9.2119140625, -8.8438720703125, -8.475830078125, -8.1077880859375, -7.73974609375, -7.3717041015625, -7.003662109375, -6.6356201171875, -6.267578125, -5.8995361328125, -5.531494140625, -5.1634521484375, -4.79541015625, -4.4273681640625, -4.059326171875, -3.6912841796875, -3.3232421875, -2.9552001953125, -2.587158203125, -2.2191162109375, -1.85107421875, -1.4830322265625, -1.114990234375, -0.7469482421875, -0.37890625, -0.0108642578125, 0.357177734375, 0.7252197265625, 1.09326171875, 1.4613037109375, 1.829345703125, 2.1973876953125, 2.5654296875, 2.9334716796875, 3.301513671875, 3.6695556640625, 4.03759765625, 4.4056396484375, 4.773681640625, 5.1417236328125, 5.509765625, 5.8778076171875, 6.245849609375, 6.6138916015625, 6.98193359375, 7.3499755859375, 7.718017578125, 8.0860595703125, 8.4541015625, 8.8221435546875, 9.190185546875, 9.5582275390625, 9.92626953125, 10.2943115234375, 10.662353515625, 11.0303955078125, 11.3984375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 11.0, 16.0, 24.0, 18.0, 19.0, 23.0, 19.0, 33.0, 25.0, 34.0, 36.0, 34.0, 39.0, 38.0, 47.0, 47.0, 46.0, 53.0, 38.0, 39.0, 43.0, 34.0, 27.0, 36.0, 26.0, 22.0, 17.0, 23.0, 15.0, 16.0, 17.0, 9.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.5234375, -15.05126953125, -14.5791015625, -14.10693359375, -13.634765625, -13.16259765625, -12.6904296875, -12.21826171875, -11.74609375, -11.27392578125, -10.8017578125, -10.32958984375, -9.857421875, -9.38525390625, -8.9130859375, -8.44091796875, -7.96875, -7.49658203125, -7.0244140625, -6.55224609375, -6.080078125, -5.60791015625, -5.1357421875, -4.66357421875, -4.19140625, -3.71923828125, -3.2470703125, -2.77490234375, -2.302734375, -1.83056640625, -1.3583984375, -0.88623046875, -0.4140625, 0.05810546875, 0.5302734375, 1.00244140625, 1.474609375, 1.94677734375, 2.4189453125, 2.89111328125, 3.36328125, 3.83544921875, 4.3076171875, 4.77978515625, 5.251953125, 5.72412109375, 6.1962890625, 6.66845703125, 7.140625, 7.61279296875, 8.0849609375, 8.55712890625, 9.029296875, 9.50146484375, 9.9736328125, 10.44580078125, 10.91796875, 11.39013671875, 11.8623046875, 12.33447265625, 12.806640625, 13.27880859375, 13.7509765625, 14.22314453125, 14.6953125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 19.0, 22.0, 35.0, 61.0, 81.0, 124.0, 198.0, 300.0, 494.0, 703.0, 1114.0, 1685.0, 2505.0, 3761.0, 5699.0, 8317.0, 12193.0, 17883.0, 25515.0, 35981.0, 49046.0, 64995.0, 80572.0, 95684.0, 104528.0, 105260.0, 97678.0, 84531.0, 68415.0, 52534.0, 39218.0, 28306.0, 19448.0, 13628.0, 9284.0, 6439.0, 4226.0, 2773.0, 1820.0, 1221.0, 785.0, 505.0, 339.0, 243.0, 136.0, 90.0, 67.0, 30.0, 20.0, 22.0, 12.0, 7.0, 3.0, 0.0, 3.0], "bins": [-11.15625, -10.829345703125, -10.50244140625, -10.175537109375, -9.8486328125, -9.521728515625, -9.19482421875, -8.867919921875, -8.541015625, -8.214111328125, -7.88720703125, -7.560302734375, -7.2333984375, -6.906494140625, -6.57958984375, -6.252685546875, -5.92578125, -5.598876953125, -5.27197265625, -4.945068359375, -4.6181640625, -4.291259765625, -3.96435546875, -3.637451171875, -3.310546875, -2.983642578125, -2.65673828125, -2.329833984375, -2.0029296875, -1.676025390625, -1.34912109375, -1.022216796875, -0.6953125, -0.368408203125, -0.04150390625, 0.285400390625, 0.6123046875, 0.939208984375, 1.26611328125, 1.593017578125, 1.919921875, 2.246826171875, 2.57373046875, 2.900634765625, 3.2275390625, 3.554443359375, 3.88134765625, 4.208251953125, 4.53515625, 4.862060546875, 5.18896484375, 5.515869140625, 5.8427734375, 6.169677734375, 6.49658203125, 6.823486328125, 7.150390625, 7.477294921875, 7.80419921875, 8.131103515625, 8.4580078125, 8.784912109375, 9.11181640625, 9.438720703125, 9.765625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 4.0, 7.0, 14.0, 6.0, 9.0, 8.0, 11.0, 8.0, 7.0, 22.0, 19.0, 31.0, 26.0, 41.0, 44.0, 30.0, 27.0, 47.0, 33.0, 39.0, 43.0, 44.0, 50.0, 39.0, 42.0, 44.0, 35.0, 27.0, 27.0, 29.0, 27.0, 24.0, 14.0, 27.0, 12.0, 17.0, 14.0, 6.0, 8.0, 6.0, 6.0, 3.0, 5.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.4036865234375, -8.135498046875, -7.8673095703125, -7.59912109375, -7.3309326171875, -7.062744140625, -6.7945556640625, -6.5263671875, -6.2581787109375, -5.989990234375, -5.7218017578125, -5.45361328125, -5.1854248046875, -4.917236328125, -4.6490478515625, -4.380859375, -4.1126708984375, -3.844482421875, -3.5762939453125, -3.30810546875, -3.0399169921875, -2.771728515625, -2.5035400390625, -2.2353515625, -1.9671630859375, -1.698974609375, -1.4307861328125, -1.16259765625, -0.8944091796875, -0.626220703125, -0.3580322265625, -0.08984375, 0.1783447265625, 0.446533203125, 0.7147216796875, 0.98291015625, 1.2510986328125, 1.519287109375, 1.7874755859375, 2.0556640625, 2.3238525390625, 2.592041015625, 2.8602294921875, 3.12841796875, 3.3966064453125, 3.664794921875, 3.9329833984375, 4.201171875, 4.4693603515625, 4.737548828125, 5.0057373046875, 5.27392578125, 5.5421142578125, 5.810302734375, 6.0784912109375, 6.3466796875, 6.6148681640625, 6.883056640625, 7.1512451171875, 7.41943359375, 7.6876220703125, 7.955810546875, 8.2239990234375, 8.4921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 11.0, 15.0, 22.0, 30.0, 53.0, 82.0, 126.0, 179.0, 314.0, 441.0, 688.0, 1129.0, 1835.0, 2945.0, 4536.0, 7319.0, 12100.0, 19082.0, 29466.0, 44700.0, 65070.0, 89578.0, 113554.0, 129324.0, 129194.0, 113988.0, 90598.0, 65726.0, 45113.0, 29640.0, 19273.0, 12210.0, 7489.0, 4840.0, 2832.0, 1884.0, 1137.0, 779.0, 407.0, 285.0, 205.0, 121.0, 76.0, 65.0, 29.0, 18.0, 19.0, 15.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-5.53125, -5.36370849609375, -5.1961669921875, -5.02862548828125, -4.861083984375, -4.69354248046875, -4.5260009765625, -4.35845947265625, -4.19091796875, -4.02337646484375, -3.8558349609375, -3.68829345703125, -3.520751953125, -3.35321044921875, -3.1856689453125, -3.01812744140625, -2.8505859375, -2.68304443359375, -2.5155029296875, -2.34796142578125, -2.180419921875, -2.01287841796875, -1.8453369140625, -1.67779541015625, -1.51025390625, -1.34271240234375, -1.1751708984375, -1.00762939453125, -0.840087890625, -0.67254638671875, -0.5050048828125, -0.33746337890625, -0.169921875, -0.00238037109375, 0.1651611328125, 0.33270263671875, 0.500244140625, 0.66778564453125, 0.8353271484375, 1.00286865234375, 1.17041015625, 1.33795166015625, 1.5054931640625, 1.67303466796875, 1.840576171875, 2.00811767578125, 2.1756591796875, 2.34320068359375, 2.5107421875, 2.67828369140625, 2.8458251953125, 3.01336669921875, 3.180908203125, 3.34844970703125, 3.5159912109375, 3.68353271484375, 3.85107421875, 4.01861572265625, 4.1861572265625, 4.35369873046875, 4.521240234375, 4.68878173828125, 4.8563232421875, 5.02386474609375, 5.19140625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 6.0, 2.0, 9.0, 16.0, 15.0, 18.0, 29.0, 21.0, 38.0, 38.0, 37.0, 50.0, 58.0, 71.0, 53.0, 60.0, 60.0, 42.0, 60.0, 50.0, 47.0, 34.0, 28.0, 24.0, 29.0, 21.0, 19.0, 17.0, 10.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006580352783203125, -0.0006364732980728149, -0.0006149113178253174, -0.0005933493375778198, -0.0005717873573303223, -0.0005502253770828247, -0.0005286633968353271, -0.0005071014165878296, -0.00048553943634033203, -0.00046397745609283447, -0.0004424154758453369, -0.00042085349559783936, -0.0003992915153503418, -0.00037772953510284424, -0.0003561675548553467, -0.0003346055746078491, -0.00031304359436035156, -0.000291481614112854, -0.00026991963386535645, -0.0002483576536178589, -0.00022679567337036133, -0.00020523369312286377, -0.0001836717128753662, -0.00016210973262786865, -0.0001405477523803711, -0.00011898577213287354, -9.742379188537598e-05, -7.586181163787842e-05, -5.429983139038086e-05, -3.27378511428833e-05, -1.1175870895385742e-05, 1.0386109352111816e-05, 3.1948089599609375e-05, 5.3510069847106934e-05, 7.507205009460449e-05, 9.663403034210205e-05, 0.00011819601058959961, 0.00013975799083709717, 0.00016131997108459473, 0.00018288195133209229, 0.00020444393157958984, 0.0002260059118270874, 0.00024756789207458496, 0.0002691298723220825, 0.0002906918525695801, 0.00031225383281707764, 0.0003338158130645752, 0.00035537779331207275, 0.0003769397735595703, 0.00039850175380706787, 0.00042006373405456543, 0.000441625714302063, 0.00046318769454956055, 0.0004847496747970581, 0.0005063116550445557, 0.0005278736352920532, 0.0005494356155395508, 0.0005709975957870483, 0.0005925595760345459, 0.0006141215562820435, 0.000635683536529541, 0.0006572455167770386, 0.0006788074970245361, 0.0007003694772720337, 0.0007219314575195312]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 19.0, 23.0, 45.0, 55.0, 97.0, 148.0, 214.0, 332.0, 515.0, 714.0, 1118.0, 1682.0, 2484.0, 3790.0, 5733.0, 8552.0, 12787.0, 18554.0, 27741.0, 39744.0, 55165.0, 73760.0, 92397.0, 107478.0, 114636.0, 110094.0, 96329.0, 77932.0, 59380.0, 43470.0, 30150.0, 20857.0, 14030.0, 9417.0, 6390.0, 4235.0, 2751.0, 1888.0, 1270.0, 905.0, 550.0, 366.0, 258.0, 183.0, 91.0, 91.0, 46.0, 18.0, 23.0, 12.0, 9.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.42108154296875, -4.2718505859375, -4.12261962890625, -3.973388671875, -3.82415771484375, -3.6749267578125, -3.52569580078125, -3.37646484375, -3.22723388671875, -3.0780029296875, -2.92877197265625, -2.779541015625, -2.63031005859375, -2.4810791015625, -2.33184814453125, -2.1826171875, -2.03338623046875, -1.8841552734375, -1.73492431640625, -1.585693359375, -1.43646240234375, -1.2872314453125, -1.13800048828125, -0.98876953125, -0.83953857421875, -0.6903076171875, -0.54107666015625, -0.391845703125, -0.24261474609375, -0.0933837890625, 0.05584716796875, 0.205078125, 0.35430908203125, 0.5035400390625, 0.65277099609375, 0.802001953125, 0.95123291015625, 1.1004638671875, 1.24969482421875, 1.39892578125, 1.54815673828125, 1.6973876953125, 1.84661865234375, 1.995849609375, 2.14508056640625, 2.2943115234375, 2.44354248046875, 2.5927734375, 2.74200439453125, 2.8912353515625, 3.04046630859375, 3.189697265625, 3.33892822265625, 3.4881591796875, 3.63739013671875, 3.78662109375, 3.93585205078125, 4.0850830078125, 4.23431396484375, 4.383544921875, 4.53277587890625, 4.6820068359375, 4.83123779296875, 4.98046875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 9.0, 7.0, 8.0, 8.0, 7.0, 12.0, 11.0, 17.0, 19.0, 22.0, 21.0, 34.0, 29.0, 39.0, 26.0, 42.0, 39.0, 41.0, 38.0, 39.0, 56.0, 49.0, 48.0, 38.0, 32.0, 32.0, 31.0, 42.0, 38.0, 32.0, 22.0, 16.0, 16.0, 12.0, 13.0, 12.0, 13.0, 5.0, 5.0, 4.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9201507568359375, -1.860809326171875, -1.8014678955078125, -1.74212646484375, -1.6827850341796875, -1.623443603515625, -1.5641021728515625, -1.5047607421875, -1.4454193115234375, -1.386077880859375, -1.3267364501953125, -1.26739501953125, -1.2080535888671875, -1.148712158203125, -1.0893707275390625, -1.030029296875, -0.9706878662109375, -0.911346435546875, -0.8520050048828125, -0.79266357421875, -0.7333221435546875, -0.673980712890625, -0.6146392822265625, -0.5552978515625, -0.4959564208984375, -0.436614990234375, -0.3772735595703125, -0.31793212890625, -0.2585906982421875, -0.199249267578125, -0.1399078369140625, -0.08056640625, -0.0212249755859375, 0.038116455078125, 0.0974578857421875, 0.15679931640625, 0.2161407470703125, 0.275482177734375, 0.3348236083984375, 0.3941650390625, 0.4535064697265625, 0.512847900390625, 0.5721893310546875, 0.63153076171875, 0.6908721923828125, 0.750213623046875, 0.8095550537109375, 0.868896484375, 0.9282379150390625, 0.987579345703125, 1.0469207763671875, 1.10626220703125, 1.1656036376953125, 1.224945068359375, 1.2842864990234375, 1.3436279296875, 1.4029693603515625, 1.462310791015625, 1.5216522216796875, 1.58099365234375, 1.6403350830078125, 1.699676513671875, 1.7590179443359375, 1.818359375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 5.0, 15.0, 5.0, 13.0, 11.0, 23.0, 28.0, 31.0, 46.0, 49.0, 51.0, 60.0, 54.0, 61.0, 77.0, 66.0, 69.0, 58.0, 49.0, 42.0, 34.0, 16.0, 26.0, 16.0, 18.0, 11.0, 8.0, 7.0, 11.0, 3.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.74799919128418, -22.989160537719727, -22.230321884155273, -21.471485137939453, -20.712646484375, -19.953807830810547, -19.194969177246094, -18.43613052368164, -17.677291870117188, -16.918453216552734, -16.15961456298828, -15.400776863098145, -14.641939163208008, -13.883100509643555, -13.124261856079102, -12.365423202514648, -11.606586456298828, -10.847747802734375, -10.088910102844238, -9.330071449279785, -8.571233749389648, -7.812395095825195, -7.053556442260742, -6.294718265533447, -5.535880088806152, -4.777041912078857, -4.0182037353515625, -3.2593650817871094, -2.5005269050598145, -1.7416887283325195, -0.9828500747680664, -0.22401189804077148, 0.5348281860351562, 1.2936664819717407, 2.052504777908325, 2.811343193054199, 3.570181369781494, 4.329019546508789, 5.087858200073242, 5.846696376800537, 6.605534553527832, 7.364372730255127, 8.123210906982422, 8.882049560546875, 9.640888214111328, 10.399725914001465, 11.158564567565918, 11.917402267456055, 12.676240921020508, 13.435079574584961, 14.193917274475098, 14.95275592803955, 15.711593627929688, 16.47043228149414, 17.229270935058594, 17.988109588623047, 18.7469482421875, 19.505786895751953, 20.264625549316406, 21.02346420288086, 21.78230094909668, 22.541139602661133, 23.299978256225586, 24.05881690979004, 24.81765365600586]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 6.0, 4.0, 9.0, 10.0, 13.0, 19.0, 16.0, 24.0, 26.0, 26.0, 35.0, 37.0, 44.0, 44.0, 45.0, 43.0, 42.0, 49.0, 47.0, 41.0, 48.0, 47.0, 37.0, 35.0, 40.0, 31.0, 37.0, 26.0, 20.0, 18.0, 11.0, 13.0, 18.0, 6.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.983983993530273, -15.481595993041992, -14.979207992553711, -14.47681999206543, -13.974432945251465, -13.472044944763184, -12.969656944274902, -12.467268943786621, -11.964881896972656, -11.462493896484375, -10.960105895996094, -10.457717895507812, -9.955330848693848, -9.452942848205566, -8.950554847717285, -8.448166847229004, -7.945778846740723, -7.443390846252441, -6.941003322601318, -6.438615322113037, -5.936227798461914, -5.433839797973633, -4.931451797485352, -4.42906379699707, -3.9266762733459473, -3.424288511276245, -2.921900749206543, -2.4195127487182617, -1.9171249866485596, -1.4147372245788574, -0.9123492240905762, -0.409961462020874, 0.09242630004882812, 0.594814121723175, 1.097201943397522, 1.5995898246765137, 2.101977586746216, 2.604365348815918, 3.106753349304199, 3.6091411113739014, 4.1115288734436035, 4.613916873931885, 5.116304397583008, 5.618692398071289, 6.12108039855957, 6.623467922210693, 7.125855922698975, 7.628243446350098, 8.130631446838379, 8.63301944732666, 9.135407447814941, 9.637794494628906, 10.140182495117188, 10.642570495605469, 11.14495849609375, 11.647346496582031, 12.149734497070312, 12.652122497558594, 13.154510498046875, 13.656898498535156, 14.159285545349121, 14.661673545837402, 15.164061546325684, 15.666449546813965, 16.16883659362793]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 23.0, 21.0, 31.0, 41.0, 68.0, 111.0, 183.0, 263.0, 344.0, 580.0, 876.0, 1367.0, 2113.0, 3431.0, 5850.0, 10023.0, 17868.0, 32856.0, 63297.0, 125981.0, 258339.0, 508127.0, 845495.0, 945040.0, 663911.0, 355428.0, 173634.0, 84422.0, 42582.0, 22138.0, 12071.0, 6912.0, 4017.0, 2460.0, 1584.0, 982.0, 616.0, 385.0, 285.0, 176.0, 136.0, 77.0, 44.0, 32.0, 21.0, 16.0, 8.0, 11.0, 3.0, 2.0, 2.0], "bins": [-26.890625, -26.148193359375, -25.40576171875, -24.663330078125, -23.9208984375, -23.178466796875, -22.43603515625, -21.693603515625, -20.951171875, -20.208740234375, -19.46630859375, -18.723876953125, -17.9814453125, -17.239013671875, -16.49658203125, -15.754150390625, -15.01171875, -14.269287109375, -13.52685546875, -12.784423828125, -12.0419921875, -11.299560546875, -10.55712890625, -9.814697265625, -9.072265625, -8.329833984375, -7.58740234375, -6.844970703125, -6.1025390625, -5.360107421875, -4.61767578125, -3.875244140625, -3.1328125, -2.390380859375, -1.64794921875, -0.905517578125, -0.1630859375, 0.579345703125, 1.32177734375, 2.064208984375, 2.806640625, 3.549072265625, 4.29150390625, 5.033935546875, 5.7763671875, 6.518798828125, 7.26123046875, 8.003662109375, 8.74609375, 9.488525390625, 10.23095703125, 10.973388671875, 11.7158203125, 12.458251953125, 13.20068359375, 13.943115234375, 14.685546875, 15.427978515625, 16.17041015625, 16.912841796875, 17.6552734375, 18.397705078125, 19.14013671875, 19.882568359375, 20.625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 8.0, 2.0, 3.0, 16.0, 16.0, 14.0, 21.0, 19.0, 27.0, 30.0, 33.0, 43.0, 46.0, 44.0, 45.0, 46.0, 57.0, 37.0, 43.0, 57.0, 60.0, 42.0, 47.0, 42.0, 40.0, 41.0, 24.0, 18.0, 18.0, 16.0, 7.0, 14.0, 7.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.79248046875, -13.3271484375, -12.86181640625, -12.396484375, -11.93115234375, -11.4658203125, -11.00048828125, -10.53515625, -10.06982421875, -9.6044921875, -9.13916015625, -8.673828125, -8.20849609375, -7.7431640625, -7.27783203125, -6.8125, -6.34716796875, -5.8818359375, -5.41650390625, -4.951171875, -4.48583984375, -4.0205078125, -3.55517578125, -3.08984375, -2.62451171875, -2.1591796875, -1.69384765625, -1.228515625, -0.76318359375, -0.2978515625, 0.16748046875, 0.6328125, 1.09814453125, 1.5634765625, 2.02880859375, 2.494140625, 2.95947265625, 3.4248046875, 3.89013671875, 4.35546875, 4.82080078125, 5.2861328125, 5.75146484375, 6.216796875, 6.68212890625, 7.1474609375, 7.61279296875, 8.078125, 8.54345703125, 9.0087890625, 9.47412109375, 9.939453125, 10.40478515625, 10.8701171875, 11.33544921875, 11.80078125, 12.26611328125, 12.7314453125, 13.19677734375, 13.662109375, 14.12744140625, 14.5927734375, 15.05810546875, 15.5234375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 16.0, 25.0, 27.0, 59.0, 61.0, 110.0, 176.0, 279.0, 414.0, 567.0, 941.0, 1552.0, 2330.0, 3890.0, 6632.0, 11408.0, 19723.0, 35033.0, 64320.0, 119541.0, 221537.0, 399993.0, 647676.0, 826738.0, 734623.0, 484396.0, 277344.0, 150579.0, 80938.0, 44293.0, 24632.0, 13834.0, 8090.0, 4760.0, 2843.0, 1714.0, 1092.0, 758.0, 457.0, 324.0, 182.0, 140.0, 83.0, 48.0, 34.0, 23.0, 17.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0], "bins": [-27.453125, -26.66162109375, -25.8701171875, -25.07861328125, -24.287109375, -23.49560546875, -22.7041015625, -21.91259765625, -21.12109375, -20.32958984375, -19.5380859375, -18.74658203125, -17.955078125, -17.16357421875, -16.3720703125, -15.58056640625, -14.7890625, -13.99755859375, -13.2060546875, -12.41455078125, -11.623046875, -10.83154296875, -10.0400390625, -9.24853515625, -8.45703125, -7.66552734375, -6.8740234375, -6.08251953125, -5.291015625, -4.49951171875, -3.7080078125, -2.91650390625, -2.125, -1.33349609375, -0.5419921875, 0.24951171875, 1.041015625, 1.83251953125, 2.6240234375, 3.41552734375, 4.20703125, 4.99853515625, 5.7900390625, 6.58154296875, 7.373046875, 8.16455078125, 8.9560546875, 9.74755859375, 10.5390625, 11.33056640625, 12.1220703125, 12.91357421875, 13.705078125, 14.49658203125, 15.2880859375, 16.07958984375, 16.87109375, 17.66259765625, 18.4541015625, 19.24560546875, 20.037109375, 20.82861328125, 21.6201171875, 22.41162109375, 23.203125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 0.0, 6.0, 5.0, 17.0, 15.0, 22.0, 18.0, 38.0, 51.0, 73.0, 80.0, 134.0, 164.0, 197.0, 262.0, 299.0, 317.0, 346.0, 344.0, 335.0, 275.0, 254.0, 208.0, 147.0, 130.0, 100.0, 68.0, 59.0, 26.0, 25.0, 13.0, 16.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.4296875, -12.10009765625, -11.7705078125, -11.44091796875, -11.111328125, -10.78173828125, -10.4521484375, -10.12255859375, -9.79296875, -9.46337890625, -9.1337890625, -8.80419921875, -8.474609375, -8.14501953125, -7.8154296875, -7.48583984375, -7.15625, -6.82666015625, -6.4970703125, -6.16748046875, -5.837890625, -5.50830078125, -5.1787109375, -4.84912109375, -4.51953125, -4.18994140625, -3.8603515625, -3.53076171875, -3.201171875, -2.87158203125, -2.5419921875, -2.21240234375, -1.8828125, -1.55322265625, -1.2236328125, -0.89404296875, -0.564453125, -0.23486328125, 0.0947265625, 0.42431640625, 0.75390625, 1.08349609375, 1.4130859375, 1.74267578125, 2.072265625, 2.40185546875, 2.7314453125, 3.06103515625, 3.390625, 3.72021484375, 4.0498046875, 4.37939453125, 4.708984375, 5.03857421875, 5.3681640625, 5.69775390625, 6.02734375, 6.35693359375, 6.6865234375, 7.01611328125, 7.345703125, 7.67529296875, 8.0048828125, 8.33447265625, 8.6640625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 3.0, 8.0, 20.0, 8.0, 15.0, 27.0, 24.0, 25.0, 36.0, 35.0, 52.0, 58.0, 59.0, 58.0, 64.0, 50.0, 69.0, 55.0, 45.0, 55.0, 51.0, 38.0, 27.0, 25.0, 16.0, 13.0, 9.0, 12.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.259218215942383, -20.40230941772461, -19.545400619506836, -18.688491821289062, -17.83158302307129, -16.974674224853516, -16.117765426635742, -15.260856628417969, -14.403947830200195, -13.547039031982422, -12.690130233764648, -11.833221435546875, -10.976312637329102, -10.119403839111328, -9.262495040893555, -8.405586242675781, -7.548677444458008, -6.691768646240234, -5.834859848022461, -4.9779510498046875, -4.121042251586914, -3.2641334533691406, -2.407224655151367, -1.5503158569335938, -0.6934070587158203, 0.16350173950195312, 1.0204105377197266, 1.8773193359375, 2.7342281341552734, 3.591136932373047, 4.44804573059082, 5.304954528808594, 6.161865234375, 7.018774032592773, 7.875682830810547, 8.73259162902832, 9.589500427246094, 10.446409225463867, 11.30331802368164, 12.160226821899414, 13.017135620117188, 13.874044418334961, 14.730953216552734, 15.587862014770508, 16.44477081298828, 17.301679611206055, 18.158588409423828, 19.0154972076416, 19.872406005859375, 20.72931480407715, 21.586223602294922, 22.443132400512695, 23.30004119873047, 24.156949996948242, 25.013858795166016, 25.87076759338379, 26.727676391601562, 27.584585189819336, 28.44149398803711, 29.298402786254883, 30.155311584472656, 31.01222038269043, 31.869129180908203, 32.726036071777344, 33.58294677734375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 5.0, 14.0, 11.0, 12.0, 19.0, 15.0, 26.0, 24.0, 35.0, 32.0, 26.0, 37.0, 43.0, 51.0, 40.0, 42.0, 43.0, 44.0, 45.0, 42.0, 33.0, 33.0, 42.0, 23.0, 16.0, 23.0, 31.0, 24.0, 26.0, 20.0, 23.0, 23.0, 13.0, 11.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.862382888793945, -16.340221405029297, -15.818058967590332, -15.295896530151367, -14.773735046386719, -14.25157356262207, -13.729411125183105, -13.20724868774414, -12.685087203979492, -12.162925720214844, -11.640763282775879, -11.118600845336914, -10.596439361572266, -10.074277877807617, -9.552115440368652, -9.029953002929688, -8.507791519165039, -7.985629558563232, -7.463467597961426, -6.941305637359619, -6.4191436767578125, -5.896981716156006, -5.374819755554199, -4.852657794952393, -4.330495834350586, -3.8083338737487793, -3.2861719131469727, -2.764009952545166, -2.2418479919433594, -1.7196860313415527, -1.197524070739746, -0.6753621101379395, -0.1532001495361328, 0.36896181106567383, 0.8911237716674805, 1.413285732269287, 1.9354476928710938, 2.4576096534729004, 2.979771614074707, 3.5019335746765137, 4.02409553527832, 4.546257495880127, 5.068419456481934, 5.59058141708374, 6.112743377685547, 6.6349053382873535, 7.15706729888916, 7.679229259490967, 8.201391220092773, 8.723552703857422, 9.245715141296387, 9.767877578735352, 10.2900390625, 10.812200546264648, 11.334362983703613, 11.856525421142578, 12.378686904907227, 12.900848388671875, 13.42301082611084, 13.945173263549805, 14.467334747314453, 14.989496231079102, 15.511658668518066, 16.03382110595703, 16.55598258972168]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 17.0, 27.0, 34.0, 70.0, 90.0, 143.0, 204.0, 286.0, 495.0, 766.0, 1129.0, 1651.0, 2731.0, 4353.0, 6848.0, 10828.0, 17083.0, 26636.0, 40408.0, 59362.0, 82861.0, 108603.0, 127139.0, 132023.0, 119024.0, 95661.0, 70375.0, 48608.0, 32795.0, 21211.0, 13530.0, 8719.0, 5390.0, 3440.0, 2140.0, 1367.0, 912.0, 503.0, 373.0, 243.0, 139.0, 109.0, 66.0, 55.0, 35.0, 17.0, 15.0, 9.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.859375, -10.5225830078125, -10.185791015625, -9.8489990234375, -9.51220703125, -9.1754150390625, -8.838623046875, -8.5018310546875, -8.1650390625, -7.8282470703125, -7.491455078125, -7.1546630859375, -6.81787109375, -6.4810791015625, -6.144287109375, -5.8074951171875, -5.470703125, -5.1339111328125, -4.797119140625, -4.4603271484375, -4.12353515625, -3.7867431640625, -3.449951171875, -3.1131591796875, -2.7763671875, -2.4395751953125, -2.102783203125, -1.7659912109375, -1.42919921875, -1.0924072265625, -0.755615234375, -0.4188232421875, -0.08203125, 0.2547607421875, 0.591552734375, 0.9283447265625, 1.26513671875, 1.6019287109375, 1.938720703125, 2.2755126953125, 2.6123046875, 2.9490966796875, 3.285888671875, 3.6226806640625, 3.95947265625, 4.2962646484375, 4.633056640625, 4.9698486328125, 5.306640625, 5.6434326171875, 5.980224609375, 6.3170166015625, 6.65380859375, 6.9906005859375, 7.327392578125, 7.6641845703125, 8.0009765625, 8.3377685546875, 8.674560546875, 9.0113525390625, 9.34814453125, 9.6849365234375, 10.021728515625, 10.3585205078125, 10.6953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 8.0, 15.0, 19.0, 14.0, 25.0, 25.0, 30.0, 33.0, 47.0, 35.0, 40.0, 47.0, 57.0, 42.0, 41.0, 51.0, 53.0, 51.0, 41.0, 31.0, 34.0, 38.0, 31.0, 24.0, 23.0, 23.0, 12.0, 17.0, 25.0, 14.0, 13.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.90625, -21.2646484375, -20.623046875, -19.9814453125, -19.33984375, -18.6982421875, -18.056640625, -17.4150390625, -16.7734375, -16.1318359375, -15.490234375, -14.8486328125, -14.20703125, -13.5654296875, -12.923828125, -12.2822265625, -11.640625, -10.9990234375, -10.357421875, -9.7158203125, -9.07421875, -8.4326171875, -7.791015625, -7.1494140625, -6.5078125, -5.8662109375, -5.224609375, -4.5830078125, -3.94140625, -3.2998046875, -2.658203125, -2.0166015625, -1.375, -0.7333984375, -0.091796875, 0.5498046875, 1.19140625, 1.8330078125, 2.474609375, 3.1162109375, 3.7578125, 4.3994140625, 5.041015625, 5.6826171875, 6.32421875, 6.9658203125, 7.607421875, 8.2490234375, 8.890625, 9.5322265625, 10.173828125, 10.8154296875, 11.45703125, 12.0986328125, 12.740234375, 13.3818359375, 14.0234375, 14.6650390625, 15.306640625, 15.9482421875, 16.58984375, 17.2314453125, 17.873046875, 18.5146484375, 19.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 11.0, 8.0, 11.0, 27.0, 30.0, 33.0, 67.0, 102.0, 125.0, 183.0, 359.0, 508.0, 838.0, 1309.0, 2201.0, 3696.0, 6457.0, 11832.0, 21036.0, 40246.0, 74590.0, 133764.0, 203508.0, 213516.0, 148264.0, 85358.0, 45419.0, 23958.0, 13077.0, 7462.0, 4083.0, 2455.0, 1484.0, 885.0, 594.0, 352.0, 223.0, 140.0, 127.0, 69.0, 50.0, 26.0, 20.0, 17.0, 13.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.359375, -18.75634765625, -18.1533203125, -17.55029296875, -16.947265625, -16.34423828125, -15.7412109375, -15.13818359375, -14.53515625, -13.93212890625, -13.3291015625, -12.72607421875, -12.123046875, -11.52001953125, -10.9169921875, -10.31396484375, -9.7109375, -9.10791015625, -8.5048828125, -7.90185546875, -7.298828125, -6.69580078125, -6.0927734375, -5.48974609375, -4.88671875, -4.28369140625, -3.6806640625, -3.07763671875, -2.474609375, -1.87158203125, -1.2685546875, -0.66552734375, -0.0625, 0.54052734375, 1.1435546875, 1.74658203125, 2.349609375, 2.95263671875, 3.5556640625, 4.15869140625, 4.76171875, 5.36474609375, 5.9677734375, 6.57080078125, 7.173828125, 7.77685546875, 8.3798828125, 8.98291015625, 9.5859375, 10.18896484375, 10.7919921875, 11.39501953125, 11.998046875, 12.60107421875, 13.2041015625, 13.80712890625, 14.41015625, 15.01318359375, 15.6162109375, 16.21923828125, 16.822265625, 17.42529296875, 18.0283203125, 18.63134765625, 19.234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 11.0, 8.0, 12.0, 12.0, 12.0, 16.0, 19.0, 18.0, 26.0, 37.0, 26.0, 36.0, 37.0, 32.0, 32.0, 38.0, 44.0, 46.0, 36.0, 35.0, 37.0, 43.0, 41.0, 31.0, 33.0, 30.0, 27.0, 25.0, 37.0, 26.0, 25.0, 16.0, 15.0, 16.0, 9.0, 12.0, 15.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-10.5, -10.195068359375, -9.89013671875, -9.585205078125, -9.2802734375, -8.975341796875, -8.67041015625, -8.365478515625, -8.060546875, -7.755615234375, -7.45068359375, -7.145751953125, -6.8408203125, -6.535888671875, -6.23095703125, -5.926025390625, -5.62109375, -5.316162109375, -5.01123046875, -4.706298828125, -4.4013671875, -4.096435546875, -3.79150390625, -3.486572265625, -3.181640625, -2.876708984375, -2.57177734375, -2.266845703125, -1.9619140625, -1.656982421875, -1.35205078125, -1.047119140625, -0.7421875, -0.437255859375, -0.13232421875, 0.172607421875, 0.4775390625, 0.782470703125, 1.08740234375, 1.392333984375, 1.697265625, 2.002197265625, 2.30712890625, 2.612060546875, 2.9169921875, 3.221923828125, 3.52685546875, 3.831787109375, 4.13671875, 4.441650390625, 4.74658203125, 5.051513671875, 5.3564453125, 5.661376953125, 5.96630859375, 6.271240234375, 6.576171875, 6.881103515625, 7.18603515625, 7.490966796875, 7.7958984375, 8.100830078125, 8.40576171875, 8.710693359375, 9.015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 17.0, 22.0, 30.0, 51.0, 79.0, 98.0, 159.0, 268.0, 439.0, 648.0, 1021.0, 1663.0, 2650.0, 4393.0, 7453.0, 13238.0, 23613.0, 43280.0, 78814.0, 140225.0, 210374.0, 208467.0, 137406.0, 77168.0, 42326.0, 22696.0, 13029.0, 7406.0, 4418.0, 2582.0, 1605.0, 994.0, 643.0, 419.0, 280.0, 189.0, 135.0, 74.0, 55.0, 41.0, 22.0, 19.0, 20.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0, -10.66650390625, -10.3330078125, -9.99951171875, -9.666015625, -9.33251953125, -8.9990234375, -8.66552734375, -8.33203125, -7.99853515625, -7.6650390625, -7.33154296875, -6.998046875, -6.66455078125, -6.3310546875, -5.99755859375, -5.6640625, -5.33056640625, -4.9970703125, -4.66357421875, -4.330078125, -3.99658203125, -3.6630859375, -3.32958984375, -2.99609375, -2.66259765625, -2.3291015625, -1.99560546875, -1.662109375, -1.32861328125, -0.9951171875, -0.66162109375, -0.328125, 0.00537109375, 0.3388671875, 0.67236328125, 1.005859375, 1.33935546875, 1.6728515625, 2.00634765625, 2.33984375, 2.67333984375, 3.0068359375, 3.34033203125, 3.673828125, 4.00732421875, 4.3408203125, 4.67431640625, 5.0078125, 5.34130859375, 5.6748046875, 6.00830078125, 6.341796875, 6.67529296875, 7.0087890625, 7.34228515625, 7.67578125, 8.00927734375, 8.3427734375, 8.67626953125, 9.009765625, 9.34326171875, 9.6767578125, 10.01025390625, 10.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 10.0, 7.0, 11.0, 14.0, 12.0, 18.0, 17.0, 24.0, 29.0, 32.0, 45.0, 37.0, 62.0, 56.0, 55.0, 56.0, 52.0, 57.0, 35.0, 56.0, 43.0, 34.0, 38.0, 40.0, 32.0, 27.0, 18.0, 18.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0004820823669433594, -0.00046910718083381653, -0.0004561319947242737, -0.00044315680861473083, -0.000430181622505188, -0.00041720643639564514, -0.0004042312502861023, -0.00039125606417655945, -0.0003782808780670166, -0.00036530569195747375, -0.0003523305058479309, -0.00033935531973838806, -0.0003263801336288452, -0.00031340494751930237, -0.0003004297614097595, -0.0002874545753002167, -0.00027447938919067383, -0.000261504203081131, -0.00024852901697158813, -0.0002355538308620453, -0.00022257864475250244, -0.0002096034586429596, -0.00019662827253341675, -0.0001836530864238739, -0.00017067790031433105, -0.0001577027142047882, -0.00014472752809524536, -0.00013175234198570251, -0.00011877715587615967, -0.00010580196976661682, -9.282678365707397e-05, -7.985159754753113e-05, -6.687641143798828e-05, -5.3901225328445435e-05, -4.092603921890259e-05, -2.795085310935974e-05, -1.4975666999816895e-05, -2.000480890274048e-06, 1.0974705219268799e-05, 2.3949891328811646e-05, 3.692507743835449e-05, 4.990026354789734e-05, 6.287544965744019e-05, 7.585063576698303e-05, 8.882582187652588e-05, 0.00010180100798606873, 0.00011477619409561157, 0.00012775138020515442, 0.00014072656631469727, 0.0001537017524242401, 0.00016667693853378296, 0.0001796521246433258, 0.00019262731075286865, 0.0002056024968624115, 0.00021857768297195435, 0.0002315528690814972, 0.00024452805519104004, 0.0002575032413005829, 0.00027047842741012573, 0.0002834536135196686, 0.0002964287996292114, 0.00030940398573875427, 0.0003223791718482971, 0.00033535435795783997, 0.0003483295440673828]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 13.0, 26.0, 25.0, 45.0, 81.0, 111.0, 191.0, 231.0, 362.0, 568.0, 844.0, 1279.0, 1934.0, 3078.0, 4364.0, 6812.0, 10313.0, 15740.0, 25034.0, 37716.0, 56820.0, 82909.0, 112185.0, 135559.0, 140732.0, 122699.0, 94344.0, 65945.0, 44368.0, 29538.0, 18731.0, 12305.0, 8075.0, 5330.0, 3426.0, 2254.0, 1516.0, 1065.0, 684.0, 432.0, 282.0, 194.0, 129.0, 91.0, 61.0, 41.0, 29.0, 14.0, 13.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.3125, -8.0543212890625, -7.796142578125, -7.5379638671875, -7.27978515625, -7.0216064453125, -6.763427734375, -6.5052490234375, -6.2470703125, -5.9888916015625, -5.730712890625, -5.4725341796875, -5.21435546875, -4.9561767578125, -4.697998046875, -4.4398193359375, -4.181640625, -3.9234619140625, -3.665283203125, -3.4071044921875, -3.14892578125, -2.8907470703125, -2.632568359375, -2.3743896484375, -2.1162109375, -1.8580322265625, -1.599853515625, -1.3416748046875, -1.08349609375, -0.8253173828125, -0.567138671875, -0.3089599609375, -0.05078125, 0.2073974609375, 0.465576171875, 0.7237548828125, 0.98193359375, 1.2401123046875, 1.498291015625, 1.7564697265625, 2.0146484375, 2.2728271484375, 2.531005859375, 2.7891845703125, 3.04736328125, 3.3055419921875, 3.563720703125, 3.8218994140625, 4.080078125, 4.3382568359375, 4.596435546875, 4.8546142578125, 5.11279296875, 5.3709716796875, 5.629150390625, 5.8873291015625, 6.1455078125, 6.4036865234375, 6.661865234375, 6.9200439453125, 7.17822265625, 7.4364013671875, 7.694580078125, 7.9527587890625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 10.0, 9.0, 8.0, 12.0, 12.0, 17.0, 19.0, 19.0, 30.0, 21.0, 40.0, 43.0, 38.0, 36.0, 52.0, 54.0, 38.0, 49.0, 49.0, 47.0, 46.0, 48.0, 35.0, 37.0, 35.0, 24.0, 27.0, 23.0, 16.0, 23.0, 13.0, 10.0, 6.0, 10.0, 2.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.595703125, -2.512664794921875, -2.42962646484375, -2.346588134765625, -2.2635498046875, -2.180511474609375, -2.09747314453125, -2.014434814453125, -1.931396484375, -1.848358154296875, -1.76531982421875, -1.682281494140625, -1.5992431640625, -1.516204833984375, -1.43316650390625, -1.350128173828125, -1.26708984375, -1.184051513671875, -1.10101318359375, -1.017974853515625, -0.9349365234375, -0.851898193359375, -0.76885986328125, -0.685821533203125, -0.602783203125, -0.519744873046875, -0.43670654296875, -0.353668212890625, -0.2706298828125, -0.187591552734375, -0.10455322265625, -0.021514892578125, 0.0615234375, 0.144561767578125, 0.22760009765625, 0.310638427734375, 0.3936767578125, 0.476715087890625, 0.55975341796875, 0.642791748046875, 0.725830078125, 0.808868408203125, 0.89190673828125, 0.974945068359375, 1.0579833984375, 1.141021728515625, 1.22406005859375, 1.307098388671875, 1.39013671875, 1.473175048828125, 1.55621337890625, 1.639251708984375, 1.7222900390625, 1.805328369140625, 1.88836669921875, 1.971405029296875, 2.054443359375, 2.137481689453125, 2.22052001953125, 2.303558349609375, 2.3865966796875, 2.469635009765625, 2.55267333984375, 2.635711669921875, 2.71875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 4.0, 8.0, 11.0, 12.0, 20.0, 26.0, 28.0, 28.0, 34.0, 57.0, 63.0, 52.0, 76.0, 61.0, 62.0, 70.0, 64.0, 54.0, 60.0, 43.0, 30.0, 36.0, 21.0, 18.0, 14.0, 10.0, 10.0, 8.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.695209503173828, -23.747371673583984, -22.79953384399414, -21.851696014404297, -20.903858184814453, -19.95602035522461, -19.008182525634766, -18.060344696044922, -17.112506866455078, -16.164669036865234, -15.21683120727539, -14.268993377685547, -13.321155548095703, -12.37331771850586, -11.425479888916016, -10.477642059326172, -9.529803276062012, -8.581965446472168, -7.634127616882324, -6.6862897872924805, -5.738451957702637, -4.790613651275635, -3.842775821685791, -2.8949379920959473, -1.9471001625061035, -0.999262273311615, -0.051424384117126465, 0.8964135646820068, 1.8442513942718506, 2.7920894622802734, 3.739927291870117, 4.687765121459961, 5.635602951049805, 6.583440780639648, 7.531278610229492, 8.479116439819336, 9.42695426940918, 10.374792098999023, 11.322629928588867, 12.270467758178711, 13.218305587768555, 14.166143417358398, 15.113981246948242, 16.061819076538086, 17.00965690612793, 17.957494735717773, 18.905332565307617, 19.85317039489746, 20.801010131835938, 21.74884796142578, 22.696685791015625, 23.64452362060547, 24.592361450195312, 25.540199279785156, 26.488037109375, 27.435874938964844, 28.383712768554688, 29.33155059814453, 30.279388427734375, 31.22722625732422, 32.17506408691406, 33.122901916503906, 34.07073974609375, 35.018577575683594, 35.96641540527344]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 9.0, 13.0, 11.0, 15.0, 11.0, 21.0, 19.0, 21.0, 31.0, 31.0, 32.0, 33.0, 50.0, 34.0, 43.0, 39.0, 51.0, 41.0, 49.0, 42.0, 39.0, 28.0, 34.0, 33.0, 21.0, 21.0, 20.0, 24.0, 27.0, 23.0, 23.0, 23.0, 14.0, 15.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.635669708251953, -16.127405166625977, -15.619141578674316, -15.11087703704834, -14.60261344909668, -14.094348907470703, -13.586084365844727, -13.07781982421875, -12.56955623626709, -12.061291694641113, -11.553028106689453, -11.044763565063477, -10.5364990234375, -10.02823543548584, -9.519970893859863, -9.011707305908203, -8.503442764282227, -7.995178699493408, -7.48691463470459, -6.978650093078613, -6.470386028289795, -5.962121963500977, -5.453857421875, -4.945593357086182, -4.437329292297363, -3.929065227508545, -3.4208009243011475, -2.91253662109375, -2.4042725563049316, -1.8960084915161133, -1.3877441883087158, -0.8794798851013184, -0.3712167739868164, 0.1370474100112915, 0.6453115940093994, 1.1535757780075073, 1.6618399620056152, 2.1701040267944336, 2.678368330001831, 3.1866326332092285, 3.694896697998047, 4.203160762786865, 4.711424827575684, 5.21968936920166, 5.7279534339904785, 6.236217498779297, 6.744482040405273, 7.252746105194092, 7.76101016998291, 8.269274711608887, 8.777538299560547, 9.285802841186523, 9.7940673828125, 10.30233097076416, 10.810595512390137, 11.318859100341797, 11.827123641967773, 12.33538818359375, 12.84365177154541, 13.351916313171387, 13.860179901123047, 14.368444442749023, 14.876708984375, 15.384973526000977, 15.893237113952637]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 18.0, 27.0, 49.0, 85.0, 153.0, 199.0, 286.0, 430.0, 715.0, 1148.0, 1829.0, 3014.0, 4797.0, 7595.0, 11806.0, 18695.0, 28795.0, 43623.0, 63515.0, 86814.0, 111006.0, 126479.0, 128356.0, 114977.0, 92019.0, 67648.0, 47218.0, 31150.0, 20398.0, 13234.0, 8295.0, 5219.0, 3223.0, 2176.0, 1289.0, 832.0, 506.0, 327.0, 195.0, 147.0, 97.0, 56.0, 28.0, 21.0, 19.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-15.5234375, -15.0682373046875, -14.613037109375, -14.1578369140625, -13.70263671875, -13.2474365234375, -12.792236328125, -12.3370361328125, -11.8818359375, -11.4266357421875, -10.971435546875, -10.5162353515625, -10.06103515625, -9.6058349609375, -9.150634765625, -8.6954345703125, -8.240234375, -7.7850341796875, -7.329833984375, -6.8746337890625, -6.41943359375, -5.9642333984375, -5.509033203125, -5.0538330078125, -4.5986328125, -4.1434326171875, -3.688232421875, -3.2330322265625, -2.77783203125, -2.3226318359375, -1.867431640625, -1.4122314453125, -0.95703125, -0.5018310546875, -0.046630859375, 0.4085693359375, 0.86376953125, 1.3189697265625, 1.774169921875, 2.2293701171875, 2.6845703125, 3.1397705078125, 3.594970703125, 4.0501708984375, 4.50537109375, 4.9605712890625, 5.415771484375, 5.8709716796875, 6.326171875, 6.7813720703125, 7.236572265625, 7.6917724609375, 8.14697265625, 8.6021728515625, 9.057373046875, 9.5125732421875, 9.9677734375, 10.4229736328125, 10.878173828125, 11.3333740234375, 11.78857421875, 12.2437744140625, 12.698974609375, 13.1541748046875, 13.609375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 13.0, 8.0, 13.0, 15.0, 18.0, 23.0, 20.0, 29.0, 49.0, 38.0, 29.0, 47.0, 47.0, 51.0, 43.0, 40.0, 47.0, 39.0, 41.0, 34.0, 34.0, 48.0, 29.0, 36.0, 28.0, 30.0, 23.0, 22.0, 14.0, 14.0, 9.0, 8.0, 10.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.0625, -17.471435546875, -16.88037109375, -16.289306640625, -15.6982421875, -15.107177734375, -14.51611328125, -13.925048828125, -13.333984375, -12.742919921875, -12.15185546875, -11.560791015625, -10.9697265625, -10.378662109375, -9.78759765625, -9.196533203125, -8.60546875, -8.014404296875, -7.42333984375, -6.832275390625, -6.2412109375, -5.650146484375, -5.05908203125, -4.468017578125, -3.876953125, -3.285888671875, -2.69482421875, -2.103759765625, -1.5126953125, -0.921630859375, -0.33056640625, 0.260498046875, 0.8515625, 1.442626953125, 2.03369140625, 2.624755859375, 3.2158203125, 3.806884765625, 4.39794921875, 4.989013671875, 5.580078125, 6.171142578125, 6.76220703125, 7.353271484375, 7.9443359375, 8.535400390625, 9.12646484375, 9.717529296875, 10.30859375, 10.899658203125, 11.49072265625, 12.081787109375, 12.6728515625, 13.263916015625, 13.85498046875, 14.446044921875, 15.037109375, 15.628173828125, 16.21923828125, 16.810302734375, 17.4013671875, 17.992431640625, 18.58349609375, 19.174560546875, 19.765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 17.0, 13.0, 28.0, 54.0, 85.0, 134.0, 182.0, 303.0, 454.0, 668.0, 1161.0, 1775.0, 2617.0, 4319.0, 6726.0, 10388.0, 16219.0, 24589.0, 37115.0, 53781.0, 74780.0, 96389.0, 114943.0, 124073.0, 118559.0, 101358.0, 79891.0, 58806.0, 40870.0, 27500.0, 18329.0, 11803.0, 7417.0, 4834.0, 3027.0, 1919.0, 1193.0, 818.0, 514.0, 336.0, 210.0, 130.0, 75.0, 59.0, 31.0, 25.0, 14.0, 7.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.6328125, -14.184326171875, -13.73583984375, -13.287353515625, -12.8388671875, -12.390380859375, -11.94189453125, -11.493408203125, -11.044921875, -10.596435546875, -10.14794921875, -9.699462890625, -9.2509765625, -8.802490234375, -8.35400390625, -7.905517578125, -7.45703125, -7.008544921875, -6.56005859375, -6.111572265625, -5.6630859375, -5.214599609375, -4.76611328125, -4.317626953125, -3.869140625, -3.420654296875, -2.97216796875, -2.523681640625, -2.0751953125, -1.626708984375, -1.17822265625, -0.729736328125, -0.28125, 0.167236328125, 0.61572265625, 1.064208984375, 1.5126953125, 1.961181640625, 2.40966796875, 2.858154296875, 3.306640625, 3.755126953125, 4.20361328125, 4.652099609375, 5.1005859375, 5.549072265625, 5.99755859375, 6.446044921875, 6.89453125, 7.343017578125, 7.79150390625, 8.239990234375, 8.6884765625, 9.136962890625, 9.58544921875, 10.033935546875, 10.482421875, 10.930908203125, 11.37939453125, 11.827880859375, 12.2763671875, 12.724853515625, 13.17333984375, 13.621826171875, 14.0703125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 9.0, 2.0, 6.0, 6.0, 5.0, 4.0, 9.0, 12.0, 23.0, 24.0, 22.0, 23.0, 32.0, 21.0, 35.0, 32.0, 36.0, 34.0, 49.0, 49.0, 37.0, 46.0, 50.0, 29.0, 38.0, 37.0, 31.0, 16.0, 38.0, 34.0, 34.0, 28.0, 22.0, 22.0, 24.0, 16.0, 19.0, 11.0, 8.0, 5.0, 6.0, 8.0, 2.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.7822265625, -8.431640625, -8.0810546875, -7.73046875, -7.3798828125, -7.029296875, -6.6787109375, -6.328125, -5.9775390625, -5.626953125, -5.2763671875, -4.92578125, -4.5751953125, -4.224609375, -3.8740234375, -3.5234375, -3.1728515625, -2.822265625, -2.4716796875, -2.12109375, -1.7705078125, -1.419921875, -1.0693359375, -0.71875, -0.3681640625, -0.017578125, 0.3330078125, 0.68359375, 1.0341796875, 1.384765625, 1.7353515625, 2.0859375, 2.4365234375, 2.787109375, 3.1376953125, 3.48828125, 3.8388671875, 4.189453125, 4.5400390625, 4.890625, 5.2412109375, 5.591796875, 5.9423828125, 6.29296875, 6.6435546875, 6.994140625, 7.3447265625, 7.6953125, 8.0458984375, 8.396484375, 8.7470703125, 9.09765625, 9.4482421875, 9.798828125, 10.1494140625, 10.5, 10.8505859375, 11.201171875, 11.5517578125, 11.90234375, 12.2529296875, 12.603515625, 12.9541015625, 13.3046875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 6.0, 12.0, 10.0, 21.0, 24.0, 49.0, 59.0, 76.0, 129.0, 196.0, 277.0, 397.0, 710.0, 1136.0, 1761.0, 3056.0, 5278.0, 9286.0, 17232.0, 32105.0, 59815.0, 103925.0, 158256.0, 192492.0, 174621.0, 123906.0, 73664.0, 40363.0, 21854.0, 11657.0, 6584.0, 3730.0, 2178.0, 1342.0, 809.0, 518.0, 328.0, 230.0, 135.0, 105.0, 71.0, 44.0, 33.0, 23.0, 19.0, 13.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0], "bins": [-12.21875, -11.8763427734375, -11.533935546875, -11.1915283203125, -10.84912109375, -10.5067138671875, -10.164306640625, -9.8218994140625, -9.4794921875, -9.1370849609375, -8.794677734375, -8.4522705078125, -8.10986328125, -7.7674560546875, -7.425048828125, -7.0826416015625, -6.740234375, -6.3978271484375, -6.055419921875, -5.7130126953125, -5.37060546875, -5.0281982421875, -4.685791015625, -4.3433837890625, -4.0009765625, -3.6585693359375, -3.316162109375, -2.9737548828125, -2.63134765625, -2.2889404296875, -1.946533203125, -1.6041259765625, -1.26171875, -0.9193115234375, -0.576904296875, -0.2344970703125, 0.10791015625, 0.4503173828125, 0.792724609375, 1.1351318359375, 1.4775390625, 1.8199462890625, 2.162353515625, 2.5047607421875, 2.84716796875, 3.1895751953125, 3.531982421875, 3.8743896484375, 4.216796875, 4.5592041015625, 4.901611328125, 5.2440185546875, 5.58642578125, 5.9288330078125, 6.271240234375, 6.6136474609375, 6.9560546875, 7.2984619140625, 7.640869140625, 7.9832763671875, 8.32568359375, 8.6680908203125, 9.010498046875, 9.3529052734375, 9.6953125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 2.0, 4.0, 9.0, 5.0, 5.0, 13.0, 6.0, 13.0, 18.0, 23.0, 15.0, 22.0, 36.0, 23.0, 32.0, 36.0, 48.0, 54.0, 50.0, 43.0, 40.0, 47.0, 47.0, 43.0, 45.0, 34.0, 35.0, 34.0, 27.0, 32.0, 27.0, 23.0, 17.0, 15.0, 10.0, 11.0, 7.0, 6.0, 9.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007491111755371094, -0.0007250681519508362, -0.000701025128364563, -0.0006769821047782898, -0.0006529390811920166, -0.0006288960576057434, -0.0006048530340194702, -0.000580810010433197, -0.0005567669868469238, -0.0005327239632606506, -0.0005086809396743774, -0.00048463791608810425, -0.00046059489250183105, -0.00043655186891555786, -0.00041250884532928467, -0.0003884658217430115, -0.0003644227981567383, -0.0003403797745704651, -0.0003163367509841919, -0.0002922937273979187, -0.0002682507038116455, -0.0002442076802253723, -0.00022016465663909912, -0.00019612163305282593, -0.00017207860946655273, -0.00014803558588027954, -0.00012399256229400635, -9.994953870773315e-05, -7.590651512145996e-05, -5.186349153518677e-05, -2.7820467948913574e-05, -3.777444362640381e-06, 2.0265579223632812e-05, 4.4308602809906006e-05, 6.83516263961792e-05, 9.239464998245239e-05, 0.00011643767356872559, 0.00014048069715499878, 0.00016452372074127197, 0.00018856674432754517, 0.00021260976791381836, 0.00023665279150009155, 0.00026069581508636475, 0.00028473883867263794, 0.00030878186225891113, 0.0003328248858451843, 0.0003568679094314575, 0.0003809109330177307, 0.0004049539566040039, 0.0004289969801902771, 0.0004530400037765503, 0.0004770830273628235, 0.0005011260509490967, 0.0005251690745353699, 0.0005492120981216431, 0.0005732551217079163, 0.0005972981452941895, 0.0006213411688804626, 0.0006453841924667358, 0.000669427216053009, 0.0006934702396392822, 0.0007175132632255554, 0.0007415562868118286, 0.0007655993103981018, 0.000789642333984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 21.0, 28.0, 28.0, 39.0, 70.0, 120.0, 146.0, 269.0, 422.0, 737.0, 1266.0, 2592.0, 5940.0, 15599.0, 43730.0, 122001.0, 261405.0, 306287.0, 177899.0, 69271.0, 24065.0, 8879.0, 3637.0, 1714.0, 924.0, 509.0, 319.0, 206.0, 137.0, 82.0, 56.0, 40.0, 26.0, 25.0, 16.0, 8.0, 9.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.38916015625, -16.7939453125, -16.19873046875, -15.603515625, -15.00830078125, -14.4130859375, -13.81787109375, -13.22265625, -12.62744140625, -12.0322265625, -11.43701171875, -10.841796875, -10.24658203125, -9.6513671875, -9.05615234375, -8.4609375, -7.86572265625, -7.2705078125, -6.67529296875, -6.080078125, -5.48486328125, -4.8896484375, -4.29443359375, -3.69921875, -3.10400390625, -2.5087890625, -1.91357421875, -1.318359375, -0.72314453125, -0.1279296875, 0.46728515625, 1.0625, 1.65771484375, 2.2529296875, 2.84814453125, 3.443359375, 4.03857421875, 4.6337890625, 5.22900390625, 5.82421875, 6.41943359375, 7.0146484375, 7.60986328125, 8.205078125, 8.80029296875, 9.3955078125, 9.99072265625, 10.5859375, 11.18115234375, 11.7763671875, 12.37158203125, 12.966796875, 13.56201171875, 14.1572265625, 14.75244140625, 15.34765625, 15.94287109375, 16.5380859375, 17.13330078125, 17.728515625, 18.32373046875, 18.9189453125, 19.51416015625, 20.109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 19.0, 15.0, 31.0, 27.0, 39.0, 43.0, 60.0, 59.0, 50.0, 68.0, 72.0, 62.0, 69.0, 45.0, 56.0, 49.0, 28.0, 26.0, 35.0, 28.0, 22.0, 16.0, 12.0, 6.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.78173828125, -3.6572265625, -3.53271484375, -3.408203125, -3.28369140625, -3.1591796875, -3.03466796875, -2.91015625, -2.78564453125, -2.6611328125, -2.53662109375, -2.412109375, -2.28759765625, -2.1630859375, -2.03857421875, -1.9140625, -1.78955078125, -1.6650390625, -1.54052734375, -1.416015625, -1.29150390625, -1.1669921875, -1.04248046875, -0.91796875, -0.79345703125, -0.6689453125, -0.54443359375, -0.419921875, -0.29541015625, -0.1708984375, -0.04638671875, 0.078125, 0.20263671875, 0.3271484375, 0.45166015625, 0.576171875, 0.70068359375, 0.8251953125, 0.94970703125, 1.07421875, 1.19873046875, 1.3232421875, 1.44775390625, 1.572265625, 1.69677734375, 1.8212890625, 1.94580078125, 2.0703125, 2.19482421875, 2.3193359375, 2.44384765625, 2.568359375, 2.69287109375, 2.8173828125, 2.94189453125, 3.06640625, 3.19091796875, 3.3154296875, 3.43994140625, 3.564453125, 3.68896484375, 3.8134765625, 3.93798828125, 4.0625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 8.0, 7.0, 16.0, 9.0, 11.0, 20.0, 22.0, 32.0, 38.0, 40.0, 51.0, 61.0, 70.0, 69.0, 62.0, 66.0, 67.0, 50.0, 51.0, 61.0, 36.0, 33.0, 33.0, 20.0, 16.0, 10.0, 14.0, 7.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.203081130981445, -23.262569427490234, -22.322057723999023, -21.381546020507812, -20.4410343170166, -19.50052261352539, -18.560012817382812, -17.61949920654297, -16.67898941040039, -15.73847770690918, -14.797966003417969, -13.857454299926758, -12.916942596435547, -11.976430892944336, -11.035920143127441, -10.09540843963623, -9.154895782470703, -8.214384078979492, -7.273872375488281, -6.3333611488342285, -5.392849445343018, -4.452337741851807, -3.511826515197754, -2.571314811706543, -1.630803108215332, -0.6902915239334106, 0.25022006034851074, 1.1907315254211426, 2.1312432289123535, 3.0717549324035645, 4.012266159057617, 4.952777862548828, 5.893291473388672, 6.833803176879883, 7.774314880371094, 8.714826583862305, 9.655338287353516, 10.595849990844727, 11.536360740661621, 12.476872444152832, 13.417384147644043, 14.357895851135254, 15.298407554626465, 16.23891830444336, 17.17943000793457, 18.11994171142578, 19.060453414916992, 20.000965118408203, 20.941476821899414, 21.881988525390625, 22.822500228881836, 23.763011932373047, 24.703523635864258, 25.64403533935547, 26.584545135498047, 27.52505874633789, 28.46556854248047, 29.40608024597168, 30.34659194946289, 31.2871036529541, 32.22761535644531, 33.16812515258789, 34.108638763427734, 35.04914855957031, 35.989662170410156]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 8.0, 5.0, 11.0, 10.0, 14.0, 9.0, 19.0, 18.0, 21.0, 23.0, 28.0, 32.0, 26.0, 38.0, 42.0, 36.0, 40.0, 42.0, 42.0, 40.0, 38.0, 40.0, 43.0, 49.0, 33.0, 33.0, 38.0, 27.0, 18.0, 28.0, 22.0, 18.0, 13.0, 18.0, 8.0, 9.0, 7.0, 12.0, 9.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-17.0711669921875, -16.55986213684082, -16.048559188842773, -15.53725528717041, -15.025951385498047, -14.514646530151367, -14.003342628479004, -13.49203872680664, -12.980734825134277, -12.469430923461914, -11.95812702178955, -11.446823120117188, -10.935518264770508, -10.424215316772461, -9.912910461425781, -9.401606559753418, -8.890302658081055, -8.378998756408691, -7.867694854736328, -7.356390476226807, -6.845086574554443, -6.33378267288208, -5.822478294372559, -5.311174392700195, -4.799870491027832, -4.288566589355469, -3.7772624492645264, -3.265958309173584, -2.7546544075012207, -2.2433505058288574, -1.732046365737915, -1.2207422256469727, -0.7094402313232422, -0.19813621044158936, 0.3131678104400635, 0.8244718313217163, 1.3357758522033691, 1.8470797538757324, 2.358383893966675, 2.869688034057617, 3.3809919357299805, 3.8922958374023438, 4.403599739074707, 4.9149041175842285, 5.426208019256592, 5.937511920928955, 6.448816299438477, 6.96012020111084, 7.471424102783203, 7.982728004455566, 8.49403190612793, 9.005335807800293, 9.516639709472656, 10.027944564819336, 10.5392484664917, 11.050552368164062, 11.561856269836426, 12.073160171508789, 12.584464073181152, 13.095767974853516, 13.607072830200195, 14.118375778198242, 14.629680633544922, 15.140984535217285, 15.652288436889648]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 8.0, 9.0, 7.0, 11.0, 31.0, 44.0, 53.0, 97.0, 140.0, 212.0, 348.0, 537.0, 927.0, 1606.0, 2640.0, 4635.0, 8550.0, 15619.0, 30449.0, 61422.0, 128583.0, 274104.0, 549928.0, 893863.0, 950438.0, 637087.0, 327392.0, 153976.0, 73643.0, 36199.0, 18462.0, 9972.0, 5561.0, 3082.0, 1791.0, 1074.0, 648.0, 387.0, 254.0, 165.0, 123.0, 71.0, 44.0, 31.0, 21.0, 14.0, 12.0, 3.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.90625, -28.97509765625, -28.0439453125, -27.11279296875, -26.181640625, -25.25048828125, -24.3193359375, -23.38818359375, -22.45703125, -21.52587890625, -20.5947265625, -19.66357421875, -18.732421875, -17.80126953125, -16.8701171875, -15.93896484375, -15.0078125, -14.07666015625, -13.1455078125, -12.21435546875, -11.283203125, -10.35205078125, -9.4208984375, -8.48974609375, -7.55859375, -6.62744140625, -5.6962890625, -4.76513671875, -3.833984375, -2.90283203125, -1.9716796875, -1.04052734375, -0.109375, 0.82177734375, 1.7529296875, 2.68408203125, 3.615234375, 4.54638671875, 5.4775390625, 6.40869140625, 7.33984375, 8.27099609375, 9.2021484375, 10.13330078125, 11.064453125, 11.99560546875, 12.9267578125, 13.85791015625, 14.7890625, 15.72021484375, 16.6513671875, 17.58251953125, 18.513671875, 19.44482421875, 20.3759765625, 21.30712890625, 22.23828125, 23.16943359375, 24.1005859375, 25.03173828125, 25.962890625, 26.89404296875, 27.8251953125, 28.75634765625, 29.6875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 10.0, 12.0, 11.0, 20.0, 10.0, 22.0, 23.0, 27.0, 32.0, 30.0, 35.0, 33.0, 43.0, 44.0, 42.0, 51.0, 38.0, 48.0, 45.0, 43.0, 55.0, 43.0, 30.0, 30.0, 30.0, 26.0, 22.0, 21.0, 23.0, 17.0, 8.0, 15.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0], "bins": [-18.03125, -17.537353515625, -17.04345703125, -16.549560546875, -16.0556640625, -15.561767578125, -15.06787109375, -14.573974609375, -14.080078125, -13.586181640625, -13.09228515625, -12.598388671875, -12.1044921875, -11.610595703125, -11.11669921875, -10.622802734375, -10.12890625, -9.635009765625, -9.14111328125, -8.647216796875, -8.1533203125, -7.659423828125, -7.16552734375, -6.671630859375, -6.177734375, -5.683837890625, -5.18994140625, -4.696044921875, -4.2021484375, -3.708251953125, -3.21435546875, -2.720458984375, -2.2265625, -1.732666015625, -1.23876953125, -0.744873046875, -0.2509765625, 0.242919921875, 0.73681640625, 1.230712890625, 1.724609375, 2.218505859375, 2.71240234375, 3.206298828125, 3.7001953125, 4.194091796875, 4.68798828125, 5.181884765625, 5.67578125, 6.169677734375, 6.66357421875, 7.157470703125, 7.6513671875, 8.145263671875, 8.63916015625, 9.133056640625, 9.626953125, 10.120849609375, 10.61474609375, 11.108642578125, 11.6025390625, 12.096435546875, 12.59033203125, 13.084228515625, 13.578125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 4.0, 10.0, 22.0, 38.0, 51.0, 87.0, 117.0, 192.0, 373.0, 578.0, 1061.0, 1982.0, 3758.0, 7386.0, 14883.0, 29579.0, 60667.0, 125907.0, 255598.0, 491933.0, 803007.0, 925365.0, 690466.0, 392592.0, 198412.0, 96609.0, 46935.0, 22980.0, 11403.0, 5664.0, 3023.0, 1580.0, 873.0, 450.0, 251.0, 170.0, 97.0, 67.0, 42.0, 27.0, 13.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5625, -35.43115234375, -34.2998046875, -33.16845703125, -32.037109375, -30.90576171875, -29.7744140625, -28.64306640625, -27.51171875, -26.38037109375, -25.2490234375, -24.11767578125, -22.986328125, -21.85498046875, -20.7236328125, -19.59228515625, -18.4609375, -17.32958984375, -16.1982421875, -15.06689453125, -13.935546875, -12.80419921875, -11.6728515625, -10.54150390625, -9.41015625, -8.27880859375, -7.1474609375, -6.01611328125, -4.884765625, -3.75341796875, -2.6220703125, -1.49072265625, -0.359375, 0.77197265625, 1.9033203125, 3.03466796875, 4.166015625, 5.29736328125, 6.4287109375, 7.56005859375, 8.69140625, 9.82275390625, 10.9541015625, 12.08544921875, 13.216796875, 14.34814453125, 15.4794921875, 16.61083984375, 17.7421875, 18.87353515625, 20.0048828125, 21.13623046875, 22.267578125, 23.39892578125, 24.5302734375, 25.66162109375, 26.79296875, 27.92431640625, 29.0556640625, 30.18701171875, 31.318359375, 32.44970703125, 33.5810546875, 34.71240234375, 35.84375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 28.0, 25.0, 42.0, 51.0, 50.0, 74.0, 100.0, 120.0, 155.0, 186.0, 237.0, 238.0, 272.0, 304.0, 293.0, 310.0, 266.0, 249.0, 243.0, 179.0, 146.0, 118.0, 96.0, 63.0, 57.0, 42.0, 22.0, 22.0, 23.0, 7.0, 5.0, 8.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.33837890625, -10.9736328125, -10.60888671875, -10.244140625, -9.87939453125, -9.5146484375, -9.14990234375, -8.78515625, -8.42041015625, -8.0556640625, -7.69091796875, -7.326171875, -6.96142578125, -6.5966796875, -6.23193359375, -5.8671875, -5.50244140625, -5.1376953125, -4.77294921875, -4.408203125, -4.04345703125, -3.6787109375, -3.31396484375, -2.94921875, -2.58447265625, -2.2197265625, -1.85498046875, -1.490234375, -1.12548828125, -0.7607421875, -0.39599609375, -0.03125, 0.33349609375, 0.6982421875, 1.06298828125, 1.427734375, 1.79248046875, 2.1572265625, 2.52197265625, 2.88671875, 3.25146484375, 3.6162109375, 3.98095703125, 4.345703125, 4.71044921875, 5.0751953125, 5.43994140625, 5.8046875, 6.16943359375, 6.5341796875, 6.89892578125, 7.263671875, 7.62841796875, 7.9931640625, 8.35791015625, 8.72265625, 9.08740234375, 9.4521484375, 9.81689453125, 10.181640625, 10.54638671875, 10.9111328125, 11.27587890625, 11.640625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 13.0, 6.0, 18.0, 20.0, 27.0, 25.0, 27.0, 38.0, 47.0, 46.0, 38.0, 48.0, 55.0, 61.0, 56.0, 49.0, 60.0, 56.0, 38.0, 33.0, 37.0, 26.0, 28.0, 16.0, 14.0, 9.0, 12.0, 20.0, 6.0, 8.0, 5.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.080623626708984, -26.166078567504883, -25.25153350830078, -24.33698844909668, -23.422443389892578, -22.507898330688477, -21.593353271484375, -20.67880630493164, -19.764263153076172, -18.84971809387207, -17.93517303466797, -17.020627975463867, -16.106082916259766, -15.191537857055664, -14.276991844177246, -13.362446784973145, -12.447900772094727, -11.533355712890625, -10.618810653686523, -9.704265594482422, -8.78972053527832, -7.8751749992370605, -6.960629463195801, -6.046084403991699, -5.131539344787598, -4.216994285583496, -3.3024489879608154, -2.3879036903381348, -1.4733586311340332, -0.5588135719299316, 0.3557319641113281, 1.2702770233154297, 2.1848201751708984, 3.099365234375, 4.013910293579102, 4.928455829620361, 5.843000888824463, 6.7575459480285645, 7.672091484069824, 8.586636543273926, 9.501181602478027, 10.415726661682129, 11.33027172088623, 12.244817733764648, 13.15936279296875, 14.073907852172852, 14.988452911376953, 15.902997970581055, 16.817543029785156, 17.732088088989258, 18.64663314819336, 19.56117820739746, 20.475723266601562, 21.390268325805664, 22.304813385009766, 23.2193603515625, 24.13390350341797, 25.04844856262207, 25.962993621826172, 26.877538681030273, 27.792083740234375, 28.706628799438477, 29.621173858642578, 30.535720825195312, 31.450265884399414]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 4.0, 5.0, 6.0, 8.0, 4.0, 10.0, 18.0, 15.0, 20.0, 15.0, 25.0, 32.0, 32.0, 25.0, 28.0, 30.0, 52.0, 45.0, 40.0, 57.0, 48.0, 39.0, 42.0, 40.0, 36.0, 40.0, 31.0, 32.0, 29.0, 34.0, 32.0, 19.0, 20.0, 11.0, 15.0, 10.0, 13.0, 7.0, 7.0, 3.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.500263214111328, -21.853761672973633, -21.207260131835938, -20.560758590698242, -19.914257049560547, -19.26775360107422, -18.621253967285156, -17.974750518798828, -17.328248977661133, -16.681747436523438, -16.035245895385742, -15.388744354248047, -14.742241859436035, -14.09574031829834, -13.449238777160645, -12.802736282348633, -12.156235694885254, -11.509734153747559, -10.863232612609863, -10.216730117797852, -9.570228576660156, -8.923727035522461, -8.277225494384766, -7.630723476409912, -6.984221935272217, -6.3377203941345215, -5.691218376159668, -5.044716835021973, -4.398215293884277, -3.751713275909424, -3.1052117347717285, -2.458709716796875, -1.8122081756591797, -1.1657063961029053, -0.5192047357559204, 0.12729692459106445, 0.7737987041473389, 1.4203004837036133, 2.0668020248413086, 2.713304042816162, 3.3598055839538574, 4.006307125091553, 4.652809143066406, 5.299310684204102, 5.945812225341797, 6.59231424331665, 7.238815784454346, 7.885317802429199, 8.531819343566895, 9.17832088470459, 9.824822425842285, 10.471324920654297, 11.117826461791992, 11.764328002929688, 12.410829544067383, 13.057331085205078, 13.703832626342773, 14.350334167480469, 14.996835708618164, 15.64333724975586, 16.289838790893555, 16.93634033203125, 17.582843780517578, 18.229345321655273, 18.87584686279297]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 15.0, 13.0, 23.0, 34.0, 59.0, 77.0, 124.0, 182.0, 273.0, 487.0, 762.0, 1263.0, 1941.0, 3361.0, 5564.0, 9288.0, 15048.0, 25128.0, 41087.0, 64799.0, 95254.0, 128589.0, 150086.0, 146116.0, 120975.0, 87661.0, 57174.0, 36576.0, 22419.0, 13740.0, 8113.0, 4797.0, 2929.0, 1733.0, 1088.0, 641.0, 387.0, 272.0, 156.0, 105.0, 60.0, 62.0, 32.0, 24.0, 14.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4375, -14.9375, -14.4375, -13.9375, -13.4375, -12.9375, -12.4375, -11.9375, -11.4375, -10.9375, -10.4375, -9.9375, -9.4375, -8.9375, -8.4375, -7.9375, -7.4375, -6.9375, -6.4375, -5.9375, -5.4375, -4.9375, -4.4375, -3.9375, -3.4375, -2.9375, -2.4375, -1.9375, -1.4375, -0.9375, -0.4375, 0.0625, 0.5625, 1.0625, 1.5625, 2.0625, 2.5625, 3.0625, 3.5625, 4.0625, 4.5625, 5.0625, 5.5625, 6.0625, 6.5625, 7.0625, 7.5625, 8.0625, 8.5625, 9.0625, 9.5625, 10.0625, 10.5625, 11.0625, 11.5625, 12.0625, 12.5625, 13.0625, 13.5625, 14.0625, 14.5625, 15.0625, 15.5625, 16.0625, 16.5625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 2.0, 8.0, 7.0, 13.0, 11.0, 15.0, 28.0, 31.0, 20.0, 32.0, 22.0, 35.0, 40.0, 50.0, 55.0, 44.0, 54.0, 52.0, 53.0, 44.0, 45.0, 51.0, 44.0, 34.0, 32.0, 30.0, 28.0, 20.0, 14.0, 13.0, 15.0, 9.0, 8.0, 9.0, 9.0, 5.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5, -25.705810546875, -24.91162109375, -24.117431640625, -23.3232421875, -22.529052734375, -21.73486328125, -20.940673828125, -20.146484375, -19.352294921875, -18.55810546875, -17.763916015625, -16.9697265625, -16.175537109375, -15.38134765625, -14.587158203125, -13.79296875, -12.998779296875, -12.20458984375, -11.410400390625, -10.6162109375, -9.822021484375, -9.02783203125, -8.233642578125, -7.439453125, -6.645263671875, -5.85107421875, -5.056884765625, -4.2626953125, -3.468505859375, -2.67431640625, -1.880126953125, -1.0859375, -0.291748046875, 0.50244140625, 1.296630859375, 2.0908203125, 2.885009765625, 3.67919921875, 4.473388671875, 5.267578125, 6.061767578125, 6.85595703125, 7.650146484375, 8.4443359375, 9.238525390625, 10.03271484375, 10.826904296875, 11.62109375, 12.415283203125, 13.20947265625, 14.003662109375, 14.7978515625, 15.592041015625, 16.38623046875, 17.180419921875, 17.974609375, 18.768798828125, 19.56298828125, 20.357177734375, 21.1513671875, 21.945556640625, 22.73974609375, 23.533935546875, 24.328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 9.0, 15.0, 22.0, 28.0, 53.0, 47.0, 70.0, 99.0, 161.0, 246.0, 447.0, 677.0, 1131.0, 1933.0, 3272.0, 5892.0, 11204.0, 21913.0, 44281.0, 89082.0, 165483.0, 241287.0, 210223.0, 122755.0, 63017.0, 30997.0, 15545.0, 7959.0, 4331.0, 2493.0, 1419.0, 851.0, 538.0, 360.0, 208.0, 146.0, 94.0, 66.0, 42.0, 23.0, 21.0, 23.0, 14.0, 10.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0], "bins": [-27.21875, -26.361328125, -25.50390625, -24.646484375, -23.7890625, -22.931640625, -22.07421875, -21.216796875, -20.359375, -19.501953125, -18.64453125, -17.787109375, -16.9296875, -16.072265625, -15.21484375, -14.357421875, -13.5, -12.642578125, -11.78515625, -10.927734375, -10.0703125, -9.212890625, -8.35546875, -7.498046875, -6.640625, -5.783203125, -4.92578125, -4.068359375, -3.2109375, -2.353515625, -1.49609375, -0.638671875, 0.21875, 1.076171875, 1.93359375, 2.791015625, 3.6484375, 4.505859375, 5.36328125, 6.220703125, 7.078125, 7.935546875, 8.79296875, 9.650390625, 10.5078125, 11.365234375, 12.22265625, 13.080078125, 13.9375, 14.794921875, 15.65234375, 16.509765625, 17.3671875, 18.224609375, 19.08203125, 19.939453125, 20.796875, 21.654296875, 22.51171875, 23.369140625, 24.2265625, 25.083984375, 25.94140625, 26.798828125, 27.65625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 7.0, 4.0, 8.0, 4.0, 13.0, 10.0, 12.0, 13.0, 20.0, 14.0, 18.0, 24.0, 25.0, 22.0, 26.0, 39.0, 32.0, 26.0, 42.0, 33.0, 44.0, 49.0, 36.0, 43.0, 39.0, 34.0, 36.0, 40.0, 34.0, 33.0, 27.0, 24.0, 20.0, 20.0, 21.0, 13.0, 15.0, 18.0, 11.0, 7.0, 9.0, 12.0, 11.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.6953125, -11.3287353515625, -10.962158203125, -10.5955810546875, -10.22900390625, -9.8624267578125, -9.495849609375, -9.1292724609375, -8.7626953125, -8.3961181640625, -8.029541015625, -7.6629638671875, -7.29638671875, -6.9298095703125, -6.563232421875, -6.1966552734375, -5.830078125, -5.4635009765625, -5.096923828125, -4.7303466796875, -4.36376953125, -3.9971923828125, -3.630615234375, -3.2640380859375, -2.8974609375, -2.5308837890625, -2.164306640625, -1.7977294921875, -1.43115234375, -1.0645751953125, -0.697998046875, -0.3314208984375, 0.03515625, 0.4017333984375, 0.768310546875, 1.1348876953125, 1.50146484375, 1.8680419921875, 2.234619140625, 2.6011962890625, 2.9677734375, 3.3343505859375, 3.700927734375, 4.0675048828125, 4.43408203125, 4.8006591796875, 5.167236328125, 5.5338134765625, 5.900390625, 6.2669677734375, 6.633544921875, 7.0001220703125, 7.36669921875, 7.7332763671875, 8.099853515625, 8.4664306640625, 8.8330078125, 9.1995849609375, 9.566162109375, 9.9327392578125, 10.29931640625, 10.6658935546875, 11.032470703125, 11.3990478515625, 11.765625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 16.0, 19.0, 40.0, 56.0, 60.0, 110.0, 149.0, 206.0, 307.0, 438.0, 639.0, 993.0, 1509.0, 2303.0, 3631.0, 5509.0, 9055.0, 15051.0, 25021.0, 42697.0, 72637.0, 119276.0, 175729.0, 193388.0, 147759.0, 93262.0, 55786.0, 32657.0, 18930.0, 11430.0, 7014.0, 4479.0, 2794.0, 1780.0, 1247.0, 790.0, 535.0, 379.0, 263.0, 184.0, 115.0, 82.0, 70.0, 44.0, 19.0, 24.0, 14.0, 14.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0], "bins": [-13.7109375, -13.298583984375, -12.88623046875, -12.473876953125, -12.0615234375, -11.649169921875, -11.23681640625, -10.824462890625, -10.412109375, -9.999755859375, -9.58740234375, -9.175048828125, -8.7626953125, -8.350341796875, -7.93798828125, -7.525634765625, -7.11328125, -6.700927734375, -6.28857421875, -5.876220703125, -5.4638671875, -5.051513671875, -4.63916015625, -4.226806640625, -3.814453125, -3.402099609375, -2.98974609375, -2.577392578125, -2.1650390625, -1.752685546875, -1.34033203125, -0.927978515625, -0.515625, -0.103271484375, 0.30908203125, 0.721435546875, 1.1337890625, 1.546142578125, 1.95849609375, 2.370849609375, 2.783203125, 3.195556640625, 3.60791015625, 4.020263671875, 4.4326171875, 4.844970703125, 5.25732421875, 5.669677734375, 6.08203125, 6.494384765625, 6.90673828125, 7.319091796875, 7.7314453125, 8.143798828125, 8.55615234375, 8.968505859375, 9.380859375, 9.793212890625, 10.20556640625, 10.617919921875, 11.0302734375, 11.442626953125, 11.85498046875, 12.267333984375, 12.6796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 0.0, 10.0, 8.0, 12.0, 6.0, 8.0, 18.0, 18.0, 20.0, 38.0, 24.0, 32.0, 45.0, 36.0, 40.0, 27.0, 43.0, 49.0, 59.0, 52.0, 38.0, 51.0, 47.0, 37.0, 42.0, 28.0, 31.0, 32.0, 20.0, 22.0, 13.0, 20.0, 5.0, 4.0, 7.0, 14.0, 9.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004608631134033203, -0.00044594332575798035, -0.0004310235381126404, -0.0004161037504673004, -0.00040118396282196045, -0.0003862641751766205, -0.0003713443875312805, -0.00035642459988594055, -0.0003415048122406006, -0.0003265850245952606, -0.00031166523694992065, -0.0002967454493045807, -0.0002818256616592407, -0.00026690587401390076, -0.0002519860863685608, -0.00023706629872322083, -0.00022214651107788086, -0.0002072267234325409, -0.00019230693578720093, -0.00017738714814186096, -0.000162467360496521, -0.00014754757285118103, -0.00013262778520584106, -0.0001177079975605011, -0.00010278820991516113, -8.786842226982117e-05, -7.29486346244812e-05, -5.8028846979141235e-05, -4.310905933380127e-05, -2.8189271688461304e-05, -1.3269484043121338e-05, 1.650303602218628e-06, 1.6570091247558594e-05, 3.148987889289856e-05, 4.6409666538238525e-05, 6.132945418357849e-05, 7.624924182891846e-05, 9.116902947425842e-05, 0.00010608881711959839, 0.00012100860476493835, 0.00013592839241027832, 0.00015084818005561829, 0.00016576796770095825, 0.00018068775534629822, 0.00019560754299163818, 0.00021052733063697815, 0.00022544711828231812, 0.00024036690592765808, 0.00025528669357299805, 0.000270206481218338, 0.000285126268863678, 0.00030004605650901794, 0.0003149658441543579, 0.0003298856317996979, 0.00034480541944503784, 0.0003597252070903778, 0.0003746449947357178, 0.00038956478238105774, 0.0004044845700263977, 0.00041940435767173767, 0.00043432414531707764, 0.0004492439329624176, 0.00046416372060775757, 0.00047908350825309753, 0.0004940032958984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 10.0, 22.0, 17.0, 39.0, 60.0, 73.0, 122.0, 167.0, 281.0, 407.0, 646.0, 967.0, 1549.0, 2317.0, 3609.0, 5952.0, 9654.0, 15679.0, 25219.0, 41017.0, 64428.0, 96241.0, 130339.0, 152058.0, 147127.0, 118588.0, 84410.0, 55458.0, 34641.0, 21764.0, 13241.0, 8290.0, 5194.0, 3175.0, 2062.0, 1260.0, 840.0, 544.0, 355.0, 254.0, 151.0, 102.0, 66.0, 42.0, 32.0, 21.0, 18.0, 11.0, 8.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.1796875, -12.765625, -12.3515625, -11.9375, -11.5234375, -11.109375, -10.6953125, -10.28125, -9.8671875, -9.453125, -9.0390625, -8.625, -8.2109375, -7.796875, -7.3828125, -6.96875, -6.5546875, -6.140625, -5.7265625, -5.3125, -4.8984375, -4.484375, -4.0703125, -3.65625, -3.2421875, -2.828125, -2.4140625, -2.0, -1.5859375, -1.171875, -0.7578125, -0.34375, 0.0703125, 0.484375, 0.8984375, 1.3125, 1.7265625, 2.140625, 2.5546875, 2.96875, 3.3828125, 3.796875, 4.2109375, 4.625, 5.0390625, 5.453125, 5.8671875, 6.28125, 6.6953125, 7.109375, 7.5234375, 7.9375, 8.3515625, 8.765625, 9.1796875, 9.59375, 10.0078125, 10.421875, 10.8359375, 11.25, 11.6640625, 12.078125, 12.4921875, 12.90625, 13.3203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 1.0, 9.0, 8.0, 5.0, 9.0, 15.0, 15.0, 28.0, 23.0, 34.0, 35.0, 35.0, 54.0, 51.0, 67.0, 52.0, 52.0, 65.0, 48.0, 51.0, 64.0, 30.0, 37.0, 32.0, 33.0, 29.0, 16.0, 20.0, 13.0, 14.0, 14.0, 10.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.96875, -4.82220458984375, -4.6756591796875, -4.52911376953125, -4.382568359375, -4.23602294921875, -4.0894775390625, -3.94293212890625, -3.79638671875, -3.64984130859375, -3.5032958984375, -3.35675048828125, -3.210205078125, -3.06365966796875, -2.9171142578125, -2.77056884765625, -2.6240234375, -2.47747802734375, -2.3309326171875, -2.18438720703125, -2.037841796875, -1.89129638671875, -1.7447509765625, -1.59820556640625, -1.45166015625, -1.30511474609375, -1.1585693359375, -1.01202392578125, -0.865478515625, -0.71893310546875, -0.5723876953125, -0.42584228515625, -0.279296875, -0.13275146484375, 0.0137939453125, 0.16033935546875, 0.306884765625, 0.45343017578125, 0.5999755859375, 0.74652099609375, 0.89306640625, 1.03961181640625, 1.1861572265625, 1.33270263671875, 1.479248046875, 1.62579345703125, 1.7723388671875, 1.91888427734375, 2.0654296875, 2.21197509765625, 2.3585205078125, 2.50506591796875, 2.651611328125, 2.79815673828125, 2.9447021484375, 3.09124755859375, 3.23779296875, 3.38433837890625, 3.5308837890625, 3.67742919921875, 3.823974609375, 3.97052001953125, 4.1170654296875, 4.26361083984375, 4.41015625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 4.0, 9.0, 7.0, 12.0, 10.0, 15.0, 12.0, 23.0, 24.0, 28.0, 35.0, 31.0, 55.0, 52.0, 48.0, 40.0, 44.0, 61.0, 56.0, 50.0, 57.0, 55.0, 30.0, 40.0, 33.0, 28.0, 16.0, 16.0, 21.0, 13.0, 14.0, 14.0, 7.0, 8.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.911890029907227, -25.99489402770996, -25.077896118164062, -24.160900115966797, -23.24390411376953, -22.326908111572266, -21.409912109375, -20.4929141998291, -19.575918197631836, -18.65892219543457, -17.741924285888672, -16.824928283691406, -15.90793228149414, -14.990936279296875, -14.073939323425293, -13.156942367553711, -12.239946365356445, -11.32295036315918, -10.405953407287598, -9.488956451416016, -8.57196044921875, -7.654963970184326, -6.737967491149902, -5.8209710121154785, -4.903974533081055, -3.986978054046631, -3.069981575012207, -2.152985095977783, -1.2359886169433594, -0.31899213790893555, 0.5980043411254883, 1.515000820159912, 2.431997299194336, 3.3489937782287598, 4.265990257263184, 5.182986736297607, 6.099983215332031, 7.016979694366455, 7.933976173400879, 8.850973129272461, 9.767969131469727, 10.684965133666992, 11.601962089538574, 12.518959045410156, 13.435955047607422, 14.352951049804688, 15.26994800567627, 16.18694496154785, 17.103940963745117, 18.020936965942383, 18.93793487548828, 19.854930877685547, 20.771926879882812, 21.688922882080078, 22.605918884277344, 23.522916793823242, 24.439912796020508, 25.356908798217773, 26.273906707763672, 27.190902709960938, 28.107898712158203, 29.02489471435547, 29.941890716552734, 30.858888626098633, 31.7758846282959]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 3.0, 3.0, 8.0, 3.0, 16.0, 13.0, 9.0, 12.0, 21.0, 24.0, 25.0, 37.0, 30.0, 32.0, 32.0, 36.0, 42.0, 46.0, 44.0, 47.0, 45.0, 37.0, 38.0, 38.0, 44.0, 35.0, 34.0, 33.0, 32.0, 28.0, 25.0, 21.0, 18.0, 19.0, 12.0, 11.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.62870216369629, -21.98770523071289, -21.34670639038086, -20.70570945739746, -20.064712524414062, -19.42371368408203, -18.782716751098633, -18.141719818115234, -17.500720977783203, -16.859724044799805, -16.218725204467773, -15.577728271484375, -14.936731338500977, -14.295733451843262, -13.654735565185547, -13.013738632202148, -12.37274169921875, -11.731743812561035, -11.090746879577637, -10.449748992919922, -9.808752059936523, -9.167754173278809, -8.526756286621094, -7.885758876800537, -7.2447614669799805, -6.603764057159424, -5.962766647338867, -5.321768760681152, -4.680771350860596, -4.039773941040039, -3.3987762928009033, -2.7577786445617676, -2.116781234741211, -1.4757837057113647, -0.8347861766815186, -0.19378864765167236, 0.44720888137817383, 1.0882062911987305, 1.7292039394378662, 2.370201587677002, 3.0111989974975586, 3.6521964073181152, 4.293193817138672, 4.934191703796387, 5.575189113616943, 6.2161865234375, 6.857184410095215, 7.4981818199157715, 8.139179229736328, 8.780177116394043, 9.421174049377441, 10.062171936035156, 10.703168869018555, 11.34416675567627, 11.985164642333984, 12.626161575317383, 13.267159461975098, 13.908157348632812, 14.549154281616211, 15.190152168273926, 15.83115005493164, 16.47214698791504, 17.113143920898438, 17.75414276123047, 18.395139694213867]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 9.0, 17.0, 23.0, 25.0, 37.0, 60.0, 72.0, 116.0, 149.0, 295.0, 411.0, 655.0, 1029.0, 1525.0, 2357.0, 3675.0, 5678.0, 8490.0, 13218.0, 20352.0, 30561.0, 44547.0, 63298.0, 85558.0, 105655.0, 120881.0, 121861.0, 111085.0, 90417.0, 68678.0, 49218.0, 33461.0, 22466.0, 14869.0, 9735.0, 6374.0, 4036.0, 2761.0, 1669.0, 1139.0, 721.0, 473.0, 321.0, 204.0, 134.0, 81.0, 59.0, 33.0, 25.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0], "bins": [-16.296875, -15.804931640625, -15.31298828125, -14.821044921875, -14.3291015625, -13.837158203125, -13.34521484375, -12.853271484375, -12.361328125, -11.869384765625, -11.37744140625, -10.885498046875, -10.3935546875, -9.901611328125, -9.40966796875, -8.917724609375, -8.42578125, -7.933837890625, -7.44189453125, -6.949951171875, -6.4580078125, -5.966064453125, -5.47412109375, -4.982177734375, -4.490234375, -3.998291015625, -3.50634765625, -3.014404296875, -2.5224609375, -2.030517578125, -1.53857421875, -1.046630859375, -0.5546875, -0.062744140625, 0.42919921875, 0.921142578125, 1.4130859375, 1.905029296875, 2.39697265625, 2.888916015625, 3.380859375, 3.872802734375, 4.36474609375, 4.856689453125, 5.3486328125, 5.840576171875, 6.33251953125, 6.824462890625, 7.31640625, 7.808349609375, 8.30029296875, 8.792236328125, 9.2841796875, 9.776123046875, 10.26806640625, 10.760009765625, 11.251953125, 11.743896484375, 12.23583984375, 12.727783203125, 13.2197265625, 13.711669921875, 14.20361328125, 14.695556640625, 15.1875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 10.0, 6.0, 10.0, 7.0, 14.0, 11.0, 20.0, 23.0, 31.0, 36.0, 28.0, 37.0, 40.0, 42.0, 47.0, 58.0, 47.0, 50.0, 60.0, 49.0, 42.0, 35.0, 38.0, 29.0, 36.0, 30.0, 26.0, 23.0, 11.0, 19.0, 15.0, 13.0, 9.0, 7.0, 9.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.34375, -20.591064453125, -19.83837890625, -19.085693359375, -18.3330078125, -17.580322265625, -16.82763671875, -16.074951171875, -15.322265625, -14.569580078125, -13.81689453125, -13.064208984375, -12.3115234375, -11.558837890625, -10.80615234375, -10.053466796875, -9.30078125, -8.548095703125, -7.79541015625, -7.042724609375, -6.2900390625, -5.537353515625, -4.78466796875, -4.031982421875, -3.279296875, -2.526611328125, -1.77392578125, -1.021240234375, -0.2685546875, 0.484130859375, 1.23681640625, 1.989501953125, 2.7421875, 3.494873046875, 4.24755859375, 5.000244140625, 5.7529296875, 6.505615234375, 7.25830078125, 8.010986328125, 8.763671875, 9.516357421875, 10.26904296875, 11.021728515625, 11.7744140625, 12.527099609375, 13.27978515625, 14.032470703125, 14.78515625, 15.537841796875, 16.29052734375, 17.043212890625, 17.7958984375, 18.548583984375, 19.30126953125, 20.053955078125, 20.806640625, 21.559326171875, 22.31201171875, 23.064697265625, 23.8173828125, 24.570068359375, 25.32275390625, 26.075439453125, 26.828125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 9.0, 13.0, 8.0, 26.0, 34.0, 49.0, 91.0, 146.0, 232.0, 331.0, 561.0, 995.0, 1712.0, 2935.0, 4738.0, 7697.0, 12620.0, 20362.0, 32117.0, 49470.0, 72639.0, 98912.0, 121853.0, 134723.0, 129206.0, 109725.0, 83667.0, 59351.0, 39579.0, 25039.0, 15588.0, 9508.0, 5809.0, 3483.0, 2087.0, 1280.0, 770.0, 474.0, 268.0, 179.0, 115.0, 49.0, 31.0, 31.0, 23.0, 13.0, 5.0, 5.0, 5.0, 6.0, 0.0, 1.0], "bins": [-22.125, -21.505615234375, -20.88623046875, -20.266845703125, -19.6474609375, -19.028076171875, -18.40869140625, -17.789306640625, -17.169921875, -16.550537109375, -15.93115234375, -15.311767578125, -14.6923828125, -14.072998046875, -13.45361328125, -12.834228515625, -12.21484375, -11.595458984375, -10.97607421875, -10.356689453125, -9.7373046875, -9.117919921875, -8.49853515625, -7.879150390625, -7.259765625, -6.640380859375, -6.02099609375, -5.401611328125, -4.7822265625, -4.162841796875, -3.54345703125, -2.924072265625, -2.3046875, -1.685302734375, -1.06591796875, -0.446533203125, 0.1728515625, 0.792236328125, 1.41162109375, 2.031005859375, 2.650390625, 3.269775390625, 3.88916015625, 4.508544921875, 5.1279296875, 5.747314453125, 6.36669921875, 6.986083984375, 7.60546875, 8.224853515625, 8.84423828125, 9.463623046875, 10.0830078125, 10.702392578125, 11.32177734375, 11.941162109375, 12.560546875, 13.179931640625, 13.79931640625, 14.418701171875, 15.0380859375, 15.657470703125, 16.27685546875, 16.896240234375, 17.515625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 16.0, 8.0, 11.0, 19.0, 18.0, 20.0, 20.0, 27.0, 30.0, 34.0, 33.0, 38.0, 35.0, 38.0, 43.0, 41.0, 41.0, 38.0, 35.0, 32.0, 46.0, 37.0, 25.0, 40.0, 38.0, 44.0, 21.0, 21.0, 17.0, 18.0, 17.0, 18.0, 13.0, 13.0, 9.0, 13.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-14.7421875, -14.2867431640625, -13.831298828125, -13.3758544921875, -12.92041015625, -12.4649658203125, -12.009521484375, -11.5540771484375, -11.0986328125, -10.6431884765625, -10.187744140625, -9.7322998046875, -9.27685546875, -8.8214111328125, -8.365966796875, -7.9105224609375, -7.455078125, -6.9996337890625, -6.544189453125, -6.0887451171875, -5.63330078125, -5.1778564453125, -4.722412109375, -4.2669677734375, -3.8115234375, -3.3560791015625, -2.900634765625, -2.4451904296875, -1.98974609375, -1.5343017578125, -1.078857421875, -0.6234130859375, -0.16796875, 0.2874755859375, 0.742919921875, 1.1983642578125, 1.65380859375, 2.1092529296875, 2.564697265625, 3.0201416015625, 3.4755859375, 3.9310302734375, 4.386474609375, 4.8419189453125, 5.29736328125, 5.7528076171875, 6.208251953125, 6.6636962890625, 7.119140625, 7.5745849609375, 8.030029296875, 8.4854736328125, 8.94091796875, 9.3963623046875, 9.851806640625, 10.3072509765625, 10.7626953125, 11.2181396484375, 11.673583984375, 12.1290283203125, 12.58447265625, 13.0399169921875, 13.495361328125, 13.9508056640625, 14.40625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 12.0, 11.0, 17.0, 24.0, 32.0, 51.0, 87.0, 121.0, 189.0, 323.0, 585.0, 932.0, 1593.0, 2826.0, 5643.0, 12174.0, 28910.0, 74286.0, 180980.0, 301271.0, 246349.0, 112992.0, 44623.0, 17607.0, 7921.0, 3991.0, 2026.0, 1061.0, 717.0, 446.0, 258.0, 157.0, 111.0, 65.0, 44.0, 40.0, 19.0, 26.0, 9.0, 9.0, 1.0, 5.0, 1.0, 4.0, 1.0, 2.0], "bins": [-28.40625, -27.6533203125, -26.900390625, -26.1474609375, -25.39453125, -24.6416015625, -23.888671875, -23.1357421875, -22.3828125, -21.6298828125, -20.876953125, -20.1240234375, -19.37109375, -18.6181640625, -17.865234375, -17.1123046875, -16.359375, -15.6064453125, -14.853515625, -14.1005859375, -13.34765625, -12.5947265625, -11.841796875, -11.0888671875, -10.3359375, -9.5830078125, -8.830078125, -8.0771484375, -7.32421875, -6.5712890625, -5.818359375, -5.0654296875, -4.3125, -3.5595703125, -2.806640625, -2.0537109375, -1.30078125, -0.5478515625, 0.205078125, 0.9580078125, 1.7109375, 2.4638671875, 3.216796875, 3.9697265625, 4.72265625, 5.4755859375, 6.228515625, 6.9814453125, 7.734375, 8.4873046875, 9.240234375, 9.9931640625, 10.74609375, 11.4990234375, 12.251953125, 13.0048828125, 13.7578125, 14.5107421875, 15.263671875, 16.0166015625, 16.76953125, 17.5224609375, 18.275390625, 19.0283203125, 19.78125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 6.0, 1.0, 12.0, 10.0, 18.0, 21.0, 29.0, 37.0, 54.0, 77.0, 84.0, 79.0, 98.0, 74.0, 76.0, 64.0, 62.0, 44.0, 28.0, 34.0, 27.0, 13.0, 13.0, 10.0, 4.0, 3.0, 9.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015993118286132812, -0.0015435665845870972, -0.001487821340560913, -0.001432076096534729, -0.001376330852508545, -0.0013205856084823608, -0.0012648403644561768, -0.0012090951204299927, -0.0011533498764038086, -0.0010976046323776245, -0.0010418593883514404, -0.0009861141443252563, -0.0009303689002990723, -0.0008746236562728882, -0.0008188784122467041, -0.00076313316822052, -0.0007073879241943359, -0.0006516426801681519, -0.0005958974361419678, -0.0005401521921157837, -0.0004844069480895996, -0.00042866170406341553, -0.00037291646003723145, -0.00031717121601104736, -0.0002614259719848633, -0.0002056807279586792, -0.00014993548393249512, -9.419023990631104e-05, -3.844499588012695e-05, 1.730024814605713e-05, 7.304549217224121e-05, 0.0001287907361984253, 0.00018453598022460938, 0.00024028122425079346, 0.00029602646827697754, 0.0003517717123031616, 0.0004075169563293457, 0.0004632622003555298, 0.0005190074443817139, 0.000574752688407898, 0.000630497932434082, 0.0006862431764602661, 0.0007419884204864502, 0.0007977336645126343, 0.0008534789085388184, 0.0009092241525650024, 0.0009649693965911865, 0.0010207146406173706, 0.0010764598846435547, 0.0011322051286697388, 0.0011879503726959229, 0.001243695616722107, 0.001299440860748291, 0.001355186104774475, 0.0014109313488006592, 0.0014666765928268433, 0.0015224218368530273, 0.0015781670808792114, 0.0016339123249053955, 0.0016896575689315796, 0.0017454028129577637, 0.0018011480569839478, 0.0018568933010101318, 0.001912638545036316, 0.0019683837890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 14.0, 16.0, 18.0, 31.0, 46.0, 73.0, 91.0, 133.0, 182.0, 210.0, 306.0, 487.0, 637.0, 1005.0, 1532.0, 2451.0, 3919.0, 6651.0, 11370.0, 20602.0, 38271.0, 70800.0, 122983.0, 179367.0, 198224.0, 160730.0, 100995.0, 56560.0, 30463.0, 16360.0, 9231.0, 5365.0, 3235.0, 2036.0, 1282.0, 869.0, 621.0, 395.0, 304.0, 196.0, 143.0, 101.0, 83.0, 47.0, 33.0, 27.0, 17.0, 11.0, 5.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-16.0, -15.489013671875, -14.97802734375, -14.467041015625, -13.9560546875, -13.445068359375, -12.93408203125, -12.423095703125, -11.912109375, -11.401123046875, -10.89013671875, -10.379150390625, -9.8681640625, -9.357177734375, -8.84619140625, -8.335205078125, -7.82421875, -7.313232421875, -6.80224609375, -6.291259765625, -5.7802734375, -5.269287109375, -4.75830078125, -4.247314453125, -3.736328125, -3.225341796875, -2.71435546875, -2.203369140625, -1.6923828125, -1.181396484375, -0.67041015625, -0.159423828125, 0.3515625, 0.862548828125, 1.37353515625, 1.884521484375, 2.3955078125, 2.906494140625, 3.41748046875, 3.928466796875, 4.439453125, 4.950439453125, 5.46142578125, 5.972412109375, 6.4833984375, 6.994384765625, 7.50537109375, 8.016357421875, 8.52734375, 9.038330078125, 9.54931640625, 10.060302734375, 10.5712890625, 11.082275390625, 11.59326171875, 12.104248046875, 12.615234375, 13.126220703125, 13.63720703125, 14.148193359375, 14.6591796875, 15.170166015625, 15.68115234375, 16.192138671875, 16.703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 11.0, 8.0, 11.0, 9.0, 18.0, 18.0, 19.0, 24.0, 29.0, 25.0, 37.0, 40.0, 51.0, 49.0, 47.0, 58.0, 68.0, 46.0, 68.0, 55.0, 57.0, 28.0, 48.0, 21.0, 17.0, 28.0, 16.0, 12.0, 15.0, 4.0, 10.0, 5.0, 10.0, 3.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.71484375, -5.55792236328125, -5.4010009765625, -5.24407958984375, -5.087158203125, -4.93023681640625, -4.7733154296875, -4.61639404296875, -4.45947265625, -4.30255126953125, -4.1456298828125, -3.98870849609375, -3.831787109375, -3.67486572265625, -3.5179443359375, -3.36102294921875, -3.2041015625, -3.04718017578125, -2.8902587890625, -2.73333740234375, -2.576416015625, -2.41949462890625, -2.2625732421875, -2.10565185546875, -1.94873046875, -1.79180908203125, -1.6348876953125, -1.47796630859375, -1.321044921875, -1.16412353515625, -1.0072021484375, -0.85028076171875, -0.693359375, -0.53643798828125, -0.3795166015625, -0.22259521484375, -0.065673828125, 0.09124755859375, 0.2481689453125, 0.40509033203125, 0.56201171875, 0.71893310546875, 0.8758544921875, 1.03277587890625, 1.189697265625, 1.34661865234375, 1.5035400390625, 1.66046142578125, 1.8173828125, 1.97430419921875, 2.1312255859375, 2.28814697265625, 2.445068359375, 2.60198974609375, 2.7589111328125, 2.91583251953125, 3.07275390625, 3.22967529296875, 3.3865966796875, 3.54351806640625, 3.700439453125, 3.85736083984375, 4.0142822265625, 4.17120361328125, 4.328125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 9.0, 4.0, 11.0, 8.0, 9.0, 8.0, 12.0, 18.0, 25.0, 26.0, 31.0, 37.0, 36.0, 36.0, 48.0, 49.0, 61.0, 59.0, 65.0, 61.0, 56.0, 52.0, 59.0, 41.0, 25.0, 18.0, 22.0, 20.0, 25.0, 17.0, 13.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.86786460876465, -30.837194442749023, -29.8065242767334, -28.775854110717773, -27.745182037353516, -26.71451187133789, -25.683841705322266, -24.65317153930664, -23.622501373291016, -22.59183120727539, -21.561161041259766, -20.53049087524414, -19.499820709228516, -18.46915054321289, -17.438478469848633, -16.407808303833008, -15.377138137817383, -14.346467971801758, -13.315797805786133, -12.285126686096191, -11.254456520080566, -10.223786354064941, -9.193115234375, -8.162445068359375, -7.13177490234375, -6.101104736328125, -5.070434093475342, -4.039763450622559, -3.0090932846069336, -1.9784231185913086, -0.9477524757385254, 0.08291816711425781, 1.11358642578125, 2.144256830215454, 3.174927234649658, 4.205597877502441, 5.236268043518066, 6.266938209533691, 7.297608852386475, 8.328279495239258, 9.358949661254883, 10.389619827270508, 11.420289993286133, 12.450961112976074, 13.4816312789917, 14.512301445007324, 15.542972564697266, 16.57364273071289, 17.604312896728516, 18.63498306274414, 19.665653228759766, 20.69632339477539, 21.726993560791016, 22.75766372680664, 23.7883358001709, 24.819005966186523, 25.84967613220215, 26.880346298217773, 27.9110164642334, 28.941686630249023, 29.97235870361328, 31.003028869628906, 32.03369903564453, 33.064369201660156, 34.09503936767578]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 6.0, 8.0, 8.0, 12.0, 7.0, 9.0, 13.0, 19.0, 19.0, 18.0, 20.0, 24.0, 24.0, 22.0, 29.0, 28.0, 41.0, 33.0, 36.0, 43.0, 35.0, 41.0, 33.0, 43.0, 35.0, 34.0, 26.0, 45.0, 31.0, 30.0, 21.0, 28.0, 18.0, 14.0, 23.0, 18.0, 18.0, 15.0, 10.0, 11.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.195226669311523, -17.602327346801758, -17.009428024291992, -16.416528701782227, -15.823630332946777, -15.230731010437012, -14.637832641601562, -14.044933319091797, -13.452033996582031, -12.859134674072266, -12.2662353515625, -11.67333698272705, -11.080437660217285, -10.48753833770752, -9.89463996887207, -9.301740646362305, -8.708841323852539, -8.115942001342773, -7.523043155670166, -6.930144309997559, -6.337244987487793, -5.744345664978027, -5.15144681930542, -4.5585479736328125, -3.965648651123047, -3.3727495670318604, -2.779850482940674, -2.1869513988494873, -1.5940523147583008, -1.0011532306671143, -0.40825414657592773, 0.1846446990966797, 0.7775421142578125, 1.370441198348999, 1.9633402824401855, 2.556239366531372, 3.1491384506225586, 3.742037534713745, 4.334936618804932, 4.927835464477539, 5.520734786987305, 6.11363410949707, 6.706532955169678, 7.299431800842285, 7.892331123352051, 8.485230445861816, 9.078128814697266, 9.671028137207031, 10.263927459716797, 10.856826782226562, 11.449726104736328, 12.042624473571777, 12.635523796081543, 13.228423118591309, 13.821321487426758, 14.414220809936523, 15.007120132446289, 15.600019454956055, 16.19291877746582, 16.785818099975586, 17.37871551513672, 17.971614837646484, 18.56451416015625, 19.157413482666016, 19.75031280517578]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 15.0, 14.0, 24.0, 36.0, 72.0, 120.0, 212.0, 327.0, 619.0, 1020.0, 1913.0, 3403.0, 6571.0, 12677.0, 25033.0, 51337.0, 106052.0, 221711.0, 443756.0, 768107.0, 952362.0, 752088.0, 429892.0, 213219.0, 102074.0, 49184.0, 24282.0, 12371.0, 6616.0, 3675.0, 2118.0, 1237.0, 760.0, 446.0, 336.0, 208.0, 116.0, 86.0, 63.0, 35.0, 30.0, 17.0, 16.0, 14.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.15625, -32.03125, -30.90625, -29.78125, -28.65625, -27.53125, -26.40625, -25.28125, -24.15625, -23.03125, -21.90625, -20.78125, -19.65625, -18.53125, -17.40625, -16.28125, -15.15625, -14.03125, -12.90625, -11.78125, -10.65625, -9.53125, -8.40625, -7.28125, -6.15625, -5.03125, -3.90625, -2.78125, -1.65625, -0.53125, 0.59375, 1.71875, 2.84375, 3.96875, 5.09375, 6.21875, 7.34375, 8.46875, 9.59375, 10.71875, 11.84375, 12.96875, 14.09375, 15.21875, 16.34375, 17.46875, 18.59375, 19.71875, 20.84375, 21.96875, 23.09375, 24.21875, 25.34375, 26.46875, 27.59375, 28.71875, 29.84375, 30.96875, 32.09375, 33.21875, 34.34375, 35.46875, 36.59375, 37.71875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 5.0, 9.0, 9.0, 4.0, 10.0, 11.0, 14.0, 26.0, 22.0, 18.0, 34.0, 26.0, 42.0, 27.0, 35.0, 43.0, 38.0, 41.0, 45.0, 43.0, 44.0, 42.0, 44.0, 32.0, 47.0, 33.0, 36.0, 25.0, 30.0, 28.0, 19.0, 17.0, 16.0, 18.0, 7.0, 20.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.203125, -16.57861328125, -15.9541015625, -15.32958984375, -14.705078125, -14.08056640625, -13.4560546875, -12.83154296875, -12.20703125, -11.58251953125, -10.9580078125, -10.33349609375, -9.708984375, -9.08447265625, -8.4599609375, -7.83544921875, -7.2109375, -6.58642578125, -5.9619140625, -5.33740234375, -4.712890625, -4.08837890625, -3.4638671875, -2.83935546875, -2.21484375, -1.59033203125, -0.9658203125, -0.34130859375, 0.283203125, 0.90771484375, 1.5322265625, 2.15673828125, 2.78125, 3.40576171875, 4.0302734375, 4.65478515625, 5.279296875, 5.90380859375, 6.5283203125, 7.15283203125, 7.77734375, 8.40185546875, 9.0263671875, 9.65087890625, 10.275390625, 10.89990234375, 11.5244140625, 12.14892578125, 12.7734375, 13.39794921875, 14.0224609375, 14.64697265625, 15.271484375, 15.89599609375, 16.5205078125, 17.14501953125, 17.76953125, 18.39404296875, 19.0185546875, 19.64306640625, 20.267578125, 20.89208984375, 21.5166015625, 22.14111328125, 22.765625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 8.0, 13.0, 22.0, 37.0, 56.0, 87.0, 139.0, 248.0, 415.0, 716.0, 1306.0, 2202.0, 3941.0, 7495.0, 14466.0, 27980.0, 55203.0, 109322.0, 215476.0, 406620.0, 673930.0, 864530.0, 761815.0, 494214.0, 270312.0, 139035.0, 70454.0, 35428.0, 18101.0, 9477.0, 4997.0, 2705.0, 1512.0, 808.0, 501.0, 257.0, 164.0, 125.0, 44.0, 51.0, 24.0, 19.0, 10.0, 8.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-40.65625, -39.2861328125, -37.916015625, -36.5458984375, -35.17578125, -33.8056640625, -32.435546875, -31.0654296875, -29.6953125, -28.3251953125, -26.955078125, -25.5849609375, -24.21484375, -22.8447265625, -21.474609375, -20.1044921875, -18.734375, -17.3642578125, -15.994140625, -14.6240234375, -13.25390625, -11.8837890625, -10.513671875, -9.1435546875, -7.7734375, -6.4033203125, -5.033203125, -3.6630859375, -2.29296875, -0.9228515625, 0.447265625, 1.8173828125, 3.1875, 4.5576171875, 5.927734375, 7.2978515625, 8.66796875, 10.0380859375, 11.408203125, 12.7783203125, 14.1484375, 15.5185546875, 16.888671875, 18.2587890625, 19.62890625, 20.9990234375, 22.369140625, 23.7392578125, 25.109375, 26.4794921875, 27.849609375, 29.2197265625, 30.58984375, 31.9599609375, 33.330078125, 34.7001953125, 36.0703125, 37.4404296875, 38.810546875, 40.1806640625, 41.55078125, 42.9208984375, 44.291015625, 45.6611328125, 47.03125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 5.0, 15.0, 20.0, 19.0, 31.0, 49.0, 70.0, 85.0, 98.0, 110.0, 142.0, 193.0, 209.0, 243.0, 278.0, 295.0, 309.0, 240.0, 253.0, 263.0, 211.0, 203.0, 177.0, 129.0, 99.0, 92.0, 55.0, 52.0, 35.0, 19.0, 14.0, 9.0, 11.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.7841796875, -12.333984375, -11.8837890625, -11.43359375, -10.9833984375, -10.533203125, -10.0830078125, -9.6328125, -9.1826171875, -8.732421875, -8.2822265625, -7.83203125, -7.3818359375, -6.931640625, -6.4814453125, -6.03125, -5.5810546875, -5.130859375, -4.6806640625, -4.23046875, -3.7802734375, -3.330078125, -2.8798828125, -2.4296875, -1.9794921875, -1.529296875, -1.0791015625, -0.62890625, -0.1787109375, 0.271484375, 0.7216796875, 1.171875, 1.6220703125, 2.072265625, 2.5224609375, 2.97265625, 3.4228515625, 3.873046875, 4.3232421875, 4.7734375, 5.2236328125, 5.673828125, 6.1240234375, 6.57421875, 7.0244140625, 7.474609375, 7.9248046875, 8.375, 8.8251953125, 9.275390625, 9.7255859375, 10.17578125, 10.6259765625, 11.076171875, 11.5263671875, 11.9765625, 12.4267578125, 12.876953125, 13.3271484375, 13.77734375, 14.2275390625, 14.677734375, 15.1279296875, 15.578125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 6.0, 11.0, 9.0, 7.0, 8.0, 12.0, 14.0, 22.0, 23.0, 39.0, 33.0, 39.0, 48.0, 52.0, 54.0, 59.0, 51.0, 61.0, 57.0, 50.0, 45.0, 50.0, 37.0, 41.0, 28.0, 24.0, 27.0, 16.0, 15.0, 15.0, 8.0, 8.0, 10.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.26799011230469, -38.92879867553711, -37.58960723876953, -36.25041580200195, -34.911224365234375, -33.5720329284668, -32.23284149169922, -30.893648147583008, -29.55445671081543, -28.21526527404785, -26.876073837280273, -25.536880493164062, -24.197689056396484, -22.858497619628906, -21.519306182861328, -20.18011474609375, -18.840923309326172, -17.501731872558594, -16.162540435791016, -14.823348045349121, -13.484156608581543, -12.144965171813965, -10.80577278137207, -9.466581344604492, -8.127389907836914, -6.788198471069336, -5.4490065574646, -4.109814643859863, -2.770623207092285, -1.431431770324707, -0.0922393798828125, 1.2469520568847656, 2.5861473083496094, 3.9253389835357666, 5.264530658721924, 6.60372257232666, 7.942914009094238, 9.282105445861816, 10.621297836303711, 11.960489273071289, 13.299680709838867, 14.638872146606445, 15.978063583374023, 17.317256927490234, 18.656448364257812, 19.99563980102539, 21.33483123779297, 22.674022674560547, 24.013214111328125, 25.352405548095703, 26.69159698486328, 28.03078842163086, 29.369979858398438, 30.709171295166016, 32.048362731933594, 33.38755798339844, 34.72674560546875, 36.06593704223633, 37.405128479003906, 38.744319915771484, 40.08351135253906, 41.42270278930664, 42.76189422607422, 44.10108947753906, 45.44028091430664]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 8.0, 11.0, 12.0, 11.0, 10.0, 11.0, 13.0, 19.0, 22.0, 20.0, 32.0, 29.0, 25.0, 34.0, 30.0, 43.0, 37.0, 44.0, 30.0, 42.0, 49.0, 37.0, 47.0, 42.0, 32.0, 33.0, 38.0, 35.0, 21.0, 30.0, 15.0, 25.0, 17.0, 16.0, 15.0, 9.0, 10.0, 8.0, 3.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.071855545043945, -23.28384017944336, -22.495824813842773, -21.707809448242188, -20.919795989990234, -20.13178062438965, -19.343765258789062, -18.555749893188477, -17.76773452758789, -16.979719161987305, -16.19170379638672, -15.40368938446045, -14.61567497253418, -13.827659606933594, -13.039644241333008, -12.251628875732422, -11.463615417480469, -10.675600051879883, -9.887585639953613, -9.099570274353027, -8.311555862426758, -7.523540496826172, -6.735525131225586, -5.947510242462158, -5.1594953536987305, -4.371480464935303, -3.583465337753296, -2.795450210571289, -2.0074353218078613, -1.2194204330444336, -0.43140506744384766, 0.3566098213195801, 1.1446247100830078, 1.932639718055725, 2.7206547260284424, 3.508669853210449, 4.296684741973877, 5.084699630737305, 5.872714996337891, 6.660729885101318, 7.448744773864746, 8.236760139465332, 9.024774551391602, 9.812789916992188, 10.600805282592773, 11.388819694519043, 12.176835060119629, 12.964849472045898, 13.752864837646484, 14.54088020324707, 15.32889461517334, 16.11690902709961, 16.904924392700195, 17.69293975830078, 18.480955123901367, 19.268970489501953, 20.056983947753906, 20.844999313354492, 21.633014678955078, 22.42102813720703, 23.209043502807617, 23.997058868408203, 24.78507423400879, 25.573089599609375, 26.36110496520996]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 25.0, 35.0, 52.0, 79.0, 125.0, 227.0, 359.0, 534.0, 880.0, 1439.0, 2376.0, 4033.0, 6682.0, 11290.0, 18888.0, 31628.0, 51661.0, 79990.0, 114212.0, 144557.0, 154445.0, 137468.0, 104078.0, 70747.0, 44858.0, 27375.0, 15999.0, 9703.0, 5937.0, 3390.0, 2083.0, 1340.0, 749.0, 491.0, 293.0, 182.0, 118.0, 64.0, 56.0, 33.0, 19.0, 15.0, 13.0, 11.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.09228515625, -18.4189453125, -17.74560546875, -17.072265625, -16.39892578125, -15.7255859375, -15.05224609375, -14.37890625, -13.70556640625, -13.0322265625, -12.35888671875, -11.685546875, -11.01220703125, -10.3388671875, -9.66552734375, -8.9921875, -8.31884765625, -7.6455078125, -6.97216796875, -6.298828125, -5.62548828125, -4.9521484375, -4.27880859375, -3.60546875, -2.93212890625, -2.2587890625, -1.58544921875, -0.912109375, -0.23876953125, 0.4345703125, 1.10791015625, 1.78125, 2.45458984375, 3.1279296875, 3.80126953125, 4.474609375, 5.14794921875, 5.8212890625, 6.49462890625, 7.16796875, 7.84130859375, 8.5146484375, 9.18798828125, 9.861328125, 10.53466796875, 11.2080078125, 11.88134765625, 12.5546875, 13.22802734375, 13.9013671875, 14.57470703125, 15.248046875, 15.92138671875, 16.5947265625, 17.26806640625, 17.94140625, 18.61474609375, 19.2880859375, 19.96142578125, 20.634765625, 21.30810546875, 21.9814453125, 22.65478515625, 23.328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 3.0, 6.0, 13.0, 11.0, 14.0, 15.0, 22.0, 22.0, 15.0, 32.0, 41.0, 29.0, 34.0, 35.0, 39.0, 40.0, 34.0, 44.0, 42.0, 40.0, 45.0, 34.0, 41.0, 41.0, 28.0, 35.0, 23.0, 37.0, 18.0, 22.0, 19.0, 18.0, 19.0, 17.0, 11.0, 7.0, 6.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-28.265625, -27.398193359375, -26.53076171875, -25.663330078125, -24.7958984375, -23.928466796875, -23.06103515625, -22.193603515625, -21.326171875, -20.458740234375, -19.59130859375, -18.723876953125, -17.8564453125, -16.989013671875, -16.12158203125, -15.254150390625, -14.38671875, -13.519287109375, -12.65185546875, -11.784423828125, -10.9169921875, -10.049560546875, -9.18212890625, -8.314697265625, -7.447265625, -6.579833984375, -5.71240234375, -4.844970703125, -3.9775390625, -3.110107421875, -2.24267578125, -1.375244140625, -0.5078125, 0.359619140625, 1.22705078125, 2.094482421875, 2.9619140625, 3.829345703125, 4.69677734375, 5.564208984375, 6.431640625, 7.299072265625, 8.16650390625, 9.033935546875, 9.9013671875, 10.768798828125, 11.63623046875, 12.503662109375, 13.37109375, 14.238525390625, 15.10595703125, 15.973388671875, 16.8408203125, 17.708251953125, 18.57568359375, 19.443115234375, 20.310546875, 21.177978515625, 22.04541015625, 22.912841796875, 23.7802734375, 24.647705078125, 25.51513671875, 26.382568359375, 27.25]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 15.0, 35.0, 33.0, 54.0, 81.0, 123.0, 181.0, 274.0, 428.0, 658.0, 1081.0, 1672.0, 2774.0, 4861.0, 8562.0, 15882.0, 30241.0, 58614.0, 110490.0, 186474.0, 229798.0, 177056.0, 102331.0, 54406.0, 27931.0, 14834.0, 8158.0, 4529.0, 2571.0, 1550.0, 979.0, 642.0, 401.0, 257.0, 164.0, 115.0, 76.0, 66.0, 54.0, 33.0, 15.0, 12.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.794921875, -30.71484375, -29.634765625, -28.5546875, -27.474609375, -26.39453125, -25.314453125, -24.234375, -23.154296875, -22.07421875, -20.994140625, -19.9140625, -18.833984375, -17.75390625, -16.673828125, -15.59375, -14.513671875, -13.43359375, -12.353515625, -11.2734375, -10.193359375, -9.11328125, -8.033203125, -6.953125, -5.873046875, -4.79296875, -3.712890625, -2.6328125, -1.552734375, -0.47265625, 0.607421875, 1.6875, 2.767578125, 3.84765625, 4.927734375, 6.0078125, 7.087890625, 8.16796875, 9.248046875, 10.328125, 11.408203125, 12.48828125, 13.568359375, 14.6484375, 15.728515625, 16.80859375, 17.888671875, 18.96875, 20.048828125, 21.12890625, 22.208984375, 23.2890625, 24.369140625, 25.44921875, 26.529296875, 27.609375, 28.689453125, 29.76953125, 30.849609375, 31.9296875, 33.009765625, 34.08984375, 35.169921875, 36.25]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 10.0, 9.0, 11.0, 15.0, 13.0, 14.0, 16.0, 24.0, 23.0, 16.0, 27.0, 28.0, 39.0, 31.0, 41.0, 29.0, 48.0, 48.0, 49.0, 47.0, 41.0, 51.0, 31.0, 42.0, 39.0, 37.0, 28.0, 26.0, 15.0, 19.0, 32.0, 11.0, 13.0, 13.0, 14.0, 7.0, 7.0, 9.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.929931640625, -16.39111328125, -15.852294921875, -15.3134765625, -14.774658203125, -14.23583984375, -13.697021484375, -13.158203125, -12.619384765625, -12.08056640625, -11.541748046875, -11.0029296875, -10.464111328125, -9.92529296875, -9.386474609375, -8.84765625, -8.308837890625, -7.77001953125, -7.231201171875, -6.6923828125, -6.153564453125, -5.61474609375, -5.075927734375, -4.537109375, -3.998291015625, -3.45947265625, -2.920654296875, -2.3818359375, -1.843017578125, -1.30419921875, -0.765380859375, -0.2265625, 0.312255859375, 0.85107421875, 1.389892578125, 1.9287109375, 2.467529296875, 3.00634765625, 3.545166015625, 4.083984375, 4.622802734375, 5.16162109375, 5.700439453125, 6.2392578125, 6.778076171875, 7.31689453125, 7.855712890625, 8.39453125, 8.933349609375, 9.47216796875, 10.010986328125, 10.5498046875, 11.088623046875, 11.62744140625, 12.166259765625, 12.705078125, 13.243896484375, 13.78271484375, 14.321533203125, 14.8603515625, 15.399169921875, 15.93798828125, 16.476806640625, 17.015625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 9.0, 8.0, 11.0, 10.0, 13.0, 28.0, 46.0, 67.0, 91.0, 146.0, 195.0, 375.0, 573.0, 935.0, 1529.0, 2706.0, 4745.0, 8600.0, 16291.0, 32633.0, 65234.0, 127644.0, 218743.0, 242848.0, 157330.0, 81963.0, 40701.0, 20393.0, 10815.0, 5775.0, 3324.0, 1873.0, 1093.0, 642.0, 413.0, 273.0, 169.0, 110.0, 64.0, 54.0, 32.0, 18.0, 15.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.566650390625, -19.83642578125, -19.106201171875, -18.3759765625, -17.645751953125, -16.91552734375, -16.185302734375, -15.455078125, -14.724853515625, -13.99462890625, -13.264404296875, -12.5341796875, -11.803955078125, -11.07373046875, -10.343505859375, -9.61328125, -8.883056640625, -8.15283203125, -7.422607421875, -6.6923828125, -5.962158203125, -5.23193359375, -4.501708984375, -3.771484375, -3.041259765625, -2.31103515625, -1.580810546875, -0.8505859375, -0.120361328125, 0.60986328125, 1.340087890625, 2.0703125, 2.800537109375, 3.53076171875, 4.260986328125, 4.9912109375, 5.721435546875, 6.45166015625, 7.181884765625, 7.912109375, 8.642333984375, 9.37255859375, 10.102783203125, 10.8330078125, 11.563232421875, 12.29345703125, 13.023681640625, 13.75390625, 14.484130859375, 15.21435546875, 15.944580078125, 16.6748046875, 17.405029296875, 18.13525390625, 18.865478515625, 19.595703125, 20.325927734375, 21.05615234375, 21.786376953125, 22.5166015625, 23.246826171875, 23.97705078125, 24.707275390625, 25.4375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 12.0, 11.0, 18.0, 12.0, 22.0, 18.0, 29.0, 27.0, 43.0, 45.0, 47.0, 52.0, 66.0, 69.0, 65.0, 59.0, 60.0, 56.0, 48.0, 47.0, 28.0, 33.0, 24.0, 27.0, 15.0, 7.0, 9.0, 8.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000919342041015625, -0.0008916258811950684, -0.0008639097213745117, -0.0008361935615539551, -0.0008084774017333984, -0.0007807612419128418, -0.0007530450820922852, -0.0007253289222717285, -0.0006976127624511719, -0.0006698966026306152, -0.0006421804428100586, -0.000614464282989502, -0.0005867481231689453, -0.0005590319633483887, -0.000531315803527832, -0.0005035996437072754, -0.00047588348388671875, -0.0004481673240661621, -0.00042045116424560547, -0.00039273500442504883, -0.0003650188446044922, -0.00033730268478393555, -0.0003095865249633789, -0.00028187036514282227, -0.0002541542053222656, -0.00022643804550170898, -0.00019872188568115234, -0.0001710057258605957, -0.00014328956604003906, -0.00011557340621948242, -8.785724639892578e-05, -6.014108657836914e-05, -3.24249267578125e-05, -4.708766937255859e-06, 2.300739288330078e-05, 5.072355270385742e-05, 7.843971252441406e-05, 0.0001061558723449707, 0.00013387203216552734, 0.00016158819198608398, 0.00018930435180664062, 0.00021702051162719727, 0.0002447366714477539, 0.00027245283126831055, 0.0003001689910888672, 0.00032788515090942383, 0.00035560131072998047, 0.0003833174705505371, 0.00041103363037109375, 0.0004387497901916504, 0.00046646595001220703, 0.0004941821098327637, 0.0005218982696533203, 0.000549614429473877, 0.0005773305892944336, 0.0006050467491149902, 0.0006327629089355469, 0.0006604790687561035, 0.0006881952285766602, 0.0007159113883972168, 0.0007436275482177734, 0.0007713437080383301, 0.0007990598678588867, 0.0008267760276794434, 0.0008544921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 8.0, 3.0, 9.0, 15.0, 13.0, 25.0, 40.0, 54.0, 71.0, 104.0, 145.0, 208.0, 268.0, 500.0, 751.0, 1223.0, 2105.0, 3688.0, 6581.0, 12563.0, 24403.0, 46640.0, 88175.0, 149480.0, 205669.0, 198857.0, 138578.0, 79202.0, 41827.0, 21578.0, 11246.0, 6073.0, 3257.0, 1875.0, 1145.0, 744.0, 486.0, 308.0, 162.0, 139.0, 94.0, 60.0, 40.0, 47.0, 27.0, 24.0, 10.0, 12.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.609375, -24.781005859375, -23.95263671875, -23.124267578125, -22.2958984375, -21.467529296875, -20.63916015625, -19.810791015625, -18.982421875, -18.154052734375, -17.32568359375, -16.497314453125, -15.6689453125, -14.840576171875, -14.01220703125, -13.183837890625, -12.35546875, -11.527099609375, -10.69873046875, -9.870361328125, -9.0419921875, -8.213623046875, -7.38525390625, -6.556884765625, -5.728515625, -4.900146484375, -4.07177734375, -3.243408203125, -2.4150390625, -1.586669921875, -0.75830078125, 0.070068359375, 0.8984375, 1.726806640625, 2.55517578125, 3.383544921875, 4.2119140625, 5.040283203125, 5.86865234375, 6.697021484375, 7.525390625, 8.353759765625, 9.18212890625, 10.010498046875, 10.8388671875, 11.667236328125, 12.49560546875, 13.323974609375, 14.15234375, 14.980712890625, 15.80908203125, 16.637451171875, 17.4658203125, 18.294189453125, 19.12255859375, 19.950927734375, 20.779296875, 21.607666015625, 22.43603515625, 23.264404296875, 24.0927734375, 24.921142578125, 25.74951171875, 26.577880859375, 27.40625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 17.0, 12.0, 18.0, 21.0, 30.0, 44.0, 21.0, 37.0, 44.0, 50.0, 53.0, 41.0, 56.0, 53.0, 58.0, 62.0, 63.0, 57.0, 37.0, 32.0, 24.0, 31.0, 19.0, 15.0, 13.0, 14.0, 7.0, 9.0, 10.0, 4.0, 3.0, 2.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.390625, -7.19158935546875, -6.9925537109375, -6.79351806640625, -6.594482421875, -6.39544677734375, -6.1964111328125, -5.99737548828125, -5.79833984375, -5.59930419921875, -5.4002685546875, -5.20123291015625, -5.002197265625, -4.80316162109375, -4.6041259765625, -4.40509033203125, -4.2060546875, -4.00701904296875, -3.8079833984375, -3.60894775390625, -3.409912109375, -3.21087646484375, -3.0118408203125, -2.81280517578125, -2.61376953125, -2.41473388671875, -2.2156982421875, -2.01666259765625, -1.817626953125, -1.61859130859375, -1.4195556640625, -1.22052001953125, -1.021484375, -0.82244873046875, -0.6234130859375, -0.42437744140625, -0.225341796875, -0.02630615234375, 0.1727294921875, 0.37176513671875, 0.57080078125, 0.76983642578125, 0.9688720703125, 1.16790771484375, 1.366943359375, 1.56597900390625, 1.7650146484375, 1.96405029296875, 2.1630859375, 2.36212158203125, 2.5611572265625, 2.76019287109375, 2.959228515625, 3.15826416015625, 3.3572998046875, 3.55633544921875, 3.75537109375, 3.95440673828125, 4.1534423828125, 4.35247802734375, 4.551513671875, 4.75054931640625, 4.9495849609375, 5.14862060546875, 5.34765625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 8.0, 7.0, 9.0, 11.0, 10.0, 13.0, 18.0, 29.0, 30.0, 26.0, 39.0, 51.0, 45.0, 61.0, 44.0, 60.0, 61.0, 57.0, 47.0, 48.0, 51.0, 43.0, 44.0, 32.0, 28.0, 25.0, 17.0, 17.0, 13.0, 8.0, 12.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21493148803711, -39.865421295166016, -38.515907287597656, -37.16639709472656, -35.81688690185547, -34.467376708984375, -33.11786651611328, -31.768352508544922, -30.418842315673828, -29.069332122802734, -27.719820022583008, -26.37030792236328, -25.020797729492188, -23.671287536621094, -22.321775436401367, -20.97226333618164, -19.622753143310547, -18.273242950439453, -16.923730850219727, -15.574219703674316, -14.224708557128906, -12.875197410583496, -11.525686264038086, -10.176175117492676, -8.826663970947266, -7.4771528244018555, -6.127641677856445, -4.778130531311035, -3.428619384765625, -2.079108238220215, -0.7295970916748047, 0.6199140548706055, 1.9694252014160156, 3.318936347961426, 4.668447494506836, 6.017958641052246, 7.367469787597656, 8.716980934143066, 10.066492080688477, 11.416003227233887, 12.765514373779297, 14.115025520324707, 15.464536666870117, 16.814048767089844, 18.163558959960938, 19.51306915283203, 20.862581253051758, 22.212093353271484, 23.561603546142578, 24.911113739013672, 26.2606258392334, 27.610137939453125, 28.95964813232422, 30.309158325195312, 31.65867042541504, 33.008182525634766, 34.35769271850586, 35.70720291137695, 37.05671691894531, 38.406227111816406, 39.7557373046875, 41.105247497558594, 42.45475769042969, 43.80427169799805, 45.15378189086914]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 7.0, 17.0, 9.0, 13.0, 8.0, 15.0, 18.0, 20.0, 25.0, 20.0, 29.0, 27.0, 33.0, 33.0, 34.0, 38.0, 44.0, 40.0, 32.0, 49.0, 48.0, 45.0, 47.0, 38.0, 32.0, 22.0, 44.0, 23.0, 25.0, 20.0, 17.0, 23.0, 13.0, 19.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.21017074584961, -24.417564392089844, -23.624958038330078, -22.832353591918945, -22.03974723815918, -21.247140884399414, -20.45453643798828, -19.661930084228516, -18.86932373046875, -18.076717376708984, -17.28411102294922, -16.491506576538086, -15.69890022277832, -14.906293869018555, -14.113688468933105, -13.321083068847656, -12.52847671508789, -11.735870361328125, -10.943264961242676, -10.150659561157227, -9.358053207397461, -8.565446853637695, -7.772841453552246, -6.980235576629639, -6.187629699707031, -5.395023822784424, -4.602417945861816, -3.809812068939209, -3.0172061920166016, -2.224600315093994, -1.4319944381713867, -0.6393885612487793, 0.1532154083251953, 0.9458212852478027, 1.7384271621704102, 2.5310330390930176, 3.323638916015625, 4.116244792938232, 4.90885066986084, 5.701456546783447, 6.494062423706055, 7.286668300628662, 8.07927417755127, 8.871879577636719, 9.664485931396484, 10.45709228515625, 11.2496976852417, 12.042303085327148, 12.834909439086914, 13.62751579284668, 14.420121192932129, 15.212726593017578, 16.005332946777344, 16.79793930053711, 17.590545654296875, 18.383150100708008, 19.175756454467773, 19.96836280822754, 20.760967254638672, 21.553573608398438, 22.346179962158203, 23.13878631591797, 23.931392669677734, 24.723997116088867, 25.516603469848633]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 16.0, 13.0, 23.0, 43.0, 52.0, 89.0, 136.0, 229.0, 320.0, 545.0, 808.0, 1269.0, 2064.0, 3129.0, 5350.0, 8854.0, 14758.0, 24836.0, 39970.0, 63968.0, 94843.0, 128732.0, 149965.0, 147091.0, 122194.0, 88413.0, 58215.0, 36580.0, 21975.0, 13349.0, 7909.0, 4832.0, 2998.0, 1826.0, 1162.0, 742.0, 445.0, 279.0, 187.0, 117.0, 81.0, 44.0, 33.0, 23.0, 16.0, 8.0, 11.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.25, -24.405517578125, -23.56103515625, -22.716552734375, -21.8720703125, -21.027587890625, -20.18310546875, -19.338623046875, -18.494140625, -17.649658203125, -16.80517578125, -15.960693359375, -15.1162109375, -14.271728515625, -13.42724609375, -12.582763671875, -11.73828125, -10.893798828125, -10.04931640625, -9.204833984375, -8.3603515625, -7.515869140625, -6.67138671875, -5.826904296875, -4.982421875, -4.137939453125, -3.29345703125, -2.448974609375, -1.6044921875, -0.760009765625, 0.08447265625, 0.928955078125, 1.7734375, 2.617919921875, 3.46240234375, 4.306884765625, 5.1513671875, 5.995849609375, 6.84033203125, 7.684814453125, 8.529296875, 9.373779296875, 10.21826171875, 11.062744140625, 11.9072265625, 12.751708984375, 13.59619140625, 14.440673828125, 15.28515625, 16.129638671875, 16.97412109375, 17.818603515625, 18.6630859375, 19.507568359375, 20.35205078125, 21.196533203125, 22.041015625, 22.885498046875, 23.72998046875, 24.574462890625, 25.4189453125, 26.263427734375, 27.10791015625, 27.952392578125, 28.796875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 11.0, 9.0, 15.0, 20.0, 22.0, 19.0, 12.0, 20.0, 16.0, 44.0, 30.0, 46.0, 33.0, 49.0, 51.0, 57.0, 65.0, 55.0, 42.0, 53.0, 46.0, 43.0, 34.0, 41.0, 31.0, 19.0, 24.0, 13.0, 18.0, 15.0, 11.0, 10.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.169189453125, -28.13525390625, -27.101318359375, -26.0673828125, -25.033447265625, -23.99951171875, -22.965576171875, -21.931640625, -20.897705078125, -19.86376953125, -18.829833984375, -17.7958984375, -16.761962890625, -15.72802734375, -14.694091796875, -13.66015625, -12.626220703125, -11.59228515625, -10.558349609375, -9.5244140625, -8.490478515625, -7.45654296875, -6.422607421875, -5.388671875, -4.354736328125, -3.32080078125, -2.286865234375, -1.2529296875, -0.218994140625, 0.81494140625, 1.848876953125, 2.8828125, 3.916748046875, 4.95068359375, 5.984619140625, 7.0185546875, 8.052490234375, 9.08642578125, 10.120361328125, 11.154296875, 12.188232421875, 13.22216796875, 14.256103515625, 15.2900390625, 16.323974609375, 17.35791015625, 18.391845703125, 19.42578125, 20.459716796875, 21.49365234375, 22.527587890625, 23.5615234375, 24.595458984375, 25.62939453125, 26.663330078125, 27.697265625, 28.731201171875, 29.76513671875, 30.799072265625, 31.8330078125, 32.866943359375, 33.90087890625, 34.934814453125, 35.96875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 0.0, 3.0, 3.0, 6.0, 6.0, 13.0, 18.0, 33.0, 33.0, 52.0, 72.0, 91.0, 167.0, 219.0, 323.0, 453.0, 710.0, 1186.0, 1961.0, 3251.0, 5777.0, 11110.0, 21896.0, 45688.0, 93532.0, 166494.0, 224217.0, 205476.0, 130613.0, 67702.0, 32429.0, 15839.0, 8157.0, 4205.0, 2551.0, 1484.0, 925.0, 619.0, 390.0, 249.0, 180.0, 112.0, 91.0, 82.0, 43.0, 24.0, 21.0, 19.0, 10.0, 3.0, 9.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.40625, -44.89794921875, -43.3896484375, -41.88134765625, -40.373046875, -38.86474609375, -37.3564453125, -35.84814453125, -34.33984375, -32.83154296875, -31.3232421875, -29.81494140625, -28.306640625, -26.79833984375, -25.2900390625, -23.78173828125, -22.2734375, -20.76513671875, -19.2568359375, -17.74853515625, -16.240234375, -14.73193359375, -13.2236328125, -11.71533203125, -10.20703125, -8.69873046875, -7.1904296875, -5.68212890625, -4.173828125, -2.66552734375, -1.1572265625, 0.35107421875, 1.859375, 3.36767578125, 4.8759765625, 6.38427734375, 7.892578125, 9.40087890625, 10.9091796875, 12.41748046875, 13.92578125, 15.43408203125, 16.9423828125, 18.45068359375, 19.958984375, 21.46728515625, 22.9755859375, 24.48388671875, 25.9921875, 27.50048828125, 29.0087890625, 30.51708984375, 32.025390625, 33.53369140625, 35.0419921875, 36.55029296875, 38.05859375, 39.56689453125, 41.0751953125, 42.58349609375, 44.091796875, 45.60009765625, 47.1083984375, 48.61669921875, 50.125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 5.0, 11.0, 8.0, 10.0, 12.0, 10.0, 23.0, 11.0, 21.0, 35.0, 25.0, 28.0, 39.0, 34.0, 35.0, 46.0, 38.0, 42.0, 45.0, 38.0, 35.0, 31.0, 46.0, 43.0, 38.0, 29.0, 24.0, 41.0, 31.0, 23.0, 21.0, 19.0, 22.0, 16.0, 14.0, 7.0, 9.0, 10.0, 2.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.015625, -20.408203125, -19.80078125, -19.193359375, -18.5859375, -17.978515625, -17.37109375, -16.763671875, -16.15625, -15.548828125, -14.94140625, -14.333984375, -13.7265625, -13.119140625, -12.51171875, -11.904296875, -11.296875, -10.689453125, -10.08203125, -9.474609375, -8.8671875, -8.259765625, -7.65234375, -7.044921875, -6.4375, -5.830078125, -5.22265625, -4.615234375, -4.0078125, -3.400390625, -2.79296875, -2.185546875, -1.578125, -0.970703125, -0.36328125, 0.244140625, 0.8515625, 1.458984375, 2.06640625, 2.673828125, 3.28125, 3.888671875, 4.49609375, 5.103515625, 5.7109375, 6.318359375, 6.92578125, 7.533203125, 8.140625, 8.748046875, 9.35546875, 9.962890625, 10.5703125, 11.177734375, 11.78515625, 12.392578125, 13.0, 13.607421875, 14.21484375, 14.822265625, 15.4296875, 16.037109375, 16.64453125, 17.251953125, 17.859375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 11.0, 16.0, 10.0, 21.0, 39.0, 55.0, 67.0, 95.0, 149.0, 180.0, 260.0, 336.0, 540.0, 869.0, 1378.0, 2185.0, 3661.0, 6296.0, 11546.0, 20937.0, 39877.0, 74570.0, 133868.0, 199478.0, 209265.0, 151496.0, 88069.0, 46782.0, 24714.0, 13176.0, 7542.0, 4186.0, 2471.0, 1505.0, 965.0, 587.0, 379.0, 265.0, 209.0, 153.0, 95.0, 74.0, 57.0, 36.0, 31.0, 20.0, 13.0, 13.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.4375, -25.662841796875, -24.88818359375, -24.113525390625, -23.3388671875, -22.564208984375, -21.78955078125, -21.014892578125, -20.240234375, -19.465576171875, -18.69091796875, -17.916259765625, -17.1416015625, -16.366943359375, -15.59228515625, -14.817626953125, -14.04296875, -13.268310546875, -12.49365234375, -11.718994140625, -10.9443359375, -10.169677734375, -9.39501953125, -8.620361328125, -7.845703125, -7.071044921875, -6.29638671875, -5.521728515625, -4.7470703125, -3.972412109375, -3.19775390625, -2.423095703125, -1.6484375, -0.873779296875, -0.09912109375, 0.675537109375, 1.4501953125, 2.224853515625, 2.99951171875, 3.774169921875, 4.548828125, 5.323486328125, 6.09814453125, 6.872802734375, 7.6474609375, 8.422119140625, 9.19677734375, 9.971435546875, 10.74609375, 11.520751953125, 12.29541015625, 13.070068359375, 13.8447265625, 14.619384765625, 15.39404296875, 16.168701171875, 16.943359375, 17.718017578125, 18.49267578125, 19.267333984375, 20.0419921875, 20.816650390625, 21.59130859375, 22.365966796875, 23.140625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 7.0, 8.0, 11.0, 11.0, 20.0, 29.0, 44.0, 67.0, 81.0, 95.0, 125.0, 119.0, 95.0, 81.0, 69.0, 47.0, 27.0, 21.0, 12.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032787322998046875, -0.0031517446041107178, -0.003024756908416748, -0.0028977692127227783, -0.0027707815170288086, -0.002643793821334839, -0.002516806125640869, -0.0023898184299468994, -0.0022628307342529297, -0.00213584303855896, -0.0020088553428649902, -0.0018818676471710205, -0.0017548799514770508, -0.001627892255783081, -0.0015009045600891113, -0.0013739168643951416, -0.0012469291687011719, -0.0011199414730072021, -0.0009929537773132324, -0.0008659660816192627, -0.000738978385925293, -0.0006119906902313232, -0.0004850029945373535, -0.0003580152988433838, -0.00023102760314941406, -0.00010403990745544434, 2.294778823852539e-05, 0.00014993548393249512, 0.00027692317962646484, 0.00040391087532043457, 0.0005308985710144043, 0.000657886266708374, 0.0007848739624023438, 0.0009118616580963135, 0.0010388493537902832, 0.001165837049484253, 0.0012928247451782227, 0.0014198124408721924, 0.0015468001365661621, 0.0016737878322601318, 0.0018007755279541016, 0.0019277632236480713, 0.002054750919342041, 0.0021817386150360107, 0.0023087263107299805, 0.00243571400642395, 0.00256270170211792, 0.0026896893978118896, 0.0028166770935058594, 0.002943664789199829, 0.003070652484893799, 0.0031976401805877686, 0.0033246278762817383, 0.003451615571975708, 0.0035786032676696777, 0.0037055909633636475, 0.003832578659057617, 0.003959566354751587, 0.004086554050445557, 0.004213541746139526, 0.004340529441833496, 0.004467517137527466, 0.0045945048332214355, 0.004721492528915405, 0.004848480224609375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 15.0, 16.0, 24.0, 47.0, 53.0, 80.0, 115.0, 178.0, 276.0, 424.0, 601.0, 951.0, 1412.0, 2361.0, 3652.0, 6230.0, 10685.0, 19082.0, 34887.0, 65306.0, 116803.0, 181193.0, 207424.0, 166589.0, 103035.0, 56502.0, 30140.0, 16533.0, 9468.0, 5475.0, 3268.0, 2042.0, 1250.0, 795.0, 534.0, 334.0, 237.0, 153.0, 113.0, 79.0, 54.0, 33.0, 31.0, 23.0, 9.0, 14.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-24.53125, -23.74951171875, -22.9677734375, -22.18603515625, -21.404296875, -20.62255859375, -19.8408203125, -19.05908203125, -18.27734375, -17.49560546875, -16.7138671875, -15.93212890625, -15.150390625, -14.36865234375, -13.5869140625, -12.80517578125, -12.0234375, -11.24169921875, -10.4599609375, -9.67822265625, -8.896484375, -8.11474609375, -7.3330078125, -6.55126953125, -5.76953125, -4.98779296875, -4.2060546875, -3.42431640625, -2.642578125, -1.86083984375, -1.0791015625, -0.29736328125, 0.484375, 1.26611328125, 2.0478515625, 2.82958984375, 3.611328125, 4.39306640625, 5.1748046875, 5.95654296875, 6.73828125, 7.52001953125, 8.3017578125, 9.08349609375, 9.865234375, 10.64697265625, 11.4287109375, 12.21044921875, 12.9921875, 13.77392578125, 14.5556640625, 15.33740234375, 16.119140625, 16.90087890625, 17.6826171875, 18.46435546875, 19.24609375, 20.02783203125, 20.8095703125, 21.59130859375, 22.373046875, 23.15478515625, 23.9365234375, 24.71826171875, 25.5]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 7.0, 16.0, 12.0, 20.0, 31.0, 30.0, 38.0, 44.0, 67.0, 65.0, 63.0, 93.0, 68.0, 74.0, 75.0, 65.0, 51.0, 26.0, 24.0, 22.0, 27.0, 10.0, 12.0, 8.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.9005126953125, -7.629150390625, -7.3577880859375, -7.08642578125, -6.8150634765625, -6.543701171875, -6.2723388671875, -6.0009765625, -5.7296142578125, -5.458251953125, -5.1868896484375, -4.91552734375, -4.6441650390625, -4.372802734375, -4.1014404296875, -3.830078125, -3.5587158203125, -3.287353515625, -3.0159912109375, -2.74462890625, -2.4732666015625, -2.201904296875, -1.9305419921875, -1.6591796875, -1.3878173828125, -1.116455078125, -0.8450927734375, -0.57373046875, -0.3023681640625, -0.031005859375, 0.2403564453125, 0.51171875, 0.7830810546875, 1.054443359375, 1.3258056640625, 1.59716796875, 1.8685302734375, 2.139892578125, 2.4112548828125, 2.6826171875, 2.9539794921875, 3.225341796875, 3.4967041015625, 3.76806640625, 4.0394287109375, 4.310791015625, 4.5821533203125, 4.853515625, 5.1248779296875, 5.396240234375, 5.6676025390625, 5.93896484375, 6.2103271484375, 6.481689453125, 6.7530517578125, 7.0244140625, 7.2957763671875, 7.567138671875, 7.8385009765625, 8.10986328125, 8.3812255859375, 8.652587890625, 8.9239501953125, 9.1953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 12.0, 8.0, 11.0, 12.0, 17.0, 26.0, 20.0, 20.0, 46.0, 37.0, 41.0, 50.0, 45.0, 45.0, 48.0, 38.0, 48.0, 47.0, 50.0, 43.0, 48.0, 41.0, 28.0, 37.0, 29.0, 19.0, 22.0, 21.0, 17.0, 10.0, 11.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.419578552246094, -34.14214324951172, -32.864707946777344, -31.58727264404297, -30.309837341308594, -29.03240203857422, -27.754966735839844, -26.47753143310547, -25.200096130371094, -23.92266082763672, -22.645225524902344, -21.36779022216797, -20.090354919433594, -18.81291961669922, -17.535484313964844, -16.25804901123047, -14.980615615844727, -13.703180313110352, -12.425745010375977, -11.148309707641602, -9.870874404907227, -8.593439102172852, -7.316004753112793, -6.038569450378418, -4.761134147644043, -3.483698844909668, -2.206263780593872, -0.9288287162780762, 0.34860658645629883, 1.6260418891906738, 2.9034767150878906, 4.180912017822266, 5.458347320556641, 6.735782623291016, 8.01321792602539, 9.290653228759766, 10.56808853149414, 11.845523834228516, 13.122958183288574, 14.40039348602295, 15.677828788757324, 16.955263137817383, 18.232698440551758, 19.510133743286133, 20.787569046020508, 22.065004348754883, 23.342439651489258, 24.619874954223633, 25.897310256958008, 27.174745559692383, 28.452180862426758, 29.729616165161133, 31.007051467895508, 32.28448486328125, 33.561920166015625, 34.83935546875, 36.116790771484375, 37.39422607421875, 38.671661376953125, 39.9490966796875, 41.226531982421875, 42.50396728515625, 43.781402587890625, 45.058837890625, 46.336273193359375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 6.0, 7.0, 12.0, 11.0, 13.0, 6.0, 28.0, 8.0, 24.0, 29.0, 24.0, 25.0, 33.0, 42.0, 38.0, 45.0, 35.0, 43.0, 49.0, 45.0, 52.0, 43.0, 31.0, 37.0, 34.0, 38.0, 29.0, 29.0, 30.0, 16.0, 29.0, 17.0, 14.0, 12.0, 15.0, 5.0, 5.0, 13.0, 12.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.991695404052734, -33.017005920410156, -32.042320251464844, -31.0676326751709, -30.092945098876953, -29.118255615234375, -28.14356803894043, -27.168880462646484, -26.19419288635254, -25.219505310058594, -24.24481773376465, -23.270130157470703, -22.295440673828125, -21.320755004882812, -20.346065521240234, -19.37137794494629, -18.396690368652344, -17.4220027923584, -16.447315216064453, -15.472626686096191, -14.497939109802246, -13.5232515335083, -12.548563003540039, -11.573875427246094, -10.599187850952148, -9.624500274658203, -8.649812698364258, -7.675124168395996, -6.700436592102051, -5.7257490158081055, -4.751060962677002, -3.7763729095458984, -2.801685333251953, -1.8269975185394287, -0.8523097038269043, 0.12237811088562012, 1.0970659255981445, 2.07175350189209, 3.0464415550231934, 4.021129608154297, 4.995817184448242, 5.9705047607421875, 6.945192813873291, 7.9198808670043945, 8.89456844329834, 9.869256019592285, 10.843944549560547, 11.818632125854492, 12.793319702148438, 13.768007278442383, 14.742694854736328, 15.71738338470459, 16.69207000732422, 17.666759490966797, 18.641447067260742, 19.616134643554688, 20.590822219848633, 21.565509796142578, 22.540197372436523, 23.51488494873047, 24.489574432373047, 25.46426010131836, 26.438949584960938, 27.413637161254883, 28.388324737548828]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 16.0, 14.0, 26.0, 50.0, 71.0, 116.0, 205.0, 337.0, 550.0, 1012.0, 1772.0, 3163.0, 5632.0, 10130.0, 18898.0, 35827.0, 69036.0, 135464.0, 268491.0, 501172.0, 789335.0, 886923.0, 670110.0, 385608.0, 198975.0, 100430.0, 51500.0, 26948.0, 14265.0, 7760.0, 4379.0, 2432.0, 1421.0, 811.0, 505.0, 297.0, 206.0, 129.0, 82.0, 73.0, 38.0, 18.0, 15.0, 14.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-43.53125, -42.1396484375, -40.748046875, -39.3564453125, -37.96484375, -36.5732421875, -35.181640625, -33.7900390625, -32.3984375, -31.0068359375, -29.615234375, -28.2236328125, -26.83203125, -25.4404296875, -24.048828125, -22.6572265625, -21.265625, -19.8740234375, -18.482421875, -17.0908203125, -15.69921875, -14.3076171875, -12.916015625, -11.5244140625, -10.1328125, -8.7412109375, -7.349609375, -5.9580078125, -4.56640625, -3.1748046875, -1.783203125, -0.3916015625, 1.0, 2.3916015625, 3.783203125, 5.1748046875, 6.56640625, 7.9580078125, 9.349609375, 10.7412109375, 12.1328125, 13.5244140625, 14.916015625, 16.3076171875, 17.69921875, 19.0908203125, 20.482421875, 21.8740234375, 23.265625, 24.6572265625, 26.048828125, 27.4404296875, 28.83203125, 30.2236328125, 31.615234375, 33.0068359375, 34.3984375, 35.7900390625, 37.181640625, 38.5732421875, 39.96484375, 41.3564453125, 42.748046875, 44.1396484375, 45.53125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 9.0, 5.0, 20.0, 14.0, 12.0, 14.0, 20.0, 17.0, 24.0, 22.0, 32.0, 36.0, 30.0, 42.0, 31.0, 39.0, 37.0, 42.0, 46.0, 46.0, 45.0, 42.0, 33.0, 36.0, 39.0, 41.0, 33.0, 32.0, 17.0, 22.0, 13.0, 12.0, 21.0, 15.0, 10.0, 8.0, 10.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.6875, -28.724609375, -27.76171875, -26.798828125, -25.8359375, -24.873046875, -23.91015625, -22.947265625, -21.984375, -21.021484375, -20.05859375, -19.095703125, -18.1328125, -17.169921875, -16.20703125, -15.244140625, -14.28125, -13.318359375, -12.35546875, -11.392578125, -10.4296875, -9.466796875, -8.50390625, -7.541015625, -6.578125, -5.615234375, -4.65234375, -3.689453125, -2.7265625, -1.763671875, -0.80078125, 0.162109375, 1.125, 2.087890625, 3.05078125, 4.013671875, 4.9765625, 5.939453125, 6.90234375, 7.865234375, 8.828125, 9.791015625, 10.75390625, 11.716796875, 12.6796875, 13.642578125, 14.60546875, 15.568359375, 16.53125, 17.494140625, 18.45703125, 19.419921875, 20.3828125, 21.345703125, 22.30859375, 23.271484375, 24.234375, 25.197265625, 26.16015625, 27.123046875, 28.0859375, 29.048828125, 30.01171875, 30.974609375, 31.9375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 7.0, 10.0, 11.0, 17.0, 29.0, 50.0, 58.0, 108.0, 136.0, 244.0, 362.0, 610.0, 965.0, 1613.0, 2535.0, 4119.0, 6812.0, 11763.0, 19568.0, 34178.0, 58718.0, 102402.0, 177157.0, 301787.0, 483858.0, 677016.0, 737788.0, 599140.0, 399391.0, 241594.0, 139803.0, 80501.0, 46005.0, 26826.0, 15665.0, 9264.0, 5455.0, 3309.0, 2007.0, 1260.0, 792.0, 501.0, 292.0, 223.0, 122.0, 91.0, 47.0, 32.0, 18.0, 19.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.71435546875, -46.0849609375, -44.45556640625, -42.826171875, -41.19677734375, -39.5673828125, -37.93798828125, -36.30859375, -34.67919921875, -33.0498046875, -31.42041015625, -29.791015625, -28.16162109375, -26.5322265625, -24.90283203125, -23.2734375, -21.64404296875, -20.0146484375, -18.38525390625, -16.755859375, -15.12646484375, -13.4970703125, -11.86767578125, -10.23828125, -8.60888671875, -6.9794921875, -5.35009765625, -3.720703125, -2.09130859375, -0.4619140625, 1.16748046875, 2.796875, 4.42626953125, 6.0556640625, 7.68505859375, 9.314453125, 10.94384765625, 12.5732421875, 14.20263671875, 15.83203125, 17.46142578125, 19.0908203125, 20.72021484375, 22.349609375, 23.97900390625, 25.6083984375, 27.23779296875, 28.8671875, 30.49658203125, 32.1259765625, 33.75537109375, 35.384765625, 37.01416015625, 38.6435546875, 40.27294921875, 41.90234375, 43.53173828125, 45.1611328125, 46.79052734375, 48.419921875, 50.04931640625, 51.6787109375, 53.30810546875, 54.9375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 13.0, 17.0, 31.0, 35.0, 29.0, 49.0, 56.0, 82.0, 90.0, 121.0, 160.0, 169.0, 203.0, 218.0, 257.0, 274.0, 258.0, 272.0, 233.0, 270.0, 239.0, 196.0, 158.0, 116.0, 94.0, 91.0, 65.0, 60.0, 51.0, 31.0, 32.0, 22.0, 15.0, 12.0, 10.0, 6.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.17333984375, -18.5498046875, -17.92626953125, -17.302734375, -16.67919921875, -16.0556640625, -15.43212890625, -14.80859375, -14.18505859375, -13.5615234375, -12.93798828125, -12.314453125, -11.69091796875, -11.0673828125, -10.44384765625, -9.8203125, -9.19677734375, -8.5732421875, -7.94970703125, -7.326171875, -6.70263671875, -6.0791015625, -5.45556640625, -4.83203125, -4.20849609375, -3.5849609375, -2.96142578125, -2.337890625, -1.71435546875, -1.0908203125, -0.46728515625, 0.15625, 0.77978515625, 1.4033203125, 2.02685546875, 2.650390625, 3.27392578125, 3.8974609375, 4.52099609375, 5.14453125, 5.76806640625, 6.3916015625, 7.01513671875, 7.638671875, 8.26220703125, 8.8857421875, 9.50927734375, 10.1328125, 10.75634765625, 11.3798828125, 12.00341796875, 12.626953125, 13.25048828125, 13.8740234375, 14.49755859375, 15.12109375, 15.74462890625, 16.3681640625, 16.99169921875, 17.615234375, 18.23876953125, 18.8623046875, 19.48583984375, 20.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 6.0, 15.0, 11.0, 14.0, 15.0, 30.0, 29.0, 34.0, 30.0, 40.0, 42.0, 49.0, 44.0, 41.0, 54.0, 58.0, 46.0, 55.0, 54.0, 45.0, 43.0, 21.0, 38.0, 27.0, 23.0, 23.0, 23.0, 16.0, 6.0, 11.0, 10.0, 12.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.776466369628906, -52.83802032470703, -50.89957046508789, -48.961124420166016, -47.022674560546875, -45.084228515625, -43.145782470703125, -41.207332611083984, -39.268882751464844, -37.33043670654297, -35.39198684692383, -33.45354080200195, -31.515090942382812, -29.576644897460938, -27.63819694519043, -25.699748992919922, -23.761302947998047, -21.82285499572754, -19.88440704345703, -17.945960998535156, -16.007511138916016, -14.069064140319824, -12.130617141723633, -10.192169189453125, -8.253721237182617, -6.315273284912109, -4.37682580947876, -2.43837833404541, -0.49993038177490234, 1.4385175704956055, 3.376964569091797, 5.315412521362305, 7.2538604736328125, 9.19230842590332, 11.130756378173828, 13.06920337677002, 15.007651329040527, 16.94609832763672, 18.884546279907227, 20.822994232177734, 22.761442184448242, 24.69989013671875, 26.638338088989258, 28.576786041259766, 30.51523208618164, 32.45368194580078, 34.392127990722656, 36.33057403564453, 38.26902389526367, 40.20746994018555, 42.14591979980469, 44.08436584472656, 46.0228157043457, 47.96126174926758, 49.89971160888672, 51.838157653808594, 53.77660369873047, 55.715049743652344, 57.653499603271484, 59.59194564819336, 61.5303955078125, 63.468841552734375, 65.40728759765625, 67.34573364257812, 69.28418731689453]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 12.0, 6.0, 9.0, 9.0, 10.0, 18.0, 20.0, 21.0, 26.0, 22.0, 30.0, 29.0, 38.0, 31.0, 42.0, 34.0, 41.0, 48.0, 37.0, 41.0, 32.0, 34.0, 37.0, 31.0, 37.0, 45.0, 29.0, 35.0, 26.0, 23.0, 22.0, 12.0, 15.0, 13.0, 12.0, 13.0, 12.0, 14.0, 4.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.55194854736328, -44.18765640258789, -42.8233642578125, -41.459068298339844, -40.09477615356445, -38.73048400878906, -37.36619186401367, -36.00189971923828, -34.637603759765625, -33.273311614990234, -31.90901756286621, -30.54472541809082, -29.180431365966797, -27.816139221191406, -26.451847076416016, -25.087554931640625, -23.723262786865234, -22.358970642089844, -20.99467658996582, -19.63038444519043, -18.266090393066406, -16.901798248291016, -15.537506103515625, -14.173213005065918, -12.808919906616211, -11.444626808166504, -10.080333709716797, -8.716041564941406, -7.351748466491699, -5.987455368041992, -4.623163223266602, -3.2588701248168945, -1.8945770263671875, -0.5302841663360596, 0.8340086936950684, 2.198301315307617, 3.562594413757324, 4.926887512207031, 6.291179656982422, 7.655472755432129, 9.019765853881836, 10.384058952331543, 11.74835205078125, 13.11264419555664, 14.476937294006348, 15.841230392456055, 17.205522537231445, 18.56981658935547, 19.93410873413086, 21.29840087890625, 22.662694931030273, 24.026987075805664, 25.391281127929688, 26.755573272705078, 28.11986541748047, 29.48415756225586, 30.848451614379883, 32.212745666503906, 33.5770378112793, 34.94132995605469, 36.30562210083008, 37.66991424560547, 39.034210205078125, 40.398502349853516, 41.762794494628906]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 12.0, 18.0, 34.0, 40.0, 57.0, 98.0, 132.0, 228.0, 314.0, 426.0, 689.0, 1040.0, 1622.0, 2529.0, 3679.0, 5609.0, 8628.0, 13261.0, 20639.0, 32014.0, 47661.0, 70233.0, 97913.0, 123687.0, 137379.0, 130417.0, 107484.0, 80126.0, 55740.0, 37235.0, 24151.0, 15835.0, 10360.0, 6558.0, 4394.0, 2851.0, 1958.0, 1177.0, 774.0, 559.0, 334.0, 182.0, 166.0, 104.0, 71.0, 65.0, 24.0, 19.0, 14.0, 8.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-25.25, -24.453125, -23.65625, -22.859375, -22.0625, -21.265625, -20.46875, -19.671875, -18.875, -18.078125, -17.28125, -16.484375, -15.6875, -14.890625, -14.09375, -13.296875, -12.5, -11.703125, -10.90625, -10.109375, -9.3125, -8.515625, -7.71875, -6.921875, -6.125, -5.328125, -4.53125, -3.734375, -2.9375, -2.140625, -1.34375, -0.546875, 0.25, 1.046875, 1.84375, 2.640625, 3.4375, 4.234375, 5.03125, 5.828125, 6.625, 7.421875, 8.21875, 9.015625, 9.8125, 10.609375, 11.40625, 12.203125, 13.0, 13.796875, 14.59375, 15.390625, 16.1875, 16.984375, 17.78125, 18.578125, 19.375, 20.171875, 20.96875, 21.765625, 22.5625, 23.359375, 24.15625, 24.953125, 25.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 9.0, 14.0, 9.0, 12.0, 25.0, 22.0, 21.0, 28.0, 30.0, 34.0, 47.0, 28.0, 39.0, 38.0, 36.0, 54.0, 40.0, 45.0, 32.0, 33.0, 47.0, 39.0, 41.0, 39.0, 34.0, 30.0, 26.0, 23.0, 12.0, 13.0, 10.0, 15.0, 14.0, 9.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.53125, -46.95654296875, -45.3818359375, -43.80712890625, -42.232421875, -40.65771484375, -39.0830078125, -37.50830078125, -35.93359375, -34.35888671875, -32.7841796875, -31.20947265625, -29.634765625, -28.06005859375, -26.4853515625, -24.91064453125, -23.3359375, -21.76123046875, -20.1865234375, -18.61181640625, -17.037109375, -15.46240234375, -13.8876953125, -12.31298828125, -10.73828125, -9.16357421875, -7.5888671875, -6.01416015625, -4.439453125, -2.86474609375, -1.2900390625, 0.28466796875, 1.859375, 3.43408203125, 5.0087890625, 6.58349609375, 8.158203125, 9.73291015625, 11.3076171875, 12.88232421875, 14.45703125, 16.03173828125, 17.6064453125, 19.18115234375, 20.755859375, 22.33056640625, 23.9052734375, 25.47998046875, 27.0546875, 28.62939453125, 30.2041015625, 31.77880859375, 33.353515625, 34.92822265625, 36.5029296875, 38.07763671875, 39.65234375, 41.22705078125, 42.8017578125, 44.37646484375, 45.951171875, 47.52587890625, 49.1005859375, 50.67529296875, 52.25]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 16.0, 14.0, 36.0, 56.0, 69.0, 93.0, 177.0, 264.0, 466.0, 659.0, 1133.0, 1787.0, 2996.0, 5131.0, 9326.0, 16460.0, 29720.0, 54483.0, 97210.0, 158343.0, 207225.0, 184016.0, 121621.0, 69980.0, 38395.0, 21172.0, 11760.0, 6390.0, 3687.0, 2291.0, 1339.0, 798.0, 485.0, 344.0, 202.0, 132.0, 85.0, 60.0, 46.0, 23.0, 28.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.21875, -36.8876953125, -35.556640625, -34.2255859375, -32.89453125, -31.5634765625, -30.232421875, -28.9013671875, -27.5703125, -26.2392578125, -24.908203125, -23.5771484375, -22.24609375, -20.9150390625, -19.583984375, -18.2529296875, -16.921875, -15.5908203125, -14.259765625, -12.9287109375, -11.59765625, -10.2666015625, -8.935546875, -7.6044921875, -6.2734375, -4.9423828125, -3.611328125, -2.2802734375, -0.94921875, 0.3818359375, 1.712890625, 3.0439453125, 4.375, 5.7060546875, 7.037109375, 8.3681640625, 9.69921875, 11.0302734375, 12.361328125, 13.6923828125, 15.0234375, 16.3544921875, 17.685546875, 19.0166015625, 20.34765625, 21.6787109375, 23.009765625, 24.3408203125, 25.671875, 27.0029296875, 28.333984375, 29.6650390625, 30.99609375, 32.3271484375, 33.658203125, 34.9892578125, 36.3203125, 37.6513671875, 38.982421875, 40.3134765625, 41.64453125, 42.9755859375, 44.306640625, 45.6376953125, 46.96875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 4.0, 7.0, 12.0, 11.0, 19.0, 20.0, 19.0, 35.0, 25.0, 24.0, 33.0, 32.0, 38.0, 32.0, 58.0, 57.0, 47.0, 42.0, 36.0, 36.0, 32.0, 39.0, 33.0, 40.0, 35.0, 35.0, 33.0, 27.0, 24.0, 19.0, 21.0, 15.0, 7.0, 9.0, 5.0, 11.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.3125, -24.433349609375, -23.55419921875, -22.675048828125, -21.7958984375, -20.916748046875, -20.03759765625, -19.158447265625, -18.279296875, -17.400146484375, -16.52099609375, -15.641845703125, -14.7626953125, -13.883544921875, -13.00439453125, -12.125244140625, -11.24609375, -10.366943359375, -9.48779296875, -8.608642578125, -7.7294921875, -6.850341796875, -5.97119140625, -5.092041015625, -4.212890625, -3.333740234375, -2.45458984375, -1.575439453125, -0.6962890625, 0.182861328125, 1.06201171875, 1.941162109375, 2.8203125, 3.699462890625, 4.57861328125, 5.457763671875, 6.3369140625, 7.216064453125, 8.09521484375, 8.974365234375, 9.853515625, 10.732666015625, 11.61181640625, 12.490966796875, 13.3701171875, 14.249267578125, 15.12841796875, 16.007568359375, 16.88671875, 17.765869140625, 18.64501953125, 19.524169921875, 20.4033203125, 21.282470703125, 22.16162109375, 23.040771484375, 23.919921875, 24.799072265625, 25.67822265625, 26.557373046875, 27.4365234375, 28.315673828125, 29.19482421875, 30.073974609375, 30.953125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 15.0, 16.0, 19.0, 39.0, 43.0, 72.0, 113.0, 189.0, 291.0, 444.0, 794.0, 1286.0, 2282.0, 3925.0, 7162.0, 12988.0, 24749.0, 47365.0, 88257.0, 157779.0, 225541.0, 203013.0, 126129.0, 68411.0, 35478.0, 18732.0, 10119.0, 5668.0, 3097.0, 1721.0, 1076.0, 630.0, 387.0, 254.0, 150.0, 107.0, 60.0, 40.0, 39.0, 21.0, 19.0, 9.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.578125, -20.8017578125, -20.025390625, -19.2490234375, -18.47265625, -17.6962890625, -16.919921875, -16.1435546875, -15.3671875, -14.5908203125, -13.814453125, -13.0380859375, -12.26171875, -11.4853515625, -10.708984375, -9.9326171875, -9.15625, -8.3798828125, -7.603515625, -6.8271484375, -6.05078125, -5.2744140625, -4.498046875, -3.7216796875, -2.9453125, -2.1689453125, -1.392578125, -0.6162109375, 0.16015625, 0.9365234375, 1.712890625, 2.4892578125, 3.265625, 4.0419921875, 4.818359375, 5.5947265625, 6.37109375, 7.1474609375, 7.923828125, 8.7001953125, 9.4765625, 10.2529296875, 11.029296875, 11.8056640625, 12.58203125, 13.3583984375, 14.134765625, 14.9111328125, 15.6875, 16.4638671875, 17.240234375, 18.0166015625, 18.79296875, 19.5693359375, 20.345703125, 21.1220703125, 21.8984375, 22.6748046875, 23.451171875, 24.2275390625, 25.00390625, 25.7802734375, 26.556640625, 27.3330078125, 28.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 6.0, 5.0, 8.0, 14.0, 13.0, 18.0, 22.0, 23.0, 33.0, 33.0, 28.0, 51.0, 39.0, 39.0, 53.0, 52.0, 43.0, 48.0, 50.0, 46.0, 46.0, 40.0, 30.0, 29.0, 29.0, 27.0, 32.0, 16.0, 12.0, 18.0, 13.0, 15.0, 16.0, 12.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008177757263183594, -0.0007904618978500366, -0.0007631480693817139, -0.0007358342409133911, -0.0007085204124450684, -0.0006812065839767456, -0.0006538927555084229, -0.0006265789270401001, -0.0005992650985717773, -0.0005719512701034546, -0.0005446374416351318, -0.0005173236131668091, -0.0004900097846984863, -0.0004626959562301636, -0.0004353821277618408, -0.00040806829929351807, -0.0003807544708251953, -0.00035344064235687256, -0.0003261268138885498, -0.00029881298542022705, -0.0002714991569519043, -0.00024418532848358154, -0.0002168715000152588, -0.00018955767154693604, -0.00016224384307861328, -0.00013493001461029053, -0.00010761618614196777, -8.030235767364502e-05, -5.2988529205322266e-05, -2.5674700736999512e-05, 1.6391277313232422e-06, 2.8952956199645996e-05, 5.626678466796875e-05, 8.35806131362915e-05, 0.00011089444160461426, 0.000138208270072937, 0.00016552209854125977, 0.00019283592700958252, 0.00022014975547790527, 0.00024746358394622803, 0.0002747774124145508, 0.00030209124088287354, 0.0003294050693511963, 0.00035671889781951904, 0.0003840327262878418, 0.00041134655475616455, 0.0004386603832244873, 0.00046597421169281006, 0.0004932880401611328, 0.0005206018686294556, 0.0005479156970977783, 0.0005752295255661011, 0.0006025433540344238, 0.0006298571825027466, 0.0006571710109710693, 0.0006844848394393921, 0.0007117986679077148, 0.0007391124963760376, 0.0007664263248443604, 0.0007937401533126831, 0.0008210539817810059, 0.0008483678102493286, 0.0008756816387176514, 0.0009029954671859741, 0.0009303092956542969]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 6.0, 4.0, 6.0, 5.0, 14.0, 15.0, 22.0, 29.0, 41.0, 75.0, 85.0, 159.0, 224.0, 280.0, 500.0, 732.0, 1141.0, 1849.0, 2863.0, 4708.0, 8049.0, 14632.0, 26361.0, 48814.0, 86490.0, 139372.0, 188151.0, 186947.0, 139789.0, 86278.0, 48794.0, 26455.0, 14807.0, 8248.0, 4646.0, 2837.0, 1817.0, 1141.0, 742.0, 443.0, 306.0, 197.0, 165.0, 109.0, 56.0, 51.0, 36.0, 30.0, 16.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.5625, -22.75, -21.9375, -21.125, -20.3125, -19.5, -18.6875, -17.875, -17.0625, -16.25, -15.4375, -14.625, -13.8125, -13.0, -12.1875, -11.375, -10.5625, -9.75, -8.9375, -8.125, -7.3125, -6.5, -5.6875, -4.875, -4.0625, -3.25, -2.4375, -1.625, -0.8125, 0.0, 0.8125, 1.625, 2.4375, 3.25, 4.0625, 4.875, 5.6875, 6.5, 7.3125, 8.125, 8.9375, 9.75, 10.5625, 11.375, 12.1875, 13.0, 13.8125, 14.625, 15.4375, 16.25, 17.0625, 17.875, 18.6875, 19.5, 20.3125, 21.125, 21.9375, 22.75, 23.5625, 24.375, 25.1875, 26.0, 26.8125, 27.625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 4.0, 7.0, 9.0, 7.0, 15.0, 17.0, 14.0, 15.0, 18.0, 25.0, 33.0, 33.0, 27.0, 41.0, 39.0, 50.0, 59.0, 52.0, 46.0, 39.0, 56.0, 57.0, 48.0, 43.0, 40.0, 31.0, 27.0, 19.0, 17.0, 17.0, 18.0, 11.0, 9.0, 13.0, 5.0, 10.0, 2.0, 6.0, 3.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-7.03125, -6.82421875, -6.6171875, -6.41015625, -6.203125, -5.99609375, -5.7890625, -5.58203125, -5.375, -5.16796875, -4.9609375, -4.75390625, -4.546875, -4.33984375, -4.1328125, -3.92578125, -3.71875, -3.51171875, -3.3046875, -3.09765625, -2.890625, -2.68359375, -2.4765625, -2.26953125, -2.0625, -1.85546875, -1.6484375, -1.44140625, -1.234375, -1.02734375, -0.8203125, -0.61328125, -0.40625, -0.19921875, 0.0078125, 0.21484375, 0.421875, 0.62890625, 0.8359375, 1.04296875, 1.25, 1.45703125, 1.6640625, 1.87109375, 2.078125, 2.28515625, 2.4921875, 2.69921875, 2.90625, 3.11328125, 3.3203125, 3.52734375, 3.734375, 3.94140625, 4.1484375, 4.35546875, 4.5625, 4.76953125, 4.9765625, 5.18359375, 5.390625, 5.59765625, 5.8046875, 6.01171875, 6.21875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 21.0, 26.0, 34.0, 36.0, 34.0, 35.0, 41.0, 52.0, 39.0, 48.0, 53.0, 45.0, 43.0, 56.0, 43.0, 47.0, 39.0, 30.0, 36.0, 23.0, 22.0, 21.0, 20.0, 15.0, 13.0, 12.0, 15.0, 4.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.782806396484375, -50.89947509765625, -49.016143798828125, -47.132808685302734, -45.24947738647461, -43.366146087646484, -41.482810974121094, -39.59947967529297, -37.716148376464844, -35.83281707763672, -33.949485778808594, -32.0661506652832, -30.182819366455078, -28.299488067626953, -26.416154861450195, -24.532821655273438, -22.649490356445312, -20.766159057617188, -18.88282585144043, -16.999492645263672, -15.116161346435547, -13.232829093933105, -11.349496841430664, -9.466164588928223, -7.582832336425781, -5.69950008392334, -3.8161678314208984, -1.932835578918457, -0.049503326416015625, 1.8338289260864258, 3.717161178588867, 5.600493431091309, 7.48382568359375, 9.367157936096191, 11.250490188598633, 13.133822441101074, 15.017154693603516, 16.90048599243164, 18.7838191986084, 20.667152404785156, 22.55048370361328, 24.433815002441406, 26.317148208618164, 28.200481414794922, 30.083812713623047, 31.967144012451172, 33.85047912597656, 35.73381042480469, 37.61714172363281, 39.50047302246094, 41.38380432128906, 43.26713943481445, 45.15047073364258, 47.0338020324707, 48.917137145996094, 50.80046844482422, 52.683799743652344, 54.56713104248047, 56.450462341308594, 58.333797454833984, 60.21712875366211, 62.100460052490234, 63.983795166015625, 65.86712646484375, 67.75045776367188]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 5.0, 10.0, 11.0, 15.0, 16.0, 20.0, 26.0, 21.0, 30.0, 39.0, 29.0, 31.0, 37.0, 38.0, 40.0, 50.0, 44.0, 31.0, 35.0, 44.0, 29.0, 30.0, 41.0, 42.0, 29.0, 42.0, 27.0, 24.0, 19.0, 16.0, 14.0, 13.0, 10.0, 11.0, 16.0, 9.0, 11.0, 3.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.820247650146484, -45.43103790283203, -44.04182815551758, -42.652618408203125, -41.263404846191406, -39.87419509887695, -38.4849853515625, -37.09577560424805, -35.706565856933594, -34.31735610961914, -32.92814636230469, -31.5389347076416, -30.149723052978516, -28.760513305664062, -27.37130355834961, -25.982093811035156, -24.592880249023438, -23.203670501708984, -21.8144588470459, -20.425249099731445, -19.03603744506836, -17.646827697753906, -16.257617950439453, -14.868407249450684, -13.479196548461914, -12.089985847473145, -10.700775146484375, -9.311565399169922, -7.922354698181152, -6.533143997192383, -5.14393424987793, -3.75472354888916, -2.3655128479003906, -0.9763023853302002, 0.41290807723999023, 1.8021183013916016, 3.191329002380371, 4.580539703369141, 5.969749450683594, 7.358960151672363, 8.748170852661133, 10.137381553649902, 11.526592254638672, 12.915802001953125, 14.305012702941895, 15.694223403930664, 17.083433151245117, 18.472644805908203, 19.861854553222656, 21.25106430053711, 22.640275955200195, 24.02948570251465, 25.418697357177734, 26.807907104492188, 28.19711685180664, 29.586326599121094, 30.97553825378418, 32.364749908447266, 33.75395965576172, 35.14316940307617, 36.532379150390625, 37.921592712402344, 39.31079864501953, 40.70001220703125, 42.0892219543457]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 12.0, 12.0, 14.0, 31.0, 41.0, 64.0, 82.0, 111.0, 198.0, 290.0, 374.0, 592.0, 904.0, 1304.0, 2012.0, 2858.0, 4231.0, 6128.0, 9091.0, 13072.0, 19207.0, 27290.0, 38282.0, 52715.0, 69469.0, 87459.0, 102190.0, 109943.0, 107545.0, 96194.0, 79966.0, 62387.0, 46283.0, 33480.0, 23427.0, 16195.0, 11346.0, 7540.0, 5143.0, 3526.0, 2375.0, 1669.0, 1137.0, 797.0, 499.0, 327.0, 254.0, 170.0, 122.0, 66.0, 59.0, 25.0, 20.0, 12.0, 6.0, 8.0, 5.0, 1.0, 2.0], "bins": [-28.015625, -27.1611328125, -26.306640625, -25.4521484375, -24.59765625, -23.7431640625, -22.888671875, -22.0341796875, -21.1796875, -20.3251953125, -19.470703125, -18.6162109375, -17.76171875, -16.9072265625, -16.052734375, -15.1982421875, -14.34375, -13.4892578125, -12.634765625, -11.7802734375, -10.92578125, -10.0712890625, -9.216796875, -8.3623046875, -7.5078125, -6.6533203125, -5.798828125, -4.9443359375, -4.08984375, -3.2353515625, -2.380859375, -1.5263671875, -0.671875, 0.1826171875, 1.037109375, 1.8916015625, 2.74609375, 3.6005859375, 4.455078125, 5.3095703125, 6.1640625, 7.0185546875, 7.873046875, 8.7275390625, 9.58203125, 10.4365234375, 11.291015625, 12.1455078125, 13.0, 13.8544921875, 14.708984375, 15.5634765625, 16.41796875, 17.2724609375, 18.126953125, 18.9814453125, 19.8359375, 20.6904296875, 21.544921875, 22.3994140625, 23.25390625, 24.1083984375, 24.962890625, 25.8173828125, 26.671875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 5.0, 8.0, 11.0, 6.0, 7.0, 5.0, 17.0, 15.0, 19.0, 27.0, 30.0, 23.0, 32.0, 31.0, 35.0, 42.0, 34.0, 37.0, 39.0, 38.0, 42.0, 44.0, 30.0, 37.0, 34.0, 29.0, 34.0, 44.0, 44.0, 22.0, 28.0, 19.0, 22.0, 18.0, 14.0, 15.0, 6.0, 5.0, 11.0, 9.0, 4.0, 6.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.28125, -39.89208984375, -38.5029296875, -37.11376953125, -35.724609375, -34.33544921875, -32.9462890625, -31.55712890625, -30.16796875, -28.77880859375, -27.3896484375, -26.00048828125, -24.611328125, -23.22216796875, -21.8330078125, -20.44384765625, -19.0546875, -17.66552734375, -16.2763671875, -14.88720703125, -13.498046875, -12.10888671875, -10.7197265625, -9.33056640625, -7.94140625, -6.55224609375, -5.1630859375, -3.77392578125, -2.384765625, -0.99560546875, 0.3935546875, 1.78271484375, 3.171875, 4.56103515625, 5.9501953125, 7.33935546875, 8.728515625, 10.11767578125, 11.5068359375, 12.89599609375, 14.28515625, 15.67431640625, 17.0634765625, 18.45263671875, 19.841796875, 21.23095703125, 22.6201171875, 24.00927734375, 25.3984375, 26.78759765625, 28.1767578125, 29.56591796875, 30.955078125, 32.34423828125, 33.7333984375, 35.12255859375, 36.51171875, 37.90087890625, 39.2900390625, 40.67919921875, 42.068359375, 43.45751953125, 44.8466796875, 46.23583984375, 47.625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 6.0, 19.0, 27.0, 38.0, 62.0, 84.0, 113.0, 172.0, 287.0, 383.0, 620.0, 867.0, 1356.0, 2183.0, 3352.0, 5436.0, 8888.0, 14929.0, 25966.0, 45965.0, 82188.0, 138235.0, 193126.0, 192920.0, 138013.0, 82274.0, 46152.0, 26217.0, 14816.0, 8722.0, 5509.0, 3420.0, 2090.0, 1365.0, 909.0, 601.0, 407.0, 288.0, 156.0, 117.0, 86.0, 62.0, 36.0, 32.0, 23.0, 13.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.5625, -72.232421875, -69.90234375, -67.572265625, -65.2421875, -62.912109375, -60.58203125, -58.251953125, -55.921875, -53.591796875, -51.26171875, -48.931640625, -46.6015625, -44.271484375, -41.94140625, -39.611328125, -37.28125, -34.951171875, -32.62109375, -30.291015625, -27.9609375, -25.630859375, -23.30078125, -20.970703125, -18.640625, -16.310546875, -13.98046875, -11.650390625, -9.3203125, -6.990234375, -4.66015625, -2.330078125, 0.0, 2.330078125, 4.66015625, 6.990234375, 9.3203125, 11.650390625, 13.98046875, 16.310546875, 18.640625, 20.970703125, 23.30078125, 25.630859375, 27.9609375, 30.291015625, 32.62109375, 34.951171875, 37.28125, 39.611328125, 41.94140625, 44.271484375, 46.6015625, 48.931640625, 51.26171875, 53.591796875, 55.921875, 58.251953125, 60.58203125, 62.912109375, 65.2421875, 67.572265625, 69.90234375, 72.232421875, 74.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 13.0, 14.0, 14.0, 15.0, 20.0, 21.0, 15.0, 32.0, 28.0, 31.0, 34.0, 39.0, 46.0, 32.0, 45.0, 54.0, 58.0, 36.0, 34.0, 40.0, 50.0, 51.0, 31.0, 25.0, 29.0, 24.0, 20.0, 31.0, 16.0, 12.0, 11.0, 12.0, 16.0, 11.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.8125, -34.59326171875, -33.3740234375, -32.15478515625, -30.935546875, -29.71630859375, -28.4970703125, -27.27783203125, -26.05859375, -24.83935546875, -23.6201171875, -22.40087890625, -21.181640625, -19.96240234375, -18.7431640625, -17.52392578125, -16.3046875, -15.08544921875, -13.8662109375, -12.64697265625, -11.427734375, -10.20849609375, -8.9892578125, -7.77001953125, -6.55078125, -5.33154296875, -4.1123046875, -2.89306640625, -1.673828125, -0.45458984375, 0.7646484375, 1.98388671875, 3.203125, 4.42236328125, 5.6416015625, 6.86083984375, 8.080078125, 9.29931640625, 10.5185546875, 11.73779296875, 12.95703125, 14.17626953125, 15.3955078125, 16.61474609375, 17.833984375, 19.05322265625, 20.2724609375, 21.49169921875, 22.7109375, 23.93017578125, 25.1494140625, 26.36865234375, 27.587890625, 28.80712890625, 30.0263671875, 31.24560546875, 32.46484375, 33.68408203125, 34.9033203125, 36.12255859375, 37.341796875, 38.56103515625, 39.7802734375, 40.99951171875, 42.21875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 16.0, 12.0, 17.0, 37.0, 42.0, 68.0, 118.0, 171.0, 285.0, 563.0, 875.0, 1615.0, 2933.0, 5321.0, 9907.0, 19371.0, 38934.0, 79463.0, 151829.0, 226254.0, 220710.0, 141216.0, 74297.0, 36163.0, 18177.0, 9163.0, 4863.0, 2606.0, 1448.0, 801.0, 484.0, 284.0, 176.0, 85.0, 68.0, 56.0, 34.0, 23.0, 17.0, 6.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-52.15625, -50.61962890625, -49.0830078125, -47.54638671875, -46.009765625, -44.47314453125, -42.9365234375, -41.39990234375, -39.86328125, -38.32666015625, -36.7900390625, -35.25341796875, -33.716796875, -32.18017578125, -30.6435546875, -29.10693359375, -27.5703125, -26.03369140625, -24.4970703125, -22.96044921875, -21.423828125, -19.88720703125, -18.3505859375, -16.81396484375, -15.27734375, -13.74072265625, -12.2041015625, -10.66748046875, -9.130859375, -7.59423828125, -6.0576171875, -4.52099609375, -2.984375, -1.44775390625, 0.0888671875, 1.62548828125, 3.162109375, 4.69873046875, 6.2353515625, 7.77197265625, 9.30859375, 10.84521484375, 12.3818359375, 13.91845703125, 15.455078125, 16.99169921875, 18.5283203125, 20.06494140625, 21.6015625, 23.13818359375, 24.6748046875, 26.21142578125, 27.748046875, 29.28466796875, 30.8212890625, 32.35791015625, 33.89453125, 35.43115234375, 36.9677734375, 38.50439453125, 40.041015625, 41.57763671875, 43.1142578125, 44.65087890625, 46.1875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 4.0, 11.0, 8.0, 10.0, 14.0, 6.0, 20.0, 33.0, 40.0, 48.0, 69.0, 75.0, 77.0, 76.0, 106.0, 82.0, 81.0, 58.0, 44.0, 28.0, 34.0, 15.0, 23.0, 6.0, 12.0, 3.0, 3.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005977630615234375, -0.00580209493637085, -0.005626559257507324, -0.005451023578643799, -0.0052754878997802734, -0.005099952220916748, -0.004924416542053223, -0.004748880863189697, -0.004573345184326172, -0.0043978095054626465, -0.004222273826599121, -0.004046738147735596, -0.0038712024688720703, -0.003695666790008545, -0.0035201311111450195, -0.003344595432281494, -0.0031690597534179688, -0.0029935240745544434, -0.002817988395690918, -0.0026424527168273926, -0.002466917037963867, -0.002291381359100342, -0.0021158456802368164, -0.001940310001373291, -0.0017647743225097656, -0.0015892386436462402, -0.0014137029647827148, -0.0012381672859191895, -0.001062631607055664, -0.0008870959281921387, -0.0007115602493286133, -0.0005360245704650879, -0.0003604888916015625, -0.0001849532127380371, -9.417533874511719e-06, 0.00016611814498901367, 0.00034165382385253906, 0.0005171895027160645, 0.0006927251815795898, 0.0008682608604431152, 0.0010437965393066406, 0.001219332218170166, 0.0013948678970336914, 0.0015704035758972168, 0.0017459392547607422, 0.0019214749336242676, 0.002097010612487793, 0.0022725462913513184, 0.0024480819702148438, 0.002623617649078369, 0.0027991533279418945, 0.00297468900680542, 0.0031502246856689453, 0.0033257603645324707, 0.003501296043395996, 0.0036768317222595215, 0.003852367401123047, 0.004027903079986572, 0.004203438758850098, 0.004378974437713623, 0.0045545101165771484, 0.004730045795440674, 0.004905581474304199, 0.005081117153167725, 0.00525665283203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 19.0, 22.0, 43.0, 49.0, 68.0, 105.0, 134.0, 222.0, 299.0, 457.0, 695.0, 966.0, 1394.0, 2072.0, 3061.0, 4621.0, 6828.0, 10779.0, 16496.0, 25635.0, 40094.0, 61495.0, 91021.0, 124157.0, 147225.0, 144287.0, 119075.0, 85025.0, 56928.0, 36932.0, 23699.0, 15457.0, 9870.0, 6257.0, 4237.0, 2757.0, 1950.0, 1310.0, 888.0, 587.0, 397.0, 289.0, 207.0, 129.0, 99.0, 70.0, 33.0, 29.0, 24.0, 22.0, 12.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0], "bins": [-26.75, -25.884521484375, -25.01904296875, -24.153564453125, -23.2880859375, -22.422607421875, -21.55712890625, -20.691650390625, -19.826171875, -18.960693359375, -18.09521484375, -17.229736328125, -16.3642578125, -15.498779296875, -14.63330078125, -13.767822265625, -12.90234375, -12.036865234375, -11.17138671875, -10.305908203125, -9.4404296875, -8.574951171875, -7.70947265625, -6.843994140625, -5.978515625, -5.113037109375, -4.24755859375, -3.382080078125, -2.5166015625, -1.651123046875, -0.78564453125, 0.079833984375, 0.9453125, 1.810791015625, 2.67626953125, 3.541748046875, 4.4072265625, 5.272705078125, 6.13818359375, 7.003662109375, 7.869140625, 8.734619140625, 9.60009765625, 10.465576171875, 11.3310546875, 12.196533203125, 13.06201171875, 13.927490234375, 14.79296875, 15.658447265625, 16.52392578125, 17.389404296875, 18.2548828125, 19.120361328125, 19.98583984375, 20.851318359375, 21.716796875, 22.582275390625, 23.44775390625, 24.313232421875, 25.1787109375, 26.044189453125, 26.90966796875, 27.775146484375, 28.640625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 11.0, 16.0, 17.0, 21.0, 20.0, 30.0, 25.0, 38.0, 31.0, 41.0, 44.0, 55.0, 49.0, 52.0, 39.0, 54.0, 51.0, 46.0, 52.0, 43.0, 49.0, 30.0, 27.0, 22.0, 17.0, 11.0, 15.0, 13.0, 8.0, 7.0, 9.0, 4.0, 4.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.0859375, -9.784423828125, -9.48291015625, -9.181396484375, -8.8798828125, -8.578369140625, -8.27685546875, -7.975341796875, -7.673828125, -7.372314453125, -7.07080078125, -6.769287109375, -6.4677734375, -6.166259765625, -5.86474609375, -5.563232421875, -5.26171875, -4.960205078125, -4.65869140625, -4.357177734375, -4.0556640625, -3.754150390625, -3.45263671875, -3.151123046875, -2.849609375, -2.548095703125, -2.24658203125, -1.945068359375, -1.6435546875, -1.342041015625, -1.04052734375, -0.739013671875, -0.4375, -0.135986328125, 0.16552734375, 0.467041015625, 0.7685546875, 1.070068359375, 1.37158203125, 1.673095703125, 1.974609375, 2.276123046875, 2.57763671875, 2.879150390625, 3.1806640625, 3.482177734375, 3.78369140625, 4.085205078125, 4.38671875, 4.688232421875, 4.98974609375, 5.291259765625, 5.5927734375, 5.894287109375, 6.19580078125, 6.497314453125, 6.798828125, 7.100341796875, 7.40185546875, 7.703369140625, 8.0048828125, 8.306396484375, 8.60791015625, 8.909423828125, 9.2109375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 8.0, 10.0, 17.0, 29.0, 16.0, 27.0, 41.0, 26.0, 35.0, 40.0, 41.0, 45.0, 51.0, 49.0, 48.0, 47.0, 43.0, 38.0, 52.0, 39.0, 35.0, 31.0, 39.0, 32.0, 17.0, 26.0, 19.0, 17.0, 8.0, 9.0, 8.0, 7.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.01078796386719, -66.85242462158203, -64.69405364990234, -62.53569030761719, -60.37732696533203, -58.21895980834961, -56.06059265136719, -53.90222930908203, -51.74386215209961, -49.58549499511719, -47.42713165283203, -45.26876449584961, -43.11039733886719, -40.95203399658203, -38.79366683959961, -36.63529968261719, -34.47693634033203, -32.31856918334961, -30.160205841064453, -28.00183868408203, -25.843473434448242, -23.685108184814453, -21.52674102783203, -19.368375778198242, -17.210010528564453, -15.051645278930664, -12.893279075622559, -10.734912872314453, -8.576547622680664, -6.418182373046875, -4.2598161697387695, -2.101449966430664, 0.05690765380859375, 2.215273380279541, 4.373639106750488, 6.5320048332214355, 8.690370559692383, 10.848735809326172, 13.007102012634277, 15.165468215942383, 17.323833465576172, 19.48219871520996, 21.64056396484375, 23.798931121826172, 25.95729637145996, 28.11566162109375, 30.274028778076172, 32.432395935058594, 34.59075927734375, 36.74912643432617, 38.90748977661133, 41.06585693359375, 43.224220275878906, 45.38258743286133, 47.54095458984375, 49.699317932128906, 51.85768508911133, 54.01605224609375, 56.174415588378906, 58.33278274536133, 60.49114990234375, 62.649513244628906, 64.80787658691406, 66.96624755859375, 69.1246109008789]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 4.0, 11.0, 8.0, 18.0, 15.0, 12.0, 20.0, 24.0, 30.0, 28.0, 43.0, 32.0, 35.0, 37.0, 29.0, 39.0, 38.0, 47.0, 46.0, 40.0, 45.0, 39.0, 35.0, 33.0, 30.0, 35.0, 19.0, 23.0, 25.0, 27.0, 26.0, 17.0, 9.0, 13.0, 12.0, 6.0, 8.0, 8.0, 1.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.76392364501953, -62.54938888549805, -60.3348503112793, -58.12031555175781, -55.90577697753906, -53.69124221801758, -51.476707458496094, -49.262168884277344, -47.04763412475586, -44.833099365234375, -42.618560791015625, -40.40402603149414, -38.189491271972656, -35.974952697753906, -33.76041793823242, -31.545881271362305, -29.331344604492188, -27.11680793762207, -24.902271270751953, -22.68773651123047, -20.47319984436035, -18.258663177490234, -16.04412841796875, -13.829591751098633, -11.615055084228516, -9.400518417358398, -7.185982704162598, -4.971446514129639, -2.7569103240966797, -0.5423736572265625, 1.6721620559692383, 3.886697769165039, 6.101234436035156, 8.315771102905273, 10.530306816101074, 12.744842529296875, 14.959379196166992, 17.17391586303711, 19.388450622558594, 21.60298728942871, 23.817523956298828, 26.032060623168945, 28.246597290039062, 30.461132049560547, 32.67566680908203, 34.89020538330078, 37.104740142822266, 39.31927490234375, 41.5338134765625, 43.748348236083984, 45.962886810302734, 48.17742156982422, 50.39196014404297, 52.60649490356445, 54.82102966308594, 57.03556823730469, 59.25010299682617, 61.464637756347656, 63.679176330566406, 65.89371490478516, 68.10824584960938, 70.32278442382812, 72.53732299804688, 74.7518539428711, 76.96639251708984]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 11.0, 11.0, 19.0, 25.0, 28.0, 40.0, 51.0, 74.0, 68.0, 133.0, 126.0, 171.0, 232.0, 293.0, 414.0, 537.0, 730.0, 940.0, 1402.0, 2411.0, 4144.0, 8885.0, 491303.0, 4284.0, 2432.0, 1420.0, 1011.0, 752.0, 568.0, 430.0, 311.0, 241.0, 183.0, 112.0, 118.0, 93.0, 54.0, 44.0, 33.0, 34.0, 21.0, 21.0, 13.0, 11.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-737.7885131835938, -713.224609375, -688.6607055664062, -664.0968017578125, -639.5328369140625, -614.9689331054688, -590.405029296875, -565.8411254882812, -541.2772216796875, -516.7133178710938, -492.1494140625, -467.5854797363281, -443.0215759277344, -418.4576721191406, -393.89373779296875, -369.329833984375, -344.76593017578125, -320.2020263671875, -295.63812255859375, -271.0741882324219, -246.51028442382812, -221.94638061523438, -197.38246154785156, -172.81854248046875, -148.254638671875, -123.69072723388672, -99.12681579589844, -74.56290435791016, -49.998992919921875, -25.435081481933594, -0.8711700439453125, 23.6927490234375, 48.25665283203125, 72.82056427001953, 97.38447570800781, 121.9483871459961, 146.51229858398438, 171.07620239257812, 195.64012145996094, 220.20404052734375, 244.7679443359375, 269.33184814453125, 293.895751953125, 318.4596862792969, 343.0235900878906, 367.5874938964844, 392.15142822265625, 416.71533203125, 441.27923583984375, 465.8431396484375, 490.40704345703125, 514.970947265625, 539.534912109375, 564.0988159179688, 588.6627197265625, 613.2266235351562, 637.79052734375, 662.3544311523438, 686.9183349609375, 711.4822387695312, 736.046142578125, 760.610107421875, 785.1740112304688, 809.7379150390625, 834.3018188476562]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 3.0, 9.0, 10.0, 14.0, 21.0, 10.0, 21.0, 25.0, 29.0, 27.0, 45.0, 32.0, 30.0, 42.0, 28.0, 39.0, 48.0, 41.0, 1070.0, 36.0, 43.0, 45.0, 31.0, 32.0, 31.0, 33.0, 23.0, 22.0, 31.0, 23.0, 19.0, 22.0, 9.0, 10.0, 11.0, 11.0, 9.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2068.56884765625, -1997.9425048828125, -1927.316162109375, -1856.6898193359375, -1786.0634765625, -1715.43701171875, -1644.8106689453125, -1574.184326171875, -1503.5579833984375, -1432.931640625, -1362.3052978515625, -1291.678955078125, -1221.052490234375, -1150.42626953125, -1079.7998046875, -1009.1734619140625, -938.547119140625, -867.9207763671875, -797.29443359375, -726.6680297851562, -656.0416870117188, -585.4153442382812, -514.7889404296875, -444.16259765625, -373.5362548828125, -302.909912109375, -232.28353881835938, -161.6571807861328, -91.03082275390625, -20.40447998046875, 50.221893310546875, 120.8482666015625, 191.474853515625, 262.1011962890625, 332.7275695800781, 403.35394287109375, 473.98028564453125, 544.6066284179688, 615.2330322265625, 685.859375, 756.4857177734375, 827.112060546875, 897.7384033203125, 968.3648071289062, 1038.9912109375, 1109.617431640625, 1180.243896484375, 1250.8702392578125, 1321.49658203125, 1392.1229248046875, 1462.749267578125, 1533.3756103515625, 1604.001953125, 1674.62841796875, 1745.2547607421875, 1815.881103515625, 1886.5074462890625, 1957.1337890625, 2027.7601318359375, 2098.386474609375, 2169.012939453125, 2239.63916015625, 2310.265625, 2380.89208984375, 2451.518310546875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 4.0, 5.0, 7.0, 4.0, 11.0, 9.0, 13.0, 13.0, 11.0, 30.0, 35.0, 27.0, 37.0, 62.0, 74.0, 118.0, 154.0, 212.0, 311.0, 437.0, 569.0, 740.0, 925.0, 1237.0, 1614.0, 2117.0, 2660.0, 4093.0, 7531.0, 64020.0, 31128602.0, 15112.0, 9158.0, 7984.0, 3354.0, 1239.0, 732.0, 400.0, 227.0, 178.0, 123.0, 127.0, 86.0, 50.0, 30.0, 13.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2639.215087890625, -2579.439697265625, -2519.664306640625, -2459.88916015625, -2400.11376953125, -2340.33837890625, -2280.56298828125, -2220.78759765625, -2161.01220703125, -2101.23681640625, -2041.4615478515625, -1981.6861572265625, -1921.9107666015625, -1862.135498046875, -1802.360107421875, -1742.584716796875, -1682.8094482421875, -1623.0340576171875, -1563.2587890625, -1503.4833984375, -1443.7080078125, -1383.9326171875, -1324.1573486328125, -1264.3819580078125, -1204.606689453125, -1144.831298828125, -1085.0560302734375, -1025.2806396484375, -965.5052490234375, -905.7299194335938, -845.95458984375, -786.17919921875, -726.4039306640625, -666.6286010742188, -606.8532104492188, -547.077880859375, -487.3025207519531, -427.52716064453125, -367.7518310546875, -307.9764709472656, -248.20111083984375, -188.42575073242188, -128.65040588378906, -68.87506103515625, -9.099700927734375, 50.6756591796875, 110.45098876953125, 170.22634887695312, 230.001708984375, 289.7770690917969, 349.55242919921875, 409.3277587890625, 469.1031188964844, 528.8784790039062, 588.65380859375, 648.42919921875, 708.2045288085938, 767.9798583984375, 827.7552490234375, 887.5305786132812, 947.305908203125, 1007.081298828125, 1066.856689453125, 1126.6319580078125, 1186.4073486328125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 18.0, 20.0, 31.0, 34.0, 55.0, 95.0, 109.0, 173.0, 278.0, 396.0, 573.0, 834.0, 1389.0, 2150.0, 3548.0, 5633.0, 9535.0, 16273.0, 28471.0, 50647.0, 92299.0, 175690.0, 351865.0, 773437.0, 1821933.0, 1611281.0, 678234.0, 313769.0, 159150.0, 83891.0, 45874.0, 25861.0, 14927.0, 8935.0, 5198.0, 3242.0, 1960.0, 1257.0, 809.0, 540.0, 337.0, 196.0, 157.0, 117.0, 71.0, 41.0, 32.0, 25.0, 13.0, 6.0, 6.0, 10.0, 1.0, 2.0, 1.0, 1.0], "bins": [-199.375, -193.318359375, -187.26171875, -181.205078125, -175.1484375, -169.091796875, -163.03515625, -156.978515625, -150.921875, -144.865234375, -138.80859375, -132.751953125, -126.6953125, -120.638671875, -114.58203125, -108.525390625, -102.46875, -96.412109375, -90.35546875, -84.298828125, -78.2421875, -72.185546875, -66.12890625, -60.072265625, -54.015625, -47.958984375, -41.90234375, -35.845703125, -29.7890625, -23.732421875, -17.67578125, -11.619140625, -5.5625, 0.494140625, 6.55078125, 12.607421875, 18.6640625, 24.720703125, 30.77734375, 36.833984375, 42.890625, 48.947265625, 55.00390625, 61.060546875, 67.1171875, 73.173828125, 79.23046875, 85.287109375, 91.34375, 97.400390625, 103.45703125, 109.513671875, 115.5703125, 121.626953125, 127.68359375, 133.740234375, 139.796875, 145.853515625, 151.91015625, 157.966796875, 164.0234375, 170.080078125, 176.13671875, 182.193359375, 188.25]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 1.0, 5.0, 9.0, 15.0, 14.0, 13.0, 17.0, 22.0, 28.0, 22.0, 44.0, 54.0, 54.0, 78.0, 83.0, 131.0, 136.0, 180.0, 214.0, 169.0, 157.0, 109.0, 92.0, 77.0, 57.0, 50.0, 37.0, 18.0, 31.0, 25.0, 15.0, 9.0, 10.0, 10.0, 5.0, 13.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-82.5625, -80.03515625, -77.5078125, -74.98046875, -72.453125, -69.92578125, -67.3984375, -64.87109375, -62.34375, -59.81640625, -57.2890625, -54.76171875, -52.234375, -49.70703125, -47.1796875, -44.65234375, -42.125, -39.59765625, -37.0703125, -34.54296875, -32.015625, -29.48828125, -26.9609375, -24.43359375, -21.90625, -19.37890625, -16.8515625, -14.32421875, -11.796875, -9.26953125, -6.7421875, -4.21484375, -1.6875, 0.83984375, 3.3671875, 5.89453125, 8.421875, 10.94921875, 13.4765625, 16.00390625, 18.53125, 21.05859375, 23.5859375, 26.11328125, 28.640625, 31.16796875, 33.6953125, 36.22265625, 38.75, 41.27734375, 43.8046875, 46.33203125, 48.859375, 51.38671875, 53.9140625, 56.44140625, 58.96875, 61.49609375, 64.0234375, 66.55078125, 69.078125, 71.60546875, 74.1328125, 76.66015625, 79.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 17.0, 14.0, 22.0, 22.0, 28.0, 56.0, 91.0, 121.0, 179.0, 253.0, 348.0, 529.0, 783.0, 1270.0, 1888.0, 3057.0, 5135.0, 8548.0, 14640.0, 24624.0, 42670.0, 76094.0, 135727.0, 244195.0, 458225.0, 985853.0, 1969935.0, 1167544.0, 522490.0, 272559.0, 152026.0, 85714.0, 48255.0, 27702.0, 16098.0, 9451.0, 5497.0, 3511.0, 2064.0, 1428.0, 911.0, 585.0, 394.0, 292.0, 178.0, 123.0, 87.0, 55.0, 36.0, 36.0, 30.0, 22.0, 8.0, 5.0, 5.0, 8.0, 2.0, 3.0], "bins": [-98.625, -95.599609375, -92.57421875, -89.548828125, -86.5234375, -83.498046875, -80.47265625, -77.447265625, -74.421875, -71.396484375, -68.37109375, -65.345703125, -62.3203125, -59.294921875, -56.26953125, -53.244140625, -50.21875, -47.193359375, -44.16796875, -41.142578125, -38.1171875, -35.091796875, -32.06640625, -29.041015625, -26.015625, -22.990234375, -19.96484375, -16.939453125, -13.9140625, -10.888671875, -7.86328125, -4.837890625, -1.8125, 1.212890625, 4.23828125, 7.263671875, 10.2890625, 13.314453125, 16.33984375, 19.365234375, 22.390625, 25.416015625, 28.44140625, 31.466796875, 34.4921875, 37.517578125, 40.54296875, 43.568359375, 46.59375, 49.619140625, 52.64453125, 55.669921875, 58.6953125, 61.720703125, 64.74609375, 67.771484375, 70.796875, 73.822265625, 76.84765625, 79.873046875, 82.8984375, 85.923828125, 88.94921875, 91.974609375, 95.0]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 11.0, 15.0, 12.0, 11.0, 22.0, 28.0, 38.0, 61.0, 73.0, 100.0, 150.0, 189.0, 273.0, 279.0, 229.0, 157.0, 90.0, 56.0, 45.0, 30.0, 37.0, 24.0, 18.0, 14.0, 7.0, 12.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-157.375, -153.2744140625, -149.173828125, -145.0732421875, -140.97265625, -136.8720703125, -132.771484375, -128.6708984375, -124.5703125, -120.4697265625, -116.369140625, -112.2685546875, -108.16796875, -104.0673828125, -99.966796875, -95.8662109375, -91.765625, -87.6650390625, -83.564453125, -79.4638671875, -75.36328125, -71.2626953125, -67.162109375, -63.0615234375, -58.9609375, -54.8603515625, -50.759765625, -46.6591796875, -42.55859375, -38.4580078125, -34.357421875, -30.2568359375, -26.15625, -22.0556640625, -17.955078125, -13.8544921875, -9.75390625, -5.6533203125, -1.552734375, 2.5478515625, 6.6484375, 10.7490234375, 14.849609375, 18.9501953125, 23.05078125, 27.1513671875, 31.251953125, 35.3525390625, 39.453125, 43.5537109375, 47.654296875, 51.7548828125, 55.85546875, 59.9560546875, 64.056640625, 68.1572265625, 72.2578125, 76.3583984375, 80.458984375, 84.5595703125, 88.66015625, 92.7607421875, 96.861328125, 100.9619140625, 105.0625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 26.0, 26.0, 35.0, 61.0, 79.0, 120.0, 217.0, 348.0, 555.0, 890.0, 1468.0, 2680.0, 5104.0, 9861.0, 20252.0, 43308.0, 109605.0, 5442987.0, 491098.0, 89461.0, 36893.0, 17436.0, 8740.0, 4535.0, 2354.0, 1261.0, 772.0, 439.0, 293.0, 193.0, 124.0, 85.0, 38.0, 24.0, 13.0, 13.0, 9.0, 7.0, 11.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-239.125, -229.119140625, -219.11328125, -209.107421875, -199.1015625, -189.095703125, -179.08984375, -169.083984375, -159.078125, -149.072265625, -139.06640625, -129.060546875, -119.0546875, -109.048828125, -99.04296875, -89.037109375, -79.03125, -69.025390625, -59.01953125, -49.013671875, -39.0078125, -29.001953125, -18.99609375, -8.990234375, 1.015625, 11.021484375, 21.02734375, 31.033203125, 41.0390625, 51.044921875, 61.05078125, 71.056640625, 81.0625, 91.068359375, 101.07421875, 111.080078125, 121.0859375, 131.091796875, 141.09765625, 151.103515625, 161.109375, 171.115234375, 181.12109375, 191.126953125, 201.1328125, 211.138671875, 221.14453125, 231.150390625, 241.15625, 251.162109375, 261.16796875, 271.173828125, 281.1796875, 291.185546875, 301.19140625, 311.197265625, 321.203125, 331.208984375, 341.21484375, 351.220703125, 361.2265625, 371.232421875, 381.23828125, 391.244140625, 401.25]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 13.0, 9.0, 18.0, 27.0, 35.0, 23.0, 42.0, 42.0, 42.0, 63.0, 71.0, 135.0, 235.0, 329.0, 260.0, 147.0, 87.0, 68.0, 56.0, 33.0, 36.0, 46.0, 29.0, 19.0, 19.0, 25.0, 13.0, 12.0, 9.0, 7.0, 7.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-152.5, -147.5546875, -142.609375, -137.6640625, -132.71875, -127.7734375, -122.828125, -117.8828125, -112.9375, -107.9921875, -103.046875, -98.1015625, -93.15625, -88.2109375, -83.265625, -78.3203125, -73.375, -68.4296875, -63.484375, -58.5390625, -53.59375, -48.6484375, -43.703125, -38.7578125, -33.8125, -28.8671875, -23.921875, -18.9765625, -14.03125, -9.0859375, -4.140625, 0.8046875, 5.75, 10.6953125, 15.640625, 20.5859375, 25.53125, 30.4765625, 35.421875, 40.3671875, 45.3125, 50.2578125, 55.203125, 60.1484375, 65.09375, 70.0390625, 74.984375, 79.9296875, 84.875, 89.8203125, 94.765625, 99.7109375, 104.65625, 109.6015625, 114.546875, 119.4921875, 124.4375, 129.3828125, 134.328125, 139.2734375, 144.21875, 149.1640625, 154.109375, 159.0546875, 164.0]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 7.0, 12.0, 15.0, 22.0, 30.0, 51.0, 45.0, 71.0, 105.0, 177.0, 142.0, 79.0, 56.0, 32.0, 41.0, 26.0, 19.0, 10.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-8581.712890625, -8398.4638671875, -8215.2138671875, -8031.96484375, -7848.71533203125, -7665.4658203125, -7482.216796875, -7298.96728515625, -7115.7177734375, -6932.46826171875, -6749.21875, -6565.9697265625, -6382.72021484375, -6199.470703125, -6016.2216796875, -5832.97216796875, -5649.72265625, -5466.47314453125, -5283.2236328125, -5099.974609375, -4916.72509765625, -4733.4755859375, -4550.2265625, -4366.97705078125, -4183.7275390625, -4000.47802734375, -3817.228759765625, -3633.9794921875, -3450.72998046875, -3267.48046875, -3084.231201171875, -2900.98193359375, -2717.732421875, -2534.48291015625, -2351.233642578125, -2167.984375, -1984.73486328125, -1801.4854736328125, -1618.236083984375, -1434.9866943359375, -1251.7373046875, -1068.4879150390625, -885.238525390625, -701.9891357421875, -518.73974609375, -335.4903564453125, -152.240966796875, 31.0084228515625, 214.2578125, 397.5072021484375, 580.756591796875, 764.0059814453125, 947.25537109375, 1130.5047607421875, 1313.754150390625, 1497.0035400390625, 1680.2529296875, 1863.5023193359375, 2046.751708984375, 2230.0009765625, 2413.25048828125, 2596.5, 2779.749267578125, 2962.99853515625, 3146.248046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 3.0, 4.0, 7.0, 12.0, 12.0, 19.0, 8.0, 21.0, 18.0, 14.0, 18.0, 25.0, 21.0, 23.0, 47.0, 70.0, 117.0, 149.0, 85.0, 45.0, 44.0, 31.0, 35.0, 19.0, 24.0, 16.0, 19.0, 12.0, 8.0, 9.0, 6.0, 13.0, 8.0, 6.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4715.66064453125, -4569.54931640625, -4423.4375, -4277.326171875, -4131.21484375, -3985.10302734375, -3838.99169921875, -3692.880126953125, -3546.7685546875, -3400.656982421875, -3254.54541015625, -3108.43408203125, -2962.322509765625, -2816.2109375, -2670.099609375, -2523.988037109375, -2377.87646484375, -2231.764892578125, -2085.6533203125, -1939.5419921875, -1793.430419921875, -1647.31884765625, -1501.2073974609375, -1355.095947265625, -1208.984375, -1062.872802734375, -916.7613525390625, -770.6498413085938, -624.538330078125, -478.42681884765625, -332.3153076171875, -186.20379638671875, -40.091796875, 106.01971435546875, 252.1312255859375, 398.24273681640625, 544.354248046875, 690.4657592773438, 836.5772705078125, 982.6887817382812, 1128.80029296875, 1274.911865234375, 1421.0233154296875, 1567.134765625, 1713.246337890625, 1859.35791015625, 2005.4693603515625, 2151.580810546875, 2297.6923828125, 2443.803955078125, 2589.91552734375, 2736.02685546875, 2882.138427734375, 3028.25, 3174.361328125, 3320.472900390625, 3466.58447265625, 3612.696044921875, 3758.8076171875, 3904.9189453125, 4051.030517578125, 4197.14208984375, 4343.25341796875, 4489.365234375, 4635.4765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 7.0, 12.0, 26.0, 14.0, 30.0, 46.0, 59.0, 64.0, 81.0, 151.0, 204.0, 268.0, 395.0, 476.0, 745.0, 1093.0, 1601.0, 2294.0, 3450.0, 5307.0, 8338.0, 13599.0, 23310.0, 44932.0, 106009.0, 375449.0, 2779088.0, 575042.0, 140608.0, 52859.0, 25093.0, 13445.0, 7697.0, 4513.0, 2911.0, 1859.0, 1200.0, 707.0, 433.0, 314.0, 200.0, 135.0, 80.0, 55.0, 32.0, 17.0, 9.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-42.71875, -41.5185546875, -40.318359375, -39.1181640625, -37.91796875, -36.7177734375, -35.517578125, -34.3173828125, -33.1171875, -31.9169921875, -30.716796875, -29.5166015625, -28.31640625, -27.1162109375, -25.916015625, -24.7158203125, -23.515625, -22.3154296875, -21.115234375, -19.9150390625, -18.71484375, -17.5146484375, -16.314453125, -15.1142578125, -13.9140625, -12.7138671875, -11.513671875, -10.3134765625, -9.11328125, -7.9130859375, -6.712890625, -5.5126953125, -4.3125, -3.1123046875, -1.912109375, -0.7119140625, 0.48828125, 1.6884765625, 2.888671875, 4.0888671875, 5.2890625, 6.4892578125, 7.689453125, 8.8896484375, 10.08984375, 11.2900390625, 12.490234375, 13.6904296875, 14.890625, 16.0908203125, 17.291015625, 18.4912109375, 19.69140625, 20.8916015625, 22.091796875, 23.2919921875, 24.4921875, 25.6923828125, 26.892578125, 28.0927734375, 29.29296875, 30.4931640625, 31.693359375, 32.8935546875, 34.09375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 2.0, 12.0, 3.0, 4.0, 13.0, 9.0, 14.0, 23.0, 24.0, 42.0, 41.0, 59.0, 93.0, 125.0, 134.0, 82.0, 78.0, 62.0, 40.0, 30.0, 19.0, 18.0, 12.0, 12.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.703125, -4.575531005859375, -4.44793701171875, -4.320343017578125, -4.1927490234375, -4.065155029296875, -3.93756103515625, -3.809967041015625, -3.682373046875, -3.554779052734375, -3.42718505859375, -3.299591064453125, -3.1719970703125, -3.044403076171875, -2.91680908203125, -2.789215087890625, -2.66162109375, -2.534027099609375, -2.40643310546875, -2.278839111328125, -2.1512451171875, -2.023651123046875, -1.89605712890625, -1.768463134765625, -1.640869140625, -1.513275146484375, -1.38568115234375, -1.258087158203125, -1.1304931640625, -1.002899169921875, -0.87530517578125, -0.747711181640625, -0.6201171875, -0.492523193359375, -0.36492919921875, -0.237335205078125, -0.1097412109375, 0.017852783203125, 0.14544677734375, 0.273040771484375, 0.400634765625, 0.528228759765625, 0.65582275390625, 0.783416748046875, 0.9110107421875, 1.038604736328125, 1.16619873046875, 1.293792724609375, 1.42138671875, 1.548980712890625, 1.67657470703125, 1.804168701171875, 1.9317626953125, 2.059356689453125, 2.18695068359375, 2.314544677734375, 2.442138671875, 2.569732666015625, 2.69732666015625, 2.824920654296875, 2.9525146484375, 3.080108642578125, 3.20770263671875, 3.335296630859375, 3.462890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 6.0, 8.0, 9.0, 37.0, 32.0, 44.0, 53.0, 112.0, 113.0, 187.0, 230.0, 375.0, 549.0, 887.0, 1491.0, 2552.0, 4864.0, 9771.0, 21848.0, 53910.0, 147571.0, 458985.0, 1856567.0, 1129297.0, 322730.0, 107213.0, 40508.0, 16963.0, 7803.0, 3891.0, 2129.0, 1177.0, 808.0, 467.0, 306.0, 217.0, 153.0, 126.0, 91.0, 57.0, 50.0, 27.0, 16.0, 14.0, 12.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.84375, -36.53173828125, -35.2197265625, -33.90771484375, -32.595703125, -31.28369140625, -29.9716796875, -28.65966796875, -27.34765625, -26.03564453125, -24.7236328125, -23.41162109375, -22.099609375, -20.78759765625, -19.4755859375, -18.16357421875, -16.8515625, -15.53955078125, -14.2275390625, -12.91552734375, -11.603515625, -10.29150390625, -8.9794921875, -7.66748046875, -6.35546875, -5.04345703125, -3.7314453125, -2.41943359375, -1.107421875, 0.20458984375, 1.5166015625, 2.82861328125, 4.140625, 5.45263671875, 6.7646484375, 8.07666015625, 9.388671875, 10.70068359375, 12.0126953125, 13.32470703125, 14.63671875, 15.94873046875, 17.2607421875, 18.57275390625, 19.884765625, 21.19677734375, 22.5087890625, 23.82080078125, 25.1328125, 26.44482421875, 27.7568359375, 29.06884765625, 30.380859375, 31.69287109375, 33.0048828125, 34.31689453125, 35.62890625, 36.94091796875, 38.2529296875, 39.56494140625, 40.876953125, 42.18896484375, 43.5009765625, 44.81298828125, 46.125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 12.0, 17.0, 14.0, 18.0, 12.0, 30.0, 28.0, 32.0, 43.0, 67.0, 66.0, 90.0, 115.0, 145.0, 168.0, 237.0, 266.0, 407.0, 543.0, 343.0, 266.0, 229.0, 183.0, 145.0, 115.0, 87.0, 85.0, 64.0, 48.0, 55.0, 34.0, 27.0, 17.0, 12.0, 12.0, 9.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.59375, -14.2027587890625, -13.811767578125, -13.4207763671875, -13.02978515625, -12.6387939453125, -12.247802734375, -11.8568115234375, -11.4658203125, -11.0748291015625, -10.683837890625, -10.2928466796875, -9.90185546875, -9.5108642578125, -9.119873046875, -8.7288818359375, -8.337890625, -7.9468994140625, -7.555908203125, -7.1649169921875, -6.77392578125, -6.3829345703125, -5.991943359375, -5.6009521484375, -5.2099609375, -4.8189697265625, -4.427978515625, -4.0369873046875, -3.64599609375, -3.2550048828125, -2.864013671875, -2.4730224609375, -2.08203125, -1.6910400390625, -1.300048828125, -0.9090576171875, -0.51806640625, -0.1270751953125, 0.263916015625, 0.6549072265625, 1.0458984375, 1.4368896484375, 1.827880859375, 2.2188720703125, 2.60986328125, 3.0008544921875, 3.391845703125, 3.7828369140625, 4.173828125, 4.5648193359375, 4.955810546875, 5.3468017578125, 5.73779296875, 6.1287841796875, 6.519775390625, 6.9107666015625, 7.3017578125, 7.6927490234375, 8.083740234375, 8.4747314453125, 8.86572265625, 9.2567138671875, 9.647705078125, 10.0386962890625, 10.4296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 8.0, 12.0, 27.0, 61.0, 108.0, 163.0, 184.0, 184.0, 121.0, 54.0, 33.0, 16.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-214.38536071777344, -205.2847442626953, -196.18414306640625, -187.08352661132812, -177.98291015625, -168.88229370117188, -159.78167724609375, -150.6810760498047, -141.58045959472656, -132.47984313964844, -123.37923431396484, -114.27862548828125, -105.17800903320312, -96.077392578125, -86.9767837524414, -77.87617492675781, -68.77555847167969, -59.67494583129883, -50.57433319091797, -41.47372055053711, -32.37310791015625, -23.27249526977539, -14.171882629394531, -5.071269989013672, 4.0293426513671875, 13.129955291748047, 22.230567932128906, 31.331180572509766, 40.431793212890625, 49.532405853271484, 58.633018493652344, 67.73362731933594, 76.83425903320312, 85.93487548828125, 95.03548431396484, 104.13609313964844, 113.23670959472656, 122.33732604980469, 131.43792724609375, 140.53854370117188, 149.63916015625, 158.73977661132812, 167.84039306640625, 176.9409942626953, 186.04161071777344, 195.14222717285156, 204.24282836914062, 213.34344482421875, 222.44406127929688, 231.544677734375, 240.64529418945312, 249.7458953857422, 258.84649658203125, 267.9471130371094, 277.0477294921875, 286.1483459472656, 295.24896240234375, 304.3495788574219, 313.4501953125, 322.5508117675781, 331.65142822265625, 340.75201416015625, 349.8526306152344, 358.9532470703125, 368.0538635253906]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 13.0, 11.0, 17.0, 17.0, 28.0, 30.0, 51.0, 56.0, 63.0, 61.0, 58.0, 67.0, 78.0, 66.0, 58.0, 49.0, 43.0, 32.0, 47.0, 42.0, 23.0, 23.0, 19.0, 10.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-166.04632568359375, -161.99449157714844, -157.9426727294922, -153.89083862304688, -149.83900451660156, -145.7871856689453, -141.7353515625, -137.6835174560547, -133.63169860839844, -129.57986450195312, -125.52803802490234, -121.47621154785156, -117.42438507080078, -113.37255859375, -109.32072448730469, -105.2688980102539, -101.2170639038086, -97.16523742675781, -93.1134033203125, -89.06157684326172, -85.00975036621094, -80.95791625976562, -76.90608978271484, -72.85426330566406, -68.80242919921875, -64.75060272216797, -60.69877243041992, -56.646942138671875, -52.595115661621094, -48.54328536987305, -44.491455078125, -40.43962860107422, -36.38780975341797, -32.33597946166992, -28.28415298461914, -24.232322692871094, -20.18049430847168, -16.128665924072266, -12.076835632324219, -8.025007247924805, -3.9731788635253906, 0.07864999771118164, 4.130478858947754, 8.182308197021484, 12.234136581420898, 16.285964965820312, 20.33779525756836, 24.389623641967773, 28.441452026367188, 32.493282318115234, 36.545108795166016, 40.59693908691406, 44.648765563964844, 48.70059585571289, 52.75242614746094, 56.80425262451172, 60.856082916259766, 64.90791320800781, 68.9597396850586, 73.01156616210938, 77.06340026855469, 81.11522674560547, 85.16705322265625, 89.21888732910156, 93.27071380615234]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 9.0, 20.0, 26.0, 30.0, 52.0, 56.0, 97.0, 128.0, 187.0, 332.0, 521.0, 887.0, 1623.0, 3110.0, 6346.0, 14290.0, 37738.0, 128521.0, 508949.0, 244197.0, 61756.0, 21614.0, 8815.0, 4263.0, 2144.0, 1179.0, 602.0, 363.0, 227.0, 149.0, 94.0, 68.0, 39.0, 26.0, 27.0, 6.0, 7.0, 8.0, 14.0, 2.0, 6.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.171875, -29.156494140625, -28.14111328125, -27.125732421875, -26.1103515625, -25.094970703125, -24.07958984375, -23.064208984375, -22.048828125, -21.033447265625, -20.01806640625, -19.002685546875, -17.9873046875, -16.971923828125, -15.95654296875, -14.941162109375, -13.92578125, -12.910400390625, -11.89501953125, -10.879638671875, -9.8642578125, -8.848876953125, -7.83349609375, -6.818115234375, -5.802734375, -4.787353515625, -3.77197265625, -2.756591796875, -1.7412109375, -0.725830078125, 0.28955078125, 1.304931640625, 2.3203125, 3.335693359375, 4.35107421875, 5.366455078125, 6.3818359375, 7.397216796875, 8.41259765625, 9.427978515625, 10.443359375, 11.458740234375, 12.47412109375, 13.489501953125, 14.5048828125, 15.520263671875, 16.53564453125, 17.551025390625, 18.56640625, 19.581787109375, 20.59716796875, 21.612548828125, 22.6279296875, 23.643310546875, 24.65869140625, 25.674072265625, 26.689453125, 27.704833984375, 28.72021484375, 29.735595703125, 30.7509765625, 31.766357421875, 32.78173828125, 33.797119140625, 34.8125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 14.0, 20.0, 22.0, 14.0, 30.0, 56.0, 60.0, 69.0, 73.0, 81.0, 95.0, 70.0, 73.0, 60.0, 54.0, 39.0, 45.0, 22.0, 24.0, 15.0, 9.0, 7.0, 3.0, 2.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.521270751953125, -6.35504150390625, -6.188812255859375, -6.0225830078125, -5.856353759765625, -5.69012451171875, -5.523895263671875, -5.357666015625, -5.191436767578125, -5.02520751953125, -4.858978271484375, -4.6927490234375, -4.526519775390625, -4.36029052734375, -4.194061279296875, -4.02783203125, -3.861602783203125, -3.69537353515625, -3.529144287109375, -3.3629150390625, -3.196685791015625, -3.03045654296875, -2.864227294921875, -2.697998046875, -2.531768798828125, -2.36553955078125, -2.199310302734375, -2.0330810546875, -1.866851806640625, -1.70062255859375, -1.534393310546875, -1.3681640625, -1.201934814453125, -1.03570556640625, -0.869476318359375, -0.7032470703125, -0.537017822265625, -0.37078857421875, -0.204559326171875, -0.038330078125, 0.127899169921875, 0.29412841796875, 0.460357666015625, 0.6265869140625, 0.792816162109375, 0.95904541015625, 1.125274658203125, 1.29150390625, 1.457733154296875, 1.62396240234375, 1.790191650390625, 1.9564208984375, 2.122650146484375, 2.28887939453125, 2.455108642578125, 2.621337890625, 2.787567138671875, 2.95379638671875, 3.120025634765625, 3.2862548828125, 3.452484130859375, 3.61871337890625, 3.784942626953125, 3.951171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 13.0, 23.0, 16.0, 24.0, 28.0, 66.0, 74.0, 101.0, 167.0, 239.0, 320.0, 458.0, 668.0, 1048.0, 1637.0, 2550.0, 4313.0, 7460.0, 13358.0, 27019.0, 59782.0, 160152.0, 389516.0, 225741.0, 79581.0, 34456.0, 16812.0, 8995.0, 5077.0, 3102.0, 1940.0, 1238.0, 790.0, 513.0, 359.0, 263.0, 175.0, 142.0, 102.0, 61.0, 48.0, 35.0, 22.0, 24.0, 11.0, 6.0, 11.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.59375, -17.9873046875, -17.380859375, -16.7744140625, -16.16796875, -15.5615234375, -14.955078125, -14.3486328125, -13.7421875, -13.1357421875, -12.529296875, -11.9228515625, -11.31640625, -10.7099609375, -10.103515625, -9.4970703125, -8.890625, -8.2841796875, -7.677734375, -7.0712890625, -6.46484375, -5.8583984375, -5.251953125, -4.6455078125, -4.0390625, -3.4326171875, -2.826171875, -2.2197265625, -1.61328125, -1.0068359375, -0.400390625, 0.2060546875, 0.8125, 1.4189453125, 2.025390625, 2.6318359375, 3.23828125, 3.8447265625, 4.451171875, 5.0576171875, 5.6640625, 6.2705078125, 6.876953125, 7.4833984375, 8.08984375, 8.6962890625, 9.302734375, 9.9091796875, 10.515625, 11.1220703125, 11.728515625, 12.3349609375, 12.94140625, 13.5478515625, 14.154296875, 14.7607421875, 15.3671875, 15.9736328125, 16.580078125, 17.1865234375, 17.79296875, 18.3994140625, 19.005859375, 19.6123046875, 20.21875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 2.0, 8.0, 11.0, 17.0, 11.0, 8.0, 9.0, 15.0, 18.0, 18.0, 23.0, 29.0, 37.0, 43.0, 43.0, 41.0, 41.0, 40.0, 38.0, 38.0, 45.0, 38.0, 30.0, 35.0, 42.0, 33.0, 29.0, 33.0, 29.0, 22.0, 23.0, 16.0, 20.0, 13.0, 19.0, 11.0, 16.0, 9.0, 11.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.6494140625, -18.017578125, -17.3857421875, -16.75390625, -16.1220703125, -15.490234375, -14.8583984375, -14.2265625, -13.5947265625, -12.962890625, -12.3310546875, -11.69921875, -11.0673828125, -10.435546875, -9.8037109375, -9.171875, -8.5400390625, -7.908203125, -7.2763671875, -6.64453125, -6.0126953125, -5.380859375, -4.7490234375, -4.1171875, -3.4853515625, -2.853515625, -2.2216796875, -1.58984375, -0.9580078125, -0.326171875, 0.3056640625, 0.9375, 1.5693359375, 2.201171875, 2.8330078125, 3.46484375, 4.0966796875, 4.728515625, 5.3603515625, 5.9921875, 6.6240234375, 7.255859375, 7.8876953125, 8.51953125, 9.1513671875, 9.783203125, 10.4150390625, 11.046875, 11.6787109375, 12.310546875, 12.9423828125, 13.57421875, 14.2060546875, 14.837890625, 15.4697265625, 16.1015625, 16.7333984375, 17.365234375, 17.9970703125, 18.62890625, 19.2607421875, 19.892578125, 20.5244140625, 21.15625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 5.0, 3.0, 14.0, 10.0, 15.0, 39.0, 37.0, 48.0, 94.0, 161.0, 224.0, 406.0, 777.0, 1673.0, 3737.0, 9575.0, 30202.0, 135528.0, 534336.0, 256426.0, 50755.0, 14511.0, 5301.0, 2272.0, 1074.0, 554.0, 301.0, 185.0, 108.0, 71.0, 26.0, 24.0, 17.0, 10.0, 13.0, 8.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.890625, -19.262939453125, -18.63525390625, -18.007568359375, -17.3798828125, -16.752197265625, -16.12451171875, -15.496826171875, -14.869140625, -14.241455078125, -13.61376953125, -12.986083984375, -12.3583984375, -11.730712890625, -11.10302734375, -10.475341796875, -9.84765625, -9.219970703125, -8.59228515625, -7.964599609375, -7.3369140625, -6.709228515625, -6.08154296875, -5.453857421875, -4.826171875, -4.198486328125, -3.57080078125, -2.943115234375, -2.3154296875, -1.687744140625, -1.06005859375, -0.432373046875, 0.1953125, 0.822998046875, 1.45068359375, 2.078369140625, 2.7060546875, 3.333740234375, 3.96142578125, 4.589111328125, 5.216796875, 5.844482421875, 6.47216796875, 7.099853515625, 7.7275390625, 8.355224609375, 8.98291015625, 9.610595703125, 10.23828125, 10.865966796875, 11.49365234375, 12.121337890625, 12.7490234375, 13.376708984375, 14.00439453125, 14.632080078125, 15.259765625, 15.887451171875, 16.51513671875, 17.142822265625, 17.7705078125, 18.398193359375, 19.02587890625, 19.653564453125, 20.28125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 10.0, 9.0, 13.0, 18.0, 24.0, 27.0, 32.0, 37.0, 47.0, 45.0, 56.0, 64.0, 58.0, 63.0, 69.0, 61.0, 59.0, 54.0, 40.0, 40.0, 26.0, 21.0, 23.0, 21.0, 17.0, 11.0, 2.0, 8.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0005445480346679688, -0.00052623450756073, -0.0005079209804534912, -0.0004896074533462524, -0.00047129392623901367, -0.0004529803991317749, -0.00043466687202453613, -0.00041635334491729736, -0.0003980398178100586, -0.0003797262907028198, -0.00036141276359558105, -0.0003430992364883423, -0.0003247857093811035, -0.00030647218227386475, -0.000288158655166626, -0.0002698451280593872, -0.00025153160095214844, -0.00023321807384490967, -0.0002149045467376709, -0.00019659101963043213, -0.00017827749252319336, -0.0001599639654159546, -0.00014165043830871582, -0.00012333691120147705, -0.00010502338409423828, -8.670985698699951e-05, -6.839632987976074e-05, -5.008280277252197e-05, -3.17692756652832e-05, -1.3455748558044434e-05, 4.857778549194336e-06, 2.3171305656433105e-05, 4.1484832763671875e-05, 5.9798359870910645e-05, 7.811188697814941e-05, 9.642541408538818e-05, 0.00011473894119262695, 0.00013305246829986572, 0.0001513659954071045, 0.00016967952251434326, 0.00018799304962158203, 0.0002063065767288208, 0.00022462010383605957, 0.00024293363094329834, 0.0002612471580505371, 0.0002795606851577759, 0.00029787421226501465, 0.0003161877393722534, 0.0003345012664794922, 0.00035281479358673096, 0.0003711283206939697, 0.0003894418478012085, 0.00040775537490844727, 0.00042606890201568604, 0.0004443824291229248, 0.0004626959562301636, 0.00048100948333740234, 0.0004993230104446411, 0.0005176365375518799, 0.0005359500646591187, 0.0005542635917663574, 0.0005725771188735962, 0.000590890645980835, 0.0006092041730880737, 0.0006275177001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 10.0, 13.0, 30.0, 36.0, 91.0, 177.0, 345.0, 803.0, 1680.0, 4594.0, 13809.0, 54738.0, 298340.0, 525958.0, 112286.0, 23695.0, 7155.0, 2590.0, 1089.0, 523.0, 270.0, 127.0, 84.0, 33.0, 21.0, 14.0, 10.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0], "bins": [-31.015625, -30.314208984375, -29.61279296875, -28.911376953125, -28.2099609375, -27.508544921875, -26.80712890625, -26.105712890625, -25.404296875, -24.702880859375, -24.00146484375, -23.300048828125, -22.5986328125, -21.897216796875, -21.19580078125, -20.494384765625, -19.79296875, -19.091552734375, -18.39013671875, -17.688720703125, -16.9873046875, -16.285888671875, -15.58447265625, -14.883056640625, -14.181640625, -13.480224609375, -12.77880859375, -12.077392578125, -11.3759765625, -10.674560546875, -9.97314453125, -9.271728515625, -8.5703125, -7.868896484375, -7.16748046875, -6.466064453125, -5.7646484375, -5.063232421875, -4.36181640625, -3.660400390625, -2.958984375, -2.257568359375, -1.55615234375, -0.854736328125, -0.1533203125, 0.548095703125, 1.24951171875, 1.950927734375, 2.65234375, 3.353759765625, 4.05517578125, 4.756591796875, 5.4580078125, 6.159423828125, 6.86083984375, 7.562255859375, 8.263671875, 8.965087890625, 9.66650390625, 10.367919921875, 11.0693359375, 11.770751953125, 12.47216796875, 13.173583984375, 13.875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 6.0, 11.0, 15.0, 18.0, 25.0, 23.0, 24.0, 32.0, 36.0, 37.0, 45.0, 52.0, 52.0, 50.0, 72.0, 46.0, 62.0, 59.0, 42.0, 31.0, 44.0, 36.0, 22.0, 21.0, 22.0, 20.0, 14.0, 13.0, 9.0, 7.0, 9.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6484375, -8.39825439453125, -8.1480712890625, -7.89788818359375, -7.647705078125, -7.39752197265625, -7.1473388671875, -6.89715576171875, -6.64697265625, -6.39678955078125, -6.1466064453125, -5.89642333984375, -5.646240234375, -5.39605712890625, -5.1458740234375, -4.89569091796875, -4.6455078125, -4.39532470703125, -4.1451416015625, -3.89495849609375, -3.644775390625, -3.39459228515625, -3.1444091796875, -2.89422607421875, -2.64404296875, -2.39385986328125, -2.1436767578125, -1.89349365234375, -1.643310546875, -1.39312744140625, -1.1429443359375, -0.89276123046875, -0.642578125, -0.39239501953125, -0.1422119140625, 0.10797119140625, 0.358154296875, 0.60833740234375, 0.8585205078125, 1.10870361328125, 1.35888671875, 1.60906982421875, 1.8592529296875, 2.10943603515625, 2.359619140625, 2.60980224609375, 2.8599853515625, 3.11016845703125, 3.3603515625, 3.61053466796875, 3.8607177734375, 4.11090087890625, 4.361083984375, 4.61126708984375, 4.8614501953125, 5.11163330078125, 5.36181640625, 5.61199951171875, 5.8621826171875, 6.11236572265625, 6.362548828125, 6.61273193359375, 6.8629150390625, 7.11309814453125, 7.36328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 4.0, 5.0, 8.0, 11.0, 17.0, 26.0, 36.0, 94.0, 197.0, 215.0, 191.0, 85.0, 46.0, 24.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.68634033203125, -279.2657470703125, -269.84515380859375, -260.4245300292969, -251.00393676757812, -241.58334350585938, -232.16273498535156, -222.74212646484375, -213.321533203125, -203.90093994140625, -194.48033142089844, -185.05972290039062, -175.63912963867188, -166.21853637695312, -156.7979278564453, -147.3773193359375, -137.95672607421875, -128.5361328125, -119.11552429199219, -109.6949234008789, -100.27432250976562, -90.85372161865234, -81.43312072753906, -72.01251983642578, -62.5919189453125, -53.17131805419922, -43.75071716308594, -34.330116271972656, -24.909515380859375, -15.488914489746094, -6.0683135986328125, 3.3522872924804688, 12.772918701171875, 22.193519592285156, 31.614120483398438, 41.03472137451172, 50.455322265625, 59.87592315673828, 69.29652404785156, 78.71712493896484, 88.13772583007812, 97.5583267211914, 106.97892761230469, 116.39952850341797, 125.82012939453125, 135.24072265625, 144.6613311767578, 154.08193969726562, 163.50253295898438, 172.92312622070312, 182.34373474121094, 191.76434326171875, 201.1849365234375, 210.60552978515625, 220.02613830566406, 229.44674682617188, 238.86734008789062, 248.28793334960938, 257.70855712890625, 267.129150390625, 276.54974365234375, 285.9703369140625, 295.39093017578125, 304.8115539550781, 314.2321472167969]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 9.0, 9.0, 12.0, 12.0, 29.0, 61.0, 88.0, 131.0, 188.0, 139.0, 113.0, 64.0, 40.0, 22.0, 17.0, 6.0, 7.0, 7.0, 6.0, 2.0, 7.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-279.038818359375, -266.829345703125, -254.61988830566406, -242.41043090820312, -230.20095825195312, -217.99148559570312, -205.7820281982422, -193.57257080078125, -181.36309814453125, -169.15362548828125, -156.9441680908203, -144.73471069335938, -132.52523803710938, -120.3157730102539, -108.10630798339844, -95.89684295654297, -83.6873779296875, -71.47791290283203, -59.26844787597656, -47.058982849121094, -34.849517822265625, -22.640052795410156, -10.430587768554688, 1.7788772583007812, 13.98834228515625, 26.19780731201172, 38.40727233886719, 50.616737365722656, 62.826202392578125, 75.0356674194336, 87.24513244628906, 99.45459747314453, 111.6640625, 123.87352752685547, 136.08299255371094, 148.29244995117188, 160.50192260742188, 172.71139526367188, 184.9208526611328, 197.13031005859375, 209.33978271484375, 221.54925537109375, 233.7587127685547, 245.96817016601562, 258.1776428222656, 270.3871154785156, 282.5965576171875, 294.8060302734375, 307.0155029296875, 319.2249755859375, 331.4344482421875, 343.6438903808594, 355.8533630371094, 368.0628356933594, 380.27227783203125, 392.48175048828125, 404.69122314453125, 416.90069580078125, 429.11016845703125, 441.3196105957031, 453.5290832519531, 465.7385559082031, 477.947998046875, 490.157470703125, 502.366943359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 15.0, 17.0, 21.0, 18.0, 55.0, 62.0, 110.0, 208.0, 378.0, 621.0, 1238.0, 2439.0, 5633.0, 14450.0, 48726.0, 295348.0, 3568143.0, 195194.0, 38937.0, 12427.0, 5016.0, 2356.0, 1126.0, 619.0, 405.0, 229.0, 152.0, 94.0, 62.0, 49.0, 28.0, 19.0, 24.0, 16.0, 14.0, 4.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-92.1875, -89.15625, -86.125, -83.09375, -80.0625, -77.03125, -74.0, -70.96875, -67.9375, -64.90625, -61.875, -58.84375, -55.8125, -52.78125, -49.75, -46.71875, -43.6875, -40.65625, -37.625, -34.59375, -31.5625, -28.53125, -25.5, -22.46875, -19.4375, -16.40625, -13.375, -10.34375, -7.3125, -4.28125, -1.25, 1.78125, 4.8125, 7.84375, 10.875, 13.90625, 16.9375, 19.96875, 23.0, 26.03125, 29.0625, 32.09375, 35.125, 38.15625, 41.1875, 44.21875, 47.25, 50.28125, 53.3125, 56.34375, 59.375, 62.40625, 65.4375, 68.46875, 71.5, 74.53125, 77.5625, 80.59375, 83.625, 86.65625, 89.6875, 92.71875, 95.75, 98.78125, 101.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 6.0, 6.0, 15.0, 14.0, 19.0, 21.0, 30.0, 48.0, 71.0, 77.0, 86.0, 88.0, 71.0, 94.0, 77.0, 61.0, 50.0, 40.0, 34.0, 20.0, 19.0, 4.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.96875, -5.77081298828125, -5.5728759765625, -5.37493896484375, -5.177001953125, -4.97906494140625, -4.7811279296875, -4.58319091796875, -4.38525390625, -4.18731689453125, -3.9893798828125, -3.79144287109375, -3.593505859375, -3.39556884765625, -3.1976318359375, -2.99969482421875, -2.8017578125, -2.60382080078125, -2.4058837890625, -2.20794677734375, -2.010009765625, -1.81207275390625, -1.6141357421875, -1.41619873046875, -1.21826171875, -1.02032470703125, -0.8223876953125, -0.62445068359375, -0.426513671875, -0.22857666015625, -0.0306396484375, 0.16729736328125, 0.365234375, 0.56317138671875, 0.7611083984375, 0.95904541015625, 1.156982421875, 1.35491943359375, 1.5528564453125, 1.75079345703125, 1.94873046875, 2.14666748046875, 2.3446044921875, 2.54254150390625, 2.740478515625, 2.93841552734375, 3.1363525390625, 3.33428955078125, 3.5322265625, 3.73016357421875, 3.9281005859375, 4.12603759765625, 4.323974609375, 4.52191162109375, 4.7198486328125, 4.91778564453125, 5.11572265625, 5.31365966796875, 5.5115966796875, 5.70953369140625, 5.907470703125, 6.10540771484375, 6.3033447265625, 6.50128173828125, 6.69921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 8.0, 13.0, 15.0, 26.0, 41.0, 40.0, 58.0, 84.0, 123.0, 172.0, 260.0, 379.0, 613.0, 877.0, 1471.0, 2372.0, 4150.0, 7323.0, 13225.0, 26512.0, 55798.0, 131504.0, 384781.0, 2517491.0, 699401.0, 194664.0, 77385.0, 35555.0, 17452.0, 9329.0, 5139.0, 2973.0, 1786.0, 1107.0, 708.0, 427.0, 300.0, 214.0, 136.0, 115.0, 73.0, 50.0, 37.0, 26.0, 16.0, 11.0, 11.0, 8.0, 2.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0], "bins": [-52.1875, -50.591796875, -48.99609375, -47.400390625, -45.8046875, -44.208984375, -42.61328125, -41.017578125, -39.421875, -37.826171875, -36.23046875, -34.634765625, -33.0390625, -31.443359375, -29.84765625, -28.251953125, -26.65625, -25.060546875, -23.46484375, -21.869140625, -20.2734375, -18.677734375, -17.08203125, -15.486328125, -13.890625, -12.294921875, -10.69921875, -9.103515625, -7.5078125, -5.912109375, -4.31640625, -2.720703125, -1.125, 0.470703125, 2.06640625, 3.662109375, 5.2578125, 6.853515625, 8.44921875, 10.044921875, 11.640625, 13.236328125, 14.83203125, 16.427734375, 18.0234375, 19.619140625, 21.21484375, 22.810546875, 24.40625, 26.001953125, 27.59765625, 29.193359375, 30.7890625, 32.384765625, 33.98046875, 35.576171875, 37.171875, 38.767578125, 40.36328125, 41.958984375, 43.5546875, 45.150390625, 46.74609375, 48.341796875, 49.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 9.0, 22.0, 23.0, 24.0, 29.0, 49.0, 61.0, 84.0, 82.0, 133.0, 182.0, 289.0, 551.0, 1281.0, 407.0, 216.0, 161.0, 106.0, 70.0, 66.0, 40.0, 33.0, 25.0, 19.0, 10.0, 10.0, 13.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 6.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1490478515625, -8.813720703125, -8.4783935546875, -8.14306640625, -7.8077392578125, -7.472412109375, -7.1370849609375, -6.8017578125, -6.4664306640625, -6.131103515625, -5.7957763671875, -5.46044921875, -5.1251220703125, -4.789794921875, -4.4544677734375, -4.119140625, -3.7838134765625, -3.448486328125, -3.1131591796875, -2.77783203125, -2.4425048828125, -2.107177734375, -1.7718505859375, -1.4365234375, -1.1011962890625, -0.765869140625, -0.4305419921875, -0.09521484375, 0.2401123046875, 0.575439453125, 0.9107666015625, 1.24609375, 1.5814208984375, 1.916748046875, 2.2520751953125, 2.58740234375, 2.9227294921875, 3.258056640625, 3.5933837890625, 3.9287109375, 4.2640380859375, 4.599365234375, 4.9346923828125, 5.27001953125, 5.6053466796875, 5.940673828125, 6.2760009765625, 6.611328125, 6.9466552734375, 7.281982421875, 7.6173095703125, 7.95263671875, 8.2879638671875, 8.623291015625, 8.9586181640625, 9.2939453125, 9.6292724609375, 9.964599609375, 10.2999267578125, 10.63525390625, 10.9705810546875, 11.305908203125, 11.6412353515625, 11.9765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 16.0, 9.0, 21.0, 45.0, 70.0, 117.0, 183.0, 184.0, 135.0, 104.0, 52.0, 36.0, 17.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.76976013183594, -143.60548400878906, -139.44122314453125, -135.27694702148438, -131.11268615722656, -126.94841766357422, -122.78414916992188, -118.619873046875, -114.45561218261719, -110.29134368896484, -106.1270751953125, -101.96280670166016, -97.79853820800781, -93.63426971435547, -89.47000122070312, -85.30572509765625, -81.1414566040039, -76.97718811035156, -72.81291961669922, -68.64865112304688, -64.48438262939453, -60.32011413574219, -56.15584182739258, -51.991573333740234, -47.82730484008789, -43.66303634643555, -39.4987678527832, -35.334495544433594, -31.170228958129883, -27.00596046447754, -22.841690063476562, -18.67742156982422, -14.513153076171875, -10.348884582519531, -6.184615135192871, -2.020345687866211, 2.143922805786133, 6.308191299438477, 10.472461700439453, 14.636730194091797, 18.80099868774414, 22.965267181396484, 27.129535675048828, 31.293806076049805, 35.45807647705078, 39.622344970703125, 43.78661346435547, 47.95088195800781, 52.115150451660156, 56.2794189453125, 60.443687438964844, 64.60795593261719, 68.77222442626953, 72.93649291992188, 77.10076904296875, 81.26502990722656, 85.42930603027344, 89.59357452392578, 93.75784301757812, 97.92211151123047, 102.08638000488281, 106.25064849853516, 110.4149169921875, 114.57919311523438, 118.74345397949219]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 17.0, 16.0, 17.0, 26.0, 31.0, 34.0, 47.0, 49.0, 67.0, 54.0, 77.0, 74.0, 78.0, 78.0, 59.0, 45.0, 46.0, 41.0, 28.0, 28.0, 15.0, 17.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.56741333007812, -62.397796630859375, -60.228179931640625, -58.05856704711914, -55.88895034790039, -53.71933364868164, -51.549720764160156, -49.380104064941406, -47.210487365722656, -45.040870666503906, -42.871253967285156, -40.70164108276367, -38.53202438354492, -36.36240768432617, -34.19279479980469, -32.02317810058594, -29.853561401367188, -27.683944702148438, -25.51432991027832, -23.344715118408203, -21.175098419189453, -19.005481719970703, -16.835866928100586, -14.666251182556152, -12.496635437011719, -10.327019691467285, -8.157403945922852, -5.987788200378418, -3.8181724548339844, -1.6485567092895508, 0.5210590362548828, 2.6906747817993164, 4.86029052734375, 7.029906272888184, 9.199522018432617, 11.36913776397705, 13.538753509521484, 15.708369255065918, 17.87798500061035, 20.04759979248047, 22.21721649169922, 24.38683319091797, 26.556447982788086, 28.726062774658203, 30.895679473876953, 33.0652961730957, 35.23490905761719, 37.40452575683594, 39.57414245605469, 41.74375915527344, 43.91337585449219, 46.08298873901367, 48.25260543823242, 50.42222213745117, 52.591835021972656, 54.761451721191406, 56.931068420410156, 59.100685119628906, 61.270301818847656, 63.43991470336914, 65.60952758789062, 67.77914428710938, 69.94876098632812, 72.11837768554688, 74.28799438476562]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 11.0, 9.0, 13.0, 18.0, 26.0, 30.0, 38.0, 65.0, 112.0, 129.0, 210.0, 337.0, 510.0, 737.0, 1320.0, 2262.0, 4081.0, 7763.0, 15312.0, 34157.0, 88838.0, 294557.0, 389424.0, 123975.0, 44444.0, 19061.0, 9352.0, 4948.0, 2720.0, 1541.0, 882.0, 585.0, 337.0, 238.0, 160.0, 106.0, 78.0, 42.0, 31.0, 27.0, 16.0, 17.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-46.25, -44.93408203125, -43.6181640625, -42.30224609375, -40.986328125, -39.67041015625, -38.3544921875, -37.03857421875, -35.72265625, -34.40673828125, -33.0908203125, -31.77490234375, -30.458984375, -29.14306640625, -27.8271484375, -26.51123046875, -25.1953125, -23.87939453125, -22.5634765625, -21.24755859375, -19.931640625, -18.61572265625, -17.2998046875, -15.98388671875, -14.66796875, -13.35205078125, -12.0361328125, -10.72021484375, -9.404296875, -8.08837890625, -6.7724609375, -5.45654296875, -4.140625, -2.82470703125, -1.5087890625, -0.19287109375, 1.123046875, 2.43896484375, 3.7548828125, 5.07080078125, 6.38671875, 7.70263671875, 9.0185546875, 10.33447265625, 11.650390625, 12.96630859375, 14.2822265625, 15.59814453125, 16.9140625, 18.22998046875, 19.5458984375, 20.86181640625, 22.177734375, 23.49365234375, 24.8095703125, 26.12548828125, 27.44140625, 28.75732421875, 30.0732421875, 31.38916015625, 32.705078125, 34.02099609375, 35.3369140625, 36.65283203125, 37.96875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 16.0, 13.0, 21.0, 28.0, 32.0, 31.0, 34.0, 39.0, 58.0, 53.0, 53.0, 51.0, 62.0, 46.0, 53.0, 52.0, 48.0, 46.0, 43.0, 24.0, 26.0, 13.0, 15.0, 18.0, 22.0, 10.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.18487548828125, -3.0494384765625, -2.91400146484375, -2.778564453125, -2.64312744140625, -2.5076904296875, -2.37225341796875, -2.23681640625, -2.10137939453125, -1.9659423828125, -1.83050537109375, -1.695068359375, -1.55963134765625, -1.4241943359375, -1.28875732421875, -1.1533203125, -1.01788330078125, -0.8824462890625, -0.74700927734375, -0.611572265625, -0.47613525390625, -0.3406982421875, -0.20526123046875, -0.06982421875, 0.06561279296875, 0.2010498046875, 0.33648681640625, 0.471923828125, 0.60736083984375, 0.7427978515625, 0.87823486328125, 1.013671875, 1.14910888671875, 1.2845458984375, 1.41998291015625, 1.555419921875, 1.69085693359375, 1.8262939453125, 1.96173095703125, 2.09716796875, 2.23260498046875, 2.3680419921875, 2.50347900390625, 2.638916015625, 2.77435302734375, 2.9097900390625, 3.04522705078125, 3.1806640625, 3.31610107421875, 3.4515380859375, 3.58697509765625, 3.722412109375, 3.85784912109375, 3.9932861328125, 4.12872314453125, 4.26416015625, 4.39959716796875, 4.5350341796875, 4.67047119140625, 4.805908203125, 4.94134521484375, 5.0767822265625, 5.21221923828125, 5.34765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 11.0, 15.0, 13.0, 12.0, 34.0, 64.0, 95.0, 169.0, 252.0, 422.0, 702.0, 1296.0, 2318.0, 4736.0, 10787.0, 30130.0, 119837.0, 538181.0, 257745.0, 51965.0, 16193.0, 6687.0, 3114.0, 1611.0, 893.0, 447.0, 301.0, 191.0, 110.0, 75.0, 49.0, 36.0, 30.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.09375, -55.5390625, -53.984375, -52.4296875, -50.875, -49.3203125, -47.765625, -46.2109375, -44.65625, -43.1015625, -41.546875, -39.9921875, -38.4375, -36.8828125, -35.328125, -33.7734375, -32.21875, -30.6640625, -29.109375, -27.5546875, -26.0, -24.4453125, -22.890625, -21.3359375, -19.78125, -18.2265625, -16.671875, -15.1171875, -13.5625, -12.0078125, -10.453125, -8.8984375, -7.34375, -5.7890625, -4.234375, -2.6796875, -1.125, 0.4296875, 1.984375, 3.5390625, 5.09375, 6.6484375, 8.203125, 9.7578125, 11.3125, 12.8671875, 14.421875, 15.9765625, 17.53125, 19.0859375, 20.640625, 22.1953125, 23.75, 25.3046875, 26.859375, 28.4140625, 29.96875, 31.5234375, 33.078125, 34.6328125, 36.1875, 37.7421875, 39.296875, 40.8515625, 42.40625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 4.0, 13.0, 10.0, 25.0, 25.0, 28.0, 29.0, 38.0, 45.0, 45.0, 47.0, 55.0, 67.0, 67.0, 45.0, 52.0, 56.0, 49.0, 54.0, 37.0, 37.0, 24.0, 23.0, 24.0, 18.0, 9.0, 14.0, 5.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-27.546875, -26.780517578125, -26.01416015625, -25.247802734375, -24.4814453125, -23.715087890625, -22.94873046875, -22.182373046875, -21.416015625, -20.649658203125, -19.88330078125, -19.116943359375, -18.3505859375, -17.584228515625, -16.81787109375, -16.051513671875, -15.28515625, -14.518798828125, -13.75244140625, -12.986083984375, -12.2197265625, -11.453369140625, -10.68701171875, -9.920654296875, -9.154296875, -8.387939453125, -7.62158203125, -6.855224609375, -6.0888671875, -5.322509765625, -4.55615234375, -3.789794921875, -3.0234375, -2.257080078125, -1.49072265625, -0.724365234375, 0.0419921875, 0.808349609375, 1.57470703125, 2.341064453125, 3.107421875, 3.873779296875, 4.64013671875, 5.406494140625, 6.1728515625, 6.939208984375, 7.70556640625, 8.471923828125, 9.23828125, 10.004638671875, 10.77099609375, 11.537353515625, 12.3037109375, 13.070068359375, 13.83642578125, 14.602783203125, 15.369140625, 16.135498046875, 16.90185546875, 17.668212890625, 18.4345703125, 19.200927734375, 19.96728515625, 20.733642578125, 21.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 12.0, 16.0, 30.0, 39.0, 51.0, 86.0, 143.0, 234.0, 347.0, 689.0, 1214.0, 2421.0, 5014.0, 11318.0, 27354.0, 73868.0, 205429.0, 368866.0, 219371.0, 79557.0, 29517.0, 11961.0, 5357.0, 2623.0, 1280.0, 675.0, 403.0, 226.0, 136.0, 85.0, 86.0, 37.0, 26.0, 22.0, 15.0, 6.0, 9.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.71875, -27.88720703125, -27.0556640625, -26.22412109375, -25.392578125, -24.56103515625, -23.7294921875, -22.89794921875, -22.06640625, -21.23486328125, -20.4033203125, -19.57177734375, -18.740234375, -17.90869140625, -17.0771484375, -16.24560546875, -15.4140625, -14.58251953125, -13.7509765625, -12.91943359375, -12.087890625, -11.25634765625, -10.4248046875, -9.59326171875, -8.76171875, -7.93017578125, -7.0986328125, -6.26708984375, -5.435546875, -4.60400390625, -3.7724609375, -2.94091796875, -2.109375, -1.27783203125, -0.4462890625, 0.38525390625, 1.216796875, 2.04833984375, 2.8798828125, 3.71142578125, 4.54296875, 5.37451171875, 6.2060546875, 7.03759765625, 7.869140625, 8.70068359375, 9.5322265625, 10.36376953125, 11.1953125, 12.02685546875, 12.8583984375, 13.68994140625, 14.521484375, 15.35302734375, 16.1845703125, 17.01611328125, 17.84765625, 18.67919921875, 19.5107421875, 20.34228515625, 21.173828125, 22.00537109375, 22.8369140625, 23.66845703125, 24.5]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 0.0, 5.0, 4.0, 4.0, 5.0, 9.0, 18.0, 27.0, 62.0, 94.0, 139.0, 167.0, 197.0, 101.0, 75.0, 31.0, 11.0, 8.0, 6.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0028076171875, -0.0027156472206115723, -0.0026236772537231445, -0.002531707286834717, -0.002439737319946289, -0.0023477673530578613, -0.0022557973861694336, -0.002163827419281006, -0.002071857452392578, -0.0019798874855041504, -0.0018879175186157227, -0.001795947551727295, -0.0017039775848388672, -0.0016120076179504395, -0.0015200376510620117, -0.001428067684173584, -0.0013360977172851562, -0.0012441277503967285, -0.0011521577835083008, -0.001060187816619873, -0.0009682178497314453, -0.0008762478828430176, -0.0007842779159545898, -0.0006923079490661621, -0.0006003379821777344, -0.0005083680152893066, -0.0004163980484008789, -0.00032442808151245117, -0.00023245811462402344, -0.0001404881477355957, -4.851818084716797e-05, 4.3451786041259766e-05, 0.0001354217529296875, 0.00022739171981811523, 0.00031936168670654297, 0.0004113316535949707, 0.0005033016204833984, 0.0005952715873718262, 0.0006872415542602539, 0.0007792115211486816, 0.0008711814880371094, 0.0009631514549255371, 0.0010551214218139648, 0.0011470913887023926, 0.0012390613555908203, 0.001331031322479248, 0.0014230012893676758, 0.0015149712562561035, 0.0016069412231445312, 0.001698911190032959, 0.0017908811569213867, 0.0018828511238098145, 0.001974821090698242, 0.00206679105758667, 0.0021587610244750977, 0.0022507309913635254, 0.002342700958251953, 0.002434670925140381, 0.0025266408920288086, 0.0026186108589172363, 0.002710580825805664, 0.002802550792694092, 0.0028945207595825195, 0.0029864907264709473, 0.003078460693359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 6.0, 5.0, 11.0, 20.0, 29.0, 62.0, 132.0, 215.0, 475.0, 1170.0, 2880.0, 7611.0, 25205.0, 99677.0, 385549.0, 387426.0, 100677.0, 24881.0, 7545.0, 2783.0, 1108.0, 500.0, 276.0, 129.0, 78.0, 36.0, 19.0, 14.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-49.125, -47.865478515625, -46.60595703125, -45.346435546875, -44.0869140625, -42.827392578125, -41.56787109375, -40.308349609375, -39.048828125, -37.789306640625, -36.52978515625, -35.270263671875, -34.0107421875, -32.751220703125, -31.49169921875, -30.232177734375, -28.97265625, -27.713134765625, -26.45361328125, -25.194091796875, -23.9345703125, -22.675048828125, -21.41552734375, -20.156005859375, -18.896484375, -17.636962890625, -16.37744140625, -15.117919921875, -13.8583984375, -12.598876953125, -11.33935546875, -10.079833984375, -8.8203125, -7.560791015625, -6.30126953125, -5.041748046875, -3.7822265625, -2.522705078125, -1.26318359375, -0.003662109375, 1.255859375, 2.515380859375, 3.77490234375, 5.034423828125, 6.2939453125, 7.553466796875, 8.81298828125, 10.072509765625, 11.33203125, 12.591552734375, 13.85107421875, 15.110595703125, 16.3701171875, 17.629638671875, 18.88916015625, 20.148681640625, 21.408203125, 22.667724609375, 23.92724609375, 25.186767578125, 26.4462890625, 27.705810546875, 28.96533203125, 30.224853515625, 31.484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 6.0, 10.0, 7.0, 7.0, 17.0, 14.0, 17.0, 29.0, 25.0, 33.0, 48.0, 64.0, 63.0, 61.0, 63.0, 62.0, 84.0, 69.0, 59.0, 60.0, 35.0, 39.0, 25.0, 29.0, 21.0, 9.0, 4.0, 9.0, 13.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.177978515625, -10.69970703125, -10.221435546875, -9.7431640625, -9.264892578125, -8.78662109375, -8.308349609375, -7.830078125, -7.351806640625, -6.87353515625, -6.395263671875, -5.9169921875, -5.438720703125, -4.96044921875, -4.482177734375, -4.00390625, -3.525634765625, -3.04736328125, -2.569091796875, -2.0908203125, -1.612548828125, -1.13427734375, -0.656005859375, -0.177734375, 0.300537109375, 0.77880859375, 1.257080078125, 1.7353515625, 2.213623046875, 2.69189453125, 3.170166015625, 3.6484375, 4.126708984375, 4.60498046875, 5.083251953125, 5.5615234375, 6.039794921875, 6.51806640625, 6.996337890625, 7.474609375, 7.952880859375, 8.43115234375, 8.909423828125, 9.3876953125, 9.865966796875, 10.34423828125, 10.822509765625, 11.30078125, 11.779052734375, 12.25732421875, 12.735595703125, 13.2138671875, 13.692138671875, 14.17041015625, 14.648681640625, 15.126953125, 15.605224609375, 16.08349609375, 16.561767578125, 17.0400390625, 17.518310546875, 17.99658203125, 18.474853515625, 18.953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 11.0, 7.0, 12.0, 18.0, 31.0, 77.0, 118.0, 150.0, 165.0, 146.0, 103.0, 71.0, 50.0, 21.0, 9.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.26101684570312, -167.6498260498047, -158.03863525390625, -148.42745971679688, -138.81626892089844, -129.205078125, -119.59388732910156, -109.98270416259766, -100.37151336669922, -90.76032257080078, -81.14913940429688, -71.53794860839844, -61.926761627197266, -52.315574645996094, -42.704383850097656, -33.09320068359375, -23.482009887695312, -13.870821952819824, -4.259634017944336, 5.351554870605469, 14.96274185180664, 24.573928833007812, 34.18511962890625, 43.796302795410156, 53.407493591308594, 63.018680572509766, 72.62986755371094, 82.24105834960938, 91.85224914550781, 101.46343231201172, 111.07462310791016, 120.68580627441406, 130.2969970703125, 139.90818786621094, 149.51937866210938, 159.13055419921875, 168.7417449951172, 178.35293579101562, 187.96412658691406, 197.5753173828125, 207.18649291992188, 216.7976837158203, 226.40887451171875, 236.02005004882812, 245.63124084472656, 255.242431640625, 264.8536376953125, 274.4648132324219, 284.07598876953125, 293.6871643066406, 303.2983703613281, 312.9095458984375, 322.520751953125, 332.1319274902344, 341.74310302734375, 351.35430908203125, 360.96551513671875, 370.5766906738281, 380.1878967285156, 389.799072265625, 399.4102783203125, 409.0214538574219, 418.63262939453125, 428.24383544921875, 437.8550109863281]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 3.0, 9.0, 9.0, 12.0, 11.0, 17.0, 21.0, 29.0, 35.0, 35.0, 51.0, 53.0, 58.0, 70.0, 52.0, 60.0, 52.0, 64.0, 45.0, 46.0, 45.0, 38.0, 35.0, 33.0, 23.0, 19.0, 14.0, 9.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-159.87094116210938, -154.9088897705078, -149.94683837890625, -144.98477172851562, -140.02272033691406, -135.0606689453125, -130.09861755371094, -125.13656616210938, -120.17450714111328, -115.21245574951172, -110.25039672851562, -105.28834533691406, -100.3262939453125, -95.3642349243164, -90.40218353271484, -85.44012451171875, -80.47807312011719, -75.51602172851562, -70.55396270751953, -65.59191131591797, -60.62985610961914, -55.66780090332031, -50.70574951171875, -45.74369430541992, -40.781639099121094, -35.819583892822266, -30.85753059387207, -25.895477294921875, -20.933422088623047, -15.971366882324219, -11.009313583374023, -6.047260284423828, -1.085205078125, 3.8768491744995117, 8.838903427124023, 13.800957679748535, 18.763011932373047, 23.725067138671875, 28.68712043762207, 33.649173736572266, 38.611228942871094, 43.57328414916992, 48.53533935546875, 53.49739074707031, 58.45944595336914, 63.42150115966797, 68.38355255126953, 73.34561157226562, 78.30766296386719, 83.26971435546875, 88.23177337646484, 93.1938247680664, 98.1558837890625, 103.11793518066406, 108.07998657226562, 113.04203796386719, 118.00409698486328, 122.96614837646484, 127.92820739746094, 132.8902587890625, 137.85231018066406, 142.81436157226562, 147.77642822265625, 152.7384796142578, 157.70053100585938]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 10.0, 20.0, 36.0, 47.0, 77.0, 123.0, 199.0, 352.0, 581.0, 1109.0, 2012.0, 3887.0, 8059.0, 18143.0, 47206.0, 182247.0, 3342556.0, 456421.0, 79857.0, 27346.0, 11726.0, 5552.0, 2849.0, 1561.0, 855.0, 497.0, 329.0, 198.0, 102.0, 96.0, 65.0, 38.0, 33.0, 20.0, 13.0, 15.0, 5.0, 4.0, 6.0, 8.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-90.8125, -87.2822265625, -83.751953125, -80.2216796875, -76.69140625, -73.1611328125, -69.630859375, -66.1005859375, -62.5703125, -59.0400390625, -55.509765625, -51.9794921875, -48.44921875, -44.9189453125, -41.388671875, -37.8583984375, -34.328125, -30.7978515625, -27.267578125, -23.7373046875, -20.20703125, -16.6767578125, -13.146484375, -9.6162109375, -6.0859375, -2.5556640625, 0.974609375, 4.5048828125, 8.03515625, 11.5654296875, 15.095703125, 18.6259765625, 22.15625, 25.6865234375, 29.216796875, 32.7470703125, 36.27734375, 39.8076171875, 43.337890625, 46.8681640625, 50.3984375, 53.9287109375, 57.458984375, 60.9892578125, 64.51953125, 68.0498046875, 71.580078125, 75.1103515625, 78.640625, 82.1708984375, 85.701171875, 89.2314453125, 92.76171875, 96.2919921875, 99.822265625, 103.3525390625, 106.8828125, 110.4130859375, 113.943359375, 117.4736328125, 121.00390625, 124.5341796875, 128.064453125, 131.5947265625, 135.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 8.0, 14.0, 15.0, 20.0, 25.0, 33.0, 50.0, 48.0, 53.0, 61.0, 66.0, 72.0, 61.0, 83.0, 57.0, 60.0, 64.0, 48.0, 25.0, 21.0, 30.0, 18.0, 14.0, 15.0, 7.0, 10.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.35711669921875, -4.1712646484375, -3.98541259765625, -3.799560546875, -3.61370849609375, -3.4278564453125, -3.24200439453125, -3.05615234375, -2.87030029296875, -2.6844482421875, -2.49859619140625, -2.312744140625, -2.12689208984375, -1.9410400390625, -1.75518798828125, -1.5693359375, -1.38348388671875, -1.1976318359375, -1.01177978515625, -0.825927734375, -0.64007568359375, -0.4542236328125, -0.26837158203125, -0.08251953125, 0.10333251953125, 0.2891845703125, 0.47503662109375, 0.660888671875, 0.84674072265625, 1.0325927734375, 1.21844482421875, 1.404296875, 1.59014892578125, 1.7760009765625, 1.96185302734375, 2.147705078125, 2.33355712890625, 2.5194091796875, 2.70526123046875, 2.89111328125, 3.07696533203125, 3.2628173828125, 3.44866943359375, 3.634521484375, 3.82037353515625, 4.0062255859375, 4.19207763671875, 4.3779296875, 4.56378173828125, 4.7496337890625, 4.93548583984375, 5.121337890625, 5.30718994140625, 5.4930419921875, 5.67889404296875, 5.86474609375, 6.05059814453125, 6.2364501953125, 6.42230224609375, 6.608154296875, 6.79400634765625, 6.9798583984375, 7.16571044921875, 7.3515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 9.0, 5.0, 14.0, 15.0, 21.0, 23.0, 29.0, 42.0, 62.0, 96.0, 194.0, 368.0, 907.0, 2926.0, 13667.0, 107921.0, 3468250.0, 550047.0, 40180.0, 6636.0, 1637.0, 536.0, 242.0, 117.0, 95.0, 61.0, 39.0, 21.0, 18.0, 16.0, 19.0, 5.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-210.625, -203.306640625, -195.98828125, -188.669921875, -181.3515625, -174.033203125, -166.71484375, -159.396484375, -152.078125, -144.759765625, -137.44140625, -130.123046875, -122.8046875, -115.486328125, -108.16796875, -100.849609375, -93.53125, -86.212890625, -78.89453125, -71.576171875, -64.2578125, -56.939453125, -49.62109375, -42.302734375, -34.984375, -27.666015625, -20.34765625, -13.029296875, -5.7109375, 1.607421875, 8.92578125, 16.244140625, 23.5625, 30.880859375, 38.19921875, 45.517578125, 52.8359375, 60.154296875, 67.47265625, 74.791015625, 82.109375, 89.427734375, 96.74609375, 104.064453125, 111.3828125, 118.701171875, 126.01953125, 133.337890625, 140.65625, 147.974609375, 155.29296875, 162.611328125, 169.9296875, 177.248046875, 184.56640625, 191.884765625, 199.203125, 206.521484375, 213.83984375, 221.158203125, 228.4765625, 235.794921875, 243.11328125, 250.431640625, 257.75]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 6.0, 7.0, 6.0, 15.0, 23.0, 23.0, 33.0, 50.0, 51.0, 78.0, 94.0, 143.0, 237.0, 398.0, 1306.0, 596.0, 296.0, 187.0, 116.0, 95.0, 65.0, 51.0, 38.0, 27.0, 20.0, 16.0, 10.0, 13.0, 8.0, 12.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.1153564453125, -16.636962890625, -16.1585693359375, -15.68017578125, -15.2017822265625, -14.723388671875, -14.2449951171875, -13.7666015625, -13.2882080078125, -12.809814453125, -12.3314208984375, -11.85302734375, -11.3746337890625, -10.896240234375, -10.4178466796875, -9.939453125, -9.4610595703125, -8.982666015625, -8.5042724609375, -8.02587890625, -7.5474853515625, -7.069091796875, -6.5906982421875, -6.1123046875, -5.6339111328125, -5.155517578125, -4.6771240234375, -4.19873046875, -3.7203369140625, -3.241943359375, -2.7635498046875, -2.28515625, -1.8067626953125, -1.328369140625, -0.8499755859375, -0.37158203125, 0.1068115234375, 0.585205078125, 1.0635986328125, 1.5419921875, 2.0203857421875, 2.498779296875, 2.9771728515625, 3.45556640625, 3.9339599609375, 4.412353515625, 4.8907470703125, 5.369140625, 5.8475341796875, 6.325927734375, 6.8043212890625, 7.28271484375, 7.7611083984375, 8.239501953125, 8.7178955078125, 9.1962890625, 9.6746826171875, 10.153076171875, 10.6314697265625, 11.10986328125, 11.5882568359375, 12.066650390625, 12.5450439453125, 13.0234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 5.0, 9.0, 10.0, 20.0, 38.0, 52.0, 76.0, 101.0, 115.0, 146.0, 102.0, 112.0, 61.0, 55.0, 38.0, 26.0, 14.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.0250701904297, -195.2325897216797, -190.4401092529297, -185.64764404296875, -180.85516357421875, -176.06268310546875, -171.27020263671875, -166.47772216796875, -161.6852569580078, -156.8927764892578, -152.1002960205078, -147.30783081054688, -142.51535034179688, -137.72286987304688, -132.93038940429688, -128.13790893554688, -123.3454360961914, -118.5529556274414, -113.76048278808594, -108.96800231933594, -104.17552947998047, -99.38304901123047, -94.590576171875, -89.798095703125, -85.005615234375, -80.213134765625, -75.42066192626953, -70.62818145751953, -65.83570861816406, -61.04322814941406, -56.25075149536133, -51.458274841308594, -46.665809631347656, -41.87333297729492, -37.08085632324219, -32.28837585449219, -27.495901107788086, -22.70342445373535, -17.910945892333984, -13.11846923828125, -8.325992584228516, -3.533515453338623, 1.2589616775512695, 6.05143928527832, 10.843915939331055, 15.636392593383789, 20.428871154785156, 25.22134780883789, 30.013824462890625, 34.80630111694336, 39.598777770996094, 44.391258239746094, 49.18373107910156, 53.97621154785156, 58.7686882019043, 63.56116485595703, 68.3536376953125, 73.1461181640625, 77.93859100341797, 82.73107147216797, 87.52354431152344, 92.31602478027344, 97.10850524902344, 101.9009780883789, 106.6934585571289]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 17.0, 15.0, 15.0, 12.0, 19.0, 35.0, 25.0, 36.0, 31.0, 34.0, 36.0, 43.0, 47.0, 52.0, 38.0, 37.0, 51.0, 42.0, 39.0, 50.0, 44.0, 35.0, 29.0, 30.0, 38.0, 22.0, 17.0, 8.0, 9.0, 11.0, 10.0, 9.0, 14.0, 7.0, 7.0, 3.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.94207000732422, -68.9043960571289, -66.8667221069336, -64.82904052734375, -62.79136657714844, -60.753692626953125, -58.71601867675781, -56.678340911865234, -54.640663146972656, -52.602989196777344, -50.565311431884766, -48.52763748168945, -46.489959716796875, -44.45228576660156, -42.41461181640625, -40.37693405151367, -38.33926010131836, -36.30158615112305, -34.26390838623047, -32.226234436035156, -30.188556671142578, -28.150882720947266, -26.11320686340332, -24.075531005859375, -22.03785514831543, -20.000179290771484, -17.96250343322754, -15.92482852935791, -13.887152671813965, -11.84947681427002, -9.81180191040039, -7.774126052856445, -5.7364501953125, -3.698774576187134, -1.6610989570617676, 0.37657642364501953, 2.414252281188965, 4.45192813873291, 6.489603042602539, 8.527278900146484, 10.56495475769043, 12.602630615234375, 14.64030647277832, 16.677982330322266, 18.715656280517578, 20.753334045410156, 22.79100799560547, 24.828683853149414, 26.86635971069336, 28.904035568237305, 30.94171142578125, 32.97938537597656, 35.01706314086914, 37.05473709106445, 39.09241485595703, 41.130088806152344, 43.167762756347656, 45.20543670654297, 47.24311447143555, 49.28078842163086, 51.31846618652344, 53.35614013671875, 55.39381408691406, 57.43149185180664, 59.46916961669922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 10.0, 8.0, 8.0, 7.0, 14.0, 21.0, 37.0, 60.0, 73.0, 121.0, 125.0, 242.0, 326.0, 507.0, 749.0, 1133.0, 1744.0, 2723.0, 4102.0, 6512.0, 10437.0, 16182.0, 26064.0, 41075.0, 64266.0, 97296.0, 137524.0, 165767.0, 151517.0, 111916.0, 75525.0, 48805.0, 30911.0, 19095.0, 12086.0, 7444.0, 4882.0, 3132.0, 1997.0, 1361.0, 873.0, 572.0, 446.0, 265.0, 178.0, 138.0, 89.0, 85.0, 36.0, 21.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-30.765625, -29.762939453125, -28.76025390625, -27.757568359375, -26.7548828125, -25.752197265625, -24.74951171875, -23.746826171875, -22.744140625, -21.741455078125, -20.73876953125, -19.736083984375, -18.7333984375, -17.730712890625, -16.72802734375, -15.725341796875, -14.72265625, -13.719970703125, -12.71728515625, -11.714599609375, -10.7119140625, -9.709228515625, -8.70654296875, -7.703857421875, -6.701171875, -5.698486328125, -4.69580078125, -3.693115234375, -2.6904296875, -1.687744140625, -0.68505859375, 0.317626953125, 1.3203125, 2.322998046875, 3.32568359375, 4.328369140625, 5.3310546875, 6.333740234375, 7.33642578125, 8.339111328125, 9.341796875, 10.344482421875, 11.34716796875, 12.349853515625, 13.3525390625, 14.355224609375, 15.35791015625, 16.360595703125, 17.36328125, 18.365966796875, 19.36865234375, 20.371337890625, 21.3740234375, 22.376708984375, 23.37939453125, 24.382080078125, 25.384765625, 26.387451171875, 27.39013671875, 28.392822265625, 29.3955078125, 30.398193359375, 31.40087890625, 32.403564453125, 33.40625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 6.0, 9.0, 14.0, 7.0, 17.0, 12.0, 15.0, 12.0, 24.0, 28.0, 37.0, 36.0, 37.0, 44.0, 47.0, 39.0, 48.0, 53.0, 47.0, 41.0, 43.0, 42.0, 41.0, 56.0, 41.0, 22.0, 21.0, 30.0, 23.0, 18.0, 19.0, 13.0, 10.0, 5.0, 5.0, 12.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.30078125, -4.15350341796875, -4.0062255859375, -3.85894775390625, -3.711669921875, -3.56439208984375, -3.4171142578125, -3.26983642578125, -3.12255859375, -2.97528076171875, -2.8280029296875, -2.68072509765625, -2.533447265625, -2.38616943359375, -2.2388916015625, -2.09161376953125, -1.9443359375, -1.79705810546875, -1.6497802734375, -1.50250244140625, -1.355224609375, -1.20794677734375, -1.0606689453125, -0.91339111328125, -0.76611328125, -0.61883544921875, -0.4715576171875, -0.32427978515625, -0.177001953125, -0.02972412109375, 0.1175537109375, 0.26483154296875, 0.412109375, 0.55938720703125, 0.7066650390625, 0.85394287109375, 1.001220703125, 1.14849853515625, 1.2957763671875, 1.44305419921875, 1.59033203125, 1.73760986328125, 1.8848876953125, 2.03216552734375, 2.179443359375, 2.32672119140625, 2.4739990234375, 2.62127685546875, 2.7685546875, 2.91583251953125, 3.0631103515625, 3.21038818359375, 3.357666015625, 3.50494384765625, 3.6522216796875, 3.79949951171875, 3.94677734375, 4.09405517578125, 4.2413330078125, 4.38861083984375, 4.535888671875, 4.68316650390625, 4.8304443359375, 4.97772216796875, 5.125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 16.0, 21.0, 33.0, 37.0, 46.0, 87.0, 116.0, 193.0, 273.0, 409.0, 685.0, 1219.0, 2376.0, 4774.0, 11107.0, 27280.0, 71923.0, 181802.0, 336640.0, 242497.0, 101013.0, 38078.0, 14857.0, 6323.0, 2931.0, 1506.0, 836.0, 498.0, 321.0, 217.0, 161.0, 83.0, 56.0, 48.0, 27.0, 21.0, 13.0, 9.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -76.279296875, -73.87109375, -71.462890625, -69.0546875, -66.646484375, -64.23828125, -61.830078125, -59.421875, -57.013671875, -54.60546875, -52.197265625, -49.7890625, -47.380859375, -44.97265625, -42.564453125, -40.15625, -37.748046875, -35.33984375, -32.931640625, -30.5234375, -28.115234375, -25.70703125, -23.298828125, -20.890625, -18.482421875, -16.07421875, -13.666015625, -11.2578125, -8.849609375, -6.44140625, -4.033203125, -1.625, 0.783203125, 3.19140625, 5.599609375, 8.0078125, 10.416015625, 12.82421875, 15.232421875, 17.640625, 20.048828125, 22.45703125, 24.865234375, 27.2734375, 29.681640625, 32.08984375, 34.498046875, 36.90625, 39.314453125, 41.72265625, 44.130859375, 46.5390625, 48.947265625, 51.35546875, 53.763671875, 56.171875, 58.580078125, 60.98828125, 63.396484375, 65.8046875, 68.212890625, 70.62109375, 73.029296875, 75.4375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 12.0, 11.0, 11.0, 10.0, 12.0, 25.0, 17.0, 22.0, 22.0, 31.0, 32.0, 35.0, 43.0, 49.0, 34.0, 30.0, 48.0, 53.0, 54.0, 48.0, 44.0, 40.0, 31.0, 38.0, 33.0, 33.0, 23.0, 26.0, 23.0, 18.0, 15.0, 12.0, 6.0, 10.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.21875, -32.14990234375, -31.0810546875, -30.01220703125, -28.943359375, -27.87451171875, -26.8056640625, -25.73681640625, -24.66796875, -23.59912109375, -22.5302734375, -21.46142578125, -20.392578125, -19.32373046875, -18.2548828125, -17.18603515625, -16.1171875, -15.04833984375, -13.9794921875, -12.91064453125, -11.841796875, -10.77294921875, -9.7041015625, -8.63525390625, -7.56640625, -6.49755859375, -5.4287109375, -4.35986328125, -3.291015625, -2.22216796875, -1.1533203125, -0.08447265625, 0.984375, 2.05322265625, 3.1220703125, 4.19091796875, 5.259765625, 6.32861328125, 7.3974609375, 8.46630859375, 9.53515625, 10.60400390625, 11.6728515625, 12.74169921875, 13.810546875, 14.87939453125, 15.9482421875, 17.01708984375, 18.0859375, 19.15478515625, 20.2236328125, 21.29248046875, 22.361328125, 23.43017578125, 24.4990234375, 25.56787109375, 26.63671875, 27.70556640625, 28.7744140625, 29.84326171875, 30.912109375, 31.98095703125, 33.0498046875, 34.11865234375, 35.1875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 8.0, 9.0, 18.0, 23.0, 41.0, 64.0, 90.0, 162.0, 306.0, 598.0, 1132.0, 2551.0, 5989.0, 16365.0, 51166.0, 174203.0, 389398.0, 275591.0, 88247.0, 26425.0, 9109.0, 3530.0, 1636.0, 856.0, 429.0, 227.0, 135.0, 84.0, 59.0, 21.0, 24.0, 16.0, 11.0, 13.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.59375, -51.84912109375, -50.1044921875, -48.35986328125, -46.615234375, -44.87060546875, -43.1259765625, -41.38134765625, -39.63671875, -37.89208984375, -36.1474609375, -34.40283203125, -32.658203125, -30.91357421875, -29.1689453125, -27.42431640625, -25.6796875, -23.93505859375, -22.1904296875, -20.44580078125, -18.701171875, -16.95654296875, -15.2119140625, -13.46728515625, -11.72265625, -9.97802734375, -8.2333984375, -6.48876953125, -4.744140625, -2.99951171875, -1.2548828125, 0.48974609375, 2.234375, 3.97900390625, 5.7236328125, 7.46826171875, 9.212890625, 10.95751953125, 12.7021484375, 14.44677734375, 16.19140625, 17.93603515625, 19.6806640625, 21.42529296875, 23.169921875, 24.91455078125, 26.6591796875, 28.40380859375, 30.1484375, 31.89306640625, 33.6376953125, 35.38232421875, 37.126953125, 38.87158203125, 40.6162109375, 42.36083984375, 44.10546875, 45.85009765625, 47.5947265625, 49.33935546875, 51.083984375, 52.82861328125, 54.5732421875, 56.31787109375, 58.0625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 8.0, 13.0, 21.0, 16.0, 38.0, 30.0, 42.0, 55.0, 56.0, 73.0, 94.0, 88.0, 82.0, 72.0, 63.0, 35.0, 34.0, 39.0, 23.0, 18.0, 16.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006748199462890625, -0.006529808044433594, -0.0063114166259765625, -0.006093025207519531, -0.0058746337890625, -0.005656242370605469, -0.0054378509521484375, -0.005219459533691406, -0.005001068115234375, -0.004782676696777344, -0.0045642852783203125, -0.004345893859863281, -0.00412750244140625, -0.003909111022949219, -0.0036907196044921875, -0.0034723281860351562, -0.003253936767578125, -0.0030355453491210938, -0.0028171539306640625, -0.0025987625122070312, -0.00238037109375, -0.0021619796752929688, -0.0019435882568359375, -0.0017251968383789062, -0.001506805419921875, -0.0012884140014648438, -0.0010700225830078125, -0.0008516311645507812, -0.00063323974609375, -0.00041484832763671875, -0.0001964569091796875, 2.193450927734375e-05, 0.000240325927734375, 0.00045871734619140625, 0.0006771087646484375, 0.0008955001831054688, 0.0011138916015625, 0.0013322830200195312, 0.0015506744384765625, 0.0017690658569335938, 0.001987457275390625, 0.0022058486938476562, 0.0024242401123046875, 0.0026426315307617188, 0.00286102294921875, 0.0030794143676757812, 0.0032978057861328125, 0.0035161972045898438, 0.003734588623046875, 0.003952980041503906, 0.0041713714599609375, 0.004389762878417969, 0.004608154296875, 0.004826545715332031, 0.0050449371337890625, 0.005263328552246094, 0.005481719970703125, 0.005700111389160156, 0.0059185028076171875, 0.006136894226074219, 0.00635528564453125, 0.006573677062988281, 0.0067920684814453125, 0.007010459899902344, 0.007228851318359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 12.0, 2.0, 20.0, 30.0, 38.0, 69.0, 159.0, 272.0, 550.0, 1392.0, 4003.0, 17021.0, 131228.0, 643140.0, 217183.0, 25020.0, 5258.0, 1725.0, 700.0, 338.0, 155.0, 85.0, 45.0, 31.0, 24.0, 14.0, 9.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.625, -90.56640625, -87.5078125, -84.44921875, -81.390625, -78.33203125, -75.2734375, -72.21484375, -69.15625, -66.09765625, -63.0390625, -59.98046875, -56.921875, -53.86328125, -50.8046875, -47.74609375, -44.6875, -41.62890625, -38.5703125, -35.51171875, -32.453125, -29.39453125, -26.3359375, -23.27734375, -20.21875, -17.16015625, -14.1015625, -11.04296875, -7.984375, -4.92578125, -1.8671875, 1.19140625, 4.25, 7.30859375, 10.3671875, 13.42578125, 16.484375, 19.54296875, 22.6015625, 25.66015625, 28.71875, 31.77734375, 34.8359375, 37.89453125, 40.953125, 44.01171875, 47.0703125, 50.12890625, 53.1875, 56.24609375, 59.3046875, 62.36328125, 65.421875, 68.48046875, 71.5390625, 74.59765625, 77.65625, 80.71484375, 83.7734375, 86.83203125, 89.890625, 92.94921875, 96.0078125, 99.06640625, 102.125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 19.0, 36.0, 46.0, 34.0, 68.0, 79.0, 98.0, 131.0, 97.0, 89.0, 76.0, 56.0, 58.0, 21.0, 26.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.141357421875, -23.92333984375, -22.705322265625, -21.4873046875, -20.269287109375, -19.05126953125, -17.833251953125, -16.615234375, -15.397216796875, -14.17919921875, -12.961181640625, -11.7431640625, -10.525146484375, -9.30712890625, -8.089111328125, -6.87109375, -5.653076171875, -4.43505859375, -3.217041015625, -1.9990234375, -0.781005859375, 0.43701171875, 1.655029296875, 2.873046875, 4.091064453125, 5.30908203125, 6.527099609375, 7.7451171875, 8.963134765625, 10.18115234375, 11.399169921875, 12.6171875, 13.835205078125, 15.05322265625, 16.271240234375, 17.4892578125, 18.707275390625, 19.92529296875, 21.143310546875, 22.361328125, 23.579345703125, 24.79736328125, 26.015380859375, 27.2333984375, 28.451416015625, 29.66943359375, 30.887451171875, 32.10546875, 33.323486328125, 34.54150390625, 35.759521484375, 36.9775390625, 38.195556640625, 39.41357421875, 40.631591796875, 41.849609375, 43.067626953125, 44.28564453125, 45.503662109375, 46.7216796875, 47.939697265625, 49.15771484375, 50.375732421875, 51.59375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 10.0, 17.0, 35.0, 104.0, 213.0, 250.0, 198.0, 100.0, 39.0, 21.0, 6.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-660.50146484375, -626.5277099609375, -592.553955078125, -558.5802001953125, -524.6065063476562, -490.63275146484375, -456.65899658203125, -422.68524169921875, -388.7115173339844, -354.7377624511719, -320.7640380859375, -286.790283203125, -252.81654357910156, -218.84280395507812, -184.86904907226562, -150.8953094482422, -116.92156982421875, -82.94783020019531, -48.974082946777344, -15.000335693359375, 18.973403930664062, 52.9471435546875, 86.9208984375, 120.89463806152344, 154.86837768554688, 188.8421173095703, 222.81585693359375, 256.78961181640625, 290.76336669921875, 324.7370910644531, 358.7108459472656, 392.6845703125, 426.6583251953125, 460.632080078125, 494.6058044433594, 528.57958984375, 562.5532836914062, 596.5270385742188, 630.5007934570312, 664.4745483398438, 698.4482421875, 732.4219970703125, 766.395751953125, 800.3695068359375, 834.3432006835938, 868.3169555664062, 902.2907104492188, 936.2644653320312, 970.2382202148438, 1004.2119750976562, 1038.1856689453125, 1072.159423828125, 1106.1331787109375, 1140.10693359375, 1174.0806884765625, 1208.054443359375, 1242.0281982421875, 1276.001953125, 1309.9757080078125, 1343.949462890625, 1377.9232177734375, 1411.89697265625, 1445.87060546875, 1479.8443603515625, 1513.818115234375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 13.0, 7.0, 12.0, 24.0, 15.0, 28.0, 36.0, 50.0, 51.0, 59.0, 70.0, 67.0, 65.0, 79.0, 76.0, 71.0, 44.0, 43.0, 40.0, 31.0, 22.0, 21.0, 23.0, 13.0, 5.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.781982421875, -314.1104431152344, -301.4389343261719, -288.76739501953125, -276.0958557128906, -263.42431640625, -250.7528076171875, -238.08126831054688, -225.4097442626953, -212.73822021484375, -200.06668090820312, -187.39515686035156, -174.7236328125, -162.05209350585938, -149.3805694580078, -136.70904541015625, -124.03750610351562, -111.36597442626953, -98.69444274902344, -86.02291870117188, -73.35138702392578, -60.67985534667969, -48.008331298828125, -35.33679962158203, -22.665267944335938, -9.993738174438477, 2.6777915954589844, 15.349319458007812, 28.020851135253906, 40.6923828125, 53.36390686035156, 66.03543853759766, 78.70697021484375, 91.37850189208984, 104.05003356933594, 116.7215576171875, 129.39309692382812, 142.0646209716797, 154.73614501953125, 167.40768432617188, 180.07920837402344, 192.750732421875, 205.42227172851562, 218.0937957763672, 230.76531982421875, 243.43685913085938, 256.1083984375, 268.7799072265625, 281.4514465332031, 294.12298583984375, 306.79449462890625, 319.4660339355469, 332.1375732421875, 344.80908203125, 357.4806213378906, 370.15216064453125, 382.82366943359375, 395.4952087402344, 408.1667175292969, 420.8382568359375, 433.5097961425781, 446.18133544921875, 458.85284423828125, 471.5243835449219, 484.1959228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 6.0, 3.0, 2.0, 11.0, 30.0, 31.0, 41.0, 71.0, 123.0, 334.0, 775.0, 2853.0, 15629.0, 195355.0, 3883129.0, 84709.0, 8657.0, 1557.0, 484.0, 188.0, 102.0, 69.0, 42.0, 25.0, 19.0, 10.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-403.0, -390.546875, -378.09375, -365.640625, -353.1875, -340.734375, -328.28125, -315.828125, -303.375, -290.921875, -278.46875, -266.015625, -253.5625, -241.109375, -228.65625, -216.203125, -203.75, -191.296875, -178.84375, -166.390625, -153.9375, -141.484375, -129.03125, -116.578125, -104.125, -91.671875, -79.21875, -66.765625, -54.3125, -41.859375, -29.40625, -16.953125, -4.5, 7.953125, 20.40625, 32.859375, 45.3125, 57.765625, 70.21875, 82.671875, 95.125, 107.578125, 120.03125, 132.484375, 144.9375, 157.390625, 169.84375, 182.296875, 194.75, 207.203125, 219.65625, 232.109375, 244.5625, 257.015625, 269.46875, 281.921875, 294.375, 306.828125, 319.28125, 331.734375, 344.1875, 356.640625, 369.09375, 381.546875, 394.0]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 2.0, 8.0, 13.0, 25.0, 26.0, 29.0, 26.0, 50.0, 40.0, 53.0, 65.0, 59.0, 77.0, 78.0, 72.0, 84.0, 59.0, 52.0, 26.0, 36.0, 34.0, 24.0, 14.0, 13.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.703125, -10.36767578125, -10.0322265625, -9.69677734375, -9.361328125, -9.02587890625, -8.6904296875, -8.35498046875, -8.01953125, -7.68408203125, -7.3486328125, -7.01318359375, -6.677734375, -6.34228515625, -6.0068359375, -5.67138671875, -5.3359375, -5.00048828125, -4.6650390625, -4.32958984375, -3.994140625, -3.65869140625, -3.3232421875, -2.98779296875, -2.65234375, -2.31689453125, -1.9814453125, -1.64599609375, -1.310546875, -0.97509765625, -0.6396484375, -0.30419921875, 0.03125, 0.36669921875, 0.7021484375, 1.03759765625, 1.373046875, 1.70849609375, 2.0439453125, 2.37939453125, 2.71484375, 3.05029296875, 3.3857421875, 3.72119140625, 4.056640625, 4.39208984375, 4.7275390625, 5.06298828125, 5.3984375, 5.73388671875, 6.0693359375, 6.40478515625, 6.740234375, 7.07568359375, 7.4111328125, 7.74658203125, 8.08203125, 8.41748046875, 8.7529296875, 9.08837890625, 9.423828125, 9.75927734375, 10.0947265625, 10.43017578125, 10.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 8.0, 6.0, 16.0, 18.0, 19.0, 29.0, 28.0, 71.0, 108.0, 241.0, 688.0, 2519.0, 11104.0, 66845.0, 844334.0, 3128244.0, 117032.0, 17486.0, 3794.0, 998.0, 334.0, 147.0, 77.0, 45.0, 28.0, 21.0, 16.0, 11.0, 3.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.5, -256.38671875, -247.2734375, -238.16015625, -229.046875, -219.93359375, -210.8203125, -201.70703125, -192.59375, -183.48046875, -174.3671875, -165.25390625, -156.140625, -147.02734375, -137.9140625, -128.80078125, -119.6875, -110.57421875, -101.4609375, -92.34765625, -83.234375, -74.12109375, -65.0078125, -55.89453125, -46.78125, -37.66796875, -28.5546875, -19.44140625, -10.328125, -1.21484375, 7.8984375, 17.01171875, 26.125, 35.23828125, 44.3515625, 53.46484375, 62.578125, 71.69140625, 80.8046875, 89.91796875, 99.03125, 108.14453125, 117.2578125, 126.37109375, 135.484375, 144.59765625, 153.7109375, 162.82421875, 171.9375, 181.05078125, 190.1640625, 199.27734375, 208.390625, 217.50390625, 226.6171875, 235.73046875, 244.84375, 253.95703125, 263.0703125, 272.18359375, 281.296875, 290.41015625, 299.5234375, 308.63671875, 317.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 8.0, 14.0, 7.0, 13.0, 19.0, 31.0, 38.0, 46.0, 62.0, 65.0, 114.0, 161.0, 286.0, 615.0, 1377.0, 405.0, 238.0, 165.0, 95.0, 81.0, 49.0, 29.0, 31.0, 32.0, 18.0, 17.0, 17.0, 7.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-35.25, -34.30517578125, -33.3603515625, -32.41552734375, -31.470703125, -30.52587890625, -29.5810546875, -28.63623046875, -27.69140625, -26.74658203125, -25.8017578125, -24.85693359375, -23.912109375, -22.96728515625, -22.0224609375, -21.07763671875, -20.1328125, -19.18798828125, -18.2431640625, -17.29833984375, -16.353515625, -15.40869140625, -14.4638671875, -13.51904296875, -12.57421875, -11.62939453125, -10.6845703125, -9.73974609375, -8.794921875, -7.85009765625, -6.9052734375, -5.96044921875, -5.015625, -4.07080078125, -3.1259765625, -2.18115234375, -1.236328125, -0.29150390625, 0.6533203125, 1.59814453125, 2.54296875, 3.48779296875, 4.4326171875, 5.37744140625, 6.322265625, 7.26708984375, 8.2119140625, 9.15673828125, 10.1015625, 11.04638671875, 11.9912109375, 12.93603515625, 13.880859375, 14.82568359375, 15.7705078125, 16.71533203125, 17.66015625, 18.60498046875, 19.5498046875, 20.49462890625, 21.439453125, 22.38427734375, 23.3291015625, 24.27392578125, 25.21875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 12.0, 35.0, 32.0, 72.0, 127.0, 171.0, 172.0, 144.0, 106.0, 51.0, 31.0, 21.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.3853759765625, -251.46664428710938, -239.54791259765625, -227.62918090820312, -215.71044921875, -203.79171752929688, -191.87298583984375, -179.95425415039062, -168.0355224609375, -156.11679077148438, -144.19805908203125, -132.27932739257812, -120.360595703125, -108.44186401367188, -96.52313232421875, -84.60440063476562, -72.6856689453125, -60.766937255859375, -48.84820556640625, -36.929473876953125, -25.0107421875, -13.092010498046875, -1.17327880859375, 10.745452880859375, 22.6641845703125, 34.582916259765625, 46.50164794921875, 58.420379638671875, 70.339111328125, 82.25784301757812, 94.17657470703125, 106.09530639648438, 118.0140380859375, 129.93276977539062, 141.85150146484375, 153.77023315429688, 165.68896484375, 177.60769653320312, 189.52642822265625, 201.44515991210938, 213.3638916015625, 225.28262329101562, 237.20135498046875, 249.12008666992188, 261.038818359375, 272.9575500488281, 284.87628173828125, 296.7950134277344, 308.7137451171875, 320.6324768066406, 332.55120849609375, 344.4699401855469, 356.388671875, 368.3074035644531, 380.22613525390625, 392.1448669433594, 404.0635986328125, 415.9823303222656, 427.90106201171875, 439.8197937011719, 451.738525390625, 463.6572570800781, 475.57598876953125, 487.4947204589844, 499.4134521484375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 0.0, 5.0, 10.0, 5.0, 9.0, 4.0, 17.0, 14.0, 9.0, 12.0, 14.0, 22.0, 22.0, 27.0, 31.0, 23.0, 34.0, 36.0, 33.0, 42.0, 44.0, 40.0, 39.0, 46.0, 49.0, 40.0, 33.0, 48.0, 33.0, 26.0, 19.0, 22.0, 23.0, 26.0, 22.0, 17.0, 18.0, 9.0, 17.0, 9.0, 9.0, 8.0, 4.0, 9.0, 5.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-131.38462829589844, -127.5765609741211, -123.76848602294922, -119.96041870117188, -116.15234375, -112.34427642822266, -108.53620910644531, -104.72813415527344, -100.92005920410156, -97.11199188232422, -93.30391693115234, -89.495849609375, -85.68777465820312, -81.87970733642578, -78.07164001464844, -74.26356506347656, -70.45549774169922, -66.64743041992188, -62.83935546875, -59.031288146972656, -55.22321319580078, -51.41514587402344, -47.60707473754883, -43.79900360107422, -39.99093246459961, -36.182861328125, -32.37479019165039, -28.566720962524414, -24.758649826049805, -20.950578689575195, -17.14250946044922, -13.33443832397461, -9.5263671875, -5.718296527862549, -1.9102258682250977, 1.8978443145751953, 5.705915451049805, 9.513986587524414, 13.32205581665039, 17.130126953125, 20.93819808959961, 24.74626922607422, 28.554340362548828, 32.36241149902344, 36.17047882080078, 39.978553771972656, 43.78662109375, 47.59469223022461, 51.40276336669922, 55.21083450317383, 59.01890563964844, 62.82697296142578, 66.63504791259766, 70.443115234375, 74.25119018554688, 78.05925750732422, 81.86732482910156, 85.6753921508789, 89.48346710205078, 93.29153442382812, 97.099609375, 100.90767669677734, 104.71574401855469, 108.52381896972656, 112.33189392089844]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 12.0, 13.0, 16.0, 22.0, 38.0, 46.0, 72.0, 114.0, 183.0, 277.0, 435.0, 750.0, 1193.0, 2356.0, 5194.0, 12774.0, 34988.0, 95807.0, 235310.0, 348744.0, 190333.0, 73998.0, 26785.0, 10112.0, 4205.0, 1957.0, 1076.0, 611.0, 374.0, 236.0, 148.0, 123.0, 83.0, 49.0, 40.0, 20.0, 13.0, 13.0, 10.0, 4.0, 8.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-92.0, -89.2431640625, -86.486328125, -83.7294921875, -80.97265625, -78.2158203125, -75.458984375, -72.7021484375, -69.9453125, -67.1884765625, -64.431640625, -61.6748046875, -58.91796875, -56.1611328125, -53.404296875, -50.6474609375, -47.890625, -45.1337890625, -42.376953125, -39.6201171875, -36.86328125, -34.1064453125, -31.349609375, -28.5927734375, -25.8359375, -23.0791015625, -20.322265625, -17.5654296875, -14.80859375, -12.0517578125, -9.294921875, -6.5380859375, -3.78125, -1.0244140625, 1.732421875, 4.4892578125, 7.24609375, 10.0029296875, 12.759765625, 15.5166015625, 18.2734375, 21.0302734375, 23.787109375, 26.5439453125, 29.30078125, 32.0576171875, 34.814453125, 37.5712890625, 40.328125, 43.0849609375, 45.841796875, 48.5986328125, 51.35546875, 54.1123046875, 56.869140625, 59.6259765625, 62.3828125, 65.1396484375, 67.896484375, 70.6533203125, 73.41015625, 76.1669921875, 78.923828125, 81.6806640625, 84.4375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 6.0, 12.0, 20.0, 33.0, 35.0, 48.0, 60.0, 59.0, 72.0, 68.0, 69.0, 76.0, 66.0, 59.0, 64.0, 63.0, 50.0, 35.0, 21.0, 25.0, 10.0, 13.0, 13.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.3125, -12.897705078125, -12.48291015625, -12.068115234375, -11.6533203125, -11.238525390625, -10.82373046875, -10.408935546875, -9.994140625, -9.579345703125, -9.16455078125, -8.749755859375, -8.3349609375, -7.920166015625, -7.50537109375, -7.090576171875, -6.67578125, -6.260986328125, -5.84619140625, -5.431396484375, -5.0166015625, -4.601806640625, -4.18701171875, -3.772216796875, -3.357421875, -2.942626953125, -2.52783203125, -2.113037109375, -1.6982421875, -1.283447265625, -0.86865234375, -0.453857421875, -0.0390625, 0.375732421875, 0.79052734375, 1.205322265625, 1.6201171875, 2.034912109375, 2.44970703125, 2.864501953125, 3.279296875, 3.694091796875, 4.10888671875, 4.523681640625, 4.9384765625, 5.353271484375, 5.76806640625, 6.182861328125, 6.59765625, 7.012451171875, 7.42724609375, 7.842041015625, 8.2568359375, 8.671630859375, 9.08642578125, 9.501220703125, 9.916015625, 10.330810546875, 10.74560546875, 11.160400390625, 11.5751953125, 11.989990234375, 12.40478515625, 12.819580078125, 13.234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 10.0, 9.0, 14.0, 21.0, 28.0, 36.0, 59.0, 77.0, 131.0, 203.0, 284.0, 457.0, 796.0, 1291.0, 2594.0, 5555.0, 13778.0, 40010.0, 128445.0, 364726.0, 325798.0, 108152.0, 34084.0, 11928.0, 4642.0, 2244.0, 1215.0, 696.0, 455.0, 260.0, 160.0, 120.0, 84.0, 44.0, 38.0, 30.0, 25.0, 12.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.6875, -107.326171875, -103.96484375, -100.603515625, -97.2421875, -93.880859375, -90.51953125, -87.158203125, -83.796875, -80.435546875, -77.07421875, -73.712890625, -70.3515625, -66.990234375, -63.62890625, -60.267578125, -56.90625, -53.544921875, -50.18359375, -46.822265625, -43.4609375, -40.099609375, -36.73828125, -33.376953125, -30.015625, -26.654296875, -23.29296875, -19.931640625, -16.5703125, -13.208984375, -9.84765625, -6.486328125, -3.125, 0.236328125, 3.59765625, 6.958984375, 10.3203125, 13.681640625, 17.04296875, 20.404296875, 23.765625, 27.126953125, 30.48828125, 33.849609375, 37.2109375, 40.572265625, 43.93359375, 47.294921875, 50.65625, 54.017578125, 57.37890625, 60.740234375, 64.1015625, 67.462890625, 70.82421875, 74.185546875, 77.546875, 80.908203125, 84.26953125, 87.630859375, 90.9921875, 94.353515625, 97.71484375, 101.076171875, 104.4375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 9.0, 12.0, 15.0, 25.0, 31.0, 31.0, 42.0, 46.0, 56.0, 69.0, 60.0, 62.0, 56.0, 80.0, 76.0, 55.0, 40.0, 43.0, 43.0, 31.0, 23.0, 18.0, 12.0, 8.0, 13.0, 7.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.5625, -68.2412109375, -65.919921875, -63.5986328125, -61.27734375, -58.9560546875, -56.634765625, -54.3134765625, -51.9921875, -49.6708984375, -47.349609375, -45.0283203125, -42.70703125, -40.3857421875, -38.064453125, -35.7431640625, -33.421875, -31.1005859375, -28.779296875, -26.4580078125, -24.13671875, -21.8154296875, -19.494140625, -17.1728515625, -14.8515625, -12.5302734375, -10.208984375, -7.8876953125, -5.56640625, -3.2451171875, -0.923828125, 1.3974609375, 3.71875, 6.0400390625, 8.361328125, 10.6826171875, 13.00390625, 15.3251953125, 17.646484375, 19.9677734375, 22.2890625, 24.6103515625, 26.931640625, 29.2529296875, 31.57421875, 33.8955078125, 36.216796875, 38.5380859375, 40.859375, 43.1806640625, 45.501953125, 47.8232421875, 50.14453125, 52.4658203125, 54.787109375, 57.1083984375, 59.4296875, 61.7509765625, 64.072265625, 66.3935546875, 68.71484375, 71.0361328125, 73.357421875, 75.6787109375, 78.0]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 8.0, 14.0, 11.0, 22.0, 31.0, 38.0, 58.0, 99.0, 118.0, 235.0, 405.0, 817.0, 1786.0, 4739.0, 14709.0, 59008.0, 266596.0, 477273.0, 169412.0, 36898.0, 10028.0, 3339.0, 1326.0, 683.0, 369.0, 194.0, 127.0, 78.0, 42.0, 32.0, 20.0, 13.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.375, -43.65234375, -41.9296875, -40.20703125, -38.484375, -36.76171875, -35.0390625, -33.31640625, -31.59375, -29.87109375, -28.1484375, -26.42578125, -24.703125, -22.98046875, -21.2578125, -19.53515625, -17.8125, -16.08984375, -14.3671875, -12.64453125, -10.921875, -9.19921875, -7.4765625, -5.75390625, -4.03125, -2.30859375, -0.5859375, 1.13671875, 2.859375, 4.58203125, 6.3046875, 8.02734375, 9.75, 11.47265625, 13.1953125, 14.91796875, 16.640625, 18.36328125, 20.0859375, 21.80859375, 23.53125, 25.25390625, 26.9765625, 28.69921875, 30.421875, 32.14453125, 33.8671875, 35.58984375, 37.3125, 39.03515625, 40.7578125, 42.48046875, 44.203125, 45.92578125, 47.6484375, 49.37109375, 51.09375, 52.81640625, 54.5390625, 56.26171875, 57.984375, 59.70703125, 61.4296875, 63.15234375, 64.875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 13.0, 15.0, 22.0, 23.0, 21.0, 38.0, 48.0, 74.0, 64.0, 105.0, 100.0, 90.0, 84.0, 64.0, 41.0, 32.0, 32.0, 25.0, 19.0, 16.0, 14.0, 11.0, 12.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00801849365234375, -0.007793307304382324, -0.0075681209564208984, -0.007342934608459473, -0.007117748260498047, -0.006892561912536621, -0.006667375564575195, -0.0064421892166137695, -0.006217002868652344, -0.005991816520690918, -0.005766630172729492, -0.005541443824768066, -0.005316257476806641, -0.005091071128845215, -0.004865884780883789, -0.004640698432922363, -0.0044155120849609375, -0.004190325736999512, -0.003965139389038086, -0.00373995304107666, -0.0035147666931152344, -0.0032895803451538086, -0.003064393997192383, -0.002839207649230957, -0.0026140213012695312, -0.0023888349533081055, -0.0021636486053466797, -0.001938462257385254, -0.0017132759094238281, -0.0014880895614624023, -0.0012629032135009766, -0.0010377168655395508, -0.000812530517578125, -0.0005873441696166992, -0.00036215782165527344, -0.00013697147369384766, 8.821487426757812e-05, 0.0003134012222290039, 0.0005385875701904297, 0.0007637739181518555, 0.0009889602661132812, 0.001214146614074707, 0.0014393329620361328, 0.0016645193099975586, 0.0018897056579589844, 0.00211489200592041, 0.002340078353881836, 0.0025652647018432617, 0.0027904510498046875, 0.0030156373977661133, 0.003240823745727539, 0.003466010093688965, 0.0036911964416503906, 0.003916382789611816, 0.004141569137573242, 0.004366755485534668, 0.004591941833496094, 0.0048171281814575195, 0.005042314529418945, 0.005267500877380371, 0.005492687225341797, 0.005717873573303223, 0.0059430599212646484, 0.006168246269226074, 0.0063934326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 16.0, 12.0, 16.0, 25.0, 37.0, 39.0, 91.0, 130.0, 189.0, 306.0, 521.0, 930.0, 1814.0, 3896.0, 9715.0, 28770.0, 106251.0, 359589.0, 373067.0, 114101.0, 30543.0, 10177.0, 3995.0, 1884.0, 965.0, 545.0, 336.0, 196.0, 123.0, 82.0, 52.0, 34.0, 29.0, 21.0, 7.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.90625, -52.3671875, -50.828125, -49.2890625, -47.75, -46.2109375, -44.671875, -43.1328125, -41.59375, -40.0546875, -38.515625, -36.9765625, -35.4375, -33.8984375, -32.359375, -30.8203125, -29.28125, -27.7421875, -26.203125, -24.6640625, -23.125, -21.5859375, -20.046875, -18.5078125, -16.96875, -15.4296875, -13.890625, -12.3515625, -10.8125, -9.2734375, -7.734375, -6.1953125, -4.65625, -3.1171875, -1.578125, -0.0390625, 1.5, 3.0390625, 4.578125, 6.1171875, 7.65625, 9.1953125, 10.734375, 12.2734375, 13.8125, 15.3515625, 16.890625, 18.4296875, 19.96875, 21.5078125, 23.046875, 24.5859375, 26.125, 27.6640625, 29.203125, 30.7421875, 32.28125, 33.8203125, 35.359375, 36.8984375, 38.4375, 39.9765625, 41.515625, 43.0546875, 44.59375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 7.0, 8.0, 6.0, 11.0, 5.0, 10.0, 19.0, 21.0, 31.0, 50.0, 44.0, 59.0, 66.0, 69.0, 70.0, 72.0, 76.0, 56.0, 54.0, 44.0, 53.0, 41.0, 19.0, 31.0, 25.0, 12.0, 10.0, 8.0, 8.0, 5.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-30.5625, -29.804443359375, -29.04638671875, -28.288330078125, -27.5302734375, -26.772216796875, -26.01416015625, -25.256103515625, -24.498046875, -23.739990234375, -22.98193359375, -22.223876953125, -21.4658203125, -20.707763671875, -19.94970703125, -19.191650390625, -18.43359375, -17.675537109375, -16.91748046875, -16.159423828125, -15.4013671875, -14.643310546875, -13.88525390625, -13.127197265625, -12.369140625, -11.611083984375, -10.85302734375, -10.094970703125, -9.3369140625, -8.578857421875, -7.82080078125, -7.062744140625, -6.3046875, -5.546630859375, -4.78857421875, -4.030517578125, -3.2724609375, -2.514404296875, -1.75634765625, -0.998291015625, -0.240234375, 0.517822265625, 1.27587890625, 2.033935546875, 2.7919921875, 3.550048828125, 4.30810546875, 5.066162109375, 5.82421875, 6.582275390625, 7.34033203125, 8.098388671875, 8.8564453125, 9.614501953125, 10.37255859375, 11.130615234375, 11.888671875, 12.646728515625, 13.40478515625, 14.162841796875, 14.9208984375, 15.678955078125, 16.43701171875, 17.195068359375, 17.953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 14.0, 26.0, 51.0, 73.0, 96.0, 137.0, 141.0, 132.0, 109.0, 75.0, 44.0, 35.0, 21.0, 7.0, 9.0, 6.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.4290161132812, -618.9644165039062, -596.4998168945312, -574.0352783203125, -551.5706787109375, -529.1060791015625, -506.6414794921875, -484.1768798828125, -461.7123107910156, -439.2477111816406, -416.78314208984375, -394.31854248046875, -371.85394287109375, -349.3893737792969, -326.9247741699219, -304.460205078125, -281.99560546875, -259.531005859375, -237.06643676757812, -214.60183715820312, -192.1372528076172, -169.67266845703125, -147.20806884765625, -124.74348449707031, -102.27890014648438, -79.81431579589844, -57.34972381591797, -34.8851318359375, -12.420547485351562, 10.044036865234375, 32.508636474609375, 54.97322082519531, 77.4378662109375, 99.90245056152344, 122.3670425415039, 144.83163452148438, 167.2962188720703, 189.76080322265625, 212.22540283203125, 234.6899871826172, 257.1545715332031, 279.6191711425781, 302.083740234375, 324.54833984375, 347.012939453125, 369.4775085449219, 391.9421081542969, 414.40667724609375, 436.87127685546875, 459.33587646484375, 481.8004455566406, 504.2650451660156, 526.7296142578125, 549.1942138671875, 571.6588134765625, 594.1234130859375, 616.5880126953125, 639.0526123046875, 661.5172119140625, 683.9818115234375, 706.4463500976562, 728.9109497070312, 751.3755493164062, 773.8401489257812, 796.3046875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 10.0, 10.0, 8.0, 10.0, 22.0, 20.0, 19.0, 26.0, 19.0, 21.0, 30.0, 30.0, 48.0, 36.0, 39.0, 44.0, 56.0, 49.0, 51.0, 56.0, 49.0, 36.0, 37.0, 29.0, 30.0, 41.0, 27.0, 25.0, 17.0, 19.0, 15.0, 10.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-411.755126953125, -399.9296569824219, -388.1042175292969, -376.27874755859375, -364.4532775878906, -352.6278076171875, -340.8023681640625, -328.9768981933594, -317.15142822265625, -305.3259582519531, -293.5005187988281, -281.675048828125, -269.8495788574219, -258.02410888671875, -246.19866943359375, -234.37319946289062, -222.54774475097656, -210.7222900390625, -198.89682006835938, -187.0713653564453, -175.2458953857422, -163.42044067382812, -151.594970703125, -139.76951599121094, -127.94405364990234, -116.11859130859375, -104.29312896728516, -92.46766662597656, -80.6422119140625, -68.81674194335938, -56.99128723144531, -45.16582489013672, -33.340362548828125, -21.51490020751953, -9.68943977355957, 2.1360206604003906, 13.961483001708984, 25.786945343017578, 37.612403869628906, 49.4378662109375, 61.263328552246094, 73.08879089355469, 84.91425323486328, 96.73971557617188, 108.56517028808594, 120.39064025878906, 132.21609497070312, 144.04156494140625, 155.8670196533203, 167.69247436523438, 179.5179443359375, 191.34339904785156, 203.1688690185547, 214.99432373046875, 226.81979370117188, 238.64524841308594, 250.470703125, 262.2961730957031, 274.1216125488281, 285.94708251953125, 297.7725524902344, 309.5980224609375, 321.4234619140625, 333.2489318847656, 345.07440185546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 13.0, 28.0, 25.0, 64.0, 123.0, 283.0, 862.0, 3989.0, 32835.0, 3772369.0, 363993.0, 16077.0, 2495.0, 599.0, 216.0, 111.0, 63.0, 62.0, 27.0, 18.0, 10.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.75, -326.1328125, -313.515625, -300.8984375, -288.28125, -275.6640625, -263.046875, -250.4296875, -237.8125, -225.1953125, -212.578125, -199.9609375, -187.34375, -174.7265625, -162.109375, -149.4921875, -136.875, -124.2578125, -111.640625, -99.0234375, -86.40625, -73.7890625, -61.171875, -48.5546875, -35.9375, -23.3203125, -10.703125, 1.9140625, 14.53125, 27.1484375, 39.765625, 52.3828125, 65.0, 77.6171875, 90.234375, 102.8515625, 115.46875, 128.0859375, 140.703125, 153.3203125, 165.9375, 178.5546875, 191.171875, 203.7890625, 216.40625, 229.0234375, 241.640625, 254.2578125, 266.875, 279.4921875, 292.109375, 304.7265625, 317.34375, 329.9609375, 342.578125, 355.1953125, 367.8125, 380.4296875, 393.046875, 405.6640625, 418.28125, 430.8984375, 443.515625, 456.1328125, 468.75]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 21.0, 18.0, 33.0, 59.0, 63.0, 71.0, 67.0, 103.0, 92.0, 95.0, 91.0, 73.0, 46.0, 47.0, 36.0, 34.0, 17.0, 10.0, 11.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.188232421875, -16.56396484375, -15.939697265625, -15.3154296875, -14.691162109375, -14.06689453125, -13.442626953125, -12.818359375, -12.194091796875, -11.56982421875, -10.945556640625, -10.3212890625, -9.697021484375, -9.07275390625, -8.448486328125, -7.82421875, -7.199951171875, -6.57568359375, -5.951416015625, -5.3271484375, -4.702880859375, -4.07861328125, -3.454345703125, -2.830078125, -2.205810546875, -1.58154296875, -0.957275390625, -0.3330078125, 0.291259765625, 0.91552734375, 1.539794921875, 2.1640625, 2.788330078125, 3.41259765625, 4.036865234375, 4.6611328125, 5.285400390625, 5.90966796875, 6.533935546875, 7.158203125, 7.782470703125, 8.40673828125, 9.031005859375, 9.6552734375, 10.279541015625, 10.90380859375, 11.528076171875, 12.15234375, 12.776611328125, 13.40087890625, 14.025146484375, 14.6494140625, 15.273681640625, 15.89794921875, 16.522216796875, 17.146484375, 17.770751953125, 18.39501953125, 19.019287109375, 19.6435546875, 20.267822265625, 20.89208984375, 21.516357421875, 22.140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 12.0, 10.0, 33.0, 55.0, 84.0, 125.0, 184.0, 432.0, 759.0, 1523.0, 3455.0, 8292.0, 22839.0, 79408.0, 486297.0, 3275479.0, 237576.0, 50505.0, 15829.0, 6071.0, 2624.0, 1245.0, 607.0, 340.0, 199.0, 117.0, 68.0, 38.0, 13.0, 17.0, 13.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.125, -163.228515625, -158.33203125, -153.435546875, -148.5390625, -143.642578125, -138.74609375, -133.849609375, -128.953125, -124.056640625, -119.16015625, -114.263671875, -109.3671875, -104.470703125, -99.57421875, -94.677734375, -89.78125, -84.884765625, -79.98828125, -75.091796875, -70.1953125, -65.298828125, -60.40234375, -55.505859375, -50.609375, -45.712890625, -40.81640625, -35.919921875, -31.0234375, -26.126953125, -21.23046875, -16.333984375, -11.4375, -6.541015625, -1.64453125, 3.251953125, 8.1484375, 13.044921875, 17.94140625, 22.837890625, 27.734375, 32.630859375, 37.52734375, 42.423828125, 47.3203125, 52.216796875, 57.11328125, 62.009765625, 66.90625, 71.802734375, 76.69921875, 81.595703125, 86.4921875, 91.388671875, 96.28515625, 101.181640625, 106.078125, 110.974609375, 115.87109375, 120.767578125, 125.6640625, 130.560546875, 135.45703125, 140.353515625, 145.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 8.0, 5.0, 14.0, 10.0, 15.0, 15.0, 31.0, 38.0, 48.0, 93.0, 129.0, 238.0, 540.0, 1729.0, 533.0, 245.0, 111.0, 91.0, 60.0, 22.0, 30.0, 25.0, 10.0, 4.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -31.91943359375, -30.7138671875, -29.50830078125, -28.302734375, -27.09716796875, -25.8916015625, -24.68603515625, -23.48046875, -22.27490234375, -21.0693359375, -19.86376953125, -18.658203125, -17.45263671875, -16.2470703125, -15.04150390625, -13.8359375, -12.63037109375, -11.4248046875, -10.21923828125, -9.013671875, -7.80810546875, -6.6025390625, -5.39697265625, -4.19140625, -2.98583984375, -1.7802734375, -0.57470703125, 0.630859375, 1.83642578125, 3.0419921875, 4.24755859375, 5.453125, 6.65869140625, 7.8642578125, 9.06982421875, 10.275390625, 11.48095703125, 12.6865234375, 13.89208984375, 15.09765625, 16.30322265625, 17.5087890625, 18.71435546875, 19.919921875, 21.12548828125, 22.3310546875, 23.53662109375, 24.7421875, 25.94775390625, 27.1533203125, 28.35888671875, 29.564453125, 30.77001953125, 31.9755859375, 33.18115234375, 34.38671875, 35.59228515625, 36.7978515625, 38.00341796875, 39.208984375, 40.41455078125, 41.6201171875, 42.82568359375, 44.03125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 10.0, 8.0, 28.0, 51.0, 50.0, 72.0, 105.0, 127.0, 123.0, 114.0, 84.0, 81.0, 48.0, 31.0, 20.0, 16.0, 8.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.4905548095703, -242.75283813476562, -235.01512145996094, -227.2773895263672, -219.5396728515625, -211.8019561767578, -204.06423950195312, -196.32650756835938, -188.5887908935547, -180.85107421875, -173.1133575439453, -165.37562561035156, -157.63790893554688, -149.9001922607422, -142.1624755859375, -134.42474365234375, -126.6870346069336, -118.9493179321289, -111.21159362792969, -103.473876953125, -95.73615264892578, -87.9984359741211, -80.26071166992188, -72.52299499511719, -64.7852783203125, -57.04755783081055, -49.309837341308594, -41.572120666503906, -33.83439636230469, -26.0966796875, -18.358959197998047, -10.621238708496094, -2.883514404296875, 4.85420560836792, 12.591925621032715, 20.32964515686035, 28.067365646362305, 35.805084228515625, 43.54280471801758, 51.28052520751953, 59.018245697021484, 66.75596618652344, 74.49368286132812, 82.23140716552734, 89.96912384033203, 97.70684814453125, 105.44456481933594, 113.18228149414062, 120.92000579833984, 128.65773010253906, 136.39544677734375, 144.13316345214844, 151.87088012695312, 159.60861206054688, 167.34632873535156, 175.08404541015625, 182.82176208496094, 190.55947875976562, 198.2971954345703, 206.03492736816406, 213.77264404296875, 221.51036071777344, 229.24807739257812, 236.98580932617188, 244.72352600097656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 4.0, 12.0, 12.0, 19.0, 18.0, 27.0, 25.0, 23.0, 32.0, 33.0, 31.0, 40.0, 34.0, 36.0, 53.0, 35.0, 43.0, 49.0, 53.0, 51.0, 44.0, 45.0, 25.0, 26.0, 42.0, 30.0, 21.0, 15.0, 19.0, 18.0, 17.0, 7.0, 8.0, 6.0, 3.0, 5.0, 5.0, 1.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-117.79442596435547, -114.21016693115234, -110.62590789794922, -107.04164123535156, -103.45738220214844, -99.87312316894531, -96.28886413574219, -92.70460510253906, -89.12034606933594, -85.53608703613281, -81.95182800292969, -78.36756896972656, -74.7833023071289, -71.19904327392578, -67.61478424072266, -64.03052520751953, -60.446258544921875, -56.86199951171875, -53.27773666381836, -49.693477630615234, -46.109214782714844, -42.52495574951172, -38.940696716308594, -35.35643768310547, -31.772174835205078, -28.18791389465332, -24.603652954101562, -21.019393920898438, -17.43513298034668, -13.850872039794922, -10.266613006591797, -6.682352066040039, -3.09808349609375, 0.4861769676208496, 4.070437431335449, 7.654697418212891, 11.238958358764648, 14.823219299316406, 18.40747833251953, 21.99173927307129, 25.576000213623047, 29.160261154174805, 32.74452209472656, 36.32878112792969, 39.91304016113281, 43.4973030090332, 47.08156204223633, 50.66582489013672, 54.250083923339844, 57.83434295654297, 61.41860580444336, 65.00286865234375, 68.58712768554688, 72.17138671875, 75.75564575195312, 79.33990478515625, 82.92416381835938, 86.5084228515625, 90.09268188476562, 93.67694091796875, 97.2612075805664, 100.84546661376953, 104.42972564697266, 108.01398468017578, 111.59825134277344]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 14.0, 8.0, 31.0, 30.0, 33.0, 58.0, 90.0, 134.0, 161.0, 246.0, 376.0, 660.0, 1294.0, 2781.0, 6857.0, 18072.0, 52629.0, 152276.0, 348539.0, 289434.0, 112594.0, 38482.0, 13726.0, 5066.0, 2257.0, 1068.0, 582.0, 332.0, 218.0, 157.0, 94.0, 79.0, 56.0, 33.0, 28.0, 11.0, 8.0, 11.0, 9.0, 9.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-96.3125, -93.69921875, -91.0859375, -88.47265625, -85.859375, -83.24609375, -80.6328125, -78.01953125, -75.40625, -72.79296875, -70.1796875, -67.56640625, -64.953125, -62.33984375, -59.7265625, -57.11328125, -54.5, -51.88671875, -49.2734375, -46.66015625, -44.046875, -41.43359375, -38.8203125, -36.20703125, -33.59375, -30.98046875, -28.3671875, -25.75390625, -23.140625, -20.52734375, -17.9140625, -15.30078125, -12.6875, -10.07421875, -7.4609375, -4.84765625, -2.234375, 0.37890625, 2.9921875, 5.60546875, 8.21875, 10.83203125, 13.4453125, 16.05859375, 18.671875, 21.28515625, 23.8984375, 26.51171875, 29.125, 31.73828125, 34.3515625, 36.96484375, 39.578125, 42.19140625, 44.8046875, 47.41796875, 50.03125, 52.64453125, 55.2578125, 57.87109375, 60.484375, 63.09765625, 65.7109375, 68.32421875, 70.9375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 9.0, 20.0, 34.0, 37.0, 47.0, 62.0, 79.0, 83.0, 93.0, 102.0, 81.0, 88.0, 71.0, 52.0, 40.0, 39.0, 22.0, 17.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.106201171875, -17.46240234375, -16.818603515625, -16.1748046875, -15.531005859375, -14.88720703125, -14.243408203125, -13.599609375, -12.955810546875, -12.31201171875, -11.668212890625, -11.0244140625, -10.380615234375, -9.73681640625, -9.093017578125, -8.44921875, -7.805419921875, -7.16162109375, -6.517822265625, -5.8740234375, -5.230224609375, -4.58642578125, -3.942626953125, -3.298828125, -2.655029296875, -2.01123046875, -1.367431640625, -0.7236328125, -0.079833984375, 0.56396484375, 1.207763671875, 1.8515625, 2.495361328125, 3.13916015625, 3.782958984375, 4.4267578125, 5.070556640625, 5.71435546875, 6.358154296875, 7.001953125, 7.645751953125, 8.28955078125, 8.933349609375, 9.5771484375, 10.220947265625, 10.86474609375, 11.508544921875, 12.15234375, 12.796142578125, 13.43994140625, 14.083740234375, 14.7275390625, 15.371337890625, 16.01513671875, 16.658935546875, 17.302734375, 17.946533203125, 18.59033203125, 19.234130859375, 19.8779296875, 20.521728515625, 21.16552734375, 21.809326171875, 22.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 19.0, 16.0, 23.0, 43.0, 41.0, 72.0, 96.0, 124.0, 189.0, 272.0, 375.0, 563.0, 918.0, 1517.0, 2758.0, 5592.0, 11818.0, 26876.0, 64444.0, 144554.0, 267322.0, 264700.0, 142444.0, 62914.0, 26653.0, 11604.0, 5506.0, 2762.0, 1543.0, 902.0, 560.0, 363.0, 307.0, 195.0, 137.0, 83.0, 74.0, 46.0, 34.0, 29.0, 18.0, 9.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.34375, -50.5380859375, -48.732421875, -46.9267578125, -45.12109375, -43.3154296875, -41.509765625, -39.7041015625, -37.8984375, -36.0927734375, -34.287109375, -32.4814453125, -30.67578125, -28.8701171875, -27.064453125, -25.2587890625, -23.453125, -21.6474609375, -19.841796875, -18.0361328125, -16.23046875, -14.4248046875, -12.619140625, -10.8134765625, -9.0078125, -7.2021484375, -5.396484375, -3.5908203125, -1.78515625, 0.0205078125, 1.826171875, 3.6318359375, 5.4375, 7.2431640625, 9.048828125, 10.8544921875, 12.66015625, 14.4658203125, 16.271484375, 18.0771484375, 19.8828125, 21.6884765625, 23.494140625, 25.2998046875, 27.10546875, 28.9111328125, 30.716796875, 32.5224609375, 34.328125, 36.1337890625, 37.939453125, 39.7451171875, 41.55078125, 43.3564453125, 45.162109375, 46.9677734375, 48.7734375, 50.5791015625, 52.384765625, 54.1904296875, 55.99609375, 57.8017578125, 59.607421875, 61.4130859375, 63.21875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 9.0, 8.0, 18.0, 7.0, 12.0, 15.0, 14.0, 23.0, 25.0, 35.0, 33.0, 45.0, 36.0, 52.0, 56.0, 46.0, 46.0, 36.0, 52.0, 50.0, 41.0, 53.0, 38.0, 40.0, 30.0, 34.0, 30.0, 22.0, 12.0, 13.0, 18.0, 12.0, 10.0, 6.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.75, -50.013671875, -48.27734375, -46.541015625, -44.8046875, -43.068359375, -41.33203125, -39.595703125, -37.859375, -36.123046875, -34.38671875, -32.650390625, -30.9140625, -29.177734375, -27.44140625, -25.705078125, -23.96875, -22.232421875, -20.49609375, -18.759765625, -17.0234375, -15.287109375, -13.55078125, -11.814453125, -10.078125, -8.341796875, -6.60546875, -4.869140625, -3.1328125, -1.396484375, 0.33984375, 2.076171875, 3.8125, 5.548828125, 7.28515625, 9.021484375, 10.7578125, 12.494140625, 14.23046875, 15.966796875, 17.703125, 19.439453125, 21.17578125, 22.912109375, 24.6484375, 26.384765625, 28.12109375, 29.857421875, 31.59375, 33.330078125, 35.06640625, 36.802734375, 38.5390625, 40.275390625, 42.01171875, 43.748046875, 45.484375, 47.220703125, 48.95703125, 50.693359375, 52.4296875, 54.166015625, 55.90234375, 57.638671875, 59.375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 16.0, 23.0, 27.0, 39.0, 41.0, 81.0, 123.0, 183.0, 306.0, 510.0, 1070.0, 2461.0, 6230.0, 20576.0, 85191.0, 336018.0, 423328.0, 128158.0, 29649.0, 8602.0, 2985.0, 1291.0, 664.0, 366.0, 187.0, 122.0, 73.0, 55.0, 40.0, 13.0, 19.0, 14.0, 16.0, 12.0, 9.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.35986328125, -33.2197265625, -32.07958984375, -30.939453125, -29.79931640625, -28.6591796875, -27.51904296875, -26.37890625, -25.23876953125, -24.0986328125, -22.95849609375, -21.818359375, -20.67822265625, -19.5380859375, -18.39794921875, -17.2578125, -16.11767578125, -14.9775390625, -13.83740234375, -12.697265625, -11.55712890625, -10.4169921875, -9.27685546875, -8.13671875, -6.99658203125, -5.8564453125, -4.71630859375, -3.576171875, -2.43603515625, -1.2958984375, -0.15576171875, 0.984375, 2.12451171875, 3.2646484375, 4.40478515625, 5.544921875, 6.68505859375, 7.8251953125, 8.96533203125, 10.10546875, 11.24560546875, 12.3857421875, 13.52587890625, 14.666015625, 15.80615234375, 16.9462890625, 18.08642578125, 19.2265625, 20.36669921875, 21.5068359375, 22.64697265625, 23.787109375, 24.92724609375, 26.0673828125, 27.20751953125, 28.34765625, 29.48779296875, 30.6279296875, 31.76806640625, 32.908203125, 34.04833984375, 35.1884765625, 36.32861328125, 37.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 5.0, 9.0, 7.0, 5.0, 16.0, 18.0, 19.0, 32.0, 26.0, 26.0, 41.0, 47.0, 67.0, 100.0, 89.0, 92.0, 64.0, 50.0, 51.0, 45.0, 28.0, 35.0, 21.0, 21.0, 22.0, 9.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.004543304443359375, -0.004396557807922363, -0.0042498111724853516, -0.00410306453704834, -0.003956317901611328, -0.0038095712661743164, -0.0036628246307373047, -0.003516077995300293, -0.0033693313598632812, -0.0032225847244262695, -0.003075838088989258, -0.002929091453552246, -0.0027823448181152344, -0.0026355981826782227, -0.002488851547241211, -0.0023421049118041992, -0.0021953582763671875, -0.0020486116409301758, -0.001901865005493164, -0.0017551183700561523, -0.0016083717346191406, -0.001461625099182129, -0.0013148784637451172, -0.0011681318283081055, -0.0010213851928710938, -0.000874638557434082, -0.0007278919219970703, -0.0005811452865600586, -0.0004343986511230469, -0.00028765201568603516, -0.00014090538024902344, 5.841255187988281e-06, 0.000152587890625, 0.0002993345260620117, 0.00044608116149902344, 0.0005928277969360352, 0.0007395744323730469, 0.0008863210678100586, 0.0010330677032470703, 0.001179814338684082, 0.0013265609741210938, 0.0014733076095581055, 0.0016200542449951172, 0.001766800880432129, 0.0019135475158691406, 0.0020602941513061523, 0.002207040786743164, 0.0023537874221801758, 0.0025005340576171875, 0.0026472806930541992, 0.002794027328491211, 0.0029407739639282227, 0.0030875205993652344, 0.003234267234802246, 0.003381013870239258, 0.0035277605056762695, 0.0036745071411132812, 0.003821253776550293, 0.003968000411987305, 0.004114747047424316, 0.004261493682861328, 0.00440824031829834, 0.0045549869537353516, 0.004701733589172363, 0.004848480224609375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 21.0, 23.0, 31.0, 54.0, 82.0, 123.0, 237.0, 382.0, 668.0, 1183.0, 2493.0, 5963.0, 17854.0, 75553.0, 349971.0, 442700.0, 112803.0, 24469.0, 7689.0, 2995.0, 1408.0, 737.0, 428.0, 247.0, 137.0, 96.0, 62.0, 36.0, 18.0, 14.0, 16.0, 7.0, 9.0, 6.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.59375, -39.3681640625, -38.142578125, -36.9169921875, -35.69140625, -34.4658203125, -33.240234375, -32.0146484375, -30.7890625, -29.5634765625, -28.337890625, -27.1123046875, -25.88671875, -24.6611328125, -23.435546875, -22.2099609375, -20.984375, -19.7587890625, -18.533203125, -17.3076171875, -16.08203125, -14.8564453125, -13.630859375, -12.4052734375, -11.1796875, -9.9541015625, -8.728515625, -7.5029296875, -6.27734375, -5.0517578125, -3.826171875, -2.6005859375, -1.375, -0.1494140625, 1.076171875, 2.3017578125, 3.52734375, 4.7529296875, 5.978515625, 7.2041015625, 8.4296875, 9.6552734375, 10.880859375, 12.1064453125, 13.33203125, 14.5576171875, 15.783203125, 17.0087890625, 18.234375, 19.4599609375, 20.685546875, 21.9111328125, 23.13671875, 24.3623046875, 25.587890625, 26.8134765625, 28.0390625, 29.2646484375, 30.490234375, 31.7158203125, 32.94140625, 34.1669921875, 35.392578125, 36.6181640625, 37.84375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 11.0, 14.0, 11.0, 17.0, 21.0, 23.0, 44.0, 48.0, 54.0, 58.0, 80.0, 92.0, 69.0, 78.0, 77.0, 52.0, 39.0, 48.0, 39.0, 27.0, 19.0, 16.0, 15.0, 8.0, 6.0, 10.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.453125, -21.758056640625, -21.06298828125, -20.367919921875, -19.6728515625, -18.977783203125, -18.28271484375, -17.587646484375, -16.892578125, -16.197509765625, -15.50244140625, -14.807373046875, -14.1123046875, -13.417236328125, -12.72216796875, -12.027099609375, -11.33203125, -10.636962890625, -9.94189453125, -9.246826171875, -8.5517578125, -7.856689453125, -7.16162109375, -6.466552734375, -5.771484375, -5.076416015625, -4.38134765625, -3.686279296875, -2.9912109375, -2.296142578125, -1.60107421875, -0.906005859375, -0.2109375, 0.484130859375, 1.17919921875, 1.874267578125, 2.5693359375, 3.264404296875, 3.95947265625, 4.654541015625, 5.349609375, 6.044677734375, 6.73974609375, 7.434814453125, 8.1298828125, 8.824951171875, 9.52001953125, 10.215087890625, 10.91015625, 11.605224609375, 12.30029296875, 12.995361328125, 13.6904296875, 14.385498046875, 15.08056640625, 15.775634765625, 16.470703125, 17.165771484375, 17.86083984375, 18.555908203125, 19.2509765625, 19.946044921875, 20.64111328125, 21.336181640625, 22.03125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 18.0, 14.0, 37.0, 61.0, 68.0, 82.0, 96.0, 129.0, 96.0, 92.0, 75.0, 54.0, 47.0, 37.0, 22.0, 13.0, 11.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-502.29571533203125, -489.33551025390625, -476.37530517578125, -463.4150695800781, -450.4548645019531, -437.4946594238281, -424.5344543457031, -411.57421875, -398.614013671875, -385.65380859375, -372.693603515625, -359.7333679199219, -346.7731628417969, -333.8129577636719, -320.8527526855469, -307.89251708984375, -294.93231201171875, -281.97210693359375, -269.01190185546875, -256.0516662597656, -243.09146118164062, -230.13125610351562, -217.17105102539062, -204.21083068847656, -191.25064086914062, -178.29043579101562, -165.33021545410156, -152.37001037597656, -139.4097900390625, -126.4495849609375, -113.48937225341797, -100.52915954589844, -87.56893920898438, -74.60872650146484, -61.64851379394531, -48.68830490112305, -35.728092193603516, -22.76788330078125, -9.807670593261719, 3.1525421142578125, 16.112754821777344, 29.072967529296875, 42.033180236816406, 54.99338912963867, 67.95359802246094, 80.91381072998047, 93.8740234375, 106.83423614501953, 119.79444885253906, 132.75465393066406, 145.71487426757812, 158.67507934570312, 171.6352996826172, 184.5955047607422, 197.55572509765625, 210.51593017578125, 223.47613525390625, 236.43634033203125, 249.3965606689453, 262.3567810058594, 275.3169860839844, 288.2771911621094, 301.2373962402344, 314.1976318359375, 327.1578369140625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 11.0, 4.0, 10.0, 17.0, 18.0, 15.0, 23.0, 28.0, 28.0, 46.0, 47.0, 34.0, 35.0, 58.0, 44.0, 49.0, 58.0, 57.0, 45.0, 39.0, 46.0, 43.0, 28.0, 44.0, 25.0, 36.0, 20.0, 14.0, 9.0, 18.0, 10.0, 5.0, 4.0, 11.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.86920166015625, -280.7148132324219, -270.5603942871094, -260.406005859375, -250.25161743164062, -240.0972137451172, -229.94281005859375, -219.78842163085938, -209.63401794433594, -199.4796142578125, -189.32522583007812, -179.1708221435547, -169.01641845703125, -158.86203002929688, -148.70762634277344, -138.55322265625, -128.39883422851562, -118.24443817138672, -108.09004211425781, -97.93563842773438, -87.78124237060547, -77.62684631347656, -67.47244262695312, -57.31804656982422, -47.16365051269531, -37.009254455566406, -26.854854583740234, -16.700456619262695, -6.546058654785156, 3.60833740234375, 13.762737274169922, 23.917137145996094, 34.071533203125, 44.225929260253906, 54.38032913208008, 64.53472900390625, 74.68912506103516, 84.84352111816406, 94.9979248046875, 105.1523208618164, 115.30671691894531, 125.46111297607422, 135.61550903320312, 145.76991271972656, 155.92431640625, 166.07870483398438, 176.2331085205078, 186.38751220703125, 196.54190063476562, 206.69630432128906, 216.85069274902344, 227.00509643554688, 237.15948486328125, 247.3138885498047, 257.4682922363281, 267.6226806640625, 277.777099609375, 287.9314880371094, 298.0859069824219, 308.24029541015625, 318.3946838378906, 328.549072265625, 338.7034912109375, 348.8578796386719, 359.01226806640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 8.0, 20.0, 33.0, 48.0, 73.0, 102.0, 181.0, 329.0, 610.0, 1199.0, 2964.0, 8620.0, 33589.0, 353145.0, 3695411.0, 74827.0, 14901.0, 4668.0, 1747.0, 799.0, 416.0, 225.0, 125.0, 69.0, 49.0, 27.0, 24.0, 15.0, 6.0, 11.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-145.0, -139.861328125, -134.72265625, -129.583984375, -124.4453125, -119.306640625, -114.16796875, -109.029296875, -103.890625, -98.751953125, -93.61328125, -88.474609375, -83.3359375, -78.197265625, -73.05859375, -67.919921875, -62.78125, -57.642578125, -52.50390625, -47.365234375, -42.2265625, -37.087890625, -31.94921875, -26.810546875, -21.671875, -16.533203125, -11.39453125, -6.255859375, -1.1171875, 4.021484375, 9.16015625, 14.298828125, 19.4375, 24.576171875, 29.71484375, 34.853515625, 39.9921875, 45.130859375, 50.26953125, 55.408203125, 60.546875, 65.685546875, 70.82421875, 75.962890625, 81.1015625, 86.240234375, 91.37890625, 96.517578125, 101.65625, 106.794921875, 111.93359375, 117.072265625, 122.2109375, 127.349609375, 132.48828125, 137.626953125, 142.765625, 147.904296875, 153.04296875, 158.181640625, 163.3203125, 168.458984375, 173.59765625, 178.736328125, 183.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 14.0, 21.0, 20.0, 19.0, 32.0, 46.0, 60.0, 65.0, 69.0, 82.0, 81.0, 82.0, 68.0, 76.0, 50.0, 54.0, 31.0, 41.0, 27.0, 16.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5390625, -14.9981689453125, -14.457275390625, -13.9163818359375, -13.37548828125, -12.8345947265625, -12.293701171875, -11.7528076171875, -11.2119140625, -10.6710205078125, -10.130126953125, -9.5892333984375, -9.04833984375, -8.5074462890625, -7.966552734375, -7.4256591796875, -6.884765625, -6.3438720703125, -5.802978515625, -5.2620849609375, -4.72119140625, -4.1802978515625, -3.639404296875, -3.0985107421875, -2.5576171875, -2.0167236328125, -1.475830078125, -0.9349365234375, -0.39404296875, 0.1468505859375, 0.687744140625, 1.2286376953125, 1.76953125, 2.3104248046875, 2.851318359375, 3.3922119140625, 3.93310546875, 4.4739990234375, 5.014892578125, 5.5557861328125, 6.0966796875, 6.6375732421875, 7.178466796875, 7.7193603515625, 8.26025390625, 8.8011474609375, 9.342041015625, 9.8829345703125, 10.423828125, 10.9647216796875, 11.505615234375, 12.0465087890625, 12.58740234375, 13.1282958984375, 13.669189453125, 14.2100830078125, 14.7509765625, 15.2918701171875, 15.832763671875, 16.3736572265625, 16.91455078125, 17.4554443359375, 17.996337890625, 18.5372314453125, 19.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 5.0, 7.0, 12.0, 12.0, 18.0, 28.0, 17.0, 27.0, 34.0, 36.0, 80.0, 101.0, 157.0, 327.0, 701.0, 1710.0, 4944.0, 16478.0, 69454.0, 576713.0, 3327656.0, 152370.0, 29879.0, 8311.0, 2920.0, 1191.0, 511.0, 217.0, 126.0, 61.0, 47.0, 33.0, 24.0, 16.0, 17.0, 8.0, 11.0, 7.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-122.3125, -118.5166015625, -114.720703125, -110.9248046875, -107.12890625, -103.3330078125, -99.537109375, -95.7412109375, -91.9453125, -88.1494140625, -84.353515625, -80.5576171875, -76.76171875, -72.9658203125, -69.169921875, -65.3740234375, -61.578125, -57.7822265625, -53.986328125, -50.1904296875, -46.39453125, -42.5986328125, -38.802734375, -35.0068359375, -31.2109375, -27.4150390625, -23.619140625, -19.8232421875, -16.02734375, -12.2314453125, -8.435546875, -4.6396484375, -0.84375, 2.9521484375, 6.748046875, 10.5439453125, 14.33984375, 18.1357421875, 21.931640625, 25.7275390625, 29.5234375, 33.3193359375, 37.115234375, 40.9111328125, 44.70703125, 48.5029296875, 52.298828125, 56.0947265625, 59.890625, 63.6865234375, 67.482421875, 71.2783203125, 75.07421875, 78.8701171875, 82.666015625, 86.4619140625, 90.2578125, 94.0537109375, 97.849609375, 101.6455078125, 105.44140625, 109.2373046875, 113.033203125, 116.8291015625, 120.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 3.0, 6.0, 20.0, 29.0, 42.0, 63.0, 113.0, 214.0, 604.0, 2060.0, 440.0, 210.0, 108.0, 50.0, 39.0, 21.0, 20.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-54.9375, -53.75244140625, -52.5673828125, -51.38232421875, -50.197265625, -49.01220703125, -47.8271484375, -46.64208984375, -45.45703125, -44.27197265625, -43.0869140625, -41.90185546875, -40.716796875, -39.53173828125, -38.3466796875, -37.16162109375, -35.9765625, -34.79150390625, -33.6064453125, -32.42138671875, -31.236328125, -30.05126953125, -28.8662109375, -27.68115234375, -26.49609375, -25.31103515625, -24.1259765625, -22.94091796875, -21.755859375, -20.57080078125, -19.3857421875, -18.20068359375, -17.015625, -15.83056640625, -14.6455078125, -13.46044921875, -12.275390625, -11.09033203125, -9.9052734375, -8.72021484375, -7.53515625, -6.35009765625, -5.1650390625, -3.97998046875, -2.794921875, -1.60986328125, -0.4248046875, 0.76025390625, 1.9453125, 3.13037109375, 4.3154296875, 5.50048828125, 6.685546875, 7.87060546875, 9.0556640625, 10.24072265625, 11.42578125, 12.61083984375, 13.7958984375, 14.98095703125, 16.166015625, 17.35107421875, 18.5361328125, 19.72119140625, 20.90625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 4.0, 11.0, 19.0, 18.0, 34.0, 46.0, 75.0, 133.0, 120.0, 143.0, 123.0, 89.0, 73.0, 35.0, 28.0, 17.0, 7.0, 8.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.0135269165039, -115.53886413574219, -110.06420135498047, -104.58953857421875, -99.11488342285156, -93.64021301269531, -88.16555786132812, -82.6908950805664, -77.21623229980469, -71.74156951904297, -66.26690673828125, -60.7922477722168, -55.31758499145508, -49.84292221069336, -44.368263244628906, -38.89360046386719, -33.41893768310547, -27.94427490234375, -22.469614028930664, -16.994953155517578, -11.52029037475586, -6.045627593994141, -0.5709686279296875, 4.903694152832031, 10.37835693359375, 15.853018760681152, 21.327680587768555, 26.80234146118164, 32.27700424194336, 37.75166702270508, 43.22632598876953, 48.70098876953125, 54.17564392089844, 59.650306701660156, 65.12496948242188, 70.59962463378906, 76.07429504394531, 81.5489501953125, 87.02361297607422, 92.49827575683594, 97.97293853759766, 103.44760131835938, 108.9222640991211, 114.39692687988281, 119.87158203125, 125.34625244140625, 130.82090759277344, 136.29556274414062, 141.77023315429688, 147.24488830566406, 152.7195587158203, 158.1942138671875, 163.66888427734375, 169.14353942871094, 174.61819458007812, 180.09286499023438, 185.56753540039062, 191.0421905517578, 196.51686096191406, 201.99151611328125, 207.4661865234375, 212.9408416748047, 218.41549682617188, 223.89016723632812, 229.3648223876953]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 9.0, 13.0, 15.0, 19.0, 18.0, 24.0, 20.0, 31.0, 29.0, 34.0, 35.0, 29.0, 28.0, 51.0, 39.0, 38.0, 48.0, 47.0, 44.0, 42.0, 42.0, 37.0, 30.0, 29.0, 32.0, 27.0, 20.0, 15.0, 19.0, 13.0, 11.0, 13.0, 11.0, 9.0, 11.0, 11.0, 2.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-86.27619934082031, -83.82474517822266, -81.373291015625, -78.92182922363281, -76.47037506103516, -74.0189208984375, -71.56746673583984, -69.11601257324219, -66.66455078125, -64.21309661865234, -61.76163864135742, -59.310184478759766, -56.858726501464844, -54.40727233886719, -51.95581817626953, -49.50436019897461, -47.05290603637695, -44.6014518737793, -42.149993896484375, -39.69853973388672, -37.2470817565918, -34.79562759399414, -32.34416961669922, -29.892715454101562, -27.441259384155273, -24.989803314208984, -22.538347244262695, -20.086891174316406, -17.63543701171875, -15.183979988098145, -12.732524871826172, -10.281068801879883, -7.829612731933594, -5.378156661987305, -2.926701068878174, -0.47524547576904297, 1.976210594177246, 4.427666664123535, 6.879121780395508, 9.330577850341797, 11.782033920288086, 14.233489990234375, 16.684946060180664, 19.136402130126953, 21.58785629272461, 24.03931427001953, 26.490768432617188, 28.942224502563477, 31.393680572509766, 33.84513473510742, 36.296592712402344, 38.748046875, 41.19950485229492, 43.65095901489258, 46.1024169921875, 48.553871154785156, 51.00532531738281, 53.45677947998047, 55.90823745727539, 58.35969161987305, 60.81114959716797, 63.262603759765625, 65.71405792236328, 68.16551208496094, 70.61697387695312]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 12.0, 24.0, 40.0, 42.0, 70.0, 80.0, 197.0, 271.0, 484.0, 1001.0, 2147.0, 5643.0, 18128.0, 66668.0, 255361.0, 471452.0, 164830.0, 42863.0, 11817.0, 3981.0, 1622.0, 755.0, 416.0, 231.0, 126.0, 86.0, 52.0, 48.0, 30.0, 17.0, 6.0, 9.0, 7.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.875, -92.6064453125, -89.337890625, -86.0693359375, -82.80078125, -79.5322265625, -76.263671875, -72.9951171875, -69.7265625, -66.4580078125, -63.189453125, -59.9208984375, -56.65234375, -53.3837890625, -50.115234375, -46.8466796875, -43.578125, -40.3095703125, -37.041015625, -33.7724609375, -30.50390625, -27.2353515625, -23.966796875, -20.6982421875, -17.4296875, -14.1611328125, -10.892578125, -7.6240234375, -4.35546875, -1.0869140625, 2.181640625, 5.4501953125, 8.71875, 11.9873046875, 15.255859375, 18.5244140625, 21.79296875, 25.0615234375, 28.330078125, 31.5986328125, 34.8671875, 38.1357421875, 41.404296875, 44.6728515625, 47.94140625, 51.2099609375, 54.478515625, 57.7470703125, 61.015625, 64.2841796875, 67.552734375, 70.8212890625, 74.08984375, 77.3583984375, 80.626953125, 83.8955078125, 87.1640625, 90.4326171875, 93.701171875, 96.9697265625, 100.23828125, 103.5068359375, 106.775390625, 110.0439453125, 113.3125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 16.0, 12.0, 26.0, 22.0, 36.0, 46.0, 53.0, 72.0, 73.0, 101.0, 92.0, 75.0, 90.0, 67.0, 46.0, 46.0, 44.0, 25.0, 21.0, 11.0, 7.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.71875, -15.12451171875, -14.5302734375, -13.93603515625, -13.341796875, -12.74755859375, -12.1533203125, -11.55908203125, -10.96484375, -10.37060546875, -9.7763671875, -9.18212890625, -8.587890625, -7.99365234375, -7.3994140625, -6.80517578125, -6.2109375, -5.61669921875, -5.0224609375, -4.42822265625, -3.833984375, -3.23974609375, -2.6455078125, -2.05126953125, -1.45703125, -0.86279296875, -0.2685546875, 0.32568359375, 0.919921875, 1.51416015625, 2.1083984375, 2.70263671875, 3.296875, 3.89111328125, 4.4853515625, 5.07958984375, 5.673828125, 6.26806640625, 6.8623046875, 7.45654296875, 8.05078125, 8.64501953125, 9.2392578125, 9.83349609375, 10.427734375, 11.02197265625, 11.6162109375, 12.21044921875, 12.8046875, 13.39892578125, 13.9931640625, 14.58740234375, 15.181640625, 15.77587890625, 16.3701171875, 16.96435546875, 17.55859375, 18.15283203125, 18.7470703125, 19.34130859375, 19.935546875, 20.52978515625, 21.1240234375, 21.71826171875, 22.3125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 11.0, 14.0, 18.0, 28.0, 47.0, 61.0, 91.0, 97.0, 171.0, 214.0, 275.0, 466.0, 746.0, 1258.0, 2144.0, 4337.0, 9375.0, 21474.0, 54359.0, 133009.0, 275978.0, 293049.0, 145947.0, 60441.0, 24088.0, 10186.0, 4703.0, 2332.0, 1302.0, 776.0, 488.0, 328.0, 208.0, 140.0, 113.0, 71.0, 64.0, 44.0, 33.0, 14.0, 18.0, 10.0, 6.0, 3.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.375, -49.720703125, -48.06640625, -46.412109375, -44.7578125, -43.103515625, -41.44921875, -39.794921875, -38.140625, -36.486328125, -34.83203125, -33.177734375, -31.5234375, -29.869140625, -28.21484375, -26.560546875, -24.90625, -23.251953125, -21.59765625, -19.943359375, -18.2890625, -16.634765625, -14.98046875, -13.326171875, -11.671875, -10.017578125, -8.36328125, -6.708984375, -5.0546875, -3.400390625, -1.74609375, -0.091796875, 1.5625, 3.216796875, 4.87109375, 6.525390625, 8.1796875, 9.833984375, 11.48828125, 13.142578125, 14.796875, 16.451171875, 18.10546875, 19.759765625, 21.4140625, 23.068359375, 24.72265625, 26.376953125, 28.03125, 29.685546875, 31.33984375, 32.994140625, 34.6484375, 36.302734375, 37.95703125, 39.611328125, 41.265625, 42.919921875, 44.57421875, 46.228515625, 47.8828125, 49.537109375, 51.19140625, 52.845703125, 54.5]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 4.0, 13.0, 9.0, 14.0, 16.0, 14.0, 16.0, 24.0, 24.0, 27.0, 40.0, 32.0, 33.0, 43.0, 38.0, 50.0, 50.0, 60.0, 54.0, 45.0, 37.0, 50.0, 41.0, 44.0, 41.0, 30.0, 27.0, 15.0, 27.0, 17.0, 14.0, 9.0, 8.0, 11.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.76171875, -39.2109375, -37.66015625, -36.109375, -34.55859375, -33.0078125, -31.45703125, -29.90625, -28.35546875, -26.8046875, -25.25390625, -23.703125, -22.15234375, -20.6015625, -19.05078125, -17.5, -15.94921875, -14.3984375, -12.84765625, -11.296875, -9.74609375, -8.1953125, -6.64453125, -5.09375, -3.54296875, -1.9921875, -0.44140625, 1.109375, 2.66015625, 4.2109375, 5.76171875, 7.3125, 8.86328125, 10.4140625, 11.96484375, 13.515625, 15.06640625, 16.6171875, 18.16796875, 19.71875, 21.26953125, 22.8203125, 24.37109375, 25.921875, 27.47265625, 29.0234375, 30.57421875, 32.125, 33.67578125, 35.2265625, 36.77734375, 38.328125, 39.87890625, 41.4296875, 42.98046875, 44.53125, 46.08203125, 47.6328125, 49.18359375, 50.734375, 52.28515625, 53.8359375, 55.38671875, 56.9375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 17.0, 11.0, 29.0, 29.0, 48.0, 82.0, 128.0, 229.0, 472.0, 857.0, 1738.0, 3924.0, 11314.0, 45845.0, 279892.0, 552160.0, 117351.0, 22383.0, 6616.0, 2686.0, 1213.0, 655.0, 353.0, 202.0, 98.0, 68.0, 39.0, 27.0, 21.0, 9.0, 12.0, 7.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.65625, -41.2919921875, -39.927734375, -38.5634765625, -37.19921875, -35.8349609375, -34.470703125, -33.1064453125, -31.7421875, -30.3779296875, -29.013671875, -27.6494140625, -26.28515625, -24.9208984375, -23.556640625, -22.1923828125, -20.828125, -19.4638671875, -18.099609375, -16.7353515625, -15.37109375, -14.0068359375, -12.642578125, -11.2783203125, -9.9140625, -8.5498046875, -7.185546875, -5.8212890625, -4.45703125, -3.0927734375, -1.728515625, -0.3642578125, 1.0, 2.3642578125, 3.728515625, 5.0927734375, 6.45703125, 7.8212890625, 9.185546875, 10.5498046875, 11.9140625, 13.2783203125, 14.642578125, 16.0068359375, 17.37109375, 18.7353515625, 20.099609375, 21.4638671875, 22.828125, 24.1923828125, 25.556640625, 26.9208984375, 28.28515625, 29.6494140625, 31.013671875, 32.3779296875, 33.7421875, 35.1064453125, 36.470703125, 37.8349609375, 39.19921875, 40.5634765625, 41.927734375, 43.2919921875, 44.65625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 7.0, 10.0, 10.0, 13.0, 14.0, 22.0, 37.0, 41.0, 66.0, 82.0, 130.0, 145.0, 107.0, 81.0, 58.0, 38.0, 34.0, 29.0, 17.0, 9.0, 10.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00690460205078125, -0.006703615188598633, -0.006502628326416016, -0.0063016414642333984, -0.006100654602050781, -0.005899667739868164, -0.005698680877685547, -0.00549769401550293, -0.0052967071533203125, -0.005095720291137695, -0.004894733428955078, -0.004693746566772461, -0.004492759704589844, -0.0042917728424072266, -0.004090785980224609, -0.003889799118041992, -0.003688812255859375, -0.003487825393676758, -0.0032868385314941406, -0.0030858516693115234, -0.0028848648071289062, -0.002683877944946289, -0.002482891082763672, -0.0022819042205810547, -0.0020809173583984375, -0.0018799304962158203, -0.0016789436340332031, -0.001477956771850586, -0.0012769699096679688, -0.0010759830474853516, -0.0008749961853027344, -0.0006740093231201172, -0.0004730224609375, -0.0002720355987548828, -7.104873657226562e-05, 0.00012993812561035156, 0.00033092498779296875, 0.0005319118499755859, 0.0007328987121582031, 0.0009338855743408203, 0.0011348724365234375, 0.0013358592987060547, 0.0015368461608886719, 0.001737833023071289, 0.0019388198852539062, 0.0021398067474365234, 0.0023407936096191406, 0.002541780471801758, 0.002742767333984375, 0.002943754196166992, 0.0031447410583496094, 0.0033457279205322266, 0.0035467147827148438, 0.003747701644897461, 0.003948688507080078, 0.004149675369262695, 0.0043506622314453125, 0.00455164909362793, 0.004752635955810547, 0.004953622817993164, 0.005154609680175781, 0.0053555965423583984, 0.005556583404541016, 0.005757570266723633, 0.00595855712890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 0.0, 3.0, 6.0, 2.0, 7.0, 6.0, 10.0, 24.0, 21.0, 28.0, 46.0, 77.0, 134.0, 200.0, 372.0, 728.0, 1535.0, 3540.0, 9782.0, 38165.0, 302387.0, 588049.0, 78453.0, 15701.0, 5084.0, 1994.0, 954.0, 486.0, 279.0, 173.0, 93.0, 62.0, 40.0, 36.0, 15.0, 15.0, 9.0, 6.0, 7.0, 9.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1875, -54.54443359375, -52.9013671875, -51.25830078125, -49.615234375, -47.97216796875, -46.3291015625, -44.68603515625, -43.04296875, -41.39990234375, -39.7568359375, -38.11376953125, -36.470703125, -34.82763671875, -33.1845703125, -31.54150390625, -29.8984375, -28.25537109375, -26.6123046875, -24.96923828125, -23.326171875, -21.68310546875, -20.0400390625, -18.39697265625, -16.75390625, -15.11083984375, -13.4677734375, -11.82470703125, -10.181640625, -8.53857421875, -6.8955078125, -5.25244140625, -3.609375, -1.96630859375, -0.3232421875, 1.31982421875, 2.962890625, 4.60595703125, 6.2490234375, 7.89208984375, 9.53515625, 11.17822265625, 12.8212890625, 14.46435546875, 16.107421875, 17.75048828125, 19.3935546875, 21.03662109375, 22.6796875, 24.32275390625, 25.9658203125, 27.60888671875, 29.251953125, 30.89501953125, 32.5380859375, 34.18115234375, 35.82421875, 37.46728515625, 39.1103515625, 40.75341796875, 42.396484375, 44.03955078125, 45.6826171875, 47.32568359375, 48.96875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 2.0, 6.0, 4.0, 7.0, 9.0, 8.0, 8.0, 21.0, 28.0, 26.0, 44.0, 61.0, 69.0, 80.0, 81.0, 104.0, 101.0, 85.0, 62.0, 46.0, 40.0, 32.0, 17.0, 16.0, 7.0, 9.0, 4.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-32.65625, -31.82421875, -30.9921875, -30.16015625, -29.328125, -28.49609375, -27.6640625, -26.83203125, -26.0, -25.16796875, -24.3359375, -23.50390625, -22.671875, -21.83984375, -21.0078125, -20.17578125, -19.34375, -18.51171875, -17.6796875, -16.84765625, -16.015625, -15.18359375, -14.3515625, -13.51953125, -12.6875, -11.85546875, -11.0234375, -10.19140625, -9.359375, -8.52734375, -7.6953125, -6.86328125, -6.03125, -5.19921875, -4.3671875, -3.53515625, -2.703125, -1.87109375, -1.0390625, -0.20703125, 0.625, 1.45703125, 2.2890625, 3.12109375, 3.953125, 4.78515625, 5.6171875, 6.44921875, 7.28125, 8.11328125, 8.9453125, 9.77734375, 10.609375, 11.44140625, 12.2734375, 13.10546875, 13.9375, 14.76953125, 15.6015625, 16.43359375, 17.265625, 18.09765625, 18.9296875, 19.76171875, 20.59375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 7.0, 9.0, 6.0, 19.0, 19.0, 29.0, 51.0, 59.0, 100.0, 92.0, 110.0, 121.0, 84.0, 90.0, 68.0, 39.0, 29.0, 21.0, 12.0, 10.0, 11.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-573.565673828125, -561.1333618164062, -548.7010498046875, -536.268798828125, -523.8364868164062, -511.4041748046875, -498.97186279296875, -486.53955078125, -474.10723876953125, -461.6749267578125, -449.2426452636719, -436.8103332519531, -424.3780212402344, -411.94573974609375, -399.513427734375, -387.08111572265625, -374.6488342285156, -362.2165222167969, -349.78424072265625, -337.3519287109375, -324.91961669921875, -312.4873046875, -300.0550231933594, -287.6227111816406, -275.1904296875, -262.75811767578125, -250.32582092285156, -237.89352416992188, -225.46121215820312, -213.02891540527344, -200.59661865234375, -188.164306640625, -175.73202514648438, -163.2997283935547, -150.86741638183594, -138.43511962890625, -126.00281524658203, -113.57051086425781, -101.13821411132812, -88.7059097290039, -76.27360534667969, -63.84130096435547, -51.409000396728516, -38.97669982910156, -26.544395446777344, -14.112091064453125, -1.6797943115234375, 10.752510070800781, 23.184814453125, 35.61711883544922, 48.04941940307617, 60.481719970703125, 72.91402435302734, 85.34632873535156, 97.77862548828125, 110.21092987060547, 122.64323425292969, 135.07553100585938, 147.50784301757812, 159.9401397705078, 172.3724365234375, 184.80474853515625, 197.23704528808594, 209.66934204101562, 222.10165405273438]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 6.0, 10.0, 11.0, 14.0, 11.0, 18.0, 29.0, 30.0, 35.0, 40.0, 49.0, 32.0, 40.0, 52.0, 42.0, 35.0, 46.0, 58.0, 51.0, 51.0, 49.0, 48.0, 29.0, 39.0, 35.0, 26.0, 23.0, 12.0, 19.0, 26.0, 2.0, 5.0, 4.0, 8.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-315.7646179199219, -306.2895202636719, -296.8144226074219, -287.3393249511719, -277.8642272949219, -268.3891296386719, -258.9140319824219, -249.4389190673828, -239.9638214111328, -230.4887237548828, -221.0136260986328, -211.5385284423828, -202.06341552734375, -192.58831787109375, -183.11322021484375, -173.63812255859375, -164.16302490234375, -154.68792724609375, -145.21282958984375, -135.73773193359375, -126.26262664794922, -116.78752899169922, -107.31242370605469, -97.83732604980469, -88.36222839355469, -78.88713073730469, -69.41203308105469, -59.936927795410156, -50.461830139160156, -40.986732482910156, -31.51163101196289, -22.036529541015625, -12.56146240234375, -3.086362838745117, 6.388736724853516, 15.863836288452148, 25.33893585205078, 34.81403350830078, 44.28913497924805, 53.76423645019531, 63.23933410644531, 72.71443176269531, 82.18952941894531, 91.66463470458984, 101.13973236083984, 110.61483001708984, 120.08993530273438, 129.56503295898438, 139.04013061523438, 148.51522827148438, 157.99032592773438, 167.46542358398438, 176.94052124023438, 186.41561889648438, 195.89073181152344, 205.36582946777344, 214.84092712402344, 224.31602478027344, 233.79112243652344, 243.26622009277344, 252.7413330078125, 262.2164306640625, 271.6915283203125, 281.1666259765625, 290.6417236328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 26.0, 38.0, 49.0, 64.0, 121.0, 238.0, 481.0, 916.0, 2287.0, 6420.0, 22276.0, 122367.0, 3535504.0, 438003.0, 47545.0, 11231.0, 3589.0, 1463.0, 688.0, 352.0, 192.0, 127.0, 62.0, 40.0, 38.0, 33.0, 21.0, 17.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-129.25, -124.591796875, -119.93359375, -115.275390625, -110.6171875, -105.958984375, -101.30078125, -96.642578125, -91.984375, -87.326171875, -82.66796875, -78.009765625, -73.3515625, -68.693359375, -64.03515625, -59.376953125, -54.71875, -50.060546875, -45.40234375, -40.744140625, -36.0859375, -31.427734375, -26.76953125, -22.111328125, -17.453125, -12.794921875, -8.13671875, -3.478515625, 1.1796875, 5.837890625, 10.49609375, 15.154296875, 19.8125, 24.470703125, 29.12890625, 33.787109375, 38.4453125, 43.103515625, 47.76171875, 52.419921875, 57.078125, 61.736328125, 66.39453125, 71.052734375, 75.7109375, 80.369140625, 85.02734375, 89.685546875, 94.34375, 99.001953125, 103.66015625, 108.318359375, 112.9765625, 117.634765625, 122.29296875, 126.951171875, 131.609375, 136.267578125, 140.92578125, 145.583984375, 150.2421875, 154.900390625, 159.55859375, 164.216796875, 168.875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 14.0, 20.0, 23.0, 31.0, 33.0, 58.0, 69.0, 96.0, 97.0, 84.0, 77.0, 74.0, 97.0, 60.0, 45.0, 40.0, 26.0, 17.0, 23.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.501220703125, -16.89306640625, -16.284912109375, -15.6767578125, -15.068603515625, -14.46044921875, -13.852294921875, -13.244140625, -12.635986328125, -12.02783203125, -11.419677734375, -10.8115234375, -10.203369140625, -9.59521484375, -8.987060546875, -8.37890625, -7.770751953125, -7.16259765625, -6.554443359375, -5.9462890625, -5.338134765625, -4.72998046875, -4.121826171875, -3.513671875, -2.905517578125, -2.29736328125, -1.689208984375, -1.0810546875, -0.472900390625, 0.13525390625, 0.743408203125, 1.3515625, 1.959716796875, 2.56787109375, 3.176025390625, 3.7841796875, 4.392333984375, 5.00048828125, 5.608642578125, 6.216796875, 6.824951171875, 7.43310546875, 8.041259765625, 8.6494140625, 9.257568359375, 9.86572265625, 10.473876953125, 11.08203125, 11.690185546875, 12.29833984375, 12.906494140625, 13.5146484375, 14.122802734375, 14.73095703125, 15.339111328125, 15.947265625, 16.555419921875, 17.16357421875, 17.771728515625, 18.3798828125, 18.988037109375, 19.59619140625, 20.204345703125, 20.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 10.0, 13.0, 15.0, 28.0, 27.0, 60.0, 51.0, 69.0, 89.0, 119.0, 185.0, 234.0, 328.0, 493.0, 893.0, 1551.0, 3168.0, 8295.0, 27271.0, 135507.0, 2376303.0, 1485477.0, 115666.0, 24127.0, 7263.0, 2980.0, 1485.0, 856.0, 549.0, 361.0, 214.0, 149.0, 102.0, 81.0, 80.0, 42.0, 31.0, 26.0, 24.0, 14.0, 7.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-109.0, -105.58984375, -102.1796875, -98.76953125, -95.359375, -91.94921875, -88.5390625, -85.12890625, -81.71875, -78.30859375, -74.8984375, -71.48828125, -68.078125, -64.66796875, -61.2578125, -57.84765625, -54.4375, -51.02734375, -47.6171875, -44.20703125, -40.796875, -37.38671875, -33.9765625, -30.56640625, -27.15625, -23.74609375, -20.3359375, -16.92578125, -13.515625, -10.10546875, -6.6953125, -3.28515625, 0.125, 3.53515625, 6.9453125, 10.35546875, 13.765625, 17.17578125, 20.5859375, 23.99609375, 27.40625, 30.81640625, 34.2265625, 37.63671875, 41.046875, 44.45703125, 47.8671875, 51.27734375, 54.6875, 58.09765625, 61.5078125, 64.91796875, 68.328125, 71.73828125, 75.1484375, 78.55859375, 81.96875, 85.37890625, 88.7890625, 92.19921875, 95.609375, 99.01953125, 102.4296875, 105.83984375, 109.25]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 5.0, 15.0, 25.0, 42.0, 63.0, 92.0, 167.0, 308.0, 709.0, 1652.0, 464.0, 236.0, 109.0, 69.0, 38.0, 27.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.875, -54.376953125, -52.87890625, -51.380859375, -49.8828125, -48.384765625, -46.88671875, -45.388671875, -43.890625, -42.392578125, -40.89453125, -39.396484375, -37.8984375, -36.400390625, -34.90234375, -33.404296875, -31.90625, -30.408203125, -28.91015625, -27.412109375, -25.9140625, -24.416015625, -22.91796875, -21.419921875, -19.921875, -18.423828125, -16.92578125, -15.427734375, -13.9296875, -12.431640625, -10.93359375, -9.435546875, -7.9375, -6.439453125, -4.94140625, -3.443359375, -1.9453125, -0.447265625, 1.05078125, 2.548828125, 4.046875, 5.544921875, 7.04296875, 8.541015625, 10.0390625, 11.537109375, 13.03515625, 14.533203125, 16.03125, 17.529296875, 19.02734375, 20.525390625, 22.0234375, 23.521484375, 25.01953125, 26.517578125, 28.015625, 29.513671875, 31.01171875, 32.509765625, 34.0078125, 35.505859375, 37.00390625, 38.501953125, 40.0]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 20.0, 25.0, 53.0, 66.0, 103.0, 117.0, 133.0, 116.0, 105.0, 70.0, 57.0, 45.0, 28.0, 12.0, 15.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.1314392089844, -355.24560546875, -346.35980224609375, -337.4739990234375, -328.5881652832031, -319.70233154296875, -310.8165283203125, -301.93072509765625, -293.0448913574219, -284.1590576171875, -275.27325439453125, -266.387451171875, -257.5016174316406, -248.6157989501953, -239.72998046875, -230.8441619873047, -221.95834350585938, -213.07252502441406, -204.18670654296875, -195.30088806152344, -186.41506958007812, -177.5292510986328, -168.6434326171875, -159.7576141357422, -150.87179565429688, -141.98597717285156, -133.10015869140625, -124.21434020996094, -115.32852172851562, -106.44270324707031, -97.556884765625, -88.67106628417969, -79.78526306152344, -70.89944458007812, -62.01362609863281, -53.1278076171875, -44.24198913574219, -35.356170654296875, -26.470352172851562, -17.58453369140625, -8.698715209960938, 0.187103271484375, 9.072921752929688, 17.958740234375, 26.844558715820312, 35.730377197265625, 44.61619567871094, 53.50201416015625, 62.38783264160156, 71.27365112304688, 80.15946960449219, 89.0452880859375, 97.93110656738281, 106.81692504882812, 115.70274353027344, 124.58856201171875, 133.47438049316406, 142.36019897460938, 151.2460174560547, 160.1318359375, 169.0176544189453, 177.90347290039062, 186.78929138183594, 195.67510986328125, 204.56092834472656]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 10.0, 8.0, 12.0, 23.0, 24.0, 27.0, 30.0, 35.0, 36.0, 40.0, 42.0, 41.0, 41.0, 40.0, 57.0, 60.0, 60.0, 37.0, 45.0, 36.0, 32.0, 33.0, 29.0, 39.0, 33.0, 21.0, 11.0, 18.0, 10.0, 15.0, 9.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.99546813964844, -129.6334686279297, -125.27147674560547, -120.90947723388672, -116.5474853515625, -112.18548583984375, -107.823486328125, -103.46148681640625, -99.09949493408203, -94.73749542236328, -90.37550354003906, -86.01350402832031, -81.65150451660156, -77.28951263427734, -72.9275131225586, -68.56552124023438, -64.20352172851562, -59.84152603149414, -55.479530334472656, -51.117530822753906, -46.75553512573242, -42.39353942871094, -38.03153991699219, -33.6695442199707, -29.30754852294922, -24.945552825927734, -20.583555221557617, -16.2215576171875, -11.859561920166016, -7.497566223144531, -3.135568618774414, 1.2264289855957031, 5.588409423828125, 9.950406074523926, 14.312402725219727, 18.674400329589844, 23.036396026611328, 27.398391723632812, 31.76038932800293, 36.12238693237305, 40.48438262939453, 44.846378326416016, 49.2083740234375, 53.57037353515625, 57.932369232177734, 62.29436492919922, 66.65636444091797, 71.01835632324219, 75.38035583496094, 79.74235534667969, 84.1043472290039, 88.46634674072266, 92.82833862304688, 97.19033813476562, 101.55233764648438, 105.91433715820312, 110.27632904052734, 114.6383285522461, 119.00032043457031, 123.36231994628906, 127.72431945800781, 132.0863037109375, 136.44830322265625, 140.810302734375, 145.17230224609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 16.0, 27.0, 41.0, 62.0, 97.0, 153.0, 273.0, 511.0, 1087.0, 3045.0, 14729.0, 116540.0, 698525.0, 184847.0, 21902.0, 3983.0, 1342.0, 625.0, 278.0, 177.0, 116.0, 69.0, 31.0, 25.0, 15.0, 15.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.75, -174.84375, -168.9375, -163.03125, -157.125, -151.21875, -145.3125, -139.40625, -133.5, -127.59375, -121.6875, -115.78125, -109.875, -103.96875, -98.0625, -92.15625, -86.25, -80.34375, -74.4375, -68.53125, -62.625, -56.71875, -50.8125, -44.90625, -39.0, -33.09375, -27.1875, -21.28125, -15.375, -9.46875, -3.5625, 2.34375, 8.25, 14.15625, 20.0625, 25.96875, 31.875, 37.78125, 43.6875, 49.59375, 55.5, 61.40625, 67.3125, 73.21875, 79.125, 85.03125, 90.9375, 96.84375, 102.75, 108.65625, 114.5625, 120.46875, 126.375, 132.28125, 138.1875, 144.09375, 150.0, 155.90625, 161.8125, 167.71875, 173.625, 179.53125, 185.4375, 191.34375, 197.25]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 20.0, 31.0, 37.0, 54.0, 63.0, 74.0, 103.0, 83.0, 100.0, 87.0, 84.0, 75.0, 42.0, 30.0, 40.0, 23.0, 14.0, 8.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.605712890625, -19.96142578125, -19.317138671875, -18.6728515625, -18.028564453125, -17.38427734375, -16.739990234375, -16.095703125, -15.451416015625, -14.80712890625, -14.162841796875, -13.5185546875, -12.874267578125, -12.22998046875, -11.585693359375, -10.94140625, -10.297119140625, -9.65283203125, -9.008544921875, -8.3642578125, -7.719970703125, -7.07568359375, -6.431396484375, -5.787109375, -5.142822265625, -4.49853515625, -3.854248046875, -3.2099609375, -2.565673828125, -1.92138671875, -1.277099609375, -0.6328125, 0.011474609375, 0.65576171875, 1.300048828125, 1.9443359375, 2.588623046875, 3.23291015625, 3.877197265625, 4.521484375, 5.165771484375, 5.81005859375, 6.454345703125, 7.0986328125, 7.742919921875, 8.38720703125, 9.031494140625, 9.67578125, 10.320068359375, 10.96435546875, 11.608642578125, 12.2529296875, 12.897216796875, 13.54150390625, 14.185791015625, 14.830078125, 15.474365234375, 16.11865234375, 16.762939453125, 17.4072265625, 18.051513671875, 18.69580078125, 19.340087890625, 19.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 10.0, 11.0, 11.0, 28.0, 37.0, 50.0, 75.0, 111.0, 155.0, 232.0, 366.0, 613.0, 1001.0, 1790.0, 3260.0, 6647.0, 13941.0, 30622.0, 67388.0, 147768.0, 296934.0, 255283.0, 119736.0, 54674.0, 24461.0, 11394.0, 5398.0, 2745.0, 1552.0, 816.0, 504.0, 303.0, 241.0, 112.0, 91.0, 61.0, 37.0, 25.0, 25.0, 15.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.65625, -46.2490234375, -44.841796875, -43.4345703125, -42.02734375, -40.6201171875, -39.212890625, -37.8056640625, -36.3984375, -34.9912109375, -33.583984375, -32.1767578125, -30.76953125, -29.3623046875, -27.955078125, -26.5478515625, -25.140625, -23.7333984375, -22.326171875, -20.9189453125, -19.51171875, -18.1044921875, -16.697265625, -15.2900390625, -13.8828125, -12.4755859375, -11.068359375, -9.6611328125, -8.25390625, -6.8466796875, -5.439453125, -4.0322265625, -2.625, -1.2177734375, 0.189453125, 1.5966796875, 3.00390625, 4.4111328125, 5.818359375, 7.2255859375, 8.6328125, 10.0400390625, 11.447265625, 12.8544921875, 14.26171875, 15.6689453125, 17.076171875, 18.4833984375, 19.890625, 21.2978515625, 22.705078125, 24.1123046875, 25.51953125, 26.9267578125, 28.333984375, 29.7412109375, 31.1484375, 32.5556640625, 33.962890625, 35.3701171875, 36.77734375, 38.1845703125, 39.591796875, 40.9990234375, 42.40625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 10.0, 5.0, 9.0, 15.0, 14.0, 12.0, 15.0, 18.0, 33.0, 23.0, 32.0, 31.0, 36.0, 41.0, 45.0, 42.0, 46.0, 31.0, 50.0, 45.0, 49.0, 43.0, 27.0, 39.0, 32.0, 40.0, 33.0, 21.0, 17.0, 16.0, 24.0, 20.0, 20.0, 13.0, 12.0, 6.0, 10.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.03125, -38.72265625, -37.4140625, -36.10546875, -34.796875, -33.48828125, -32.1796875, -30.87109375, -29.5625, -28.25390625, -26.9453125, -25.63671875, -24.328125, -23.01953125, -21.7109375, -20.40234375, -19.09375, -17.78515625, -16.4765625, -15.16796875, -13.859375, -12.55078125, -11.2421875, -9.93359375, -8.625, -7.31640625, -6.0078125, -4.69921875, -3.390625, -2.08203125, -0.7734375, 0.53515625, 1.84375, 3.15234375, 4.4609375, 5.76953125, 7.078125, 8.38671875, 9.6953125, 11.00390625, 12.3125, 13.62109375, 14.9296875, 16.23828125, 17.546875, 18.85546875, 20.1640625, 21.47265625, 22.78125, 24.08984375, 25.3984375, 26.70703125, 28.015625, 29.32421875, 30.6328125, 31.94140625, 33.25, 34.55859375, 35.8671875, 37.17578125, 38.484375, 39.79296875, 41.1015625, 42.41015625, 43.71875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 16.0, 24.0, 44.0, 72.0, 144.0, 319.0, 842.0, 2813.0, 13599.0, 111197.0, 660574.0, 228443.0, 24136.0, 4351.0, 1151.0, 428.0, 177.0, 91.0, 59.0, 22.0, 15.0, 11.0, 9.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.5595703125, -40.900390625, -39.2412109375, -37.58203125, -35.9228515625, -34.263671875, -32.6044921875, -30.9453125, -29.2861328125, -27.626953125, -25.9677734375, -24.30859375, -22.6494140625, -20.990234375, -19.3310546875, -17.671875, -16.0126953125, -14.353515625, -12.6943359375, -11.03515625, -9.3759765625, -7.716796875, -6.0576171875, -4.3984375, -2.7392578125, -1.080078125, 0.5791015625, 2.23828125, 3.8974609375, 5.556640625, 7.2158203125, 8.875, 10.5341796875, 12.193359375, 13.8525390625, 15.51171875, 17.1708984375, 18.830078125, 20.4892578125, 22.1484375, 23.8076171875, 25.466796875, 27.1259765625, 28.78515625, 30.4443359375, 32.103515625, 33.7626953125, 35.421875, 37.0810546875, 38.740234375, 40.3994140625, 42.05859375, 43.7177734375, 45.376953125, 47.0361328125, 48.6953125, 50.3544921875, 52.013671875, 53.6728515625, 55.33203125, 56.9912109375, 58.650390625, 60.3095703125, 61.96875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 8.0, 14.0, 17.0, 20.0, 27.0, 35.0, 38.0, 56.0, 54.0, 124.0, 133.0, 130.0, 77.0, 53.0, 48.0, 32.0, 33.0, 18.0, 19.0, 13.0, 9.0, 6.0, 1.0, 10.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00592803955078125, -0.005778014659881592, -0.005627989768981934, -0.005477964878082275, -0.005327939987182617, -0.005177915096282959, -0.005027890205383301, -0.004877865314483643, -0.004727840423583984, -0.004577815532684326, -0.004427790641784668, -0.00427776575088501, -0.0041277408599853516, -0.003977715969085693, -0.003827691078186035, -0.003677666187286377, -0.0035276412963867188, -0.0033776164054870605, -0.0032275915145874023, -0.003077566623687744, -0.002927541732788086, -0.0027775168418884277, -0.0026274919509887695, -0.0024774670600891113, -0.002327442169189453, -0.002177417278289795, -0.0020273923873901367, -0.0018773674964904785, -0.0017273426055908203, -0.0015773177146911621, -0.001427292823791504, -0.0012772679328918457, -0.0011272430419921875, -0.0009772181510925293, -0.0008271932601928711, -0.0006771683692932129, -0.0005271434783935547, -0.0003771185874938965, -0.00022709369659423828, -7.706880569458008e-05, 7.295608520507812e-05, 0.00022298097610473633, 0.00037300586700439453, 0.0005230307579040527, 0.0006730556488037109, 0.0008230805397033691, 0.0009731054306030273, 0.0011231303215026855, 0.0012731552124023438, 0.001423180103302002, 0.0015732049942016602, 0.0017232298851013184, 0.0018732547760009766, 0.0020232796669006348, 0.002173304557800293, 0.002323329448699951, 0.0024733543395996094, 0.0026233792304992676, 0.0027734041213989258, 0.002923429012298584, 0.003073453903198242, 0.0032234787940979004, 0.0033735036849975586, 0.003523528575897217, 0.003673553466796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 11.0, 19.0, 23.0, 19.0, 38.0, 54.0, 102.0, 130.0, 229.0, 359.0, 595.0, 1108.0, 2135.0, 4265.0, 10270.0, 28062.0, 94719.0, 309473.0, 390105.0, 140609.0, 40766.0, 13994.0, 5667.0, 2640.0, 1301.0, 708.0, 431.0, 248.0, 158.0, 102.0, 68.0, 44.0, 18.0, 23.0, 18.0, 16.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-27.078125, -26.236083984375, -25.39404296875, -24.552001953125, -23.7099609375, -22.867919921875, -22.02587890625, -21.183837890625, -20.341796875, -19.499755859375, -18.65771484375, -17.815673828125, -16.9736328125, -16.131591796875, -15.28955078125, -14.447509765625, -13.60546875, -12.763427734375, -11.92138671875, -11.079345703125, -10.2373046875, -9.395263671875, -8.55322265625, -7.711181640625, -6.869140625, -6.027099609375, -5.18505859375, -4.343017578125, -3.5009765625, -2.658935546875, -1.81689453125, -0.974853515625, -0.1328125, 0.709228515625, 1.55126953125, 2.393310546875, 3.2353515625, 4.077392578125, 4.91943359375, 5.761474609375, 6.603515625, 7.445556640625, 8.28759765625, 9.129638671875, 9.9716796875, 10.813720703125, 11.65576171875, 12.497802734375, 13.33984375, 14.181884765625, 15.02392578125, 15.865966796875, 16.7080078125, 17.550048828125, 18.39208984375, 19.234130859375, 20.076171875, 20.918212890625, 21.76025390625, 22.602294921875, 23.4443359375, 24.286376953125, 25.12841796875, 25.970458984375, 26.8125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 2.0, 8.0, 8.0, 22.0, 18.0, 26.0, 30.0, 45.0, 46.0, 66.0, 80.0, 107.0, 97.0, 83.0, 83.0, 69.0, 41.0, 46.0, 24.0, 20.0, 23.0, 16.0, 11.0, 3.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.564697265625, -20.83251953125, -20.100341796875, -19.3681640625, -18.635986328125, -17.90380859375, -17.171630859375, -16.439453125, -15.707275390625, -14.97509765625, -14.242919921875, -13.5107421875, -12.778564453125, -12.04638671875, -11.314208984375, -10.58203125, -9.849853515625, -9.11767578125, -8.385498046875, -7.6533203125, -6.921142578125, -6.18896484375, -5.456787109375, -4.724609375, -3.992431640625, -3.26025390625, -2.528076171875, -1.7958984375, -1.063720703125, -0.33154296875, 0.400634765625, 1.1328125, 1.864990234375, 2.59716796875, 3.329345703125, 4.0615234375, 4.793701171875, 5.52587890625, 6.258056640625, 6.990234375, 7.722412109375, 8.45458984375, 9.186767578125, 9.9189453125, 10.651123046875, 11.38330078125, 12.115478515625, 12.84765625, 13.579833984375, 14.31201171875, 15.044189453125, 15.7763671875, 16.508544921875, 17.24072265625, 17.972900390625, 18.705078125, 19.437255859375, 20.16943359375, 20.901611328125, 21.6337890625, 22.365966796875, 23.09814453125, 23.830322265625, 24.5625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 15.0, 32.0, 33.0, 35.0, 49.0, 50.0, 68.0, 65.0, 84.0, 110.0, 67.0, 69.0, 65.0, 56.0, 41.0, 35.0, 25.0, 22.0, 16.0, 11.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-231.17059326171875, -222.47744750976562, -213.7843017578125, -205.09115600585938, -196.39801025390625, -187.70486450195312, -179.01171875, -170.31857299804688, -161.62542724609375, -152.93228149414062, -144.2391357421875, -135.54598999023438, -126.85284423828125, -118.15969848632812, -109.46656036376953, -100.7734146118164, -92.08027648925781, -83.38713073730469, -74.69398498535156, -66.00083923339844, -57.30769729614258, -48.61455154418945, -39.921409606933594, -31.22826385498047, -22.535118103027344, -13.841973304748535, -5.148828506469727, 3.5443153381347656, 12.23746109008789, 20.930606842041016, 29.623748779296875, 38.31689453125, 47.010040283203125, 55.70318603515625, 64.39633178710938, 73.0894775390625, 81.78262329101562, 90.47576904296875, 99.16890716552734, 107.86205291748047, 116.5551986694336, 125.24834442138672, 133.9414825439453, 142.63462829589844, 151.32777404785156, 160.0209197998047, 168.7140655517578, 177.40721130371094, 186.10035705566406, 194.7935028076172, 203.4866485595703, 212.17979431152344, 220.87294006347656, 229.5660858154297, 238.25921630859375, 246.95236206054688, 255.6455078125, 264.3386535644531, 273.03179931640625, 281.7249450683594, 290.4180908203125, 299.1112365722656, 307.80438232421875, 316.4975280761719, 325.190673828125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 9.0, 12.0, 10.0, 14.0, 14.0, 17.0, 19.0, 24.0, 21.0, 28.0, 27.0, 29.0, 44.0, 39.0, 50.0, 47.0, 49.0, 43.0, 42.0, 52.0, 39.0, 43.0, 44.0, 38.0, 25.0, 33.0, 23.0, 32.0, 15.0, 16.0, 18.0, 16.0, 11.0, 12.0, 11.0, 5.0, 6.0, 1.0, 4.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.33224487304688, -239.5975799560547, -231.8629150390625, -224.1282501220703, -216.39358520507812, -208.65892028808594, -200.92425537109375, -193.18960571289062, -185.45492553710938, -177.7202606201172, -169.985595703125, -162.2509307861328, -154.51626586914062, -146.78160095214844, -139.04693603515625, -131.31228637695312, -123.57762145996094, -115.84295654296875, -108.10829162597656, -100.37362670898438, -92.63896179199219, -84.904296875, -77.16963958740234, -69.43497467041016, -61.70030975341797, -53.96564483642578, -46.230979919433594, -38.49631881713867, -30.761653900146484, -23.026988983154297, -15.292327880859375, -7.5576629638671875, 0.1770172119140625, 7.911681175231934, 15.646345138549805, 23.38100814819336, 31.115673065185547, 38.850337982177734, 46.584999084472656, 54.319664001464844, 62.05432891845703, 69.78899383544922, 77.5236587524414, 85.25831604003906, 92.99298095703125, 100.72764587402344, 108.46231079101562, 116.19697570800781, 123.931640625, 131.6663055419922, 139.40097045898438, 147.13563537597656, 154.87030029296875, 162.60496520996094, 170.33963012695312, 178.07427978515625, 185.8089599609375, 193.5436248779297, 201.27828979492188, 209.01295471191406, 216.74761962890625, 224.48228454589844, 232.21694946289062, 239.95159912109375, 247.68626403808594]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 13.0, 14.0, 27.0, 38.0, 61.0, 95.0, 156.0, 275.0, 603.0, 1429.0, 4248.0, 21747.0, 704500.0, 3425192.0, 27719.0, 5160.0, 1566.0, 645.0, 277.0, 181.0, 81.0, 71.0, 46.0, 41.0, 21.0, 12.0, 15.0, 4.0, 6.0, 11.0, 2.0, 5.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.625, -202.154296875, -194.68359375, -187.212890625, -179.7421875, -172.271484375, -164.80078125, -157.330078125, -149.859375, -142.388671875, -134.91796875, -127.447265625, -119.9765625, -112.505859375, -105.03515625, -97.564453125, -90.09375, -82.623046875, -75.15234375, -67.681640625, -60.2109375, -52.740234375, -45.26953125, -37.798828125, -30.328125, -22.857421875, -15.38671875, -7.916015625, -0.4453125, 7.025390625, 14.49609375, 21.966796875, 29.4375, 36.908203125, 44.37890625, 51.849609375, 59.3203125, 66.791015625, 74.26171875, 81.732421875, 89.203125, 96.673828125, 104.14453125, 111.615234375, 119.0859375, 126.556640625, 134.02734375, 141.498046875, 148.96875, 156.439453125, 163.91015625, 171.380859375, 178.8515625, 186.322265625, 193.79296875, 201.263671875, 208.734375, 216.205078125, 223.67578125, 231.146484375, 238.6171875, 246.087890625, 253.55859375, 261.029296875, 268.5]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 14.0, 13.0, 32.0, 33.0, 43.0, 51.0, 69.0, 100.0, 81.0, 108.0, 94.0, 69.0, 67.0, 60.0, 43.0, 40.0, 25.0, 18.0, 12.0, 13.0, 1.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.5, -20.8583984375, -20.216796875, -19.5751953125, -18.93359375, -18.2919921875, -17.650390625, -17.0087890625, -16.3671875, -15.7255859375, -15.083984375, -14.4423828125, -13.80078125, -13.1591796875, -12.517578125, -11.8759765625, -11.234375, -10.5927734375, -9.951171875, -9.3095703125, -8.66796875, -8.0263671875, -7.384765625, -6.7431640625, -6.1015625, -5.4599609375, -4.818359375, -4.1767578125, -3.53515625, -2.8935546875, -2.251953125, -1.6103515625, -0.96875, -0.3271484375, 0.314453125, 0.9560546875, 1.59765625, 2.2392578125, 2.880859375, 3.5224609375, 4.1640625, 4.8056640625, 5.447265625, 6.0888671875, 6.73046875, 7.3720703125, 8.013671875, 8.6552734375, 9.296875, 9.9384765625, 10.580078125, 11.2216796875, 11.86328125, 12.5048828125, 13.146484375, 13.7880859375, 14.4296875, 15.0712890625, 15.712890625, 16.3544921875, 16.99609375, 17.6376953125, 18.279296875, 18.9208984375, 19.5625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 2.0, 9.0, 6.0, 9.0, 19.0, 11.0, 13.0, 20.0, 30.0, 44.0, 76.0, 137.0, 245.0, 429.0, 869.0, 1857.0, 4501.0, 11988.0, 38718.0, 180997.0, 3156470.0, 673631.0, 87048.0, 22948.0, 8061.0, 3177.0, 1372.0, 712.0, 327.0, 200.0, 108.0, 75.0, 52.0, 38.0, 14.0, 12.0, 12.0, 6.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-89.25, -86.52734375, -83.8046875, -81.08203125, -78.359375, -75.63671875, -72.9140625, -70.19140625, -67.46875, -64.74609375, -62.0234375, -59.30078125, -56.578125, -53.85546875, -51.1328125, -48.41015625, -45.6875, -42.96484375, -40.2421875, -37.51953125, -34.796875, -32.07421875, -29.3515625, -26.62890625, -23.90625, -21.18359375, -18.4609375, -15.73828125, -13.015625, -10.29296875, -7.5703125, -4.84765625, -2.125, 0.59765625, 3.3203125, 6.04296875, 8.765625, 11.48828125, 14.2109375, 16.93359375, 19.65625, 22.37890625, 25.1015625, 27.82421875, 30.546875, 33.26953125, 35.9921875, 38.71484375, 41.4375, 44.16015625, 46.8828125, 49.60546875, 52.328125, 55.05078125, 57.7734375, 60.49609375, 63.21875, 65.94140625, 68.6640625, 71.38671875, 74.109375, 76.83203125, 79.5546875, 82.27734375, 85.0]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 11.0, 8.0, 9.0, 7.0, 16.0, 22.0, 35.0, 35.0, 60.0, 91.0, 131.0, 183.0, 346.0, 1027.0, 1036.0, 350.0, 206.0, 128.0, 90.0, 63.0, 41.0, 26.0, 27.0, 26.0, 19.0, 17.0, 9.0, 4.0, 7.0, 9.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.21875, -18.507080078125, -17.79541015625, -17.083740234375, -16.3720703125, -15.660400390625, -14.94873046875, -14.237060546875, -13.525390625, -12.813720703125, -12.10205078125, -11.390380859375, -10.6787109375, -9.967041015625, -9.25537109375, -8.543701171875, -7.83203125, -7.120361328125, -6.40869140625, -5.697021484375, -4.9853515625, -4.273681640625, -3.56201171875, -2.850341796875, -2.138671875, -1.427001953125, -0.71533203125, -0.003662109375, 0.7080078125, 1.419677734375, 2.13134765625, 2.843017578125, 3.5546875, 4.266357421875, 4.97802734375, 5.689697265625, 6.4013671875, 7.113037109375, 7.82470703125, 8.536376953125, 9.248046875, 9.959716796875, 10.67138671875, 11.383056640625, 12.0947265625, 12.806396484375, 13.51806640625, 14.229736328125, 14.94140625, 15.653076171875, 16.36474609375, 17.076416015625, 17.7880859375, 18.499755859375, 19.21142578125, 19.923095703125, 20.634765625, 21.346435546875, 22.05810546875, 22.769775390625, 23.4814453125, 24.193115234375, 24.90478515625, 25.616455078125, 26.328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 25.0, 45.0, 50.0, 79.0, 121.0, 123.0, 127.0, 92.0, 94.0, 65.0, 52.0, 30.0, 29.0, 10.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-174.47479248046875, -167.94744873046875, -161.42010498046875, -154.8927459716797, -148.3654022216797, -141.8380584716797, -135.3107147216797, -128.78335571289062, -122.25601196289062, -115.72866821289062, -109.2013168334961, -102.6739730834961, -96.14662170410156, -89.61927795410156, -83.09193420410156, -76.56458282470703, -70.03723907470703, -63.509891510009766, -56.9825439453125, -50.4552001953125, -43.92784881591797, -37.40050506591797, -30.873157501220703, -24.345809936523438, -17.818462371826172, -11.291114807128906, -4.763768196105957, 1.7635784149169922, 8.290925979614258, 14.81827163696289, 21.345619201660156, 27.872966766357422, 34.40031433105469, 40.92766189575195, 47.45500946044922, 53.98235321044922, 60.50970458984375, 67.03704833984375, 73.56439208984375, 80.09174346923828, 86.61909484863281, 93.14643859863281, 99.67378997802734, 106.20113372802734, 112.72848510742188, 119.25582885742188, 125.78317260742188, 132.31051635742188, 138.83786010742188, 145.36520385742188, 151.89254760742188, 158.41990661621094, 164.94725036621094, 171.47459411621094, 178.00193786621094, 184.529296875, 191.056640625, 197.583984375, 204.111328125, 210.63868713378906, 217.16603088378906, 223.69337463378906, 230.22071838378906, 236.74807739257812, 243.27542114257812]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 5.0, 9.0, 6.0, 9.0, 10.0, 19.0, 19.0, 24.0, 28.0, 28.0, 44.0, 31.0, 41.0, 46.0, 56.0, 61.0, 52.0, 43.0, 49.0, 45.0, 51.0, 33.0, 37.0, 36.0, 29.0, 29.0, 33.0, 25.0, 19.0, 17.0, 12.0, 15.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-113.060546875, -109.63899230957031, -106.21743774414062, -102.79588317871094, -99.37432861328125, -95.95277404785156, -92.5312271118164, -89.10967254638672, -85.68811798095703, -82.26656341552734, -78.84500885009766, -75.42345428466797, -72.00190734863281, -68.58035278320312, -65.15879821777344, -61.73724365234375, -58.31568908691406, -54.894134521484375, -51.47257995605469, -48.051029205322266, -44.62947463989258, -41.20792007446289, -37.78636932373047, -34.36481475830078, -30.943260192871094, -27.521705627441406, -24.10015296936035, -20.678600311279297, -17.25704574584961, -13.835491180419922, -10.413938522338867, -6.9923858642578125, -3.570831298828125, -0.1492776870727539, 3.272275924682617, 6.693829536437988, 10.11538314819336, 13.536937713623047, 16.9584903717041, 20.380043029785156, 23.801597595214844, 27.22315216064453, 30.644704818725586, 34.06625747680664, 37.48781204223633, 40.909366607666016, 44.33091735839844, 47.752471923828125, 51.17402648925781, 54.5955810546875, 58.01713562011719, 61.43868637084961, 64.86024475097656, 68.28179931640625, 71.7033462524414, 75.1249008178711, 78.54645538330078, 81.96800994873047, 85.38956451416016, 88.81111907958984, 92.232666015625, 95.65422058105469, 99.07577514648438, 102.49732971191406, 105.91888427734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 12.0, 19.0, 13.0, 29.0, 33.0, 42.0, 49.0, 74.0, 109.0, 193.0, 281.0, 503.0, 973.0, 1964.0, 4976.0, 15934.0, 65921.0, 330861.0, 486440.0, 104416.0, 23462.0, 6903.0, 2573.0, 1154.0, 609.0, 331.0, 228.0, 130.0, 100.0, 51.0, 44.0, 33.0, 27.0, 15.0, 11.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-134.75, -130.6845703125, -126.619140625, -122.5537109375, -118.48828125, -114.4228515625, -110.357421875, -106.2919921875, -102.2265625, -98.1611328125, -94.095703125, -90.0302734375, -85.96484375, -81.8994140625, -77.833984375, -73.7685546875, -69.703125, -65.6376953125, -61.572265625, -57.5068359375, -53.44140625, -49.3759765625, -45.310546875, -41.2451171875, -37.1796875, -33.1142578125, -29.048828125, -24.9833984375, -20.91796875, -16.8525390625, -12.787109375, -8.7216796875, -4.65625, -0.5908203125, 3.474609375, 7.5400390625, 11.60546875, 15.6708984375, 19.736328125, 23.8017578125, 27.8671875, 31.9326171875, 35.998046875, 40.0634765625, 44.12890625, 48.1943359375, 52.259765625, 56.3251953125, 60.390625, 64.4560546875, 68.521484375, 72.5869140625, 76.65234375, 80.7177734375, 84.783203125, 88.8486328125, 92.9140625, 96.9794921875, 101.044921875, 105.1103515625, 109.17578125, 113.2412109375, 117.306640625, 121.3720703125, 125.4375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 13.0, 14.0, 17.0, 25.0, 30.0, 31.0, 53.0, 72.0, 88.0, 80.0, 89.0, 86.0, 102.0, 76.0, 61.0, 41.0, 36.0, 21.0, 29.0, 14.0, 10.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.796875, -21.151123046875, -20.50537109375, -19.859619140625, -19.2138671875, -18.568115234375, -17.92236328125, -17.276611328125, -16.630859375, -15.985107421875, -15.33935546875, -14.693603515625, -14.0478515625, -13.402099609375, -12.75634765625, -12.110595703125, -11.46484375, -10.819091796875, -10.17333984375, -9.527587890625, -8.8818359375, -8.236083984375, -7.59033203125, -6.944580078125, -6.298828125, -5.653076171875, -5.00732421875, -4.361572265625, -3.7158203125, -3.070068359375, -2.42431640625, -1.778564453125, -1.1328125, -0.487060546875, 0.15869140625, 0.804443359375, 1.4501953125, 2.095947265625, 2.74169921875, 3.387451171875, 4.033203125, 4.678955078125, 5.32470703125, 5.970458984375, 6.6162109375, 7.261962890625, 7.90771484375, 8.553466796875, 9.19921875, 9.844970703125, 10.49072265625, 11.136474609375, 11.7822265625, 12.427978515625, 13.07373046875, 13.719482421875, 14.365234375, 15.010986328125, 15.65673828125, 16.302490234375, 16.9482421875, 17.593994140625, 18.23974609375, 18.885498046875, 19.53125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 15.0, 14.0, 17.0, 23.0, 32.0, 47.0, 53.0, 50.0, 91.0, 119.0, 157.0, 198.0, 300.0, 488.0, 679.0, 1117.0, 1952.0, 3620.0, 7470.0, 15955.0, 35230.0, 81191.0, 184184.0, 327392.0, 214350.0, 95256.0, 41452.0, 18349.0, 8520.0, 4206.0, 2262.0, 1226.0, 802.0, 471.0, 352.0, 232.0, 163.0, 129.0, 108.0, 59.0, 53.0, 43.0, 23.0, 22.0, 18.0, 20.0, 14.0, 5.0, 7.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-43.96875, -42.5771484375, -41.185546875, -39.7939453125, -38.40234375, -37.0107421875, -35.619140625, -34.2275390625, -32.8359375, -31.4443359375, -30.052734375, -28.6611328125, -27.26953125, -25.8779296875, -24.486328125, -23.0947265625, -21.703125, -20.3115234375, -18.919921875, -17.5283203125, -16.13671875, -14.7451171875, -13.353515625, -11.9619140625, -10.5703125, -9.1787109375, -7.787109375, -6.3955078125, -5.00390625, -3.6123046875, -2.220703125, -0.8291015625, 0.5625, 1.9541015625, 3.345703125, 4.7373046875, 6.12890625, 7.5205078125, 8.912109375, 10.3037109375, 11.6953125, 13.0869140625, 14.478515625, 15.8701171875, 17.26171875, 18.6533203125, 20.044921875, 21.4365234375, 22.828125, 24.2197265625, 25.611328125, 27.0029296875, 28.39453125, 29.7861328125, 31.177734375, 32.5693359375, 33.9609375, 35.3525390625, 36.744140625, 38.1357421875, 39.52734375, 40.9189453125, 42.310546875, 43.7021484375, 45.09375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 9.0, 13.0, 6.0, 9.0, 12.0, 12.0, 20.0, 22.0, 22.0, 20.0, 24.0, 19.0, 35.0, 38.0, 37.0, 39.0, 44.0, 35.0, 62.0, 44.0, 37.0, 37.0, 35.0, 40.0, 27.0, 31.0, 36.0, 27.0, 27.0, 25.0, 29.0, 21.0, 14.0, 12.0, 15.0, 9.0, 9.0, 10.0, 10.0, 9.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0], "bins": [-43.6875, -42.39794921875, -41.1083984375, -39.81884765625, -38.529296875, -37.23974609375, -35.9501953125, -34.66064453125, -33.37109375, -32.08154296875, -30.7919921875, -29.50244140625, -28.212890625, -26.92333984375, -25.6337890625, -24.34423828125, -23.0546875, -21.76513671875, -20.4755859375, -19.18603515625, -17.896484375, -16.60693359375, -15.3173828125, -14.02783203125, -12.73828125, -11.44873046875, -10.1591796875, -8.86962890625, -7.580078125, -6.29052734375, -5.0009765625, -3.71142578125, -2.421875, -1.13232421875, 0.1572265625, 1.44677734375, 2.736328125, 4.02587890625, 5.3154296875, 6.60498046875, 7.89453125, 9.18408203125, 10.4736328125, 11.76318359375, 13.052734375, 14.34228515625, 15.6318359375, 16.92138671875, 18.2109375, 19.50048828125, 20.7900390625, 22.07958984375, 23.369140625, 24.65869140625, 25.9482421875, 27.23779296875, 28.52734375, 29.81689453125, 31.1064453125, 32.39599609375, 33.685546875, 34.97509765625, 36.2646484375, 37.55419921875, 38.84375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 26.0, 28.0, 44.0, 69.0, 154.0, 262.0, 551.0, 1308.0, 3106.0, 8829.0, 29028.0, 115661.0, 416514.0, 348925.0, 88900.0, 23030.0, 7278.0, 2641.0, 1171.0, 477.0, 280.0, 117.0, 59.0, 34.0, 15.0, 14.0, 14.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.34375, -25.36474609375, -24.3857421875, -23.40673828125, -22.427734375, -21.44873046875, -20.4697265625, -19.49072265625, -18.51171875, -17.53271484375, -16.5537109375, -15.57470703125, -14.595703125, -13.61669921875, -12.6376953125, -11.65869140625, -10.6796875, -9.70068359375, -8.7216796875, -7.74267578125, -6.763671875, -5.78466796875, -4.8056640625, -3.82666015625, -2.84765625, -1.86865234375, -0.8896484375, 0.08935546875, 1.068359375, 2.04736328125, 3.0263671875, 4.00537109375, 4.984375, 5.96337890625, 6.9423828125, 7.92138671875, 8.900390625, 9.87939453125, 10.8583984375, 11.83740234375, 12.81640625, 13.79541015625, 14.7744140625, 15.75341796875, 16.732421875, 17.71142578125, 18.6904296875, 19.66943359375, 20.6484375, 21.62744140625, 22.6064453125, 23.58544921875, 24.564453125, 25.54345703125, 26.5224609375, 27.50146484375, 28.48046875, 29.45947265625, 30.4384765625, 31.41748046875, 32.396484375, 33.37548828125, 34.3544921875, 35.33349609375, 36.3125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 20.0, 15.0, 29.0, 31.0, 30.0, 64.0, 72.0, 141.0, 141.0, 119.0, 76.0, 53.0, 36.0, 29.0, 30.0, 15.0, 20.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.004067182540893555, -0.003907680511474609, -0.003748178482055664, -0.0035886764526367188, -0.0034291744232177734, -0.003269672393798828, -0.003110170364379883, -0.0029506683349609375, -0.002791166305541992, -0.002631664276123047, -0.0024721622467041016, -0.0023126602172851562, -0.002153158187866211, -0.0019936561584472656, -0.0018341541290283203, -0.001674652099609375, -0.0015151500701904297, -0.0013556480407714844, -0.001196146011352539, -0.0010366439819335938, -0.0008771419525146484, -0.0007176399230957031, -0.0005581378936767578, -0.0003986358642578125, -0.0002391338348388672, -7.963180541992188e-05, 7.987022399902344e-05, 0.00023937225341796875, 0.00039887428283691406, 0.0005583763122558594, 0.0007178783416748047, 0.00087738037109375, 0.0010368824005126953, 0.0011963844299316406, 0.001355886459350586, 0.0015153884887695312, 0.0016748905181884766, 0.0018343925476074219, 0.001993894577026367, 0.0021533966064453125, 0.002312898635864258, 0.002472400665283203, 0.0026319026947021484, 0.0027914047241210938, 0.002950906753540039, 0.0031104087829589844, 0.0032699108123779297, 0.003429412841796875, 0.0035889148712158203, 0.0037484169006347656, 0.003907918930053711, 0.004067420959472656, 0.0042269229888916016, 0.004386425018310547, 0.004545927047729492, 0.0047054290771484375, 0.004864931106567383, 0.005024433135986328, 0.0051839351654052734, 0.005343437194824219, 0.005502939224243164, 0.005662441253662109, 0.005821943283081055, 0.0059814453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 9.0, 14.0, 15.0, 33.0, 33.0, 71.0, 117.0, 208.0, 333.0, 684.0, 1467.0, 3719.0, 10385.0, 37095.0, 161655.0, 497249.0, 254508.0, 57148.0, 15175.0, 4819.0, 1873.0, 876.0, 461.0, 238.0, 128.0, 83.0, 56.0, 31.0, 30.0, 8.0, 14.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.3125, -35.32177734375, -34.3310546875, -33.34033203125, -32.349609375, -31.35888671875, -30.3681640625, -29.37744140625, -28.38671875, -27.39599609375, -26.4052734375, -25.41455078125, -24.423828125, -23.43310546875, -22.4423828125, -21.45166015625, -20.4609375, -19.47021484375, -18.4794921875, -17.48876953125, -16.498046875, -15.50732421875, -14.5166015625, -13.52587890625, -12.53515625, -11.54443359375, -10.5537109375, -9.56298828125, -8.572265625, -7.58154296875, -6.5908203125, -5.60009765625, -4.609375, -3.61865234375, -2.6279296875, -1.63720703125, -0.646484375, 0.34423828125, 1.3349609375, 2.32568359375, 3.31640625, 4.30712890625, 5.2978515625, 6.28857421875, 7.279296875, 8.27001953125, 9.2607421875, 10.25146484375, 11.2421875, 12.23291015625, 13.2236328125, 14.21435546875, 15.205078125, 16.19580078125, 17.1865234375, 18.17724609375, 19.16796875, 20.15869140625, 21.1494140625, 22.14013671875, 23.130859375, 24.12158203125, 25.1123046875, 26.10302734375, 27.09375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 8.0, 15.0, 14.0, 23.0, 32.0, 34.0, 46.0, 44.0, 56.0, 55.0, 69.0, 67.0, 67.0, 59.0, 57.0, 57.0, 53.0, 49.0, 32.0, 26.0, 21.0, 14.0, 12.0, 11.0, 9.0, 5.0, 7.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.471435546875, -17.91162109375, -17.351806640625, -16.7919921875, -16.232177734375, -15.67236328125, -15.112548828125, -14.552734375, -13.992919921875, -13.43310546875, -12.873291015625, -12.3134765625, -11.753662109375, -11.19384765625, -10.634033203125, -10.07421875, -9.514404296875, -8.95458984375, -8.394775390625, -7.8349609375, -7.275146484375, -6.71533203125, -6.155517578125, -5.595703125, -5.035888671875, -4.47607421875, -3.916259765625, -3.3564453125, -2.796630859375, -2.23681640625, -1.677001953125, -1.1171875, -0.557373046875, 0.00244140625, 0.562255859375, 1.1220703125, 1.681884765625, 2.24169921875, 2.801513671875, 3.361328125, 3.921142578125, 4.48095703125, 5.040771484375, 5.6005859375, 6.160400390625, 6.72021484375, 7.280029296875, 7.83984375, 8.399658203125, 8.95947265625, 9.519287109375, 10.0791015625, 10.638916015625, 11.19873046875, 11.758544921875, 12.318359375, 12.878173828125, 13.43798828125, 13.997802734375, 14.5576171875, 15.117431640625, 15.67724609375, 16.237060546875, 16.796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 9.0, 15.0, 32.0, 34.0, 53.0, 65.0, 92.0, 112.0, 103.0, 95.0, 112.0, 82.0, 62.0, 48.0, 24.0, 24.0, 18.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-505.0211181640625, -492.9909362792969, -480.96075439453125, -468.9305419921875, -456.9003601074219, -444.87017822265625, -432.8399963378906, -420.809814453125, -408.77960205078125, -396.7494201660156, -384.71923828125, -372.68902587890625, -360.6588439941406, -348.628662109375, -336.5984802246094, -324.56829833984375, -312.5380859375, -300.5079040527344, -288.47772216796875, -276.447509765625, -264.4173278808594, -252.38714599609375, -240.35696411132812, -228.32676696777344, -216.29660034179688, -204.26641845703125, -192.23622131347656, -180.20603942871094, -168.17584228515625, -156.14566040039062, -144.115478515625, -132.0852813720703, -120.05508422851562, -108.02489471435547, -95.99470520019531, -83.96452331542969, -71.934326171875, -59.90414047241211, -47.87395477294922, -35.84376525878906, -23.813575744628906, -11.783387184143066, 0.24680137634277344, 12.276988983154297, 24.307178497314453, 36.33736801147461, 48.3675537109375, 60.397743225097656, 72.42793273925781, 84.45812225341797, 96.48831176757812, 108.51849365234375, 120.54869079589844, 132.57887268066406, 144.60906982421875, 156.63925170898438, 168.66943359375, 180.69961547851562, 192.7298126220703, 204.75999450683594, 216.79019165039062, 228.82037353515625, 240.85055541992188, 252.88075256347656, 264.91094970703125]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 7.0, 2.0, 2.0, 8.0, 8.0, 6.0, 7.0, 13.0, 15.0, 16.0, 22.0, 23.0, 24.0, 28.0, 28.0, 49.0, 43.0, 40.0, 30.0, 46.0, 56.0, 36.0, 47.0, 52.0, 44.0, 48.0, 32.0, 34.0, 38.0, 37.0, 31.0, 25.0, 28.0, 20.0, 10.0, 14.0, 13.0, 12.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.45175170898438, -184.69760131835938, -176.9434356689453, -169.1892852783203, -161.4351348876953, -153.68096923828125, -145.92681884765625, -138.17266845703125, -130.4185028076172, -122.66434478759766, -114.91019439697266, -107.15603637695312, -99.4018783569336, -91.64772033691406, -83.89356994628906, -76.13941192626953, -68.38526153564453, -60.631107330322266, -52.876949310302734, -45.12279510498047, -37.36863708496094, -29.614482879638672, -21.860328674316406, -14.106170654296875, -6.352016448974609, 1.4021391868591309, 9.156294822692871, 16.910449981689453, 24.66460609436035, 32.41876220703125, 40.172916412353516, 47.92707443237305, 55.68122863769531, 63.43538284301758, 71.18953704833984, 78.94369506835938, 86.6978530883789, 94.45201110839844, 102.20616149902344, 109.96031951904297, 117.7144775390625, 125.46863555908203, 133.22279357910156, 140.97694396972656, 148.73109436035156, 156.48526000976562, 164.23941040039062, 171.99356079101562, 179.74771118164062, 187.50186157226562, 195.2560272216797, 203.0101776123047, 210.7643280029297, 218.51849365234375, 226.27264404296875, 234.02679443359375, 241.7809600830078, 249.5351104736328, 257.2892761230469, 265.0434265136719, 272.7975769042969, 280.5517272949219, 288.305908203125, 296.06005859375, 303.814208984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 12.0, 7.0, 16.0, 25.0, 33.0, 51.0, 74.0, 103.0, 194.0, 408.0, 809.0, 2000.0, 6021.0, 27694.0, 427985.0, 3652438.0, 61417.0, 9781.0, 2902.0, 1113.0, 507.0, 229.0, 167.0, 102.0, 54.0, 29.0, 21.0, 22.0, 10.0, 11.0, 7.0, 8.0, 7.0, 10.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-169.125, -162.904296875, -156.68359375, -150.462890625, -144.2421875, -138.021484375, -131.80078125, -125.580078125, -119.359375, -113.138671875, -106.91796875, -100.697265625, -94.4765625, -88.255859375, -82.03515625, -75.814453125, -69.59375, -63.373046875, -57.15234375, -50.931640625, -44.7109375, -38.490234375, -32.26953125, -26.048828125, -19.828125, -13.607421875, -7.38671875, -1.166015625, 5.0546875, 11.275390625, 17.49609375, 23.716796875, 29.9375, 36.158203125, 42.37890625, 48.599609375, 54.8203125, 61.041015625, 67.26171875, 73.482421875, 79.703125, 85.923828125, 92.14453125, 98.365234375, 104.5859375, 110.806640625, 117.02734375, 123.248046875, 129.46875, 135.689453125, 141.91015625, 148.130859375, 154.3515625, 160.572265625, 166.79296875, 173.013671875, 179.234375, 185.455078125, 191.67578125, 197.896484375, 204.1171875, 210.337890625, 216.55859375, 222.779296875, 229.0]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 7.0, 13.0, 19.0, 23.0, 27.0, 33.0, 53.0, 76.0, 78.0, 81.0, 93.0, 91.0, 70.0, 64.0, 73.0, 48.0, 42.0, 26.0, 32.0, 13.0, 16.0, 8.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.671875, -20.0439453125, -19.416015625, -18.7880859375, -18.16015625, -17.5322265625, -16.904296875, -16.2763671875, -15.6484375, -15.0205078125, -14.392578125, -13.7646484375, -13.13671875, -12.5087890625, -11.880859375, -11.2529296875, -10.625, -9.9970703125, -9.369140625, -8.7412109375, -8.11328125, -7.4853515625, -6.857421875, -6.2294921875, -5.6015625, -4.9736328125, -4.345703125, -3.7177734375, -3.08984375, -2.4619140625, -1.833984375, -1.2060546875, -0.578125, 0.0498046875, 0.677734375, 1.3056640625, 1.93359375, 2.5615234375, 3.189453125, 3.8173828125, 4.4453125, 5.0732421875, 5.701171875, 6.3291015625, 6.95703125, 7.5849609375, 8.212890625, 8.8408203125, 9.46875, 10.0966796875, 10.724609375, 11.3525390625, 11.98046875, 12.6083984375, 13.236328125, 13.8642578125, 14.4921875, 15.1201171875, 15.748046875, 16.3759765625, 17.00390625, 17.6318359375, 18.259765625, 18.8876953125, 19.515625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 9.0, 13.0, 11.0, 29.0, 27.0, 31.0, 52.0, 51.0, 88.0, 99.0, 172.0, 236.0, 404.0, 816.0, 1963.0, 6139.0, 27001.0, 221411.0, 3587066.0, 304115.0, 33067.0, 7202.0, 2117.0, 856.0, 411.0, 251.0, 158.0, 111.0, 93.0, 61.0, 56.0, 37.0, 31.0, 15.0, 15.0, 14.0, 15.0, 15.0, 1.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.625, -126.732421875, -122.83984375, -118.947265625, -115.0546875, -111.162109375, -107.26953125, -103.376953125, -99.484375, -95.591796875, -91.69921875, -87.806640625, -83.9140625, -80.021484375, -76.12890625, -72.236328125, -68.34375, -64.451171875, -60.55859375, -56.666015625, -52.7734375, -48.880859375, -44.98828125, -41.095703125, -37.203125, -33.310546875, -29.41796875, -25.525390625, -21.6328125, -17.740234375, -13.84765625, -9.955078125, -6.0625, -2.169921875, 1.72265625, 5.615234375, 9.5078125, 13.400390625, 17.29296875, 21.185546875, 25.078125, 28.970703125, 32.86328125, 36.755859375, 40.6484375, 44.541015625, 48.43359375, 52.326171875, 56.21875, 60.111328125, 64.00390625, 67.896484375, 71.7890625, 75.681640625, 79.57421875, 83.466796875, 87.359375, 91.251953125, 95.14453125, 99.037109375, 102.9296875, 106.822265625, 110.71484375, 114.607421875, 118.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 9.0, 1.0, 22.0, 24.0, 50.0, 76.0, 234.0, 792.0, 2004.0, 494.0, 177.0, 83.0, 53.0, 26.0, 15.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.8125, -56.7373046875, -54.662109375, -52.5869140625, -50.51171875, -48.4365234375, -46.361328125, -44.2861328125, -42.2109375, -40.1357421875, -38.060546875, -35.9853515625, -33.91015625, -31.8349609375, -29.759765625, -27.6845703125, -25.609375, -23.5341796875, -21.458984375, -19.3837890625, -17.30859375, -15.2333984375, -13.158203125, -11.0830078125, -9.0078125, -6.9326171875, -4.857421875, -2.7822265625, -0.70703125, 1.3681640625, 3.443359375, 5.5185546875, 7.59375, 9.6689453125, 11.744140625, 13.8193359375, 15.89453125, 17.9697265625, 20.044921875, 22.1201171875, 24.1953125, 26.2705078125, 28.345703125, 30.4208984375, 32.49609375, 34.5712890625, 36.646484375, 38.7216796875, 40.796875, 42.8720703125, 44.947265625, 47.0224609375, 49.09765625, 51.1728515625, 53.248046875, 55.3232421875, 57.3984375, 59.4736328125, 61.548828125, 63.6240234375, 65.69921875, 67.7744140625, 69.849609375, 71.9248046875, 74.0]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 12.0, 22.0, 24.0, 42.0, 64.0, 89.0, 116.0, 114.0, 122.0, 106.0, 92.0, 67.0, 49.0, 34.0, 18.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-282.52789306640625, -274.9053039550781, -267.28271484375, -259.6601257324219, -252.0375518798828, -244.4149627685547, -236.79237365722656, -229.16978454589844, -221.54721069335938, -213.92462158203125, -206.30203247070312, -198.679443359375, -191.05686950683594, -183.4342803955078, -175.8116912841797, -168.18910217285156, -160.56651306152344, -152.9439239501953, -145.3213348388672, -137.69876098632812, -130.076171875, -122.45358276367188, -114.83099365234375, -107.20840454101562, -99.58582305908203, -91.9632339477539, -84.34065246582031, -76.71806335449219, -69.09547424316406, -61.47289276123047, -53.850303649902344, -46.227718353271484, -38.60511779785156, -30.982532501220703, -23.35994529724121, -15.737358093261719, -8.11477279663086, -0.4921875, 7.130401611328125, 14.752986907958984, 22.375572204589844, 29.998157501220703, 37.62074279785156, 45.24333190917969, 52.86591720581055, 60.488502502441406, 68.11109161376953, 75.73367309570312, 83.35626220703125, 90.97885131835938, 98.60143280029297, 106.2240219116211, 113.84660339355469, 121.46919250488281, 129.09178161621094, 136.71437072753906, 144.33694458007812, 151.95953369140625, 159.58212280273438, 167.2047119140625, 174.82728576660156, 182.4498748779297, 190.0724639892578, 197.69505310058594, 205.31764221191406]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 12.0, 14.0, 12.0, 20.0, 28.0, 30.0, 33.0, 39.0, 44.0, 52.0, 68.0, 54.0, 42.0, 60.0, 68.0, 54.0, 62.0, 50.0, 43.0, 45.0, 29.0, 25.0, 31.0, 19.0, 13.0, 16.0, 7.0, 9.0, 4.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.14976501464844, -134.23031616210938, -129.3108673095703, -124.39141845703125, -119.47196960449219, -114.55252075195312, -109.63307189941406, -104.713623046875, -99.79417419433594, -94.87472534179688, -89.95527648925781, -85.03582763671875, -80.11637878417969, -75.19692993164062, -70.27748107910156, -65.3580322265625, -60.43858337402344, -55.519134521484375, -50.59968566894531, -45.68023681640625, -40.76078796386719, -35.841339111328125, -30.921890258789062, -26.00244140625, -21.082992553710938, -16.163543701171875, -11.244094848632812, -6.32464599609375, -1.4051971435546875, 3.514251708984375, 8.433700561523438, 13.3531494140625, 18.2725830078125, 23.192031860351562, 28.111480712890625, 33.03092956542969, 37.95037841796875, 42.86982727050781, 47.789276123046875, 52.70872497558594, 57.628173828125, 62.54762268066406, 67.46707153320312, 72.38652038574219, 77.30596923828125, 82.22541809082031, 87.14486694335938, 92.06431579589844, 96.9837646484375, 101.90321350097656, 106.82266235351562, 111.74211120605469, 116.66156005859375, 121.58100891113281, 126.50045776367188, 131.41990661621094, 136.33935546875, 141.25880432128906, 146.17825317382812, 151.0977020263672, 156.01715087890625, 160.9365997314453, 165.85604858398438, 170.77549743652344, 175.6949462890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 2.0, 1.0, 7.0, 11.0, 7.0, 27.0, 35.0, 45.0, 61.0, 95.0, 156.0, 294.0, 534.0, 1260.0, 3314.0, 12827.0, 74864.0, 702069.0, 215996.0, 27249.0, 6035.0, 1869.0, 827.0, 397.0, 208.0, 135.0, 94.0, 33.0, 29.0, 24.0, 8.0, 6.0, 11.0, 6.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.875, -140.615234375, -135.35546875, -130.095703125, -124.8359375, -119.576171875, -114.31640625, -109.056640625, -103.796875, -98.537109375, -93.27734375, -88.017578125, -82.7578125, -77.498046875, -72.23828125, -66.978515625, -61.71875, -56.458984375, -51.19921875, -45.939453125, -40.6796875, -35.419921875, -30.16015625, -24.900390625, -19.640625, -14.380859375, -9.12109375, -3.861328125, 1.3984375, 6.658203125, 11.91796875, 17.177734375, 22.4375, 27.697265625, 32.95703125, 38.216796875, 43.4765625, 48.736328125, 53.99609375, 59.255859375, 64.515625, 69.775390625, 75.03515625, 80.294921875, 85.5546875, 90.814453125, 96.07421875, 101.333984375, 106.59375, 111.853515625, 117.11328125, 122.373046875, 127.6328125, 132.892578125, 138.15234375, 143.412109375, 148.671875, 153.931640625, 159.19140625, 164.451171875, 169.7109375, 174.970703125, 180.23046875, 185.490234375, 190.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 10.0, 6.0, 23.0, 25.0, 25.0, 56.0, 66.0, 91.0, 73.0, 84.0, 100.0, 91.0, 63.0, 72.0, 52.0, 53.0, 34.0, 24.0, 16.0, 14.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.140625, -21.455078125, -20.76953125, -20.083984375, -19.3984375, -18.712890625, -18.02734375, -17.341796875, -16.65625, -15.970703125, -15.28515625, -14.599609375, -13.9140625, -13.228515625, -12.54296875, -11.857421875, -11.171875, -10.486328125, -9.80078125, -9.115234375, -8.4296875, -7.744140625, -7.05859375, -6.373046875, -5.6875, -5.001953125, -4.31640625, -3.630859375, -2.9453125, -2.259765625, -1.57421875, -0.888671875, -0.203125, 0.482421875, 1.16796875, 1.853515625, 2.5390625, 3.224609375, 3.91015625, 4.595703125, 5.28125, 5.966796875, 6.65234375, 7.337890625, 8.0234375, 8.708984375, 9.39453125, 10.080078125, 10.765625, 11.451171875, 12.13671875, 12.822265625, 13.5078125, 14.193359375, 14.87890625, 15.564453125, 16.25, 16.935546875, 17.62109375, 18.306640625, 18.9921875, 19.677734375, 20.36328125, 21.048828125, 21.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 5.0, 9.0, 14.0, 12.0, 26.0, 29.0, 39.0, 52.0, 68.0, 130.0, 151.0, 201.0, 296.0, 488.0, 762.0, 1426.0, 3002.0, 7243.0, 19648.0, 56119.0, 176815.0, 492100.0, 193624.0, 60424.0, 20890.0, 7869.0, 3161.0, 1535.0, 895.0, 482.0, 303.0, 221.0, 137.0, 101.0, 68.0, 55.0, 44.0, 27.0, 19.0, 21.0, 17.0, 9.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-60.8125, -58.943359375, -57.07421875, -55.205078125, -53.3359375, -51.466796875, -49.59765625, -47.728515625, -45.859375, -43.990234375, -42.12109375, -40.251953125, -38.3828125, -36.513671875, -34.64453125, -32.775390625, -30.90625, -29.037109375, -27.16796875, -25.298828125, -23.4296875, -21.560546875, -19.69140625, -17.822265625, -15.953125, -14.083984375, -12.21484375, -10.345703125, -8.4765625, -6.607421875, -4.73828125, -2.869140625, -1.0, 0.869140625, 2.73828125, 4.607421875, 6.4765625, 8.345703125, 10.21484375, 12.083984375, 13.953125, 15.822265625, 17.69140625, 19.560546875, 21.4296875, 23.298828125, 25.16796875, 27.037109375, 28.90625, 30.775390625, 32.64453125, 34.513671875, 36.3828125, 38.251953125, 40.12109375, 41.990234375, 43.859375, 45.728515625, 47.59765625, 49.466796875, 51.3359375, 53.205078125, 55.07421875, 56.943359375, 58.8125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 10.0, 8.0, 13.0, 15.0, 11.0, 16.0, 26.0, 22.0, 19.0, 32.0, 32.0, 40.0, 49.0, 37.0, 53.0, 43.0, 45.0, 51.0, 45.0, 58.0, 43.0, 40.0, 34.0, 33.0, 28.0, 30.0, 25.0, 26.0, 25.0, 22.0, 20.0, 11.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.56982421875, -41.0146484375, -39.45947265625, -37.904296875, -36.34912109375, -34.7939453125, -33.23876953125, -31.68359375, -30.12841796875, -28.5732421875, -27.01806640625, -25.462890625, -23.90771484375, -22.3525390625, -20.79736328125, -19.2421875, -17.68701171875, -16.1318359375, -14.57666015625, -13.021484375, -11.46630859375, -9.9111328125, -8.35595703125, -6.80078125, -5.24560546875, -3.6904296875, -2.13525390625, -0.580078125, 0.97509765625, 2.5302734375, 4.08544921875, 5.640625, 7.19580078125, 8.7509765625, 10.30615234375, 11.861328125, 13.41650390625, 14.9716796875, 16.52685546875, 18.08203125, 19.63720703125, 21.1923828125, 22.74755859375, 24.302734375, 25.85791015625, 27.4130859375, 28.96826171875, 30.5234375, 32.07861328125, 33.6337890625, 35.18896484375, 36.744140625, 38.29931640625, 39.8544921875, 41.40966796875, 42.96484375, 44.52001953125, 46.0751953125, 47.63037109375, 49.185546875, 50.74072265625, 52.2958984375, 53.85107421875, 55.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 8.0, 5.0, 12.0, 18.0, 32.0, 53.0, 79.0, 88.0, 188.0, 363.0, 808.0, 2150.0, 7335.0, 30634.0, 184535.0, 620785.0, 163534.0, 27562.0, 6629.0, 2052.0, 855.0, 368.0, 184.0, 98.0, 75.0, 32.0, 18.0, 14.0, 10.0, 9.0, 4.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.968017578125, -29.95166015625, -28.935302734375, -27.9189453125, -26.902587890625, -25.88623046875, -24.869873046875, -23.853515625, -22.837158203125, -21.82080078125, -20.804443359375, -19.7880859375, -18.771728515625, -17.75537109375, -16.739013671875, -15.72265625, -14.706298828125, -13.68994140625, -12.673583984375, -11.6572265625, -10.640869140625, -9.62451171875, -8.608154296875, -7.591796875, -6.575439453125, -5.55908203125, -4.542724609375, -3.5263671875, -2.510009765625, -1.49365234375, -0.477294921875, 0.5390625, 1.555419921875, 2.57177734375, 3.588134765625, 4.6044921875, 5.620849609375, 6.63720703125, 7.653564453125, 8.669921875, 9.686279296875, 10.70263671875, 11.718994140625, 12.7353515625, 13.751708984375, 14.76806640625, 15.784423828125, 16.80078125, 17.817138671875, 18.83349609375, 19.849853515625, 20.8662109375, 21.882568359375, 22.89892578125, 23.915283203125, 24.931640625, 25.947998046875, 26.96435546875, 27.980712890625, 28.9970703125, 30.013427734375, 31.02978515625, 32.046142578125, 33.0625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 3.0, 14.0, 6.0, 15.0, 18.0, 35.0, 31.0, 52.0, 114.0, 190.0, 201.0, 103.0, 62.0, 30.0, 30.0, 18.0, 13.0, 19.0, 5.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0072479248046875, -0.007052063941955566, -0.006856203079223633, -0.006660342216491699, -0.006464481353759766, -0.006268620491027832, -0.0060727596282958984, -0.005876898765563965, -0.005681037902832031, -0.005485177040100098, -0.005289316177368164, -0.0050934553146362305, -0.004897594451904297, -0.004701733589172363, -0.00450587272644043, -0.004310011863708496, -0.0041141510009765625, -0.003918290138244629, -0.0037224292755126953, -0.0035265684127807617, -0.003330707550048828, -0.0031348466873168945, -0.002938985824584961, -0.0027431249618530273, -0.0025472640991210938, -0.00235140323638916, -0.0021555423736572266, -0.001959681510925293, -0.0017638206481933594, -0.0015679597854614258, -0.0013720989227294922, -0.0011762380599975586, -0.000980377197265625, -0.0007845163345336914, -0.0005886554718017578, -0.0003927946090698242, -0.00019693374633789062, -1.0728836059570312e-06, 0.00019478797912597656, 0.00039064884185791016, 0.0005865097045898438, 0.0007823705673217773, 0.000978231430053711, 0.0011740922927856445, 0.0013699531555175781, 0.0015658140182495117, 0.0017616748809814453, 0.001957535743713379, 0.0021533966064453125, 0.002349257469177246, 0.0025451183319091797, 0.0027409791946411133, 0.002936840057373047, 0.0031327009201049805, 0.003328561782836914, 0.0035244226455688477, 0.0037202835083007812, 0.003916144371032715, 0.0041120052337646484, 0.004307866096496582, 0.004503726959228516, 0.004699587821960449, 0.004895448684692383, 0.005091309547424316, 0.00528717041015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 10.0, 14.0, 16.0, 34.0, 49.0, 70.0, 117.0, 216.0, 344.0, 659.0, 1608.0, 4758.0, 17521.0, 81292.0, 549930.0, 326745.0, 47988.0, 11262.0, 3221.0, 1338.0, 557.0, 318.0, 167.0, 105.0, 81.0, 36.0, 21.0, 13.0, 14.0, 7.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.09375, -33.115234375, -32.13671875, -31.158203125, -30.1796875, -29.201171875, -28.22265625, -27.244140625, -26.265625, -25.287109375, -24.30859375, -23.330078125, -22.3515625, -21.373046875, -20.39453125, -19.416015625, -18.4375, -17.458984375, -16.48046875, -15.501953125, -14.5234375, -13.544921875, -12.56640625, -11.587890625, -10.609375, -9.630859375, -8.65234375, -7.673828125, -6.6953125, -5.716796875, -4.73828125, -3.759765625, -2.78125, -1.802734375, -0.82421875, 0.154296875, 1.1328125, 2.111328125, 3.08984375, 4.068359375, 5.046875, 6.025390625, 7.00390625, 7.982421875, 8.9609375, 9.939453125, 10.91796875, 11.896484375, 12.875, 13.853515625, 14.83203125, 15.810546875, 16.7890625, 17.767578125, 18.74609375, 19.724609375, 20.703125, 21.681640625, 22.66015625, 23.638671875, 24.6171875, 25.595703125, 26.57421875, 27.552734375, 28.53125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 7.0, 11.0, 5.0, 12.0, 12.0, 9.0, 19.0, 25.0, 42.0, 45.0, 73.0, 88.0, 144.0, 115.0, 107.0, 89.0, 45.0, 28.0, 35.0, 28.0, 12.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.760009765625, -18.11376953125, -17.467529296875, -16.8212890625, -16.175048828125, -15.52880859375, -14.882568359375, -14.236328125, -13.590087890625, -12.94384765625, -12.297607421875, -11.6513671875, -11.005126953125, -10.35888671875, -9.712646484375, -9.06640625, -8.420166015625, -7.77392578125, -7.127685546875, -6.4814453125, -5.835205078125, -5.18896484375, -4.542724609375, -3.896484375, -3.250244140625, -2.60400390625, -1.957763671875, -1.3115234375, -0.665283203125, -0.01904296875, 0.627197265625, 1.2734375, 1.919677734375, 2.56591796875, 3.212158203125, 3.8583984375, 4.504638671875, 5.15087890625, 5.797119140625, 6.443359375, 7.089599609375, 7.73583984375, 8.382080078125, 9.0283203125, 9.674560546875, 10.32080078125, 10.967041015625, 11.61328125, 12.259521484375, 12.90576171875, 13.552001953125, 14.1982421875, 14.844482421875, 15.49072265625, 16.136962890625, 16.783203125, 17.429443359375, 18.07568359375, 18.721923828125, 19.3681640625, 20.014404296875, 20.66064453125, 21.306884765625, 21.953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 7.0, 15.0, 36.0, 60.0, 105.0, 137.0, 187.0, 167.0, 100.0, 76.0, 56.0, 24.0, 17.0, 8.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-635.1976928710938, -617.8590698242188, -600.5204467773438, -583.1817626953125, -565.8431396484375, -548.5045166015625, -531.1658935546875, -513.8272705078125, -496.4886169433594, -479.1499938964844, -461.81134033203125, -444.47271728515625, -427.13409423828125, -409.7954406738281, -392.4568176269531, -375.1181640625, -357.779541015625, -340.44091796875, -323.1022644042969, -305.7636413574219, -288.42498779296875, -271.08636474609375, -253.74774169921875, -236.4091033935547, -219.07046508789062, -201.73182678222656, -184.3931884765625, -167.0545654296875, -149.71592712402344, -132.37728881835938, -115.03865814208984, -97.70002746582031, -80.36138916015625, -63.02275466918945, -45.684120178222656, -28.34548568725586, -11.006851196289062, 6.331787109375, 23.67041778564453, 41.00904846191406, 58.347686767578125, 75.68632507324219, 93.02495574951172, 110.36358642578125, 127.70222473144531, 145.04086303710938, 162.37948608398438, 179.71812438964844, 197.0567626953125, 214.39540100097656, 231.73403930664062, 249.07266235351562, 266.41131591796875, 283.74993896484375, 301.08856201171875, 318.42718505859375, 335.7658386230469, 353.1044616699219, 370.443115234375, 387.78173828125, 405.120361328125, 422.4590148925781, 439.7976379394531, 457.13629150390625, 474.47491455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 10.0, 11.0, 12.0, 13.0, 15.0, 22.0, 20.0, 23.0, 36.0, 24.0, 31.0, 23.0, 38.0, 35.0, 45.0, 47.0, 54.0, 32.0, 47.0, 37.0, 39.0, 47.0, 27.0, 38.0, 31.0, 28.0, 43.0, 18.0, 25.0, 13.0, 15.0, 15.0, 10.0, 14.0, 8.0, 10.0, 12.0, 4.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.2005615234375, -192.03567504882812, -184.8707733154297, -177.7058868408203, -170.54100036621094, -163.3760986328125, -156.21121215820312, -149.04632568359375, -141.88143920898438, -134.716552734375, -127.5516586303711, -120.38676452636719, -113.22187805175781, -106.0569839477539, -98.89208984375, -91.72720336914062, -84.56230163574219, -77.39740753173828, -70.2325210571289, -63.067626953125, -55.90273666381836, -48.73784637451172, -41.57295227050781, -34.40806198120117, -27.24317169189453, -20.07828140258789, -12.913389205932617, -5.748497009277344, 1.4163932800292969, 8.581283569335938, 15.746177673339844, 22.911067962646484, 30.075958251953125, 37.240848541259766, 44.405738830566406, 51.57063293457031, 58.73552322387695, 65.9004135131836, 73.0653076171875, 80.23019409179688, 87.39508819580078, 94.55998229980469, 101.72486877441406, 108.88976287841797, 116.05465698242188, 123.21954345703125, 130.38442993164062, 137.54933166503906, 144.71421813964844, 151.8791046142578, 159.04400634765625, 166.20889282226562, 173.373779296875, 180.53866577148438, 187.7035675048828, 194.8684539794922, 202.03335571289062, 209.1982421875, 216.36314392089844, 223.5280303955078, 230.6929168701172, 237.85781860351562, 245.022705078125, 252.18759155273438, 259.35247802734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 8.0, 11.0, 15.0, 35.0, 33.0, 54.0, 68.0, 88.0, 124.0, 219.0, 334.0, 627.0, 1204.0, 2703.0, 6777.0, 23233.0, 149712.0, 3793906.0, 176830.0, 25322.0, 7334.0, 2770.0, 1312.0, 619.0, 335.0, 181.0, 116.0, 73.0, 50.0, 37.0, 17.0, 21.0, 10.0, 18.0, 13.0, 12.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-143.375, -138.349609375, -133.32421875, -128.298828125, -123.2734375, -118.248046875, -113.22265625, -108.197265625, -103.171875, -98.146484375, -93.12109375, -88.095703125, -83.0703125, -78.044921875, -73.01953125, -67.994140625, -62.96875, -57.943359375, -52.91796875, -47.892578125, -42.8671875, -37.841796875, -32.81640625, -27.791015625, -22.765625, -17.740234375, -12.71484375, -7.689453125, -2.6640625, 2.361328125, 7.38671875, 12.412109375, 17.4375, 22.462890625, 27.48828125, 32.513671875, 37.5390625, 42.564453125, 47.58984375, 52.615234375, 57.640625, 62.666015625, 67.69140625, 72.716796875, 77.7421875, 82.767578125, 87.79296875, 92.818359375, 97.84375, 102.869140625, 107.89453125, 112.919921875, 117.9453125, 122.970703125, 127.99609375, 133.021484375, 138.046875, 143.072265625, 148.09765625, 153.123046875, 158.1484375, 163.173828125, 168.19921875, 173.224609375, 178.25]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 3.0, 6.0, 15.0, 16.0, 18.0, 29.0, 44.0, 45.0, 87.0, 83.0, 65.0, 78.0, 73.0, 75.0, 79.0, 60.0, 59.0, 53.0, 36.0, 21.0, 18.0, 12.0, 14.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.265625, -20.600830078125, -19.93603515625, -19.271240234375, -18.6064453125, -17.941650390625, -17.27685546875, -16.612060546875, -15.947265625, -15.282470703125, -14.61767578125, -13.952880859375, -13.2880859375, -12.623291015625, -11.95849609375, -11.293701171875, -10.62890625, -9.964111328125, -9.29931640625, -8.634521484375, -7.9697265625, -7.304931640625, -6.64013671875, -5.975341796875, -5.310546875, -4.645751953125, -3.98095703125, -3.316162109375, -2.6513671875, -1.986572265625, -1.32177734375, -0.656982421875, 0.0078125, 0.672607421875, 1.33740234375, 2.002197265625, 2.6669921875, 3.331787109375, 3.99658203125, 4.661376953125, 5.326171875, 5.990966796875, 6.65576171875, 7.320556640625, 7.9853515625, 8.650146484375, 9.31494140625, 9.979736328125, 10.64453125, 11.309326171875, 11.97412109375, 12.638916015625, 13.3037109375, 13.968505859375, 14.63330078125, 15.298095703125, 15.962890625, 16.627685546875, 17.29248046875, 17.957275390625, 18.6220703125, 19.286865234375, 19.95166015625, 20.616455078125, 21.28125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 13.0, 19.0, 31.0, 43.0, 51.0, 72.0, 85.0, 136.0, 221.0, 393.0, 801.0, 1890.0, 5603.0, 19964.0, 111748.0, 3106144.0, 859358.0, 66486.0, 14073.0, 4086.0, 1467.0, 636.0, 349.0, 190.0, 113.0, 76.0, 49.0, 47.0, 27.0, 20.0, 10.0, 11.0, 11.0, 9.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-114.125, -110.65234375, -107.1796875, -103.70703125, -100.234375, -96.76171875, -93.2890625, -89.81640625, -86.34375, -82.87109375, -79.3984375, -75.92578125, -72.453125, -68.98046875, -65.5078125, -62.03515625, -58.5625, -55.08984375, -51.6171875, -48.14453125, -44.671875, -41.19921875, -37.7265625, -34.25390625, -30.78125, -27.30859375, -23.8359375, -20.36328125, -16.890625, -13.41796875, -9.9453125, -6.47265625, -3.0, 0.47265625, 3.9453125, 7.41796875, 10.890625, 14.36328125, 17.8359375, 21.30859375, 24.78125, 28.25390625, 31.7265625, 35.19921875, 38.671875, 42.14453125, 45.6171875, 49.08984375, 52.5625, 56.03515625, 59.5078125, 62.98046875, 66.453125, 69.92578125, 73.3984375, 76.87109375, 80.34375, 83.81640625, 87.2890625, 90.76171875, 94.234375, 97.70703125, 101.1796875, 104.65234375, 108.125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 21.0, 30.0, 57.0, 95.0, 251.0, 569.0, 1898.0, 640.0, 223.0, 113.0, 55.0, 43.0, 21.0, 19.0, 7.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.8125, -62.3779296875, -60.943359375, -59.5087890625, -58.07421875, -56.6396484375, -55.205078125, -53.7705078125, -52.3359375, -50.9013671875, -49.466796875, -48.0322265625, -46.59765625, -45.1630859375, -43.728515625, -42.2939453125, -40.859375, -39.4248046875, -37.990234375, -36.5556640625, -35.12109375, -33.6865234375, -32.251953125, -30.8173828125, -29.3828125, -27.9482421875, -26.513671875, -25.0791015625, -23.64453125, -22.2099609375, -20.775390625, -19.3408203125, -17.90625, -16.4716796875, -15.037109375, -13.6025390625, -12.16796875, -10.7333984375, -9.298828125, -7.8642578125, -6.4296875, -4.9951171875, -3.560546875, -2.1259765625, -0.69140625, 0.7431640625, 2.177734375, 3.6123046875, 5.046875, 6.4814453125, 7.916015625, 9.3505859375, 10.78515625, 12.2197265625, 13.654296875, 15.0888671875, 16.5234375, 17.9580078125, 19.392578125, 20.8271484375, 22.26171875, 23.6962890625, 25.130859375, 26.5654296875, 28.0]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 13.0, 24.0, 64.0, 97.0, 123.0, 143.0, 159.0, 120.0, 116.0, 55.0, 37.0, 13.0, 10.0, 5.0, 4.0, 0.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-215.8210906982422, -207.04991149902344, -198.2787322998047, -189.50753784179688, -180.73635864257812, -171.96517944335938, -163.19400024414062, -154.42282104492188, -145.65164184570312, -136.88046264648438, -128.10928344726562, -119.33809661865234, -110.56690979003906, -101.79573059082031, -93.02455139160156, -84.25337219238281, -75.482177734375, -66.71099853515625, -57.93981170654297, -49.16863250732422, -40.3974494934082, -31.626266479492188, -22.855087280273438, -14.083904266357422, -5.312721252441406, 3.458460807800293, 12.229642868041992, 21.000823974609375, 29.77200698852539, 38.543190002441406, 47.314369201660156, 56.08555221557617, 64.85671997070312, 73.62789916992188, 82.39908599853516, 91.1702651977539, 99.94145202636719, 108.71263122558594, 117.48381042480469, 126.25498962402344, 135.02618408203125, 143.79736328125, 152.56854248046875, 161.3397216796875, 170.1109161376953, 178.88209533691406, 187.6532745361328, 196.42445373535156, 205.1956329345703, 213.96681213378906, 222.7379913330078, 231.50918579101562, 240.28036499023438, 249.05154418945312, 257.8227233886719, 266.5939025878906, 275.3650817871094, 284.1362609863281, 292.9074401855469, 301.6786193847656, 310.4497985839844, 319.22100830078125, 327.9921875, 336.76336669921875, 345.5345458984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 15.0, 7.0, 10.0, 9.0, 24.0, 22.0, 21.0, 33.0, 46.0, 44.0, 41.0, 33.0, 52.0, 76.0, 60.0, 64.0, 52.0, 44.0, 45.0, 44.0, 50.0, 33.0, 21.0, 30.0, 22.0, 14.0, 19.0, 19.0, 10.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.55390167236328, -98.66016387939453, -94.76643371582031, -90.87269592285156, -86.97895812988281, -83.08522033691406, -79.19148254394531, -75.2977523803711, -71.40401458740234, -67.5102767944336, -63.61654281616211, -59.722808837890625, -55.829071044921875, -51.935333251953125, -48.04159927368164, -44.147865295410156, -40.254127502441406, -36.360389709472656, -32.46665573120117, -28.572919845581055, -24.679183959960938, -20.78544807434082, -16.891712188720703, -12.997976303100586, -9.104240417480469, -5.210504531860352, -1.3167686462402344, 2.576967239379883, 6.470703125, 10.364439010620117, 14.258174896240234, 18.15191078186035, 22.045639038085938, 25.939374923706055, 29.833110809326172, 33.726844787597656, 37.620582580566406, 41.514320373535156, 45.40805435180664, 49.301788330078125, 53.195526123046875, 57.089263916015625, 60.98299789428711, 64.8767318725586, 68.77046966552734, 72.6642074584961, 76.55793762207031, 80.45167541503906, 84.34541320800781, 88.23915100097656, 92.13288879394531, 96.02661895751953, 99.92035675048828, 103.81409454345703, 107.70782470703125, 111.6015625, 115.49530029296875, 119.3890380859375, 123.28277587890625, 127.17650604248047, 131.07025146484375, 134.96397399902344, 138.8577117919922, 142.75144958496094, 146.6451873779297]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 6.0, 9.0, 15.0, 21.0, 27.0, 54.0, 74.0, 110.0, 190.0, 297.0, 537.0, 1198.0, 3490.0, 14604.0, 84429.0, 753049.0, 159015.0, 23053.0, 5140.0, 1603.0, 721.0, 345.0, 229.0, 107.0, 72.0, 41.0, 38.0, 18.0, 22.0, 12.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-165.25, -160.1875, -155.125, -150.0625, -145.0, -139.9375, -134.875, -129.8125, -124.75, -119.6875, -114.625, -109.5625, -104.5, -99.4375, -94.375, -89.3125, -84.25, -79.1875, -74.125, -69.0625, -64.0, -58.9375, -53.875, -48.8125, -43.75, -38.6875, -33.625, -28.5625, -23.5, -18.4375, -13.375, -8.3125, -3.25, 1.8125, 6.875, 11.9375, 17.0, 22.0625, 27.125, 32.1875, 37.25, 42.3125, 47.375, 52.4375, 57.5, 62.5625, 67.625, 72.6875, 77.75, 82.8125, 87.875, 92.9375, 98.0, 103.0625, 108.125, 113.1875, 118.25, 123.3125, 128.375, 133.4375, 138.5, 143.5625, 148.625, 153.6875, 158.75]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 9.0, 13.0, 15.0, 18.0, 35.0, 33.0, 49.0, 57.0, 85.0, 60.0, 80.0, 80.0, 85.0, 85.0, 61.0, 60.0, 40.0, 40.0, 32.0, 17.0, 12.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.6875, -21.015625, -20.34375, -19.671875, -19.0, -18.328125, -17.65625, -16.984375, -16.3125, -15.640625, -14.96875, -14.296875, -13.625, -12.953125, -12.28125, -11.609375, -10.9375, -10.265625, -9.59375, -8.921875, -8.25, -7.578125, -6.90625, -6.234375, -5.5625, -4.890625, -4.21875, -3.546875, -2.875, -2.203125, -1.53125, -0.859375, -0.1875, 0.484375, 1.15625, 1.828125, 2.5, 3.171875, 3.84375, 4.515625, 5.1875, 5.859375, 6.53125, 7.203125, 7.875, 8.546875, 9.21875, 9.890625, 10.5625, 11.234375, 11.90625, 12.578125, 13.25, 13.921875, 14.59375, 15.265625, 15.9375, 16.609375, 17.28125, 17.953125, 18.625, 19.296875, 19.96875, 20.640625, 21.3125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 9.0, 20.0, 29.0, 37.0, 36.0, 65.0, 112.0, 151.0, 238.0, 378.0, 711.0, 1383.0, 2453.0, 5165.0, 10667.0, 22252.0, 48791.0, 136323.0, 452824.0, 237394.0, 70368.0, 30780.0, 14046.0, 6909.0, 3387.0, 1748.0, 903.0, 513.0, 301.0, 160.0, 101.0, 77.0, 53.0, 41.0, 29.0, 26.0, 12.0, 11.0, 9.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.5, -48.03125, -46.5625, -45.09375, -43.625, -42.15625, -40.6875, -39.21875, -37.75, -36.28125, -34.8125, -33.34375, -31.875, -30.40625, -28.9375, -27.46875, -26.0, -24.53125, -23.0625, -21.59375, -20.125, -18.65625, -17.1875, -15.71875, -14.25, -12.78125, -11.3125, -9.84375, -8.375, -6.90625, -5.4375, -3.96875, -2.5, -1.03125, 0.4375, 1.90625, 3.375, 4.84375, 6.3125, 7.78125, 9.25, 10.71875, 12.1875, 13.65625, 15.125, 16.59375, 18.0625, 19.53125, 21.0, 22.46875, 23.9375, 25.40625, 26.875, 28.34375, 29.8125, 31.28125, 32.75, 34.21875, 35.6875, 37.15625, 38.625, 40.09375, 41.5625, 43.03125, 44.5]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 1.0, 8.0, 8.0, 11.0, 14.0, 23.0, 13.0, 20.0, 33.0, 36.0, 35.0, 30.0, 38.0, 35.0, 40.0, 37.0, 41.0, 39.0, 47.0, 63.0, 41.0, 48.0, 44.0, 36.0, 44.0, 36.0, 31.0, 18.0, 25.0, 16.0, 13.0, 13.0, 13.0, 8.0, 6.0, 7.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0, -45.478515625, -43.95703125, -42.435546875, -40.9140625, -39.392578125, -37.87109375, -36.349609375, -34.828125, -33.306640625, -31.78515625, -30.263671875, -28.7421875, -27.220703125, -25.69921875, -24.177734375, -22.65625, -21.134765625, -19.61328125, -18.091796875, -16.5703125, -15.048828125, -13.52734375, -12.005859375, -10.484375, -8.962890625, -7.44140625, -5.919921875, -4.3984375, -2.876953125, -1.35546875, 0.166015625, 1.6875, 3.208984375, 4.73046875, 6.251953125, 7.7734375, 9.294921875, 10.81640625, 12.337890625, 13.859375, 15.380859375, 16.90234375, 18.423828125, 19.9453125, 21.466796875, 22.98828125, 24.509765625, 26.03125, 27.552734375, 29.07421875, 30.595703125, 32.1171875, 33.638671875, 35.16015625, 36.681640625, 38.203125, 39.724609375, 41.24609375, 42.767578125, 44.2890625, 45.810546875, 47.33203125, 48.853515625, 50.375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 22.0, 28.0, 39.0, 40.0, 100.0, 140.0, 293.0, 505.0, 986.0, 2528.0, 9193.0, 69883.0, 852383.0, 96106.0, 11124.0, 2806.0, 1097.0, 541.0, 286.0, 153.0, 76.0, 68.0, 34.0, 30.0, 16.0, 15.0, 8.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.65625, -45.79150390625, -43.9267578125, -42.06201171875, -40.197265625, -38.33251953125, -36.4677734375, -34.60302734375, -32.73828125, -30.87353515625, -29.0087890625, -27.14404296875, -25.279296875, -23.41455078125, -21.5498046875, -19.68505859375, -17.8203125, -15.95556640625, -14.0908203125, -12.22607421875, -10.361328125, -8.49658203125, -6.6318359375, -4.76708984375, -2.90234375, -1.03759765625, 0.8271484375, 2.69189453125, 4.556640625, 6.42138671875, 8.2861328125, 10.15087890625, 12.015625, 13.88037109375, 15.7451171875, 17.60986328125, 19.474609375, 21.33935546875, 23.2041015625, 25.06884765625, 26.93359375, 28.79833984375, 30.6630859375, 32.52783203125, 34.392578125, 36.25732421875, 38.1220703125, 39.98681640625, 41.8515625, 43.71630859375, 45.5810546875, 47.44580078125, 49.310546875, 51.17529296875, 53.0400390625, 54.90478515625, 56.76953125, 58.63427734375, 60.4990234375, 62.36376953125, 64.228515625, 66.09326171875, 67.9580078125, 69.82275390625, 71.6875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 3.0, 3.0, 6.0, 13.0, 11.0, 26.0, 20.0, 43.0, 130.0, 320.0, 214.0, 73.0, 34.0, 25.0, 22.0, 12.0, 6.0, 6.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0111541748046875, -0.010910391807556152, -0.010666608810424805, -0.010422825813293457, -0.01017904281616211, -0.009935259819030762, -0.009691476821899414, -0.009447693824768066, -0.009203910827636719, -0.008960127830505371, -0.008716344833374023, -0.008472561836242676, -0.008228778839111328, -0.00798499584197998, -0.007741212844848633, -0.007497429847717285, -0.0072536468505859375, -0.00700986385345459, -0.006766080856323242, -0.0065222978591918945, -0.006278514862060547, -0.006034731864929199, -0.0057909488677978516, -0.005547165870666504, -0.005303382873535156, -0.005059599876403809, -0.004815816879272461, -0.004572033882141113, -0.004328250885009766, -0.004084467887878418, -0.0038406848907470703, -0.0035969018936157227, -0.003353118896484375, -0.0031093358993530273, -0.0028655529022216797, -0.002621769905090332, -0.0023779869079589844, -0.0021342039108276367, -0.001890420913696289, -0.0016466379165649414, -0.0014028549194335938, -0.001159071922302246, -0.0009152889251708984, -0.0006715059280395508, -0.0004277229309082031, -0.00018393993377685547, 5.984306335449219e-05, 0.00030362606048583984, 0.0005474090576171875, 0.0007911920547485352, 0.0010349750518798828, 0.0012787580490112305, 0.0015225410461425781, 0.0017663240432739258, 0.0020101070404052734, 0.002253890037536621, 0.0024976730346679688, 0.0027414560317993164, 0.002985239028930664, 0.0032290220260620117, 0.0034728050231933594, 0.003716588020324707, 0.003960371017456055, 0.004204154014587402, 0.00444793701171875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 8.0, 19.0, 35.0, 38.0, 49.0, 105.0, 173.0, 391.0, 1013.0, 3470.0, 19026.0, 316753.0, 671832.0, 28719.0, 4662.0, 1244.0, 503.0, 195.0, 100.0, 66.0, 36.0, 22.0, 16.0, 14.0, 7.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.375, -57.40234375, -55.4296875, -53.45703125, -51.484375, -49.51171875, -47.5390625, -45.56640625, -43.59375, -41.62109375, -39.6484375, -37.67578125, -35.703125, -33.73046875, -31.7578125, -29.78515625, -27.8125, -25.83984375, -23.8671875, -21.89453125, -19.921875, -17.94921875, -15.9765625, -14.00390625, -12.03125, -10.05859375, -8.0859375, -6.11328125, -4.140625, -2.16796875, -0.1953125, 1.77734375, 3.75, 5.72265625, 7.6953125, 9.66796875, 11.640625, 13.61328125, 15.5859375, 17.55859375, 19.53125, 21.50390625, 23.4765625, 25.44921875, 27.421875, 29.39453125, 31.3671875, 33.33984375, 35.3125, 37.28515625, 39.2578125, 41.23046875, 43.203125, 45.17578125, 47.1484375, 49.12109375, 51.09375, 53.06640625, 55.0390625, 57.01171875, 58.984375, 60.95703125, 62.9296875, 64.90234375, 66.875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 14.0, 19.0, 31.0, 42.0, 79.0, 180.0, 229.0, 157.0, 85.0, 38.0, 24.0, 15.0, 11.0, 11.0, 8.0, 9.0, 6.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.5615234375, -33.560546875, -32.5595703125, -31.55859375, -30.5576171875, -29.556640625, -28.5556640625, -27.5546875, -26.5537109375, -25.552734375, -24.5517578125, -23.55078125, -22.5498046875, -21.548828125, -20.5478515625, -19.546875, -18.5458984375, -17.544921875, -16.5439453125, -15.54296875, -14.5419921875, -13.541015625, -12.5400390625, -11.5390625, -10.5380859375, -9.537109375, -8.5361328125, -7.53515625, -6.5341796875, -5.533203125, -4.5322265625, -3.53125, -2.5302734375, -1.529296875, -0.5283203125, 0.47265625, 1.4736328125, 2.474609375, 3.4755859375, 4.4765625, 5.4775390625, 6.478515625, 7.4794921875, 8.48046875, 9.4814453125, 10.482421875, 11.4833984375, 12.484375, 13.4853515625, 14.486328125, 15.4873046875, 16.48828125, 17.4892578125, 18.490234375, 19.4912109375, 20.4921875, 21.4931640625, 22.494140625, 23.4951171875, 24.49609375, 25.4970703125, 26.498046875, 27.4990234375, 28.5]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 15.0, 38.0, 41.0, 83.0, 140.0, 158.0, 162.0, 150.0, 97.0, 57.0, 42.0, 11.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.3349151611328, -172.87261962890625, -155.4103240966797, -137.94802856445312, -120.4857406616211, -103.02344512939453, -85.5611572265625, -68.09886169433594, -50.636566162109375, -33.17427062988281, -15.711978912353516, 1.7503128051757812, 19.212608337402344, 36.674903869628906, 54.13719177246094, 71.5994873046875, 89.06178283691406, 106.52407836914062, 123.98637390136719, 141.44866943359375, 158.91094970703125, 176.37326049804688, 193.83554077148438, 211.29783630371094, 228.7601318359375, 246.22242736816406, 263.6847229003906, 281.1470031738281, 298.60931396484375, 316.07159423828125, 333.53387451171875, 350.9961853027344, 368.45843505859375, 385.92071533203125, 403.3830261230469, 420.8453063964844, 438.3076171875, 455.7698974609375, 473.232177734375, 490.6944885253906, 508.15679931640625, 525.6190795898438, 543.0813598632812, 560.543701171875, 578.0059814453125, 595.46826171875, 612.9305419921875, 630.392822265625, 647.8551025390625, 665.3173828125, 682.7796630859375, 700.2420043945312, 717.7042846679688, 735.1665649414062, 752.6288452148438, 770.0911865234375, 787.553466796875, 805.0157470703125, 822.47802734375, 839.9403686523438, 857.4026489257812, 874.8649291992188, 892.3272094726562, 909.78955078125, 927.2518310546875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 7.0, 5.0, 10.0, 13.0, 15.0, 9.0, 25.0, 28.0, 16.0, 26.0, 37.0, 28.0, 32.0, 35.0, 37.0, 48.0, 57.0, 53.0, 48.0, 37.0, 42.0, 42.0, 40.0, 35.0, 34.0, 33.0, 31.0, 22.0, 22.0, 25.0, 23.0, 21.0, 12.0, 8.0, 12.0, 6.0, 8.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.6279296875, -184.66299438476562, -177.6980438232422, -170.7331085205078, -163.76815795898438, -156.80322265625, -149.83828735351562, -142.8733367919922, -135.9084014892578, -128.94346618652344, -121.978515625, -115.01358032226562, -108.04863739013672, -101.08369445800781, -94.1187515258789, -87.15380859375, -80.1888656616211, -73.22392272949219, -66.25897979736328, -59.29404067993164, -52.3291015625, -45.364158630371094, -38.39921569824219, -31.434276580810547, -24.46933364868164, -17.504392623901367, -10.539450645446777, -3.5745086669921875, 3.390432357788086, 10.35537338256836, 17.320316314697266, 24.285255432128906, 31.250198364257812, 38.21514129638672, 45.18008041381836, 52.145023345947266, 59.109962463378906, 66.07490539550781, 73.03984832763672, 80.00479125976562, 86.9697265625, 93.9346694946289, 100.89961242675781, 107.86454772949219, 114.8294906616211, 121.79443359375, 128.75936889648438, 135.7243194580078, 142.68927001953125, 149.65420532226562, 156.61915588378906, 163.58409118652344, 170.54904174804688, 177.51397705078125, 184.47891235351562, 191.44386291503906, 198.40879821777344, 205.3737335205078, 212.33868408203125, 219.30361938476562, 226.26856994628906, 233.23350524902344, 240.19845581054688, 247.16339111328125, 254.12832641601562]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 16.0, 14.0, 23.0, 32.0, 37.0, 38.0, 57.0, 86.0, 135.0, 203.0, 301.0, 476.0, 851.0, 1540.0, 3284.0, 7747.0, 23431.0, 98074.0, 3262223.0, 699083.0, 66695.0, 17776.0, 6375.0, 2600.0, 1225.0, 662.0, 387.0, 255.0, 168.0, 110.0, 97.0, 58.0, 47.0, 32.0, 38.0, 18.0, 16.0, 12.0, 16.0, 6.0, 3.0, 5.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-145.125, -140.42578125, -135.7265625, -131.02734375, -126.328125, -121.62890625, -116.9296875, -112.23046875, -107.53125, -102.83203125, -98.1328125, -93.43359375, -88.734375, -84.03515625, -79.3359375, -74.63671875, -69.9375, -65.23828125, -60.5390625, -55.83984375, -51.140625, -46.44140625, -41.7421875, -37.04296875, -32.34375, -27.64453125, -22.9453125, -18.24609375, -13.546875, -8.84765625, -4.1484375, 0.55078125, 5.25, 9.94921875, 14.6484375, 19.34765625, 24.046875, 28.74609375, 33.4453125, 38.14453125, 42.84375, 47.54296875, 52.2421875, 56.94140625, 61.640625, 66.33984375, 71.0390625, 75.73828125, 80.4375, 85.13671875, 89.8359375, 94.53515625, 99.234375, 103.93359375, 108.6328125, 113.33203125, 118.03125, 122.73046875, 127.4296875, 132.12890625, 136.828125, 141.52734375, 146.2265625, 150.92578125, 155.625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 7.0, 6.0, 12.0, 7.0, 20.0, 22.0, 28.0, 54.0, 40.0, 64.0, 72.0, 77.0, 66.0, 102.0, 70.0, 70.0, 65.0, 67.0, 32.0, 34.0, 37.0, 13.0, 16.0, 6.0, 7.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.609375, -20.93505859375, -20.2607421875, -19.58642578125, -18.912109375, -18.23779296875, -17.5634765625, -16.88916015625, -16.21484375, -15.54052734375, -14.8662109375, -14.19189453125, -13.517578125, -12.84326171875, -12.1689453125, -11.49462890625, -10.8203125, -10.14599609375, -9.4716796875, -8.79736328125, -8.123046875, -7.44873046875, -6.7744140625, -6.10009765625, -5.42578125, -4.75146484375, -4.0771484375, -3.40283203125, -2.728515625, -2.05419921875, -1.3798828125, -0.70556640625, -0.03125, 0.64306640625, 1.3173828125, 1.99169921875, 2.666015625, 3.34033203125, 4.0146484375, 4.68896484375, 5.36328125, 6.03759765625, 6.7119140625, 7.38623046875, 8.060546875, 8.73486328125, 9.4091796875, 10.08349609375, 10.7578125, 11.43212890625, 12.1064453125, 12.78076171875, 13.455078125, 14.12939453125, 14.8037109375, 15.47802734375, 16.15234375, 16.82666015625, 17.5009765625, 18.17529296875, 18.849609375, 19.52392578125, 20.1982421875, 20.87255859375, 21.546875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 9.0, 10.0, 14.0, 14.0, 18.0, 36.0, 41.0, 50.0, 63.0, 115.0, 157.0, 237.0, 415.0, 722.0, 1315.0, 2732.0, 6101.0, 14616.0, 39276.0, 129394.0, 922889.0, 2808316.0, 184037.0, 51014.0, 18247.0, 7418.0, 3343.0, 1592.0, 807.0, 477.0, 273.0, 177.0, 106.0, 72.0, 50.0, 32.0, 23.0, 15.0, 15.0, 12.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-86.4375, -83.904296875, -81.37109375, -78.837890625, -76.3046875, -73.771484375, -71.23828125, -68.705078125, -66.171875, -63.638671875, -61.10546875, -58.572265625, -56.0390625, -53.505859375, -50.97265625, -48.439453125, -45.90625, -43.373046875, -40.83984375, -38.306640625, -35.7734375, -33.240234375, -30.70703125, -28.173828125, -25.640625, -23.107421875, -20.57421875, -18.041015625, -15.5078125, -12.974609375, -10.44140625, -7.908203125, -5.375, -2.841796875, -0.30859375, 2.224609375, 4.7578125, 7.291015625, 9.82421875, 12.357421875, 14.890625, 17.423828125, 19.95703125, 22.490234375, 25.0234375, 27.556640625, 30.08984375, 32.623046875, 35.15625, 37.689453125, 40.22265625, 42.755859375, 45.2890625, 47.822265625, 50.35546875, 52.888671875, 55.421875, 57.955078125, 60.48828125, 63.021484375, 65.5546875, 68.087890625, 70.62109375, 73.154296875, 75.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 11.0, 22.0, 29.0, 33.0, 66.0, 71.0, 139.0, 279.0, 772.0, 1772.0, 373.0, 202.0, 102.0, 62.0, 43.0, 25.0, 9.0, 10.0, 15.0, 4.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-54.46875, -53.208740234375, -51.94873046875, -50.688720703125, -49.4287109375, -48.168701171875, -46.90869140625, -45.648681640625, -44.388671875, -43.128662109375, -41.86865234375, -40.608642578125, -39.3486328125, -38.088623046875, -36.82861328125, -35.568603515625, -34.30859375, -33.048583984375, -31.78857421875, -30.528564453125, -29.2685546875, -28.008544921875, -26.74853515625, -25.488525390625, -24.228515625, -22.968505859375, -21.70849609375, -20.448486328125, -19.1884765625, -17.928466796875, -16.66845703125, -15.408447265625, -14.1484375, -12.888427734375, -11.62841796875, -10.368408203125, -9.1083984375, -7.848388671875, -6.58837890625, -5.328369140625, -4.068359375, -2.808349609375, -1.54833984375, -0.288330078125, 0.9716796875, 2.231689453125, 3.49169921875, 4.751708984375, 6.01171875, 7.271728515625, 8.53173828125, 9.791748046875, 11.0517578125, 12.311767578125, 13.57177734375, 14.831787109375, 16.091796875, 17.351806640625, 18.61181640625, 19.871826171875, 21.1318359375, 22.391845703125, 23.65185546875, 24.911865234375, 26.171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 22.0, 37.0, 61.0, 107.0, 161.0, 194.0, 174.0, 126.0, 62.0, 29.0, 20.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-550.94921875, -540.5137329101562, -530.0782470703125, -519.6427612304688, -509.207275390625, -498.7717590332031, -488.3362731933594, -477.9007873535156, -467.4653015136719, -457.0298156738281, -446.5943298339844, -436.1588439941406, -425.72332763671875, -415.287841796875, -404.85235595703125, -394.4168701171875, -383.98138427734375, -373.5458984375, -363.11041259765625, -352.6749267578125, -342.23944091796875, -331.8039245605469, -321.3684387207031, -310.9329528808594, -300.4974670410156, -290.0619812011719, -279.6264953613281, -269.1910095214844, -258.7554931640625, -248.3200225830078, -237.884521484375, -227.44903564453125, -217.01353454589844, -206.5780487060547, -196.14254760742188, -185.70706176757812, -175.27157592773438, -164.83609008789062, -154.40060424804688, -143.96510314941406, -133.5296173095703, -123.09413146972656, -112.65863800048828, -102.22314453125, -91.78765869140625, -81.3521728515625, -70.91667938232422, -60.48118591308594, -50.04570007324219, -39.61021041870117, -29.174720764160156, -18.73923110961914, -8.303741455078125, 2.1317481994628906, 12.567237854003906, 23.002731323242188, 33.43821716308594, 43.87370681762695, 54.30919647216797, 64.74468994140625, 75.18017578125, 85.61566162109375, 96.05115509033203, 106.48664855957031, 116.92213439941406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 0.0, 6.0, 4.0, 6.0, 6.0, 7.0, 7.0, 10.0, 15.0, 15.0, 14.0, 13.0, 25.0, 22.0, 28.0, 24.0, 20.0, 32.0, 37.0, 35.0, 37.0, 40.0, 38.0, 45.0, 39.0, 31.0, 40.0, 38.0, 35.0, 30.0, 24.0, 33.0, 22.0, 22.0, 24.0, 28.0, 22.0, 20.0, 21.0, 14.0, 14.0, 8.0, 11.0, 14.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-89.22309875488281, -86.47863006591797, -83.73416137695312, -80.98970031738281, -78.24523162841797, -75.50076293945312, -72.75629425048828, -70.01182556152344, -67.26736450195312, -64.52289581298828, -61.7784309387207, -59.03396224975586, -56.28949737548828, -53.54502868652344, -50.800559997558594, -48.05609130859375, -45.311622619628906, -42.56715393066406, -39.822689056396484, -37.07822036743164, -34.33375549316406, -31.58928680419922, -28.844818115234375, -26.100351333618164, -23.355884552001953, -20.611417770385742, -17.86695098876953, -15.122482299804688, -12.378015518188477, -9.633548736572266, -6.889080047607422, -4.144613265991211, -1.400146484375, 1.3443207740783691, 4.088788032531738, 6.833255767822266, 9.577722549438477, 12.322189331054688, 15.066658020019531, 17.811124801635742, 20.555591583251953, 23.300058364868164, 26.044525146484375, 28.78899383544922, 31.53346061706543, 34.27792739868164, 37.022396087646484, 39.76686096191406, 42.511329650878906, 45.25579833984375, 48.00026321411133, 50.74473190307617, 53.48919677734375, 56.233665466308594, 58.97813415527344, 61.72260284423828, 64.46707153320312, 67.21154022216797, 69.95600891113281, 72.70046997070312, 75.44493865966797, 78.18940734863281, 80.93387603759766, 83.6783447265625, 86.42280578613281]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 19.0, 31.0, 55.0, 71.0, 105.0, 195.0, 303.0, 551.0, 1176.0, 3177.0, 11266.0, 54645.0, 317257.0, 541564.0, 92486.0, 17933.0, 4441.0, 1615.0, 671.0, 390.0, 235.0, 144.0, 78.0, 52.0, 40.0, 11.0, 19.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.0625, -115.1142578125, -111.166015625, -107.2177734375, -103.26953125, -99.3212890625, -95.373046875, -91.4248046875, -87.4765625, -83.5283203125, -79.580078125, -75.6318359375, -71.68359375, -67.7353515625, -63.787109375, -59.8388671875, -55.890625, -51.9423828125, -47.994140625, -44.0458984375, -40.09765625, -36.1494140625, -32.201171875, -28.2529296875, -24.3046875, -20.3564453125, -16.408203125, -12.4599609375, -8.51171875, -4.5634765625, -0.615234375, 3.3330078125, 7.28125, 11.2294921875, 15.177734375, 19.1259765625, 23.07421875, 27.0224609375, 30.970703125, 34.9189453125, 38.8671875, 42.8154296875, 46.763671875, 50.7119140625, 54.66015625, 58.6083984375, 62.556640625, 66.5048828125, 70.453125, 74.4013671875, 78.349609375, 82.2978515625, 86.24609375, 90.1943359375, 94.142578125, 98.0908203125, 102.0390625, 105.9873046875, 109.935546875, 113.8837890625, 117.83203125, 121.7802734375, 125.728515625, 129.6767578125, 133.625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 9.0, 9.0, 9.0, 21.0, 12.0, 21.0, 32.0, 46.0, 58.0, 49.0, 86.0, 77.0, 77.0, 89.0, 63.0, 63.0, 65.0, 59.0, 54.0, 28.0, 28.0, 16.0, 7.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.125, -21.4287109375, -20.732421875, -20.0361328125, -19.33984375, -18.6435546875, -17.947265625, -17.2509765625, -16.5546875, -15.8583984375, -15.162109375, -14.4658203125, -13.76953125, -13.0732421875, -12.376953125, -11.6806640625, -10.984375, -10.2880859375, -9.591796875, -8.8955078125, -8.19921875, -7.5029296875, -6.806640625, -6.1103515625, -5.4140625, -4.7177734375, -4.021484375, -3.3251953125, -2.62890625, -1.9326171875, -1.236328125, -0.5400390625, 0.15625, 0.8525390625, 1.548828125, 2.2451171875, 2.94140625, 3.6376953125, 4.333984375, 5.0302734375, 5.7265625, 6.4228515625, 7.119140625, 7.8154296875, 8.51171875, 9.2080078125, 9.904296875, 10.6005859375, 11.296875, 11.9931640625, 12.689453125, 13.3857421875, 14.08203125, 14.7783203125, 15.474609375, 16.1708984375, 16.8671875, 17.5634765625, 18.259765625, 18.9560546875, 19.65234375, 20.3486328125, 21.044921875, 21.7412109375, 22.4375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 13.0, 9.0, 22.0, 35.0, 40.0, 54.0, 89.0, 123.0, 147.0, 214.0, 327.0, 486.0, 970.0, 2074.0, 5295.0, 16433.0, 55532.0, 208369.0, 521224.0, 168286.0, 46473.0, 13825.0, 4417.0, 1765.0, 851.0, 501.0, 285.0, 199.0, 161.0, 90.0, 58.0, 53.0, 36.0, 24.0, 16.0, 18.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.8125, -67.841796875, -65.87109375, -63.900390625, -61.9296875, -59.958984375, -57.98828125, -56.017578125, -54.046875, -52.076171875, -50.10546875, -48.134765625, -46.1640625, -44.193359375, -42.22265625, -40.251953125, -38.28125, -36.310546875, -34.33984375, -32.369140625, -30.3984375, -28.427734375, -26.45703125, -24.486328125, -22.515625, -20.544921875, -18.57421875, -16.603515625, -14.6328125, -12.662109375, -10.69140625, -8.720703125, -6.75, -4.779296875, -2.80859375, -0.837890625, 1.1328125, 3.103515625, 5.07421875, 7.044921875, 9.015625, 10.986328125, 12.95703125, 14.927734375, 16.8984375, 18.869140625, 20.83984375, 22.810546875, 24.78125, 26.751953125, 28.72265625, 30.693359375, 32.6640625, 34.634765625, 36.60546875, 38.576171875, 40.546875, 42.517578125, 44.48828125, 46.458984375, 48.4296875, 50.400390625, 52.37109375, 54.341796875, 56.3125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 5.0, 8.0, 5.0, 13.0, 8.0, 8.0, 11.0, 14.0, 16.0, 15.0, 17.0, 22.0, 23.0, 35.0, 30.0, 33.0, 28.0, 38.0, 41.0, 29.0, 33.0, 48.0, 38.0, 39.0, 40.0, 41.0, 38.0, 38.0, 41.0, 33.0, 37.0, 15.0, 20.0, 19.0, 21.0, 13.0, 18.0, 10.0, 14.0, 8.0, 6.0, 10.0, 9.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.5625, -37.10888671875, -35.6552734375, -34.20166015625, -32.748046875, -31.29443359375, -29.8408203125, -28.38720703125, -26.93359375, -25.47998046875, -24.0263671875, -22.57275390625, -21.119140625, -19.66552734375, -18.2119140625, -16.75830078125, -15.3046875, -13.85107421875, -12.3974609375, -10.94384765625, -9.490234375, -8.03662109375, -6.5830078125, -5.12939453125, -3.67578125, -2.22216796875, -0.7685546875, 0.68505859375, 2.138671875, 3.59228515625, 5.0458984375, 6.49951171875, 7.953125, 9.40673828125, 10.8603515625, 12.31396484375, 13.767578125, 15.22119140625, 16.6748046875, 18.12841796875, 19.58203125, 21.03564453125, 22.4892578125, 23.94287109375, 25.396484375, 26.85009765625, 28.3037109375, 29.75732421875, 31.2109375, 32.66455078125, 34.1181640625, 35.57177734375, 37.025390625, 38.47900390625, 39.9326171875, 41.38623046875, 42.83984375, 44.29345703125, 45.7470703125, 47.20068359375, 48.654296875, 50.10791015625, 51.5615234375, 53.01513671875, 54.46875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 12.0, 14.0, 13.0, 36.0, 54.0, 71.0, 167.0, 279.0, 553.0, 1431.0, 3544.0, 10005.0, 31385.0, 103788.0, 414413.0, 352116.0, 89093.0, 27367.0, 8739.0, 3161.0, 1164.0, 552.0, 290.0, 129.0, 76.0, 30.0, 29.0, 15.0, 12.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -21.887939453125, -21.01025390625, -20.132568359375, -19.2548828125, -18.377197265625, -17.49951171875, -16.621826171875, -15.744140625, -14.866455078125, -13.98876953125, -13.111083984375, -12.2333984375, -11.355712890625, -10.47802734375, -9.600341796875, -8.72265625, -7.844970703125, -6.96728515625, -6.089599609375, -5.2119140625, -4.334228515625, -3.45654296875, -2.578857421875, -1.701171875, -0.823486328125, 0.05419921875, 0.931884765625, 1.8095703125, 2.687255859375, 3.56494140625, 4.442626953125, 5.3203125, 6.197998046875, 7.07568359375, 7.953369140625, 8.8310546875, 9.708740234375, 10.58642578125, 11.464111328125, 12.341796875, 13.219482421875, 14.09716796875, 14.974853515625, 15.8525390625, 16.730224609375, 17.60791015625, 18.485595703125, 19.36328125, 20.240966796875, 21.11865234375, 21.996337890625, 22.8740234375, 23.751708984375, 24.62939453125, 25.507080078125, 26.384765625, 27.262451171875, 28.14013671875, 29.017822265625, 29.8955078125, 30.773193359375, 31.65087890625, 32.528564453125, 33.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 13.0, 21.0, 23.0, 21.0, 34.0, 42.0, 62.0, 104.0, 183.0, 136.0, 86.0, 69.0, 31.0, 42.0, 30.0, 22.0, 14.0, 14.0, 6.0, 8.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00711822509765625, -0.006952166557312012, -0.0067861080169677734, -0.006620049476623535, -0.006453990936279297, -0.006287932395935059, -0.00612187385559082, -0.005955815315246582, -0.005789756774902344, -0.0056236982345581055, -0.005457639694213867, -0.005291581153869629, -0.005125522613525391, -0.004959464073181152, -0.004793405532836914, -0.004627346992492676, -0.0044612884521484375, -0.004295229911804199, -0.004129171371459961, -0.003963112831115723, -0.0037970542907714844, -0.003630995750427246, -0.003464937210083008, -0.0032988786697387695, -0.0031328201293945312, -0.002966761589050293, -0.0028007030487060547, -0.0026346445083618164, -0.002468585968017578, -0.00230252742767334, -0.0021364688873291016, -0.0019704103469848633, -0.001804351806640625, -0.0016382932662963867, -0.0014722347259521484, -0.0013061761856079102, -0.0011401176452636719, -0.0009740591049194336, -0.0008080005645751953, -0.000641942024230957, -0.00047588348388671875, -0.00030982494354248047, -0.0001437664031982422, 2.2292137145996094e-05, 0.00018835067749023438, 0.00035440921783447266, 0.0005204677581787109, 0.0006865262985229492, 0.0008525848388671875, 0.0010186433792114258, 0.001184701919555664, 0.0013507604598999023, 0.0015168190002441406, 0.001682877540588379, 0.0018489360809326172, 0.0020149946212768555, 0.0021810531616210938, 0.002347111701965332, 0.0025131702423095703, 0.0026792287826538086, 0.002845287322998047, 0.003011345863342285, 0.0031774044036865234, 0.0033434629440307617, 0.003509521484375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 18.0, 19.0, 26.0, 32.0, 48.0, 81.0, 112.0, 145.0, 264.0, 425.0, 806.0, 1679.0, 4152.0, 11972.0, 44153.0, 195948.0, 538912.0, 188145.0, 42307.0, 11777.0, 4041.0, 1641.0, 766.0, 400.0, 228.0, 139.0, 77.0, 67.0, 57.0, 26.0, 27.0, 17.0, 12.0, 6.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.2568359375, -31.232421875, -30.2080078125, -29.18359375, -28.1591796875, -27.134765625, -26.1103515625, -25.0859375, -24.0615234375, -23.037109375, -22.0126953125, -20.98828125, -19.9638671875, -18.939453125, -17.9150390625, -16.890625, -15.8662109375, -14.841796875, -13.8173828125, -12.79296875, -11.7685546875, -10.744140625, -9.7197265625, -8.6953125, -7.6708984375, -6.646484375, -5.6220703125, -4.59765625, -3.5732421875, -2.548828125, -1.5244140625, -0.5, 0.5244140625, 1.548828125, 2.5732421875, 3.59765625, 4.6220703125, 5.646484375, 6.6708984375, 7.6953125, 8.7197265625, 9.744140625, 10.7685546875, 11.79296875, 12.8173828125, 13.841796875, 14.8662109375, 15.890625, 16.9150390625, 17.939453125, 18.9638671875, 19.98828125, 21.0126953125, 22.037109375, 23.0615234375, 24.0859375, 25.1103515625, 26.134765625, 27.1591796875, 28.18359375, 29.2080078125, 30.232421875, 31.2568359375, 32.28125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 2.0, 11.0, 4.0, 5.0, 10.0, 10.0, 6.0, 19.0, 7.0, 16.0, 22.0, 37.0, 31.0, 38.0, 40.0, 61.0, 69.0, 69.0, 64.0, 63.0, 50.0, 57.0, 47.0, 51.0, 42.0, 37.0, 24.0, 20.0, 19.0, 14.0, 10.0, 8.0, 6.0, 4.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.390625, -19.777099609375, -19.16357421875, -18.550048828125, -17.9365234375, -17.322998046875, -16.70947265625, -16.095947265625, -15.482421875, -14.868896484375, -14.25537109375, -13.641845703125, -13.0283203125, -12.414794921875, -11.80126953125, -11.187744140625, -10.57421875, -9.960693359375, -9.34716796875, -8.733642578125, -8.1201171875, -7.506591796875, -6.89306640625, -6.279541015625, -5.666015625, -5.052490234375, -4.43896484375, -3.825439453125, -3.2119140625, -2.598388671875, -1.98486328125, -1.371337890625, -0.7578125, -0.144287109375, 0.46923828125, 1.082763671875, 1.6962890625, 2.309814453125, 2.92333984375, 3.536865234375, 4.150390625, 4.763916015625, 5.37744140625, 5.990966796875, 6.6044921875, 7.218017578125, 7.83154296875, 8.445068359375, 9.05859375, 9.672119140625, 10.28564453125, 10.899169921875, 11.5126953125, 12.126220703125, 12.73974609375, 13.353271484375, 13.966796875, 14.580322265625, 15.19384765625, 15.807373046875, 16.4208984375, 17.034423828125, 17.64794921875, 18.261474609375, 18.875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 7.0, 34.0, 149.0, 324.0, 317.0, 139.0, 31.0, 10.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.1203308105469, -269.69305419921875, -225.26580810546875, -180.8385467529297, -136.41128540039062, -91.98402404785156, -47.5567626953125, -3.129486083984375, 41.297760009765625, 85.72502136230469, 130.15228271484375, 174.5795440673828, 219.00680541992188, 263.43408203125, 307.861328125, 352.2886047363281, 396.7158508300781, 441.14312744140625, 485.57037353515625, 529.9976196289062, 574.4249267578125, 618.8521728515625, 663.2794189453125, 707.7066650390625, 752.1339111328125, 796.5611572265625, 840.9884033203125, 885.4157104492188, 929.8429565429688, 974.2702026367188, 1018.697509765625, 1063.124755859375, 1107.552001953125, 1151.979248046875, 1196.406494140625, 1240.833740234375, 1285.260986328125, 1329.6883544921875, 1374.1156005859375, 1418.5428466796875, 1462.9700927734375, 1507.3973388671875, 1551.8245849609375, 1596.2518310546875, 1640.67919921875, 1685.1064453125, 1729.53369140625, 1773.9609375, 1818.38818359375, 1862.8154296875, 1907.24267578125, 1951.669921875, 1996.09716796875, 2040.5245361328125, 2084.95166015625, 2129.37890625, 2173.80615234375, 2218.2333984375, 2262.66064453125, 2307.087890625, 2351.51513671875, 2395.9423828125, 2440.36962890625, 2484.796875, 2529.224365234375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 12.0, 10.0, 9.0, 10.0, 14.0, 11.0, 22.0, 14.0, 22.0, 29.0, 32.0, 22.0, 39.0, 40.0, 39.0, 34.0, 34.0, 43.0, 44.0, 40.0, 40.0, 35.0, 41.0, 28.0, 35.0, 40.0, 24.0, 37.0, 17.0, 26.0, 17.0, 24.0, 12.0, 17.0, 11.0, 10.0, 9.0, 6.0, 8.0, 7.0, 9.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-268.91546630859375, -261.24969482421875, -253.58389282226562, -245.91812133789062, -238.25233459472656, -230.5865478515625, -222.9207763671875, -215.25498962402344, -207.58920288085938, -199.9234161376953, -192.25762939453125, -184.59185791015625, -176.9260711669922, -169.26028442382812, -161.59451293945312, -153.92872619628906, -146.262939453125, -138.59715270996094, -130.93136596679688, -123.26559448242188, -115.59980773925781, -107.93402099609375, -100.26824188232422, -92.60246276855469, -84.93667602539062, -77.27088928222656, -69.60511016845703, -61.939327239990234, -54.27354431152344, -46.60776138305664, -38.941978454589844, -31.276195526123047, -23.610397338867188, -15.94461441040039, -8.278831481933594, -0.6130485534667969, 7.052734375, 14.718517303466797, 22.384300231933594, 30.05008316040039, 37.71586608886719, 45.381649017333984, 53.04743194580078, 60.71321487426758, 68.37899780273438, 76.04478454589844, 83.71056365966797, 91.3763427734375, 99.04212951660156, 106.70791625976562, 114.37369537353516, 122.03947448730469, 129.70526123046875, 137.3710479736328, 145.03683471679688, 152.70260620117188, 160.36839294433594, 168.0341796875, 175.699951171875, 183.36573791503906, 191.03152465820312, 198.6973114013672, 206.36309814453125, 214.02886962890625, 221.6946563720703]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 6.0, 23.0, 42.0, 44.0, 57.0, 108.0, 172.0, 286.0, 498.0, 885.0, 1770.0, 4170.0, 12197.0, 50039.0, 403614.0, 3489321.0, 186247.0, 30339.0, 8207.0, 3036.0, 1296.0, 721.0, 402.0, 265.0, 155.0, 92.0, 70.0, 59.0, 38.0, 31.0, 16.0, 6.0, 12.0, 10.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.875, -137.19921875, -132.5234375, -127.84765625, -123.171875, -118.49609375, -113.8203125, -109.14453125, -104.46875, -99.79296875, -95.1171875, -90.44140625, -85.765625, -81.08984375, -76.4140625, -71.73828125, -67.0625, -62.38671875, -57.7109375, -53.03515625, -48.359375, -43.68359375, -39.0078125, -34.33203125, -29.65625, -24.98046875, -20.3046875, -15.62890625, -10.953125, -6.27734375, -1.6015625, 3.07421875, 7.75, 12.42578125, 17.1015625, 21.77734375, 26.453125, 31.12890625, 35.8046875, 40.48046875, 45.15625, 49.83203125, 54.5078125, 59.18359375, 63.859375, 68.53515625, 73.2109375, 77.88671875, 82.5625, 87.23828125, 91.9140625, 96.58984375, 101.265625, 105.94140625, 110.6171875, 115.29296875, 119.96875, 124.64453125, 129.3203125, 133.99609375, 138.671875, 143.34765625, 148.0234375, 152.69921875, 157.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 16.0, 20.0, 20.0, 26.0, 43.0, 42.0, 56.0, 88.0, 55.0, 80.0, 82.0, 71.0, 74.0, 70.0, 60.0, 51.0, 39.0, 33.0, 16.0, 18.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.640625, -20.948974609375, -20.25732421875, -19.565673828125, -18.8740234375, -18.182373046875, -17.49072265625, -16.799072265625, -16.107421875, -15.415771484375, -14.72412109375, -14.032470703125, -13.3408203125, -12.649169921875, -11.95751953125, -11.265869140625, -10.57421875, -9.882568359375, -9.19091796875, -8.499267578125, -7.8076171875, -7.115966796875, -6.42431640625, -5.732666015625, -5.041015625, -4.349365234375, -3.65771484375, -2.966064453125, -2.2744140625, -1.582763671875, -0.89111328125, -0.199462890625, 0.4921875, 1.183837890625, 1.87548828125, 2.567138671875, 3.2587890625, 3.950439453125, 4.64208984375, 5.333740234375, 6.025390625, 6.717041015625, 7.40869140625, 8.100341796875, 8.7919921875, 9.483642578125, 10.17529296875, 10.866943359375, 11.55859375, 12.250244140625, 12.94189453125, 13.633544921875, 14.3251953125, 15.016845703125, 15.70849609375, 16.400146484375, 17.091796875, 17.783447265625, 18.47509765625, 19.166748046875, 19.8583984375, 20.550048828125, 21.24169921875, 21.933349609375, 22.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 5.0, 12.0, 12.0, 30.0, 29.0, 35.0, 51.0, 75.0, 98.0, 154.0, 210.0, 353.0, 583.0, 1387.0, 4442.0, 21850.0, 157064.0, 3244146.0, 686403.0, 62185.0, 10351.0, 2526.0, 946.0, 485.0, 268.0, 161.0, 124.0, 76.0, 69.0, 35.0, 29.0, 16.0, 15.0, 18.0, 9.0, 9.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-139.625, -135.6103515625, -131.595703125, -127.5810546875, -123.56640625, -119.5517578125, -115.537109375, -111.5224609375, -107.5078125, -103.4931640625, -99.478515625, -95.4638671875, -91.44921875, -87.4345703125, -83.419921875, -79.4052734375, -75.390625, -71.3759765625, -67.361328125, -63.3466796875, -59.33203125, -55.3173828125, -51.302734375, -47.2880859375, -43.2734375, -39.2587890625, -35.244140625, -31.2294921875, -27.21484375, -23.2001953125, -19.185546875, -15.1708984375, -11.15625, -7.1416015625, -3.126953125, 0.8876953125, 4.90234375, 8.9169921875, 12.931640625, 16.9462890625, 20.9609375, 24.9755859375, 28.990234375, 33.0048828125, 37.01953125, 41.0341796875, 45.048828125, 49.0634765625, 53.078125, 57.0927734375, 61.107421875, 65.1220703125, 69.13671875, 73.1513671875, 77.166015625, 81.1806640625, 85.1953125, 89.2099609375, 93.224609375, 97.2392578125, 101.25390625, 105.2685546875, 109.283203125, 113.2978515625, 117.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 17.0, 30.0, 59.0, 142.0, 333.0, 1158.0, 1628.0, 394.0, 158.0, 69.0, 44.0, 27.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.7470703125, -65.244140625, -62.7412109375, -60.23828125, -57.7353515625, -55.232421875, -52.7294921875, -50.2265625, -47.7236328125, -45.220703125, -42.7177734375, -40.21484375, -37.7119140625, -35.208984375, -32.7060546875, -30.203125, -27.7001953125, -25.197265625, -22.6943359375, -20.19140625, -17.6884765625, -15.185546875, -12.6826171875, -10.1796875, -7.6767578125, -5.173828125, -2.6708984375, -0.16796875, 2.3349609375, 4.837890625, 7.3408203125, 9.84375, 12.3466796875, 14.849609375, 17.3525390625, 19.85546875, 22.3583984375, 24.861328125, 27.3642578125, 29.8671875, 32.3701171875, 34.873046875, 37.3759765625, 39.87890625, 42.3818359375, 44.884765625, 47.3876953125, 49.890625, 52.3935546875, 54.896484375, 57.3994140625, 59.90234375, 62.4052734375, 64.908203125, 67.4111328125, 69.9140625, 72.4169921875, 74.919921875, 77.4228515625, 79.92578125, 82.4287109375, 84.931640625, 87.4345703125, 89.9375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 7.0, 8.0, 20.0, 24.0, 34.0, 41.0, 53.0, 70.0, 79.0, 87.0, 107.0, 82.0, 71.0, 79.0, 55.0, 56.0, 36.0, 22.0, 13.0, 15.0, 9.0, 4.0, 9.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-211.2149200439453, -203.9550018310547, -196.69508361816406, -189.43516540527344, -182.1752471923828, -174.9153289794922, -167.65541076660156, -160.39549255371094, -153.1355743408203, -145.8756561279297, -138.61573791503906, -131.35581970214844, -124.09590148925781, -116.83598327636719, -109.57606506347656, -102.31614685058594, -95.05622863769531, -87.79631042480469, -80.53639221191406, -73.27647399902344, -66.01655578613281, -58.75663757324219, -51.49671936035156, -44.23680114746094, -36.97688293457031, -29.716964721679688, -22.457046508789062, -15.197128295898438, -7.9372100830078125, -0.6772918701171875, 6.5826263427734375, 13.842544555664062, 21.10247802734375, 28.362396240234375, 35.622314453125, 42.882232666015625, 50.14215087890625, 57.402069091796875, 64.6619873046875, 71.92190551757812, 79.18182373046875, 86.44174194335938, 93.70166015625, 100.96157836914062, 108.22149658203125, 115.48141479492188, 122.7413330078125, 130.00125122070312, 137.26116943359375, 144.52108764648438, 151.781005859375, 159.04092407226562, 166.30084228515625, 173.56076049804688, 180.8206787109375, 188.08059692382812, 195.34051513671875, 202.60043334960938, 209.8603515625, 217.12026977539062, 224.38018798828125, 231.64010620117188, 238.9000244140625, 246.15994262695312, 253.41986083984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 9.0, 10.0, 11.0, 21.0, 19.0, 21.0, 27.0, 28.0, 28.0, 32.0, 47.0, 37.0, 52.0, 60.0, 38.0, 38.0, 59.0, 43.0, 36.0, 49.0, 46.0, 42.0, 45.0, 26.0, 32.0, 16.0, 28.0, 25.0, 22.0, 13.0, 8.0, 13.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-126.20563507080078, -121.4463882446289, -116.68714141845703, -111.92789459228516, -107.16864776611328, -102.4094009399414, -97.65015411376953, -92.89090728759766, -88.13166046142578, -83.3724136352539, -78.61316680908203, -73.85391998291016, -69.09467315673828, -64.3354263305664, -59.57617950439453, -54.816932678222656, -50.05768585205078, -45.298439025878906, -40.53919219970703, -35.779945373535156, -31.02069854736328, -26.261451721191406, -21.50220489501953, -16.742958068847656, -11.983711242675781, -7.224464416503906, -2.4652175903320312, 2.2940292358398438, 7.053276062011719, 11.812522888183594, 16.57176971435547, 21.331016540527344, 26.090255737304688, 30.849502563476562, 35.60874938964844, 40.36799621582031, 45.12724304199219, 49.88648986816406, 54.64573669433594, 59.40498352050781, 64.16423034667969, 68.92347717285156, 73.68272399902344, 78.44197082519531, 83.20121765136719, 87.96046447753906, 92.71971130371094, 97.47895812988281, 102.23820495605469, 106.99745178222656, 111.75669860839844, 116.51594543457031, 121.27519226074219, 126.03443908691406, 130.79368591308594, 135.5529327392578, 140.3121795654297, 145.07142639160156, 149.83067321777344, 154.5899200439453, 159.3491668701172, 164.10841369628906, 168.86766052246094, 173.6269073486328, 178.3861541748047]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 9.0, 9.0, 10.0, 26.0, 18.0, 31.0, 66.0, 98.0, 177.0, 341.0, 613.0, 1445.0, 3971.0, 16158.0, 98447.0, 581589.0, 293256.0, 39792.0, 8039.0, 2416.0, 979.0, 489.0, 250.0, 139.0, 58.0, 31.0, 35.0, 21.0, 13.0, 14.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-113.125, -109.05078125, -104.9765625, -100.90234375, -96.828125, -92.75390625, -88.6796875, -84.60546875, -80.53125, -76.45703125, -72.3828125, -68.30859375, -64.234375, -60.16015625, -56.0859375, -52.01171875, -47.9375, -43.86328125, -39.7890625, -35.71484375, -31.640625, -27.56640625, -23.4921875, -19.41796875, -15.34375, -11.26953125, -7.1953125, -3.12109375, 0.953125, 5.02734375, 9.1015625, 13.17578125, 17.25, 21.32421875, 25.3984375, 29.47265625, 33.546875, 37.62109375, 41.6953125, 45.76953125, 49.84375, 53.91796875, 57.9921875, 62.06640625, 66.140625, 70.21484375, 74.2890625, 78.36328125, 82.4375, 86.51171875, 90.5859375, 94.66015625, 98.734375, 102.80859375, 106.8828125, 110.95703125, 115.03125, 119.10546875, 123.1796875, 127.25390625, 131.328125, 135.40234375, 139.4765625, 143.55078125, 147.625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 24.0, 10.0, 28.0, 39.0, 51.0, 58.0, 76.0, 67.0, 77.0, 73.0, 75.0, 89.0, 70.0, 56.0, 44.0, 40.0, 40.0, 23.0, 7.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.65625, -20.92138671875, -20.1865234375, -19.45166015625, -18.716796875, -17.98193359375, -17.2470703125, -16.51220703125, -15.77734375, -15.04248046875, -14.3076171875, -13.57275390625, -12.837890625, -12.10302734375, -11.3681640625, -10.63330078125, -9.8984375, -9.16357421875, -8.4287109375, -7.69384765625, -6.958984375, -6.22412109375, -5.4892578125, -4.75439453125, -4.01953125, -3.28466796875, -2.5498046875, -1.81494140625, -1.080078125, -0.34521484375, 0.3896484375, 1.12451171875, 1.859375, 2.59423828125, 3.3291015625, 4.06396484375, 4.798828125, 5.53369140625, 6.2685546875, 7.00341796875, 7.73828125, 8.47314453125, 9.2080078125, 9.94287109375, 10.677734375, 11.41259765625, 12.1474609375, 12.88232421875, 13.6171875, 14.35205078125, 15.0869140625, 15.82177734375, 16.556640625, 17.29150390625, 18.0263671875, 18.76123046875, 19.49609375, 20.23095703125, 20.9658203125, 21.70068359375, 22.435546875, 23.17041015625, 23.9052734375, 24.64013671875, 25.375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 6.0, 8.0, 8.0, 15.0, 20.0, 36.0, 44.0, 63.0, 92.0, 112.0, 179.0, 235.0, 319.0, 521.0, 898.0, 1672.0, 3566.0, 8933.0, 25334.0, 83466.0, 328810.0, 426043.0, 114575.0, 33360.0, 11262.0, 4282.0, 1934.0, 992.0, 545.0, 374.0, 222.0, 179.0, 122.0, 88.0, 58.0, 64.0, 35.0, 26.0, 13.0, 11.0, 4.0, 8.0, 8.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.0625, -60.001953125, -57.94140625, -55.880859375, -53.8203125, -51.759765625, -49.69921875, -47.638671875, -45.578125, -43.517578125, -41.45703125, -39.396484375, -37.3359375, -35.275390625, -33.21484375, -31.154296875, -29.09375, -27.033203125, -24.97265625, -22.912109375, -20.8515625, -18.791015625, -16.73046875, -14.669921875, -12.609375, -10.548828125, -8.48828125, -6.427734375, -4.3671875, -2.306640625, -0.24609375, 1.814453125, 3.875, 5.935546875, 7.99609375, 10.056640625, 12.1171875, 14.177734375, 16.23828125, 18.298828125, 20.359375, 22.419921875, 24.48046875, 26.541015625, 28.6015625, 30.662109375, 32.72265625, 34.783203125, 36.84375, 38.904296875, 40.96484375, 43.025390625, 45.0859375, 47.146484375, 49.20703125, 51.267578125, 53.328125, 55.388671875, 57.44921875, 59.509765625, 61.5703125, 63.630859375, 65.69140625, 67.751953125, 69.8125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 6.0, 8.0, 11.0, 13.0, 18.0, 22.0, 19.0, 33.0, 21.0, 35.0, 40.0, 37.0, 36.0, 49.0, 52.0, 50.0, 59.0, 60.0, 59.0, 44.0, 42.0, 40.0, 41.0, 35.0, 28.0, 24.0, 11.0, 25.0, 22.0, 11.0, 7.0, 8.0, 9.0, 5.0, 8.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.8125, -66.6806640625, -64.548828125, -62.4169921875, -60.28515625, -58.1533203125, -56.021484375, -53.8896484375, -51.7578125, -49.6259765625, -47.494140625, -45.3623046875, -43.23046875, -41.0986328125, -38.966796875, -36.8349609375, -34.703125, -32.5712890625, -30.439453125, -28.3076171875, -26.17578125, -24.0439453125, -21.912109375, -19.7802734375, -17.6484375, -15.5166015625, -13.384765625, -11.2529296875, -9.12109375, -6.9892578125, -4.857421875, -2.7255859375, -0.59375, 1.5380859375, 3.669921875, 5.8017578125, 7.93359375, 10.0654296875, 12.197265625, 14.3291015625, 16.4609375, 18.5927734375, 20.724609375, 22.8564453125, 24.98828125, 27.1201171875, 29.251953125, 31.3837890625, 33.515625, 35.6474609375, 37.779296875, 39.9111328125, 42.04296875, 44.1748046875, 46.306640625, 48.4384765625, 50.5703125, 52.7021484375, 54.833984375, 56.9658203125, 59.09765625, 61.2294921875, 63.361328125, 65.4931640625, 67.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 17.0, 25.0, 34.0, 50.0, 104.0, 174.0, 349.0, 742.0, 2026.0, 8144.0, 43827.0, 261641.0, 546005.0, 152831.0, 24955.0, 4902.0, 1434.0, 561.0, 294.0, 169.0, 98.0, 51.0, 37.0, 18.0, 13.0, 13.0, 9.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-31.609375, -30.600830078125, -29.59228515625, -28.583740234375, -27.5751953125, -26.566650390625, -25.55810546875, -24.549560546875, -23.541015625, -22.532470703125, -21.52392578125, -20.515380859375, -19.5068359375, -18.498291015625, -17.48974609375, -16.481201171875, -15.47265625, -14.464111328125, -13.45556640625, -12.447021484375, -11.4384765625, -10.429931640625, -9.42138671875, -8.412841796875, -7.404296875, -6.395751953125, -5.38720703125, -4.378662109375, -3.3701171875, -2.361572265625, -1.35302734375, -0.344482421875, 0.6640625, 1.672607421875, 2.68115234375, 3.689697265625, 4.6982421875, 5.706787109375, 6.71533203125, 7.723876953125, 8.732421875, 9.740966796875, 10.74951171875, 11.758056640625, 12.7666015625, 13.775146484375, 14.78369140625, 15.792236328125, 16.80078125, 17.809326171875, 18.81787109375, 19.826416015625, 20.8349609375, 21.843505859375, 22.85205078125, 23.860595703125, 24.869140625, 25.877685546875, 26.88623046875, 27.894775390625, 28.9033203125, 29.911865234375, 30.92041015625, 31.928955078125, 32.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 17.0, 11.0, 19.0, 23.0, 35.0, 41.0, 65.0, 87.0, 97.0, 93.0, 111.0, 88.0, 52.0, 54.0, 45.0, 36.0, 28.0, 21.0, 19.0, 6.0, 10.0, 12.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.0048789381980896, -0.004733920097351074, -0.004588901996612549, -0.0044438838958740234, -0.004298865795135498, -0.004153847694396973, -0.004008829593658447, -0.003863811492919922, -0.0037187933921813965, -0.003573775291442871, -0.0034287571907043457, -0.0032837390899658203, -0.003138720989227295, -0.0029937028884887695, -0.002848684787750244, -0.0027036666870117188, -0.0025586485862731934, -0.002413630485534668, -0.0022686123847961426, -0.002123594284057617, -0.001978576183319092, -0.0018335580825805664, -0.001688539981842041, -0.0015435218811035156, -0.0013985037803649902, -0.0012534856796264648, -0.0011084675788879395, -0.0009634494781494141, -0.0008184313774108887, -0.0006734132766723633, -0.0005283951759338379, -0.0003833770751953125, -0.0002383589744567871, -9.334087371826172e-05, 5.167722702026367e-05, 0.00019669532775878906, 0.00034171342849731445, 0.00048673152923583984, 0.0006317496299743652, 0.0007767677307128906, 0.000921785831451416, 0.0010668039321899414, 0.0012118220329284668, 0.0013568401336669922, 0.0015018582344055176, 0.001646876335144043, 0.0017918944358825684, 0.0019369125366210938, 0.002081930637359619, 0.0022269487380981445, 0.00237196683883667, 0.0025169849395751953, 0.0026620030403137207, 0.002807021141052246, 0.0029520392417907715, 0.003097057342529297, 0.0032420754432678223, 0.0033870935440063477, 0.003532111644744873, 0.0036771297454833984, 0.003822147846221924, 0.003967165946960449, 0.004112184047698975, 0.0042572021484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 14.0, 16.0, 33.0, 54.0, 92.0, 173.0, 249.0, 501.0, 982.0, 2387.0, 7658.0, 36065.0, 194647.0, 529780.0, 221065.0, 41417.0, 8537.0, 2658.0, 1001.0, 493.0, 287.0, 147.0, 104.0, 54.0, 32.0, 31.0, 18.0, 11.0, 12.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -33.168212890625, -32.14892578125, -31.129638671875, -30.1103515625, -29.091064453125, -28.07177734375, -27.052490234375, -26.033203125, -25.013916015625, -23.99462890625, -22.975341796875, -21.9560546875, -20.936767578125, -19.91748046875, -18.898193359375, -17.87890625, -16.859619140625, -15.84033203125, -14.821044921875, -13.8017578125, -12.782470703125, -11.76318359375, -10.743896484375, -9.724609375, -8.705322265625, -7.68603515625, -6.666748046875, -5.6474609375, -4.628173828125, -3.60888671875, -2.589599609375, -1.5703125, -0.551025390625, 0.46826171875, 1.487548828125, 2.5068359375, 3.526123046875, 4.54541015625, 5.564697265625, 6.583984375, 7.603271484375, 8.62255859375, 9.641845703125, 10.6611328125, 11.680419921875, 12.69970703125, 13.718994140625, 14.73828125, 15.757568359375, 16.77685546875, 17.796142578125, 18.8154296875, 19.834716796875, 20.85400390625, 21.873291015625, 22.892578125, 23.911865234375, 24.93115234375, 25.950439453125, 26.9697265625, 27.989013671875, 29.00830078125, 30.027587890625, 31.046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 10.0, 10.0, 9.0, 11.0, 25.0, 28.0, 38.0, 35.0, 62.0, 70.0, 79.0, 91.0, 95.0, 82.0, 64.0, 73.0, 51.0, 40.0, 26.0, 28.0, 18.0, 17.0, 13.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.71875, -26.935791015625, -26.15283203125, -25.369873046875, -24.5869140625, -23.803955078125, -23.02099609375, -22.238037109375, -21.455078125, -20.672119140625, -19.88916015625, -19.106201171875, -18.3232421875, -17.540283203125, -16.75732421875, -15.974365234375, -15.19140625, -14.408447265625, -13.62548828125, -12.842529296875, -12.0595703125, -11.276611328125, -10.49365234375, -9.710693359375, -8.927734375, -8.144775390625, -7.36181640625, -6.578857421875, -5.7958984375, -5.012939453125, -4.22998046875, -3.447021484375, -2.6640625, -1.881103515625, -1.09814453125, -0.315185546875, 0.4677734375, 1.250732421875, 2.03369140625, 2.816650390625, 3.599609375, 4.382568359375, 5.16552734375, 5.948486328125, 6.7314453125, 7.514404296875, 8.29736328125, 9.080322265625, 9.86328125, 10.646240234375, 11.42919921875, 12.212158203125, 12.9951171875, 13.778076171875, 14.56103515625, 15.343994140625, 16.126953125, 16.909912109375, 17.69287109375, 18.475830078125, 19.2587890625, 20.041748046875, 20.82470703125, 21.607666015625, 22.390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 13.0, 6.0, 21.0, 45.0, 78.0, 89.0, 132.0, 145.0, 124.0, 121.0, 70.0, 62.0, 42.0, 23.0, 10.0, 8.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-862.804931640625, -845.1047973632812, -827.4046630859375, -809.7045288085938, -792.00439453125, -774.3042602539062, -756.6041259765625, -738.904052734375, -721.203857421875, -703.5037231445312, -685.8035888671875, -668.1034545898438, -650.4033203125, -632.7031860351562, -615.0030517578125, -597.302978515625, -579.6028442382812, -561.9027099609375, -544.2025756835938, -526.50244140625, -508.80230712890625, -491.1021728515625, -473.4020690917969, -455.7019348144531, -438.0018005371094, -420.3016662597656, -402.6015319824219, -384.9013977050781, -367.2012939453125, -349.50115966796875, -331.801025390625, -314.10089111328125, -296.40069580078125, -278.7005615234375, -261.00042724609375, -243.30030822753906, -225.6001739501953, -207.90003967285156, -190.19992065429688, -172.49978637695312, -154.79965209960938, -137.09951782226562, -119.3993911743164, -101.69926452636719, -83.99913024902344, -66.29899597167969, -48.59886932373047, -30.89874267578125, -13.1986083984375, 4.501522064208984, 22.20165252685547, 39.90178298950195, 57.60191345214844, 75.30204772949219, 93.0021743774414, 110.70230102539062, 128.40243530273438, 146.10256958007812, 163.80270385742188, 181.50282287597656, 199.2029571533203, 216.90309143066406, 234.60321044921875, 252.3033447265625, 270.00347900390625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 12.0, 19.0, 17.0, 20.0, 27.0, 31.0, 37.0, 44.0, 36.0, 56.0, 55.0, 55.0, 67.0, 52.0, 52.0, 50.0, 56.0, 56.0, 53.0, 37.0, 34.0, 26.0, 22.0, 15.0, 17.0, 9.0, 6.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.99365234375, -448.9089660644531, -436.82427978515625, -424.7395935058594, -412.6549072265625, -400.5702209472656, -388.48553466796875, -376.40081787109375, -364.316162109375, -352.2314758300781, -340.14678955078125, -328.0621032714844, -315.9774169921875, -303.8927307128906, -291.80804443359375, -279.72332763671875, -267.6386413574219, -255.553955078125, -243.46926879882812, -231.38458251953125, -219.29989624023438, -207.2152099609375, -195.13050842285156, -183.0458221435547, -170.9611358642578, -158.87644958496094, -146.79176330566406, -134.70706176757812, -122.62238311767578, -110.5376968383789, -98.4530029296875, -86.36831665039062, -74.28363037109375, -62.198944091796875, -50.114253997802734, -38.029563903808594, -25.94487762451172, -13.860191345214844, -1.7754974365234375, 10.309188842773438, 22.393875122070312, 34.47856140136719, 46.56325149536133, 58.64794158935547, 70.73262786865234, 82.81731414794922, 94.90200805664062, 106.9866943359375, 119.07138061523438, 131.15606689453125, 143.24075317382812, 155.325439453125, 167.41012573242188, 179.49481201171875, 191.5795135498047, 203.66419982910156, 215.74888610839844, 227.8335723876953, 239.9182586669922, 252.00296020507812, 264.087646484375, 276.1723327636719, 288.25701904296875, 300.3417053222656, 312.4263916015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 3.0, 9.0, 19.0, 20.0, 35.0, 42.0, 94.0, 152.0, 220.0, 453.0, 952.0, 2554.0, 8702.0, 58596.0, 4066785.0, 44032.0, 7387.0, 2336.0, 917.0, 407.0, 189.0, 135.0, 87.0, 43.0, 21.0, 24.0, 14.0, 15.0, 5.0, 5.0, 3.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-220.75, -213.5, -206.25, -199.0, -191.75, -184.5, -177.25, -170.0, -162.75, -155.5, -148.25, -141.0, -133.75, -126.5, -119.25, -112.0, -104.75, -97.5, -90.25, -83.0, -75.75, -68.5, -61.25, -54.0, -46.75, -39.5, -32.25, -25.0, -17.75, -10.5, -3.25, 4.0, 11.25, 18.5, 25.75, 33.0, 40.25, 47.5, 54.75, 62.0, 69.25, 76.5, 83.75, 91.0, 98.25, 105.5, 112.75, 120.0, 127.25, 134.5, 141.75, 149.0, 156.25, 163.5, 170.75, 178.0, 185.25, 192.5, 199.75, 207.0, 214.25, 221.5, 228.75, 236.0, 243.25]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 10.0, 6.0, 7.0, 10.0, 31.0, 20.0, 29.0, 42.0, 36.0, 54.0, 69.0, 63.0, 72.0, 60.0, 61.0, 77.0, 54.0, 58.0, 40.0, 42.0, 32.0, 31.0, 16.0, 17.0, 20.0, 8.0, 12.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.359375, -19.64990234375, -18.9404296875, -18.23095703125, -17.521484375, -16.81201171875, -16.1025390625, -15.39306640625, -14.68359375, -13.97412109375, -13.2646484375, -12.55517578125, -11.845703125, -11.13623046875, -10.4267578125, -9.71728515625, -9.0078125, -8.29833984375, -7.5888671875, -6.87939453125, -6.169921875, -5.46044921875, -4.7509765625, -4.04150390625, -3.33203125, -2.62255859375, -1.9130859375, -1.20361328125, -0.494140625, 0.21533203125, 0.9248046875, 1.63427734375, 2.34375, 3.05322265625, 3.7626953125, 4.47216796875, 5.181640625, 5.89111328125, 6.6005859375, 7.31005859375, 8.01953125, 8.72900390625, 9.4384765625, 10.14794921875, 10.857421875, 11.56689453125, 12.2763671875, 12.98583984375, 13.6953125, 14.40478515625, 15.1142578125, 15.82373046875, 16.533203125, 17.24267578125, 17.9521484375, 18.66162109375, 19.37109375, 20.08056640625, 20.7900390625, 21.49951171875, 22.208984375, 22.91845703125, 23.6279296875, 24.33740234375, 25.046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 8.0, 18.0, 27.0, 50.0, 103.0, 215.0, 519.0, 1113.0, 2900.0, 8706.0, 43873.0, 3901007.0, 207708.0, 19636.0, 5155.0, 1818.0, 781.0, 321.0, 145.0, 75.0, 38.0, 20.0, 15.0, 10.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.375, -158.0771484375, -153.779296875, -149.4814453125, -145.18359375, -140.8857421875, -136.587890625, -132.2900390625, -127.9921875, -123.6943359375, -119.396484375, -115.0986328125, -110.80078125, -106.5029296875, -102.205078125, -97.9072265625, -93.609375, -89.3115234375, -85.013671875, -80.7158203125, -76.41796875, -72.1201171875, -67.822265625, -63.5244140625, -59.2265625, -54.9287109375, -50.630859375, -46.3330078125, -42.03515625, -37.7373046875, -33.439453125, -29.1416015625, -24.84375, -20.5458984375, -16.248046875, -11.9501953125, -7.65234375, -3.3544921875, 0.943359375, 5.2412109375, 9.5390625, 13.8369140625, 18.134765625, 22.4326171875, 26.73046875, 31.0283203125, 35.326171875, 39.6240234375, 43.921875, 48.2197265625, 52.517578125, 56.8154296875, 61.11328125, 65.4111328125, 69.708984375, 74.0068359375, 78.3046875, 82.6025390625, 86.900390625, 91.1982421875, 95.49609375, 99.7939453125, 104.091796875, 108.3896484375, 112.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 7.0, 20.0, 20.0, 26.0, 43.0, 100.0, 177.0, 2657.0, 599.0, 150.0, 88.0, 53.0, 27.0, 27.0, 12.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.359375, -16.9130859375, -16.466796875, -16.0205078125, -15.57421875, -15.1279296875, -14.681640625, -14.2353515625, -13.7890625, -13.3427734375, -12.896484375, -12.4501953125, -12.00390625, -11.5576171875, -11.111328125, -10.6650390625, -10.21875, -9.7724609375, -9.326171875, -8.8798828125, -8.43359375, -7.9873046875, -7.541015625, -7.0947265625, -6.6484375, -6.2021484375, -5.755859375, -5.3095703125, -4.86328125, -4.4169921875, -3.970703125, -3.5244140625, -3.078125, -2.6318359375, -2.185546875, -1.7392578125, -1.29296875, -0.8466796875, -0.400390625, 0.0458984375, 0.4921875, 0.9384765625, 1.384765625, 1.8310546875, 2.27734375, 2.7236328125, 3.169921875, 3.6162109375, 4.0625, 4.5087890625, 4.955078125, 5.4013671875, 5.84765625, 6.2939453125, 6.740234375, 7.1865234375, 7.6328125, 8.0791015625, 8.525390625, 8.9716796875, 9.41796875, 9.8642578125, 10.310546875, 10.7568359375, 11.203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 12.0, 4.0, 9.0, 19.0, 13.0, 42.0, 51.0, 57.0, 70.0, 82.0, 88.0, 86.0, 91.0, 88.0, 73.0, 70.0, 39.0, 36.0, 23.0, 10.0, 9.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-87.95367431640625, -85.9128646850586, -83.87205505371094, -81.83124542236328, -79.79043579101562, -77.74961853027344, -75.70880889892578, -73.66799926757812, -71.62718963623047, -69.58638000488281, -67.54557037353516, -65.5047607421875, -63.46394729614258, -61.42313766479492, -59.38232421875, -57.341514587402344, -55.30070495605469, -53.25989532470703, -51.219085693359375, -49.17827224731445, -47.1374626159668, -45.09665298461914, -43.05583953857422, -41.01502990722656, -38.974220275878906, -36.93341064453125, -34.892601013183594, -32.85178756713867, -30.810977935791016, -28.77016830444336, -26.72935676574707, -24.68854522705078, -22.647735595703125, -20.60692596435547, -18.56611442565918, -16.52530288696289, -14.484493255615234, -12.443682670593262, -10.402872085571289, -8.362061500549316, -6.321250915527344, -4.280440330505371, -2.2396297454833984, -0.19881916046142578, 1.8419914245605469, 3.8828020095825195, 5.923612594604492, 7.964423179626465, 10.005233764648438, 12.04604434967041, 14.086854934692383, 16.127666473388672, 18.168476104736328, 20.209285736083984, 22.250097274780273, 24.290908813476562, 26.33171844482422, 28.372528076171875, 30.413339614868164, 32.45415115356445, 34.49496078491211, 36.535770416259766, 38.57658386230469, 40.617393493652344, 42.658203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 13.0, 16.0, 23.0, 22.0, 26.0, 31.0, 26.0, 39.0, 37.0, 45.0, 40.0, 44.0, 43.0, 33.0, 33.0, 47.0, 38.0, 36.0, 34.0, 43.0, 40.0, 25.0, 29.0, 25.0, 27.0, 22.0, 17.0, 13.0, 10.0, 14.0, 14.0, 7.0, 7.0, 7.0, 11.0, 3.0, 3.0, 1.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-34.16252899169922, -33.09475326538086, -32.0269775390625, -30.95920181274414, -29.89142608642578, -28.823650360107422, -27.75587272644043, -26.68809700012207, -25.62032127380371, -24.55254554748535, -23.484769821166992, -22.416994094848633, -21.34921646118164, -20.28144073486328, -19.213665008544922, -18.145889282226562, -17.078113555908203, -16.010337829589844, -14.942562103271484, -13.874785423278809, -12.80700969696045, -11.73923397064209, -10.671457290649414, -9.603681564331055, -8.535905838012695, -7.468130111694336, -6.400353908538818, -5.332577705383301, -4.264801979064941, -3.197026252746582, -2.1292500495910645, -1.0614738464355469, 0.0063018798828125, 1.074077844619751, 2.1418538093566895, 3.209629774093628, 4.277405738830566, 5.345181465148926, 6.412957668304443, 7.480733871459961, 8.54850959777832, 9.61628532409668, 10.684061050415039, 11.751837730407715, 12.819613456726074, 13.887389183044434, 14.95516586303711, 16.02294158935547, 17.090717315673828, 18.158493041992188, 19.226268768310547, 20.294044494628906, 21.361820220947266, 22.429595947265625, 23.497373580932617, 24.565149307250977, 25.632925033569336, 26.700700759887695, 27.768476486206055, 28.836252212524414, 29.904029846191406, 30.971805572509766, 32.039581298828125, 33.107357025146484, 34.175132751464844]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 10.0, 24.0, 34.0, 39.0, 44.0, 58.0, 118.0, 176.0, 265.0, 430.0, 680.0, 1137.0, 2198.0, 4648.0, 10888.0, 27319.0, 72210.0, 197389.0, 367353.0, 225728.0, 83004.0, 31511.0, 12307.0, 5325.0, 2413.0, 1270.0, 665.0, 429.0, 270.0, 183.0, 125.0, 78.0, 57.0, 46.0, 30.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-60.09375, -58.3037109375, -56.513671875, -54.7236328125, -52.93359375, -51.1435546875, -49.353515625, -47.5634765625, -45.7734375, -43.9833984375, -42.193359375, -40.4033203125, -38.61328125, -36.8232421875, -35.033203125, -33.2431640625, -31.453125, -29.6630859375, -27.873046875, -26.0830078125, -24.29296875, -22.5029296875, -20.712890625, -18.9228515625, -17.1328125, -15.3427734375, -13.552734375, -11.7626953125, -9.97265625, -8.1826171875, -6.392578125, -4.6025390625, -2.8125, -1.0224609375, 0.767578125, 2.5576171875, 4.34765625, 6.1376953125, 7.927734375, 9.7177734375, 11.5078125, 13.2978515625, 15.087890625, 16.8779296875, 18.66796875, 20.4580078125, 22.248046875, 24.0380859375, 25.828125, 27.6181640625, 29.408203125, 31.1982421875, 32.98828125, 34.7783203125, 36.568359375, 38.3583984375, 40.1484375, 41.9384765625, 43.728515625, 45.5185546875, 47.30859375, 49.0986328125, 50.888671875, 52.6787109375, 54.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 7.0, 11.0, 14.0, 11.0, 22.0, 30.0, 40.0, 40.0, 47.0, 46.0, 49.0, 62.0, 81.0, 52.0, 64.0, 76.0, 52.0, 50.0, 39.0, 42.0, 24.0, 35.0, 26.0, 18.0, 16.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.9375, -20.229248046875, -19.52099609375, -18.812744140625, -18.1044921875, -17.396240234375, -16.68798828125, -15.979736328125, -15.271484375, -14.563232421875, -13.85498046875, -13.146728515625, -12.4384765625, -11.730224609375, -11.02197265625, -10.313720703125, -9.60546875, -8.897216796875, -8.18896484375, -7.480712890625, -6.7724609375, -6.064208984375, -5.35595703125, -4.647705078125, -3.939453125, -3.231201171875, -2.52294921875, -1.814697265625, -1.1064453125, -0.398193359375, 0.31005859375, 1.018310546875, 1.7265625, 2.434814453125, 3.14306640625, 3.851318359375, 4.5595703125, 5.267822265625, 5.97607421875, 6.684326171875, 7.392578125, 8.100830078125, 8.80908203125, 9.517333984375, 10.2255859375, 10.933837890625, 11.64208984375, 12.350341796875, 13.05859375, 13.766845703125, 14.47509765625, 15.183349609375, 15.8916015625, 16.599853515625, 17.30810546875, 18.016357421875, 18.724609375, 19.432861328125, 20.14111328125, 20.849365234375, 21.5576171875, 22.265869140625, 22.97412109375, 23.682373046875, 24.390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 11.0, 9.0, 12.0, 26.0, 35.0, 65.0, 80.0, 168.0, 246.0, 403.0, 723.0, 1325.0, 3873.0, 21812.0, 213083.0, 697701.0, 92719.0, 11213.0, 2508.0, 1048.0, 567.0, 350.0, 195.0, 126.0, 87.0, 62.0, 40.0, 16.0, 16.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.3125, -110.01171875, -106.7109375, -103.41015625, -100.109375, -96.80859375, -93.5078125, -90.20703125, -86.90625, -83.60546875, -80.3046875, -77.00390625, -73.703125, -70.40234375, -67.1015625, -63.80078125, -60.5, -57.19921875, -53.8984375, -50.59765625, -47.296875, -43.99609375, -40.6953125, -37.39453125, -34.09375, -30.79296875, -27.4921875, -24.19140625, -20.890625, -17.58984375, -14.2890625, -10.98828125, -7.6875, -4.38671875, -1.0859375, 2.21484375, 5.515625, 8.81640625, 12.1171875, 15.41796875, 18.71875, 22.01953125, 25.3203125, 28.62109375, 31.921875, 35.22265625, 38.5234375, 41.82421875, 45.125, 48.42578125, 51.7265625, 55.02734375, 58.328125, 61.62890625, 64.9296875, 68.23046875, 71.53125, 74.83203125, 78.1328125, 81.43359375, 84.734375, 88.03515625, 91.3359375, 94.63671875, 97.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 12.0, 5.0, 16.0, 10.0, 13.0, 19.0, 23.0, 33.0, 22.0, 32.0, 33.0, 34.0, 32.0, 41.0, 37.0, 42.0, 40.0, 46.0, 47.0, 42.0, 46.0, 53.0, 31.0, 48.0, 29.0, 22.0, 28.0, 22.0, 18.0, 25.0, 16.0, 11.0, 7.0, 13.0, 10.0, 7.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.23046875, -60.0234375, -57.81640625, -55.609375, -53.40234375, -51.1953125, -48.98828125, -46.78125, -44.57421875, -42.3671875, -40.16015625, -37.953125, -35.74609375, -33.5390625, -31.33203125, -29.125, -26.91796875, -24.7109375, -22.50390625, -20.296875, -18.08984375, -15.8828125, -13.67578125, -11.46875, -9.26171875, -7.0546875, -4.84765625, -2.640625, -0.43359375, 1.7734375, 3.98046875, 6.1875, 8.39453125, 10.6015625, 12.80859375, 15.015625, 17.22265625, 19.4296875, 21.63671875, 23.84375, 26.05078125, 28.2578125, 30.46484375, 32.671875, 34.87890625, 37.0859375, 39.29296875, 41.5, 43.70703125, 45.9140625, 48.12109375, 50.328125, 52.53515625, 54.7421875, 56.94921875, 59.15625, 61.36328125, 63.5703125, 65.77734375, 67.984375, 70.19140625, 72.3984375, 74.60546875, 76.8125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 6.0, 7.0, 14.0, 13.0, 17.0, 27.0, 43.0, 58.0, 64.0, 102.0, 171.0, 256.0, 483.0, 852.0, 1675.0, 3644.0, 8717.0, 22809.0, 74167.0, 291430.0, 454634.0, 130355.0, 36271.0, 12627.0, 5143.0, 2313.0, 1130.0, 570.0, 325.0, 214.0, 130.0, 85.0, 55.0, 47.0, 21.0, 17.0, 14.0, 14.0, 10.0, 11.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.8125, -21.065673828125, -20.31884765625, -19.572021484375, -18.8251953125, -18.078369140625, -17.33154296875, -16.584716796875, -15.837890625, -15.091064453125, -14.34423828125, -13.597412109375, -12.8505859375, -12.103759765625, -11.35693359375, -10.610107421875, -9.86328125, -9.116455078125, -8.36962890625, -7.622802734375, -6.8759765625, -6.129150390625, -5.38232421875, -4.635498046875, -3.888671875, -3.141845703125, -2.39501953125, -1.648193359375, -0.9013671875, -0.154541015625, 0.59228515625, 1.339111328125, 2.0859375, 2.832763671875, 3.57958984375, 4.326416015625, 5.0732421875, 5.820068359375, 6.56689453125, 7.313720703125, 8.060546875, 8.807373046875, 9.55419921875, 10.301025390625, 11.0478515625, 11.794677734375, 12.54150390625, 13.288330078125, 14.03515625, 14.781982421875, 15.52880859375, 16.275634765625, 17.0224609375, 17.769287109375, 18.51611328125, 19.262939453125, 20.009765625, 20.756591796875, 21.50341796875, 22.250244140625, 22.9970703125, 23.743896484375, 24.49072265625, 25.237548828125, 25.984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 12.0, 14.0, 22.0, 19.0, 30.0, 34.0, 50.0, 48.0, 74.0, 73.0, 82.0, 80.0, 73.0, 76.0, 62.0, 37.0, 36.0, 27.0, 34.0, 14.0, 20.0, 8.0, 8.0, 10.0, 8.0, 5.0, 2.0, 1.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0038967132568359375, -0.0037879645824432373, -0.003679215908050537, -0.003570467233657837, -0.0034617185592651367, -0.0033529698848724365, -0.0032442212104797363, -0.003135472536087036, -0.003026723861694336, -0.0029179751873016357, -0.0028092265129089355, -0.0027004778385162354, -0.002591729164123535, -0.002482980489730835, -0.0023742318153381348, -0.0022654831409454346, -0.0021567344665527344, -0.002047985792160034, -0.001939237117767334, -0.0018304884433746338, -0.0017217397689819336, -0.0016129910945892334, -0.0015042424201965332, -0.001395493745803833, -0.0012867450714111328, -0.0011779963970184326, -0.0010692477226257324, -0.0009604990482330322, -0.000851750373840332, -0.0007430016994476318, -0.0006342530250549316, -0.0005255043506622314, -0.00041675567626953125, -0.00030800700187683105, -0.00019925832748413086, -9.050965309143066e-05, 1.823902130126953e-05, 0.00012698769569396973, 0.00023573637008666992, 0.0003444850444793701, 0.0004532337188720703, 0.0005619823932647705, 0.0006707310676574707, 0.0007794797420501709, 0.0008882284164428711, 0.0009969770908355713, 0.0011057257652282715, 0.0012144744396209717, 0.0013232231140136719, 0.001431971788406372, 0.0015407204627990723, 0.0016494691371917725, 0.0017582178115844727, 0.0018669664859771729, 0.001975715160369873, 0.0020844638347625732, 0.0021932125091552734, 0.0023019611835479736, 0.002410709857940674, 0.002519458532333374, 0.0026282072067260742, 0.0027369558811187744, 0.0028457045555114746, 0.002954453229904175, 0.003063201904296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 22.0, 34.0, 41.0, 60.0, 119.0, 200.0, 422.0, 1075.0, 4072.0, 25106.0, 385583.0, 587790.0, 36429.0, 5204.0, 1378.0, 511.0, 207.0, 114.0, 59.0, 31.0, 30.0, 18.0, 10.0, 13.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0625, -57.37890625, -55.6953125, -54.01171875, -52.328125, -50.64453125, -48.9609375, -47.27734375, -45.59375, -43.91015625, -42.2265625, -40.54296875, -38.859375, -37.17578125, -35.4921875, -33.80859375, -32.125, -30.44140625, -28.7578125, -27.07421875, -25.390625, -23.70703125, -22.0234375, -20.33984375, -18.65625, -16.97265625, -15.2890625, -13.60546875, -11.921875, -10.23828125, -8.5546875, -6.87109375, -5.1875, -3.50390625, -1.8203125, -0.13671875, 1.546875, 3.23046875, 4.9140625, 6.59765625, 8.28125, 9.96484375, 11.6484375, 13.33203125, 15.015625, 16.69921875, 18.3828125, 20.06640625, 21.75, 23.43359375, 25.1171875, 26.80078125, 28.484375, 30.16796875, 31.8515625, 33.53515625, 35.21875, 36.90234375, 38.5859375, 40.26953125, 41.953125, 43.63671875, 45.3203125, 47.00390625, 48.6875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 10.0, 20.0, 35.0, 48.0, 61.0, 80.0, 130.0, 132.0, 146.0, 101.0, 90.0, 38.0, 39.0, 21.0, 7.0, 14.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.21875, -50.93603515625, -49.6533203125, -48.37060546875, -47.087890625, -45.80517578125, -44.5224609375, -43.23974609375, -41.95703125, -40.67431640625, -39.3916015625, -38.10888671875, -36.826171875, -35.54345703125, -34.2607421875, -32.97802734375, -31.6953125, -30.41259765625, -29.1298828125, -27.84716796875, -26.564453125, -25.28173828125, -23.9990234375, -22.71630859375, -21.43359375, -20.15087890625, -18.8681640625, -17.58544921875, -16.302734375, -15.02001953125, -13.7373046875, -12.45458984375, -11.171875, -9.88916015625, -8.6064453125, -7.32373046875, -6.041015625, -4.75830078125, -3.4755859375, -2.19287109375, -0.91015625, 0.37255859375, 1.6552734375, 2.93798828125, 4.220703125, 5.50341796875, 6.7861328125, 8.06884765625, 9.3515625, 10.63427734375, 11.9169921875, 13.19970703125, 14.482421875, 15.76513671875, 17.0478515625, 18.33056640625, 19.61328125, 20.89599609375, 22.1787109375, 23.46142578125, 24.744140625, 26.02685546875, 27.3095703125, 28.59228515625, 29.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 10.0, 27.0, 47.0, 68.0, 110.0, 169.0, 162.0, 133.0, 100.0, 77.0, 48.0, 23.0, 14.0, 4.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-349.2296142578125, -328.0545654296875, -306.8795166015625, -285.7044982910156, -264.5294494628906, -243.35440063476562, -222.1793670654297, -201.00433349609375, -179.82928466796875, -158.65423583984375, -137.4792022705078, -116.30416107177734, -95.12911987304688, -73.9540786743164, -52.77903747558594, -31.60400390625, -10.428955078125, 10.746086120605469, 31.921127319335938, 53.096168518066406, 74.27120971679688, 95.44625091552734, 116.62129211425781, 137.79632568359375, 158.97137451171875, 180.14642333984375, 201.3214569091797, 222.49649047851562, 243.67153930664062, 264.8465881347656, 286.0216064453125, 307.1966552734375, 328.3717041015625, 349.5467529296875, 370.7218017578125, 391.8968200683594, 413.0718688964844, 434.2469177246094, 455.42193603515625, 476.59698486328125, 497.77203369140625, 518.9470825195312, 540.1221313476562, 561.2971801757812, 582.47216796875, 603.647216796875, 624.822265625, 645.997314453125, 667.17236328125, 688.347412109375, 709.5224609375, 730.697509765625, 751.87255859375, 773.0475463867188, 794.2225952148438, 815.3976440429688, 836.5726928710938, 857.7477416992188, 878.9227905273438, 900.0978393554688, 921.2728271484375, 942.4478759765625, 963.6229248046875, 984.7979736328125, 1005.9730224609375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 8.0, 10.0, 9.0, 24.0, 12.0, 33.0, 22.0, 26.0, 32.0, 32.0, 21.0, 35.0, 42.0, 47.0, 42.0, 50.0, 43.0, 43.0, 38.0, 39.0, 26.0, 42.0, 42.0, 43.0, 34.0, 32.0, 19.0, 24.0, 23.0, 16.0, 10.0, 9.0, 9.0, 7.0, 6.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.5670166015625, -322.6954345703125, -311.8238525390625, -300.9522705078125, -290.0806884765625, -279.2091064453125, -268.3375244140625, -257.4659423828125, -246.5943603515625, -235.7227783203125, -224.8511962890625, -213.9796142578125, -203.1080322265625, -192.2364501953125, -181.3648681640625, -170.4932861328125, -159.6217041015625, -148.7501220703125, -137.8785400390625, -127.0069580078125, -116.1353759765625, -105.2637939453125, -94.3922119140625, -83.5206298828125, -72.6490478515625, -61.7774658203125, -50.9058837890625, -40.0343017578125, -29.1627197265625, -18.2911376953125, -7.4195556640625, 3.4520263671875, 14.3236083984375, 25.1951904296875, 36.0667724609375, 46.9383544921875, 57.8099365234375, 68.6815185546875, 79.5531005859375, 90.4246826171875, 101.2962646484375, 112.1678466796875, 123.0394287109375, 133.9110107421875, 144.7825927734375, 155.6541748046875, 166.5257568359375, 177.3973388671875, 188.2689208984375, 199.1405029296875, 210.0120849609375, 220.8836669921875, 231.7552490234375, 242.6268310546875, 253.4984130859375, 264.3699951171875, 275.2415771484375, 286.1131591796875, 296.9847412109375, 307.8563232421875, 318.7279052734375, 329.5994873046875, 340.4710693359375, 351.3426513671875, 362.2142333984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 14.0, 23.0, 24.0, 47.0, 85.0, 123.0, 200.0, 359.0, 725.0, 1604.0, 4013.0, 13559.0, 87485.0, 3984518.0, 81205.0, 13106.0, 3961.0, 1565.0, 696.0, 363.0, 229.0, 132.0, 68.0, 51.0, 32.0, 12.0, 21.0, 14.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.0, -132.015625, -127.03125, -122.046875, -117.0625, -112.078125, -107.09375, -102.109375, -97.125, -92.140625, -87.15625, -82.171875, -77.1875, -72.203125, -67.21875, -62.234375, -57.25, -52.265625, -47.28125, -42.296875, -37.3125, -32.328125, -27.34375, -22.359375, -17.375, -12.390625, -7.40625, -2.421875, 2.5625, 7.546875, 12.53125, 17.515625, 22.5, 27.484375, 32.46875, 37.453125, 42.4375, 47.421875, 52.40625, 57.390625, 62.375, 67.359375, 72.34375, 77.328125, 82.3125, 87.296875, 92.28125, 97.265625, 102.25, 107.234375, 112.21875, 117.203125, 122.1875, 127.171875, 132.15625, 137.140625, 142.125, 147.109375, 152.09375, 157.078125, 162.0625, 167.046875, 172.03125, 177.015625, 182.0]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 11.0, 20.0, 19.0, 26.0, 37.0, 23.0, 39.0, 55.0, 44.0, 53.0, 66.0, 70.0, 65.0, 75.0, 59.0, 59.0, 53.0, 31.0, 33.0, 38.0, 34.0, 13.0, 18.0, 7.0, 5.0, 9.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.3125, -20.600341796875, -19.88818359375, -19.176025390625, -18.4638671875, -17.751708984375, -17.03955078125, -16.327392578125, -15.615234375, -14.903076171875, -14.19091796875, -13.478759765625, -12.7666015625, -12.054443359375, -11.34228515625, -10.630126953125, -9.91796875, -9.205810546875, -8.49365234375, -7.781494140625, -7.0693359375, -6.357177734375, -5.64501953125, -4.932861328125, -4.220703125, -3.508544921875, -2.79638671875, -2.084228515625, -1.3720703125, -0.659912109375, 0.05224609375, 0.764404296875, 1.4765625, 2.188720703125, 2.90087890625, 3.613037109375, 4.3251953125, 5.037353515625, 5.74951171875, 6.461669921875, 7.173828125, 7.885986328125, 8.59814453125, 9.310302734375, 10.0224609375, 10.734619140625, 11.44677734375, 12.158935546875, 12.87109375, 13.583251953125, 14.29541015625, 15.007568359375, 15.7197265625, 16.431884765625, 17.14404296875, 17.856201171875, 18.568359375, 19.280517578125, 19.99267578125, 20.704833984375, 21.4169921875, 22.129150390625, 22.84130859375, 23.553466796875, 24.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 10.0, 11.0, 12.0, 11.0, 20.0, 20.0, 48.0, 70.0, 99.0, 142.0, 228.0, 394.0, 651.0, 1264.0, 2619.0, 5856.0, 16034.0, 55093.0, 508501.0, 3491311.0, 77198.0, 20740.0, 7470.0, 3093.0, 1449.0, 818.0, 401.0, 263.0, 159.0, 102.0, 56.0, 34.0, 29.0, 19.0, 20.0, 5.0, 8.0, 7.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0, -70.4033203125, -67.806640625, -65.2099609375, -62.61328125, -60.0166015625, -57.419921875, -54.8232421875, -52.2265625, -49.6298828125, -47.033203125, -44.4365234375, -41.83984375, -39.2431640625, -36.646484375, -34.0498046875, -31.453125, -28.8564453125, -26.259765625, -23.6630859375, -21.06640625, -18.4697265625, -15.873046875, -13.2763671875, -10.6796875, -8.0830078125, -5.486328125, -2.8896484375, -0.29296875, 2.3037109375, 4.900390625, 7.4970703125, 10.09375, 12.6904296875, 15.287109375, 17.8837890625, 20.48046875, 23.0771484375, 25.673828125, 28.2705078125, 30.8671875, 33.4638671875, 36.060546875, 38.6572265625, 41.25390625, 43.8505859375, 46.447265625, 49.0439453125, 51.640625, 54.2373046875, 56.833984375, 59.4306640625, 62.02734375, 64.6240234375, 67.220703125, 69.8173828125, 72.4140625, 75.0107421875, 77.607421875, 80.2041015625, 82.80078125, 85.3974609375, 87.994140625, 90.5908203125, 93.1875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 14.0, 14.0, 32.0, 41.0, 76.0, 97.0, 230.0, 2551.0, 556.0, 166.0, 89.0, 42.0, 36.0, 28.0, 25.0, 13.0, 16.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.4805908203125, -10.953369140625, -10.4261474609375, -9.89892578125, -9.3717041015625, -8.844482421875, -8.3172607421875, -7.7900390625, -7.2628173828125, -6.735595703125, -6.2083740234375, -5.68115234375, -5.1539306640625, -4.626708984375, -4.0994873046875, -3.572265625, -3.0450439453125, -2.517822265625, -1.9906005859375, -1.46337890625, -0.9361572265625, -0.408935546875, 0.1182861328125, 0.6455078125, 1.1727294921875, 1.699951171875, 2.2271728515625, 2.75439453125, 3.2816162109375, 3.808837890625, 4.3360595703125, 4.86328125, 5.3905029296875, 5.917724609375, 6.4449462890625, 6.97216796875, 7.4993896484375, 8.026611328125, 8.5538330078125, 9.0810546875, 9.6082763671875, 10.135498046875, 10.6627197265625, 11.18994140625, 11.7171630859375, 12.244384765625, 12.7716064453125, 13.298828125, 13.8260498046875, 14.353271484375, 14.8804931640625, 15.40771484375, 15.9349365234375, 16.462158203125, 16.9893798828125, 17.5166015625, 18.0438232421875, 18.571044921875, 19.0982666015625, 19.62548828125, 20.1527099609375, 20.679931640625, 21.2071533203125, 21.734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 15.0, 33.0, 33.0, 81.0, 99.0, 131.0, 158.0, 122.0, 109.0, 84.0, 46.0, 34.0, 19.0, 9.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.72802734375, -83.01950073242188, -79.31096649169922, -75.6024398803711, -71.89390563964844, -68.18537902832031, -64.47685241699219, -60.7683219909668, -57.059791564941406, -53.351261138916016, -49.642730712890625, -45.9342041015625, -42.22567367553711, -38.51714324951172, -34.808616638183594, -31.100086212158203, -27.391555786132812, -23.683025360107422, -19.974496841430664, -16.265968322753906, -12.557437896728516, -8.848907470703125, -5.140378952026367, -1.4318504333496094, 2.2766799926757812, 5.9852094650268555, 9.69373893737793, 13.402268409729004, 17.110797882080078, 20.81932830810547, 24.527856826782227, 28.236385345458984, 31.944915771484375, 35.653446197509766, 39.361976623535156, 43.07050323486328, 46.77903366088867, 50.48756408691406, 54.19609069824219, 57.90462112426758, 61.61315155029297, 65.3216781616211, 69.03021240234375, 72.73873901367188, 76.447265625, 80.15579986572266, 83.86432647705078, 87.57286071777344, 91.28138732910156, 94.98991394042969, 98.69844818115234, 102.40697479248047, 106.11550903320312, 109.82403564453125, 113.53256225585938, 117.2410888671875, 120.94962310791016, 124.65814971923828, 128.36668395996094, 132.07521057128906, 135.7837371826172, 139.49227905273438, 143.2008056640625, 146.90933227539062, 150.61785888671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 6.0, 7.0, 11.0, 22.0, 18.0, 23.0, 26.0, 24.0, 29.0, 26.0, 41.0, 27.0, 25.0, 35.0, 47.0, 45.0, 33.0, 38.0, 60.0, 44.0, 34.0, 33.0, 34.0, 29.0, 32.0, 24.0, 27.0, 21.0, 17.0, 15.0, 21.0, 23.0, 16.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-44.682899475097656, -43.43684768676758, -42.190792083740234, -40.944740295410156, -39.69868850708008, -38.45263671875, -37.206581115722656, -35.96052932739258, -34.7144775390625, -33.46842575073242, -32.22237014770508, -30.976318359375, -29.730266571044922, -28.48421287536621, -27.2381591796875, -25.992107391357422, -24.74605369567871, -23.5, -22.253948211669922, -21.00789451599121, -19.761842727661133, -18.515789031982422, -17.269737243652344, -16.023683547973633, -14.777630805969238, -13.531578063964844, -12.28552532196045, -11.039472579956055, -9.793418884277344, -8.547367095947266, -7.301313400268555, -6.05526065826416, -4.809207916259766, -3.563155174255371, -2.3171021938323975, -1.0710492134094238, 0.1750035285949707, 1.4210562705993652, 2.667109489440918, 3.9131622314453125, 5.159214973449707, 6.405267715454102, 7.651320457458496, 8.89737319946289, 10.143426895141602, 11.38947868347168, 12.63553237915039, 13.881585121154785, 15.12763786315918, 16.37369155883789, 17.61974334716797, 18.86579704284668, 20.111848831176758, 21.35790252685547, 22.603954315185547, 23.850008010864258, 25.09606170654297, 26.34211540222168, 27.588167190551758, 28.83422088623047, 30.080272674560547, 31.326326370239258, 32.57238006591797, 33.81843185424805, 35.064483642578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 24.0, 19.0, 18.0, 54.0, 81.0, 111.0, 192.0, 298.0, 601.0, 1187.0, 2622.0, 5884.0, 16027.0, 47227.0, 148620.0, 367751.0, 299356.0, 104417.0, 33644.0, 11794.0, 4521.0, 1835.0, 986.0, 481.0, 271.0, 186.0, 107.0, 73.0, 39.0, 36.0, 20.0, 17.0, 12.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4375, -49.822265625, -48.20703125, -46.591796875, -44.9765625, -43.361328125, -41.74609375, -40.130859375, -38.515625, -36.900390625, -35.28515625, -33.669921875, -32.0546875, -30.439453125, -28.82421875, -27.208984375, -25.59375, -23.978515625, -22.36328125, -20.748046875, -19.1328125, -17.517578125, -15.90234375, -14.287109375, -12.671875, -11.056640625, -9.44140625, -7.826171875, -6.2109375, -4.595703125, -2.98046875, -1.365234375, 0.25, 1.865234375, 3.48046875, 5.095703125, 6.7109375, 8.326171875, 9.94140625, 11.556640625, 13.171875, 14.787109375, 16.40234375, 18.017578125, 19.6328125, 21.248046875, 22.86328125, 24.478515625, 26.09375, 27.708984375, 29.32421875, 30.939453125, 32.5546875, 34.169921875, 35.78515625, 37.400390625, 39.015625, 40.630859375, 42.24609375, 43.861328125, 45.4765625, 47.091796875, 48.70703125, 50.322265625, 51.9375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 6.0, 14.0, 21.0, 29.0, 24.0, 21.0, 24.0, 35.0, 48.0, 50.0, 47.0, 58.0, 67.0, 41.0, 67.0, 57.0, 57.0, 61.0, 49.0, 36.0, 41.0, 34.0, 26.0, 20.0, 11.0, 11.0, 9.0, 9.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.421875, -21.691650390625, -20.96142578125, -20.231201171875, -19.5009765625, -18.770751953125, -18.04052734375, -17.310302734375, -16.580078125, -15.849853515625, -15.11962890625, -14.389404296875, -13.6591796875, -12.928955078125, -12.19873046875, -11.468505859375, -10.73828125, -10.008056640625, -9.27783203125, -8.547607421875, -7.8173828125, -7.087158203125, -6.35693359375, -5.626708984375, -4.896484375, -4.166259765625, -3.43603515625, -2.705810546875, -1.9755859375, -1.245361328125, -0.51513671875, 0.215087890625, 0.9453125, 1.675537109375, 2.40576171875, 3.135986328125, 3.8662109375, 4.596435546875, 5.32666015625, 6.056884765625, 6.787109375, 7.517333984375, 8.24755859375, 8.977783203125, 9.7080078125, 10.438232421875, 11.16845703125, 11.898681640625, 12.62890625, 13.359130859375, 14.08935546875, 14.819580078125, 15.5498046875, 16.280029296875, 17.01025390625, 17.740478515625, 18.470703125, 19.200927734375, 19.93115234375, 20.661376953125, 21.3916015625, 22.121826171875, 22.85205078125, 23.582275390625, 24.3125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 10.0, 14.0, 33.0, 52.0, 102.0, 205.0, 445.0, 873.0, 2228.0, 15214.0, 672271.0, 344929.0, 8897.0, 1811.0, 760.0, 350.0, 206.0, 84.0, 34.0, 20.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.0, -142.083984375, -137.16796875, -132.251953125, -127.3359375, -122.419921875, -117.50390625, -112.587890625, -107.671875, -102.755859375, -97.83984375, -92.923828125, -88.0078125, -83.091796875, -78.17578125, -73.259765625, -68.34375, -63.427734375, -58.51171875, -53.595703125, -48.6796875, -43.763671875, -38.84765625, -33.931640625, -29.015625, -24.099609375, -19.18359375, -14.267578125, -9.3515625, -4.435546875, 0.48046875, 5.396484375, 10.3125, 15.228515625, 20.14453125, 25.060546875, 29.9765625, 34.892578125, 39.80859375, 44.724609375, 49.640625, 54.556640625, 59.47265625, 64.388671875, 69.3046875, 74.220703125, 79.13671875, 84.052734375, 88.96875, 93.884765625, 98.80078125, 103.716796875, 108.6328125, 113.548828125, 118.46484375, 123.380859375, 128.296875, 133.212890625, 138.12890625, 143.044921875, 147.9609375, 152.876953125, 157.79296875, 162.708984375, 167.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 0.0, 11.0, 10.0, 12.0, 9.0, 22.0, 16.0, 14.0, 34.0, 25.0, 32.0, 31.0, 40.0, 38.0, 44.0, 48.0, 40.0, 39.0, 62.0, 51.0, 37.0, 61.0, 38.0, 38.0, 34.0, 29.0, 37.0, 33.0, 18.0, 19.0, 9.0, 5.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.0, -77.3701171875, -74.740234375, -72.1103515625, -69.48046875, -66.8505859375, -64.220703125, -61.5908203125, -58.9609375, -56.3310546875, -53.701171875, -51.0712890625, -48.44140625, -45.8115234375, -43.181640625, -40.5517578125, -37.921875, -35.2919921875, -32.662109375, -30.0322265625, -27.40234375, -24.7724609375, -22.142578125, -19.5126953125, -16.8828125, -14.2529296875, -11.623046875, -8.9931640625, -6.36328125, -3.7333984375, -1.103515625, 1.5263671875, 4.15625, 6.7861328125, 9.416015625, 12.0458984375, 14.67578125, 17.3056640625, 19.935546875, 22.5654296875, 25.1953125, 27.8251953125, 30.455078125, 33.0849609375, 35.71484375, 38.3447265625, 40.974609375, 43.6044921875, 46.234375, 48.8642578125, 51.494140625, 54.1240234375, 56.75390625, 59.3837890625, 62.013671875, 64.6435546875, 67.2734375, 69.9033203125, 72.533203125, 75.1630859375, 77.79296875, 80.4228515625, 83.052734375, 85.6826171875, 88.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 16.0, 24.0, 44.0, 59.0, 113.0, 265.0, 767.0, 3195.0, 44200.0, 955077.0, 40290.0, 3187.0, 778.0, 272.0, 118.0, 68.0, 29.0, 17.0, 11.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.75, -76.2490234375, -73.748046875, -71.2470703125, -68.74609375, -66.2451171875, -63.744140625, -61.2431640625, -58.7421875, -56.2412109375, -53.740234375, -51.2392578125, -48.73828125, -46.2373046875, -43.736328125, -41.2353515625, -38.734375, -36.2333984375, -33.732421875, -31.2314453125, -28.73046875, -26.2294921875, -23.728515625, -21.2275390625, -18.7265625, -16.2255859375, -13.724609375, -11.2236328125, -8.72265625, -6.2216796875, -3.720703125, -1.2197265625, 1.28125, 3.7822265625, 6.283203125, 8.7841796875, 11.28515625, 13.7861328125, 16.287109375, 18.7880859375, 21.2890625, 23.7900390625, 26.291015625, 28.7919921875, 31.29296875, 33.7939453125, 36.294921875, 38.7958984375, 41.296875, 43.7978515625, 46.298828125, 48.7998046875, 51.30078125, 53.8017578125, 56.302734375, 58.8037109375, 61.3046875, 63.8056640625, 66.306640625, 68.8076171875, 71.30859375, 73.8095703125, 76.310546875, 78.8115234375, 81.3125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 10.0, 3.0, 9.0, 12.0, 15.0, 19.0, 30.0, 38.0, 48.0, 55.0, 63.0, 103.0, 108.0, 95.0, 93.0, 71.0, 52.0, 40.0, 32.0, 23.0, 15.0, 6.0, 11.0, 6.0, 9.0, 6.0, 5.0, 1.0, 6.0, 2.0, 4.0, 2.0], "bins": [-0.00531005859375, -0.005191385746002197, -0.0050727128982543945, -0.004954040050506592, -0.004835367202758789, -0.004716694355010986, -0.004598021507263184, -0.004479348659515381, -0.004360675811767578, -0.004242002964019775, -0.004123330116271973, -0.00400465726852417, -0.003885984420776367, -0.0037673115730285645, -0.0036486387252807617, -0.003529965877532959, -0.0034112930297851562, -0.0032926201820373535, -0.0031739473342895508, -0.003055274486541748, -0.0029366016387939453, -0.0028179287910461426, -0.00269925594329834, -0.002580583095550537, -0.0024619102478027344, -0.0023432374000549316, -0.002224564552307129, -0.002105891704559326, -0.0019872188568115234, -0.0018685460090637207, -0.001749873161315918, -0.0016312003135681152, -0.0015125274658203125, -0.0013938546180725098, -0.001275181770324707, -0.0011565089225769043, -0.0010378360748291016, -0.0009191632270812988, -0.0008004903793334961, -0.0006818175315856934, -0.0005631446838378906, -0.0004444718360900879, -0.00032579898834228516, -0.00020712614059448242, -8.845329284667969e-05, 3.0219554901123047e-05, 0.00014889240264892578, 0.0002675652503967285, 0.00038623809814453125, 0.000504910945892334, 0.0006235837936401367, 0.0007422566413879395, 0.0008609294891357422, 0.000979602336883545, 0.0010982751846313477, 0.0012169480323791504, 0.0013356208801269531, 0.0014542937278747559, 0.0015729665756225586, 0.0016916394233703613, 0.001810312271118164, 0.0019289851188659668, 0.0020476579666137695, 0.0021663308143615723, 0.002285003662109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 4.0, 13.0, 21.0, 22.0, 41.0, 75.0, 117.0, 192.0, 400.0, 1115.0, 3756.0, 25911.0, 784818.0, 217924.0, 10466.0, 2254.0, 739.0, 284.0, 151.0, 77.0, 64.0, 42.0, 21.0, 15.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8125, -59.8056640625, -57.798828125, -55.7919921875, -53.78515625, -51.7783203125, -49.771484375, -47.7646484375, -45.7578125, -43.7509765625, -41.744140625, -39.7373046875, -37.73046875, -35.7236328125, -33.716796875, -31.7099609375, -29.703125, -27.6962890625, -25.689453125, -23.6826171875, -21.67578125, -19.6689453125, -17.662109375, -15.6552734375, -13.6484375, -11.6416015625, -9.634765625, -7.6279296875, -5.62109375, -3.6142578125, -1.607421875, 0.3994140625, 2.40625, 4.4130859375, 6.419921875, 8.4267578125, 10.43359375, 12.4404296875, 14.447265625, 16.4541015625, 18.4609375, 20.4677734375, 22.474609375, 24.4814453125, 26.48828125, 28.4951171875, 30.501953125, 32.5087890625, 34.515625, 36.5224609375, 38.529296875, 40.5361328125, 42.54296875, 44.5498046875, 46.556640625, 48.5634765625, 50.5703125, 52.5771484375, 54.583984375, 56.5908203125, 58.59765625, 60.6044921875, 62.611328125, 64.6181640625, 66.625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 5.0, 22.0, 46.0, 107.0, 217.0, 205.0, 193.0, 107.0, 35.0, 23.0, 8.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.859375, -28.842041015625, -26.82470703125, -24.807373046875, -22.7900390625, -20.772705078125, -18.75537109375, -16.738037109375, -14.720703125, -12.703369140625, -10.68603515625, -8.668701171875, -6.6513671875, -4.634033203125, -2.61669921875, -0.599365234375, 1.41796875, 3.435302734375, 5.45263671875, 7.469970703125, 9.4873046875, 11.504638671875, 13.52197265625, 15.539306640625, 17.556640625, 19.573974609375, 21.59130859375, 23.608642578125, 25.6259765625, 27.643310546875, 29.66064453125, 31.677978515625, 33.6953125, 35.712646484375, 37.72998046875, 39.747314453125, 41.7646484375, 43.781982421875, 45.79931640625, 47.816650390625, 49.833984375, 51.851318359375, 53.86865234375, 55.885986328125, 57.9033203125, 59.920654296875, 61.93798828125, 63.955322265625, 65.97265625, 67.989990234375, 70.00732421875, 72.024658203125, 74.0419921875, 76.059326171875, 78.07666015625, 80.093994140625, 82.111328125, 84.128662109375, 86.14599609375, 88.163330078125, 90.1806640625, 92.197998046875, 94.21533203125, 96.232666015625, 98.25]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 8.0, 16.0, 85.0, 198.0, 320.0, 240.0, 97.0, 26.0, 13.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.1193542480469, -271.5897216796875, -231.06005859375, -190.53042602539062, -150.0007781982422, -109.47113037109375, -68.94149780273438, -28.411834716796875, 12.1177978515625, 52.64744186401367, 93.17708587646484, 133.70672607421875, 174.2363739013672, 214.76602172851562, 255.295654296875, 295.8253173828125, 336.3549499511719, 376.88458251953125, 417.41424560546875, 457.9438781738281, 498.4735107421875, 539.003173828125, 579.5328369140625, 620.0625, 660.5921020507812, 701.1217651367188, 741.6513671875, 782.1810302734375, 822.710693359375, 863.2403564453125, 903.7699584960938, 944.2996215820312, 984.8292236328125, 1025.35888671875, 1065.8885498046875, 1106.418212890625, 1146.94775390625, 1187.4774169921875, 1228.007080078125, 1268.5367431640625, 1309.06640625, 1349.5960693359375, 1390.125732421875, 1430.6552734375, 1471.1849365234375, 1511.714599609375, 1552.2442626953125, 1592.77392578125, 1633.303466796875, 1673.8331298828125, 1714.36279296875, 1754.892333984375, 1795.4219970703125, 1835.95166015625, 1876.4813232421875, 1917.010986328125, 1957.5406494140625, 1998.0703125, 2038.5999755859375, 2079.129638671875, 2119.6591796875, 2160.18896484375, 2200.718505859375, 2241.248046875, 2281.77783203125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 7.0, 7.0, 19.0, 9.0, 6.0, 12.0, 12.0, 19.0, 25.0, 20.0, 37.0, 40.0, 31.0, 57.0, 39.0, 52.0, 47.0, 37.0, 56.0, 59.0, 50.0, 43.0, 50.0, 43.0, 32.0, 25.0, 27.0, 21.0, 21.0, 13.0, 14.0, 14.0, 10.0, 9.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-373.48114013671875, -361.5601806640625, -349.6391906738281, -337.7182312011719, -325.7972412109375, -313.87628173828125, -301.955322265625, -290.0343322753906, -278.1133728027344, -266.1924133300781, -254.27142333984375, -242.3504638671875, -230.4294891357422, -218.50851440429688, -206.58753967285156, -194.66656494140625, -182.74559020996094, -170.82461547851562, -158.9036407470703, -146.982666015625, -135.06170654296875, -123.14073181152344, -111.21975708007812, -99.29878997802734, -87.37781524658203, -75.45684051513672, -63.53587341308594, -51.614898681640625, -39.69392776489258, -27.77295684814453, -15.851982116699219, -3.9310150146484375, 7.989959716796875, 19.910930633544922, 31.8319034576416, 43.75287628173828, 55.67384719848633, 67.59481811523438, 79.51579284667969, 91.43675994873047, 103.35773468017578, 115.2787094116211, 127.19967651367188, 139.1206512451172, 151.0416259765625, 162.96258544921875, 174.88357543945312, 186.80453491210938, 198.7255096435547, 210.646484375, 222.5674591064453, 234.48843383789062, 246.40939331054688, 258.33038330078125, 270.2513427734375, 282.17230224609375, 294.0932922363281, 306.0142517089844, 317.93524169921875, 329.856201171875, 341.7771911621094, 353.6981506347656, 365.619140625, 377.54010009765625, 389.4610595703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 10.0, 12.0, 22.0, 26.0, 36.0, 66.0, 76.0, 130.0, 195.0, 325.0, 607.0, 994.0, 2014.0, 4417.0, 10664.0, 44278.0, 4059196.0, 50600.0, 11242.0, 4514.0, 2124.0, 1149.0, 575.0, 364.0, 211.0, 154.0, 89.0, 58.0, 43.0, 18.0, 20.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-119.6875, -115.8916015625, -112.095703125, -108.2998046875, -104.50390625, -100.7080078125, -96.912109375, -93.1162109375, -89.3203125, -85.5244140625, -81.728515625, -77.9326171875, -74.13671875, -70.3408203125, -66.544921875, -62.7490234375, -58.953125, -55.1572265625, -51.361328125, -47.5654296875, -43.76953125, -39.9736328125, -36.177734375, -32.3818359375, -28.5859375, -24.7900390625, -20.994140625, -17.1982421875, -13.40234375, -9.6064453125, -5.810546875, -2.0146484375, 1.78125, 5.5771484375, 9.373046875, 13.1689453125, 16.96484375, 20.7607421875, 24.556640625, 28.3525390625, 32.1484375, 35.9443359375, 39.740234375, 43.5361328125, 47.33203125, 51.1279296875, 54.923828125, 58.7197265625, 62.515625, 66.3115234375, 70.107421875, 73.9033203125, 77.69921875, 81.4951171875, 85.291015625, 89.0869140625, 92.8828125, 96.6787109375, 100.474609375, 104.2705078125, 108.06640625, 111.8623046875, 115.658203125, 119.4541015625, 123.25]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 11.0, 2.0, 11.0, 14.0, 27.0, 33.0, 39.0, 40.0, 47.0, 51.0, 64.0, 75.0, 63.0, 80.0, 62.0, 73.0, 56.0, 51.0, 43.0, 26.0, 27.0, 22.0, 17.0, 16.0, 13.0, 8.0, 10.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.875, -28.02734375, -27.1796875, -26.33203125, -25.484375, -24.63671875, -23.7890625, -22.94140625, -22.09375, -21.24609375, -20.3984375, -19.55078125, -18.703125, -17.85546875, -17.0078125, -16.16015625, -15.3125, -14.46484375, -13.6171875, -12.76953125, -11.921875, -11.07421875, -10.2265625, -9.37890625, -8.53125, -7.68359375, -6.8359375, -5.98828125, -5.140625, -4.29296875, -3.4453125, -2.59765625, -1.75, -0.90234375, -0.0546875, 0.79296875, 1.640625, 2.48828125, 3.3359375, 4.18359375, 5.03125, 5.87890625, 6.7265625, 7.57421875, 8.421875, 9.26953125, 10.1171875, 10.96484375, 11.8125, 12.66015625, 13.5078125, 14.35546875, 15.203125, 16.05078125, 16.8984375, 17.74609375, 18.59375, 19.44140625, 20.2890625, 21.13671875, 21.984375, 22.83203125, 23.6796875, 24.52734375, 25.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 6.0, 7.0, 15.0, 27.0, 28.0, 30.0, 74.0, 84.0, 137.0, 169.0, 269.0, 476.0, 734.0, 1479.0, 2870.0, 6762.0, 19320.0, 187115.0, 3928118.0, 30077.0, 8869.0, 3675.0, 1661.0, 855.0, 467.0, 292.0, 208.0, 132.0, 92.0, 67.0, 39.0, 32.0, 32.0, 24.0, 15.0, 10.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.3125, -75.0693359375, -71.826171875, -68.5830078125, -65.33984375, -62.0966796875, -58.853515625, -55.6103515625, -52.3671875, -49.1240234375, -45.880859375, -42.6376953125, -39.39453125, -36.1513671875, -32.908203125, -29.6650390625, -26.421875, -23.1787109375, -19.935546875, -16.6923828125, -13.44921875, -10.2060546875, -6.962890625, -3.7197265625, -0.4765625, 2.7666015625, 6.009765625, 9.2529296875, 12.49609375, 15.7392578125, 18.982421875, 22.2255859375, 25.46875, 28.7119140625, 31.955078125, 35.1982421875, 38.44140625, 41.6845703125, 44.927734375, 48.1708984375, 51.4140625, 54.6572265625, 57.900390625, 61.1435546875, 64.38671875, 67.6298828125, 70.873046875, 74.1162109375, 77.359375, 80.6025390625, 83.845703125, 87.0888671875, 90.33203125, 93.5751953125, 96.818359375, 100.0615234375, 103.3046875, 106.5478515625, 109.791015625, 113.0341796875, 116.27734375, 119.5205078125, 122.763671875, 126.0068359375, 129.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 8.0, 6.0, 8.0, 12.0, 40.0, 83.0, 3285.0, 439.0, 93.0, 31.0, 20.0, 13.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.4375, -23.69482421875, -22.9521484375, -22.20947265625, -21.466796875, -20.72412109375, -19.9814453125, -19.23876953125, -18.49609375, -17.75341796875, -17.0107421875, -16.26806640625, -15.525390625, -14.78271484375, -14.0400390625, -13.29736328125, -12.5546875, -11.81201171875, -11.0693359375, -10.32666015625, -9.583984375, -8.84130859375, -8.0986328125, -7.35595703125, -6.61328125, -5.87060546875, -5.1279296875, -4.38525390625, -3.642578125, -2.89990234375, -2.1572265625, -1.41455078125, -0.671875, 0.07080078125, 0.8134765625, 1.55615234375, 2.298828125, 3.04150390625, 3.7841796875, 4.52685546875, 5.26953125, 6.01220703125, 6.7548828125, 7.49755859375, 8.240234375, 8.98291015625, 9.7255859375, 10.46826171875, 11.2109375, 11.95361328125, 12.6962890625, 13.43896484375, 14.181640625, 14.92431640625, 15.6669921875, 16.40966796875, 17.15234375, 17.89501953125, 18.6376953125, 19.38037109375, 20.123046875, 20.86572265625, 21.6083984375, 22.35107421875, 23.09375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 10.0, 5.0, 9.0, 11.0, 26.0, 28.0, 40.0, 58.0, 73.0, 95.0, 104.0, 90.0, 102.0, 101.0, 78.0, 48.0, 42.0, 24.0, 20.0, 13.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.728843688964844, -48.334014892578125, -45.939186096191406, -43.54435729980469, -41.14952850341797, -38.75469970703125, -36.35987091064453, -33.96504211425781, -31.570215225219727, -29.175386428833008, -26.78055763244629, -24.385730743408203, -21.990901947021484, -19.596073150634766, -17.201244354248047, -14.806415557861328, -12.41158676147461, -10.01675796508789, -7.62192964553833, -5.2271013259887695, -2.832272529602051, -0.43744373321533203, 1.9573841094970703, 4.352212905883789, 6.747041702270508, 9.141870498657227, 11.536699295043945, 13.931527137756348, 16.32635498046875, 18.72118377685547, 21.116012573242188, 23.510841369628906, 25.905670166015625, 28.300498962402344, 30.695327758789062, 33.09015655517578, 35.4849853515625, 37.87981414794922, 40.27464294433594, 42.669471740722656, 45.064300537109375, 47.459129333496094, 49.85395812988281, 52.24878692626953, 54.64361572265625, 57.03844451904297, 59.43327331542969, 61.828102111816406, 64.22293090820312, 66.61775970458984, 69.01258850097656, 71.40741729736328, 73.80224609375, 76.19707489013672, 78.59190368652344, 80.98673248291016, 83.38155364990234, 85.77638244628906, 88.17121124267578, 90.5660400390625, 92.96086883544922, 95.35569763183594, 97.75052642822266, 100.14535522460938, 102.5401840209961]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 7.0, 9.0, 5.0, 12.0, 9.0, 21.0, 19.0, 21.0, 27.0, 32.0, 25.0, 23.0, 31.0, 42.0, 30.0, 43.0, 28.0, 41.0, 42.0, 43.0, 40.0, 45.0, 36.0, 32.0, 47.0, 37.0, 29.0, 18.0, 32.0, 25.0, 19.0, 11.0, 12.0, 10.0, 6.0, 16.0, 7.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-33.992958068847656, -32.957664489746094, -31.9223690032959, -30.887075424194336, -29.851781845092773, -28.816486358642578, -27.781192779541016, -26.745899200439453, -25.71060562133789, -24.675312042236328, -23.640016555786133, -22.60472297668457, -21.569429397583008, -20.534133911132812, -19.49884033203125, -18.463546752929688, -17.428251266479492, -16.39295768737793, -15.35766315460205, -14.322368621826172, -13.28707504272461, -12.25178050994873, -11.216485977172852, -10.181192398071289, -9.14589786529541, -8.110603332519531, -7.075309753417969, -6.04001522064209, -5.004721164703369, -3.9694271087646484, -2.9341325759887695, -1.8988385200500488, -0.8635444641113281, 0.17174971103668213, 1.2070438861846924, 2.242338180541992, 3.277632236480713, 4.312926292419434, 5.3482208251953125, 6.383514881134033, 7.418808937072754, 8.454103469848633, 9.489397048950195, 10.524691581726074, 11.559986114501953, 12.595279693603516, 13.630574226379395, 14.665868759155273, 15.701162338256836, 16.7364559173584, 17.771751403808594, 18.807044982910156, 19.84233856201172, 20.87763214111328, 21.912927627563477, 22.94822120666504, 23.983516693115234, 25.018810272216797, 26.054105758666992, 27.089399337768555, 28.124692916870117, 29.159988403320312, 30.195281982421875, 31.230575561523438, 32.265869140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 16.0, 33.0, 31.0, 86.0, 149.0, 265.0, 518.0, 1157.0, 2775.0, 8022.0, 27098.0, 105403.0, 383085.0, 377551.0, 103199.0, 26142.0, 7956.0, 2824.0, 1135.0, 497.0, 259.0, 141.0, 75.0, 36.0, 31.0, 22.0, 10.0, 12.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.84375, -57.00439453125, -55.1650390625, -53.32568359375, -51.486328125, -49.64697265625, -47.8076171875, -45.96826171875, -44.12890625, -42.28955078125, -40.4501953125, -38.61083984375, -36.771484375, -34.93212890625, -33.0927734375, -31.25341796875, -29.4140625, -27.57470703125, -25.7353515625, -23.89599609375, -22.056640625, -20.21728515625, -18.3779296875, -16.53857421875, -14.69921875, -12.85986328125, -11.0205078125, -9.18115234375, -7.341796875, -5.50244140625, -3.6630859375, -1.82373046875, 0.015625, 1.85498046875, 3.6943359375, 5.53369140625, 7.373046875, 9.21240234375, 11.0517578125, 12.89111328125, 14.73046875, 16.56982421875, 18.4091796875, 20.24853515625, 22.087890625, 23.92724609375, 25.7666015625, 27.60595703125, 29.4453125, 31.28466796875, 33.1240234375, 34.96337890625, 36.802734375, 38.64208984375, 40.4814453125, 42.32080078125, 44.16015625, 45.99951171875, 47.8388671875, 49.67822265625, 51.517578125, 53.35693359375, 55.1962890625, 57.03564453125, 58.875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 5.0, 5.0, 11.0, 8.0, 13.0, 13.0, 27.0, 24.0, 31.0, 41.0, 42.0, 58.0, 46.0, 57.0, 65.0, 69.0, 45.0, 73.0, 64.0, 64.0, 45.0, 39.0, 26.0, 27.0, 17.0, 17.0, 20.0, 7.0, 11.0, 9.0, 7.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.96875, -27.1396484375, -26.310546875, -25.4814453125, -24.65234375, -23.8232421875, -22.994140625, -22.1650390625, -21.3359375, -20.5068359375, -19.677734375, -18.8486328125, -18.01953125, -17.1904296875, -16.361328125, -15.5322265625, -14.703125, -13.8740234375, -13.044921875, -12.2158203125, -11.38671875, -10.5576171875, -9.728515625, -8.8994140625, -8.0703125, -7.2412109375, -6.412109375, -5.5830078125, -4.75390625, -3.9248046875, -3.095703125, -2.2666015625, -1.4375, -0.6083984375, 0.220703125, 1.0498046875, 1.87890625, 2.7080078125, 3.537109375, 4.3662109375, 5.1953125, 6.0244140625, 6.853515625, 7.6826171875, 8.51171875, 9.3408203125, 10.169921875, 10.9990234375, 11.828125, 12.6572265625, 13.486328125, 14.3154296875, 15.14453125, 15.9736328125, 16.802734375, 17.6318359375, 18.4609375, 19.2900390625, 20.119140625, 20.9482421875, 21.77734375, 22.6064453125, 23.435546875, 24.2646484375, 25.09375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 11.0, 18.0, 24.0, 36.0, 43.0, 93.0, 126.0, 194.0, 314.0, 477.0, 875.0, 1686.0, 5586.0, 46802.0, 706049.0, 263027.0, 16880.0, 3305.0, 1240.0, 647.0, 438.0, 232.0, 163.0, 104.0, 68.0, 39.0, 25.0, 20.0, 15.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -65.71484375, -62.5546875, -59.39453125, -56.234375, -53.07421875, -49.9140625, -46.75390625, -43.59375, -40.43359375, -37.2734375, -34.11328125, -30.953125, -27.79296875, -24.6328125, -21.47265625, -18.3125, -15.15234375, -11.9921875, -8.83203125, -5.671875, -2.51171875, 0.6484375, 3.80859375, 6.96875, 10.12890625, 13.2890625, 16.44921875, 19.609375, 22.76953125, 25.9296875, 29.08984375, 32.25, 35.41015625, 38.5703125, 41.73046875, 44.890625, 48.05078125, 51.2109375, 54.37109375, 57.53125, 60.69140625, 63.8515625, 67.01171875, 70.171875, 73.33203125, 76.4921875, 79.65234375, 82.8125, 85.97265625, 89.1328125, 92.29296875, 95.453125, 98.61328125, 101.7734375, 104.93359375, 108.09375, 111.25390625, 114.4140625, 117.57421875, 120.734375, 123.89453125, 127.0546875, 130.21484375, 133.375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 10.0, 8.0, 17.0, 21.0, 18.0, 29.0, 39.0, 42.0, 57.0, 59.0, 63.0, 76.0, 78.0, 66.0, 72.0, 68.0, 58.0, 51.0, 39.0, 37.0, 29.0, 19.0, 12.0, 13.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-185.25, -180.783203125, -176.31640625, -171.849609375, -167.3828125, -162.916015625, -158.44921875, -153.982421875, -149.515625, -145.048828125, -140.58203125, -136.115234375, -131.6484375, -127.181640625, -122.71484375, -118.248046875, -113.78125, -109.314453125, -104.84765625, -100.380859375, -95.9140625, -91.447265625, -86.98046875, -82.513671875, -78.046875, -73.580078125, -69.11328125, -64.646484375, -60.1796875, -55.712890625, -51.24609375, -46.779296875, -42.3125, -37.845703125, -33.37890625, -28.912109375, -24.4453125, -19.978515625, -15.51171875, -11.044921875, -6.578125, -2.111328125, 2.35546875, 6.822265625, 11.2890625, 15.755859375, 20.22265625, 24.689453125, 29.15625, 33.623046875, 38.08984375, 42.556640625, 47.0234375, 51.490234375, 55.95703125, 60.423828125, 64.890625, 69.357421875, 73.82421875, 78.291015625, 82.7578125, 87.224609375, 91.69140625, 96.158203125, 100.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 9.0, 11.0, 14.0, 28.0, 27.0, 38.0, 64.0, 87.0, 130.0, 242.0, 481.0, 1224.0, 4872.0, 40474.0, 774147.0, 208867.0, 13804.0, 2385.0, 802.0, 320.0, 201.0, 87.0, 62.0, 43.0, 29.0, 25.0, 11.0, 11.0, 11.0, 8.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.76708984375, -40.3154296875, -38.86376953125, -37.412109375, -35.96044921875, -34.5087890625, -33.05712890625, -31.60546875, -30.15380859375, -28.7021484375, -27.25048828125, -25.798828125, -24.34716796875, -22.8955078125, -21.44384765625, -19.9921875, -18.54052734375, -17.0888671875, -15.63720703125, -14.185546875, -12.73388671875, -11.2822265625, -9.83056640625, -8.37890625, -6.92724609375, -5.4755859375, -4.02392578125, -2.572265625, -1.12060546875, 0.3310546875, 1.78271484375, 3.234375, 4.68603515625, 6.1376953125, 7.58935546875, 9.041015625, 10.49267578125, 11.9443359375, 13.39599609375, 14.84765625, 16.29931640625, 17.7509765625, 19.20263671875, 20.654296875, 22.10595703125, 23.5576171875, 25.00927734375, 26.4609375, 27.91259765625, 29.3642578125, 30.81591796875, 32.267578125, 33.71923828125, 35.1708984375, 36.62255859375, 38.07421875, 39.52587890625, 40.9775390625, 42.42919921875, 43.880859375, 45.33251953125, 46.7841796875, 48.23583984375, 49.6875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 6.0, 8.0, 8.0, 20.0, 14.0, 24.0, 36.0, 40.0, 56.0, 93.0, 113.0, 129.0, 112.0, 92.0, 66.0, 36.0, 31.0, 17.0, 17.0, 16.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003875732421875, -0.0037534236907958984, -0.003631114959716797, -0.0035088062286376953, -0.0033864974975585938, -0.003264188766479492, -0.0031418800354003906, -0.003019571304321289, -0.0028972625732421875, -0.002774953842163086, -0.0026526451110839844, -0.002530336380004883, -0.0024080276489257812, -0.0022857189178466797, -0.002163410186767578, -0.0020411014556884766, -0.001918792724609375, -0.0017964839935302734, -0.0016741752624511719, -0.0015518665313720703, -0.0014295578002929688, -0.0013072490692138672, -0.0011849403381347656, -0.001062631607055664, -0.0009403228759765625, -0.0008180141448974609, -0.0006957054138183594, -0.0005733966827392578, -0.00045108795166015625, -0.0003287792205810547, -0.00020647048950195312, -8.416175842285156e-05, 3.814697265625e-05, 0.00016045570373535156, 0.0002827644348144531, 0.0004050731658935547, 0.0005273818969726562, 0.0006496906280517578, 0.0007719993591308594, 0.0008943080902099609, 0.0010166168212890625, 0.001138925552368164, 0.0012612342834472656, 0.0013835430145263672, 0.0015058517456054688, 0.0016281604766845703, 0.0017504692077636719, 0.0018727779388427734, 0.001995086669921875, 0.0021173954010009766, 0.002239704132080078, 0.0023620128631591797, 0.0024843215942382812, 0.002606630325317383, 0.0027289390563964844, 0.002851247787475586, 0.0029735565185546875, 0.003095865249633789, 0.0032181739807128906, 0.003340482711791992, 0.0034627914428710938, 0.0035851001739501953, 0.003707408905029297, 0.0038297176361083984, 0.0039520263671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 13.0, 29.0, 64.0, 102.0, 196.0, 421.0, 1246.0, 7709.0, 188352.0, 823240.0, 23409.0, 2547.0, 691.0, 268.0, 119.0, 69.0, 37.0, 18.0, 8.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.49609375, -62.4296875, -60.36328125, -58.296875, -56.23046875, -54.1640625, -52.09765625, -50.03125, -47.96484375, -45.8984375, -43.83203125, -41.765625, -39.69921875, -37.6328125, -35.56640625, -33.5, -31.43359375, -29.3671875, -27.30078125, -25.234375, -23.16796875, -21.1015625, -19.03515625, -16.96875, -14.90234375, -12.8359375, -10.76953125, -8.703125, -6.63671875, -4.5703125, -2.50390625, -0.4375, 1.62890625, 3.6953125, 5.76171875, 7.828125, 9.89453125, 11.9609375, 14.02734375, 16.09375, 18.16015625, 20.2265625, 22.29296875, 24.359375, 26.42578125, 28.4921875, 30.55859375, 32.625, 34.69140625, 36.7578125, 38.82421875, 40.890625, 42.95703125, 45.0234375, 47.08984375, 49.15625, 51.22265625, 53.2890625, 55.35546875, 57.421875, 59.48828125, 61.5546875, 63.62109375, 65.6875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 1.0, 7.0, 8.0, 9.0, 13.0, 22.0, 18.0, 32.0, 58.0, 56.0, 83.0, 126.0, 118.0, 113.0, 87.0, 70.0, 59.0, 35.0, 22.0, 12.0, 9.0, 7.0, 6.0, 10.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9375, -29.84814453125, -28.7587890625, -27.66943359375, -26.580078125, -25.49072265625, -24.4013671875, -23.31201171875, -22.22265625, -21.13330078125, -20.0439453125, -18.95458984375, -17.865234375, -16.77587890625, -15.6865234375, -14.59716796875, -13.5078125, -12.41845703125, -11.3291015625, -10.23974609375, -9.150390625, -8.06103515625, -6.9716796875, -5.88232421875, -4.79296875, -3.70361328125, -2.6142578125, -1.52490234375, -0.435546875, 0.65380859375, 1.7431640625, 2.83251953125, 3.921875, 5.01123046875, 6.1005859375, 7.18994140625, 8.279296875, 9.36865234375, 10.4580078125, 11.54736328125, 12.63671875, 13.72607421875, 14.8154296875, 15.90478515625, 16.994140625, 18.08349609375, 19.1728515625, 20.26220703125, 21.3515625, 22.44091796875, 23.5302734375, 24.61962890625, 25.708984375, 26.79833984375, 27.8876953125, 28.97705078125, 30.06640625, 31.15576171875, 32.2451171875, 33.33447265625, 34.423828125, 35.51318359375, 36.6025390625, 37.69189453125, 38.78125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 20.0, 70.0, 176.0, 306.0, 261.0, 111.0, 27.0, 17.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-839.79931640625, -805.8283081054688, -771.8572387695312, -737.88623046875, -703.9151611328125, -669.9441528320312, -635.97314453125, -602.0020751953125, -568.031005859375, -534.0599975585938, -500.08892822265625, -466.117919921875, -432.1468505859375, -398.17584228515625, -364.2048034667969, -330.2337646484375, -296.26275634765625, -262.2917175292969, -228.3206787109375, -194.3496551513672, -160.3786163330078, -126.40757751464844, -92.43655395507812, -58.46551513671875, -24.494476318359375, 9.476558685302734, 43.447593688964844, 77.41862487792969, 111.38966369628906, 145.36070251464844, 179.33172607421875, 213.30276489257812, 247.2738037109375, 281.2448425292969, 315.21588134765625, 349.1868896484375, 383.157958984375, 417.12896728515625, 451.1000061035156, 485.071044921875, 519.0421142578125, 553.0131225585938, 586.9841918945312, 620.9552001953125, 654.92626953125, 688.8972778320312, 722.8682861328125, 756.83935546875, 790.8103637695312, 824.7813720703125, 858.75244140625, 892.7234497070312, 926.6945190429688, 960.66552734375, 994.6365966796875, 1028.607666015625, 1062.57861328125, 1096.5496826171875, 1130.5206298828125, 1164.49169921875, 1198.4627685546875, 1232.433837890625, 1266.40478515625, 1300.3758544921875, 1334.346923828125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 4.0, 7.0, 16.0, 7.0, 15.0, 18.0, 20.0, 27.0, 10.0, 26.0, 32.0, 34.0, 38.0, 31.0, 34.0, 38.0, 49.0, 32.0, 43.0, 44.0, 49.0, 45.0, 39.0, 41.0, 37.0, 35.0, 34.0, 30.0, 32.0, 18.0, 24.0, 16.0, 13.0, 8.0, 8.0, 7.0, 10.0, 3.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-383.5564270019531, -372.88934326171875, -362.22222900390625, -351.5551452636719, -340.8880615234375, -330.220947265625, -319.5538635253906, -308.88677978515625, -298.21966552734375, -287.5525817871094, -276.8854675292969, -266.2183837890625, -255.55128479003906, -244.88418579101562, -234.21710205078125, -223.5500030517578, -212.88290405273438, -202.21580505371094, -191.5487060546875, -180.88162231445312, -170.2145233154297, -159.54742431640625, -148.88034057617188, -138.21324157714844, -127.546142578125, -116.87904357910156, -106.21195220947266, -95.54486083984375, -84.87776184082031, -74.21066284179688, -63.54357147216797, -52.87648010253906, -42.2093505859375, -31.542255401611328, -20.875160217285156, -10.208065032958984, 0.4590301513671875, 11.12612533569336, 21.79322052001953, 32.46031188964844, 43.127410888671875, 53.79450607299805, 64.46160125732422, 75.12869262695312, 85.79579162597656, 96.462890625, 107.1299819946289, 117.79707336425781, 128.46417236328125, 139.1312713623047, 149.79837036132812, 160.4654541015625, 171.13255310058594, 181.79965209960938, 192.46673583984375, 203.1338348388672, 213.80093383789062, 224.46803283691406, 235.1351318359375, 245.80221557617188, 256.46929931640625, 267.13641357421875, 277.8034973144531, 288.4705810546875, 299.1376953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 8.0, 4.0, 13.0, 16.0, 35.0, 41.0, 61.0, 102.0, 170.0, 321.0, 633.0, 1458.0, 3431.0, 9323.0, 38308.0, 3936131.0, 174795.0, 19267.0, 5754.0, 2209.0, 1034.0, 493.0, 266.0, 144.0, 81.0, 66.0, 32.0, 23.0, 17.0, 11.0, 10.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.3125, -97.79296875, -94.2734375, -90.75390625, -87.234375, -83.71484375, -80.1953125, -76.67578125, -73.15625, -69.63671875, -66.1171875, -62.59765625, -59.078125, -55.55859375, -52.0390625, -48.51953125, -45.0, -41.48046875, -37.9609375, -34.44140625, -30.921875, -27.40234375, -23.8828125, -20.36328125, -16.84375, -13.32421875, -9.8046875, -6.28515625, -2.765625, 0.75390625, 4.2734375, 7.79296875, 11.3125, 14.83203125, 18.3515625, 21.87109375, 25.390625, 28.91015625, 32.4296875, 35.94921875, 39.46875, 42.98828125, 46.5078125, 50.02734375, 53.546875, 57.06640625, 60.5859375, 64.10546875, 67.625, 71.14453125, 74.6640625, 78.18359375, 81.703125, 85.22265625, 88.7421875, 92.26171875, 95.78125, 99.30078125, 102.8203125, 106.33984375, 109.859375, 113.37890625, 116.8984375, 120.41796875, 123.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 11.0, 16.0, 33.0, 24.0, 39.0, 47.0, 62.0, 78.0, 77.0, 76.0, 93.0, 78.0, 81.0, 54.0, 47.0, 45.0, 32.0, 22.0, 26.0, 15.0, 6.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-41.6875, -40.64501953125, -39.6025390625, -38.56005859375, -37.517578125, -36.47509765625, -35.4326171875, -34.39013671875, -33.34765625, -32.30517578125, -31.2626953125, -30.22021484375, -29.177734375, -28.13525390625, -27.0927734375, -26.05029296875, -25.0078125, -23.96533203125, -22.9228515625, -21.88037109375, -20.837890625, -19.79541015625, -18.7529296875, -17.71044921875, -16.66796875, -15.62548828125, -14.5830078125, -13.54052734375, -12.498046875, -11.45556640625, -10.4130859375, -9.37060546875, -8.328125, -7.28564453125, -6.2431640625, -5.20068359375, -4.158203125, -3.11572265625, -2.0732421875, -1.03076171875, 0.01171875, 1.05419921875, 2.0966796875, 3.13916015625, 4.181640625, 5.22412109375, 6.2666015625, 7.30908203125, 8.3515625, 9.39404296875, 10.4365234375, 11.47900390625, 12.521484375, 13.56396484375, 14.6064453125, 15.64892578125, 16.69140625, 17.73388671875, 18.7763671875, 19.81884765625, 20.861328125, 21.90380859375, 22.9462890625, 23.98876953125, 25.03125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 5.0, 6.0, 6.0, 15.0, 19.0, 34.0, 40.0, 56.0, 66.0, 113.0, 201.0, 293.0, 412.0, 630.0, 1142.0, 2163.0, 4407.0, 10245.0, 30675.0, 194341.0, 3821474.0, 92151.0, 20431.0, 7490.0, 3495.0, 1753.0, 936.0, 603.0, 328.0, 242.0, 163.0, 116.0, 61.0, 39.0, 45.0, 17.0, 18.0, 21.0, 8.0, 9.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.34375, -57.4501953125, -55.556640625, -53.6630859375, -51.76953125, -49.8759765625, -47.982421875, -46.0888671875, -44.1953125, -42.3017578125, -40.408203125, -38.5146484375, -36.62109375, -34.7275390625, -32.833984375, -30.9404296875, -29.046875, -27.1533203125, -25.259765625, -23.3662109375, -21.47265625, -19.5791015625, -17.685546875, -15.7919921875, -13.8984375, -12.0048828125, -10.111328125, -8.2177734375, -6.32421875, -4.4306640625, -2.537109375, -0.6435546875, 1.25, 3.1435546875, 5.037109375, 6.9306640625, 8.82421875, 10.7177734375, 12.611328125, 14.5048828125, 16.3984375, 18.2919921875, 20.185546875, 22.0791015625, 23.97265625, 25.8662109375, 27.759765625, 29.6533203125, 31.546875, 33.4404296875, 35.333984375, 37.2275390625, 39.12109375, 41.0146484375, 42.908203125, 44.8017578125, 46.6953125, 48.5888671875, 50.482421875, 52.3759765625, 54.26953125, 56.1630859375, 58.056640625, 59.9501953125, 61.84375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 8.0, 6.0, 6.0, 17.0, 30.0, 37.0, 50.0, 62.0, 124.0, 378.0, 2708.0, 300.0, 116.0, 66.0, 41.0, 30.0, 22.0, 11.0, 6.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.78125, -19.15185546875, -18.5224609375, -17.89306640625, -17.263671875, -16.63427734375, -16.0048828125, -15.37548828125, -14.74609375, -14.11669921875, -13.4873046875, -12.85791015625, -12.228515625, -11.59912109375, -10.9697265625, -10.34033203125, -9.7109375, -9.08154296875, -8.4521484375, -7.82275390625, -7.193359375, -6.56396484375, -5.9345703125, -5.30517578125, -4.67578125, -4.04638671875, -3.4169921875, -2.78759765625, -2.158203125, -1.52880859375, -0.8994140625, -0.27001953125, 0.359375, 0.98876953125, 1.6181640625, 2.24755859375, 2.876953125, 3.50634765625, 4.1357421875, 4.76513671875, 5.39453125, 6.02392578125, 6.6533203125, 7.28271484375, 7.912109375, 8.54150390625, 9.1708984375, 9.80029296875, 10.4296875, 11.05908203125, 11.6884765625, 12.31787109375, 12.947265625, 13.57666015625, 14.2060546875, 14.83544921875, 15.46484375, 16.09423828125, 16.7236328125, 17.35302734375, 17.982421875, 18.61181640625, 19.2412109375, 19.87060546875, 20.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 17.0, 20.0, 20.0, 25.0, 42.0, 40.0, 68.0, 70.0, 98.0, 114.0, 96.0, 93.0, 74.0, 59.0, 53.0, 30.0, 27.0, 14.0, 13.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.06675720214844, -99.00914001464844, -95.95153045654297, -92.8939208984375, -89.8363037109375, -86.7786865234375, -83.72107696533203, -80.66346740722656, -77.60585021972656, -74.54823303222656, -71.4906234741211, -68.43301391601562, -65.37539672851562, -62.31778335571289, -59.260169982910156, -56.20255661010742, -53.14494323730469, -50.08732986450195, -47.02971649169922, -43.972103118896484, -40.91448974609375, -37.856876373291016, -34.79926300048828, -31.741649627685547, -28.684036254882812, -25.626422882080078, -22.568809509277344, -19.51119613647461, -16.453582763671875, -13.39596939086914, -10.338356018066406, -7.280742645263672, -4.2231292724609375, -1.1655158996582031, 1.8920974731445312, 4.949710845947266, 8.00732421875, 11.064937591552734, 14.122550964355469, 17.180164337158203, 20.237777709960938, 23.295391082763672, 26.353004455566406, 29.41061782836914, 32.468231201171875, 35.52584457397461, 38.583457946777344, 41.64107131958008, 44.69868469238281, 47.75629806518555, 50.81391143798828, 53.871524810791016, 56.92913818359375, 59.986751556396484, 63.04436492919922, 66.10197448730469, 69.15959167480469, 72.21720886230469, 75.27481842041016, 78.33242797851562, 81.39004516601562, 84.44766235351562, 87.5052719116211, 90.56288146972656, 93.62049865722656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 11.0, 9.0, 9.0, 6.0, 20.0, 15.0, 20.0, 17.0, 14.0, 22.0, 26.0, 33.0, 33.0, 46.0, 40.0, 43.0, 44.0, 50.0, 46.0, 48.0, 48.0, 46.0, 53.0, 47.0, 34.0, 35.0, 36.0, 26.0, 16.0, 29.0, 16.0, 16.0, 12.0, 10.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.46294403076172, -61.66453170776367, -59.866119384765625, -58.06770706176758, -56.26929473876953, -54.470882415771484, -52.67247009277344, -50.87405776977539, -49.075645446777344, -47.2772331237793, -45.47882080078125, -43.6804084777832, -41.881996154785156, -40.08358383178711, -38.28517150878906, -36.486759185791016, -34.68834686279297, -32.88993453979492, -31.091522216796875, -29.293109893798828, -27.49469757080078, -25.696285247802734, -23.897872924804688, -22.09946060180664, -20.301044464111328, -18.50263214111328, -16.704219818115234, -14.905807495117188, -13.10739517211914, -11.308981895446777, -9.51056957244873, -7.712157249450684, -5.913745880126953, -4.115333557128906, -2.3169209957122803, -0.5185084342956543, 1.2799038887023926, 3.0783166885375977, 4.8767290115356445, 6.675141334533691, 8.473553657531738, 10.271965980529785, 12.070378303527832, 13.868791580200195, 15.667203903198242, 17.46561622619629, 19.264028549194336, 21.062440872192383, 22.86085319519043, 24.659265518188477, 26.457677841186523, 28.25609016418457, 30.054502487182617, 31.852916717529297, 33.651329040527344, 35.44974136352539, 37.24815368652344, 39.046566009521484, 40.84497833251953, 42.64339065551758, 44.441802978515625, 46.24021530151367, 48.03862762451172, 49.837039947509766, 51.63545227050781]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 8.0, 7.0, 16.0, 17.0, 29.0, 43.0, 63.0, 111.0, 156.0, 227.0, 372.0, 652.0, 1175.0, 2221.0, 4894.0, 11477.0, 29517.0, 81389.0, 224506.0, 399909.0, 182838.0, 66699.0, 24105.0, 9448.0, 4109.0, 1983.0, 1047.0, 572.0, 348.0, 194.0, 135.0, 91.0, 43.0, 45.0, 28.0, 14.0, 11.0, 12.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.21875, -60.29833984375, -58.3779296875, -56.45751953125, -54.537109375, -52.61669921875, -50.6962890625, -48.77587890625, -46.85546875, -44.93505859375, -43.0146484375, -41.09423828125, -39.173828125, -37.25341796875, -35.3330078125, -33.41259765625, -31.4921875, -29.57177734375, -27.6513671875, -25.73095703125, -23.810546875, -21.89013671875, -19.9697265625, -18.04931640625, -16.12890625, -14.20849609375, -12.2880859375, -10.36767578125, -8.447265625, -6.52685546875, -4.6064453125, -2.68603515625, -0.765625, 1.15478515625, 3.0751953125, 4.99560546875, 6.916015625, 8.83642578125, 10.7568359375, 12.67724609375, 14.59765625, 16.51806640625, 18.4384765625, 20.35888671875, 22.279296875, 24.19970703125, 26.1201171875, 28.04052734375, 29.9609375, 31.88134765625, 33.8017578125, 35.72216796875, 37.642578125, 39.56298828125, 41.4833984375, 43.40380859375, 45.32421875, 47.24462890625, 49.1650390625, 51.08544921875, 53.005859375, 54.92626953125, 56.8466796875, 58.76708984375, 60.6875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 7.0, 11.0, 12.0, 15.0, 17.0, 23.0, 35.0, 44.0, 41.0, 62.0, 56.0, 65.0, 69.0, 82.0, 68.0, 73.0, 54.0, 58.0, 38.0, 36.0, 29.0, 28.0, 25.0, 12.0, 10.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.625, -32.701416015625, -31.77783203125, -30.854248046875, -29.9306640625, -29.007080078125, -28.08349609375, -27.159912109375, -26.236328125, -25.312744140625, -24.38916015625, -23.465576171875, -22.5419921875, -21.618408203125, -20.69482421875, -19.771240234375, -18.84765625, -17.924072265625, -17.00048828125, -16.076904296875, -15.1533203125, -14.229736328125, -13.30615234375, -12.382568359375, -11.458984375, -10.535400390625, -9.61181640625, -8.688232421875, -7.7646484375, -6.841064453125, -5.91748046875, -4.993896484375, -4.0703125, -3.146728515625, -2.22314453125, -1.299560546875, -0.3759765625, 0.547607421875, 1.47119140625, 2.394775390625, 3.318359375, 4.241943359375, 5.16552734375, 6.089111328125, 7.0126953125, 7.936279296875, 8.85986328125, 9.783447265625, 10.70703125, 11.630615234375, 12.55419921875, 13.477783203125, 14.4013671875, 15.324951171875, 16.24853515625, 17.172119140625, 18.095703125, 19.019287109375, 19.94287109375, 20.866455078125, 21.7900390625, 22.713623046875, 23.63720703125, 24.560791015625, 25.484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 13.0, 21.0, 16.0, 23.0, 30.0, 36.0, 58.0, 87.0, 104.0, 183.0, 277.0, 418.0, 777.0, 1479.0, 4427.0, 18393.0, 135911.0, 712175.0, 146622.0, 19379.0, 4485.0, 1551.0, 753.0, 412.0, 278.0, 169.0, 120.0, 92.0, 62.0, 51.0, 24.0, 30.0, 21.0, 16.0, 4.0, 6.0, 8.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -77.9453125, -74.890625, -71.8359375, -68.78125, -65.7265625, -62.671875, -59.6171875, -56.5625, -53.5078125, -50.453125, -47.3984375, -44.34375, -41.2890625, -38.234375, -35.1796875, -32.125, -29.0703125, -26.015625, -22.9609375, -19.90625, -16.8515625, -13.796875, -10.7421875, -7.6875, -4.6328125, -1.578125, 1.4765625, 4.53125, 7.5859375, 10.640625, 13.6953125, 16.75, 19.8046875, 22.859375, 25.9140625, 28.96875, 32.0234375, 35.078125, 38.1328125, 41.1875, 44.2421875, 47.296875, 50.3515625, 53.40625, 56.4609375, 59.515625, 62.5703125, 65.625, 68.6796875, 71.734375, 74.7890625, 77.84375, 80.8984375, 83.953125, 87.0078125, 90.0625, 93.1171875, 96.171875, 99.2265625, 102.28125, 105.3359375, 108.390625, 111.4453125, 114.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 9.0, 14.0, 11.0, 10.0, 19.0, 22.0, 22.0, 21.0, 26.0, 42.0, 39.0, 45.0, 48.0, 50.0, 53.0, 60.0, 43.0, 48.0, 50.0, 53.0, 45.0, 29.0, 34.0, 32.0, 31.0, 20.0, 29.0, 17.0, 20.0, 12.0, 7.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-96.0, -93.3427734375, -90.685546875, -88.0283203125, -85.37109375, -82.7138671875, -80.056640625, -77.3994140625, -74.7421875, -72.0849609375, -69.427734375, -66.7705078125, -64.11328125, -61.4560546875, -58.798828125, -56.1416015625, -53.484375, -50.8271484375, -48.169921875, -45.5126953125, -42.85546875, -40.1982421875, -37.541015625, -34.8837890625, -32.2265625, -29.5693359375, -26.912109375, -24.2548828125, -21.59765625, -18.9404296875, -16.283203125, -13.6259765625, -10.96875, -8.3115234375, -5.654296875, -2.9970703125, -0.33984375, 2.3173828125, 4.974609375, 7.6318359375, 10.2890625, 12.9462890625, 15.603515625, 18.2607421875, 20.91796875, 23.5751953125, 26.232421875, 28.8896484375, 31.546875, 34.2041015625, 36.861328125, 39.5185546875, 42.17578125, 44.8330078125, 47.490234375, 50.1474609375, 52.8046875, 55.4619140625, 58.119140625, 60.7763671875, 63.43359375, 66.0908203125, 68.748046875, 71.4052734375, 74.0625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 5.0, 12.0, 15.0, 21.0, 41.0, 48.0, 90.0, 196.0, 401.0, 867.0, 2558.0, 10359.0, 68254.0, 604173.0, 316037.0, 35899.0, 6373.0, 1809.0, 698.0, 325.0, 168.0, 83.0, 57.0, 37.0, 12.0, 7.0, 11.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -21.081787109375, -20.11669921875, -19.151611328125, -18.1865234375, -17.221435546875, -16.25634765625, -15.291259765625, -14.326171875, -13.361083984375, -12.39599609375, -11.430908203125, -10.4658203125, -9.500732421875, -8.53564453125, -7.570556640625, -6.60546875, -5.640380859375, -4.67529296875, -3.710205078125, -2.7451171875, -1.780029296875, -0.81494140625, 0.150146484375, 1.115234375, 2.080322265625, 3.04541015625, 4.010498046875, 4.9755859375, 5.940673828125, 6.90576171875, 7.870849609375, 8.8359375, 9.801025390625, 10.76611328125, 11.731201171875, 12.6962890625, 13.661376953125, 14.62646484375, 15.591552734375, 16.556640625, 17.521728515625, 18.48681640625, 19.451904296875, 20.4169921875, 21.382080078125, 22.34716796875, 23.312255859375, 24.27734375, 25.242431640625, 26.20751953125, 27.172607421875, 28.1376953125, 29.102783203125, 30.06787109375, 31.032958984375, 31.998046875, 32.963134765625, 33.92822265625, 34.893310546875, 35.8583984375, 36.823486328125, 37.78857421875, 38.753662109375, 39.71875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 9.0, 15.0, 17.0, 21.0, 27.0, 23.0, 31.0, 45.0, 75.0, 107.0, 131.0, 119.0, 73.0, 56.0, 55.0, 42.0, 28.0, 30.0, 17.0, 14.0, 15.0, 6.0, 4.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004326164722442627, -0.004166245460510254, -0.004006326198577881, -0.003846406936645508, -0.0036864876747131348, -0.0035265684127807617, -0.0033666491508483887, -0.0032067298889160156, -0.0030468106269836426, -0.0028868913650512695, -0.0027269721031188965, -0.0025670528411865234, -0.0024071335792541504, -0.0022472143173217773, -0.0020872950553894043, -0.0019273757934570312, -0.0017674565315246582, -0.0016075372695922852, -0.0014476180076599121, -0.001287698745727539, -0.001127779483795166, -0.000967860221862793, -0.0008079409599304199, -0.0006480216979980469, -0.00048810243606567383, -0.0003281831741333008, -0.00016826391220092773, -8.344650268554688e-06, 0.00015157461166381836, 0.0003114938735961914, 0.00047141313552856445, 0.0006313323974609375, 0.0007912516593933105, 0.0009511709213256836, 0.0011110901832580566, 0.0012710094451904297, 0.0014309287071228027, 0.0015908479690551758, 0.0017507672309875488, 0.0019106864929199219, 0.002070605754852295, 0.002230525016784668, 0.002390444278717041, 0.002550363540649414, 0.002710282802581787, 0.00287020206451416, 0.003030121326446533, 0.0031900405883789062, 0.0033499598503112793, 0.0035098791122436523, 0.0036697983741760254, 0.0038297176361083984, 0.0039896368980407715, 0.0041495561599731445, 0.004309475421905518, 0.004469394683837891, 0.004629313945770264, 0.004789233207702637, 0.00494915246963501, 0.005109071731567383, 0.005268990993499756, 0.005428910255432129, 0.005588829517364502, 0.005748748779296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 8.0, 12.0, 29.0, 57.0, 72.0, 170.0, 306.0, 666.0, 1739.0, 7314.0, 76359.0, 799994.0, 147079.0, 11071.0, 2084.0, 804.0, 352.0, 186.0, 122.0, 55.0, 25.0, 11.0, 15.0, 10.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -28.777587890625, -27.44580078125, -26.114013671875, -24.7822265625, -23.450439453125, -22.11865234375, -20.786865234375, -19.455078125, -18.123291015625, -16.79150390625, -15.459716796875, -14.1279296875, -12.796142578125, -11.46435546875, -10.132568359375, -8.80078125, -7.468994140625, -6.13720703125, -4.805419921875, -3.4736328125, -2.141845703125, -0.81005859375, 0.521728515625, 1.853515625, 3.185302734375, 4.51708984375, 5.848876953125, 7.1806640625, 8.512451171875, 9.84423828125, 11.176025390625, 12.5078125, 13.839599609375, 15.17138671875, 16.503173828125, 17.8349609375, 19.166748046875, 20.49853515625, 21.830322265625, 23.162109375, 24.493896484375, 25.82568359375, 27.157470703125, 28.4892578125, 29.821044921875, 31.15283203125, 32.484619140625, 33.81640625, 35.148193359375, 36.47998046875, 37.811767578125, 39.1435546875, 40.475341796875, 41.80712890625, 43.138916015625, 44.470703125, 45.802490234375, 47.13427734375, 48.466064453125, 49.7978515625, 51.129638671875, 52.46142578125, 53.793212890625, 55.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 3.0, 7.0, 9.0, 12.0, 19.0, 17.0, 26.0, 32.0, 26.0, 26.0, 36.0, 42.0, 64.0, 45.0, 45.0, 71.0, 62.0, 56.0, 60.0, 47.0, 49.0, 44.0, 29.0, 32.0, 20.0, 15.0, 14.0, 17.0, 9.0, 14.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.25, -19.65625, -19.0625, -18.46875, -17.875, -17.28125, -16.6875, -16.09375, -15.5, -14.90625, -14.3125, -13.71875, -13.125, -12.53125, -11.9375, -11.34375, -10.75, -10.15625, -9.5625, -8.96875, -8.375, -7.78125, -7.1875, -6.59375, -6.0, -5.40625, -4.8125, -4.21875, -3.625, -3.03125, -2.4375, -1.84375, -1.25, -0.65625, -0.0625, 0.53125, 1.125, 1.71875, 2.3125, 2.90625, 3.5, 4.09375, 4.6875, 5.28125, 5.875, 6.46875, 7.0625, 7.65625, 8.25, 8.84375, 9.4375, 10.03125, 10.625, 11.21875, 11.8125, 12.40625, 13.0, 13.59375, 14.1875, 14.78125, 15.375, 15.96875, 16.5625, 17.15625, 17.75]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 10.0, 56.0, 245.0, 430.0, 210.0, 44.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-664.328369140625, -600.9441528320312, -537.5599975585938, -474.17578125, -410.7915954589844, -347.40740966796875, -284.023193359375, -220.63900756835938, -157.25482177734375, -93.8706283569336, -30.486434936523438, 32.89776611328125, 96.28195190429688, 159.6661376953125, 223.05035400390625, 286.4345397949219, 349.8187255859375, 413.2029113769531, 476.58709716796875, 539.9713134765625, 603.35546875, 666.7396850585938, 730.1239013671875, 793.508056640625, 856.8922729492188, 920.2764892578125, 983.66064453125, 1047.044921875, 1110.4290771484375, 1173.813232421875, 1237.197509765625, 1300.5816650390625, 1363.9658203125, 1427.3499755859375, 1490.7342529296875, 1554.118408203125, 1617.5025634765625, 1680.88671875, 1744.27099609375, 1807.6551513671875, 1871.039306640625, 1934.4234619140625, 1997.8077392578125, 2061.19189453125, 2124.576171875, 2187.960205078125, 2251.344482421875, 2314.728759765625, 2378.11279296875, 2441.4970703125, 2504.881103515625, 2568.265380859375, 2631.649658203125, 2695.03369140625, 2758.41796875, 2821.80224609375, 2885.1865234375, 2948.57080078125, 3011.954833984375, 3075.339111328125, 3138.723388671875, 3202.107421875, 3265.49169921875, 3328.8759765625, 3392.260009765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 1.0, 4.0, 4.0, 10.0, 14.0, 15.0, 7.0, 14.0, 16.0, 32.0, 18.0, 37.0, 41.0, 36.0, 55.0, 62.0, 63.0, 56.0, 56.0, 52.0, 54.0, 40.0, 39.0, 55.0, 38.0, 28.0, 29.0, 22.0, 27.0, 17.0, 10.0, 13.0, 7.0, 8.0, 8.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.4562683105469, -313.5807800292969, -300.705322265625, -287.829833984375, -274.9543762207031, -262.0788879394531, -249.2034149169922, -236.32794189453125, -223.4524688720703, -210.57699584960938, -197.70152282714844, -184.8260498046875, -171.9505615234375, -159.07510375976562, -146.19961547851562, -133.3241424560547, -120.44866943359375, -107.57319641113281, -94.69772338867188, -81.8222427368164, -68.94676971435547, -56.07129669189453, -43.19581604003906, -30.320343017578125, -17.444869995117188, -4.569395065307617, 8.306079864501953, 21.181556701660156, 34.057029724121094, 46.93250274658203, 59.8079833984375, 72.68345642089844, 85.5589599609375, 98.43443298339844, 111.30990600585938, 124.18538665771484, 137.06085205078125, 149.93634033203125, 162.8118133544922, 175.68728637695312, 188.56275939941406, 201.438232421875, 214.31370544433594, 227.18917846679688, 240.06466674804688, 252.94012451171875, 265.81561279296875, 278.69110107421875, 291.5665588378906, 304.4420471191406, 317.3175048828125, 330.1929931640625, 343.0684509277344, 355.9439392089844, 368.81939697265625, 381.69488525390625, 394.57037353515625, 407.44586181640625, 420.3213195800781, 433.1968078613281, 446.072265625, 458.94775390625, 471.8232421875, 484.6986999511719, 497.57415771484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 13.0, 18.0, 34.0, 41.0, 74.0, 160.0, 303.0, 750.0, 1757.0, 5009.0, 18738.0, 108123.0, 2945614.0, 1031156.0, 63566.0, 12635.0, 3696.0, 1359.0, 596.0, 285.0, 133.0, 90.0, 39.0, 37.0, 22.0, 17.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.240234375, -62.98046875, -60.720703125, -58.4609375, -56.201171875, -53.94140625, -51.681640625, -49.421875, -47.162109375, -44.90234375, -42.642578125, -40.3828125, -38.123046875, -35.86328125, -33.603515625, -31.34375, -29.083984375, -26.82421875, -24.564453125, -22.3046875, -20.044921875, -17.78515625, -15.525390625, -13.265625, -11.005859375, -8.74609375, -6.486328125, -4.2265625, -1.966796875, 0.29296875, 2.552734375, 4.8125, 7.072265625, 9.33203125, 11.591796875, 13.8515625, 16.111328125, 18.37109375, 20.630859375, 22.890625, 25.150390625, 27.41015625, 29.669921875, 31.9296875, 34.189453125, 36.44921875, 38.708984375, 40.96875, 43.228515625, 45.48828125, 47.748046875, 50.0078125, 52.267578125, 54.52734375, 56.787109375, 59.046875, 61.306640625, 63.56640625, 65.826171875, 68.0859375, 70.345703125, 72.60546875, 74.865234375, 77.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 16.0, 16.0, 20.0, 33.0, 37.0, 31.0, 33.0, 42.0, 61.0, 68.0, 63.0, 76.0, 54.0, 61.0, 48.0, 60.0, 42.0, 37.0, 31.0, 26.0, 27.0, 20.0, 10.0, 15.0, 6.0, 6.0, 8.0, 2.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.265625, -20.547119140625, -19.82861328125, -19.110107421875, -18.3916015625, -17.673095703125, -16.95458984375, -16.236083984375, -15.517578125, -14.799072265625, -14.08056640625, -13.362060546875, -12.6435546875, -11.925048828125, -11.20654296875, -10.488037109375, -9.76953125, -9.051025390625, -8.33251953125, -7.614013671875, -6.8955078125, -6.177001953125, -5.45849609375, -4.739990234375, -4.021484375, -3.302978515625, -2.58447265625, -1.865966796875, -1.1474609375, -0.428955078125, 0.28955078125, 1.008056640625, 1.7265625, 2.445068359375, 3.16357421875, 3.882080078125, 4.6005859375, 5.319091796875, 6.03759765625, 6.756103515625, 7.474609375, 8.193115234375, 8.91162109375, 9.630126953125, 10.3486328125, 11.067138671875, 11.78564453125, 12.504150390625, 13.22265625, 13.941162109375, 14.65966796875, 15.378173828125, 16.0966796875, 16.815185546875, 17.53369140625, 18.252197265625, 18.970703125, 19.689208984375, 20.40771484375, 21.126220703125, 21.8447265625, 22.563232421875, 23.28173828125, 24.000244140625, 24.71875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 8.0, 7.0, 8.0, 17.0, 17.0, 31.0, 49.0, 125.0, 205.0, 427.0, 1051.0, 3144.0, 12364.0, 76986.0, 2855718.0, 1178103.0, 52257.0, 9431.0, 2583.0, 836.0, 407.0, 195.0, 122.0, 66.0, 31.0, 29.0, 19.0, 16.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-86.6875, -84.2041015625, -81.720703125, -79.2373046875, -76.75390625, -74.2705078125, -71.787109375, -69.3037109375, -66.8203125, -64.3369140625, -61.853515625, -59.3701171875, -56.88671875, -54.4033203125, -51.919921875, -49.4365234375, -46.953125, -44.4697265625, -41.986328125, -39.5029296875, -37.01953125, -34.5361328125, -32.052734375, -29.5693359375, -27.0859375, -24.6025390625, -22.119140625, -19.6357421875, -17.15234375, -14.6689453125, -12.185546875, -9.7021484375, -7.21875, -4.7353515625, -2.251953125, 0.2314453125, 2.71484375, 5.1982421875, 7.681640625, 10.1650390625, 12.6484375, 15.1318359375, 17.615234375, 20.0986328125, 22.58203125, 25.0654296875, 27.548828125, 30.0322265625, 32.515625, 34.9990234375, 37.482421875, 39.9658203125, 42.44921875, 44.9326171875, 47.416015625, 49.8994140625, 52.3828125, 54.8662109375, 57.349609375, 59.8330078125, 62.31640625, 64.7998046875, 67.283203125, 69.7666015625, 72.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 15.0, 15.0, 20.0, 25.0, 56.0, 90.0, 144.0, 300.0, 633.0, 1146.0, 749.0, 349.0, 197.0, 114.0, 65.0, 41.0, 38.0, 16.0, 9.0, 7.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.25439453125, -47.1650390625, -45.07568359375, -42.986328125, -40.89697265625, -38.8076171875, -36.71826171875, -34.62890625, -32.53955078125, -30.4501953125, -28.36083984375, -26.271484375, -24.18212890625, -22.0927734375, -20.00341796875, -17.9140625, -15.82470703125, -13.7353515625, -11.64599609375, -9.556640625, -7.46728515625, -5.3779296875, -3.28857421875, -1.19921875, 0.89013671875, 2.9794921875, 5.06884765625, 7.158203125, 9.24755859375, 11.3369140625, 13.42626953125, 15.515625, 17.60498046875, 19.6943359375, 21.78369140625, 23.873046875, 25.96240234375, 28.0517578125, 30.14111328125, 32.23046875, 34.31982421875, 36.4091796875, 38.49853515625, 40.587890625, 42.67724609375, 44.7666015625, 46.85595703125, 48.9453125, 51.03466796875, 53.1240234375, 55.21337890625, 57.302734375, 59.39208984375, 61.4814453125, 63.57080078125, 65.66015625, 67.74951171875, 69.8388671875, 71.92822265625, 74.017578125, 76.10693359375, 78.1962890625, 80.28564453125, 82.375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 11.0, 26.0, 53.0, 138.0, 232.0, 226.0, 133.0, 93.0, 42.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-734.3699951171875, -711.4608154296875, -688.5516357421875, -665.6424560546875, -642.7332763671875, -619.8240966796875, -596.9149169921875, -574.0057373046875, -551.0965576171875, -528.1873779296875, -505.2781982421875, -482.3690185546875, -459.4598388671875, -436.5506591796875, -413.6414794921875, -390.7322998046875, -367.8231201171875, -344.9139404296875, -322.0047607421875, -299.0955810546875, -276.1864013671875, -253.2772216796875, -230.3680419921875, -207.4588623046875, -184.5496826171875, -161.6405029296875, -138.7313232421875, -115.8221435546875, -92.9129638671875, -70.0037841796875, -47.0946044921875, -24.1854248046875, -1.27618408203125, 21.63299560546875, 44.54217529296875, 67.45135498046875, 90.36053466796875, 113.26971435546875, 136.17889404296875, 159.08807373046875, 181.99725341796875, 204.90643310546875, 227.81561279296875, 250.72479248046875, 273.63397216796875, 296.54315185546875, 319.45233154296875, 342.36151123046875, 365.27069091796875, 388.17987060546875, 411.08905029296875, 433.99822998046875, 456.90740966796875, 479.81658935546875, 502.72576904296875, 525.6349487304688, 548.5441284179688, 571.4533081054688, 594.3624877929688, 617.2716674804688, 640.1808471679688, 663.0900268554688, 685.9992065429688, 708.9083862304688, 731.8175659179688]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 14.0, 16.0, 13.0, 20.0, 17.0, 34.0, 26.0, 43.0, 30.0, 40.0, 42.0, 49.0, 54.0, 44.0, 61.0, 57.0, 57.0, 52.0, 40.0, 30.0, 49.0, 31.0, 30.0, 30.0, 16.0, 24.0, 16.0, 8.0, 9.0, 10.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-266.94854736328125, -258.3462829589844, -249.74400329589844, -241.1417236328125, -232.53945922851562, -223.93719482421875, -215.3349151611328, -206.73263549804688, -198.13037109375, -189.52810668945312, -180.9258270263672, -172.32354736328125, -163.72128295898438, -155.1190185546875, -146.51673889160156, -137.91445922851562, -129.31219482421875, -120.70992279052734, -112.10765075683594, -103.50537872314453, -94.90310668945312, -86.30083465576172, -77.69856262207031, -69.0962905883789, -60.4940185546875, -51.891746520996094, -43.28947448730469, -34.68720245361328, -26.084930419921875, -17.48265838623047, -8.880386352539062, -0.27811431884765625, 8.32415771484375, 16.926429748535156, 25.528701782226562, 34.13097381591797, 42.733245849609375, 51.33551788330078, 59.93778991699219, 68.5400619506836, 77.142333984375, 85.7446060180664, 94.34687805175781, 102.94915008544922, 111.55142211914062, 120.15369415283203, 128.75596618652344, 137.35824584960938, 145.96051025390625, 154.56277465820312, 163.16505432128906, 171.767333984375, 180.36959838867188, 188.97186279296875, 197.5741424560547, 206.17642211914062, 214.7786865234375, 223.38095092773438, 231.9832305908203, 240.58551025390625, 249.18777465820312, 257.7900390625, 266.392333984375, 274.9945983886719, 283.59686279296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 7.0, 15.0, 17.0, 31.0, 48.0, 93.0, 119.0, 215.0, 371.0, 835.0, 1771.0, 3938.0, 10504.0, 31021.0, 99929.0, 392748.0, 367411.0, 93260.0, 28984.0, 10039.0, 3878.0, 1718.0, 742.0, 347.0, 198.0, 133.0, 67.0, 34.0, 28.0, 15.0, 10.0, 6.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-74.5, -72.58837890625, -70.6767578125, -68.76513671875, -66.853515625, -64.94189453125, -63.0302734375, -61.11865234375, -59.20703125, -57.29541015625, -55.3837890625, -53.47216796875, -51.560546875, -49.64892578125, -47.7373046875, -45.82568359375, -43.9140625, -42.00244140625, -40.0908203125, -38.17919921875, -36.267578125, -34.35595703125, -32.4443359375, -30.53271484375, -28.62109375, -26.70947265625, -24.7978515625, -22.88623046875, -20.974609375, -19.06298828125, -17.1513671875, -15.23974609375, -13.328125, -11.41650390625, -9.5048828125, -7.59326171875, -5.681640625, -3.77001953125, -1.8583984375, 0.05322265625, 1.96484375, 3.87646484375, 5.7880859375, 7.69970703125, 9.611328125, 11.52294921875, 13.4345703125, 15.34619140625, 17.2578125, 19.16943359375, 21.0810546875, 22.99267578125, 24.904296875, 26.81591796875, 28.7275390625, 30.63916015625, 32.55078125, 34.46240234375, 36.3740234375, 38.28564453125, 40.197265625, 42.10888671875, 44.0205078125, 45.93212890625, 47.84375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 14.0, 16.0, 13.0, 24.0, 26.0, 45.0, 30.0, 47.0, 67.0, 61.0, 50.0, 73.0, 54.0, 66.0, 67.0, 40.0, 45.0, 43.0, 48.0, 36.0, 25.0, 21.0, 14.0, 14.0, 11.0, 3.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.078125, -21.35009765625, -20.6220703125, -19.89404296875, -19.166015625, -18.43798828125, -17.7099609375, -16.98193359375, -16.25390625, -15.52587890625, -14.7978515625, -14.06982421875, -13.341796875, -12.61376953125, -11.8857421875, -11.15771484375, -10.4296875, -9.70166015625, -8.9736328125, -8.24560546875, -7.517578125, -6.78955078125, -6.0615234375, -5.33349609375, -4.60546875, -3.87744140625, -3.1494140625, -2.42138671875, -1.693359375, -0.96533203125, -0.2373046875, 0.49072265625, 1.21875, 1.94677734375, 2.6748046875, 3.40283203125, 4.130859375, 4.85888671875, 5.5869140625, 6.31494140625, 7.04296875, 7.77099609375, 8.4990234375, 9.22705078125, 9.955078125, 10.68310546875, 11.4111328125, 12.13916015625, 12.8671875, 13.59521484375, 14.3232421875, 15.05126953125, 15.779296875, 16.50732421875, 17.2353515625, 17.96337890625, 18.69140625, 19.41943359375, 20.1474609375, 20.87548828125, 21.603515625, 22.33154296875, 23.0595703125, 23.78759765625, 24.515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 9.0, 13.0, 15.0, 19.0, 28.0, 38.0, 56.0, 85.0, 135.0, 238.0, 433.0, 821.0, 1879.0, 6205.0, 66074.0, 857591.0, 102792.0, 7960.0, 2121.0, 874.0, 438.0, 250.0, 173.0, 100.0, 60.0, 40.0, 19.0, 20.0, 18.0, 12.0, 2.0, 8.0, 2.0, 6.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.8125, -124.115234375, -120.41796875, -116.720703125, -113.0234375, -109.326171875, -105.62890625, -101.931640625, -98.234375, -94.537109375, -90.83984375, -87.142578125, -83.4453125, -79.748046875, -76.05078125, -72.353515625, -68.65625, -64.958984375, -61.26171875, -57.564453125, -53.8671875, -50.169921875, -46.47265625, -42.775390625, -39.078125, -35.380859375, -31.68359375, -27.986328125, -24.2890625, -20.591796875, -16.89453125, -13.197265625, -9.5, -5.802734375, -2.10546875, 1.591796875, 5.2890625, 8.986328125, 12.68359375, 16.380859375, 20.078125, 23.775390625, 27.47265625, 31.169921875, 34.8671875, 38.564453125, 42.26171875, 45.958984375, 49.65625, 53.353515625, 57.05078125, 60.748046875, 64.4453125, 68.142578125, 71.83984375, 75.537109375, 79.234375, 82.931640625, 86.62890625, 90.326171875, 94.0234375, 97.720703125, 101.41796875, 105.115234375, 108.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 9.0, 13.0, 14.0, 13.0, 21.0, 20.0, 27.0, 32.0, 28.0, 26.0, 27.0, 46.0, 35.0, 43.0, 48.0, 52.0, 39.0, 43.0, 58.0, 39.0, 45.0, 33.0, 46.0, 41.0, 36.0, 18.0, 21.0, 26.0, 28.0, 17.0, 10.0, 4.0, 10.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-77.8125, -75.61474609375, -73.4169921875, -71.21923828125, -69.021484375, -66.82373046875, -64.6259765625, -62.42822265625, -60.23046875, -58.03271484375, -55.8349609375, -53.63720703125, -51.439453125, -49.24169921875, -47.0439453125, -44.84619140625, -42.6484375, -40.45068359375, -38.2529296875, -36.05517578125, -33.857421875, -31.65966796875, -29.4619140625, -27.26416015625, -25.06640625, -22.86865234375, -20.6708984375, -18.47314453125, -16.275390625, -14.07763671875, -11.8798828125, -9.68212890625, -7.484375, -5.28662109375, -3.0888671875, -0.89111328125, 1.306640625, 3.50439453125, 5.7021484375, 7.89990234375, 10.09765625, 12.29541015625, 14.4931640625, 16.69091796875, 18.888671875, 21.08642578125, 23.2841796875, 25.48193359375, 27.6796875, 29.87744140625, 32.0751953125, 34.27294921875, 36.470703125, 38.66845703125, 40.8662109375, 43.06396484375, 45.26171875, 47.45947265625, 49.6572265625, 51.85498046875, 54.052734375, 56.25048828125, 58.4482421875, 60.64599609375, 62.84375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 1.0, 9.0, 15.0, 23.0, 40.0, 49.0, 71.0, 139.0, 265.0, 743.0, 3135.0, 36056.0, 909496.0, 91629.0, 5102.0, 1009.0, 341.0, 171.0, 73.0, 61.0, 46.0, 24.0, 10.0, 7.0, 5.0, 11.0, 1.0, 6.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -41.77294921875, -40.0771484375, -38.38134765625, -36.685546875, -34.98974609375, -33.2939453125, -31.59814453125, -29.90234375, -28.20654296875, -26.5107421875, -24.81494140625, -23.119140625, -21.42333984375, -19.7275390625, -18.03173828125, -16.3359375, -14.64013671875, -12.9443359375, -11.24853515625, -9.552734375, -7.85693359375, -6.1611328125, -4.46533203125, -2.76953125, -1.07373046875, 0.6220703125, 2.31787109375, 4.013671875, 5.70947265625, 7.4052734375, 9.10107421875, 10.796875, 12.49267578125, 14.1884765625, 15.88427734375, 17.580078125, 19.27587890625, 20.9716796875, 22.66748046875, 24.36328125, 26.05908203125, 27.7548828125, 29.45068359375, 31.146484375, 32.84228515625, 34.5380859375, 36.23388671875, 37.9296875, 39.62548828125, 41.3212890625, 43.01708984375, 44.712890625, 46.40869140625, 48.1044921875, 49.80029296875, 51.49609375, 53.19189453125, 54.8876953125, 56.58349609375, 58.279296875, 59.97509765625, 61.6708984375, 63.36669921875, 65.0625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 1.0, 7.0, 5.0, 5.0, 7.0, 14.0, 14.0, 19.0, 10.0, 22.0, 32.0, 39.0, 46.0, 74.0, 84.0, 132.0, 118.0, 81.0, 61.0, 51.0, 30.0, 23.0, 21.0, 12.0, 18.0, 10.0, 13.0, 5.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035114288330078125, -0.0033857524394989014, -0.0032600760459899902, -0.003134399652481079, -0.003008723258972168, -0.002883046865463257, -0.0027573704719543457, -0.0026316940784454346, -0.0025060176849365234, -0.0023803412914276123, -0.002254664897918701, -0.00212898850440979, -0.002003312110900879, -0.0018776357173919678, -0.0017519593238830566, -0.0016262829303741455, -0.0015006065368652344, -0.0013749301433563232, -0.0012492537498474121, -0.001123577356338501, -0.0009979009628295898, -0.0008722245693206787, -0.0007465481758117676, -0.0006208717823028564, -0.0004951953887939453, -0.0003695189952850342, -0.00024384260177612305, -0.00011816620826721191, 7.510185241699219e-06, 0.00013318657875061035, 0.0002588629722595215, 0.0003845393657684326, 0.0005102157592773438, 0.0006358921527862549, 0.000761568546295166, 0.0008872449398040771, 0.0010129213333129883, 0.0011385977268218994, 0.0012642741203308105, 0.0013899505138397217, 0.0015156269073486328, 0.001641303300857544, 0.001766979694366455, 0.0018926560878753662, 0.0020183324813842773, 0.0021440088748931885, 0.0022696852684020996, 0.0023953616619110107, 0.002521038055419922, 0.002646714448928833, 0.002772390842437744, 0.0028980672359466553, 0.0030237436294555664, 0.0031494200229644775, 0.0032750964164733887, 0.0034007728099823, 0.003526449203491211, 0.003652125597000122, 0.003777801990509033, 0.0039034783840179443, 0.0040291547775268555, 0.004154831171035767, 0.004280507564544678, 0.004406183958053589, 0.0045318603515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 22.0, 31.0, 38.0, 64.0, 89.0, 130.0, 255.0, 477.0, 1075.0, 3029.0, 14420.0, 254126.0, 735664.0, 31528.0, 4734.0, 1441.0, 626.0, 311.0, 160.0, 100.0, 59.0, 49.0, 25.0, 22.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -43.076171875, -41.77734375, -40.478515625, -39.1796875, -37.880859375, -36.58203125, -35.283203125, -33.984375, -32.685546875, -31.38671875, -30.087890625, -28.7890625, -27.490234375, -26.19140625, -24.892578125, -23.59375, -22.294921875, -20.99609375, -19.697265625, -18.3984375, -17.099609375, -15.80078125, -14.501953125, -13.203125, -11.904296875, -10.60546875, -9.306640625, -8.0078125, -6.708984375, -5.41015625, -4.111328125, -2.8125, -1.513671875, -0.21484375, 1.083984375, 2.3828125, 3.681640625, 4.98046875, 6.279296875, 7.578125, 8.876953125, 10.17578125, 11.474609375, 12.7734375, 14.072265625, 15.37109375, 16.669921875, 17.96875, 19.267578125, 20.56640625, 21.865234375, 23.1640625, 24.462890625, 25.76171875, 27.060546875, 28.359375, 29.658203125, 30.95703125, 32.255859375, 33.5546875, 34.853515625, 36.15234375, 37.451171875, 38.75]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 14.0, 23.0, 28.0, 42.0, 62.0, 78.0, 136.0, 159.0, 142.0, 114.0, 78.0, 39.0, 22.0, 19.0, 10.0, 8.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.78125, -48.555908203125, -47.33056640625, -46.105224609375, -44.8798828125, -43.654541015625, -42.42919921875, -41.203857421875, -39.978515625, -38.753173828125, -37.52783203125, -36.302490234375, -35.0771484375, -33.851806640625, -32.62646484375, -31.401123046875, -30.17578125, -28.950439453125, -27.72509765625, -26.499755859375, -25.2744140625, -24.049072265625, -22.82373046875, -21.598388671875, -20.373046875, -19.147705078125, -17.92236328125, -16.697021484375, -15.4716796875, -14.246337890625, -13.02099609375, -11.795654296875, -10.5703125, -9.344970703125, -8.11962890625, -6.894287109375, -5.6689453125, -4.443603515625, -3.21826171875, -1.992919921875, -0.767578125, 0.457763671875, 1.68310546875, 2.908447265625, 4.1337890625, 5.359130859375, 6.58447265625, 7.809814453125, 9.03515625, 10.260498046875, 11.48583984375, 12.711181640625, 13.9365234375, 15.161865234375, 16.38720703125, 17.612548828125, 18.837890625, 20.063232421875, 21.28857421875, 22.513916015625, 23.7392578125, 24.964599609375, 26.18994140625, 27.415283203125, 28.640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 14.0, 32.0, 88.0, 198.0, 270.0, 204.0, 104.0, 43.0, 23.0, 14.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-498.6337890625, -474.1600036621094, -449.68621826171875, -425.21240234375, -400.7386169433594, -376.26483154296875, -351.791015625, -327.3172302246094, -302.84344482421875, -278.3696594238281, -253.89585876464844, -229.42205810546875, -204.94827270507812, -180.4744873046875, -156.0006866455078, -131.52688598632812, -107.0531005859375, -82.57930755615234, -58.10551452636719, -33.63172149658203, -9.157928466796875, 15.315864562988281, 39.78965759277344, 64.26345825195312, 88.73724365234375, 113.2110366821289, 137.68482971191406, 162.15863037109375, 186.63241577148438, 211.106201171875, 235.5800018310547, 260.0538024902344, 284.527587890625, 309.0013732910156, 333.47515869140625, 357.948974609375, 382.4227600097656, 406.89654541015625, 431.370361328125, 455.8441467285156, 480.31793212890625, 504.7917175292969, 529.2655029296875, 553.7393188476562, 578.213134765625, 602.6868896484375, 627.1607055664062, 651.634521484375, 676.1082763671875, 700.5820922851562, 725.0558471679688, 749.5296630859375, 774.00341796875, 798.4772338867188, 822.9510498046875, 847.4248046875, 871.8986206054688, 896.3724365234375, 920.84619140625, 945.3200073242188, 969.7938232421875, 994.267578125, 1018.7413940429688, 1043.2152099609375, 1067.68896484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 5.0, 12.0, 14.0, 9.0, 20.0, 21.0, 27.0, 22.0, 28.0, 36.0, 36.0, 29.0, 45.0, 58.0, 48.0, 49.0, 74.0, 55.0, 59.0, 50.0, 43.0, 42.0, 35.0, 31.0, 19.0, 15.0, 28.0, 20.0, 16.0, 7.0, 9.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.7347412109375, -330.76318359375, -320.7916259765625, -310.820068359375, -300.8485107421875, -290.876953125, -280.9053955078125, -270.933837890625, -260.9622802734375, -250.99072265625, -241.0191650390625, -231.047607421875, -221.0760498046875, -211.1044921875, -201.13291931152344, -191.16136169433594, -181.18978881835938, -171.21823120117188, -161.24667358398438, -151.27511596679688, -141.30355834960938, -131.33200073242188, -121.36042785644531, -111.38887023925781, -101.41731262207031, -91.44575500488281, -81.47419738769531, -71.50263214111328, -61.53107452392578, -51.55951690673828, -41.587955474853516, -31.61639404296875, -21.644805908203125, -11.673246383666992, -1.7016868591308594, 8.269872665405273, 18.241432189941406, 28.212989807128906, 38.18455123901367, 48.15611267089844, 58.12767028808594, 68.09922790527344, 78.07078552246094, 88.04235076904297, 98.01390838623047, 107.98546600341797, 117.95703125, 127.9285888671875, 137.900146484375, 147.8717041015625, 157.84326171875, 167.8148193359375, 177.786376953125, 187.7579345703125, 197.72950744628906, 207.70106506347656, 217.67262268066406, 227.64418029785156, 237.61573791503906, 247.58729553222656, 257.5588684082031, 267.5304260253906, 277.5019836425781, 287.4735412597656, 297.4450988769531]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 21.0, 21.0, 29.0, 33.0, 55.0, 131.0, 183.0, 329.0, 696.0, 1556.0, 3804.0, 10465.0, 38890.0, 292841.0, 3507547.0, 282224.0, 38204.0, 10391.0, 3764.0, 1567.0, 643.0, 342.0, 208.0, 103.0, 66.0, 56.0, 36.0, 19.0, 14.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.37060546875, -42.8662109375, -41.36181640625, -39.857421875, -38.35302734375, -36.8486328125, -35.34423828125, -33.83984375, -32.33544921875, -30.8310546875, -29.32666015625, -27.822265625, -26.31787109375, -24.8134765625, -23.30908203125, -21.8046875, -20.30029296875, -18.7958984375, -17.29150390625, -15.787109375, -14.28271484375, -12.7783203125, -11.27392578125, -9.76953125, -8.26513671875, -6.7607421875, -5.25634765625, -3.751953125, -2.24755859375, -0.7431640625, 0.76123046875, 2.265625, 3.77001953125, 5.2744140625, 6.77880859375, 8.283203125, 9.78759765625, 11.2919921875, 12.79638671875, 14.30078125, 15.80517578125, 17.3095703125, 18.81396484375, 20.318359375, 21.82275390625, 23.3271484375, 24.83154296875, 26.3359375, 27.84033203125, 29.3447265625, 30.84912109375, 32.353515625, 33.85791015625, 35.3623046875, 36.86669921875, 38.37109375, 39.87548828125, 41.3798828125, 42.88427734375, 44.388671875, 45.89306640625, 47.3974609375, 48.90185546875, 50.40625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 14.0, 6.0, 7.0, 15.0, 12.0, 25.0, 30.0, 37.0, 45.0, 57.0, 64.0, 63.0, 65.0, 55.0, 60.0, 83.0, 65.0, 56.0, 35.0, 39.0, 43.0, 27.0, 22.0, 16.0, 11.0, 13.0, 14.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.625, -21.889404296875, -21.15380859375, -20.418212890625, -19.6826171875, -18.947021484375, -18.21142578125, -17.475830078125, -16.740234375, -16.004638671875, -15.26904296875, -14.533447265625, -13.7978515625, -13.062255859375, -12.32666015625, -11.591064453125, -10.85546875, -10.119873046875, -9.38427734375, -8.648681640625, -7.9130859375, -7.177490234375, -6.44189453125, -5.706298828125, -4.970703125, -4.235107421875, -3.49951171875, -2.763916015625, -2.0283203125, -1.292724609375, -0.55712890625, 0.178466796875, 0.9140625, 1.649658203125, 2.38525390625, 3.120849609375, 3.8564453125, 4.592041015625, 5.32763671875, 6.063232421875, 6.798828125, 7.534423828125, 8.27001953125, 9.005615234375, 9.7412109375, 10.476806640625, 11.21240234375, 11.947998046875, 12.68359375, 13.419189453125, 14.15478515625, 14.890380859375, 15.6259765625, 16.361572265625, 17.09716796875, 17.832763671875, 18.568359375, 19.303955078125, 20.03955078125, 20.775146484375, 21.5107421875, 22.246337890625, 22.98193359375, 23.717529296875, 24.453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 10.0, 20.0, 22.0, 37.0, 54.0, 99.0, 133.0, 273.0, 480.0, 777.0, 1427.0, 2820.0, 5508.0, 11802.0, 29706.0, 92721.0, 521512.0, 2881772.0, 499189.0, 92201.0, 29738.0, 11998.0, 5513.0, 2918.0, 1571.0, 863.0, 457.0, 235.0, 139.0, 93.0, 56.0, 35.0, 17.0, 19.0, 12.0, 3.0, 10.0, 4.0, 3.0, 4.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.796875, -29.81884765625, -28.8408203125, -27.86279296875, -26.884765625, -25.90673828125, -24.9287109375, -23.95068359375, -22.97265625, -21.99462890625, -21.0166015625, -20.03857421875, -19.060546875, -18.08251953125, -17.1044921875, -16.12646484375, -15.1484375, -14.17041015625, -13.1923828125, -12.21435546875, -11.236328125, -10.25830078125, -9.2802734375, -8.30224609375, -7.32421875, -6.34619140625, -5.3681640625, -4.39013671875, -3.412109375, -2.43408203125, -1.4560546875, -0.47802734375, 0.5, 1.47802734375, 2.4560546875, 3.43408203125, 4.412109375, 5.39013671875, 6.3681640625, 7.34619140625, 8.32421875, 9.30224609375, 10.2802734375, 11.25830078125, 12.236328125, 13.21435546875, 14.1923828125, 15.17041015625, 16.1484375, 17.12646484375, 18.1044921875, 19.08251953125, 20.060546875, 21.03857421875, 22.0166015625, 22.99462890625, 23.97265625, 24.95068359375, 25.9287109375, 26.90673828125, 27.884765625, 28.86279296875, 29.8408203125, 30.81884765625, 31.796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 19.0, 18.0, 21.0, 24.0, 54.0, 65.0, 94.0, 136.0, 251.0, 463.0, 834.0, 794.0, 486.0, 255.0, 182.0, 112.0, 66.0, 38.0, 34.0, 29.0, 7.0, 14.0, 13.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.7666015625, -34.533203125, -33.2998046875, -32.06640625, -30.8330078125, -29.599609375, -28.3662109375, -27.1328125, -25.8994140625, -24.666015625, -23.4326171875, -22.19921875, -20.9658203125, -19.732421875, -18.4990234375, -17.265625, -16.0322265625, -14.798828125, -13.5654296875, -12.33203125, -11.0986328125, -9.865234375, -8.6318359375, -7.3984375, -6.1650390625, -4.931640625, -3.6982421875, -2.46484375, -1.2314453125, 0.001953125, 1.2353515625, 2.46875, 3.7021484375, 4.935546875, 6.1689453125, 7.40234375, 8.6357421875, 9.869140625, 11.1025390625, 12.3359375, 13.5693359375, 14.802734375, 16.0361328125, 17.26953125, 18.5029296875, 19.736328125, 20.9697265625, 22.203125, 23.4365234375, 24.669921875, 25.9033203125, 27.13671875, 28.3701171875, 29.603515625, 30.8369140625, 32.0703125, 33.3037109375, 34.537109375, 35.7705078125, 37.00390625, 38.2373046875, 39.470703125, 40.7041015625, 41.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 5.0, 10.0, 22.0, 70.0, 141.0, 275.0, 243.0, 143.0, 48.0, 20.0, 10.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-519.0661010742188, -501.0537414550781, -483.0414123535156, -465.029052734375, -447.0167236328125, -429.0043640136719, -410.99200439453125, -392.97967529296875, -374.9673156738281, -356.9549560546875, -338.942626953125, -320.9302673339844, -302.91790771484375, -284.90557861328125, -266.8932189941406, -248.88087463378906, -230.8685302734375, -212.85618591308594, -194.84384155273438, -176.83148193359375, -158.8191375732422, -140.80679321289062, -122.79444122314453, -104.78208923339844, -86.76974487304688, -68.75740051269531, -50.74504852294922, -32.73270034790039, -14.720352172851562, 3.2919921875, 21.304344177246094, 39.31669616699219, 57.32904052734375, 75.34138488769531, 93.3537368774414, 111.3660888671875, 129.37843322753906, 147.39077758789062, 165.40313720703125, 183.4154815673828, 201.42782592773438, 219.44017028808594, 237.4525146484375, 255.46487426757812, 273.47723388671875, 291.48956298828125, 309.5019226074219, 327.5142822265625, 345.526611328125, 363.5389709472656, 381.5513000488281, 399.56365966796875, 417.57598876953125, 435.5883483886719, 453.6007080078125, 471.613037109375, 489.6253967285156, 507.63775634765625, 525.6500854492188, 543.6624145507812, 561.6748046875, 579.6871337890625, 597.699462890625, 615.7118530273438, 633.7241821289062]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 13.0, 17.0, 6.0, 12.0, 24.0, 22.0, 25.0, 25.0, 39.0, 44.0, 44.0, 48.0, 49.0, 63.0, 65.0, 61.0, 63.0, 63.0, 50.0, 39.0, 32.0, 31.0, 30.0, 33.0, 22.0, 22.0, 10.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-232.88919067382812, -226.7714080810547, -220.65362548828125, -214.53582763671875, -208.4180450439453, -202.30026245117188, -196.18247985839844, -190.064697265625, -183.9468994140625, -177.82911682128906, -171.71133422851562, -165.59353637695312, -159.4757537841797, -153.35797119140625, -147.2401885986328, -141.12240600585938, -135.00462341308594, -128.8868408203125, -122.76905059814453, -116.6512680053711, -110.53347778320312, -104.41569519042969, -98.29791259765625, -92.18013000488281, -86.06233978271484, -79.9445571899414, -73.82676696777344, -67.708984375, -61.5911979675293, -55.473411560058594, -49.355628967285156, -43.23784255981445, -37.12005615234375, -31.002269744873047, -24.884485244750977, -18.766700744628906, -12.648914337158203, -6.5311279296875, -0.4133453369140625, 5.704441070556641, 11.822227478027344, 17.940013885498047, 24.057798385620117, 30.175582885742188, 36.29336929321289, 42.411155700683594, 48.52893829345703, 54.646724700927734, 60.76451110839844, 66.88229370117188, 73.00008392333984, 79.11786651611328, 85.23565673828125, 91.35343933105469, 97.47122192382812, 103.58900451660156, 109.70679473876953, 115.82457733154297, 121.94236755371094, 128.06015014648438, 134.1779327392578, 140.29571533203125, 146.41351318359375, 152.5312957763672, 158.64907836914062]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 7.0, 15.0, 18.0, 11.0, 29.0, 57.0, 78.0, 123.0, 177.0, 317.0, 534.0, 1027.0, 1856.0, 3789.0, 8344.0, 19460.0, 50334.0, 155024.0, 431578.0, 249975.0, 76224.0, 27791.0, 11331.0, 5163.0, 2327.0, 1284.0, 658.0, 354.0, 238.0, 131.0, 72.0, 78.0, 40.0, 24.0, 25.0, 12.0, 14.0, 5.0, 5.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.3125, -41.9013671875, -40.490234375, -39.0791015625, -37.66796875, -36.2568359375, -34.845703125, -33.4345703125, -32.0234375, -30.6123046875, -29.201171875, -27.7900390625, -26.37890625, -24.9677734375, -23.556640625, -22.1455078125, -20.734375, -19.3232421875, -17.912109375, -16.5009765625, -15.08984375, -13.6787109375, -12.267578125, -10.8564453125, -9.4453125, -8.0341796875, -6.623046875, -5.2119140625, -3.80078125, -2.3896484375, -0.978515625, 0.4326171875, 1.84375, 3.2548828125, 4.666015625, 6.0771484375, 7.48828125, 8.8994140625, 10.310546875, 11.7216796875, 13.1328125, 14.5439453125, 15.955078125, 17.3662109375, 18.77734375, 20.1884765625, 21.599609375, 23.0107421875, 24.421875, 25.8330078125, 27.244140625, 28.6552734375, 30.06640625, 31.4775390625, 32.888671875, 34.2998046875, 35.7109375, 37.1220703125, 38.533203125, 39.9443359375, 41.35546875, 42.7666015625, 44.177734375, 45.5888671875, 47.0]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 8.0, 16.0, 10.0, 20.0, 19.0, 31.0, 27.0, 43.0, 55.0, 54.0, 59.0, 71.0, 60.0, 46.0, 66.0, 68.0, 54.0, 45.0, 44.0, 34.0, 29.0, 24.0, 30.0, 18.0, 12.0, 14.0, 11.0, 3.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.921875, -20.2099609375, -19.498046875, -18.7861328125, -18.07421875, -17.3623046875, -16.650390625, -15.9384765625, -15.2265625, -14.5146484375, -13.802734375, -13.0908203125, -12.37890625, -11.6669921875, -10.955078125, -10.2431640625, -9.53125, -8.8193359375, -8.107421875, -7.3955078125, -6.68359375, -5.9716796875, -5.259765625, -4.5478515625, -3.8359375, -3.1240234375, -2.412109375, -1.7001953125, -0.98828125, -0.2763671875, 0.435546875, 1.1474609375, 1.859375, 2.5712890625, 3.283203125, 3.9951171875, 4.70703125, 5.4189453125, 6.130859375, 6.8427734375, 7.5546875, 8.2666015625, 8.978515625, 9.6904296875, 10.40234375, 11.1142578125, 11.826171875, 12.5380859375, 13.25, 13.9619140625, 14.673828125, 15.3857421875, 16.09765625, 16.8095703125, 17.521484375, 18.2333984375, 18.9453125, 19.6572265625, 20.369140625, 21.0810546875, 21.79296875, 22.5048828125, 23.216796875, 23.9287109375, 24.640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 5.0, 5.0, 10.0, 9.0, 17.0, 26.0, 21.0, 33.0, 48.0, 74.0, 108.0, 165.0, 255.0, 483.0, 927.0, 2213.0, 6987.0, 30102.0, 194346.0, 680504.0, 105142.0, 18817.0, 4656.0, 1690.0, 790.0, 409.0, 263.0, 145.0, 76.0, 48.0, 47.0, 35.0, 29.0, 20.0, 11.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-87.0625, -84.90478515625, -82.7470703125, -80.58935546875, -78.431640625, -76.27392578125, -74.1162109375, -71.95849609375, -69.80078125, -67.64306640625, -65.4853515625, -63.32763671875, -61.169921875, -59.01220703125, -56.8544921875, -54.69677734375, -52.5390625, -50.38134765625, -48.2236328125, -46.06591796875, -43.908203125, -41.75048828125, -39.5927734375, -37.43505859375, -35.27734375, -33.11962890625, -30.9619140625, -28.80419921875, -26.646484375, -24.48876953125, -22.3310546875, -20.17333984375, -18.015625, -15.85791015625, -13.7001953125, -11.54248046875, -9.384765625, -7.22705078125, -5.0693359375, -2.91162109375, -0.75390625, 1.40380859375, 3.5615234375, 5.71923828125, 7.876953125, 10.03466796875, 12.1923828125, 14.35009765625, 16.5078125, 18.66552734375, 20.8232421875, 22.98095703125, 25.138671875, 27.29638671875, 29.4541015625, 31.61181640625, 33.76953125, 35.92724609375, 38.0849609375, 40.24267578125, 42.400390625, 44.55810546875, 46.7158203125, 48.87353515625, 51.03125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 5.0, 12.0, 6.0, 8.0, 15.0, 13.0, 16.0, 15.0, 23.0, 23.0, 27.0, 22.0, 19.0, 35.0, 26.0, 32.0, 32.0, 37.0, 37.0, 24.0, 42.0, 37.0, 42.0, 47.0, 23.0, 42.0, 33.0, 46.0, 32.0, 30.0, 23.0, 28.0, 19.0, 20.0, 13.0, 19.0, 10.0, 10.0, 8.0, 7.0, 3.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.25, -49.5703125, -47.890625, -46.2109375, -44.53125, -42.8515625, -41.171875, -39.4921875, -37.8125, -36.1328125, -34.453125, -32.7734375, -31.09375, -29.4140625, -27.734375, -26.0546875, -24.375, -22.6953125, -21.015625, -19.3359375, -17.65625, -15.9765625, -14.296875, -12.6171875, -10.9375, -9.2578125, -7.578125, -5.8984375, -4.21875, -2.5390625, -0.859375, 0.8203125, 2.5, 4.1796875, 5.859375, 7.5390625, 9.21875, 10.8984375, 12.578125, 14.2578125, 15.9375, 17.6171875, 19.296875, 20.9765625, 22.65625, 24.3359375, 26.015625, 27.6953125, 29.375, 31.0546875, 32.734375, 34.4140625, 36.09375, 37.7734375, 39.453125, 41.1328125, 42.8125, 44.4921875, 46.171875, 47.8515625, 49.53125, 51.2109375, 52.890625, 54.5703125, 56.25]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 7.0, 0.0, 3.0, 10.0, 9.0, 15.0, 20.0, 25.0, 41.0, 59.0, 101.0, 250.0, 528.0, 1472.0, 6477.0, 74201.0, 863922.0, 91378.0, 7305.0, 1645.0, 525.0, 229.0, 119.0, 58.0, 44.0, 21.0, 16.0, 13.0, 8.0, 8.0, 5.0, 1.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-37.71875, -36.4833984375, -35.248046875, -34.0126953125, -32.77734375, -31.5419921875, -30.306640625, -29.0712890625, -27.8359375, -26.6005859375, -25.365234375, -24.1298828125, -22.89453125, -21.6591796875, -20.423828125, -19.1884765625, -17.953125, -16.7177734375, -15.482421875, -14.2470703125, -13.01171875, -11.7763671875, -10.541015625, -9.3056640625, -8.0703125, -6.8349609375, -5.599609375, -4.3642578125, -3.12890625, -1.8935546875, -0.658203125, 0.5771484375, 1.8125, 3.0478515625, 4.283203125, 5.5185546875, 6.75390625, 7.9892578125, 9.224609375, 10.4599609375, 11.6953125, 12.9306640625, 14.166015625, 15.4013671875, 16.63671875, 17.8720703125, 19.107421875, 20.3427734375, 21.578125, 22.8134765625, 24.048828125, 25.2841796875, 26.51953125, 27.7548828125, 28.990234375, 30.2255859375, 31.4609375, 32.6962890625, 33.931640625, 35.1669921875, 36.40234375, 37.6376953125, 38.873046875, 40.1083984375, 41.34375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 12.0, 4.0, 10.0, 11.0, 11.0, 16.0, 16.0, 22.0, 31.0, 39.0, 53.0, 51.0, 62.0, 78.0, 119.0, 97.0, 66.0, 60.0, 49.0, 38.0, 29.0, 24.0, 16.0, 9.0, 7.0, 14.0, 6.0, 8.0, 2.0, 4.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031871795654296875, -0.0030864179134368896, -0.002985656261444092, -0.002884894609451294, -0.002784132957458496, -0.0026833713054656982, -0.0025826096534729004, -0.0024818480014801025, -0.0023810863494873047, -0.002280324697494507, -0.002179563045501709, -0.002078801393508911, -0.0019780397415161133, -0.0018772780895233154, -0.0017765164375305176, -0.0016757547855377197, -0.0015749931335449219, -0.001474231481552124, -0.0013734698295593262, -0.0012727081775665283, -0.0011719465255737305, -0.0010711848735809326, -0.0009704232215881348, -0.0008696615695953369, -0.0007688999176025391, -0.0006681382656097412, -0.0005673766136169434, -0.0004666149616241455, -0.00036585330963134766, -0.0002650916576385498, -0.00016433000564575195, -6.35683536529541e-05, 3.719329833984375e-05, 0.0001379549503326416, 0.00023871660232543945, 0.0003394782543182373, 0.00044023990631103516, 0.000541001558303833, 0.0006417632102966309, 0.0007425248622894287, 0.0008432865142822266, 0.0009440481662750244, 0.0010448098182678223, 0.0011455714702606201, 0.001246333122253418, 0.0013470947742462158, 0.0014478564262390137, 0.0015486180782318115, 0.0016493797302246094, 0.0017501413822174072, 0.001850903034210205, 0.001951664686203003, 0.0020524263381958008, 0.0021531879901885986, 0.0022539496421813965, 0.0023547112941741943, 0.002455472946166992, 0.00255623459815979, 0.002656996250152588, 0.0027577579021453857, 0.0028585195541381836, 0.0029592812061309814, 0.0030600428581237793, 0.003160804510116577, 0.003261566162109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 11.0, 16.0, 15.0, 32.0, 49.0, 78.0, 124.0, 197.0, 381.0, 763.0, 1741.0, 4964.0, 20367.0, 166016.0, 735871.0, 96833.0, 14318.0, 3791.0, 1410.0, 672.0, 377.0, 176.0, 113.0, 83.0, 52.0, 25.0, 22.0, 16.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.581787109375, -21.75732421875, -20.932861328125, -20.1083984375, -19.283935546875, -18.45947265625, -17.635009765625, -16.810546875, -15.986083984375, -15.16162109375, -14.337158203125, -13.5126953125, -12.688232421875, -11.86376953125, -11.039306640625, -10.21484375, -9.390380859375, -8.56591796875, -7.741455078125, -6.9169921875, -6.092529296875, -5.26806640625, -4.443603515625, -3.619140625, -2.794677734375, -1.97021484375, -1.145751953125, -0.3212890625, 0.503173828125, 1.32763671875, 2.152099609375, 2.9765625, 3.801025390625, 4.62548828125, 5.449951171875, 6.2744140625, 7.098876953125, 7.92333984375, 8.747802734375, 9.572265625, 10.396728515625, 11.22119140625, 12.045654296875, 12.8701171875, 13.694580078125, 14.51904296875, 15.343505859375, 16.16796875, 16.992431640625, 17.81689453125, 18.641357421875, 19.4658203125, 20.290283203125, 21.11474609375, 21.939208984375, 22.763671875, 23.588134765625, 24.41259765625, 25.237060546875, 26.0615234375, 26.885986328125, 27.71044921875, 28.534912109375, 29.359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 11.0, 19.0, 22.0, 43.0, 44.0, 58.0, 58.0, 95.0, 106.0, 110.0, 94.0, 72.0, 68.0, 47.0, 46.0, 27.0, 14.0, 6.0, 11.0, 10.0, 8.0, 1.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.3125, -21.597412109375, -20.88232421875, -20.167236328125, -19.4521484375, -18.737060546875, -18.02197265625, -17.306884765625, -16.591796875, -15.876708984375, -15.16162109375, -14.446533203125, -13.7314453125, -13.016357421875, -12.30126953125, -11.586181640625, -10.87109375, -10.156005859375, -9.44091796875, -8.725830078125, -8.0107421875, -7.295654296875, -6.58056640625, -5.865478515625, -5.150390625, -4.435302734375, -3.72021484375, -3.005126953125, -2.2900390625, -1.574951171875, -0.85986328125, -0.144775390625, 0.5703125, 1.285400390625, 2.00048828125, 2.715576171875, 3.4306640625, 4.145751953125, 4.86083984375, 5.575927734375, 6.291015625, 7.006103515625, 7.72119140625, 8.436279296875, 9.1513671875, 9.866455078125, 10.58154296875, 11.296630859375, 12.01171875, 12.726806640625, 13.44189453125, 14.156982421875, 14.8720703125, 15.587158203125, 16.30224609375, 17.017333984375, 17.732421875, 18.447509765625, 19.16259765625, 19.877685546875, 20.5927734375, 21.307861328125, 22.02294921875, 22.738037109375, 23.453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 14.0, 37.0, 83.0, 142.0, 202.0, 229.0, 148.0, 66.0, 32.0, 13.0, 6.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-354.76593017578125, -336.0225524902344, -317.2791748046875, -298.5357971191406, -279.79241943359375, -261.04901123046875, -242.30563354492188, -223.562255859375, -204.81887817382812, -186.07550048828125, -167.33212280273438, -148.58872985839844, -129.84535217285156, -111.10197448730469, -92.35858917236328, -73.61520385742188, -54.871826171875, -36.12844467163086, -17.38506317138672, 1.3583183288574219, 20.101699829101562, 38.84507751464844, 57.588462829589844, 76.33184814453125, 95.07522583007812, 113.818603515625, 132.56198120117188, 151.3053741455078, 170.0487518310547, 188.79212951660156, 207.5355224609375, 226.27890014648438, 245.0223388671875, 263.7657165527344, 282.50909423828125, 301.2524719238281, 319.995849609375, 338.7392578125, 357.4826354980469, 376.22601318359375, 394.9693908691406, 413.7127685546875, 432.4561462402344, 451.19952392578125, 469.94293212890625, 488.686279296875, 507.4296875, 526.173095703125, 544.9164428710938, 563.6598510742188, 582.4031982421875, 601.1466064453125, 619.8899536132812, 638.6333618164062, 657.376708984375, 676.1201171875, 694.863525390625, 713.60693359375, 732.3502807617188, 751.0936889648438, 769.8370361328125, 788.5804443359375, 807.3237915039062, 826.0671997070312, 844.810546875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 2.0, 7.0, 5.0, 10.0, 7.0, 4.0, 13.0, 13.0, 16.0, 15.0, 17.0, 21.0, 28.0, 22.0, 23.0, 36.0, 39.0, 42.0, 35.0, 46.0, 44.0, 56.0, 52.0, 38.0, 47.0, 38.0, 37.0, 34.0, 29.0, 34.0, 31.0, 26.0, 22.0, 25.0, 13.0, 13.0, 8.0, 14.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-239.80885314941406, -232.10250854492188, -224.39614868164062, -216.68980407714844, -208.98345947265625, -201.27711486816406, -193.57077026367188, -185.86441040039062, -178.15806579589844, -170.45172119140625, -162.745361328125, -155.0390167236328, -147.33267211914062, -139.62632751464844, -131.91998291015625, -124.213623046875, -116.50727844238281, -108.80093383789062, -101.0945816040039, -93.38822937011719, -85.681884765625, -77.97554016113281, -70.2691879272461, -62.56283950805664, -54.85649108886719, -47.150142669677734, -39.44379425048828, -31.737445831298828, -24.031097412109375, -16.324748992919922, -8.618400573730469, -0.9120521545410156, 6.794281005859375, 14.500629425048828, 22.20697784423828, 29.913326263427734, 37.61967468261719, 45.32602310180664, 53.032371520996094, 60.73871994018555, 68.445068359375, 76.15141296386719, 83.8577651977539, 91.56411743164062, 99.27046203613281, 106.976806640625, 114.68315887451172, 122.38951110839844, 130.09585571289062, 137.8022003173828, 145.508544921875, 153.21490478515625, 160.92124938964844, 168.62759399414062, 176.33395385742188, 184.04029846191406, 191.74664306640625, 199.45298767089844, 207.15933227539062, 214.86569213867188, 222.57203674316406, 230.27838134765625, 237.9847412109375, 245.6910858154297, 253.39743041992188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 5.0, 13.0, 17.0, 14.0, 30.0, 39.0, 59.0, 100.0, 165.0, 301.0, 518.0, 1005.0, 2194.0, 4992.0, 12806.0, 38807.0, 147231.0, 895032.0, 2398496.0, 544207.0, 102121.0, 28669.0, 9783.0, 3852.0, 1763.0, 837.0, 460.0, 266.0, 151.0, 89.0, 68.0, 46.0, 37.0, 30.0, 14.0, 12.0, 15.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.46875, -22.6416015625, -21.814453125, -20.9873046875, -20.16015625, -19.3330078125, -18.505859375, -17.6787109375, -16.8515625, -16.0244140625, -15.197265625, -14.3701171875, -13.54296875, -12.7158203125, -11.888671875, -11.0615234375, -10.234375, -9.4072265625, -8.580078125, -7.7529296875, -6.92578125, -6.0986328125, -5.271484375, -4.4443359375, -3.6171875, -2.7900390625, -1.962890625, -1.1357421875, -0.30859375, 0.5185546875, 1.345703125, 2.1728515625, 3.0, 3.8271484375, 4.654296875, 5.4814453125, 6.30859375, 7.1357421875, 7.962890625, 8.7900390625, 9.6171875, 10.4443359375, 11.271484375, 12.0986328125, 12.92578125, 13.7529296875, 14.580078125, 15.4072265625, 16.234375, 17.0615234375, 17.888671875, 18.7158203125, 19.54296875, 20.3701171875, 21.197265625, 22.0244140625, 22.8515625, 23.6787109375, 24.505859375, 25.3330078125, 26.16015625, 26.9873046875, 27.814453125, 28.6416015625, 29.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 11.0, 8.0, 13.0, 23.0, 33.0, 30.0, 39.0, 42.0, 66.0, 65.0, 56.0, 50.0, 62.0, 83.0, 68.0, 54.0, 57.0, 51.0, 37.0, 40.0, 30.0, 21.0, 14.0, 9.0, 13.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-22.296875, -21.5703125, -20.84375, -20.1171875, -19.390625, -18.6640625, -17.9375, -17.2109375, -16.484375, -15.7578125, -15.03125, -14.3046875, -13.578125, -12.8515625, -12.125, -11.3984375, -10.671875, -9.9453125, -9.21875, -8.4921875, -7.765625, -7.0390625, -6.3125, -5.5859375, -4.859375, -4.1328125, -3.40625, -2.6796875, -1.953125, -1.2265625, -0.5, 0.2265625, 0.953125, 1.6796875, 2.40625, 3.1328125, 3.859375, 4.5859375, 5.3125, 6.0390625, 6.765625, 7.4921875, 8.21875, 8.9453125, 9.671875, 10.3984375, 11.125, 11.8515625, 12.578125, 13.3046875, 14.03125, 14.7578125, 15.484375, 16.2109375, 16.9375, 17.6640625, 18.390625, 19.1171875, 19.84375, 20.5703125, 21.296875, 22.0234375, 22.75, 23.4765625, 24.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 0.0, 5.0, 14.0, 13.0, 18.0, 24.0, 41.0, 70.0, 105.0, 217.0, 412.0, 949.0, 2695.0, 8453.0, 34324.0, 196254.0, 2555527.0, 1248742.0, 113224.0, 23144.0, 6357.0, 2123.0, 765.0, 375.0, 164.0, 106.0, 53.0, 47.0, 16.0, 17.0, 10.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.591796875, -38.30859375, -37.025390625, -35.7421875, -34.458984375, -33.17578125, -31.892578125, -30.609375, -29.326171875, -28.04296875, -26.759765625, -25.4765625, -24.193359375, -22.91015625, -21.626953125, -20.34375, -19.060546875, -17.77734375, -16.494140625, -15.2109375, -13.927734375, -12.64453125, -11.361328125, -10.078125, -8.794921875, -7.51171875, -6.228515625, -4.9453125, -3.662109375, -2.37890625, -1.095703125, 0.1875, 1.470703125, 2.75390625, 4.037109375, 5.3203125, 6.603515625, 7.88671875, 9.169921875, 10.453125, 11.736328125, 13.01953125, 14.302734375, 15.5859375, 16.869140625, 18.15234375, 19.435546875, 20.71875, 22.001953125, 23.28515625, 24.568359375, 25.8515625, 27.134765625, 28.41796875, 29.701171875, 30.984375, 32.267578125, 33.55078125, 34.833984375, 36.1171875, 37.400390625, 38.68359375, 39.966796875, 41.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 7.0, 9.0, 12.0, 15.0, 12.0, 20.0, 29.0, 37.0, 44.0, 58.0, 76.0, 105.0, 130.0, 192.0, 296.0, 389.0, 503.0, 505.0, 430.0, 313.0, 224.0, 156.0, 127.0, 87.0, 54.0, 42.0, 40.0, 35.0, 25.0, 22.0, 16.0, 8.0, 8.0, 6.0, 7.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-30.109375, -29.074951171875, -28.04052734375, -27.006103515625, -25.9716796875, -24.937255859375, -23.90283203125, -22.868408203125, -21.833984375, -20.799560546875, -19.76513671875, -18.730712890625, -17.6962890625, -16.661865234375, -15.62744140625, -14.593017578125, -13.55859375, -12.524169921875, -11.48974609375, -10.455322265625, -9.4208984375, -8.386474609375, -7.35205078125, -6.317626953125, -5.283203125, -4.248779296875, -3.21435546875, -2.179931640625, -1.1455078125, -0.111083984375, 0.92333984375, 1.957763671875, 2.9921875, 4.026611328125, 5.06103515625, 6.095458984375, 7.1298828125, 8.164306640625, 9.19873046875, 10.233154296875, 11.267578125, 12.302001953125, 13.33642578125, 14.370849609375, 15.4052734375, 16.439697265625, 17.47412109375, 18.508544921875, 19.54296875, 20.577392578125, 21.61181640625, 22.646240234375, 23.6806640625, 24.715087890625, 25.74951171875, 26.783935546875, 27.818359375, 28.852783203125, 29.88720703125, 30.921630859375, 31.9560546875, 32.990478515625, 34.02490234375, 35.059326171875, 36.09375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 13.0, 19.0, 25.0, 63.0, 154.0, 198.0, 206.0, 161.0, 80.0, 43.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.93560791015625, -351.4669189453125, -333.9981994628906, -316.52947998046875, -299.060791015625, -281.59210205078125, -264.1233825683594, -246.65467834472656, -229.18597412109375, -211.71726989746094, -194.24856567382812, -176.7798614501953, -159.3111572265625, -141.8424530029297, -124.37374877929688, -106.90504455566406, -89.43634033203125, -71.96763610839844, -54.498931884765625, -37.03022766113281, -19.5615234375, -2.0928192138671875, 15.375885009765625, 32.84458923339844, 50.31329345703125, 67.78199768066406, 85.25070190429688, 102.71940612792969, 120.1881103515625, 137.6568145751953, 155.12551879882812, 172.59422302246094, 190.0628662109375, 207.5315704345703, 225.00027465820312, 242.46897888183594, 259.93768310546875, 277.4063720703125, 294.8750915527344, 312.34381103515625, 329.8125, 347.28118896484375, 364.7499084472656, 382.2186279296875, 399.68731689453125, 417.156005859375, 434.6247253417969, 452.09344482421875, 469.5621337890625, 487.03082275390625, 504.4995422363281, 521.96826171875, 539.4369506835938, 556.9056396484375, 574.3743896484375, 591.8430786132812, 609.311767578125, 626.7804565429688, 644.2491455078125, 661.7178955078125, 679.1865844726562, 696.6552734375, 714.1240234375, 731.5927124023438, 749.0614013671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 25.0, 16.0, 35.0, 36.0, 47.0, 49.0, 65.0, 56.0, 52.0, 84.0, 81.0, 71.0, 64.0, 61.0, 40.0, 42.0, 34.0, 29.0, 23.0, 11.0, 17.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.9528045654297, -219.63490295410156, -210.3170166015625, -200.99911499023438, -191.68121337890625, -182.36331176757812, -173.04541015625, -163.72752380371094, -154.4096221923828, -145.0917205810547, -135.77383422851562, -126.4559326171875, -117.13803100585938, -107.82012939453125, -98.50223541259766, -89.18434143066406, -79.86643981933594, -70.54853820800781, -61.23064422607422, -51.91274642944336, -42.5948486328125, -33.27695083618164, -23.95905303955078, -14.641159057617188, -5.3232574462890625, 3.994640350341797, 13.312538146972656, 22.630435943603516, 31.948333740234375, 41.266231536865234, 50.584129333496094, 59.90202331542969, 69.21990966796875, 78.53781127929688, 87.85570526123047, 97.17359924316406, 106.49150085449219, 115.80940246582031, 125.1272964477539, 134.4451904296875, 143.76309204101562, 153.08099365234375, 162.39889526367188, 171.71678161621094, 181.03468322753906, 190.3525848388672, 199.67047119140625, 208.98837280273438, 218.3062744140625, 227.62417602539062, 236.94207763671875, 246.2599639892578, 255.57786560058594, 264.895751953125, 274.2136535644531, 283.53155517578125, 292.8494567871094, 302.1673583984375, 311.4852600097656, 320.80316162109375, 330.12103271484375, 339.4389343261719, 348.7568359375, 358.0747375488281, 367.39263916015625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 14.0, 11.0, 14.0, 17.0, 28.0, 43.0, 62.0, 77.0, 118.0, 162.0, 280.0, 440.0, 772.0, 1412.0, 2620.0, 5191.0, 11386.0, 27034.0, 65894.0, 157826.0, 332175.0, 255070.0, 108109.0, 44473.0, 18664.0, 8127.0, 3883.0, 1930.0, 1061.0, 602.0, 345.0, 214.0, 140.0, 97.0, 56.0, 58.0, 41.0, 38.0, 18.0, 16.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-35.96875, -34.87158203125, -33.7744140625, -32.67724609375, -31.580078125, -30.48291015625, -29.3857421875, -28.28857421875, -27.19140625, -26.09423828125, -24.9970703125, -23.89990234375, -22.802734375, -21.70556640625, -20.6083984375, -19.51123046875, -18.4140625, -17.31689453125, -16.2197265625, -15.12255859375, -14.025390625, -12.92822265625, -11.8310546875, -10.73388671875, -9.63671875, -8.53955078125, -7.4423828125, -6.34521484375, -5.248046875, -4.15087890625, -3.0537109375, -1.95654296875, -0.859375, 0.23779296875, 1.3349609375, 2.43212890625, 3.529296875, 4.62646484375, 5.7236328125, 6.82080078125, 7.91796875, 9.01513671875, 10.1123046875, 11.20947265625, 12.306640625, 13.40380859375, 14.5009765625, 15.59814453125, 16.6953125, 17.79248046875, 18.8896484375, 19.98681640625, 21.083984375, 22.18115234375, 23.2783203125, 24.37548828125, 25.47265625, 26.56982421875, 27.6669921875, 28.76416015625, 29.861328125, 30.95849609375, 32.0556640625, 33.15283203125, 34.25]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 12.0, 2.0, 9.0, 11.0, 13.0, 24.0, 30.0, 23.0, 38.0, 45.0, 54.0, 58.0, 59.0, 61.0, 72.0, 64.0, 62.0, 56.0, 55.0, 43.0, 47.0, 41.0, 35.0, 29.0, 17.0, 12.0, 10.0, 3.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.3125, -20.599365234375, -19.88623046875, -19.173095703125, -18.4599609375, -17.746826171875, -17.03369140625, -16.320556640625, -15.607421875, -14.894287109375, -14.18115234375, -13.468017578125, -12.7548828125, -12.041748046875, -11.32861328125, -10.615478515625, -9.90234375, -9.189208984375, -8.47607421875, -7.762939453125, -7.0498046875, -6.336669921875, -5.62353515625, -4.910400390625, -4.197265625, -3.484130859375, -2.77099609375, -2.057861328125, -1.3447265625, -0.631591796875, 0.08154296875, 0.794677734375, 1.5078125, 2.220947265625, 2.93408203125, 3.647216796875, 4.3603515625, 5.073486328125, 5.78662109375, 6.499755859375, 7.212890625, 7.926025390625, 8.63916015625, 9.352294921875, 10.0654296875, 10.778564453125, 11.49169921875, 12.204833984375, 12.91796875, 13.631103515625, 14.34423828125, 15.057373046875, 15.7705078125, 16.483642578125, 17.19677734375, 17.909912109375, 18.623046875, 19.336181640625, 20.04931640625, 20.762451171875, 21.4755859375, 22.188720703125, 22.90185546875, 23.614990234375, 24.328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 8.0, 4.0, 18.0, 15.0, 26.0, 32.0, 39.0, 60.0, 91.0, 155.0, 205.0, 368.0, 604.0, 1089.0, 2167.0, 5434.0, 30777.0, 475876.0, 490164.0, 30936.0, 5622.0, 2171.0, 1049.0, 620.0, 347.0, 221.0, 140.0, 89.0, 75.0, 44.0, 28.0, 21.0, 16.0, 17.0, 7.0, 8.0, 8.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.1875, -100.3212890625, -97.455078125, -94.5888671875, -91.72265625, -88.8564453125, -85.990234375, -83.1240234375, -80.2578125, -77.3916015625, -74.525390625, -71.6591796875, -68.79296875, -65.9267578125, -63.060546875, -60.1943359375, -57.328125, -54.4619140625, -51.595703125, -48.7294921875, -45.86328125, -42.9970703125, -40.130859375, -37.2646484375, -34.3984375, -31.5322265625, -28.666015625, -25.7998046875, -22.93359375, -20.0673828125, -17.201171875, -14.3349609375, -11.46875, -8.6025390625, -5.736328125, -2.8701171875, -0.00390625, 2.8623046875, 5.728515625, 8.5947265625, 11.4609375, 14.3271484375, 17.193359375, 20.0595703125, 22.92578125, 25.7919921875, 28.658203125, 31.5244140625, 34.390625, 37.2568359375, 40.123046875, 42.9892578125, 45.85546875, 48.7216796875, 51.587890625, 54.4541015625, 57.3203125, 60.1865234375, 63.052734375, 65.9189453125, 68.78515625, 71.6513671875, 74.517578125, 77.3837890625, 80.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 1.0, 8.0, 8.0, 7.0, 9.0, 14.0, 17.0, 22.0, 22.0, 37.0, 30.0, 32.0, 32.0, 52.0, 58.0, 34.0, 53.0, 54.0, 46.0, 51.0, 38.0, 39.0, 35.0, 44.0, 36.0, 40.0, 29.0, 30.0, 32.0, 13.0, 16.0, 18.0, 12.0, 7.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.0, -66.5927734375, -64.185546875, -61.7783203125, -59.37109375, -56.9638671875, -54.556640625, -52.1494140625, -49.7421875, -47.3349609375, -44.927734375, -42.5205078125, -40.11328125, -37.7060546875, -35.298828125, -32.8916015625, -30.484375, -28.0771484375, -25.669921875, -23.2626953125, -20.85546875, -18.4482421875, -16.041015625, -13.6337890625, -11.2265625, -8.8193359375, -6.412109375, -4.0048828125, -1.59765625, 0.8095703125, 3.216796875, 5.6240234375, 8.03125, 10.4384765625, 12.845703125, 15.2529296875, 17.66015625, 20.0673828125, 22.474609375, 24.8818359375, 27.2890625, 29.6962890625, 32.103515625, 34.5107421875, 36.91796875, 39.3251953125, 41.732421875, 44.1396484375, 46.546875, 48.9541015625, 51.361328125, 53.7685546875, 56.17578125, 58.5830078125, 60.990234375, 63.3974609375, 65.8046875, 68.2119140625, 70.619140625, 73.0263671875, 75.43359375, 77.8408203125, 80.248046875, 82.6552734375, 85.0625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 11.0, 13.0, 16.0, 27.0, 30.0, 61.0, 104.0, 144.0, 303.0, 625.0, 1649.0, 7050.0, 57928.0, 744085.0, 212395.0, 18881.0, 3225.0, 973.0, 433.0, 218.0, 122.0, 78.0, 44.0, 28.0, 24.0, 11.0, 15.0, 12.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.546875, -24.7900390625, -24.033203125, -23.2763671875, -22.51953125, -21.7626953125, -21.005859375, -20.2490234375, -19.4921875, -18.7353515625, -17.978515625, -17.2216796875, -16.46484375, -15.7080078125, -14.951171875, -14.1943359375, -13.4375, -12.6806640625, -11.923828125, -11.1669921875, -10.41015625, -9.6533203125, -8.896484375, -8.1396484375, -7.3828125, -6.6259765625, -5.869140625, -5.1123046875, -4.35546875, -3.5986328125, -2.841796875, -2.0849609375, -1.328125, -0.5712890625, 0.185546875, 0.9423828125, 1.69921875, 2.4560546875, 3.212890625, 3.9697265625, 4.7265625, 5.4833984375, 6.240234375, 6.9970703125, 7.75390625, 8.5107421875, 9.267578125, 10.0244140625, 10.78125, 11.5380859375, 12.294921875, 13.0517578125, 13.80859375, 14.5654296875, 15.322265625, 16.0791015625, 16.8359375, 17.5927734375, 18.349609375, 19.1064453125, 19.86328125, 20.6201171875, 21.376953125, 22.1337890625, 22.890625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 6.0, 9.0, 15.0, 16.0, 12.0, 19.0, 19.0, 21.0, 29.0, 39.0, 52.0, 39.0, 75.0, 108.0, 106.0, 92.0, 61.0, 46.0, 45.0, 31.0, 20.0, 20.0, 15.0, 14.0, 7.0, 12.0, 9.0, 8.0, 13.0, 5.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00330352783203125, -0.003193795680999756, -0.0030840635299682617, -0.0029743313789367676, -0.0028645992279052734, -0.0027548670768737793, -0.002645134925842285, -0.002535402774810791, -0.002425670623779297, -0.0023159384727478027, -0.0022062063217163086, -0.0020964741706848145, -0.0019867420196533203, -0.0018770098686218262, -0.001767277717590332, -0.0016575455665588379, -0.0015478134155273438, -0.0014380812644958496, -0.0013283491134643555, -0.0012186169624328613, -0.0011088848114013672, -0.000999152660369873, -0.0008894205093383789, -0.0007796883583068848, -0.0006699562072753906, -0.0005602240562438965, -0.00045049190521240234, -0.0003407597541809082, -0.00023102760314941406, -0.00012129545211791992, -1.1563301086425781e-05, 9.816884994506836e-05, 0.0002079010009765625, 0.00031763315200805664, 0.0004273653030395508, 0.0005370974540710449, 0.0006468296051025391, 0.0007565617561340332, 0.0008662939071655273, 0.0009760260581970215, 0.0010857582092285156, 0.0011954903602600098, 0.001305222511291504, 0.001414954662322998, 0.0015246868133544922, 0.0016344189643859863, 0.0017441511154174805, 0.0018538832664489746, 0.0019636154174804688, 0.002073347568511963, 0.002183079719543457, 0.002292811870574951, 0.0024025440216064453, 0.0025122761726379395, 0.0026220083236694336, 0.0027317404747009277, 0.002841472625732422, 0.002951204776763916, 0.00306093692779541, 0.0031706690788269043, 0.0032804012298583984, 0.0033901333808898926, 0.0034998655319213867, 0.003609597682952881, 0.003719329833984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 16.0, 18.0, 28.0, 59.0, 46.0, 67.0, 84.0, 154.0, 224.0, 330.0, 518.0, 869.0, 1738.0, 3684.0, 10095.0, 41938.0, 302061.0, 596766.0, 66708.0, 13624.0, 4622.0, 2009.0, 1043.0, 604.0, 360.0, 253.0, 166.0, 129.0, 84.0, 47.0, 31.0, 34.0, 25.0, 23.0, 16.0, 5.0, 8.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.0146484375, -13.498046875, -12.9814453125, -12.46484375, -11.9482421875, -11.431640625, -10.9150390625, -10.3984375, -9.8818359375, -9.365234375, -8.8486328125, -8.33203125, -7.8154296875, -7.298828125, -6.7822265625, -6.265625, -5.7490234375, -5.232421875, -4.7158203125, -4.19921875, -3.6826171875, -3.166015625, -2.6494140625, -2.1328125, -1.6162109375, -1.099609375, -0.5830078125, -0.06640625, 0.4501953125, 0.966796875, 1.4833984375, 2.0, 2.5166015625, 3.033203125, 3.5498046875, 4.06640625, 4.5830078125, 5.099609375, 5.6162109375, 6.1328125, 6.6494140625, 7.166015625, 7.6826171875, 8.19921875, 8.7158203125, 9.232421875, 9.7490234375, 10.265625, 10.7822265625, 11.298828125, 11.8154296875, 12.33203125, 12.8486328125, 13.365234375, 13.8818359375, 14.3984375, 14.9150390625, 15.431640625, 15.9482421875, 16.46484375, 16.9814453125, 17.498046875, 18.0146484375, 18.53125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 14.0, 18.0, 11.0, 21.0, 30.0, 28.0, 32.0, 38.0, 48.0, 66.0, 55.0, 72.0, 86.0, 68.0, 80.0, 61.0, 54.0, 41.0, 35.0, 20.0, 30.0, 23.0, 15.0, 14.0, 2.0, 10.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.3974609375, -14.888671875, -14.3798828125, -13.87109375, -13.3623046875, -12.853515625, -12.3447265625, -11.8359375, -11.3271484375, -10.818359375, -10.3095703125, -9.80078125, -9.2919921875, -8.783203125, -8.2744140625, -7.765625, -7.2568359375, -6.748046875, -6.2392578125, -5.73046875, -5.2216796875, -4.712890625, -4.2041015625, -3.6953125, -3.1865234375, -2.677734375, -2.1689453125, -1.66015625, -1.1513671875, -0.642578125, -0.1337890625, 0.375, 0.8837890625, 1.392578125, 1.9013671875, 2.41015625, 2.9189453125, 3.427734375, 3.9365234375, 4.4453125, 4.9541015625, 5.462890625, 5.9716796875, 6.48046875, 6.9892578125, 7.498046875, 8.0068359375, 8.515625, 9.0244140625, 9.533203125, 10.0419921875, 10.55078125, 11.0595703125, 11.568359375, 12.0771484375, 12.5859375, 13.0947265625, 13.603515625, 14.1123046875, 14.62109375, 15.1298828125, 15.638671875, 16.1474609375, 16.65625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 10.0, 16.0, 15.0, 26.0, 65.0, 117.0, 190.0, 245.0, 139.0, 94.0, 39.0, 20.0, 7.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-676.3380737304688, -661.01611328125, -645.694091796875, -630.3721313476562, -615.0501708984375, -599.7281494140625, -584.4061889648438, -569.084228515625, -553.76220703125, -538.4402465820312, -523.1182250976562, -507.7962646484375, -492.4742736816406, -477.15228271484375, -461.830322265625, -446.5083312988281, -431.18634033203125, -415.8643493652344, -400.5423889160156, -385.22039794921875, -369.8984069824219, -354.576416015625, -339.25445556640625, -323.9324645996094, -308.6105041503906, -293.28851318359375, -277.966552734375, -262.6445617675781, -247.32257080078125, -232.00059509277344, -216.67861938476562, -201.35662841796875, -186.03463745117188, -170.71266174316406, -155.3906707763672, -140.06869506835938, -124.7467041015625, -109.42472839355469, -94.10274505615234, -78.78076171875, -63.458778381347656, -48.13679504394531, -32.81481170654297, -17.49283218383789, -2.170848846435547, 13.151130676269531, 28.473114013671875, 43.79509735107422, 59.11708068847656, 74.4390640258789, 89.76104736328125, 105.08302307128906, 120.40501403808594, 135.72698974609375, 151.04898071289062, 166.37095642089844, 181.69293212890625, 197.01490783691406, 212.33689880371094, 227.65887451171875, 242.98086547851562, 258.3028564453125, 273.62481689453125, 288.9468078613281, 304.268798828125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 4.0, 9.0, 12.0, 6.0, 21.0, 15.0, 18.0, 37.0, 28.0, 36.0, 42.0, 26.0, 34.0, 55.0, 61.0, 63.0, 94.0, 65.0, 50.0, 39.0, 34.0, 32.0, 31.0, 27.0, 30.0, 19.0, 14.0, 17.0, 19.0, 5.0, 10.0, 4.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-347.7723388671875, -337.8692321777344, -327.96612548828125, -318.0630187988281, -308.159912109375, -298.2568054199219, -288.35369873046875, -278.45062255859375, -268.5474853515625, -258.6443786621094, -248.74127197265625, -238.83816528320312, -228.93505859375, -219.03195190429688, -209.1288604736328, -199.2257537841797, -189.32266235351562, -179.4195556640625, -169.51644897460938, -159.61334228515625, -149.71023559570312, -139.80712890625, -129.90403747558594, -120.00093078613281, -110.09782409667969, -100.19471740722656, -90.29161071777344, -80.38851165771484, -70.48540496826172, -60.582298278808594, -50.679195404052734, -40.776092529296875, -30.872955322265625, -20.969850540161133, -11.06674575805664, -1.1636409759521484, 8.739463806152344, 18.64257049560547, 28.545673370361328, 38.44877624511719, 48.35188293457031, 58.25498962402344, 68.15809631347656, 78.06119537353516, 87.96430206298828, 97.8674087524414, 107.7705078125, 117.67361450195312, 127.57672119140625, 137.47982788085938, 147.3829345703125, 157.28604125976562, 167.18914794921875, 177.09225463867188, 186.99534606933594, 196.89845275878906, 206.8015594482422, 216.7046661376953, 226.60777282714844, 236.51087951660156, 246.41397094726562, 256.31707763671875, 266.2201843261719, 276.123291015625, 286.0263977050781]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 22.0, 37.0, 55.0, 120.0, 229.0, 470.0, 1176.0, 3073.0, 10243.0, 42843.0, 326889.0, 2895487.0, 813525.0, 77343.0, 15426.0, 4471.0, 1523.0, 670.0, 281.0, 147.0, 82.0, 53.0, 41.0, 14.0, 17.0, 10.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.515625, -28.486083984375, -27.45654296875, -26.427001953125, -25.3974609375, -24.367919921875, -23.33837890625, -22.308837890625, -21.279296875, -20.249755859375, -19.22021484375, -18.190673828125, -17.1611328125, -16.131591796875, -15.10205078125, -14.072509765625, -13.04296875, -12.013427734375, -10.98388671875, -9.954345703125, -8.9248046875, -7.895263671875, -6.86572265625, -5.836181640625, -4.806640625, -3.777099609375, -2.74755859375, -1.718017578125, -0.6884765625, 0.341064453125, 1.37060546875, 2.400146484375, 3.4296875, 4.459228515625, 5.48876953125, 6.518310546875, 7.5478515625, 8.577392578125, 9.60693359375, 10.636474609375, 11.666015625, 12.695556640625, 13.72509765625, 14.754638671875, 15.7841796875, 16.813720703125, 17.84326171875, 18.872802734375, 19.90234375, 20.931884765625, 21.96142578125, 22.990966796875, 24.0205078125, 25.050048828125, 26.07958984375, 27.109130859375, 28.138671875, 29.168212890625, 30.19775390625, 31.227294921875, 32.2568359375, 33.286376953125, 34.31591796875, 35.345458984375, 36.375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 8.0, 13.0, 8.0, 19.0, 26.0, 31.0, 28.0, 43.0, 47.0, 48.0, 44.0, 55.0, 65.0, 59.0, 63.0, 54.0, 64.0, 44.0, 44.0, 44.0, 40.0, 31.0, 20.0, 25.0, 17.0, 13.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.515625, -18.83740234375, -18.1591796875, -17.48095703125, -16.802734375, -16.12451171875, -15.4462890625, -14.76806640625, -14.08984375, -13.41162109375, -12.7333984375, -12.05517578125, -11.376953125, -10.69873046875, -10.0205078125, -9.34228515625, -8.6640625, -7.98583984375, -7.3076171875, -6.62939453125, -5.951171875, -5.27294921875, -4.5947265625, -3.91650390625, -3.23828125, -2.56005859375, -1.8818359375, -1.20361328125, -0.525390625, 0.15283203125, 0.8310546875, 1.50927734375, 2.1875, 2.86572265625, 3.5439453125, 4.22216796875, 4.900390625, 5.57861328125, 6.2568359375, 6.93505859375, 7.61328125, 8.29150390625, 8.9697265625, 9.64794921875, 10.326171875, 11.00439453125, 11.6826171875, 12.36083984375, 13.0390625, 13.71728515625, 14.3955078125, 15.07373046875, 15.751953125, 16.43017578125, 17.1083984375, 17.78662109375, 18.46484375, 19.14306640625, 19.8212890625, 20.49951171875, 21.177734375, 21.85595703125, 22.5341796875, 23.21240234375, 23.890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 6.0, 13.0, 14.0, 17.0, 33.0, 58.0, 88.0, 157.0, 297.0, 664.0, 1554.0, 4203.0, 13980.0, 64304.0, 719418.0, 3113223.0, 223387.0, 36680.0, 9658.0, 3442.0, 1452.0, 674.0, 334.0, 230.0, 145.0, 81.0, 49.0, 35.0, 24.0, 15.0, 7.0, 12.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.875, -40.578125, -39.28125, -37.984375, -36.6875, -35.390625, -34.09375, -32.796875, -31.5, -30.203125, -28.90625, -27.609375, -26.3125, -25.015625, -23.71875, -22.421875, -21.125, -19.828125, -18.53125, -17.234375, -15.9375, -14.640625, -13.34375, -12.046875, -10.75, -9.453125, -8.15625, -6.859375, -5.5625, -4.265625, -2.96875, -1.671875, -0.375, 0.921875, 2.21875, 3.515625, 4.8125, 6.109375, 7.40625, 8.703125, 10.0, 11.296875, 12.59375, 13.890625, 15.1875, 16.484375, 17.78125, 19.078125, 20.375, 21.671875, 22.96875, 24.265625, 25.5625, 26.859375, 28.15625, 29.453125, 30.75, 32.046875, 33.34375, 34.640625, 35.9375, 37.234375, 38.53125, 39.828125, 41.125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 7.0, 7.0, 17.0, 15.0, 30.0, 50.0, 65.0, 143.0, 281.0, 551.0, 877.0, 847.0, 520.0, 246.0, 133.0, 86.0, 58.0, 40.0, 23.0, 19.0, 16.0, 10.0, 5.0, 8.0, 4.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.625, -30.90234375, -29.1796875, -27.45703125, -25.734375, -24.01171875, -22.2890625, -20.56640625, -18.84375, -17.12109375, -15.3984375, -13.67578125, -11.953125, -10.23046875, -8.5078125, -6.78515625, -5.0625, -3.33984375, -1.6171875, 0.10546875, 1.828125, 3.55078125, 5.2734375, 6.99609375, 8.71875, 10.44140625, 12.1640625, 13.88671875, 15.609375, 17.33203125, 19.0546875, 20.77734375, 22.5, 24.22265625, 25.9453125, 27.66796875, 29.390625, 31.11328125, 32.8359375, 34.55859375, 36.28125, 38.00390625, 39.7265625, 41.44921875, 43.171875, 44.89453125, 46.6171875, 48.33984375, 50.0625, 51.78515625, 53.5078125, 55.23046875, 56.953125, 58.67578125, 60.3984375, 62.12109375, 63.84375, 65.56640625, 67.2890625, 69.01171875, 70.734375, 72.45703125, 74.1796875, 75.90234375, 77.625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 31.0, 64.0, 131.0, 216.0, 263.0, 143.0, 75.0, 31.0, 15.0, 5.0, 7.0, 4.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-428.302734375, -410.3797607421875, -392.456787109375, -374.5338439941406, -356.6108703613281, -338.6878967285156, -320.76495361328125, -302.84197998046875, -284.91900634765625, -266.99603271484375, -249.0730743408203, -231.15011596679688, -213.22714233398438, -195.30416870117188, -177.38121032714844, -159.458251953125, -141.5352783203125, -123.61231231689453, -105.68934631347656, -87.7663803100586, -69.84341430664062, -51.920448303222656, -33.99748229980469, -16.07451629638672, 1.84844970703125, 19.77141571044922, 37.69438171386719, 55.617347717285156, 73.54031372070312, 91.4632797241211, 109.38624572753906, 127.30921173095703, 145.23223876953125, 163.15521240234375, 181.0781707763672, 199.00112915039062, 216.92410278320312, 234.84707641601562, 252.77003479003906, 270.6929931640625, 288.615966796875, 306.5389404296875, 324.4619140625, 342.3848571777344, 360.3078308105469, 378.2308044433594, 396.15374755859375, 414.07672119140625, 431.99969482421875, 449.92266845703125, 467.84564208984375, 485.7685852050781, 503.6915588378906, 521.614501953125, 539.5374755859375, 557.46044921875, 575.3834228515625, 593.306396484375, 611.2293701171875, 629.15234375, 647.0753173828125, 664.9982299804688, 682.9212036132812, 700.8441772460938, 718.7671508789062]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 10.0, 11.0, 20.0, 13.0, 19.0, 40.0, 39.0, 50.0, 55.0, 52.0, 61.0, 66.0, 57.0, 71.0, 74.0, 67.0, 58.0, 54.0, 35.0, 32.0, 38.0, 20.0, 20.0, 12.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-404.4827880859375, -395.73114013671875, -386.9794921875, -378.22784423828125, -369.4761962890625, -360.72454833984375, -351.972900390625, -343.22125244140625, -334.4696044921875, -325.71795654296875, -316.96630859375, -308.21466064453125, -299.4630126953125, -290.71136474609375, -281.959716796875, -273.20806884765625, -264.4563903808594, -255.70474243164062, -246.95309448242188, -238.20144653320312, -229.44979858398438, -220.69815063476562, -211.9464874267578, -203.19483947753906, -194.4431915283203, -185.69154357910156, -176.9398956298828, -168.18824768066406, -159.43658447265625, -150.6849365234375, -141.93328857421875, -133.181640625, -124.43002319335938, -115.67837524414062, -106.92672729492188, -98.1750717163086, -89.42342376708984, -80.6717758178711, -71.92012023925781, -63.16847229003906, -54.41682434082031, -45.66517639160156, -36.91352462768555, -28.161874771118164, -19.41022491455078, -10.658576965332031, -1.9069252014160156, 6.8447265625, 15.59637451171875, 24.348024368286133, 33.099674224853516, 41.85132598876953, 50.60297393798828, 59.35462188720703, 68.10627746582031, 76.85792541503906, 85.60957336425781, 94.36122131347656, 103.11286926269531, 111.8645248413086, 120.61617279052734, 129.36782836914062, 138.11947631835938, 146.87112426757812, 155.62277221679688]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 11.0, 10.0, 14.0, 20.0, 35.0, 42.0, 54.0, 86.0, 141.0, 198.0, 360.0, 573.0, 1098.0, 1866.0, 3598.0, 6731.0, 13620.0, 30019.0, 71353.0, 190099.0, 372944.0, 212491.0, 79620.0, 33091.0, 14969.0, 7093.0, 3609.0, 1986.0, 1087.0, 638.0, 431.0, 245.0, 155.0, 78.0, 55.0, 51.0, 26.0, 19.0, 15.0, 9.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.607666015625, -29.60595703125, -28.604248046875, -27.6025390625, -26.600830078125, -25.59912109375, -24.597412109375, -23.595703125, -22.593994140625, -21.59228515625, -20.590576171875, -19.5888671875, -18.587158203125, -17.58544921875, -16.583740234375, -15.58203125, -14.580322265625, -13.57861328125, -12.576904296875, -11.5751953125, -10.573486328125, -9.57177734375, -8.570068359375, -7.568359375, -6.566650390625, -5.56494140625, -4.563232421875, -3.5615234375, -2.559814453125, -1.55810546875, -0.556396484375, 0.4453125, 1.447021484375, 2.44873046875, 3.450439453125, 4.4521484375, 5.453857421875, 6.45556640625, 7.457275390625, 8.458984375, 9.460693359375, 10.46240234375, 11.464111328125, 12.4658203125, 13.467529296875, 14.46923828125, 15.470947265625, 16.47265625, 17.474365234375, 18.47607421875, 19.477783203125, 20.4794921875, 21.481201171875, 22.48291015625, 23.484619140625, 24.486328125, 25.488037109375, 26.48974609375, 27.491455078125, 28.4931640625, 29.494873046875, 30.49658203125, 31.498291015625, 32.5]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 14.0, 9.0, 14.0, 23.0, 18.0, 23.0, 32.0, 39.0, 43.0, 42.0, 67.0, 57.0, 50.0, 53.0, 78.0, 63.0, 55.0, 48.0, 61.0, 38.0, 29.0, 28.0, 22.0, 22.0, 18.0, 6.0, 5.0, 12.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.53125, -18.848388671875, -18.16552734375, -17.482666015625, -16.7998046875, -16.116943359375, -15.43408203125, -14.751220703125, -14.068359375, -13.385498046875, -12.70263671875, -12.019775390625, -11.3369140625, -10.654052734375, -9.97119140625, -9.288330078125, -8.60546875, -7.922607421875, -7.23974609375, -6.556884765625, -5.8740234375, -5.191162109375, -4.50830078125, -3.825439453125, -3.142578125, -2.459716796875, -1.77685546875, -1.093994140625, -0.4111328125, 0.271728515625, 0.95458984375, 1.637451171875, 2.3203125, 3.003173828125, 3.68603515625, 4.368896484375, 5.0517578125, 5.734619140625, 6.41748046875, 7.100341796875, 7.783203125, 8.466064453125, 9.14892578125, 9.831787109375, 10.5146484375, 11.197509765625, 11.88037109375, 12.563232421875, 13.24609375, 13.928955078125, 14.61181640625, 15.294677734375, 15.9775390625, 16.660400390625, 17.34326171875, 18.026123046875, 18.708984375, 19.391845703125, 20.07470703125, 20.757568359375, 21.4404296875, 22.123291015625, 22.80615234375, 23.489013671875, 24.171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 10.0, 15.0, 23.0, 32.0, 41.0, 63.0, 96.0, 156.0, 204.0, 369.0, 530.0, 866.0, 1657.0, 3743.0, 13423.0, 85766.0, 748121.0, 162616.0, 20902.0, 5027.0, 2028.0, 1063.0, 642.0, 378.0, 249.0, 163.0, 110.0, 76.0, 63.0, 29.0, 22.0, 15.0, 14.0, 7.0, 6.0, 7.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-77.0, -74.7109375, -72.421875, -70.1328125, -67.84375, -65.5546875, -63.265625, -60.9765625, -58.6875, -56.3984375, -54.109375, -51.8203125, -49.53125, -47.2421875, -44.953125, -42.6640625, -40.375, -38.0859375, -35.796875, -33.5078125, -31.21875, -28.9296875, -26.640625, -24.3515625, -22.0625, -19.7734375, -17.484375, -15.1953125, -12.90625, -10.6171875, -8.328125, -6.0390625, -3.75, -1.4609375, 0.828125, 3.1171875, 5.40625, 7.6953125, 9.984375, 12.2734375, 14.5625, 16.8515625, 19.140625, 21.4296875, 23.71875, 26.0078125, 28.296875, 30.5859375, 32.875, 35.1640625, 37.453125, 39.7421875, 42.03125, 44.3203125, 46.609375, 48.8984375, 51.1875, 53.4765625, 55.765625, 58.0546875, 60.34375, 62.6328125, 64.921875, 67.2109375, 69.5]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 5.0, 6.0, 6.0, 5.0, 6.0, 6.0, 16.0, 15.0, 14.0, 17.0, 25.0, 36.0, 24.0, 32.0, 32.0, 50.0, 45.0, 40.0, 39.0, 47.0, 47.0, 53.0, 48.0, 52.0, 31.0, 39.0, 32.0, 36.0, 25.0, 19.0, 25.0, 27.0, 13.0, 19.0, 14.0, 14.0, 9.0, 10.0, 1.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-69.1875, -67.2275390625, -65.267578125, -63.3076171875, -61.34765625, -59.3876953125, -57.427734375, -55.4677734375, -53.5078125, -51.5478515625, -49.587890625, -47.6279296875, -45.66796875, -43.7080078125, -41.748046875, -39.7880859375, -37.828125, -35.8681640625, -33.908203125, -31.9482421875, -29.98828125, -28.0283203125, -26.068359375, -24.1083984375, -22.1484375, -20.1884765625, -18.228515625, -16.2685546875, -14.30859375, -12.3486328125, -10.388671875, -8.4287109375, -6.46875, -4.5087890625, -2.548828125, -0.5888671875, 1.37109375, 3.3310546875, 5.291015625, 7.2509765625, 9.2109375, 11.1708984375, 13.130859375, 15.0908203125, 17.05078125, 19.0107421875, 20.970703125, 22.9306640625, 24.890625, 26.8505859375, 28.810546875, 30.7705078125, 32.73046875, 34.6904296875, 36.650390625, 38.6103515625, 40.5703125, 42.5302734375, 44.490234375, 46.4501953125, 48.41015625, 50.3701171875, 52.330078125, 54.2900390625, 56.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 7.0, 12.0, 17.0, 19.0, 38.0, 43.0, 77.0, 92.0, 172.0, 375.0, 731.0, 2084.0, 8908.0, 64161.0, 776486.0, 171333.0, 18342.0, 3527.0, 1047.0, 456.0, 222.0, 134.0, 77.0, 45.0, 35.0, 31.0, 24.0, 14.0, 11.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.79931640625, -16.1455078125, -15.49169921875, -14.837890625, -14.18408203125, -13.5302734375, -12.87646484375, -12.22265625, -11.56884765625, -10.9150390625, -10.26123046875, -9.607421875, -8.95361328125, -8.2998046875, -7.64599609375, -6.9921875, -6.33837890625, -5.6845703125, -5.03076171875, -4.376953125, -3.72314453125, -3.0693359375, -2.41552734375, -1.76171875, -1.10791015625, -0.4541015625, 0.19970703125, 0.853515625, 1.50732421875, 2.1611328125, 2.81494140625, 3.46875, 4.12255859375, 4.7763671875, 5.43017578125, 6.083984375, 6.73779296875, 7.3916015625, 8.04541015625, 8.69921875, 9.35302734375, 10.0068359375, 10.66064453125, 11.314453125, 11.96826171875, 12.6220703125, 13.27587890625, 13.9296875, 14.58349609375, 15.2373046875, 15.89111328125, 16.544921875, 17.19873046875, 17.8525390625, 18.50634765625, 19.16015625, 19.81396484375, 20.4677734375, 21.12158203125, 21.775390625, 22.42919921875, 23.0830078125, 23.73681640625, 24.390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 3.0, 6.0, 7.0, 14.0, 10.0, 17.0, 12.0, 22.0, 27.0, 48.0, 48.0, 82.0, 119.0, 138.0, 111.0, 70.0, 48.0, 43.0, 26.0, 23.0, 17.0, 17.0, 22.0, 13.0, 8.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.00366973876953125, -0.003556668758392334, -0.003443598747253418, -0.003330528736114502, -0.003217458724975586, -0.00310438871383667, -0.002991318702697754, -0.002878248691558838, -0.002765178680419922, -0.002652108669281006, -0.00253903865814209, -0.002425968647003174, -0.002312898635864258, -0.002199828624725342, -0.0020867586135864258, -0.0019736886024475098, -0.0018606185913085938, -0.0017475485801696777, -0.0016344785690307617, -0.0015214085578918457, -0.0014083385467529297, -0.0012952685356140137, -0.0011821985244750977, -0.0010691285133361816, -0.0009560585021972656, -0.0008429884910583496, -0.0007299184799194336, -0.0006168484687805176, -0.0005037784576416016, -0.00039070844650268555, -0.00027763843536376953, -0.00016456842422485352, -5.14984130859375e-05, 6.157159805297852e-05, 0.00017464160919189453, 0.00028771162033081055, 0.00040078163146972656, 0.0005138516426086426, 0.0006269216537475586, 0.0007399916648864746, 0.0008530616760253906, 0.0009661316871643066, 0.0010792016983032227, 0.0011922717094421387, 0.0013053417205810547, 0.0014184117317199707, 0.0015314817428588867, 0.0016445517539978027, 0.0017576217651367188, 0.0018706917762756348, 0.0019837617874145508, 0.002096831798553467, 0.002209901809692383, 0.002322971820831299, 0.002436041831970215, 0.002549111843109131, 0.002662181854248047, 0.002775251865386963, 0.002888321876525879, 0.003001391887664795, 0.003114461898803711, 0.003227531909942627, 0.003340601921081543, 0.003453671932220459, 0.003566741943359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 23.0, 16.0, 22.0, 39.0, 70.0, 167.0, 315.0, 547.0, 1277.0, 3435.0, 14415.0, 161009.0, 797280.0, 57896.0, 7933.0, 2291.0, 950.0, 427.0, 210.0, 101.0, 63.0, 23.0, 20.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.8173828125, -21.181640625, -20.5458984375, -19.91015625, -19.2744140625, -18.638671875, -18.0029296875, -17.3671875, -16.7314453125, -16.095703125, -15.4599609375, -14.82421875, -14.1884765625, -13.552734375, -12.9169921875, -12.28125, -11.6455078125, -11.009765625, -10.3740234375, -9.73828125, -9.1025390625, -8.466796875, -7.8310546875, -7.1953125, -6.5595703125, -5.923828125, -5.2880859375, -4.65234375, -4.0166015625, -3.380859375, -2.7451171875, -2.109375, -1.4736328125, -0.837890625, -0.2021484375, 0.43359375, 1.0693359375, 1.705078125, 2.3408203125, 2.9765625, 3.6123046875, 4.248046875, 4.8837890625, 5.51953125, 6.1552734375, 6.791015625, 7.4267578125, 8.0625, 8.6982421875, 9.333984375, 9.9697265625, 10.60546875, 11.2412109375, 11.876953125, 12.5126953125, 13.1484375, 13.7841796875, 14.419921875, 15.0556640625, 15.69140625, 16.3271484375, 16.962890625, 17.5986328125, 18.234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 9.0, 9.0, 9.0, 24.0, 13.0, 11.0, 16.0, 28.0, 39.0, 37.0, 61.0, 59.0, 70.0, 79.0, 65.0, 90.0, 61.0, 52.0, 38.0, 45.0, 34.0, 27.0, 28.0, 20.0, 7.0, 16.0, 7.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.099853515625, -9.73095703125, -9.362060546875, -8.9931640625, -8.624267578125, -8.25537109375, -7.886474609375, -7.517578125, -7.148681640625, -6.77978515625, -6.410888671875, -6.0419921875, -5.673095703125, -5.30419921875, -4.935302734375, -4.56640625, -4.197509765625, -3.82861328125, -3.459716796875, -3.0908203125, -2.721923828125, -2.35302734375, -1.984130859375, -1.615234375, -1.246337890625, -0.87744140625, -0.508544921875, -0.1396484375, 0.229248046875, 0.59814453125, 0.967041015625, 1.3359375, 1.704833984375, 2.07373046875, 2.442626953125, 2.8115234375, 3.180419921875, 3.54931640625, 3.918212890625, 4.287109375, 4.656005859375, 5.02490234375, 5.393798828125, 5.7626953125, 6.131591796875, 6.50048828125, 6.869384765625, 7.23828125, 7.607177734375, 7.97607421875, 8.344970703125, 8.7138671875, 9.082763671875, 9.45166015625, 9.820556640625, 10.189453125, 10.558349609375, 10.92724609375, 11.296142578125, 11.6650390625, 12.033935546875, 12.40283203125, 12.771728515625, 13.140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 14.0, 39.0, 65.0, 182.0, 284.0, 193.0, 107.0, 49.0, 23.0, 11.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-566.0093383789062, -550.6088256835938, -535.2083740234375, -519.807861328125, -504.4073791503906, -489.00689697265625, -473.6064147949219, -458.2059326171875, -442.805419921875, -427.4049377441406, -412.00445556640625, -396.60394287109375, -381.2034606933594, -365.802978515625, -350.4024963378906, -335.00201416015625, -319.60150146484375, -304.2010192871094, -288.800537109375, -273.4000244140625, -257.9995422363281, -242.59906005859375, -227.19857788085938, -211.79808044433594, -196.39761352539062, -180.99713134765625, -165.5966339111328, -150.19615173339844, -134.795654296875, -119.39517211914062, -103.99468231201172, -88.59419250488281, -73.19369506835938, -57.79320526123047, -42.39271545410156, -26.992229461669922, -11.591739654541016, 3.808746337890625, 19.20923614501953, 34.60972595214844, 50.010215759277344, 65.41070556640625, 80.81119537353516, 96.21168518066406, 111.61216735839844, 127.01265716552734, 142.41314697265625, 157.81362915039062, 173.21412658691406, 188.61460876464844, 204.01510620117188, 219.41558837890625, 234.8160858154297, 250.21656799316406, 265.6170654296875, 281.0175476074219, 296.41802978515625, 311.8185119628906, 327.218994140625, 342.6195068359375, 358.0199890136719, 373.42047119140625, 388.8209533691406, 404.221435546875, 419.6219482421875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 3.0, 4.0, 10.0, 13.0, 12.0, 10.0, 21.0, 23.0, 24.0, 17.0, 26.0, 30.0, 24.0, 29.0, 34.0, 38.0, 48.0, 58.0, 72.0, 65.0, 52.0, 44.0, 41.0, 30.0, 38.0, 34.0, 25.0, 21.0, 26.0, 15.0, 17.0, 14.0, 17.0, 11.0, 10.0, 6.0, 8.0, 4.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.12289428710938, -191.53216552734375, -183.94142150878906, -176.35069274902344, -168.75994873046875, -161.16921997070312, -153.5784912109375, -145.9877471923828, -138.3970184326172, -130.80628967285156, -123.21554565429688, -115.62481689453125, -108.0340805053711, -100.44334411621094, -92.85260772705078, -85.26187133789062, -77.67113494873047, -70.08039855957031, -62.48966598510742, -54.898929595947266, -47.308197021484375, -39.71746063232422, -32.12672424316406, -24.535991668701172, -16.945255279541016, -9.354520797729492, -1.7637853622436523, 5.8269500732421875, 13.417684555053711, 21.008419036865234, 28.59915542602539, 36.18988800048828, 43.78062438964844, 51.371360778808594, 58.962093353271484, 66.55282592773438, 74.14356231689453, 81.73429870605469, 89.32503509521484, 96.915771484375, 104.50650024414062, 112.09723663330078, 119.68797302246094, 127.27870178222656, 134.86944580078125, 142.46017456054688, 150.0509033203125, 157.6416473388672, 165.23239135742188, 172.8231201171875, 180.4138641357422, 188.0045928955078, 195.5953369140625, 203.18606567382812, 210.77679443359375, 218.36753845214844, 225.95826721191406, 233.5489959716797, 241.13973999023438, 248.73046875, 256.3211975097656, 263.91192626953125, 271.502685546875, 279.0934143066406, 286.68414306640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 6.0, 12.0, 22.0, 20.0, 20.0, 43.0, 60.0, 68.0, 96.0, 165.0, 274.0, 484.0, 878.0, 1573.0, 3396.0, 7974.0, 24701.0, 124338.0, 1216053.0, 2452150.0, 297871.0, 43155.0, 11485.0, 4564.0, 2169.0, 1064.0, 610.0, 380.0, 217.0, 128.0, 84.0, 52.0, 35.0, 34.0, 25.0, 21.0, 9.0, 12.0, 6.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.833984375, -24.01171875, -23.189453125, -22.3671875, -21.544921875, -20.72265625, -19.900390625, -19.078125, -18.255859375, -17.43359375, -16.611328125, -15.7890625, -14.966796875, -14.14453125, -13.322265625, -12.5, -11.677734375, -10.85546875, -10.033203125, -9.2109375, -8.388671875, -7.56640625, -6.744140625, -5.921875, -5.099609375, -4.27734375, -3.455078125, -2.6328125, -1.810546875, -0.98828125, -0.166015625, 0.65625, 1.478515625, 2.30078125, 3.123046875, 3.9453125, 4.767578125, 5.58984375, 6.412109375, 7.234375, 8.056640625, 8.87890625, 9.701171875, 10.5234375, 11.345703125, 12.16796875, 12.990234375, 13.8125, 14.634765625, 15.45703125, 16.279296875, 17.1015625, 17.923828125, 18.74609375, 19.568359375, 20.390625, 21.212890625, 22.03515625, 22.857421875, 23.6796875, 24.501953125, 25.32421875, 26.146484375, 26.96875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 7.0, 6.0, 11.0, 13.0, 12.0, 28.0, 18.0, 22.0, 28.0, 38.0, 46.0, 50.0, 47.0, 65.0, 64.0, 53.0, 47.0, 57.0, 66.0, 61.0, 48.0, 40.0, 33.0, 22.0, 22.0, 34.0, 21.0, 11.0, 6.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.640625, -17.972412109375, -17.30419921875, -16.635986328125, -15.9677734375, -15.299560546875, -14.63134765625, -13.963134765625, -13.294921875, -12.626708984375, -11.95849609375, -11.290283203125, -10.6220703125, -9.953857421875, -9.28564453125, -8.617431640625, -7.94921875, -7.281005859375, -6.61279296875, -5.944580078125, -5.2763671875, -4.608154296875, -3.93994140625, -3.271728515625, -2.603515625, -1.935302734375, -1.26708984375, -0.598876953125, 0.0693359375, 0.737548828125, 1.40576171875, 2.073974609375, 2.7421875, 3.410400390625, 4.07861328125, 4.746826171875, 5.4150390625, 6.083251953125, 6.75146484375, 7.419677734375, 8.087890625, 8.756103515625, 9.42431640625, 10.092529296875, 10.7607421875, 11.428955078125, 12.09716796875, 12.765380859375, 13.43359375, 14.101806640625, 14.77001953125, 15.438232421875, 16.1064453125, 16.774658203125, 17.44287109375, 18.111083984375, 18.779296875, 19.447509765625, 20.11572265625, 20.783935546875, 21.4521484375, 22.120361328125, 22.78857421875, 23.456787109375, 24.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 7.0, 15.0, 15.0, 35.0, 45.0, 60.0, 114.0, 210.0, 432.0, 1112.0, 3151.0, 11685.0, 72234.0, 2225509.0, 1798473.0, 64908.0, 11227.0, 3010.0, 1031.0, 435.0, 211.0, 123.0, 67.0, 62.0, 37.0, 16.0, 21.0, 11.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.8125, -33.3603515625, -31.908203125, -30.4560546875, -29.00390625, -27.5517578125, -26.099609375, -24.6474609375, -23.1953125, -21.7431640625, -20.291015625, -18.8388671875, -17.38671875, -15.9345703125, -14.482421875, -13.0302734375, -11.578125, -10.1259765625, -8.673828125, -7.2216796875, -5.76953125, -4.3173828125, -2.865234375, -1.4130859375, 0.0390625, 1.4912109375, 2.943359375, 4.3955078125, 5.84765625, 7.2998046875, 8.751953125, 10.2041015625, 11.65625, 13.1083984375, 14.560546875, 16.0126953125, 17.46484375, 18.9169921875, 20.369140625, 21.8212890625, 23.2734375, 24.7255859375, 26.177734375, 27.6298828125, 29.08203125, 30.5341796875, 31.986328125, 33.4384765625, 34.890625, 36.3427734375, 37.794921875, 39.2470703125, 40.69921875, 42.1513671875, 43.603515625, 45.0556640625, 46.5078125, 47.9599609375, 49.412109375, 50.8642578125, 52.31640625, 53.7685546875, 55.220703125, 56.6728515625, 58.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 15.0, 19.0, 24.0, 30.0, 47.0, 85.0, 134.0, 210.0, 393.0, 632.0, 790.0, 639.0, 434.0, 210.0, 140.0, 73.0, 48.0, 26.0, 23.0, 30.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.5625, -29.32080078125, -28.0791015625, -26.83740234375, -25.595703125, -24.35400390625, -23.1123046875, -21.87060546875, -20.62890625, -19.38720703125, -18.1455078125, -16.90380859375, -15.662109375, -14.42041015625, -13.1787109375, -11.93701171875, -10.6953125, -9.45361328125, -8.2119140625, -6.97021484375, -5.728515625, -4.48681640625, -3.2451171875, -2.00341796875, -0.76171875, 0.47998046875, 1.7216796875, 2.96337890625, 4.205078125, 5.44677734375, 6.6884765625, 7.93017578125, 9.171875, 10.41357421875, 11.6552734375, 12.89697265625, 14.138671875, 15.38037109375, 16.6220703125, 17.86376953125, 19.10546875, 20.34716796875, 21.5888671875, 22.83056640625, 24.072265625, 25.31396484375, 26.5556640625, 27.79736328125, 29.0390625, 30.28076171875, 31.5224609375, 32.76416015625, 34.005859375, 35.24755859375, 36.4892578125, 37.73095703125, 38.97265625, 40.21435546875, 41.4560546875, 42.69775390625, 43.939453125, 45.18115234375, 46.4228515625, 47.66455078125, 48.90625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 14.0, 37.0, 157.0, 356.0, 287.0, 99.0, 24.0, 13.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-724.652587890625, -702.5910034179688, -680.5293579101562, -658.4677734375, -636.4061279296875, -614.3445434570312, -592.282958984375, -570.2213134765625, -548.1597290039062, -526.09814453125, -504.0364990234375, -481.97491455078125, -459.9132995605469, -437.8516845703125, -415.7900695800781, -393.72845458984375, -371.6668395996094, -349.605224609375, -327.5436096191406, -305.48199462890625, -283.42041015625, -261.3587951660156, -239.29718017578125, -217.23558044433594, -195.17396545410156, -173.1123504638672, -151.05075073242188, -128.9891357421875, -106.92752838134766, -84.86592102050781, -62.80430603027344, -40.742706298828125, -18.68109130859375, 3.3805179595947266, 25.442127227783203, 47.50373840332031, 69.56534576416016, 91.626953125, 113.68856811523438, 135.7501678466797, 157.81178283691406, 179.87339782714844, 201.93499755859375, 223.99661254882812, 246.0582275390625, 268.11981201171875, 290.18145751953125, 312.2430419921875, 334.3046569824219, 356.36627197265625, 378.4278869628906, 400.489501953125, 422.55108642578125, 444.6127014160156, 466.67431640625, 488.73590087890625, 510.79754638671875, 532.859130859375, 554.9207763671875, 576.9823608398438, 599.0440063476562, 621.1055908203125, 643.167236328125, 665.2288208007812, 687.2904052734375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 8.0, 16.0, 13.0, 19.0, 17.0, 13.0, 27.0, 38.0, 35.0, 30.0, 35.0, 43.0, 43.0, 41.0, 55.0, 50.0, 45.0, 58.0, 48.0, 42.0, 41.0, 45.0, 24.0, 24.0, 30.0, 23.0, 15.0, 12.0, 21.0, 13.0, 15.0, 9.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.69329833984375, -141.41461181640625, -136.13592529296875, -130.85723876953125, -125.57854461669922, -120.29985809326172, -115.02116394042969, -109.74247741699219, -104.46379089355469, -99.18510437011719, -93.90641784667969, -88.62772369384766, -83.34903717041016, -78.07035064697266, -72.79165649414062, -67.51296997070312, -62.234283447265625, -56.955596923828125, -51.67690658569336, -46.398216247558594, -41.119529724121094, -35.840843200683594, -30.562152862548828, -25.283462524414062, -20.004776000976562, -14.72608757019043, -9.447399139404297, -4.168710708618164, 1.1099777221679688, 6.388666152954102, 11.667354583740234, 16.946044921875, 22.2247314453125, 27.503419876098633, 32.782108306884766, 38.06079864501953, 43.33948516845703, 48.61817169189453, 53.8968620300293, 59.17555236816406, 64.45423889160156, 69.73292541503906, 75.01161193847656, 80.2903060913086, 85.5689926147461, 90.8476791381836, 96.12637329101562, 101.40505981445312, 106.68374633789062, 111.96243286132812, 117.24111938476562, 122.51981353759766, 127.79850006103516, 133.0771942138672, 138.3558807373047, 143.6345672607422, 148.9132537841797, 154.1919403076172, 159.4706268310547, 164.7493133544922, 170.02801513671875, 175.30670166015625, 180.58538818359375, 185.86407470703125, 191.14276123046875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 9.0, 22.0, 28.0, 45.0, 49.0, 98.0, 129.0, 223.0, 418.0, 755.0, 1435.0, 3012.0, 6507.0, 15646.0, 42884.0, 126853.0, 319138.0, 325674.0, 131781.0, 44615.0, 16171.0, 6740.0, 3004.0, 1442.0, 791.0, 415.0, 226.0, 141.0, 81.0, 61.0, 52.0, 25.0, 23.0, 9.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.375, -23.56298828125, -22.7509765625, -21.93896484375, -21.126953125, -20.31494140625, -19.5029296875, -18.69091796875, -17.87890625, -17.06689453125, -16.2548828125, -15.44287109375, -14.630859375, -13.81884765625, -13.0068359375, -12.19482421875, -11.3828125, -10.57080078125, -9.7587890625, -8.94677734375, -8.134765625, -7.32275390625, -6.5107421875, -5.69873046875, -4.88671875, -4.07470703125, -3.2626953125, -2.45068359375, -1.638671875, -0.82666015625, -0.0146484375, 0.79736328125, 1.609375, 2.42138671875, 3.2333984375, 4.04541015625, 4.857421875, 5.66943359375, 6.4814453125, 7.29345703125, 8.10546875, 8.91748046875, 9.7294921875, 10.54150390625, 11.353515625, 12.16552734375, 12.9775390625, 13.78955078125, 14.6015625, 15.41357421875, 16.2255859375, 17.03759765625, 17.849609375, 18.66162109375, 19.4736328125, 20.28564453125, 21.09765625, 21.90966796875, 22.7216796875, 23.53369140625, 24.345703125, 25.15771484375, 25.9697265625, 26.78173828125, 27.59375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 7.0, 12.0, 12.0, 15.0, 17.0, 18.0, 30.0, 29.0, 35.0, 41.0, 60.0, 59.0, 54.0, 67.0, 47.0, 51.0, 46.0, 56.0, 42.0, 42.0, 44.0, 33.0, 33.0, 27.0, 28.0, 21.0, 13.0, 17.0, 6.0, 7.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.109375, -16.468994140625, -15.82861328125, -15.188232421875, -14.5478515625, -13.907470703125, -13.26708984375, -12.626708984375, -11.986328125, -11.345947265625, -10.70556640625, -10.065185546875, -9.4248046875, -8.784423828125, -8.14404296875, -7.503662109375, -6.86328125, -6.222900390625, -5.58251953125, -4.942138671875, -4.3017578125, -3.661376953125, -3.02099609375, -2.380615234375, -1.740234375, -1.099853515625, -0.45947265625, 0.180908203125, 0.8212890625, 1.461669921875, 2.10205078125, 2.742431640625, 3.3828125, 4.023193359375, 4.66357421875, 5.303955078125, 5.9443359375, 6.584716796875, 7.22509765625, 7.865478515625, 8.505859375, 9.146240234375, 9.78662109375, 10.427001953125, 11.0673828125, 11.707763671875, 12.34814453125, 12.988525390625, 13.62890625, 14.269287109375, 14.90966796875, 15.550048828125, 16.1904296875, 16.830810546875, 17.47119140625, 18.111572265625, 18.751953125, 19.392333984375, 20.03271484375, 20.673095703125, 21.3134765625, 21.953857421875, 22.59423828125, 23.234619140625, 23.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 9.0, 16.0, 25.0, 39.0, 51.0, 81.0, 146.0, 308.0, 714.0, 2034.0, 7183.0, 37290.0, 298868.0, 621885.0, 64353.0, 10954.0, 2798.0, 925.0, 408.0, 184.0, 115.0, 59.0, 31.0, 19.0, 15.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0625, -48.4013671875, -46.740234375, -45.0791015625, -43.41796875, -41.7568359375, -40.095703125, -38.4345703125, -36.7734375, -35.1123046875, -33.451171875, -31.7900390625, -30.12890625, -28.4677734375, -26.806640625, -25.1455078125, -23.484375, -21.8232421875, -20.162109375, -18.5009765625, -16.83984375, -15.1787109375, -13.517578125, -11.8564453125, -10.1953125, -8.5341796875, -6.873046875, -5.2119140625, -3.55078125, -1.8896484375, -0.228515625, 1.4326171875, 3.09375, 4.7548828125, 6.416015625, 8.0771484375, 9.73828125, 11.3994140625, 13.060546875, 14.7216796875, 16.3828125, 18.0439453125, 19.705078125, 21.3662109375, 23.02734375, 24.6884765625, 26.349609375, 28.0107421875, 29.671875, 31.3330078125, 32.994140625, 34.6552734375, 36.31640625, 37.9775390625, 39.638671875, 41.2998046875, 42.9609375, 44.6220703125, 46.283203125, 47.9443359375, 49.60546875, 51.2666015625, 52.927734375, 54.5888671875, 56.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 6.0, 9.0, 15.0, 24.0, 17.0, 18.0, 24.0, 31.0, 26.0, 32.0, 44.0, 47.0, 44.0, 48.0, 50.0, 47.0, 42.0, 36.0, 50.0, 42.0, 50.0, 45.0, 39.0, 35.0, 29.0, 28.0, 19.0, 16.0, 13.0, 12.0, 12.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-73.125, -71.17919921875, -69.2333984375, -67.28759765625, -65.341796875, -63.39599609375, -61.4501953125, -59.50439453125, -57.55859375, -55.61279296875, -53.6669921875, -51.72119140625, -49.775390625, -47.82958984375, -45.8837890625, -43.93798828125, -41.9921875, -40.04638671875, -38.1005859375, -36.15478515625, -34.208984375, -32.26318359375, -30.3173828125, -28.37158203125, -26.42578125, -24.47998046875, -22.5341796875, -20.58837890625, -18.642578125, -16.69677734375, -14.7509765625, -12.80517578125, -10.859375, -8.91357421875, -6.9677734375, -5.02197265625, -3.076171875, -1.13037109375, 0.8154296875, 2.76123046875, 4.70703125, 6.65283203125, 8.5986328125, 10.54443359375, 12.490234375, 14.43603515625, 16.3818359375, 18.32763671875, 20.2734375, 22.21923828125, 24.1650390625, 26.11083984375, 28.056640625, 30.00244140625, 31.9482421875, 33.89404296875, 35.83984375, 37.78564453125, 39.7314453125, 41.67724609375, 43.623046875, 45.56884765625, 47.5146484375, 49.46044921875, 51.40625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 8.0, 9.0, 11.0, 25.0, 39.0, 58.0, 84.0, 145.0, 283.0, 582.0, 1147.0, 3358.0, 11381.0, 50913.0, 287257.0, 591155.0, 78452.0, 16296.0, 4434.0, 1496.0, 646.0, 283.0, 152.0, 105.0, 61.0, 39.0, 34.0, 26.0, 15.0, 10.0, 7.0, 7.0, 4.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-10.796875, -10.498046875, -10.19921875, -9.900390625, -9.6015625, -9.302734375, -9.00390625, -8.705078125, -8.40625, -8.107421875, -7.80859375, -7.509765625, -7.2109375, -6.912109375, -6.61328125, -6.314453125, -6.015625, -5.716796875, -5.41796875, -5.119140625, -4.8203125, -4.521484375, -4.22265625, -3.923828125, -3.625, -3.326171875, -3.02734375, -2.728515625, -2.4296875, -2.130859375, -1.83203125, -1.533203125, -1.234375, -0.935546875, -0.63671875, -0.337890625, -0.0390625, 0.259765625, 0.55859375, 0.857421875, 1.15625, 1.455078125, 1.75390625, 2.052734375, 2.3515625, 2.650390625, 2.94921875, 3.248046875, 3.546875, 3.845703125, 4.14453125, 4.443359375, 4.7421875, 5.041015625, 5.33984375, 5.638671875, 5.9375, 6.236328125, 6.53515625, 6.833984375, 7.1328125, 7.431640625, 7.73046875, 8.029296875, 8.328125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 12.0, 7.0, 10.0, 9.0, 29.0, 35.0, 50.0, 65.0, 80.0, 107.0, 135.0, 115.0, 103.0, 60.0, 47.0, 38.0, 18.0, 22.0, 14.0, 3.0, 9.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023784637451171875, -0.0023027658462524414, -0.0022270679473876953, -0.0021513700485229492, -0.002075672149658203, -0.001999974250793457, -0.001924276351928711, -0.0018485784530639648, -0.0017728805541992188, -0.0016971826553344727, -0.0016214847564697266, -0.0015457868576049805, -0.0014700889587402344, -0.0013943910598754883, -0.0013186931610107422, -0.001242995262145996, -0.00116729736328125, -0.001091599464416504, -0.0010159015655517578, -0.0009402036666870117, -0.0008645057678222656, -0.0007888078689575195, -0.0007131099700927734, -0.0006374120712280273, -0.0005617141723632812, -0.00048601627349853516, -0.00041031837463378906, -0.00033462047576904297, -0.0002589225769042969, -0.00018322467803955078, -0.00010752677917480469, -3.1828880310058594e-05, 4.38690185546875e-05, 0.0001195669174194336, 0.0001952648162841797, 0.0002709627151489258, 0.0003466606140136719, 0.00042235851287841797, 0.0004980564117431641, 0.0005737543106079102, 0.0006494522094726562, 0.0007251501083374023, 0.0008008480072021484, 0.0008765459060668945, 0.0009522438049316406, 0.0010279417037963867, 0.0011036396026611328, 0.001179337501525879, 0.001255035400390625, 0.001330733299255371, 0.0014064311981201172, 0.0014821290969848633, 0.0015578269958496094, 0.0016335248947143555, 0.0017092227935791016, 0.0017849206924438477, 0.0018606185913085938, 0.0019363164901733398, 0.002012014389038086, 0.002087712287902832, 0.002163410186767578, 0.0022391080856323242, 0.0023148059844970703, 0.0023905038833618164, 0.0024662017822265625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 8.0, 6.0, 10.0, 10.0, 11.0, 19.0, 32.0, 39.0, 53.0, 94.0, 160.0, 341.0, 707.0, 1543.0, 4042.0, 13263.0, 61250.0, 481474.0, 405758.0, 59754.0, 12928.0, 4072.0, 1516.0, 671.0, 323.0, 185.0, 103.0, 59.0, 38.0, 26.0, 18.0, 12.0, 11.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.919921875, -7.58984375, -7.259765625, -6.9296875, -6.599609375, -6.26953125, -5.939453125, -5.609375, -5.279296875, -4.94921875, -4.619140625, -4.2890625, -3.958984375, -3.62890625, -3.298828125, -2.96875, -2.638671875, -2.30859375, -1.978515625, -1.6484375, -1.318359375, -0.98828125, -0.658203125, -0.328125, 0.001953125, 0.33203125, 0.662109375, 0.9921875, 1.322265625, 1.65234375, 1.982421875, 2.3125, 2.642578125, 2.97265625, 3.302734375, 3.6328125, 3.962890625, 4.29296875, 4.623046875, 4.953125, 5.283203125, 5.61328125, 5.943359375, 6.2734375, 6.603515625, 6.93359375, 7.263671875, 7.59375, 7.923828125, 8.25390625, 8.583984375, 8.9140625, 9.244140625, 9.57421875, 9.904296875, 10.234375, 10.564453125, 10.89453125, 11.224609375, 11.5546875, 11.884765625, 12.21484375, 12.544921875, 12.875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 7.0, 11.0, 11.0, 6.0, 17.0, 21.0, 27.0, 27.0, 43.0, 46.0, 52.0, 55.0, 70.0, 69.0, 68.0, 69.0, 61.0, 66.0, 56.0, 38.0, 23.0, 30.0, 16.0, 19.0, 10.0, 14.0, 10.0, 11.0, 4.0, 4.0, 6.0, 8.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.078125, -6.827392578125, -6.57666015625, -6.325927734375, -6.0751953125, -5.824462890625, -5.57373046875, -5.322998046875, -5.072265625, -4.821533203125, -4.57080078125, -4.320068359375, -4.0693359375, -3.818603515625, -3.56787109375, -3.317138671875, -3.06640625, -2.815673828125, -2.56494140625, -2.314208984375, -2.0634765625, -1.812744140625, -1.56201171875, -1.311279296875, -1.060546875, -0.809814453125, -0.55908203125, -0.308349609375, -0.0576171875, 0.193115234375, 0.44384765625, 0.694580078125, 0.9453125, 1.196044921875, 1.44677734375, 1.697509765625, 1.9482421875, 2.198974609375, 2.44970703125, 2.700439453125, 2.951171875, 3.201904296875, 3.45263671875, 3.703369140625, 3.9541015625, 4.204833984375, 4.45556640625, 4.706298828125, 4.95703125, 5.207763671875, 5.45849609375, 5.709228515625, 5.9599609375, 6.210693359375, 6.46142578125, 6.712158203125, 6.962890625, 7.213623046875, 7.46435546875, 7.715087890625, 7.9658203125, 8.216552734375, 8.46728515625, 8.718017578125, 8.96875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 14.0, 17.0, 39.0, 89.0, 168.0, 310.0, 181.0, 98.0, 33.0, 27.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-606.7669677734375, -594.0113525390625, -581.2557373046875, -568.5000610351562, -555.7444458007812, -542.9888305664062, -530.2332153320312, -517.4776000976562, -504.7219543457031, -491.9663391113281, -479.210693359375, -466.455078125, -453.699462890625, -440.9438171386719, -428.1882019042969, -415.43255615234375, -402.67694091796875, -389.92132568359375, -377.1656799316406, -364.4100646972656, -351.6544189453125, -338.8988037109375, -326.1431884765625, -313.3875732421875, -300.6319274902344, -287.8763122558594, -275.12066650390625, -262.36505126953125, -249.6094207763672, -236.85379028320312, -224.09817504882812, -211.34254455566406, -198.58688354492188, -185.8312530517578, -173.07562255859375, -160.32000732421875, -147.5643768310547, -134.80874633789062, -122.0531234741211, -109.29750061035156, -96.5418701171875, -83.78623962402344, -71.0306167602539, -58.27499008178711, -45.51936340332031, -32.763736724853516, -20.00811004638672, -7.2524871826171875, 5.503143310546875, 18.258769989013672, 31.01439666748047, 43.770023345947266, 56.52565002441406, 69.28128051757812, 82.03690338134766, 94.79252624511719, 107.54815673828125, 120.30378723144531, 133.05941772460938, 145.81503295898438, 158.57066345214844, 171.3262939453125, 184.0819091796875, 196.83753967285156, 209.59317016601562]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 9.0, 8.0, 9.0, 11.0, 11.0, 11.0, 17.0, 24.0, 17.0, 29.0, 28.0, 35.0, 33.0, 33.0, 46.0, 49.0, 79.0, 86.0, 84.0, 41.0, 44.0, 32.0, 31.0, 33.0, 22.0, 29.0, 33.0, 13.0, 13.0, 17.0, 12.0, 6.0, 11.0, 9.0, 8.0, 9.0, 1.0, 5.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.49673461914062, -212.74285888671875, -204.9889678955078, -197.23509216308594, -189.48121643066406, -181.72732543945312, -173.97344970703125, -166.21957397460938, -158.46568298339844, -150.71180725097656, -142.95791625976562, -135.20404052734375, -127.45015716552734, -119.69627380371094, -111.94239807128906, -104.18851470947266, -96.43463897705078, -88.68075561523438, -80.9268798828125, -73.1729965209961, -65.41911315917969, -57.66523361206055, -49.911354064941406, -42.157470703125, -34.40359115600586, -26.649709701538086, -18.895828247070312, -11.141948699951172, -3.3880672454833984, 4.365814208984375, 12.119693756103516, 19.873577117919922, 27.627456665039062, 35.3813362121582, 43.13521957397461, 50.88909912109375, 58.642982482910156, 66.39686584472656, 74.15074157714844, 81.90462493896484, 89.65850830078125, 97.41239166259766, 105.16626739501953, 112.92015075683594, 120.67403411865234, 128.42791748046875, 136.18179321289062, 143.9356689453125, 151.68954467773438, 159.44342041015625, 167.1973114013672, 174.95118713378906, 182.70506286621094, 190.45895385742188, 198.21282958984375, 205.96670532226562, 213.72059631347656, 221.47447204589844, 229.22836303710938, 236.98223876953125, 244.73611450195312, 252.49000549316406, 260.243896484375, 267.9977722167969, 275.75164794921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 14.0, 14.0, 25.0, 33.0, 44.0, 88.0, 137.0, 222.0, 362.0, 639.0, 1305.0, 2677.0, 5859.0, 14531.0, 45595.0, 197626.0, 991298.0, 2075615.0, 668873.0, 136142.0, 33735.0, 10826.0, 4293.0, 1928.0, 978.0, 579.0, 303.0, 172.0, 109.0, 76.0, 42.0, 33.0, 22.0, 13.0, 13.0, 14.0, 8.0, 1.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.640625, -15.14208984375, -14.6435546875, -14.14501953125, -13.646484375, -13.14794921875, -12.6494140625, -12.15087890625, -11.65234375, -11.15380859375, -10.6552734375, -10.15673828125, -9.658203125, -9.15966796875, -8.6611328125, -8.16259765625, -7.6640625, -7.16552734375, -6.6669921875, -6.16845703125, -5.669921875, -5.17138671875, -4.6728515625, -4.17431640625, -3.67578125, -3.17724609375, -2.6787109375, -2.18017578125, -1.681640625, -1.18310546875, -0.6845703125, -0.18603515625, 0.3125, 0.81103515625, 1.3095703125, 1.80810546875, 2.306640625, 2.80517578125, 3.3037109375, 3.80224609375, 4.30078125, 4.79931640625, 5.2978515625, 5.79638671875, 6.294921875, 6.79345703125, 7.2919921875, 7.79052734375, 8.2890625, 8.78759765625, 9.2861328125, 9.78466796875, 10.283203125, 10.78173828125, 11.2802734375, 11.77880859375, 12.27734375, 12.77587890625, 13.2744140625, 13.77294921875, 14.271484375, 14.77001953125, 15.2685546875, 15.76708984375, 16.265625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 1.0, 6.0, 2.0, 7.0, 6.0, 11.0, 13.0, 18.0, 16.0, 25.0, 32.0, 30.0, 21.0, 37.0, 43.0, 51.0, 55.0, 56.0, 50.0, 54.0, 46.0, 43.0, 67.0, 35.0, 43.0, 41.0, 41.0, 34.0, 23.0, 20.0, 20.0, 14.0, 11.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.890625, -15.289306640625, -14.68798828125, -14.086669921875, -13.4853515625, -12.884033203125, -12.28271484375, -11.681396484375, -11.080078125, -10.478759765625, -9.87744140625, -9.276123046875, -8.6748046875, -8.073486328125, -7.47216796875, -6.870849609375, -6.26953125, -5.668212890625, -5.06689453125, -4.465576171875, -3.8642578125, -3.262939453125, -2.66162109375, -2.060302734375, -1.458984375, -0.857666015625, -0.25634765625, 0.344970703125, 0.9462890625, 1.547607421875, 2.14892578125, 2.750244140625, 3.3515625, 3.952880859375, 4.55419921875, 5.155517578125, 5.7568359375, 6.358154296875, 6.95947265625, 7.560791015625, 8.162109375, 8.763427734375, 9.36474609375, 9.966064453125, 10.5673828125, 11.168701171875, 11.77001953125, 12.371337890625, 12.97265625, 13.573974609375, 14.17529296875, 14.776611328125, 15.3779296875, 15.979248046875, 16.58056640625, 17.181884765625, 17.783203125, 18.384521484375, 18.98583984375, 19.587158203125, 20.1884765625, 20.789794921875, 21.39111328125, 21.992431640625, 22.59375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 19.0, 19.0, 38.0, 61.0, 101.0, 137.0, 398.0, 1271.0, 6478.0, 54622.0, 2897339.0, 1196139.0, 31236.0, 4521.0, 1044.0, 373.0, 178.0, 105.0, 71.0, 36.0, 20.0, 18.0, 10.0, 11.0, 4.0, 5.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.78125, -52.36181640625, -50.9423828125, -49.52294921875, -48.103515625, -46.68408203125, -45.2646484375, -43.84521484375, -42.42578125, -41.00634765625, -39.5869140625, -38.16748046875, -36.748046875, -35.32861328125, -33.9091796875, -32.48974609375, -31.0703125, -29.65087890625, -28.2314453125, -26.81201171875, -25.392578125, -23.97314453125, -22.5537109375, -21.13427734375, -19.71484375, -18.29541015625, -16.8759765625, -15.45654296875, -14.037109375, -12.61767578125, -11.1982421875, -9.77880859375, -8.359375, -6.93994140625, -5.5205078125, -4.10107421875, -2.681640625, -1.26220703125, 0.1572265625, 1.57666015625, 2.99609375, 4.41552734375, 5.8349609375, 7.25439453125, 8.673828125, 10.09326171875, 11.5126953125, 12.93212890625, 14.3515625, 15.77099609375, 17.1904296875, 18.60986328125, 20.029296875, 21.44873046875, 22.8681640625, 24.28759765625, 25.70703125, 27.12646484375, 28.5458984375, 29.96533203125, 31.384765625, 32.80419921875, 34.2236328125, 35.64306640625, 37.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 14.0, 10.0, 20.0, 34.0, 51.0, 70.0, 184.0, 267.0, 462.0, 757.0, 749.0, 600.0, 363.0, 184.0, 117.0, 44.0, 44.0, 26.0, 20.0, 8.0, 9.0, 6.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.305908203125, -18.18994140625, -17.073974609375, -15.9580078125, -14.842041015625, -13.72607421875, -12.610107421875, -11.494140625, -10.378173828125, -9.26220703125, -8.146240234375, -7.0302734375, -5.914306640625, -4.79833984375, -3.682373046875, -2.56640625, -1.450439453125, -0.33447265625, 0.781494140625, 1.8974609375, 3.013427734375, 4.12939453125, 5.245361328125, 6.361328125, 7.477294921875, 8.59326171875, 9.709228515625, 10.8251953125, 11.941162109375, 13.05712890625, 14.173095703125, 15.2890625, 16.405029296875, 17.52099609375, 18.636962890625, 19.7529296875, 20.868896484375, 21.98486328125, 23.100830078125, 24.216796875, 25.332763671875, 26.44873046875, 27.564697265625, 28.6806640625, 29.796630859375, 30.91259765625, 32.028564453125, 33.14453125, 34.260498046875, 35.37646484375, 36.492431640625, 37.6083984375, 38.724365234375, 39.84033203125, 40.956298828125, 42.072265625, 43.188232421875, 44.30419921875, 45.420166015625, 46.5361328125, 47.652099609375, 48.76806640625, 49.884033203125, 51.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 40.0, 89.0, 195.0, 266.0, 189.0, 112.0, 58.0, 20.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-226.63174438476562, -215.13035583496094, -203.62896728515625, -192.12759399414062, -180.62620544433594, -169.12481689453125, -157.62344360351562, -146.12205505371094, -134.62066650390625, -123.11927795410156, -111.6178970336914, -100.11651611328125, -88.61512756347656, -77.11373901367188, -65.61235809326172, -54.11097717285156, -42.609588623046875, -31.108203887939453, -19.60681915283203, -8.10543441772461, 3.3959503173828125, 14.897335052490234, 26.398719787597656, 37.90010070800781, 49.4014892578125, 60.90287399291992, 72.40425872802734, 83.9056396484375, 95.40702819824219, 106.90841674804688, 118.40979766845703, 129.9111785888672, 141.41253662109375, 152.91392517089844, 164.41531372070312, 175.91668701171875, 187.41807556152344, 198.91946411132812, 210.42083740234375, 221.92222595214844, 233.42361450195312, 244.9250030517578, 256.4263916015625, 267.9277648925781, 279.42913818359375, 290.9305419921875, 302.4319152832031, 313.93328857421875, 325.4346923828125, 336.9360656738281, 348.4374694824219, 359.9388427734375, 371.44024658203125, 382.9416198730469, 394.4429931640625, 405.94439697265625, 417.4457702636719, 428.9471435546875, 440.44854736328125, 451.9499206542969, 463.4512939453125, 474.95269775390625, 486.4540710449219, 497.9554443359375, 509.45684814453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 12.0, 15.0, 14.0, 16.0, 16.0, 24.0, 21.0, 35.0, 36.0, 31.0, 58.0, 43.0, 69.0, 55.0, 61.0, 73.0, 61.0, 56.0, 44.0, 37.0, 42.0, 42.0, 24.0, 24.0, 22.0, 15.0, 11.0, 7.0, 7.0, 5.0, 4.0, 10.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.08407592773438, -167.24609375, -162.4081268310547, -157.57015991210938, -152.732177734375, -147.89419555664062, -143.0562286376953, -138.21826171875, -133.38027954101562, -128.54229736328125, -123.70433044433594, -118.8663558959961, -114.02838134765625, -109.1904067993164, -104.35243225097656, -99.51445770263672, -94.67648315429688, -89.83850860595703, -85.00053405761719, -80.16255950927734, -75.3245849609375, -70.48661041259766, -65.64863586425781, -60.81066131591797, -55.972686767578125, -51.13471221923828, -46.29673767089844, -41.458763122558594, -36.62078857421875, -31.782814025878906, -26.944839477539062, -22.10686492919922, -17.268905639648438, -12.430931091308594, -7.59295654296875, -2.7549819946289062, 2.0829925537109375, 6.920967102050781, 11.758941650390625, 16.59691619873047, 21.434890747070312, 26.272865295410156, 31.11083984375, 35.948814392089844, 40.78678894042969, 45.62476348876953, 50.462738037109375, 55.30071258544922, 60.13868713378906, 64.9766616821289, 69.81463623046875, 74.6526107788086, 79.49058532714844, 84.32855987548828, 89.16653442382812, 94.00450897216797, 98.84248352050781, 103.68045806884766, 108.5184326171875, 113.35640716552734, 118.19438171386719, 123.03235626220703, 127.87033081054688, 132.70831298828125, 137.54627990722656]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 17.0, 15.0, 20.0, 30.0, 43.0, 73.0, 121.0, 197.0, 361.0, 598.0, 1092.0, 2155.0, 4328.0, 9998.0, 23598.0, 60687.0, 164255.0, 345789.0, 265438.0, 102615.0, 38464.0, 15242.0, 6796.0, 3018.0, 1555.0, 811.0, 490.0, 266.0, 164.0, 115.0, 68.0, 49.0, 24.0, 23.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375, -18.701416015625, -18.02783203125, -17.354248046875, -16.6806640625, -16.007080078125, -15.33349609375, -14.659912109375, -13.986328125, -13.312744140625, -12.63916015625, -11.965576171875, -11.2919921875, -10.618408203125, -9.94482421875, -9.271240234375, -8.59765625, -7.924072265625, -7.25048828125, -6.576904296875, -5.9033203125, -5.229736328125, -4.55615234375, -3.882568359375, -3.208984375, -2.535400390625, -1.86181640625, -1.188232421875, -0.5146484375, 0.158935546875, 0.83251953125, 1.506103515625, 2.1796875, 2.853271484375, 3.52685546875, 4.200439453125, 4.8740234375, 5.547607421875, 6.22119140625, 6.894775390625, 7.568359375, 8.241943359375, 8.91552734375, 9.589111328125, 10.2626953125, 10.936279296875, 11.60986328125, 12.283447265625, 12.95703125, 13.630615234375, 14.30419921875, 14.977783203125, 15.6513671875, 16.324951171875, 16.99853515625, 17.672119140625, 18.345703125, 19.019287109375, 19.69287109375, 20.366455078125, 21.0400390625, 21.713623046875, 22.38720703125, 23.060791015625, 23.734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 4.0, 14.0, 8.0, 10.0, 24.0, 20.0, 30.0, 26.0, 32.0, 29.0, 37.0, 52.0, 60.0, 45.0, 55.0, 58.0, 43.0, 57.0, 57.0, 50.0, 41.0, 36.0, 40.0, 31.0, 20.0, 24.0, 24.0, 20.0, 11.0, 7.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.42822265625, -14.8251953125, -14.22216796875, -13.619140625, -13.01611328125, -12.4130859375, -11.81005859375, -11.20703125, -10.60400390625, -10.0009765625, -9.39794921875, -8.794921875, -8.19189453125, -7.5888671875, -6.98583984375, -6.3828125, -5.77978515625, -5.1767578125, -4.57373046875, -3.970703125, -3.36767578125, -2.7646484375, -2.16162109375, -1.55859375, -0.95556640625, -0.3525390625, 0.25048828125, 0.853515625, 1.45654296875, 2.0595703125, 2.66259765625, 3.265625, 3.86865234375, 4.4716796875, 5.07470703125, 5.677734375, 6.28076171875, 6.8837890625, 7.48681640625, 8.08984375, 8.69287109375, 9.2958984375, 9.89892578125, 10.501953125, 11.10498046875, 11.7080078125, 12.31103515625, 12.9140625, 13.51708984375, 14.1201171875, 14.72314453125, 15.326171875, 15.92919921875, 16.5322265625, 17.13525390625, 17.73828125, 18.34130859375, 18.9443359375, 19.54736328125, 20.150390625, 20.75341796875, 21.3564453125, 21.95947265625, 22.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 17.0, 12.0, 14.0, 17.0, 31.0, 39.0, 40.0, 73.0, 81.0, 135.0, 175.0, 251.0, 363.0, 544.0, 949.0, 1759.0, 4064.0, 11319.0, 40445.0, 178185.0, 626778.0, 135235.0, 31314.0, 9227.0, 3369.0, 1569.0, 804.0, 561.0, 339.0, 226.0, 145.0, 122.0, 83.0, 61.0, 52.0, 35.0, 26.0, 24.0, 14.0, 11.0, 11.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.921875, -30.905517578125, -29.88916015625, -28.872802734375, -27.8564453125, -26.840087890625, -25.82373046875, -24.807373046875, -23.791015625, -22.774658203125, -21.75830078125, -20.741943359375, -19.7255859375, -18.709228515625, -17.69287109375, -16.676513671875, -15.66015625, -14.643798828125, -13.62744140625, -12.611083984375, -11.5947265625, -10.578369140625, -9.56201171875, -8.545654296875, -7.529296875, -6.512939453125, -5.49658203125, -4.480224609375, -3.4638671875, -2.447509765625, -1.43115234375, -0.414794921875, 0.6015625, 1.617919921875, 2.63427734375, 3.650634765625, 4.6669921875, 5.683349609375, 6.69970703125, 7.716064453125, 8.732421875, 9.748779296875, 10.76513671875, 11.781494140625, 12.7978515625, 13.814208984375, 14.83056640625, 15.846923828125, 16.86328125, 17.879638671875, 18.89599609375, 19.912353515625, 20.9287109375, 21.945068359375, 22.96142578125, 23.977783203125, 24.994140625, 26.010498046875, 27.02685546875, 28.043212890625, 29.0595703125, 30.075927734375, 31.09228515625, 32.108642578125, 33.125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 7.0, 16.0, 16.0, 14.0, 15.0, 30.0, 29.0, 37.0, 31.0, 30.0, 41.0, 36.0, 49.0, 50.0, 64.0, 49.0, 60.0, 33.0, 45.0, 32.0, 41.0, 29.0, 31.0, 31.0, 23.0, 30.0, 24.0, 19.0, 14.0, 13.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.65625, -48.87646484375, -47.0966796875, -45.31689453125, -43.537109375, -41.75732421875, -39.9775390625, -38.19775390625, -36.41796875, -34.63818359375, -32.8583984375, -31.07861328125, -29.298828125, -27.51904296875, -25.7392578125, -23.95947265625, -22.1796875, -20.39990234375, -18.6201171875, -16.84033203125, -15.060546875, -13.28076171875, -11.5009765625, -9.72119140625, -7.94140625, -6.16162109375, -4.3818359375, -2.60205078125, -0.822265625, 0.95751953125, 2.7373046875, 4.51708984375, 6.296875, 8.07666015625, 9.8564453125, 11.63623046875, 13.416015625, 15.19580078125, 16.9755859375, 18.75537109375, 20.53515625, 22.31494140625, 24.0947265625, 25.87451171875, 27.654296875, 29.43408203125, 31.2138671875, 32.99365234375, 34.7734375, 36.55322265625, 38.3330078125, 40.11279296875, 41.892578125, 43.67236328125, 45.4521484375, 47.23193359375, 49.01171875, 50.79150390625, 52.5712890625, 54.35107421875, 56.130859375, 57.91064453125, 59.6904296875, 61.47021484375, 63.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 2.0, 13.0, 15.0, 10.0, 26.0, 43.0, 55.0, 98.0, 193.0, 295.0, 580.0, 1318.0, 3135.0, 8912.0, 29052.0, 142221.0, 719361.0, 106591.0, 24078.0, 7479.0, 2745.0, 1127.0, 526.0, 260.0, 152.0, 91.0, 46.0, 47.0, 29.0, 15.0, 7.0, 13.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.59765625, -6.34796142578125, -6.0982666015625, -5.84857177734375, -5.598876953125, -5.34918212890625, -5.0994873046875, -4.84979248046875, -4.60009765625, -4.35040283203125, -4.1007080078125, -3.85101318359375, -3.601318359375, -3.35162353515625, -3.1019287109375, -2.85223388671875, -2.6025390625, -2.35284423828125, -2.1031494140625, -1.85345458984375, -1.603759765625, -1.35406494140625, -1.1043701171875, -0.85467529296875, -0.60498046875, -0.35528564453125, -0.1055908203125, 0.14410400390625, 0.393798828125, 0.64349365234375, 0.8931884765625, 1.14288330078125, 1.392578125, 1.64227294921875, 1.8919677734375, 2.14166259765625, 2.391357421875, 2.64105224609375, 2.8907470703125, 3.14044189453125, 3.39013671875, 3.63983154296875, 3.8895263671875, 4.13922119140625, 4.388916015625, 4.63861083984375, 4.8883056640625, 5.13800048828125, 5.3876953125, 5.63739013671875, 5.8870849609375, 6.13677978515625, 6.386474609375, 6.63616943359375, 6.8858642578125, 7.13555908203125, 7.38525390625, 7.63494873046875, 7.8846435546875, 8.13433837890625, 8.384033203125, 8.63372802734375, 8.8834228515625, 9.13311767578125, 9.3828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 1.0, 4.0, 6.0, 7.0, 9.0, 16.0, 16.0, 29.0, 49.0, 86.0, 129.0, 181.0, 170.0, 111.0, 54.0, 37.0, 24.0, 17.0, 16.0, 16.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029430389404296875, -0.0028631985187530518, -0.002783358097076416, -0.0027035176753997803, -0.0026236772537231445, -0.002543836832046509, -0.002463996410369873, -0.0023841559886932373, -0.0023043155670166016, -0.002224475145339966, -0.00214463472366333, -0.0020647943019866943, -0.0019849538803100586, -0.0019051134586334229, -0.0018252730369567871, -0.0017454326152801514, -0.0016655921936035156, -0.0015857517719268799, -0.0015059113502502441, -0.0014260709285736084, -0.0013462305068969727, -0.001266390085220337, -0.0011865496635437012, -0.0011067092418670654, -0.0010268688201904297, -0.0009470283985137939, -0.0008671879768371582, -0.0007873475551605225, -0.0007075071334838867, -0.000627666711807251, -0.0005478262901306152, -0.0004679858684539795, -0.00038814544677734375, -0.000308305025100708, -0.00022846460342407227, -0.00014862418174743652, -6.878376007080078e-05, 1.1056661605834961e-05, 9.08970832824707e-05, 0.00017073750495910645, 0.0002505779266357422, 0.00033041834831237793, 0.00041025876998901367, 0.0004900991916656494, 0.0005699396133422852, 0.0006497800350189209, 0.0007296204566955566, 0.0008094608783721924, 0.0008893013000488281, 0.0009691417217254639, 0.0010489821434020996, 0.0011288225650787354, 0.001208662986755371, 0.0012885034084320068, 0.0013683438301086426, 0.0014481842517852783, 0.001528024673461914, 0.0016078650951385498, 0.0016877055168151855, 0.0017675459384918213, 0.001847386360168457, 0.0019272267818450928, 0.0020070672035217285, 0.0020869076251983643, 0.002166748046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 13.0, 11.0, 14.0, 25.0, 36.0, 42.0, 51.0, 95.0, 179.0, 229.0, 393.0, 781.0, 1599.0, 3568.0, 10009.0, 34870.0, 170444.0, 687990.0, 101815.0, 23666.0, 7097.0, 2740.0, 1292.0, 630.0, 367.0, 203.0, 117.0, 83.0, 63.0, 31.0, 30.0, 23.0, 11.0, 12.0, 11.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.9571533203125, -7.703369140625, -7.4495849609375, -7.19580078125, -6.9420166015625, -6.688232421875, -6.4344482421875, -6.1806640625, -5.9268798828125, -5.673095703125, -5.4193115234375, -5.16552734375, -4.9117431640625, -4.657958984375, -4.4041748046875, -4.150390625, -3.8966064453125, -3.642822265625, -3.3890380859375, -3.13525390625, -2.8814697265625, -2.627685546875, -2.3739013671875, -2.1201171875, -1.8663330078125, -1.612548828125, -1.3587646484375, -1.10498046875, -0.8511962890625, -0.597412109375, -0.3436279296875, -0.08984375, 0.1639404296875, 0.417724609375, 0.6715087890625, 0.92529296875, 1.1790771484375, 1.432861328125, 1.6866455078125, 1.9404296875, 2.1942138671875, 2.447998046875, 2.7017822265625, 2.95556640625, 3.2093505859375, 3.463134765625, 3.7169189453125, 3.970703125, 4.2244873046875, 4.478271484375, 4.7320556640625, 4.98583984375, 5.2396240234375, 5.493408203125, 5.7471923828125, 6.0009765625, 6.2547607421875, 6.508544921875, 6.7623291015625, 7.01611328125, 7.2698974609375, 7.523681640625, 7.7774658203125, 8.03125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 10.0, 8.0, 17.0, 18.0, 23.0, 38.0, 33.0, 43.0, 70.0, 76.0, 88.0, 89.0, 89.0, 77.0, 67.0, 39.0, 46.0, 38.0, 25.0, 21.0, 13.0, 11.0, 9.0, 10.0, 1.0, 4.0, 1.0, 6.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.569580078125, -7.29541015625, -7.021240234375, -6.7470703125, -6.472900390625, -6.19873046875, -5.924560546875, -5.650390625, -5.376220703125, -5.10205078125, -4.827880859375, -4.5537109375, -4.279541015625, -4.00537109375, -3.731201171875, -3.45703125, -3.182861328125, -2.90869140625, -2.634521484375, -2.3603515625, -2.086181640625, -1.81201171875, -1.537841796875, -1.263671875, -0.989501953125, -0.71533203125, -0.441162109375, -0.1669921875, 0.107177734375, 0.38134765625, 0.655517578125, 0.9296875, 1.203857421875, 1.47802734375, 1.752197265625, 2.0263671875, 2.300537109375, 2.57470703125, 2.848876953125, 3.123046875, 3.397216796875, 3.67138671875, 3.945556640625, 4.2197265625, 4.493896484375, 4.76806640625, 5.042236328125, 5.31640625, 5.590576171875, 5.86474609375, 6.138916015625, 6.4130859375, 6.687255859375, 6.96142578125, 7.235595703125, 7.509765625, 7.783935546875, 8.05810546875, 8.332275390625, 8.6064453125, 8.880615234375, 9.15478515625, 9.428955078125, 9.703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 12.0, 28.0, 42.0, 98.0, 198.0, 342.0, 133.0, 72.0, 31.0, 16.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-318.91046142578125, -308.029052734375, -297.1476745605469, -286.2662658691406, -275.3848876953125, -264.50347900390625, -253.6220703125, -242.7406768798828, -231.85928344726562, -220.97789001464844, -210.09649658203125, -199.215087890625, -188.3336944580078, -177.45230102539062, -166.57089233398438, -155.6894989013672, -144.80810546875, -133.9267120361328, -123.0453109741211, -112.16390991210938, -101.28251647949219, -90.401123046875, -79.51972198486328, -68.63832092285156, -57.756927490234375, -46.87553024291992, -35.99413299560547, -25.112735748291016, -14.231338500976562, -3.3499412536621094, 7.531455993652344, 18.412857055664062, 29.294281005859375, 40.17567825317383, 51.05707550048828, 61.938472747802734, 72.81986999511719, 83.70126342773438, 94.5826644897461, 105.46406555175781, 116.345458984375, 127.22685241699219, 138.10824584960938, 148.98965454101562, 159.8710479736328, 170.75244140625, 181.63385009765625, 192.51524353027344, 203.39663696289062, 214.2780303955078, 225.159423828125, 236.04083251953125, 246.92222595214844, 257.8036193847656, 268.6850280761719, 279.56640625, 290.44781494140625, 301.3292236328125, 312.2106018066406, 323.0920104980469, 333.973388671875, 344.85479736328125, 355.7362060546875, 366.61761474609375, 377.4989929199219]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 12.0, 9.0, 5.0, 14.0, 17.0, 20.0, 15.0, 13.0, 26.0, 26.0, 26.0, 26.0, 37.0, 46.0, 70.0, 79.0, 93.0, 85.0, 53.0, 32.0, 40.0, 38.0, 27.0, 26.0, 20.0, 16.0, 14.0, 15.0, 14.0, 17.0, 7.0, 11.0, 10.0, 2.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-212.47348022460938, -205.71902465820312, -198.96456909179688, -192.2101287841797, -185.45567321777344, -178.7012176513672, -171.94677734375, -165.19232177734375, -158.4378662109375, -151.68341064453125, -144.928955078125, -138.1745147705078, -131.42005920410156, -124.66560363769531, -117.9111557006836, -111.15670776367188, -104.40225219726562, -97.64779663085938, -90.89334869384766, -84.13890075683594, -77.38444519042969, -70.62998962402344, -63.87554168701172, -57.121089935302734, -50.36663818359375, -43.612186431884766, -36.85773468017578, -30.103282928466797, -23.348831176757812, -16.594379425048828, -9.839927673339844, -3.0854759216308594, 3.668975830078125, 10.42342758178711, 17.177879333496094, 23.932331085205078, 30.686782836914062, 37.44123458862305, 44.19568634033203, 50.950138092041016, 57.70458984375, 64.45904541015625, 71.21349334716797, 77.96794128417969, 84.72239685058594, 91.47685241699219, 98.2313003540039, 104.98574829101562, 111.74020385742188, 118.49465942382812, 125.24910736083984, 132.00355529785156, 138.7580108642578, 145.51246643066406, 152.26690673828125, 159.0213623046875, 165.77581787109375, 172.5302734375, 179.28472900390625, 186.03916931152344, 192.7936248779297, 199.54808044433594, 206.30252075195312, 213.05697631835938, 219.81143188476562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 13.0, 17.0, 20.0, 30.0, 75.0, 125.0, 294.0, 709.0, 2756.0, 15258.0, 167309.0, 2613241.0, 1317059.0, 67194.0, 7507.0, 1602.0, 549.0, 241.0, 106.0, 61.0, 38.0, 30.0, 18.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.046875, -20.989013671875, -19.93115234375, -18.873291015625, -17.8154296875, -16.757568359375, -15.69970703125, -14.641845703125, -13.583984375, -12.526123046875, -11.46826171875, -10.410400390625, -9.3525390625, -8.294677734375, -7.23681640625, -6.178955078125, -5.12109375, -4.063232421875, -3.00537109375, -1.947509765625, -0.8896484375, 0.168212890625, 1.22607421875, 2.283935546875, 3.341796875, 4.399658203125, 5.45751953125, 6.515380859375, 7.5732421875, 8.631103515625, 9.68896484375, 10.746826171875, 11.8046875, 12.862548828125, 13.92041015625, 14.978271484375, 16.0361328125, 17.093994140625, 18.15185546875, 19.209716796875, 20.267578125, 21.325439453125, 22.38330078125, 23.441162109375, 24.4990234375, 25.556884765625, 26.61474609375, 27.672607421875, 28.73046875, 29.788330078125, 30.84619140625, 31.904052734375, 32.9619140625, 34.019775390625, 35.07763671875, 36.135498046875, 37.193359375, 38.251220703125, 39.30908203125, 40.366943359375, 41.4248046875, 42.482666015625, 43.54052734375, 44.598388671875, 45.65625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 4.0, 8.0, 10.0, 12.0, 9.0, 25.0, 21.0, 24.0, 32.0, 37.0, 47.0, 42.0, 44.0, 54.0, 48.0, 53.0, 55.0, 60.0, 56.0, 56.0, 51.0, 39.0, 36.0, 37.0, 33.0, 18.0, 20.0, 15.0, 13.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -15.98681640625, -15.3798828125, -14.77294921875, -14.166015625, -13.55908203125, -12.9521484375, -12.34521484375, -11.73828125, -11.13134765625, -10.5244140625, -9.91748046875, -9.310546875, -8.70361328125, -8.0966796875, -7.48974609375, -6.8828125, -6.27587890625, -5.6689453125, -5.06201171875, -4.455078125, -3.84814453125, -3.2412109375, -2.63427734375, -2.02734375, -1.42041015625, -0.8134765625, -0.20654296875, 0.400390625, 1.00732421875, 1.6142578125, 2.22119140625, 2.828125, 3.43505859375, 4.0419921875, 4.64892578125, 5.255859375, 5.86279296875, 6.4697265625, 7.07666015625, 7.68359375, 8.29052734375, 8.8974609375, 9.50439453125, 10.111328125, 10.71826171875, 11.3251953125, 11.93212890625, 12.5390625, 13.14599609375, 13.7529296875, 14.35986328125, 14.966796875, 15.57373046875, 16.1806640625, 16.78759765625, 17.39453125, 18.00146484375, 18.6083984375, 19.21533203125, 19.822265625, 20.42919921875, 21.0361328125, 21.64306640625, 22.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 6.0, 9.0, 20.0, 14.0, 19.0, 30.0, 39.0, 55.0, 114.0, 194.0, 385.0, 980.0, 3459.0, 16478.0, 228685.0, 3649084.0, 271282.0, 17771.0, 3626.0, 1134.0, 386.0, 183.0, 107.0, 72.0, 31.0, 26.0, 18.0, 16.0, 12.0, 10.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-39.71875, -38.49755859375, -37.2763671875, -36.05517578125, -34.833984375, -33.61279296875, -32.3916015625, -31.17041015625, -29.94921875, -28.72802734375, -27.5068359375, -26.28564453125, -25.064453125, -23.84326171875, -22.6220703125, -21.40087890625, -20.1796875, -18.95849609375, -17.7373046875, -16.51611328125, -15.294921875, -14.07373046875, -12.8525390625, -11.63134765625, -10.41015625, -9.18896484375, -7.9677734375, -6.74658203125, -5.525390625, -4.30419921875, -3.0830078125, -1.86181640625, -0.640625, 0.58056640625, 1.8017578125, 3.02294921875, 4.244140625, 5.46533203125, 6.6865234375, 7.90771484375, 9.12890625, 10.35009765625, 11.5712890625, 12.79248046875, 14.013671875, 15.23486328125, 16.4560546875, 17.67724609375, 18.8984375, 20.11962890625, 21.3408203125, 22.56201171875, 23.783203125, 25.00439453125, 26.2255859375, 27.44677734375, 28.66796875, 29.88916015625, 31.1103515625, 32.33154296875, 33.552734375, 34.77392578125, 35.9951171875, 37.21630859375, 38.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 9.0, 12.0, 12.0, 19.0, 39.0, 43.0, 76.0, 134.0, 195.0, 272.0, 446.0, 599.0, 652.0, 542.0, 342.0, 238.0, 146.0, 80.0, 70.0, 54.0, 19.0, 15.0, 16.0, 10.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.015625, -29.030029296875, -28.04443359375, -27.058837890625, -26.0732421875, -25.087646484375, -24.10205078125, -23.116455078125, -22.130859375, -21.145263671875, -20.15966796875, -19.174072265625, -18.1884765625, -17.202880859375, -16.21728515625, -15.231689453125, -14.24609375, -13.260498046875, -12.27490234375, -11.289306640625, -10.3037109375, -9.318115234375, -8.33251953125, -7.346923828125, -6.361328125, -5.375732421875, -4.39013671875, -3.404541015625, -2.4189453125, -1.433349609375, -0.44775390625, 0.537841796875, 1.5234375, 2.509033203125, 3.49462890625, 4.480224609375, 5.4658203125, 6.451416015625, 7.43701171875, 8.422607421875, 9.408203125, 10.393798828125, 11.37939453125, 12.364990234375, 13.3505859375, 14.336181640625, 15.32177734375, 16.307373046875, 17.29296875, 18.278564453125, 19.26416015625, 20.249755859375, 21.2353515625, 22.220947265625, 23.20654296875, 24.192138671875, 25.177734375, 26.163330078125, 27.14892578125, 28.134521484375, 29.1201171875, 30.105712890625, 31.09130859375, 32.076904296875, 33.0625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 11.0, 20.0, 41.0, 117.0, 264.0, 309.0, 165.0, 48.0, 14.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-675.2928466796875, -660.3777465820312, -645.4627075195312, -630.547607421875, -615.632568359375, -600.7174682617188, -585.8024291992188, -570.8873291015625, -555.9722900390625, -541.0571899414062, -526.1421508789062, -511.2270812988281, -496.31201171875, -481.3969421386719, -466.48187255859375, -451.5667724609375, -436.6517028808594, -421.73663330078125, -406.8215637207031, -391.906494140625, -376.9914245605469, -362.07635498046875, -347.1612548828125, -332.2462158203125, -317.33111572265625, -302.4160461425781, -287.5009765625, -272.5859069824219, -257.67083740234375, -242.75576782226562, -227.84068298339844, -212.9256134033203, -198.01052856445312, -183.095458984375, -168.18038940429688, -153.26531982421875, -138.35025024414062, -123.43517303466797, -108.52009582519531, -93.60502624511719, -78.68995666503906, -63.77488708496094, -48.85981369018555, -33.944740295410156, -19.02967071533203, -4.114601135253906, 10.80047607421875, 25.715545654296875, 40.630615234375, 55.545684814453125, 70.46075439453125, 85.3758316040039, 100.29090118408203, 115.20597076416016, 130.1210479736328, 145.03611755371094, 159.95118713378906, 174.8662567138672, 189.7813262939453, 204.6964111328125, 219.61148071289062, 234.52655029296875, 249.44161987304688, 264.356689453125, 279.2717590332031]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 15.0, 16.0, 10.0, 12.0, 18.0, 15.0, 16.0, 24.0, 24.0, 28.0, 18.0, 34.0, 47.0, 33.0, 39.0, 41.0, 36.0, 30.0, 40.0, 36.0, 35.0, 43.0, 27.0, 36.0, 33.0, 26.0, 28.0, 31.0, 29.0, 25.0, 20.0, 22.0, 21.0, 11.0, 12.0, 8.0, 9.0, 6.0, 11.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-129.9894561767578, -126.17731475830078, -122.36516571044922, -118.55302429199219, -114.74087524414062, -110.9287338256836, -107.11659240722656, -103.304443359375, -99.49230194091797, -95.68016052246094, -91.86801147460938, -88.05587005615234, -84.24372863769531, -80.43157958984375, -76.61943817138672, -72.80729675292969, -68.99514770507812, -65.1830062866211, -61.37085723876953, -57.5587158203125, -53.7465705871582, -49.934425354003906, -46.122283935546875, -42.31013870239258, -38.49799346923828, -34.685848236083984, -30.87370491027832, -27.061561584472656, -23.24941635131836, -19.437271118164062, -15.625127792358398, -11.812984466552734, -8.000839233398438, -4.188694953918457, -0.37655067443847656, 3.435593605041504, 7.247737884521484, 11.059883117675781, 14.872026443481445, 18.68416976928711, 22.496315002441406, 26.308460235595703, 30.120603561401367, 33.93274688720703, 37.74489212036133, 41.557037353515625, 45.369178771972656, 49.18132400512695, 52.99346923828125, 56.80561447143555, 60.617759704589844, 64.42990112304688, 68.24205017089844, 72.05419158935547, 75.8663330078125, 79.67848205566406, 83.4906234741211, 87.30276489257812, 91.11491394042969, 94.92705535888672, 98.73919677734375, 102.55134582519531, 106.36348724365234, 110.17562866210938, 113.98777770996094]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 3.0, 16.0, 16.0, 35.0, 62.0, 88.0, 122.0, 221.0, 287.0, 476.0, 856.0, 1562.0, 3030.0, 6335.0, 13825.0, 34181.0, 92223.0, 254336.0, 375443.0, 163774.0, 59249.0, 22749.0, 9858.0, 4482.0, 2278.0, 1231.0, 657.0, 429.0, 255.0, 156.0, 90.0, 68.0, 37.0, 44.0, 27.0, 16.0, 10.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.546875, -23.809326171875, -23.07177734375, -22.334228515625, -21.5966796875, -20.859130859375, -20.12158203125, -19.384033203125, -18.646484375, -17.908935546875, -17.17138671875, -16.433837890625, -15.6962890625, -14.958740234375, -14.22119140625, -13.483642578125, -12.74609375, -12.008544921875, -11.27099609375, -10.533447265625, -9.7958984375, -9.058349609375, -8.32080078125, -7.583251953125, -6.845703125, -6.108154296875, -5.37060546875, -4.633056640625, -3.8955078125, -3.157958984375, -2.42041015625, -1.682861328125, -0.9453125, -0.207763671875, 0.52978515625, 1.267333984375, 2.0048828125, 2.742431640625, 3.47998046875, 4.217529296875, 4.955078125, 5.692626953125, 6.43017578125, 7.167724609375, 7.9052734375, 8.642822265625, 9.38037109375, 10.117919921875, 10.85546875, 11.593017578125, 12.33056640625, 13.068115234375, 13.8056640625, 14.543212890625, 15.28076171875, 16.018310546875, 16.755859375, 17.493408203125, 18.23095703125, 18.968505859375, 19.7060546875, 20.443603515625, 21.18115234375, 21.918701171875, 22.65625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 7.0, 8.0, 3.0, 15.0, 22.0, 24.0, 31.0, 37.0, 26.0, 48.0, 41.0, 43.0, 46.0, 49.0, 58.0, 73.0, 61.0, 43.0, 58.0, 39.0, 47.0, 34.0, 23.0, 35.0, 29.0, 22.0, 13.0, 9.0, 7.0, 9.0, 5.0, 2.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.0166015625, -15.408203125, -14.7998046875, -14.19140625, -13.5830078125, -12.974609375, -12.3662109375, -11.7578125, -11.1494140625, -10.541015625, -9.9326171875, -9.32421875, -8.7158203125, -8.107421875, -7.4990234375, -6.890625, -6.2822265625, -5.673828125, -5.0654296875, -4.45703125, -3.8486328125, -3.240234375, -2.6318359375, -2.0234375, -1.4150390625, -0.806640625, -0.1982421875, 0.41015625, 1.0185546875, 1.626953125, 2.2353515625, 2.84375, 3.4521484375, 4.060546875, 4.6689453125, 5.27734375, 5.8857421875, 6.494140625, 7.1025390625, 7.7109375, 8.3193359375, 8.927734375, 9.5361328125, 10.14453125, 10.7529296875, 11.361328125, 11.9697265625, 12.578125, 13.1865234375, 13.794921875, 14.4033203125, 15.01171875, 15.6201171875, 16.228515625, 16.8369140625, 17.4453125, 18.0537109375, 18.662109375, 19.2705078125, 19.87890625, 20.4873046875, 21.095703125, 21.7041015625, 22.3125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 13.0, 15.0, 21.0, 24.0, 35.0, 50.0, 55.0, 67.0, 115.0, 108.0, 198.0, 224.0, 325.0, 514.0, 753.0, 1226.0, 2198.0, 4966.0, 15461.0, 69731.0, 677927.0, 220224.0, 36122.0, 9548.0, 3515.0, 1849.0, 1021.0, 638.0, 421.0, 330.0, 225.0, 131.0, 123.0, 90.0, 58.0, 43.0, 39.0, 34.0, 30.0, 17.0, 15.0, 9.0, 16.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-42.09375, -40.88427734375, -39.6748046875, -38.46533203125, -37.255859375, -36.04638671875, -34.8369140625, -33.62744140625, -32.41796875, -31.20849609375, -29.9990234375, -28.78955078125, -27.580078125, -26.37060546875, -25.1611328125, -23.95166015625, -22.7421875, -21.53271484375, -20.3232421875, -19.11376953125, -17.904296875, -16.69482421875, -15.4853515625, -14.27587890625, -13.06640625, -11.85693359375, -10.6474609375, -9.43798828125, -8.228515625, -7.01904296875, -5.8095703125, -4.60009765625, -3.390625, -2.18115234375, -0.9716796875, 0.23779296875, 1.447265625, 2.65673828125, 3.8662109375, 5.07568359375, 6.28515625, 7.49462890625, 8.7041015625, 9.91357421875, 11.123046875, 12.33251953125, 13.5419921875, 14.75146484375, 15.9609375, 17.17041015625, 18.3798828125, 19.58935546875, 20.798828125, 22.00830078125, 23.2177734375, 24.42724609375, 25.63671875, 26.84619140625, 28.0556640625, 29.26513671875, 30.474609375, 31.68408203125, 32.8935546875, 34.10302734375, 35.3125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 12.0, 14.0, 19.0, 14.0, 27.0, 26.0, 23.0, 34.0, 32.0, 31.0, 43.0, 39.0, 51.0, 42.0, 48.0, 46.0, 44.0, 53.0, 52.0, 41.0, 34.0, 40.0, 31.0, 30.0, 26.0, 22.0, 14.0, 16.0, 11.0, 12.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0], "bins": [-65.5, -63.67626953125, -61.8525390625, -60.02880859375, -58.205078125, -56.38134765625, -54.5576171875, -52.73388671875, -50.91015625, -49.08642578125, -47.2626953125, -45.43896484375, -43.615234375, -41.79150390625, -39.9677734375, -38.14404296875, -36.3203125, -34.49658203125, -32.6728515625, -30.84912109375, -29.025390625, -27.20166015625, -25.3779296875, -23.55419921875, -21.73046875, -19.90673828125, -18.0830078125, -16.25927734375, -14.435546875, -12.61181640625, -10.7880859375, -8.96435546875, -7.140625, -5.31689453125, -3.4931640625, -1.66943359375, 0.154296875, 1.97802734375, 3.8017578125, 5.62548828125, 7.44921875, 9.27294921875, 11.0966796875, 12.92041015625, 14.744140625, 16.56787109375, 18.3916015625, 20.21533203125, 22.0390625, 23.86279296875, 25.6865234375, 27.51025390625, 29.333984375, 31.15771484375, 32.9814453125, 34.80517578125, 36.62890625, 38.45263671875, 40.2763671875, 42.10009765625, 43.923828125, 45.74755859375, 47.5712890625, 49.39501953125, 51.21875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 5.0, 7.0, 13.0, 12.0, 17.0, 33.0, 53.0, 61.0, 57.0, 141.0, 263.0, 566.0, 1407.0, 5103.0, 32928.0, 900049.0, 95150.0, 9066.0, 2100.0, 745.0, 301.0, 167.0, 93.0, 61.0, 35.0, 40.0, 18.0, 12.0, 10.0, 7.0, 5.0, 8.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8748779296875, -12.468505859375, -12.0621337890625, -11.65576171875, -11.2493896484375, -10.843017578125, -10.4366455078125, -10.0302734375, -9.6239013671875, -9.217529296875, -8.8111572265625, -8.40478515625, -7.9984130859375, -7.592041015625, -7.1856689453125, -6.779296875, -6.3729248046875, -5.966552734375, -5.5601806640625, -5.15380859375, -4.7474365234375, -4.341064453125, -3.9346923828125, -3.5283203125, -3.1219482421875, -2.715576171875, -2.3092041015625, -1.90283203125, -1.4964599609375, -1.090087890625, -0.6837158203125, -0.27734375, 0.1290283203125, 0.535400390625, 0.9417724609375, 1.34814453125, 1.7545166015625, 2.160888671875, 2.5672607421875, 2.9736328125, 3.3800048828125, 3.786376953125, 4.1927490234375, 4.59912109375, 5.0054931640625, 5.411865234375, 5.8182373046875, 6.224609375, 6.6309814453125, 7.037353515625, 7.4437255859375, 7.85009765625, 8.2564697265625, 8.662841796875, 9.0692138671875, 9.4755859375, 9.8819580078125, 10.288330078125, 10.6947021484375, 11.10107421875, 11.5074462890625, 11.913818359375, 12.3201904296875, 12.7265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 11.0, 3.0, 11.0, 20.0, 40.0, 60.0, 157.0, 299.0, 176.0, 86.0, 35.0, 27.0, 12.0, 14.0, 5.0, 8.0, 7.0, 1.0, 5.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00255584716796875, -0.00244748592376709, -0.0023391246795654297, -0.0022307634353637695, -0.0021224021911621094, -0.0020140409469604492, -0.001905679702758789, -0.001797318458557129, -0.0016889572143554688, -0.0015805959701538086, -0.0014722347259521484, -0.0013638734817504883, -0.0012555122375488281, -0.001147150993347168, -0.0010387897491455078, -0.0009304285049438477, -0.0008220672607421875, -0.0007137060165405273, -0.0006053447723388672, -0.000496983528137207, -0.0003886222839355469, -0.0002802610397338867, -0.00017189979553222656, -6.35385513305664e-05, 4.482269287109375e-05, 0.0001531839370727539, 0.00026154518127441406, 0.0003699064254760742, 0.0004782676696777344, 0.0005866289138793945, 0.0006949901580810547, 0.0008033514022827148, 0.000911712646484375, 0.0010200738906860352, 0.0011284351348876953, 0.0012367963790893555, 0.0013451576232910156, 0.0014535188674926758, 0.001561880111694336, 0.001670241355895996, 0.0017786026000976562, 0.0018869638442993164, 0.0019953250885009766, 0.0021036863327026367, 0.002212047576904297, 0.002320408821105957, 0.002428770065307617, 0.0025371313095092773, 0.0026454925537109375, 0.0027538537979125977, 0.002862215042114258, 0.002970576286315918, 0.003078937530517578, 0.0031872987747192383, 0.0032956600189208984, 0.0034040212631225586, 0.0035123825073242188, 0.003620743751525879, 0.003729104995727539, 0.0038374662399291992, 0.003945827484130859, 0.0040541887283325195, 0.00416254997253418, 0.00427091121673584, 0.0043792724609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 26.0, 22.0, 30.0, 37.0, 48.0, 54.0, 75.0, 99.0, 155.0, 261.0, 332.0, 606.0, 900.0, 1755.0, 3424.0, 7188.0, 18987.0, 74523.0, 681406.0, 199580.0, 36747.0, 11378.0, 5020.0, 2286.0, 1347.0, 750.0, 467.0, 298.0, 184.0, 147.0, 105.0, 90.0, 48.0, 48.0, 30.0, 23.0, 15.0, 11.0, 11.0, 7.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.7421875, -5.5555419921875, -5.368896484375, -5.1822509765625, -4.99560546875, -4.8089599609375, -4.622314453125, -4.4356689453125, -4.2490234375, -4.0623779296875, -3.875732421875, -3.6890869140625, -3.50244140625, -3.3157958984375, -3.129150390625, -2.9425048828125, -2.755859375, -2.5692138671875, -2.382568359375, -2.1959228515625, -2.00927734375, -1.8226318359375, -1.635986328125, -1.4493408203125, -1.2626953125, -1.0760498046875, -0.889404296875, -0.7027587890625, -0.51611328125, -0.3294677734375, -0.142822265625, 0.0438232421875, 0.23046875, 0.4171142578125, 0.603759765625, 0.7904052734375, 0.97705078125, 1.1636962890625, 1.350341796875, 1.5369873046875, 1.7236328125, 1.9102783203125, 2.096923828125, 2.2835693359375, 2.47021484375, 2.6568603515625, 2.843505859375, 3.0301513671875, 3.216796875, 3.4034423828125, 3.590087890625, 3.7767333984375, 3.96337890625, 4.1500244140625, 4.336669921875, 4.5233154296875, 4.7099609375, 4.8966064453125, 5.083251953125, 5.2698974609375, 5.45654296875, 5.6431884765625, 5.829833984375, 6.0164794921875, 6.203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 8.0, 5.0, 13.0, 14.0, 14.0, 20.0, 22.0, 28.0, 41.0, 50.0, 87.0, 101.0, 112.0, 114.0, 83.0, 58.0, 58.0, 40.0, 24.0, 23.0, 13.0, 16.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.4920654296875, -7.241943359375, -6.9918212890625, -6.74169921875, -6.4915771484375, -6.241455078125, -5.9913330078125, -5.7412109375, -5.4910888671875, -5.240966796875, -4.9908447265625, -4.74072265625, -4.4906005859375, -4.240478515625, -3.9903564453125, -3.740234375, -3.4901123046875, -3.239990234375, -2.9898681640625, -2.73974609375, -2.4896240234375, -2.239501953125, -1.9893798828125, -1.7392578125, -1.4891357421875, -1.239013671875, -0.9888916015625, -0.73876953125, -0.4886474609375, -0.238525390625, 0.0115966796875, 0.26171875, 0.5118408203125, 0.761962890625, 1.0120849609375, 1.26220703125, 1.5123291015625, 1.762451171875, 2.0125732421875, 2.2626953125, 2.5128173828125, 2.762939453125, 3.0130615234375, 3.26318359375, 3.5133056640625, 3.763427734375, 4.0135498046875, 4.263671875, 4.5137939453125, 4.763916015625, 5.0140380859375, 5.26416015625, 5.5142822265625, 5.764404296875, 6.0145263671875, 6.2646484375, 6.5147705078125, 6.764892578125, 7.0150146484375, 7.26513671875, 7.5152587890625, 7.765380859375, 8.0155029296875, 8.265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 11.0, 17.0, 34.0, 45.0, 81.0, 176.0, 329.0, 133.0, 62.0, 37.0, 22.0, 15.0, 7.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-201.1312255859375, -192.88150024414062, -184.63177490234375, -176.38204956054688, -168.13232421875, -159.88259887695312, -151.63287353515625, -143.38314819335938, -135.1334228515625, -126.88369750976562, -118.63397216796875, -110.38424682617188, -102.134521484375, -93.88479614257812, -85.63507080078125, -77.38534545898438, -69.1356201171875, -60.885894775390625, -52.63616943359375, -44.386444091796875, -36.13671875, -27.886993408203125, -19.63726806640625, -11.387542724609375, -3.1378173828125, 5.111907958984375, 13.36163330078125, 21.611358642578125, 29.861083984375, 38.110809326171875, 46.36053466796875, 54.610260009765625, 62.860015869140625, 71.1097412109375, 79.35946655273438, 87.60919189453125, 95.85891723632812, 104.108642578125, 112.35836791992188, 120.60809326171875, 128.85781860351562, 137.1075439453125, 145.35726928710938, 153.60699462890625, 161.85671997070312, 170.1064453125, 178.35617065429688, 186.60589599609375, 194.85562133789062, 203.1053466796875, 211.35507202148438, 219.60479736328125, 227.85452270507812, 236.104248046875, 244.35397338867188, 252.60369873046875, 260.8534240722656, 269.1031494140625, 277.3528747558594, 285.60260009765625, 293.8523254394531, 302.10205078125, 310.3517761230469, 318.60150146484375, 326.8512268066406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 10.0, 12.0, 13.0, 11.0, 10.0, 18.0, 20.0, 23.0, 24.0, 26.0, 28.0, 25.0, 27.0, 71.0, 89.0, 122.0, 114.0, 47.0, 35.0, 37.0, 26.0, 20.0, 20.0, 16.0, 20.0, 24.0, 14.0, 17.0, 10.0, 11.0, 14.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.0072784423828, -200.46408081054688, -192.9208984375, -185.37770080566406, -177.83450317382812, -170.29132080078125, -162.7481231689453, -155.20492553710938, -147.6617431640625, -140.11854553222656, -132.5753631591797, -125.03216552734375, -117.48897552490234, -109.94578552246094, -102.402587890625, -94.8593978881836, -87.31620788574219, -79.77301788330078, -72.22982788085938, -64.68663024902344, -57.14344024658203, -49.600250244140625, -42.05705642700195, -34.51386260986328, -26.970672607421875, -19.427480697631836, -11.884288787841797, -4.341096878051758, 3.2020950317382812, 10.745285034179688, 18.28847885131836, 25.83167266845703, 33.374847412109375, 40.91803741455078, 48.46123123168945, 56.004425048828125, 63.54761505126953, 71.09080505371094, 78.63400268554688, 86.17719268798828, 93.72038269042969, 101.2635726928711, 108.8067626953125, 116.34996032714844, 123.89315032958984, 131.43634033203125, 138.9795379638672, 146.52273559570312, 154.06591796875, 161.60911560058594, 169.1522979736328, 176.69549560546875, 184.23867797851562, 191.78187561035156, 199.3250732421875, 206.86825561523438, 214.4114532470703, 221.95465087890625, 229.49783325195312, 237.04103088378906, 244.584228515625, 252.12741088867188, 259.67059326171875, 267.21380615234375, 274.7569885253906]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 7.0, 12.0, 17.0, 19.0, 36.0, 61.0, 70.0, 128.0, 188.0, 350.0, 568.0, 999.0, 2220.0, 6292.0, 22037.0, 128437.0, 1080382.0, 2386092.0, 490875.0, 57563.0, 10795.0, 3471.0, 1548.0, 864.0, 484.0, 264.0, 174.0, 100.0, 58.0, 44.0, 37.0, 25.0, 18.0, 13.0, 11.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.6875, -23.815185546875, -22.94287109375, -22.070556640625, -21.1982421875, -20.325927734375, -19.45361328125, -18.581298828125, -17.708984375, -16.836669921875, -15.96435546875, -15.092041015625, -14.2197265625, -13.347412109375, -12.47509765625, -11.602783203125, -10.73046875, -9.858154296875, -8.98583984375, -8.113525390625, -7.2412109375, -6.368896484375, -5.49658203125, -4.624267578125, -3.751953125, -2.879638671875, -2.00732421875, -1.135009765625, -0.2626953125, 0.609619140625, 1.48193359375, 2.354248046875, 3.2265625, 4.098876953125, 4.97119140625, 5.843505859375, 6.7158203125, 7.588134765625, 8.46044921875, 9.332763671875, 10.205078125, 11.077392578125, 11.94970703125, 12.822021484375, 13.6943359375, 14.566650390625, 15.43896484375, 16.311279296875, 17.18359375, 18.055908203125, 18.92822265625, 19.800537109375, 20.6728515625, 21.545166015625, 22.41748046875, 23.289794921875, 24.162109375, 25.034423828125, 25.90673828125, 26.779052734375, 27.6513671875, 28.523681640625, 29.39599609375, 30.268310546875, 31.140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 7.0, 19.0, 21.0, 25.0, 33.0, 45.0, 41.0, 43.0, 39.0, 60.0, 55.0, 74.0, 56.0, 56.0, 70.0, 56.0, 48.0, 46.0, 25.0, 37.0, 27.0, 23.0, 23.0, 11.0, 10.0, 11.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.030517578125, -15.42041015625, -14.810302734375, -14.2001953125, -13.590087890625, -12.97998046875, -12.369873046875, -11.759765625, -11.149658203125, -10.53955078125, -9.929443359375, -9.3193359375, -8.709228515625, -8.09912109375, -7.489013671875, -6.87890625, -6.268798828125, -5.65869140625, -5.048583984375, -4.4384765625, -3.828369140625, -3.21826171875, -2.608154296875, -1.998046875, -1.387939453125, -0.77783203125, -0.167724609375, 0.4423828125, 1.052490234375, 1.66259765625, 2.272705078125, 2.8828125, 3.492919921875, 4.10302734375, 4.713134765625, 5.3232421875, 5.933349609375, 6.54345703125, 7.153564453125, 7.763671875, 8.373779296875, 8.98388671875, 9.593994140625, 10.2041015625, 10.814208984375, 11.42431640625, 12.034423828125, 12.64453125, 13.254638671875, 13.86474609375, 14.474853515625, 15.0849609375, 15.695068359375, 16.30517578125, 16.915283203125, 17.525390625, 18.135498046875, 18.74560546875, 19.355712890625, 19.9658203125, 20.575927734375, 21.18603515625, 21.796142578125, 22.40625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 9.0, 12.0, 13.0, 30.0, 38.0, 36.0, 86.0, 147.0, 273.0, 516.0, 1359.0, 4894.0, 45361.0, 3962462.0, 167551.0, 8266.0, 1832.0, 646.0, 300.0, 172.0, 83.0, 64.0, 41.0, 18.0, 21.0, 11.0, 10.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.6875, -69.1865234375, -66.685546875, -64.1845703125, -61.68359375, -59.1826171875, -56.681640625, -54.1806640625, -51.6796875, -49.1787109375, -46.677734375, -44.1767578125, -41.67578125, -39.1748046875, -36.673828125, -34.1728515625, -31.671875, -29.1708984375, -26.669921875, -24.1689453125, -21.66796875, -19.1669921875, -16.666015625, -14.1650390625, -11.6640625, -9.1630859375, -6.662109375, -4.1611328125, -1.66015625, 0.8408203125, 3.341796875, 5.8427734375, 8.34375, 10.8447265625, 13.345703125, 15.8466796875, 18.34765625, 20.8486328125, 23.349609375, 25.8505859375, 28.3515625, 30.8525390625, 33.353515625, 35.8544921875, 38.35546875, 40.8564453125, 43.357421875, 45.8583984375, 48.359375, 50.8603515625, 53.361328125, 55.8623046875, 58.36328125, 60.8642578125, 63.365234375, 65.8662109375, 68.3671875, 70.8681640625, 73.369140625, 75.8701171875, 78.37109375, 80.8720703125, 83.373046875, 85.8740234375, 88.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 13.0, 6.0, 7.0, 11.0, 21.0, 22.0, 44.0, 56.0, 73.0, 130.0, 204.0, 303.0, 539.0, 701.0, 663.0, 504.0, 285.0, 180.0, 97.0, 61.0, 43.0, 42.0, 16.0, 10.0, 12.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.03125, -50.50341796875, -48.9755859375, -47.44775390625, -45.919921875, -44.39208984375, -42.8642578125, -41.33642578125, -39.80859375, -38.28076171875, -36.7529296875, -35.22509765625, -33.697265625, -32.16943359375, -30.6416015625, -29.11376953125, -27.5859375, -26.05810546875, -24.5302734375, -23.00244140625, -21.474609375, -19.94677734375, -18.4189453125, -16.89111328125, -15.36328125, -13.83544921875, -12.3076171875, -10.77978515625, -9.251953125, -7.72412109375, -6.1962890625, -4.66845703125, -3.140625, -1.61279296875, -0.0849609375, 1.44287109375, 2.970703125, 4.49853515625, 6.0263671875, 7.55419921875, 9.08203125, 10.60986328125, 12.1376953125, 13.66552734375, 15.193359375, 16.72119140625, 18.2490234375, 19.77685546875, 21.3046875, 22.83251953125, 24.3603515625, 25.88818359375, 27.416015625, 28.94384765625, 30.4716796875, 31.99951171875, 33.52734375, 35.05517578125, 36.5830078125, 38.11083984375, 39.638671875, 41.16650390625, 42.6943359375, 44.22216796875, 45.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 10.0, 16.0, 25.0, 35.0, 80.0, 158.0, 240.0, 173.0, 116.0, 53.0, 34.0, 13.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-340.818603515625, -325.2418518066406, -309.66510009765625, -294.0883483886719, -278.5115966796875, -262.934814453125, -247.35806274414062, -231.78131103515625, -216.20455932617188, -200.6278076171875, -185.05105590820312, -169.4742889404297, -153.8975372314453, -138.32078552246094, -122.74402618408203, -107.16726684570312, -91.59051513671875, -76.01376342773438, -60.43700408935547, -44.86024856567383, -29.283493041992188, -13.706741333007812, 1.8700180053710938, 17.44677734375, 33.023529052734375, 48.600284576416016, 64.17704010009766, 79.75379943847656, 95.33055114746094, 110.90730285644531, 126.48406219482422, 142.06082153320312, 157.6375732421875, 173.21432495117188, 188.79107666015625, 204.3678436279297, 219.94459533691406, 235.52134704589844, 251.09811401367188, 266.67486572265625, 282.2516174316406, 297.828369140625, 313.4051208496094, 328.98187255859375, 344.55865478515625, 360.1353759765625, 375.712158203125, 391.2889099121094, 406.86566162109375, 422.4424133300781, 438.0191650390625, 453.5959167480469, 469.17266845703125, 484.74945068359375, 500.3262023925781, 515.9029541015625, 531.479736328125, 547.0565185546875, 562.6332397460938, 578.2100219726562, 593.7867431640625, 609.363525390625, 624.9402465820312, 640.5170288085938, 656.09375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 13.0, 9.0, 17.0, 29.0, 19.0, 27.0, 28.0, 45.0, 41.0, 43.0, 53.0, 63.0, 68.0, 54.0, 73.0, 47.0, 48.0, 30.0, 41.0, 49.0, 36.0, 33.0, 15.0, 20.0, 20.0, 17.0, 13.0, 6.0, 10.0, 6.0, 11.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-266.8985900878906, -258.9678039550781, -251.03701782226562, -243.10623168945312, -235.17544555664062, -227.24465942382812, -219.31385803222656, -211.38307189941406, -203.45228576660156, -195.52149963378906, -187.59071350097656, -179.65992736816406, -171.7291259765625, -163.79833984375, -155.8675537109375, -147.936767578125, -140.0059814453125, -132.0751953125, -124.1444091796875, -116.21361541748047, -108.28282928466797, -100.35204315185547, -92.42124938964844, -84.49046325683594, -76.55967712402344, -68.62889099121094, -60.69810104370117, -52.767311096191406, -44.836524963378906, -36.905738830566406, -28.97494888305664, -21.044158935546875, -13.113388061523438, -5.182600021362305, 2.748188018798828, 10.678976058959961, 18.609764099121094, 26.540550231933594, 34.47134017944336, 42.402130126953125, 50.332916259765625, 58.263702392578125, 66.19448852539062, 74.12528228759766, 82.05606842041016, 89.98685455322266, 97.91764831542969, 105.84843444824219, 113.77922058105469, 121.71000671386719, 129.6407928466797, 137.5715789794922, 145.50238037109375, 153.43316650390625, 161.36395263671875, 169.29473876953125, 177.22552490234375, 185.15631103515625, 193.08709716796875, 201.01788330078125, 208.94866943359375, 216.87945556640625, 224.8102569580078, 232.7410430908203, 240.6718292236328]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 9.0, 16.0, 24.0, 28.0, 45.0, 76.0, 101.0, 180.0, 307.0, 466.0, 771.0, 1520.0, 3077.0, 6498.0, 15982.0, 44897.0, 145213.0, 444968.0, 262200.0, 77619.0, 25582.0, 9835.0, 4389.0, 2043.0, 1115.0, 619.0, 338.0, 217.0, 111.0, 95.0, 70.0, 32.0, 32.0, 23.0, 8.0, 14.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.703125, -23.970947265625, -23.23876953125, -22.506591796875, -21.7744140625, -21.042236328125, -20.31005859375, -19.577880859375, -18.845703125, -18.113525390625, -17.38134765625, -16.649169921875, -15.9169921875, -15.184814453125, -14.45263671875, -13.720458984375, -12.98828125, -12.256103515625, -11.52392578125, -10.791748046875, -10.0595703125, -9.327392578125, -8.59521484375, -7.863037109375, -7.130859375, -6.398681640625, -5.66650390625, -4.934326171875, -4.2021484375, -3.469970703125, -2.73779296875, -2.005615234375, -1.2734375, -0.541259765625, 0.19091796875, 0.923095703125, 1.6552734375, 2.387451171875, 3.11962890625, 3.851806640625, 4.583984375, 5.316162109375, 6.04833984375, 6.780517578125, 7.5126953125, 8.244873046875, 8.97705078125, 9.709228515625, 10.44140625, 11.173583984375, 11.90576171875, 12.637939453125, 13.3701171875, 14.102294921875, 14.83447265625, 15.566650390625, 16.298828125, 17.031005859375, 17.76318359375, 18.495361328125, 19.2275390625, 19.959716796875, 20.69189453125, 21.424072265625, 22.15625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 16.0, 22.0, 23.0, 28.0, 44.0, 37.0, 26.0, 61.0, 55.0, 61.0, 44.0, 47.0, 50.0, 49.0, 59.0, 54.0, 52.0, 42.0, 34.0, 35.0, 22.0, 25.0, 20.0, 9.0, 10.0, 13.0, 10.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.984375, -17.385986328125, -16.78759765625, -16.189208984375, -15.5908203125, -14.992431640625, -14.39404296875, -13.795654296875, -13.197265625, -12.598876953125, -12.00048828125, -11.402099609375, -10.8037109375, -10.205322265625, -9.60693359375, -9.008544921875, -8.41015625, -7.811767578125, -7.21337890625, -6.614990234375, -6.0166015625, -5.418212890625, -4.81982421875, -4.221435546875, -3.623046875, -3.024658203125, -2.42626953125, -1.827880859375, -1.2294921875, -0.631103515625, -0.03271484375, 0.565673828125, 1.1640625, 1.762451171875, 2.36083984375, 2.959228515625, 3.5576171875, 4.156005859375, 4.75439453125, 5.352783203125, 5.951171875, 6.549560546875, 7.14794921875, 7.746337890625, 8.3447265625, 8.943115234375, 9.54150390625, 10.139892578125, 10.73828125, 11.336669921875, 11.93505859375, 12.533447265625, 13.1318359375, 13.730224609375, 14.32861328125, 14.927001953125, 15.525390625, 16.123779296875, 16.72216796875, 17.320556640625, 17.9189453125, 18.517333984375, 19.11572265625, 19.714111328125, 20.3125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 13.0, 26.0, 36.0, 42.0, 53.0, 86.0, 134.0, 205.0, 448.0, 985.0, 2988.0, 18795.0, 647429.0, 359052.0, 14020.0, 2409.0, 806.0, 418.0, 227.0, 109.0, 87.0, 57.0, 32.0, 27.0, 17.0, 10.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.83935546875, -31.5224609375, -30.20556640625, -28.888671875, -27.57177734375, -26.2548828125, -24.93798828125, -23.62109375, -22.30419921875, -20.9873046875, -19.67041015625, -18.353515625, -17.03662109375, -15.7197265625, -14.40283203125, -13.0859375, -11.76904296875, -10.4521484375, -9.13525390625, -7.818359375, -6.50146484375, -5.1845703125, -3.86767578125, -2.55078125, -1.23388671875, 0.0830078125, 1.39990234375, 2.716796875, 4.03369140625, 5.3505859375, 6.66748046875, 7.984375, 9.30126953125, 10.6181640625, 11.93505859375, 13.251953125, 14.56884765625, 15.8857421875, 17.20263671875, 18.51953125, 19.83642578125, 21.1533203125, 22.47021484375, 23.787109375, 25.10400390625, 26.4208984375, 27.73779296875, 29.0546875, 30.37158203125, 31.6884765625, 33.00537109375, 34.322265625, 35.63916015625, 36.9560546875, 38.27294921875, 39.58984375, 40.90673828125, 42.2236328125, 43.54052734375, 44.857421875, 46.17431640625, 47.4912109375, 48.80810546875, 50.125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 7.0, 16.0, 20.0, 23.0, 33.0, 41.0, 29.0, 79.0, 73.0, 102.0, 83.0, 98.0, 92.0, 60.0, 42.0, 29.0, 35.0, 27.0, 26.0, 18.0, 10.0, 6.0, 4.0, 8.0, 0.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.375, -71.69140625, -69.0078125, -66.32421875, -63.640625, -60.95703125, -58.2734375, -55.58984375, -52.90625, -50.22265625, -47.5390625, -44.85546875, -42.171875, -39.48828125, -36.8046875, -34.12109375, -31.4375, -28.75390625, -26.0703125, -23.38671875, -20.703125, -18.01953125, -15.3359375, -12.65234375, -9.96875, -7.28515625, -4.6015625, -1.91796875, 0.765625, 3.44921875, 6.1328125, 8.81640625, 11.5, 14.18359375, 16.8671875, 19.55078125, 22.234375, 24.91796875, 27.6015625, 30.28515625, 32.96875, 35.65234375, 38.3359375, 41.01953125, 43.703125, 46.38671875, 49.0703125, 51.75390625, 54.4375, 57.12109375, 59.8046875, 62.48828125, 65.171875, 67.85546875, 70.5390625, 73.22265625, 75.90625, 78.58984375, 81.2734375, 83.95703125, 86.640625, 89.32421875, 92.0078125, 94.69140625, 97.375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 1.0, 10.0, 11.0, 11.0, 12.0, 32.0, 41.0, 60.0, 129.0, 246.0, 539.0, 1708.0, 8848.0, 170716.0, 848523.0, 14102.0, 2247.0, 671.0, 292.0, 131.0, 64.0, 50.0, 41.0, 14.0, 13.0, 10.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.5897216796875, -6.370849609375, -6.1519775390625, -5.93310546875, -5.7142333984375, -5.495361328125, -5.2764892578125, -5.0576171875, -4.8387451171875, -4.619873046875, -4.4010009765625, -4.18212890625, -3.9632568359375, -3.744384765625, -3.5255126953125, -3.306640625, -3.0877685546875, -2.868896484375, -2.6500244140625, -2.43115234375, -2.2122802734375, -1.993408203125, -1.7745361328125, -1.5556640625, -1.3367919921875, -1.117919921875, -0.8990478515625, -0.68017578125, -0.4613037109375, -0.242431640625, -0.0235595703125, 0.1953125, 0.4141845703125, 0.633056640625, 0.8519287109375, 1.07080078125, 1.2896728515625, 1.508544921875, 1.7274169921875, 1.9462890625, 2.1651611328125, 2.384033203125, 2.6029052734375, 2.82177734375, 3.0406494140625, 3.259521484375, 3.4783935546875, 3.697265625, 3.9161376953125, 4.135009765625, 4.3538818359375, 4.57275390625, 4.7916259765625, 5.010498046875, 5.2293701171875, 5.4482421875, 5.6671142578125, 5.885986328125, 6.1048583984375, 6.32373046875, 6.5426025390625, 6.761474609375, 6.9803466796875, 7.19921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 9.0, 6.0, 10.0, 9.0, 16.0, 21.0, 23.0, 32.0, 42.0, 53.0, 60.0, 90.0, 94.0, 91.0, 82.0, 85.0, 73.0, 47.0, 21.0, 21.0, 26.0, 10.0, 10.0, 14.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008563995361328125, -0.0008327588438987732, -0.0008091181516647339, -0.0007854774594306946, -0.0007618367671966553, -0.000738196074962616, -0.0007145553827285767, -0.0006909146904945374, -0.000667273998260498, -0.0006436333060264587, -0.0006199926137924194, -0.0005963519215583801, -0.0005727112293243408, -0.0005490705370903015, -0.0005254298448562622, -0.0005017891526222229, -0.0004781484603881836, -0.0004545077681541443, -0.000430867075920105, -0.0004072263836860657, -0.00038358569145202637, -0.00035994499921798706, -0.00033630430698394775, -0.00031266361474990845, -0.00028902292251586914, -0.00026538223028182983, -0.00024174153804779053, -0.00021810084581375122, -0.00019446015357971191, -0.0001708194613456726, -0.0001471787691116333, -0.000123538076877594, -9.989738464355469e-05, -7.625669240951538e-05, -5.2616000175476074e-05, -2.8975307941436768e-05, -5.334615707397461e-06, 1.8306076526641846e-05, 4.194676876068115e-05, 6.558746099472046e-05, 8.922815322875977e-05, 0.00011286884546279907, 0.00013650953769683838, 0.00016015022993087769, 0.000183790922164917, 0.0002074316143989563, 0.0002310723066329956, 0.0002547129988670349, 0.0002783536911010742, 0.0003019943833351135, 0.00032563507556915283, 0.00034927576780319214, 0.00037291646003723145, 0.00039655715227127075, 0.00042019784450531006, 0.00044383853673934937, 0.00046747922897338867, 0.000491119921207428, 0.0005147606134414673, 0.0005384013056755066, 0.0005620419979095459, 0.0005856826901435852, 0.0006093233823776245, 0.0006329640746116638, 0.0006566047668457031]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 14.0, 19.0, 30.0, 52.0, 69.0, 111.0, 200.0, 326.0, 565.0, 1187.0, 2597.0, 7025.0, 23391.0, 154762.0, 780903.0, 56076.0, 12888.0, 4442.0, 1932.0, 773.0, 469.0, 255.0, 150.0, 89.0, 60.0, 43.0, 30.0, 15.0, 9.0, 15.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5543212890625, -3.440673828125, -3.3270263671875, -3.21337890625, -3.0997314453125, -2.986083984375, -2.8724365234375, -2.7587890625, -2.6451416015625, -2.531494140625, -2.4178466796875, -2.30419921875, -2.1905517578125, -2.076904296875, -1.9632568359375, -1.849609375, -1.7359619140625, -1.622314453125, -1.5086669921875, -1.39501953125, -1.2813720703125, -1.167724609375, -1.0540771484375, -0.9404296875, -0.8267822265625, -0.713134765625, -0.5994873046875, -0.48583984375, -0.3721923828125, -0.258544921875, -0.1448974609375, -0.03125, 0.0823974609375, 0.196044921875, 0.3096923828125, 0.42333984375, 0.5369873046875, 0.650634765625, 0.7642822265625, 0.8779296875, 0.9915771484375, 1.105224609375, 1.2188720703125, 1.33251953125, 1.4461669921875, 1.559814453125, 1.6734619140625, 1.787109375, 1.9007568359375, 2.014404296875, 2.1280517578125, 2.24169921875, 2.3553466796875, 2.468994140625, 2.5826416015625, 2.6962890625, 2.8099365234375, 2.923583984375, 3.0372314453125, 3.15087890625, 3.2645263671875, 3.378173828125, 3.4918212890625, 3.60546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 0.0, 11.0, 6.0, 8.0, 8.0, 11.0, 7.0, 17.0, 22.0, 23.0, 61.0, 85.0, 133.0, 167.0, 126.0, 98.0, 56.0, 48.0, 25.0, 20.0, 10.0, 16.0, 10.0, 14.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73651123046875, -5.5433349609375, -5.35015869140625, -5.156982421875, -4.96380615234375, -4.7706298828125, -4.57745361328125, -4.38427734375, -4.19110107421875, -3.9979248046875, -3.80474853515625, -3.611572265625, -3.41839599609375, -3.2252197265625, -3.03204345703125, -2.8388671875, -2.64569091796875, -2.4525146484375, -2.25933837890625, -2.066162109375, -1.87298583984375, -1.6798095703125, -1.48663330078125, -1.29345703125, -1.10028076171875, -0.9071044921875, -0.71392822265625, -0.520751953125, -0.32757568359375, -0.1343994140625, 0.05877685546875, 0.251953125, 0.44512939453125, 0.6383056640625, 0.83148193359375, 1.024658203125, 1.21783447265625, 1.4110107421875, 1.60418701171875, 1.79736328125, 1.99053955078125, 2.1837158203125, 2.37689208984375, 2.570068359375, 2.76324462890625, 2.9564208984375, 3.14959716796875, 3.3427734375, 3.53594970703125, 3.7291259765625, 3.92230224609375, 4.115478515625, 4.30865478515625, 4.5018310546875, 4.69500732421875, 4.88818359375, 5.08135986328125, 5.2745361328125, 5.46771240234375, 5.660888671875, 5.85406494140625, 6.0472412109375, 6.24041748046875, 6.43359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 33.0, 65.0, 280.0, 453.0, 97.0, 29.0, 14.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-443.47271728515625, -431.5397033691406, -419.6067199707031, -407.6737060546875, -395.7406921386719, -383.80767822265625, -371.87469482421875, -359.9416809082031, -348.0086669921875, -336.0756530761719, -324.1426696777344, -312.20965576171875, -300.2766418457031, -288.3436279296875, -276.41064453125, -264.4776306152344, -252.54464721679688, -240.6116485595703, -228.6786346435547, -216.74563598632812, -204.8126220703125, -192.87962341308594, -180.94662475585938, -169.01361083984375, -157.0806121826172, -145.14761352539062, -133.214599609375, -121.28160095214844, -109.34859466552734, -97.41558837890625, -85.48258972167969, -73.5495834350586, -61.616607666015625, -49.68360137939453, -37.7505989074707, -25.817596435546875, -13.884590148925781, -1.9515838623046875, 9.981414794921875, 21.91442108154297, 33.84742736816406, 45.780433654785156, 57.713436126708984, 69.64643859863281, 81.5794448852539, 93.512451171875, 105.44544982910156, 117.37845611572266, 129.31146240234375, 141.2444610595703, 153.17747497558594, 165.1104736328125, 177.04348754882812, 188.9764862060547, 200.90948486328125, 212.84249877929688, 224.77549743652344, 236.70849609375, 248.64151000976562, 260.57452392578125, 272.50750732421875, 284.4405212402344, 296.37353515625, 308.3065185546875, 320.2395324707031]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 5.0, 11.0, 13.0, 12.0, 17.0, 17.0, 18.0, 17.0, 26.0, 18.0, 37.0, 126.0, 123.0, 59.0, 109.0, 154.0, 35.0, 23.0, 33.0, 22.0, 19.0, 15.0, 24.0, 15.0, 9.0, 8.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-227.55841064453125, -220.78248596191406, -214.00656127929688, -207.23065185546875, -200.45472717285156, -193.67880249023438, -186.9028778076172, -180.126953125, -173.35104370117188, -166.5751190185547, -159.7991943359375, -153.02328491210938, -146.2473602294922, -139.471435546875, -132.6955108642578, -125.91959381103516, -119.14366912841797, -112.36774444580078, -105.59182739257812, -98.81590270996094, -92.03998565673828, -85.2640609741211, -78.48814392089844, -71.71221923828125, -64.93629455566406, -58.16037368774414, -51.38445281982422, -44.60852813720703, -37.832611083984375, -31.056686401367188, -24.280765533447266, -17.504844665527344, -10.728927612304688, -3.9530062675476074, 2.8229150772094727, 9.598836898803711, 16.374757766723633, 23.150680541992188, 29.92660140991211, 36.70252227783203, 43.47844314575195, 50.254364013671875, 57.0302848815918, 63.80620574951172, 70.5821304321289, 77.35804748535156, 84.13397216796875, 90.90989685058594, 97.6858139038086, 104.46173858642578, 111.23765563964844, 118.01358032226562, 124.78949737548828, 131.5654296875, 138.34133911132812, 145.1172637939453, 151.8931884765625, 158.6691131591797, 165.44503784179688, 172.220947265625, 178.9968719482422, 185.77279663085938, 192.54872131347656, 199.32464599609375, 206.10055541992188]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 8.0, 8.0, 5.0, 15.0, 18.0, 19.0, 23.0, 25.0, 21.0, 43.0, 32.0, 37.0, 62.0, 216.0, 182.0, 56.0, 44.0, 29.0, 20.0, 24.0, 19.0, 16.0, 20.0, 16.0, 7.0, 13.0, 5.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.8740234375, -16.310546875, -15.7470703125, -15.18359375, -14.6201171875, -14.056640625, -13.4931640625, -12.9296875, -12.3662109375, -11.802734375, -11.2392578125, -10.67578125, -10.1123046875, -9.548828125, -8.9853515625, -8.421875, -7.8583984375, -7.294921875, -6.7314453125, -6.16796875, -5.6044921875, -5.041015625, -4.4775390625, -3.9140625, -3.3505859375, -2.787109375, -2.2236328125, -1.66015625, -1.0966796875, -0.533203125, 0.0302734375, 0.59375, 1.1572265625, 1.720703125, 2.2841796875, 2.84765625, 3.4111328125, 3.974609375, 4.5380859375, 5.1015625, 5.6650390625, 6.228515625, 6.7919921875, 7.35546875, 7.9189453125, 8.482421875, 9.0458984375, 9.609375, 10.1728515625, 10.736328125, 11.2998046875, 11.86328125, 12.4267578125, 12.990234375, 13.5537109375, 14.1171875, 14.6806640625, 15.244140625, 15.8076171875, 16.37109375, 16.9345703125, 17.498046875, 18.0615234375, 18.625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 3.0, 8.0, 14.0, 15.0, 18.0, 18.0, 27.0, 28.0, 46.0, 93.0, 232.0, 562.0, 2174.0, 17322.0, 8354671.0, 10760.0, 1648.0, 466.0, 205.0, 96.0, 55.0, 18.0, 26.0, 20.0, 14.0, 6.0, 11.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-205.54661560058594, -199.00250244140625, -192.45838928222656, -185.91427612304688, -179.3701629638672, -172.8260498046875, -166.28192138671875, -159.73782348632812, -153.19369506835938, -146.6495819091797, -140.10546875, -133.5613555908203, -127.01724243164062, -120.47312927246094, -113.92900848388672, -107.38489532470703, -100.84078979492188, -94.29667663574219, -87.7525634765625, -81.20845031738281, -74.66433715820312, -68.12022399902344, -61.57610321044922, -55.03199005126953, -48.487876892089844, -41.943763732910156, -35.39965057373047, -28.855533599853516, -22.311420440673828, -15.76730728149414, -9.223190307617188, -2.6790771484375, 3.865020751953125, 10.409134864807129, 16.953248977661133, 23.497364044189453, 30.04147720336914, 36.58559036254883, 43.12970733642578, 49.67382049560547, 56.217933654785156, 62.762046813964844, 69.30615997314453, 75.85028076171875, 82.39439392089844, 88.93850708007812, 95.48262023925781, 102.0267333984375, 108.57084655761719, 115.11495971679688, 121.65907287597656, 128.20318603515625, 134.74729919433594, 141.29141235351562, 147.83554077148438, 154.379638671875, 160.92376708984375, 167.46788024902344, 174.01199340820312, 180.5561065673828, 187.1002197265625, 193.6443328857422, 200.18844604492188, 206.73257446289062, 213.27667236328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-186.46343994140625, -180.51824951171875, -174.5730743408203, -168.6278839111328, -162.68270874023438, -156.73751831054688, -150.79232788085938, -144.84715270996094, -138.90196228027344, -132.95677185058594, -127.0115966796875, -121.06640625, -115.12122344970703, -109.17604064941406, -103.2308578491211, -97.28567504882812, -91.34049224853516, -85.39530944824219, -79.45012664794922, -73.50494384765625, -67.55975341796875, -61.61457061767578, -55.66938781738281, -49.72420120239258, -43.77901840209961, -37.83383560180664, -31.888648986816406, -25.943466186523438, -19.998281478881836, -14.053096771240234, -8.107913970947266, -2.1627273559570312, 3.7824554443359375, 9.727640151977539, 15.672823905944824, 21.61800765991211, 27.56319236755371, 33.50837707519531, 39.45355987548828, 45.398746490478516, 51.343929290771484, 57.28911209106445, 63.23429870605469, 69.17948150634766, 75.12466430664062, 81.06985473632812, 87.01502990722656, 92.96022033691406, 98.90540313720703, 104.8505859375, 110.79576873779297, 116.74095153808594, 122.68614196777344, 128.63131713867188, 134.57650756835938, 140.52169799804688, 146.4668731689453, 152.4120635986328, 158.35723876953125, 164.30242919921875, 170.2476043701172, 176.1927947998047, 182.13796997070312, 188.08316040039062, 194.02835083007812]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 9.0, 15.0, 22.0, 35.0, 56.0, 79.0, 109.0, 200.0, 277.0, 471.0, 821.0, 1544.0, 2840.0, 5131.0, 9703.0, 18230.0, 34522.0, 65765.0, 112609.0, 117542.0, 72353.0, 38075.0, 20099.0, 10735.0, 5643.0, 3206.0, 1728.0, 933.0, 517.0, 380.0, 216.0, 143.0, 77.0, 48.0, 38.0, 24.0, 23.0, 15.0, 1.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.5625, -80.2734375, -77.984375, -75.6953125, -73.40625, -71.1171875, -68.828125, -66.5390625, -64.25, -61.9609375, -59.671875, -57.3828125, -55.09375, -52.8046875, -50.515625, -48.2265625, -45.9375, -43.6484375, -41.359375, -39.0703125, -36.78125, -34.4921875, -32.203125, -29.9140625, -27.625, -25.3359375, -23.046875, -20.7578125, -18.46875, -16.1796875, -13.890625, -11.6015625, -9.3125, -7.0234375, -4.734375, -2.4453125, -0.15625, 2.1328125, 4.421875, 6.7109375, 9.0, 11.2890625, 13.578125, 15.8671875, 18.15625, 20.4453125, 22.734375, 25.0234375, 27.3125, 29.6015625, 31.890625, 34.1796875, 36.46875, 38.7578125, 41.046875, 43.3359375, 45.625, 47.9140625, 50.203125, 52.4921875, 54.78125, 57.0703125, 59.359375, 61.6484375, 63.9375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 15.0, 21.0, 31.0, 26.0, 39.0, 45.0, 51.0, 62.0, 79.0, 63.0, 55.0, 62.0, 68.0, 66.0, 54.0, 53.0, 33.0, 33.0, 19.0, 19.0, 11.0, 15.0, 9.0, 4.0, 6.0, 9.0, 3.0, 9.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.6123046875, -16.990234375, -16.3681640625, -15.74609375, -15.1240234375, -14.501953125, -13.8798828125, -13.2578125, -12.6357421875, -12.013671875, -11.3916015625, -10.76953125, -10.1474609375, -9.525390625, -8.9033203125, -8.28125, -7.6591796875, -7.037109375, -6.4150390625, -5.79296875, -5.1708984375, -4.548828125, -3.9267578125, -3.3046875, -2.6826171875, -2.060546875, -1.4384765625, -0.81640625, -0.1943359375, 0.427734375, 1.0498046875, 1.671875, 2.2939453125, 2.916015625, 3.5380859375, 4.16015625, 4.7822265625, 5.404296875, 6.0263671875, 6.6484375, 7.2705078125, 7.892578125, 8.5146484375, 9.13671875, 9.7587890625, 10.380859375, 11.0029296875, 11.625, 12.2470703125, 12.869140625, 13.4912109375, 14.11328125, 14.7353515625, 15.357421875, 15.9794921875, 16.6015625, 17.2236328125, 17.845703125, 18.4677734375, 19.08984375, 19.7119140625, 20.333984375, 20.9560546875, 21.578125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 17.0, 19.0, 21.0, 30.0, 49.0, 72.0, 62.0, 64.0, 39.0, 35.0, 15.0, 15.0, 9.0, 10.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.70374298095703, -110.53536987304688, -107.36700439453125, -104.1986312866211, -101.03025817871094, -97.86189270019531, -94.69351959228516, -91.525146484375, -88.35678100585938, -85.18840789794922, -82.0200424194336, -78.85166931152344, -75.68330383300781, -72.51493072509766, -69.3465576171875, -66.17819213867188, -63.00981903076172, -59.84144973754883, -56.67308044433594, -53.50470733642578, -50.33633804321289, -47.16796875, -43.999595642089844, -40.83122634887695, -37.66285705566406, -34.49448776245117, -31.32611656188965, -28.157745361328125, -24.989376068115234, -21.821006774902344, -18.65263557434082, -15.484264373779297, -12.315902709960938, -9.14753246307373, -5.979162216186523, -2.8107919692993164, 0.3575782775878906, 3.5259485244750977, 6.694318771362305, 9.862689971923828, 13.031059265136719, 16.19942855834961, 19.367799758911133, 22.536170959472656, 25.704540252685547, 28.872909545898438, 32.041282653808594, 35.209651947021484, 38.378021240234375, 41.546390533447266, 44.714759826660156, 47.88313293457031, 51.0515022277832, 54.219871520996094, 57.38824462890625, 60.55661392211914, 63.72498321533203, 66.89335632324219, 70.06172180175781, 73.23009490966797, 76.39846801757812, 79.56683349609375, 82.7352066040039, 85.90357971191406, 89.07194519042969]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 12.0, 30.0, 55.0, 74.0, 85.0, 58.0, 39.0, 24.0, 16.0, 8.0, 4.0, 6.0, 7.0, 7.0, 2.0, 2.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.78057098388672, -66.1164321899414, -63.452293395996094, -60.78815460205078, -58.12401580810547, -55.459877014160156, -52.795738220214844, -50.13159942626953, -47.46746063232422, -44.803321838378906, -42.139183044433594, -39.47504425048828, -36.81090545654297, -34.146766662597656, -31.482627868652344, -28.81848907470703, -26.15435028076172, -23.490211486816406, -20.826072692871094, -18.16193389892578, -15.497795104980469, -12.833656311035156, -10.169517517089844, -7.505378723144531, -4.841239929199219, -2.1771011352539062, 0.48703765869140625, 3.1511764526367188, 5.815315246582031, 8.479454040527344, 11.143592834472656, 13.807731628417969, 16.47186279296875, 19.136001586914062, 21.800140380859375, 24.464279174804688, 27.12841796875, 29.792556762695312, 32.456695556640625, 35.12083435058594, 37.78497314453125, 40.44911193847656, 43.113250732421875, 45.77738952636719, 48.4415283203125, 51.10566711425781, 53.769805908203125, 56.43394470214844, 59.09808349609375, 61.76222229003906, 64.42636108398438, 67.09049987792969, 69.754638671875, 72.41877746582031, 75.08291625976562, 77.74705505371094, 80.41119384765625, 83.07533264160156, 85.73947143554688, 88.40361022949219, 91.0677490234375, 93.73188781738281, 96.39602661132812, 99.06016540527344, 101.72430419921875]}, "eval/loss": 0.9485552906990051, "eval/wer": 0.11520527015496954, "eval/runtime": 942.9186, "eval/samples_per_second": 2.802, "eval/steps_per_second": 0.351, "train/train_runtime": 116020.8621, "train/train_samples_per_second": 4.919, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 2.37383288616657} \ No newline at end of file