diff --git "a/wandb/run-20220306_154329-3378nr4g/files/wandb-summary.json" "b/wandb/run-20220306_154329-3378nr4g/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220306_154329-3378nr4g/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 7.6909, "train/learning_rate": 6e-06, "train/epoch": 0.78, "train/global_step": 200, "_runtime": 3619, "_timestamp": 1646585028, "_step": 199, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 53.0, 0.0, 0.0, 1.0, 0.0, 0.0, 30458.0], "bins": [-964.5, -949.20166015625, -933.9033203125, -918.60498046875, -903.306640625, -888.00830078125, -872.7099609375, -857.41162109375, -842.11328125, -826.81494140625, -811.5166015625, -796.21826171875, -780.919921875, -765.62158203125, -750.3232421875, -735.02490234375, -719.7265625, -704.42822265625, -689.1298828125, -673.83154296875, -658.533203125, -643.23486328125, -627.9365234375, -612.63818359375, -597.33984375, -582.04150390625, -566.7431640625, -551.44482421875, -536.146484375, -520.84814453125, -505.5498046875, -490.25146484375, -474.953125, -459.65478515625, -444.3564453125, -429.05810546875, -413.759765625, -398.46142578125, -383.1630859375, -367.86474609375, -352.56640625, -337.26806640625, -321.9697265625, -306.67138671875, -291.373046875, -276.07470703125, -260.7763671875, -245.47802734375, -230.1796875, -214.88134765625, -199.5830078125, -184.28466796875, -168.986328125, -153.68798828125, -138.3896484375, -123.09130859375, -107.79296875, -92.49462890625, -77.1962890625, -61.89794921875, -46.599609375, -31.30126953125, -16.0029296875, -0.70458984375, 14.59375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 6.0, 10.0, 9.0, 9.0, 12.0, 6.0, 26.0, 15.0, 25.0, 29.0, 38.0, 44.0, 39.0, 36.0, 34.0, 56.0, 48.0, 77.0, 85.0, 104.0, 86.0, 51.0, 47.0, 31.0, 21.0, 7.0, 10.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.7496795654297, -160.185302734375, -156.6209259033203, -153.0565643310547, -149.4921875, -145.9278106689453, -142.36343383789062, -138.79905700683594, -135.23468017578125, -131.67030334472656, -128.10592651367188, -124.54155731201172, -120.97718811035156, -117.41281127929688, -113.84843444824219, -110.2840576171875, -106.71969604492188, -103.15531921386719, -99.59095001220703, -96.02657318115234, -92.46220397949219, -88.8978271484375, -85.33345031738281, -81.76907348632812, -78.20470428466797, -74.64032745361328, -71.07595825195312, -67.51158142089844, -63.947208404541016, -60.382835388183594, -56.818458557128906, -53.254085540771484, -49.689720153808594, -46.12534713745117, -42.56097412109375, -38.99659729003906, -35.43222427368164, -31.86785125732422, -28.303476333618164, -24.73910140991211, -21.174728393554688, -17.610355377197266, -14.045980453491211, -10.481606483459473, -6.917232513427734, -3.3528594970703125, 0.2115154266357422, 3.775890350341797, 7.340263366699219, 10.904637336730957, 14.469011306762695, 18.03338623046875, 21.597759246826172, 25.162132263183594, 28.72650718688965, 32.2908821105957, 35.855255126953125, 39.41962814331055, 42.98400115966797, 46.548377990722656, 50.11275100708008, 53.6771240234375, 57.24150085449219, 60.80587387084961, 64.37024688720703]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 3.0, 7.0, 6.0, 3.0, 3.0, 9.0, 6.0, 9.0, 13.0, 11.0, 13.0, 18.0, 15.0, 15.0, 25.0, 16.0, 29.0, 20.0, 40.0, 35.0, 41.0, 38.0, 31.0, 33.0, 30.0, 40.0, 32.0, 44.0, 30.0, 43.0, 33.0, 34.0, 32.0, 27.0, 17.0, 19.0, 27.0, 27.0, 14.0, 28.0, 13.0, 15.0, 16.0, 15.0, 12.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.77153778076172, -63.26768493652344, -60.763832092285156, -58.259979248046875, -55.756126403808594, -53.25227355957031, -50.7484245300293, -48.244571685791016, -45.740718841552734, -43.23686599731445, -40.73301315307617, -38.22916030883789, -35.725311279296875, -33.221458435058594, -30.717605590820312, -28.21375274658203, -25.70989990234375, -23.20604705810547, -20.702194213867188, -18.19834327697754, -15.694490432739258, -13.190637588500977, -10.686785697937012, -8.182933807373047, -5.679080963134766, -3.1752285957336426, -0.6713762283325195, 1.8324761390686035, 4.336328506469727, 6.840181350708008, 9.344033241271973, 11.847885131835938, 14.351730346679688, 16.85558319091797, 19.35943603515625, 21.8632869720459, 24.36713981628418, 26.87099266052246, 29.37484359741211, 31.87869644165039, 34.38254928588867, 36.88640213012695, 39.390254974365234, 41.894107818603516, 44.39795684814453, 46.90180969238281, 49.405662536621094, 51.909515380859375, 54.413368225097656, 56.91722106933594, 59.42107391357422, 61.9249267578125, 64.42877960205078, 66.93263244628906, 69.43648529052734, 71.94033813476562, 74.44418334960938, 76.94803619384766, 79.45188903808594, 81.95574188232422, 84.4595947265625, 86.96344757080078, 89.46730041503906, 91.97114562988281, 94.47500610351562]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 7.0, 18.0, 17.0, 32.0, 33.0, 52.0, 68.0, 100.0, 107.0, 201.0, 282.0, 403.0, 559.0, 884.0, 1328.0, 2039.0, 3091.0, 4552.0, 7412.0, 11974.0, 19535.0, 33173.0, 63679.0, 161088.0, 489862.0, 119427.0, 52931.0, 29118.0, 17133.0, 10477.0, 6571.0, 4177.0, 2646.0, 1868.0, 1221.0, 779.0, 520.0, 340.0, 239.0, 209.0, 132.0, 77.0, 60.0, 47.0, 26.0, 23.0, 10.0, 10.0, 9.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-493.75, -476.34765625, -458.9453125, -441.54296875, -424.140625, -406.73828125, -389.3359375, -371.93359375, -354.53125, -337.12890625, -319.7265625, -302.32421875, -284.921875, -267.51953125, -250.1171875, -232.71484375, -215.3125, -197.91015625, -180.5078125, -163.10546875, -145.703125, -128.30078125, -110.8984375, -93.49609375, -76.09375, -58.69140625, -41.2890625, -23.88671875, -6.484375, 10.91796875, 28.3203125, 45.72265625, 63.125, 80.52734375, 97.9296875, 115.33203125, 132.734375, 150.13671875, 167.5390625, 184.94140625, 202.34375, 219.74609375, 237.1484375, 254.55078125, 271.953125, 289.35546875, 306.7578125, 324.16015625, 341.5625, 358.96484375, 376.3671875, 393.76953125, 411.171875, 428.57421875, 445.9765625, 463.37890625, 480.78125, 498.18359375, 515.5859375, 532.98828125, 550.390625, 567.79296875, 585.1953125, 602.59765625, 620.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 11.0, 8.0, 11.0, 8.0, 11.0, 7.0, 8.0, 13.0, 13.0, 20.0, 18.0, 20.0, 41.0, 23.0, 50.0, 39.0, 56.0, 124.0, 133.0, 75.0, 60.0, 24.0, 27.0, 31.0, 23.0, 18.0, 13.0, 19.0, 19.0, 13.0, 18.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.375, -126.509765625, -121.64453125, -116.779296875, -111.9140625, -107.048828125, -102.18359375, -97.318359375, -92.453125, -87.587890625, -82.72265625, -77.857421875, -72.9921875, -68.126953125, -63.26171875, -58.396484375, -53.53125, -48.666015625, -43.80078125, -38.935546875, -34.0703125, -29.205078125, -24.33984375, -19.474609375, -14.609375, -9.744140625, -4.87890625, -0.013671875, 4.8515625, 9.716796875, 14.58203125, 19.447265625, 24.3125, 29.177734375, 34.04296875, 38.908203125, 43.7734375, 48.638671875, 53.50390625, 58.369140625, 63.234375, 68.099609375, 72.96484375, 77.830078125, 82.6953125, 87.560546875, 92.42578125, 97.291015625, 102.15625, 107.021484375, 111.88671875, 116.751953125, 121.6171875, 126.482421875, 131.34765625, 136.212890625, 141.078125, 145.943359375, 150.80859375, 155.673828125, 160.5390625, 165.404296875, 170.26953125, 175.134765625, 180.0]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 3.0, 9.0, 5.0, 5.0, 11.0, 13.0, 19.0, 27.0, 37.0, 57.0, 85.0, 107.0, 159.0, 146.0, 87.0, 67.0, 37.0, 25.0, 20.0, 25.0, 13.0, 14.0, 6.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.96563720703125, -140.23910522460938, -135.51258850097656, -130.78607177734375, -126.05953979492188, -121.33301544189453, -116.60649108886719, -111.87996673583984, -107.1534423828125, -102.42691802978516, -97.70039367675781, -92.97386932373047, -88.24734497070312, -83.52082061767578, -78.79429626464844, -74.0677719116211, -69.34124755859375, -64.6147232055664, -59.88819885253906, -55.16167449951172, -50.435150146484375, -45.70862579345703, -40.98210144042969, -36.255577087402344, -31.529052734375, -26.802528381347656, -22.076004028320312, -17.34947967529297, -12.622955322265625, -7.896430969238281, -3.1699066162109375, 1.5566177368164062, 6.2831268310546875, 11.009651184082031, 15.736175537109375, 20.46269989013672, 25.189224243164062, 29.915748596191406, 34.64227294921875, 39.368797302246094, 44.09532165527344, 48.82184600830078, 53.548370361328125, 58.27489471435547, 63.00141906738281, 67.72794342041016, 72.4544677734375, 77.18099212646484, 81.90751647949219, 86.63404083251953, 91.36056518554688, 96.08708953857422, 100.81361389160156, 105.5401382446289, 110.26666259765625, 114.9931869506836, 119.71971130371094, 124.44623565673828, 129.17276000976562, 133.8992919921875, 138.6258087158203, 143.35232543945312, 148.078857421875, 152.80538940429688, 157.5319061279297]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 5.0, 7.0, 8.0, 12.0, 13.0, 11.0, 16.0, 10.0, 17.0, 32.0, 34.0, 29.0, 33.0, 32.0, 44.0, 39.0, 30.0, 51.0, 35.0, 42.0, 43.0, 33.0, 41.0, 34.0, 40.0, 31.0, 25.0, 37.0, 25.0, 38.0, 27.0, 23.0, 10.0, 13.0, 10.0, 7.0, 13.0, 7.0, 12.0, 3.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-74.86651611328125, -72.51985168457031, -70.1731948852539, -67.82653045654297, -65.47987365722656, -63.133209228515625, -60.78654861450195, -58.43988800048828, -56.09322738647461, -53.74656677246094, -51.399906158447266, -49.053245544433594, -46.706581115722656, -44.35992431640625, -42.01325988769531, -39.66659927368164, -37.31993865966797, -34.9732780456543, -32.626617431640625, -30.27995491027832, -27.93329429626465, -25.586633682250977, -23.239971160888672, -20.893310546875, -18.546649932861328, -16.199989318847656, -13.853327751159668, -11.50666618347168, -9.160005569458008, -6.813344955444336, -4.466683387756348, -2.1200218200683594, 0.2266387939453125, 2.5732998847961426, 4.919960975646973, 7.266622066497803, 9.613283157348633, 11.959943771362305, 14.306605339050293, 16.65326690673828, 18.999927520751953, 21.346588134765625, 23.693248748779297, 26.0399112701416, 28.386571884155273, 30.733232498168945, 33.07989501953125, 35.42655563354492, 37.773216247558594, 40.119876861572266, 42.46653747558594, 44.81319808959961, 47.15985870361328, 49.50652313232422, 51.85318374633789, 54.19984436035156, 56.546504974365234, 58.893165588378906, 61.23982620239258, 63.58648681640625, 65.93315124511719, 68.2798080444336, 70.62647247314453, 72.97312927246094, 75.31979370117188]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 6.0, 6.0, 13.0, 19.0, 23.0, 39.0, 43.0, 71.0, 112.0, 163.0, 231.0, 333.0, 475.0, 736.0, 1109.0, 1681.0, 2595.0, 3957.0, 6094.0, 9674.0, 15378.0, 24724.0, 41699.0, 72919.0, 153500.0, 627137.0, 2201205.0, 697072.0, 150852.0, 72512.0, 41199.0, 24700.0, 15232.0, 9700.0, 6412.0, 4140.0, 2852.0, 1898.0, 1231.0, 821.0, 569.0, 397.0, 264.0, 159.0, 106.0, 80.0, 55.0, 29.0, 27.0, 14.0, 9.0, 6.0, 5.0, 0.0, 3.0], "bins": [-143.25, -139.2177734375, -135.185546875, -131.1533203125, -127.12109375, -123.0888671875, -119.056640625, -115.0244140625, -110.9921875, -106.9599609375, -102.927734375, -98.8955078125, -94.86328125, -90.8310546875, -86.798828125, -82.7666015625, -78.734375, -74.7021484375, -70.669921875, -66.6376953125, -62.60546875, -58.5732421875, -54.541015625, -50.5087890625, -46.4765625, -42.4443359375, -38.412109375, -34.3798828125, -30.34765625, -26.3154296875, -22.283203125, -18.2509765625, -14.21875, -10.1865234375, -6.154296875, -2.1220703125, 1.91015625, 5.9423828125, 9.974609375, 14.0068359375, 18.0390625, 22.0712890625, 26.103515625, 30.1357421875, 34.16796875, 38.2001953125, 42.232421875, 46.2646484375, 50.296875, 54.3291015625, 58.361328125, 62.3935546875, 66.42578125, 70.4580078125, 74.490234375, 78.5224609375, 82.5546875, 86.5869140625, 90.619140625, 94.6513671875, 98.68359375, 102.7158203125, 106.748046875, 110.7802734375, 114.8125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 4.0, 7.0, 12.0, 11.0, 8.0, 10.0, 17.0, 20.0, 22.0, 25.0, 23.0, 31.0, 43.0, 23.0, 40.0, 36.0, 46.0, 42.0, 36.0, 47.0, 40.0, 50.0, 36.0, 40.0, 42.0, 25.0, 33.0, 37.0, 32.0, 23.0, 23.0, 20.0, 12.0, 12.0, 11.0, 11.0, 8.0, 9.0, 9.0, 4.0, 5.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-65.3125, -63.49560546875, -61.6787109375, -59.86181640625, -58.044921875, -56.22802734375, -54.4111328125, -52.59423828125, -50.77734375, -48.96044921875, -47.1435546875, -45.32666015625, -43.509765625, -41.69287109375, -39.8759765625, -38.05908203125, -36.2421875, -34.42529296875, -32.6083984375, -30.79150390625, -28.974609375, -27.15771484375, -25.3408203125, -23.52392578125, -21.70703125, -19.89013671875, -18.0732421875, -16.25634765625, -14.439453125, -12.62255859375, -10.8056640625, -8.98876953125, -7.171875, -5.35498046875, -3.5380859375, -1.72119140625, 0.095703125, 1.91259765625, 3.7294921875, 5.54638671875, 7.36328125, 9.18017578125, 10.9970703125, 12.81396484375, 14.630859375, 16.44775390625, 18.2646484375, 20.08154296875, 21.8984375, 23.71533203125, 25.5322265625, 27.34912109375, 29.166015625, 30.98291015625, 32.7998046875, 34.61669921875, 36.43359375, 38.25048828125, 40.0673828125, 41.88427734375, 43.701171875, 45.51806640625, 47.3349609375, 49.15185546875, 50.96875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 1.0, 6.0, 9.0, 13.0, 15.0, 31.0, 27.0, 58.0, 80.0, 112.0, 171.0, 252.0, 381.0, 554.0, 931.0, 1500.0, 2369.0, 3613.0, 6097.0, 10098.0, 17595.0, 31357.0, 60253.0, 123375.0, 295022.0, 1280494.0, 1746718.0, 332823.0, 135129.0, 64747.0, 33797.0, 18846.0, 10823.0, 6387.0, 3791.0, 2414.0, 1536.0, 966.0, 659.0, 400.0, 272.0, 200.0, 118.0, 80.0, 53.0, 42.0, 21.0, 22.0, 15.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-130.5, -126.158203125, -121.81640625, -117.474609375, -113.1328125, -108.791015625, -104.44921875, -100.107421875, -95.765625, -91.423828125, -87.08203125, -82.740234375, -78.3984375, -74.056640625, -69.71484375, -65.373046875, -61.03125, -56.689453125, -52.34765625, -48.005859375, -43.6640625, -39.322265625, -34.98046875, -30.638671875, -26.296875, -21.955078125, -17.61328125, -13.271484375, -8.9296875, -4.587890625, -0.24609375, 4.095703125, 8.4375, 12.779296875, 17.12109375, 21.462890625, 25.8046875, 30.146484375, 34.48828125, 38.830078125, 43.171875, 47.513671875, 51.85546875, 56.197265625, 60.5390625, 64.880859375, 69.22265625, 73.564453125, 77.90625, 82.248046875, 86.58984375, 90.931640625, 95.2734375, 99.615234375, 103.95703125, 108.298828125, 112.640625, 116.982421875, 121.32421875, 125.666015625, 130.0078125, 134.349609375, 138.69140625, 143.033203125, 147.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 1.0, 8.0, 16.0, 3.0, 8.0, 13.0, 19.0, 26.0, 21.0, 28.0, 48.0, 69.0, 69.0, 88.0, 110.0, 140.0, 180.0, 250.0, 331.0, 602.0, 593.0, 313.0, 251.0, 186.0, 122.0, 105.0, 94.0, 67.0, 75.0, 41.0, 38.0, 29.0, 27.0, 21.0, 19.0, 19.0, 8.0, 6.0, 11.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.96875, -35.7373046875, -34.505859375, -33.2744140625, -32.04296875, -30.8115234375, -29.580078125, -28.3486328125, -27.1171875, -25.8857421875, -24.654296875, -23.4228515625, -22.19140625, -20.9599609375, -19.728515625, -18.4970703125, -17.265625, -16.0341796875, -14.802734375, -13.5712890625, -12.33984375, -11.1083984375, -9.876953125, -8.6455078125, -7.4140625, -6.1826171875, -4.951171875, -3.7197265625, -2.48828125, -1.2568359375, -0.025390625, 1.2060546875, 2.4375, 3.6689453125, 4.900390625, 6.1318359375, 7.36328125, 8.5947265625, 9.826171875, 11.0576171875, 12.2890625, 13.5205078125, 14.751953125, 15.9833984375, 17.21484375, 18.4462890625, 19.677734375, 20.9091796875, 22.140625, 23.3720703125, 24.603515625, 25.8349609375, 27.06640625, 28.2978515625, 29.529296875, 30.7607421875, 31.9921875, 33.2236328125, 34.455078125, 35.6865234375, 36.91796875, 38.1494140625, 39.380859375, 40.6123046875, 41.84375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 6.0, 4.0, 11.0, 8.0, 21.0, 24.0, 24.0, 39.0, 40.0, 91.0, 120.0, 155.0, 123.0, 99.0, 66.0, 43.0, 28.0, 30.0, 12.0, 18.0, 6.0, 9.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.23155975341797, -89.43646240234375, -85.641357421875, -81.84625244140625, -78.05115509033203, -74.25605773925781, -70.46095275878906, -66.66584777832031, -62.870750427246094, -59.07564926147461, -55.280548095703125, -51.48544692993164, -47.690345764160156, -43.89524459838867, -40.10014343261719, -36.3050422668457, -32.50994110107422, -28.714839935302734, -24.91973876953125, -21.124637603759766, -17.32953643798828, -13.534435272216797, -9.739334106445312, -5.944232940673828, -2.1491317749023438, 1.6459693908691406, 5.441070556640625, 9.23617172241211, 13.031272888183594, 16.826374053955078, 20.621475219726562, 24.416576385498047, 28.211685180664062, 32.00678634643555, 35.80188751220703, 39.596988677978516, 43.39208984375, 47.187191009521484, 50.98229217529297, 54.77739334106445, 58.57249450683594, 62.36759567260742, 66.1626968383789, 69.95779418945312, 73.75289916992188, 77.54800415039062, 81.34310150146484, 85.13819885253906, 88.93330383300781, 92.72840881347656, 96.52350616455078, 100.318603515625, 104.11370849609375, 107.9088134765625, 111.70391082763672, 115.49900817871094, 119.29411315917969, 123.08921813964844, 126.88431549072266, 130.67941284179688, 134.47451782226562, 138.26962280273438, 142.06472778320312, 145.8598175048828, 149.65492248535156]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 11.0, 21.0, 9.0, 18.0, 15.0, 22.0, 23.0, 21.0, 19.0, 34.0, 41.0, 39.0, 32.0, 47.0, 39.0, 41.0, 42.0, 41.0, 39.0, 45.0, 37.0, 51.0, 39.0, 34.0, 27.0, 28.0, 26.0, 25.0, 23.0, 16.0, 7.0, 16.0, 9.0, 9.0, 7.0, 3.0, 5.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.161930084228516, -54.16505432128906, -52.168174743652344, -50.17129898071289, -48.17441940307617, -46.17754364013672, -44.1806640625, -42.18378829956055, -40.186912536621094, -38.19003677368164, -36.19315719604492, -34.19628143310547, -32.19940185546875, -30.202526092529297, -28.20564842224121, -26.208770751953125, -24.211891174316406, -22.21501350402832, -20.218135833740234, -18.22126007080078, -16.224380493164062, -14.227503776550293, -12.230627059936523, -10.233749389648438, -8.236871719360352, -6.239994049072266, -4.243116855621338, -2.24623966217041, -0.24936199188232422, 1.7475156784057617, 3.7443923950195312, 5.741270065307617, 7.738151550292969, 9.735029220581055, 11.73190689086914, 13.72878360748291, 15.725661277770996, 17.722537994384766, 19.71941566467285, 21.716293334960938, 23.713171005249023, 25.71004867553711, 27.706926345825195, 29.70380401611328, 31.700679779052734, 33.69755935668945, 35.694435119628906, 37.691314697265625, 39.68819046020508, 41.68506622314453, 43.68194580078125, 45.6788215637207, 47.67570114135742, 49.672576904296875, 51.669456481933594, 53.66633224487305, 55.6632080078125, 57.66008377075195, 59.65696334838867, 61.653839111328125, 63.650718688964844, 65.64759826660156, 67.64447021484375, 69.64134979248047, 71.63822937011719]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 12.0, 8.0, 30.0, 46.0, 39.0, 65.0, 135.0, 205.0, 271.0, 381.0, 596.0, 763.0, 1036.0, 1662.0, 2397.0, 3114.0, 4527.0, 6312.0, 9448.0, 13053.0, 19356.0, 28368.0, 43345.0, 68393.0, 118491.0, 283918.0, 179853.0, 92304.0, 56283.0, 35961.0, 23938.0, 16211.0, 11460.0, 7627.0, 5723.0, 3983.0, 2802.0, 1956.0, 1338.0, 1006.0, 696.0, 501.0, 309.0, 169.0, 126.0, 126.0, 86.0, 49.0, 27.0, 13.0, 20.0, 11.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-16.25, -15.73876953125, -15.2275390625, -14.71630859375, -14.205078125, -13.69384765625, -13.1826171875, -12.67138671875, -12.16015625, -11.64892578125, -11.1376953125, -10.62646484375, -10.115234375, -9.60400390625, -9.0927734375, -8.58154296875, -8.0703125, -7.55908203125, -7.0478515625, -6.53662109375, -6.025390625, -5.51416015625, -5.0029296875, -4.49169921875, -3.98046875, -3.46923828125, -2.9580078125, -2.44677734375, -1.935546875, -1.42431640625, -0.9130859375, -0.40185546875, 0.109375, 0.62060546875, 1.1318359375, 1.64306640625, 2.154296875, 2.66552734375, 3.1767578125, 3.68798828125, 4.19921875, 4.71044921875, 5.2216796875, 5.73291015625, 6.244140625, 6.75537109375, 7.2666015625, 7.77783203125, 8.2890625, 8.80029296875, 9.3115234375, 9.82275390625, 10.333984375, 10.84521484375, 11.3564453125, 11.86767578125, 12.37890625, 12.89013671875, 13.4013671875, 13.91259765625, 14.423828125, 14.93505859375, 15.4462890625, 15.95751953125, 16.46875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 10.0, 11.0, 9.0, 10.0, 8.0, 28.0, 22.0, 16.0, 15.0, 23.0, 26.0, 32.0, 33.0, 31.0, 46.0, 42.0, 43.0, 46.0, 42.0, 48.0, 30.0, 36.0, 34.0, 39.0, 40.0, 33.0, 27.0, 40.0, 24.0, 18.0, 20.0, 20.0, 9.0, 11.0, 15.0, 12.0, 6.0, 3.0, 3.0, 10.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.53125, -53.61962890625, -51.7080078125, -49.79638671875, -47.884765625, -45.97314453125, -44.0615234375, -42.14990234375, -40.23828125, -38.32666015625, -36.4150390625, -34.50341796875, -32.591796875, -30.68017578125, -28.7685546875, -26.85693359375, -24.9453125, -23.03369140625, -21.1220703125, -19.21044921875, -17.298828125, -15.38720703125, -13.4755859375, -11.56396484375, -9.65234375, -7.74072265625, -5.8291015625, -3.91748046875, -2.005859375, -0.09423828125, 1.8173828125, 3.72900390625, 5.640625, 7.55224609375, 9.4638671875, 11.37548828125, 13.287109375, 15.19873046875, 17.1103515625, 19.02197265625, 20.93359375, 22.84521484375, 24.7568359375, 26.66845703125, 28.580078125, 30.49169921875, 32.4033203125, 34.31494140625, 36.2265625, 38.13818359375, 40.0498046875, 41.96142578125, 43.873046875, 45.78466796875, 47.6962890625, 49.60791015625, 51.51953125, 53.43115234375, 55.3427734375, 57.25439453125, 59.166015625, 61.07763671875, 62.9892578125, 64.90087890625, 66.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 9.0, 17.0, 28.0, 38.0, 54.0, 70.0, 127.0, 125.0, 188.0, 276.0, 410.0, 501.0, 733.0, 981.0, 1488.0, 2042.0, 3015.0, 4577.0, 6633.0, 9937.0, 14986.0, 23417.0, 37433.0, 60634.0, 106380.0, 250455.0, 249842.0, 105893.0, 60591.0, 37299.0, 23511.0, 15322.0, 9877.0, 6712.0, 4548.0, 3121.0, 2148.0, 1423.0, 1052.0, 761.0, 541.0, 360.0, 265.0, 210.0, 170.0, 117.0, 74.0, 62.0, 34.0, 21.0, 24.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0], "bins": [-16.640625, -16.12060546875, -15.6005859375, -15.08056640625, -14.560546875, -14.04052734375, -13.5205078125, -13.00048828125, -12.48046875, -11.96044921875, -11.4404296875, -10.92041015625, -10.400390625, -9.88037109375, -9.3603515625, -8.84033203125, -8.3203125, -7.80029296875, -7.2802734375, -6.76025390625, -6.240234375, -5.72021484375, -5.2001953125, -4.68017578125, -4.16015625, -3.64013671875, -3.1201171875, -2.60009765625, -2.080078125, -1.56005859375, -1.0400390625, -0.52001953125, 0.0, 0.52001953125, 1.0400390625, 1.56005859375, 2.080078125, 2.60009765625, 3.1201171875, 3.64013671875, 4.16015625, 4.68017578125, 5.2001953125, 5.72021484375, 6.240234375, 6.76025390625, 7.2802734375, 7.80029296875, 8.3203125, 8.84033203125, 9.3603515625, 9.88037109375, 10.400390625, 10.92041015625, 11.4404296875, 11.96044921875, 12.48046875, 13.00048828125, 13.5205078125, 14.04052734375, 14.560546875, 15.08056640625, 15.6005859375, 16.12060546875, 16.640625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 5.0, 8.0, 8.0, 9.0, 11.0, 15.0, 15.0, 29.0, 28.0, 20.0, 27.0, 22.0, 30.0, 41.0, 44.0, 44.0, 41.0, 48.0, 41.0, 37.0, 41.0, 26.0, 41.0, 38.0, 43.0, 33.0, 35.0, 35.0, 28.0, 25.0, 25.0, 15.0, 14.0, 14.0, 4.0, 10.0, 8.0, 3.0, 9.0, 3.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.59375, -40.306640625, -39.01953125, -37.732421875, -36.4453125, -35.158203125, -33.87109375, -32.583984375, -31.296875, -30.009765625, -28.72265625, -27.435546875, -26.1484375, -24.861328125, -23.57421875, -22.287109375, -21.0, -19.712890625, -18.42578125, -17.138671875, -15.8515625, -14.564453125, -13.27734375, -11.990234375, -10.703125, -9.416015625, -8.12890625, -6.841796875, -5.5546875, -4.267578125, -2.98046875, -1.693359375, -0.40625, 0.880859375, 2.16796875, 3.455078125, 4.7421875, 6.029296875, 7.31640625, 8.603515625, 9.890625, 11.177734375, 12.46484375, 13.751953125, 15.0390625, 16.326171875, 17.61328125, 18.900390625, 20.1875, 21.474609375, 22.76171875, 24.048828125, 25.3359375, 26.623046875, 27.91015625, 29.197265625, 30.484375, 31.771484375, 33.05859375, 34.345703125, 35.6328125, 36.919921875, 38.20703125, 39.494140625, 40.78125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 16.0, 8.0, 8.0, 6.0, 15.0, 22.0, 51.0, 96.0, 146.0, 287.0, 446.0, 719.0, 1230.0, 2191.0, 3587.0, 6522.0, 12518.0, 27232.0, 69640.0, 302158.0, 464318.0, 90905.0, 33606.0, 15224.0, 7530.0, 4205.0, 2484.0, 1354.0, 828.0, 492.0, 295.0, 146.0, 107.0, 56.0, 26.0, 19.0, 8.0, 14.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06640625, -0.06433868408203125, -0.0622711181640625, -0.06020355224609375, -0.058135986328125, -0.05606842041015625, -0.0540008544921875, -0.05193328857421875, -0.04986572265625, -0.04779815673828125, -0.0457305908203125, -0.04366302490234375, -0.041595458984375, -0.03952789306640625, -0.0374603271484375, -0.03539276123046875, -0.0333251953125, -0.03125762939453125, -0.0291900634765625, -0.02712249755859375, -0.025054931640625, -0.02298736572265625, -0.0209197998046875, -0.01885223388671875, -0.01678466796875, -0.01471710205078125, -0.0126495361328125, -0.01058197021484375, -0.008514404296875, -0.00644683837890625, -0.0043792724609375, -0.00231170654296875, -0.000244140625, 0.00182342529296875, 0.0038909912109375, 0.00595855712890625, 0.008026123046875, 0.01009368896484375, 0.0121612548828125, 0.01422882080078125, 0.01629638671875, 0.01836395263671875, 0.0204315185546875, 0.02249908447265625, 0.024566650390625, 0.02663421630859375, 0.0287017822265625, 0.03076934814453125, 0.0328369140625, 0.03490447998046875, 0.0369720458984375, 0.03903961181640625, 0.041107177734375, 0.04317474365234375, 0.0452423095703125, 0.04730987548828125, 0.04937744140625, 0.05144500732421875, 0.0535125732421875, 0.05558013916015625, 0.057647705078125, 0.05971527099609375, 0.0617828369140625, 0.06385040283203125, 0.06591796875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 4.0, 7.0, 12.0, 14.0, 17.0, 25.0, 26.0, 24.0, 43.0, 61.0, 89.0, 137.0, 103.0, 91.0, 80.0, 43.0, 47.0, 45.0, 34.0, 13.0, 17.0, 8.0, 10.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8710575103759766e-05, -5.71003183722496e-05, -5.549006164073944e-05, -5.387980490922928e-05, -5.2269548177719116e-05, -5.0659291446208954e-05, -4.904903471469879e-05, -4.743877798318863e-05, -4.582852125167847e-05, -4.4218264520168304e-05, -4.260800778865814e-05, -4.099775105714798e-05, -3.938749432563782e-05, -3.7777237594127655e-05, -3.616698086261749e-05, -3.455672413110733e-05, -3.294646739959717e-05, -3.1336210668087006e-05, -2.9725953936576843e-05, -2.811569720506668e-05, -2.650544047355652e-05, -2.4895183742046356e-05, -2.3284927010536194e-05, -2.167467027902603e-05, -2.006441354751587e-05, -1.8454156816005707e-05, -1.6843900084495544e-05, -1.5233643352985382e-05, -1.362338662147522e-05, -1.2013129889965057e-05, -1.0402873158454895e-05, -8.792616426944733e-06, -7.18235969543457e-06, -5.572102963924408e-06, -3.961846232414246e-06, -2.3515895009040833e-06, -7.413327693939209e-07, 8.689239621162415e-07, 2.479180693626404e-06, 4.089437425136566e-06, 5.6996941566467285e-06, 7.309950888156891e-06, 8.920207619667053e-06, 1.0530464351177216e-05, 1.2140721082687378e-05, 1.375097781419754e-05, 1.5361234545707703e-05, 1.6971491277217865e-05, 1.8581748008728027e-05, 2.019200474023819e-05, 2.1802261471748352e-05, 2.3412518203258514e-05, 2.5022774934768677e-05, 2.663303166627884e-05, 2.8243288397789e-05, 2.9853545129299164e-05, 3.1463801860809326e-05, 3.307405859231949e-05, 3.468431532382965e-05, 3.629457205533981e-05, 3.7904828786849976e-05, 3.951508551836014e-05, 4.11253422498703e-05, 4.273559898138046e-05, 4.4345855712890625e-05]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 12.0, 7.0, 11.0, 20.0, 37.0, 33.0, 44.0, 63.0, 100.0, 107.0, 193.0, 290.0, 418.0, 538.0, 775.0, 1068.0, 1626.0, 2403.0, 3491.0, 5680.0, 8771.0, 14714.0, 26189.0, 50599.0, 112684.0, 344656.0, 274327.0, 95004.0, 44318.0, 23451.0, 13171.0, 8000.0, 5117.0, 3436.0, 2242.0, 1533.0, 974.0, 726.0, 507.0, 357.0, 266.0, 157.0, 114.0, 105.0, 70.0, 36.0, 33.0, 28.0, 17.0, 10.0, 13.0, 6.0, 6.0, 3.0, 2.0, 3.0], "bins": [-0.044281005859375, -0.04297494888305664, -0.04166889190673828, -0.04036283493041992, -0.03905677795410156, -0.0377507209777832, -0.036444664001464844, -0.035138607025146484, -0.033832550048828125, -0.032526493072509766, -0.031220436096191406, -0.029914379119873047, -0.028608322143554688, -0.027302265167236328, -0.02599620819091797, -0.02469015121459961, -0.02338409423828125, -0.02207803726196289, -0.02077198028564453, -0.019465923309326172, -0.018159866333007812, -0.016853809356689453, -0.015547752380371094, -0.014241695404052734, -0.012935638427734375, -0.011629581451416016, -0.010323524475097656, -0.009017467498779297, -0.0077114105224609375, -0.006405353546142578, -0.005099296569824219, -0.0037932395935058594, -0.0024871826171875, -0.0011811256408691406, 0.00012493133544921875, 0.0014309883117675781, 0.0027370452880859375, 0.004043102264404297, 0.005349159240722656, 0.006655216217041016, 0.007961273193359375, 0.009267330169677734, 0.010573387145996094, 0.011879444122314453, 0.013185501098632812, 0.014491558074951172, 0.01579761505126953, 0.01710367202758789, 0.01840972900390625, 0.01971578598022461, 0.02102184295654297, 0.022327899932861328, 0.023633956909179688, 0.024940013885498047, 0.026246070861816406, 0.027552127838134766, 0.028858184814453125, 0.030164241790771484, 0.031470298767089844, 0.0327763557434082, 0.03408241271972656, 0.03538846969604492, 0.03669452667236328, 0.03800058364868164, 0.039306640625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 7.0, 6.0, 13.0, 18.0, 10.0, 16.0, 17.0, 28.0, 26.0, 35.0, 52.0, 38.0, 74.0, 73.0, 77.0, 75.0, 56.0, 62.0, 52.0, 39.0, 45.0, 29.0, 25.0, 27.0, 13.0, 11.0, 13.0, 8.0, 2.0, 4.0, 4.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0131683349609375, -0.012782096862792969, -0.012395858764648438, -0.012009620666503906, -0.011623382568359375, -0.011237144470214844, -0.010850906372070312, -0.010464668273925781, -0.01007843017578125, -0.009692192077636719, -0.009305953979492188, -0.008919715881347656, -0.008533477783203125, -0.008147239685058594, -0.0077610015869140625, -0.007374763488769531, -0.006988525390625, -0.006602287292480469, -0.0062160491943359375, -0.005829811096191406, -0.005443572998046875, -0.005057334899902344, -0.0046710968017578125, -0.004284858703613281, -0.00389862060546875, -0.0035123825073242188, -0.0031261444091796875, -0.0027399063110351562, -0.002353668212890625, -0.0019674301147460938, -0.0015811920166015625, -0.0011949539184570312, -0.0008087158203125, -0.00042247772216796875, -3.62396240234375e-05, 0.00034999847412109375, 0.000736236572265625, 0.0011224746704101562, 0.0015087127685546875, 0.0018949508666992188, 0.00228118896484375, 0.0026674270629882812, 0.0030536651611328125, 0.0034399032592773438, 0.003826141357421875, 0.004212379455566406, 0.0045986175537109375, 0.004984855651855469, 0.00537109375, 0.005757331848144531, 0.0061435699462890625, 0.006529808044433594, 0.006916046142578125, 0.007302284240722656, 0.0076885223388671875, 0.008074760437011719, 0.00846099853515625, 0.008847236633300781, 0.009233474731445312, 0.009619712829589844, 0.010005950927734375, 0.010392189025878906, 0.010778427124023438, 0.011164665222167969, 0.0115509033203125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 8.0, 5.0, 7.0, 6.0, 8.0, 12.0, 19.0, 21.0, 28.0, 43.0, 46.0, 90.0, 120.0, 152.0, 122.0, 101.0, 64.0, 40.0, 30.0, 28.0, 9.0, 18.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.24986267089844, -86.56324005126953, -82.8766098022461, -79.18998718261719, -75.50335693359375, -71.81673431396484, -68.13011169433594, -64.4434814453125, -60.756858825683594, -57.07023239135742, -53.38360595703125, -49.696983337402344, -46.01035690307617, -42.32373046875, -38.637107849121094, -34.95048141479492, -31.26385498046875, -27.577228546142578, -23.89060401916504, -20.2039794921875, -16.517353057861328, -12.830726623535156, -9.144102096557617, -5.457477569580078, -1.7708511352539062, 1.9157743453979492, 5.602399826049805, 9.28902530670166, 12.975650787353516, 16.662277221679688, 20.348901748657227, 24.035526275634766, 27.722152709960938, 31.40877914428711, 35.09540557861328, 38.78202819824219, 42.46865463256836, 46.15528106689453, 49.84190368652344, 53.52853012084961, 57.21515655517578, 60.90178298950195, 64.58840942382812, 68.27503204345703, 71.96165466308594, 75.64828491210938, 79.33490753173828, 83.02153015136719, 86.70816040039062, 90.39478302001953, 94.08141326904297, 97.76803588867188, 101.45466613769531, 105.14128875732422, 108.82791137695312, 112.51454162597656, 116.20116424560547, 119.88778686523438, 123.57441711425781, 127.26103973388672, 130.94766235351562, 134.63429260253906, 138.3209228515625, 142.00753784179688, 145.6941680908203]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 11.0, 21.0, 9.0, 17.0, 15.0, 22.0, 25.0, 19.0, 20.0, 34.0, 41.0, 36.0, 33.0, 46.0, 41.0, 41.0, 41.0, 43.0, 38.0, 45.0, 38.0, 50.0, 38.0, 35.0, 27.0, 27.0, 26.0, 27.0, 23.0, 16.0, 7.0, 16.0, 8.0, 9.0, 8.0, 3.0, 5.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.2835807800293, -52.350990295410156, -50.418399810791016, -48.485809326171875, -46.55321502685547, -44.620628356933594, -42.68803405761719, -40.75544357299805, -38.822853088378906, -36.890262603759766, -34.957672119140625, -33.025081634521484, -31.09248924255371, -29.15989875793457, -27.227306365966797, -25.294715881347656, -23.362125396728516, -21.429534912109375, -19.496944427490234, -17.56435203552246, -15.63176155090332, -13.69917106628418, -11.766579627990723, -9.833988189697266, -7.901397705078125, -5.968806743621826, -4.036215782165527, -2.1036248207092285, -0.1710338592529297, 1.761556625366211, 3.694148063659668, 5.626739501953125, 7.559326171875, 9.49191665649414, 11.424508094787598, 13.357099533081055, 15.289690017700195, 17.222280502319336, 19.15487289428711, 21.08746337890625, 23.02005386352539, 24.95264434814453, 26.885234832763672, 28.817827224731445, 30.750417709350586, 32.683006286621094, 34.6156005859375, 36.54819107055664, 38.48078155517578, 40.41337203979492, 42.34596252441406, 44.2785530090332, 46.211143493652344, 48.14373779296875, 50.07632827758789, 52.00891876220703, 53.94150924682617, 55.87409973144531, 57.80669021606445, 59.739280700683594, 61.671875, 63.604461669921875, 65.53705596923828, 67.46965026855469, 69.40223693847656]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 5.0, 10.0, 22.0, 20.0, 35.0, 68.0, 116.0, 144.0, 205.0, 291.0, 458.0, 751.0, 1027.0, 1554.0, 2258.0, 3512.0, 5225.0, 7865.0, 12232.0, 18690.0, 29700.0, 48775.0, 85775.0, 170161.0, 275211.0, 168346.0, 84220.0, 48509.0, 29567.0, 18623.0, 11895.0, 7757.0, 5069.0, 3382.0, 2322.0, 1511.0, 1055.0, 721.0, 465.0, 359.0, 233.0, 146.0, 84.0, 59.0, 41.0, 33.0, 18.0, 9.0, 7.0, 6.0, 4.0, 4.0, 0.0, 3.0], "bins": [-119.0625, -115.6103515625, -112.158203125, -108.7060546875, -105.25390625, -101.8017578125, -98.349609375, -94.8974609375, -91.4453125, -87.9931640625, -84.541015625, -81.0888671875, -77.63671875, -74.1845703125, -70.732421875, -67.2802734375, -63.828125, -60.3759765625, -56.923828125, -53.4716796875, -50.01953125, -46.5673828125, -43.115234375, -39.6630859375, -36.2109375, -32.7587890625, -29.306640625, -25.8544921875, -22.40234375, -18.9501953125, -15.498046875, -12.0458984375, -8.59375, -5.1416015625, -1.689453125, 1.7626953125, 5.21484375, 8.6669921875, 12.119140625, 15.5712890625, 19.0234375, 22.4755859375, 25.927734375, 29.3798828125, 32.83203125, 36.2841796875, 39.736328125, 43.1884765625, 46.640625, 50.0927734375, 53.544921875, 56.9970703125, 60.44921875, 63.9013671875, 67.353515625, 70.8056640625, 74.2578125, 77.7099609375, 81.162109375, 84.6142578125, 88.06640625, 91.5185546875, 94.970703125, 98.4228515625, 101.875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 14.0, 9.0, 11.0, 11.0, 20.0, 29.0, 25.0, 20.0, 27.0, 26.0, 36.0, 46.0, 39.0, 52.0, 44.0, 41.0, 39.0, 49.0, 36.0, 48.0, 41.0, 37.0, 33.0, 40.0, 36.0, 28.0, 26.0, 22.0, 16.0, 19.0, 12.0, 10.0, 7.0, 5.0, 3.0, 8.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.84375, -46.1279296875, -44.412109375, -42.6962890625, -40.98046875, -39.2646484375, -37.548828125, -35.8330078125, -34.1171875, -32.4013671875, -30.685546875, -28.9697265625, -27.25390625, -25.5380859375, -23.822265625, -22.1064453125, -20.390625, -18.6748046875, -16.958984375, -15.2431640625, -13.52734375, -11.8115234375, -10.095703125, -8.3798828125, -6.6640625, -4.9482421875, -3.232421875, -1.5166015625, 0.19921875, 1.9150390625, 3.630859375, 5.3466796875, 7.0625, 8.7783203125, 10.494140625, 12.2099609375, 13.92578125, 15.6416015625, 17.357421875, 19.0732421875, 20.7890625, 22.5048828125, 24.220703125, 25.9365234375, 27.65234375, 29.3681640625, 31.083984375, 32.7998046875, 34.515625, 36.2314453125, 37.947265625, 39.6630859375, 41.37890625, 43.0947265625, 44.810546875, 46.5263671875, 48.2421875, 49.9580078125, 51.673828125, 53.3896484375, 55.10546875, 56.8212890625, 58.537109375, 60.2529296875, 61.96875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 9.0, 7.0, 20.0, 15.0, 21.0, 40.0, 51.0, 86.0, 123.0, 203.0, 252.0, 398.0, 584.0, 880.0, 1382.0, 2020.0, 3138.0, 4927.0, 7758.0, 12375.0, 19872.0, 33051.0, 55348.0, 99705.0, 207845.0, 281707.0, 135047.0, 72235.0, 42099.0, 25219.0, 15441.0, 9552.0, 5975.0, 3857.0, 2489.0, 1584.0, 1094.0, 690.0, 474.0, 301.0, 212.0, 133.0, 103.0, 76.0, 51.0, 34.0, 25.0, 17.0, 11.0, 9.0, 6.0, 1.0, 2.0, 4.0, 0.0, 4.0], "bins": [-124.875, -121.1171875, -117.359375, -113.6015625, -109.84375, -106.0859375, -102.328125, -98.5703125, -94.8125, -91.0546875, -87.296875, -83.5390625, -79.78125, -76.0234375, -72.265625, -68.5078125, -64.75, -60.9921875, -57.234375, -53.4765625, -49.71875, -45.9609375, -42.203125, -38.4453125, -34.6875, -30.9296875, -27.171875, -23.4140625, -19.65625, -15.8984375, -12.140625, -8.3828125, -4.625, -0.8671875, 2.890625, 6.6484375, 10.40625, 14.1640625, 17.921875, 21.6796875, 25.4375, 29.1953125, 32.953125, 36.7109375, 40.46875, 44.2265625, 47.984375, 51.7421875, 55.5, 59.2578125, 63.015625, 66.7734375, 70.53125, 74.2890625, 78.046875, 81.8046875, 85.5625, 89.3203125, 93.078125, 96.8359375, 100.59375, 104.3515625, 108.109375, 111.8671875, 115.625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 6.0, 11.0, 12.0, 17.0, 15.0, 28.0, 20.0, 26.0, 29.0, 40.0, 45.0, 42.0, 42.0, 41.0, 31.0, 35.0, 47.0, 59.0, 49.0, 39.0, 38.0, 40.0, 43.0, 35.0, 25.0, 23.0, 28.0, 23.0, 17.0, 13.0, 14.0, 7.0, 10.0, 10.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.375, -37.22412109375, -36.0732421875, -34.92236328125, -33.771484375, -32.62060546875, -31.4697265625, -30.31884765625, -29.16796875, -28.01708984375, -26.8662109375, -25.71533203125, -24.564453125, -23.41357421875, -22.2626953125, -21.11181640625, -19.9609375, -18.81005859375, -17.6591796875, -16.50830078125, -15.357421875, -14.20654296875, -13.0556640625, -11.90478515625, -10.75390625, -9.60302734375, -8.4521484375, -7.30126953125, -6.150390625, -4.99951171875, -3.8486328125, -2.69775390625, -1.546875, -0.39599609375, 0.7548828125, 1.90576171875, 3.056640625, 4.20751953125, 5.3583984375, 6.50927734375, 7.66015625, 8.81103515625, 9.9619140625, 11.11279296875, 12.263671875, 13.41455078125, 14.5654296875, 15.71630859375, 16.8671875, 18.01806640625, 19.1689453125, 20.31982421875, 21.470703125, 22.62158203125, 23.7724609375, 24.92333984375, 26.07421875, 27.22509765625, 28.3759765625, 29.52685546875, 30.677734375, 31.82861328125, 32.9794921875, 34.13037109375, 35.28125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 7.0, 14.0, 15.0, 28.0, 31.0, 59.0, 68.0, 113.0, 184.0, 272.0, 421.0, 595.0, 966.0, 1486.0, 2284.0, 3496.0, 5885.0, 9100.0, 15059.0, 25445.0, 44716.0, 84472.0, 189476.0, 312128.0, 171268.0, 77554.0, 41406.0, 23789.0, 14425.0, 8644.0, 5529.0, 3435.0, 2126.0, 1469.0, 891.0, 592.0, 351.0, 262.0, 166.0, 105.0, 73.0, 48.0, 32.0, 18.0, 20.0, 14.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3173828125, -1.275482177734375, -1.23358154296875, -1.191680908203125, -1.1497802734375, -1.107879638671875, -1.06597900390625, -1.024078369140625, -0.982177734375, -0.940277099609375, -0.89837646484375, -0.856475830078125, -0.8145751953125, -0.772674560546875, -0.73077392578125, -0.688873291015625, -0.64697265625, -0.605072021484375, -0.56317138671875, -0.521270751953125, -0.4793701171875, -0.437469482421875, -0.39556884765625, -0.353668212890625, -0.311767578125, -0.269866943359375, -0.22796630859375, -0.186065673828125, -0.1441650390625, -0.102264404296875, -0.06036376953125, -0.018463134765625, 0.0234375, 0.065338134765625, 0.10723876953125, 0.149139404296875, 0.1910400390625, 0.232940673828125, 0.27484130859375, 0.316741943359375, 0.358642578125, 0.400543212890625, 0.44244384765625, 0.484344482421875, 0.5262451171875, 0.568145751953125, 0.61004638671875, 0.651947021484375, 0.69384765625, 0.735748291015625, 0.77764892578125, 0.819549560546875, 0.8614501953125, 0.903350830078125, 0.94525146484375, 0.987152099609375, 1.029052734375, 1.070953369140625, 1.11285400390625, 1.154754638671875, 1.1966552734375, 1.238555908203125, 1.28045654296875, 1.322357177734375, 1.3642578125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 8.0, 13.0, 21.0, 28.0, 35.0, 35.0, 50.0, 66.0, 90.0, 119.0, 104.0, 86.0, 72.0, 54.0, 36.0, 30.0, 24.0, 21.0, 9.0, 13.0, 11.0, 8.0, 11.0, 4.0, 10.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000537872314453125, -0.0005229823291301727, -0.0005080923438072205, -0.0004932023584842682, -0.0004783123731613159, -0.00046342238783836365, -0.0004485324025154114, -0.0004336424171924591, -0.00041875243186950684, -0.00040386244654655457, -0.0003889724612236023, -0.00037408247590065, -0.00035919249057769775, -0.0003443025052547455, -0.0003294125199317932, -0.00031452253460884094, -0.00029963254928588867, -0.0002847425639629364, -0.00026985257863998413, -0.00025496259331703186, -0.0002400726079940796, -0.00022518262267112732, -0.00021029263734817505, -0.00019540265202522278, -0.0001805126667022705, -0.00016562268137931824, -0.00015073269605636597, -0.0001358427107334137, -0.00012095272541046143, -0.00010606274008750916, -9.117275476455688e-05, -7.628276944160461e-05, -6.139278411865234e-05, -4.650279879570007e-05, -3.16128134727478e-05, -1.6722828149795532e-05, -1.8328428268432617e-06, 1.3057142496109009e-05, 2.794712781906128e-05, 4.283711314201355e-05, 5.772709846496582e-05, 7.261708378791809e-05, 8.750706911087036e-05, 0.00010239705443382263, 0.0001172870397567749, 0.00013217702507972717, 0.00014706701040267944, 0.00016195699572563171, 0.00017684698104858398, 0.00019173696637153625, 0.00020662695169448853, 0.0002215169370174408, 0.00023640692234039307, 0.00025129690766334534, 0.0002661868929862976, 0.0002810768783092499, 0.00029596686363220215, 0.0003108568489551544, 0.0003257468342781067, 0.00034063681960105896, 0.00035552680492401123, 0.0003704167902469635, 0.00038530677556991577, 0.00040019676089286804, 0.0004150867462158203]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 6.0, 11.0, 16.0, 29.0, 29.0, 56.0, 74.0, 116.0, 147.0, 235.0, 348.0, 550.0, 759.0, 1167.0, 1910.0, 2941.0, 4725.0, 7200.0, 11896.0, 20271.0, 34860.0, 63999.0, 132100.0, 298670.0, 238193.0, 101990.0, 52271.0, 29188.0, 17067.0, 10355.0, 6285.0, 4044.0, 2458.0, 1575.0, 1027.0, 650.0, 425.0, 292.0, 202.0, 136.0, 97.0, 49.0, 31.0, 38.0, 29.0, 9.0, 9.0, 9.0, 9.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.4189453125, -1.375732421875, -1.33251953125, -1.289306640625, -1.24609375, -1.202880859375, -1.15966796875, -1.116455078125, -1.0732421875, -1.030029296875, -0.98681640625, -0.943603515625, -0.900390625, -0.857177734375, -0.81396484375, -0.770751953125, -0.7275390625, -0.684326171875, -0.64111328125, -0.597900390625, -0.5546875, -0.511474609375, -0.46826171875, -0.425048828125, -0.3818359375, -0.338623046875, -0.29541015625, -0.252197265625, -0.208984375, -0.165771484375, -0.12255859375, -0.079345703125, -0.0361328125, 0.007080078125, 0.05029296875, 0.093505859375, 0.13671875, 0.179931640625, 0.22314453125, 0.266357421875, 0.3095703125, 0.352783203125, 0.39599609375, 0.439208984375, 0.482421875, 0.525634765625, 0.56884765625, 0.612060546875, 0.6552734375, 0.698486328125, 0.74169921875, 0.784912109375, 0.828125, 0.871337890625, 0.91455078125, 0.957763671875, 1.0009765625, 1.044189453125, 1.08740234375, 1.130615234375, 1.173828125, 1.217041015625, 1.26025390625, 1.303466796875, 1.3466796875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 11.0, 6.0, 14.0, 19.0, 17.0, 19.0, 32.0, 31.0, 29.0, 41.0, 40.0, 51.0, 51.0, 59.0, 50.0, 48.0, 56.0, 48.0, 43.0, 41.0, 39.0, 39.0, 26.0, 29.0, 20.0, 22.0, 16.0, 9.0, 18.0, 10.0, 12.0, 9.0, 5.0, 5.0, 7.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3792076110839844, -0.36681365966796875, -0.3544197082519531, -0.3420257568359375, -0.3296318054199219, -0.31723785400390625, -0.3048439025878906, -0.292449951171875, -0.2800559997558594, -0.26766204833984375, -0.2552680969238281, -0.2428741455078125, -0.23048019409179688, -0.21808624267578125, -0.20569229125976562, -0.19329833984375, -0.18090438842773438, -0.16851043701171875, -0.15611648559570312, -0.1437225341796875, -0.13132858276367188, -0.11893463134765625, -0.10654067993164062, -0.094146728515625, -0.08175277709960938, -0.06935882568359375, -0.056964874267578125, -0.0445709228515625, -0.032176971435546875, -0.01978302001953125, -0.007389068603515625, 0.0050048828125, 0.017398834228515625, 0.02979278564453125, 0.042186737060546875, 0.0545806884765625, 0.06697463989257812, 0.07936859130859375, 0.09176254272460938, 0.104156494140625, 0.11655044555664062, 0.12894439697265625, 0.14133834838867188, 0.1537322998046875, 0.16612625122070312, 0.17852020263671875, 0.19091415405273438, 0.20330810546875, 0.21570205688476562, 0.22809600830078125, 0.24048995971679688, 0.2528839111328125, 0.2652778625488281, 0.27767181396484375, 0.2900657653808594, 0.302459716796875, 0.3148536682128906, 0.32724761962890625, 0.3396415710449219, 0.3520355224609375, 0.3644294738769531, 0.37682342529296875, 0.3892173767089844, 0.401611328125]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 11.0, 7.0, 9.0, 15.0, 18.0, 29.0, 29.0, 40.0, 61.0, 96.0, 125.0, 125.0, 96.0, 89.0, 50.0, 46.0, 34.0, 22.0, 23.0, 12.0, 6.0, 6.0, 8.0, 11.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.01657104492188, -65.22066497802734, -62.42475128173828, -59.62884521484375, -56.83293151855469, -54.037025451660156, -51.24111557006836, -48.44520568847656, -45.649295806884766, -42.85338592529297, -40.05747604370117, -37.261566162109375, -34.465660095214844, -31.669748306274414, -28.87384033203125, -26.077930450439453, -23.282020568847656, -20.48611068725586, -17.690200805664062, -14.894292831420898, -12.098382949829102, -9.302473068237305, -6.506565093994141, -3.7106552124023438, -0.9147453308105469, 1.8811640739440918, 4.6770734786987305, 7.472982406616211, 10.268892288208008, 13.064802169799805, 15.860710144042969, 18.656620025634766, 21.452537536621094, 24.24844741821289, 27.044357299804688, 29.84026527404785, 32.63617706298828, 35.43208312988281, 38.22799301147461, 41.023902893066406, 43.8198127746582, 46.61572265625, 49.4116325378418, 52.207542419433594, 55.003448486328125, 57.79936218261719, 60.59526824951172, 63.391178131103516, 66.18708801269531, 68.98299407958984, 71.7789077758789, 74.57481384277344, 77.3707275390625, 80.16663360595703, 82.96253967285156, 85.75845336914062, 88.55436706542969, 91.35027313232422, 94.14618682861328, 96.94209289550781, 99.73800659179688, 102.5339126586914, 105.32981872558594, 108.125732421875, 110.92163848876953]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 9.0, 12.0, 4.0, 4.0, 12.0, 15.0, 16.0, 13.0, 23.0, 21.0, 25.0, 26.0, 35.0, 34.0, 35.0, 35.0, 41.0, 57.0, 41.0, 42.0, 35.0, 32.0, 37.0, 51.0, 39.0, 28.0, 34.0, 36.0, 28.0, 29.0, 23.0, 19.0, 14.0, 20.0, 11.0, 14.0, 10.0, 6.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.93473815917969, -44.284820556640625, -42.63490295410156, -40.984981536865234, -39.33506393432617, -37.68514633178711, -36.03522491455078, -34.38530731201172, -32.735389709472656, -31.085472106933594, -29.4355525970459, -27.785633087158203, -26.13571548461914, -24.485797882080078, -22.835878372192383, -21.185958862304688, -19.536041259765625, -17.886123657226562, -16.236204147338867, -14.586285591125488, -12.93636703491211, -11.28644847869873, -9.636529922485352, -7.986611366271973, -6.336692810058594, -4.686774253845215, -3.036855697631836, -1.386937141418457, 0.2629814147949219, 1.9128999710083008, 3.5628185272216797, 5.212737083435059, 6.862651824951172, 8.51257038116455, 10.16248893737793, 11.812407493591309, 13.462326049804688, 15.112244606018066, 16.762163162231445, 18.41208267211914, 20.062000274658203, 21.711917877197266, 23.36183738708496, 25.011756896972656, 26.66167449951172, 28.31159210205078, 29.961511611938477, 31.611431121826172, 33.261348724365234, 34.9112663269043, 36.561187744140625, 38.21110534667969, 39.86102294921875, 41.51094055175781, 43.160858154296875, 44.8107795715332, 46.460697174072266, 48.11061477661133, 49.760536193847656, 51.41045379638672, 53.06037139892578, 54.710289001464844, 56.360206604003906, 58.010128021240234, 59.6600456237793]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 15.0, 19.0, 18.0, 32.0, 56.0, 69.0, 103.0, 128.0, 247.0, 278.0, 407.0, 563.0, 818.0, 1144.0, 1635.0, 2197.0, 3218.0, 4522.0, 6512.0, 9319.0, 13983.0, 20911.0, 32192.0, 52127.0, 90222.0, 220313.0, 954621.0, 1877717.0, 548326.0, 152537.0, 72623.0, 43337.0, 27529.0, 17728.0, 11929.0, 8116.0, 5576.0, 3898.0, 2675.0, 1921.0, 1335.0, 1000.0, 729.0, 474.0, 327.0, 254.0, 177.0, 141.0, 83.0, 66.0, 45.0, 31.0, 20.0, 10.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0], "bins": [-75.875, -73.453125, -71.03125, -68.609375, -66.1875, -63.765625, -61.34375, -58.921875, -56.5, -54.078125, -51.65625, -49.234375, -46.8125, -44.390625, -41.96875, -39.546875, -37.125, -34.703125, -32.28125, -29.859375, -27.4375, -25.015625, -22.59375, -20.171875, -17.75, -15.328125, -12.90625, -10.484375, -8.0625, -5.640625, -3.21875, -0.796875, 1.625, 4.046875, 6.46875, 8.890625, 11.3125, 13.734375, 16.15625, 18.578125, 21.0, 23.421875, 25.84375, 28.265625, 30.6875, 33.109375, 35.53125, 37.953125, 40.375, 42.796875, 45.21875, 47.640625, 50.0625, 52.484375, 54.90625, 57.328125, 59.75, 62.171875, 64.59375, 67.015625, 69.4375, 71.859375, 74.28125, 76.703125, 79.125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 8.0, 6.0, 6.0, 7.0, 12.0, 10.0, 11.0, 16.0, 16.0, 14.0, 25.0, 15.0, 35.0, 37.0, 32.0, 24.0, 42.0, 31.0, 40.0, 45.0, 35.0, 42.0, 40.0, 41.0, 27.0, 37.0, 40.0, 32.0, 40.0, 24.0, 24.0, 23.0, 34.0, 16.0, 16.0, 14.0, 16.0, 10.0, 16.0, 3.0, 6.0, 5.0, 3.0, 10.0, 2.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.90625, -34.7392578125, -33.572265625, -32.4052734375, -31.23828125, -30.0712890625, -28.904296875, -27.7373046875, -26.5703125, -25.4033203125, -24.236328125, -23.0693359375, -21.90234375, -20.7353515625, -19.568359375, -18.4013671875, -17.234375, -16.0673828125, -14.900390625, -13.7333984375, -12.56640625, -11.3994140625, -10.232421875, -9.0654296875, -7.8984375, -6.7314453125, -5.564453125, -4.3974609375, -3.23046875, -2.0634765625, -0.896484375, 0.2705078125, 1.4375, 2.6044921875, 3.771484375, 4.9384765625, 6.10546875, 7.2724609375, 8.439453125, 9.6064453125, 10.7734375, 11.9404296875, 13.107421875, 14.2744140625, 15.44140625, 16.6083984375, 17.775390625, 18.9423828125, 20.109375, 21.2763671875, 22.443359375, 23.6103515625, 24.77734375, 25.9443359375, 27.111328125, 28.2783203125, 29.4453125, 30.6123046875, 31.779296875, 32.9462890625, 34.11328125, 35.2802734375, 36.447265625, 37.6142578125, 38.78125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 6.0, 10.0, 7.0, 19.0, 21.0, 16.0, 32.0, 42.0, 71.0, 101.0, 135.0, 196.0, 298.0, 432.0, 626.0, 884.0, 1364.0, 2004.0, 3001.0, 4733.0, 7359.0, 11723.0, 18862.0, 31457.0, 52218.0, 92544.0, 181154.0, 436275.0, 1947963.0, 834386.0, 266033.0, 126122.0, 68519.0, 40030.0, 24116.0, 14883.0, 9433.0, 5759.0, 3767.0, 2516.0, 1664.0, 1113.0, 748.0, 494.0, 347.0, 221.0, 184.0, 113.0, 86.0, 62.0, 42.0, 31.0, 24.0, 16.0, 15.0, 6.0, 4.0, 7.0, 4.0, 1.0], "bins": [-81.0625, -78.5869140625, -76.111328125, -73.6357421875, -71.16015625, -68.6845703125, -66.208984375, -63.7333984375, -61.2578125, -58.7822265625, -56.306640625, -53.8310546875, -51.35546875, -48.8798828125, -46.404296875, -43.9287109375, -41.453125, -38.9775390625, -36.501953125, -34.0263671875, -31.55078125, -29.0751953125, -26.599609375, -24.1240234375, -21.6484375, -19.1728515625, -16.697265625, -14.2216796875, -11.74609375, -9.2705078125, -6.794921875, -4.3193359375, -1.84375, 0.6318359375, 3.107421875, 5.5830078125, 8.05859375, 10.5341796875, 13.009765625, 15.4853515625, 17.9609375, 20.4365234375, 22.912109375, 25.3876953125, 27.86328125, 30.3388671875, 32.814453125, 35.2900390625, 37.765625, 40.2412109375, 42.716796875, 45.1923828125, 47.66796875, 50.1435546875, 52.619140625, 55.0947265625, 57.5703125, 60.0458984375, 62.521484375, 64.9970703125, 67.47265625, 69.9482421875, 72.423828125, 74.8994140625, 77.375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 11.0, 23.0, 23.0, 33.0, 27.0, 39.0, 40.0, 41.0, 62.0, 61.0, 83.0, 92.0, 119.0, 144.0, 176.0, 270.0, 419.0, 617.0, 460.0, 285.0, 192.0, 142.0, 121.0, 112.0, 78.0, 73.0, 53.0, 55.0, 46.0, 29.0, 23.0, 20.0, 18.0, 15.0, 9.0, 8.0, 10.0, 10.0, 4.0, 5.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.796875, -25.029296875, -24.26171875, -23.494140625, -22.7265625, -21.958984375, -21.19140625, -20.423828125, -19.65625, -18.888671875, -18.12109375, -17.353515625, -16.5859375, -15.818359375, -15.05078125, -14.283203125, -13.515625, -12.748046875, -11.98046875, -11.212890625, -10.4453125, -9.677734375, -8.91015625, -8.142578125, -7.375, -6.607421875, -5.83984375, -5.072265625, -4.3046875, -3.537109375, -2.76953125, -2.001953125, -1.234375, -0.466796875, 0.30078125, 1.068359375, 1.8359375, 2.603515625, 3.37109375, 4.138671875, 4.90625, 5.673828125, 6.44140625, 7.208984375, 7.9765625, 8.744140625, 9.51171875, 10.279296875, 11.046875, 11.814453125, 12.58203125, 13.349609375, 14.1171875, 14.884765625, 15.65234375, 16.419921875, 17.1875, 17.955078125, 18.72265625, 19.490234375, 20.2578125, 21.025390625, 21.79296875, 22.560546875, 23.328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 12.0, 15.0, 15.0, 25.0, 29.0, 34.0, 46.0, 80.0, 112.0, 132.0, 136.0, 94.0, 58.0, 48.0, 28.0, 24.0, 17.0, 20.0, 10.0, 14.0, 7.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.93584442138672, -64.44532775878906, -61.954811096191406, -59.46429443359375, -56.97378158569336, -54.4832649230957, -51.99274826049805, -49.502235412597656, -47.01171875, -44.521202087402344, -42.03068542480469, -39.54016876220703, -37.04965591430664, -34.559139251708984, -32.06862258911133, -29.578107833862305, -27.087589263916016, -24.59707260131836, -22.106557846069336, -19.61604118347168, -17.125526428222656, -14.635009765625, -12.144493103027344, -9.65397834777832, -7.163461685180664, -4.672945976257324, -2.182429790496826, 0.3080863952636719, 2.7986021041870117, 5.289117813110352, 7.779634475708008, 10.270149230957031, 12.760665893554688, 15.251181602478027, 17.741697311401367, 20.232213973999023, 22.722728729248047, 25.213245391845703, 27.70376205444336, 30.194276809692383, 32.684791564941406, 35.17530822753906, 37.66582489013672, 40.156341552734375, 42.646854400634766, 45.13737106323242, 47.62788772583008, 50.11840057373047, 52.60892105102539, 55.09943771362305, 57.5899543762207, 60.080467224121094, 62.57098388671875, 65.0615005493164, 67.55201721191406, 70.04253387451172, 72.53305053710938, 75.02356719970703, 77.51408386230469, 80.00460052490234, 82.4951171875, 84.98562622070312, 87.47615051269531, 89.96665954589844, 92.4571762084961]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 11.0, 10.0, 12.0, 10.0, 15.0, 8.0, 22.0, 14.0, 19.0, 21.0, 25.0, 25.0, 38.0, 25.0, 34.0, 33.0, 34.0, 35.0, 39.0, 39.0, 39.0, 39.0, 43.0, 32.0, 48.0, 44.0, 42.0, 28.0, 21.0, 19.0, 17.0, 20.0, 29.0, 13.0, 13.0, 18.0, 10.0, 10.0, 7.0, 7.0, 8.0, 3.0, 3.0, 7.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.24929428100586, -38.97118377685547, -37.693077087402344, -36.41496658325195, -35.13685989379883, -33.85874938964844, -32.58064270019531, -31.302532196044922, -30.024425506591797, -28.74631690979004, -27.46820831298828, -26.190099716186523, -24.911991119384766, -23.633882522583008, -22.35577392578125, -21.07766342163086, -19.7995548248291, -18.521446228027344, -17.243337631225586, -15.965229034423828, -14.68712043762207, -13.409011840820312, -12.130902290344238, -10.85279369354248, -9.574685096740723, -8.296576499938965, -7.018467903137207, -5.740358829498291, -4.462250232696533, -3.1841416358947754, -1.9060325622558594, -0.6279239654541016, 0.6501846313476562, 1.9282933473587036, 3.206402063369751, 4.484510898590088, 5.762619495391846, 7.0407280921936035, 8.31883716583252, 9.596945762634277, 10.875054359436035, 12.153162956237793, 13.43127155303955, 14.709381103515625, 15.987489700317383, 17.26559829711914, 18.5437068939209, 19.821815490722656, 21.099924087524414, 22.378032684326172, 23.65614128112793, 24.934249877929688, 26.212358474731445, 27.490467071533203, 28.768577575683594, 30.04668426513672, 31.32479476928711, 32.6029052734375, 33.881011962890625, 35.159122467041016, 36.43722915649414, 37.71533966064453, 38.993446350097656, 40.27155685424805, 41.54966354370117]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 6.0, 6.0, 6.0, 5.0, 13.0, 19.0, 36.0, 52.0, 52.0, 70.0, 87.0, 143.0, 221.0, 297.0, 411.0, 553.0, 798.0, 1118.0, 1548.0, 2186.0, 3240.0, 4381.0, 6533.0, 9418.0, 13739.0, 20361.0, 30330.0, 46351.0, 74219.0, 134023.0, 300144.0, 158773.0, 84716.0, 50769.0, 32907.0, 21973.0, 15020.0, 10271.0, 7159.0, 4905.0, 3489.0, 2389.0, 1725.0, 1235.0, 771.0, 625.0, 401.0, 332.0, 226.0, 145.0, 112.0, 72.0, 49.0, 58.0, 36.0, 20.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-11.125, -10.7730712890625, -10.421142578125, -10.0692138671875, -9.71728515625, -9.3653564453125, -9.013427734375, -8.6614990234375, -8.3095703125, -7.9576416015625, -7.605712890625, -7.2537841796875, -6.90185546875, -6.5499267578125, -6.197998046875, -5.8460693359375, -5.494140625, -5.1422119140625, -4.790283203125, -4.4383544921875, -4.08642578125, -3.7344970703125, -3.382568359375, -3.0306396484375, -2.6787109375, -2.3267822265625, -1.974853515625, -1.6229248046875, -1.27099609375, -0.9190673828125, -0.567138671875, -0.2152099609375, 0.13671875, 0.4886474609375, 0.840576171875, 1.1925048828125, 1.54443359375, 1.8963623046875, 2.248291015625, 2.6002197265625, 2.9521484375, 3.3040771484375, 3.656005859375, 4.0079345703125, 4.35986328125, 4.7117919921875, 5.063720703125, 5.4156494140625, 5.767578125, 6.1195068359375, 6.471435546875, 6.8233642578125, 7.17529296875, 7.5272216796875, 7.879150390625, 8.2310791015625, 8.5830078125, 8.9349365234375, 9.286865234375, 9.6387939453125, 9.99072265625, 10.3426513671875, 10.694580078125, 11.0465087890625, 11.3984375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 9.0, 4.0, 6.0, 7.0, 5.0, 7.0, 13.0, 12.0, 19.0, 23.0, 21.0, 18.0, 26.0, 30.0, 34.0, 35.0, 37.0, 26.0, 33.0, 37.0, 38.0, 35.0, 46.0, 46.0, 40.0, 41.0, 51.0, 40.0, 23.0, 27.0, 20.0, 23.0, 19.0, 26.0, 18.0, 17.0, 21.0, 8.0, 14.0, 11.0, 4.0, 10.0, 6.0, 3.0, 4.0, 3.0, 0.0, 5.0, 3.0, 2.0, 2.0], "bins": [-46.21875, -44.90380859375, -43.5888671875, -42.27392578125, -40.958984375, -39.64404296875, -38.3291015625, -37.01416015625, -35.69921875, -34.38427734375, -33.0693359375, -31.75439453125, -30.439453125, -29.12451171875, -27.8095703125, -26.49462890625, -25.1796875, -23.86474609375, -22.5498046875, -21.23486328125, -19.919921875, -18.60498046875, -17.2900390625, -15.97509765625, -14.66015625, -13.34521484375, -12.0302734375, -10.71533203125, -9.400390625, -8.08544921875, -6.7705078125, -5.45556640625, -4.140625, -2.82568359375, -1.5107421875, -0.19580078125, 1.119140625, 2.43408203125, 3.7490234375, 5.06396484375, 6.37890625, 7.69384765625, 9.0087890625, 10.32373046875, 11.638671875, 12.95361328125, 14.2685546875, 15.58349609375, 16.8984375, 18.21337890625, 19.5283203125, 20.84326171875, 22.158203125, 23.47314453125, 24.7880859375, 26.10302734375, 27.41796875, 28.73291015625, 30.0478515625, 31.36279296875, 32.677734375, 33.99267578125, 35.3076171875, 36.62255859375, 37.9375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 9.0, 10.0, 10.0, 13.0, 36.0, 48.0, 70.0, 98.0, 134.0, 178.0, 275.0, 379.0, 658.0, 889.0, 1355.0, 2029.0, 3053.0, 4816.0, 7666.0, 12371.0, 20444.0, 33920.0, 58253.0, 109593.0, 282276.0, 262011.0, 105402.0, 56840.0, 32872.0, 19785.0, 11967.0, 7474.0, 4699.0, 3008.0, 2030.0, 1203.0, 902.0, 571.0, 361.0, 270.0, 183.0, 132.0, 63.0, 60.0, 45.0, 25.0, 17.0, 16.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-13.4921875, -13.0701904296875, -12.648193359375, -12.2261962890625, -11.80419921875, -11.3822021484375, -10.960205078125, -10.5382080078125, -10.1162109375, -9.6942138671875, -9.272216796875, -8.8502197265625, -8.42822265625, -8.0062255859375, -7.584228515625, -7.1622314453125, -6.740234375, -6.3182373046875, -5.896240234375, -5.4742431640625, -5.05224609375, -4.6302490234375, -4.208251953125, -3.7862548828125, -3.3642578125, -2.9422607421875, -2.520263671875, -2.0982666015625, -1.67626953125, -1.2542724609375, -0.832275390625, -0.4102783203125, 0.01171875, 0.4337158203125, 0.855712890625, 1.2777099609375, 1.69970703125, 2.1217041015625, 2.543701171875, 2.9656982421875, 3.3876953125, 3.8096923828125, 4.231689453125, 4.6536865234375, 5.07568359375, 5.4976806640625, 5.919677734375, 6.3416748046875, 6.763671875, 7.1856689453125, 7.607666015625, 8.0296630859375, 8.45166015625, 8.8736572265625, 9.295654296875, 9.7176513671875, 10.1396484375, 10.5616455078125, 10.983642578125, 11.4056396484375, 11.82763671875, 12.2496337890625, 12.671630859375, 13.0936279296875, 13.515625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 2.0, 7.0, 9.0, 13.0, 13.0, 17.0, 14.0, 27.0, 19.0, 28.0, 30.0, 42.0, 35.0, 44.0, 41.0, 45.0, 58.0, 46.0, 44.0, 41.0, 50.0, 45.0, 38.0, 50.0, 34.0, 31.0, 27.0, 27.0, 22.0, 25.0, 17.0, 18.0, 10.0, 12.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.37744140625, -30.3486328125, -29.31982421875, -28.291015625, -27.26220703125, -26.2333984375, -25.20458984375, -24.17578125, -23.14697265625, -22.1181640625, -21.08935546875, -20.060546875, -19.03173828125, -18.0029296875, -16.97412109375, -15.9453125, -14.91650390625, -13.8876953125, -12.85888671875, -11.830078125, -10.80126953125, -9.7724609375, -8.74365234375, -7.71484375, -6.68603515625, -5.6572265625, -4.62841796875, -3.599609375, -2.57080078125, -1.5419921875, -0.51318359375, 0.515625, 1.54443359375, 2.5732421875, 3.60205078125, 4.630859375, 5.65966796875, 6.6884765625, 7.71728515625, 8.74609375, 9.77490234375, 10.8037109375, 11.83251953125, 12.861328125, 13.89013671875, 14.9189453125, 15.94775390625, 16.9765625, 18.00537109375, 19.0341796875, 20.06298828125, 21.091796875, 22.12060546875, 23.1494140625, 24.17822265625, 25.20703125, 26.23583984375, 27.2646484375, 28.29345703125, 29.322265625, 30.35107421875, 31.3798828125, 32.40869140625, 33.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 9.0, 13.0, 15.0, 16.0, 24.0, 41.0, 54.0, 54.0, 101.0, 125.0, 180.0, 227.0, 323.0, 536.0, 779.0, 1221.0, 1934.0, 3414.0, 5902.0, 11369.0, 23614.0, 56082.0, 172443.0, 503134.0, 163863.0, 54296.0, 22885.0, 11047.0, 5692.0, 3436.0, 1999.0, 1199.0, 821.0, 488.0, 327.0, 238.0, 164.0, 115.0, 86.0, 68.0, 45.0, 37.0, 29.0, 26.0, 16.0, 9.0, 9.0, 8.0, 10.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.034271240234375, -0.033182621002197266, -0.03209400177001953, -0.031005382537841797, -0.029916763305664062, -0.028828144073486328, -0.027739524841308594, -0.02665090560913086, -0.025562286376953125, -0.02447366714477539, -0.023385047912597656, -0.022296428680419922, -0.021207809448242188, -0.020119190216064453, -0.01903057098388672, -0.017941951751708984, -0.01685333251953125, -0.015764713287353516, -0.014676094055175781, -0.013587474822998047, -0.012498855590820312, -0.011410236358642578, -0.010321617126464844, -0.00923299789428711, -0.008144378662109375, -0.007055759429931641, -0.005967140197753906, -0.004878520965576172, -0.0037899017333984375, -0.002701282501220703, -0.0016126632690429688, -0.0005240440368652344, 0.0005645751953125, 0.0016531944274902344, 0.0027418136596679688, 0.003830432891845703, 0.0049190521240234375, 0.006007671356201172, 0.007096290588378906, 0.00818490982055664, 0.009273529052734375, 0.01036214828491211, 0.011450767517089844, 0.012539386749267578, 0.013628005981445312, 0.014716625213623047, 0.01580524444580078, 0.016893863677978516, 0.01798248291015625, 0.019071102142333984, 0.02015972137451172, 0.021248340606689453, 0.022336959838867188, 0.023425579071044922, 0.024514198303222656, 0.02560281753540039, 0.026691436767578125, 0.02778005599975586, 0.028868675231933594, 0.029957294464111328, 0.031045913696289062, 0.0321345329284668, 0.03322315216064453, 0.034311771392822266, 0.035400390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 1.0, 4.0, 9.0, 10.0, 4.0, 9.0, 21.0, 32.0, 28.0, 56.0, 60.0, 101.0, 135.0, 128.0, 114.0, 76.0, 45.0, 39.0, 26.0, 19.0, 16.0, 18.0, 10.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.838539123535156e-05, -3.7264078855514526e-05, -3.614276647567749e-05, -3.5021454095840454e-05, -3.390014171600342e-05, -3.277882933616638e-05, -3.1657516956329346e-05, -3.053620457649231e-05, -2.9414892196655273e-05, -2.8293579816818237e-05, -2.71722674369812e-05, -2.6050955057144165e-05, -2.492964267730713e-05, -2.3808330297470093e-05, -2.2687017917633057e-05, -2.156570553779602e-05, -2.0444393157958984e-05, -1.9323080778121948e-05, -1.8201768398284912e-05, -1.7080456018447876e-05, -1.595914363861084e-05, -1.4837831258773804e-05, -1.3716518878936768e-05, -1.2595206499099731e-05, -1.1473894119262695e-05, -1.035258173942566e-05, -9.231269359588623e-06, -8.109956979751587e-06, -6.988644599914551e-06, -5.867332220077515e-06, -4.7460198402404785e-06, -3.6247074604034424e-06, -2.5033950805664062e-06, -1.3820827007293701e-06, -2.60770320892334e-07, 8.605420589447021e-07, 1.9818544387817383e-06, 3.1031668186187744e-06, 4.2244791984558105e-06, 5.345791578292847e-06, 6.467103958129883e-06, 7.588416337966919e-06, 8.709728717803955e-06, 9.831041097640991e-06, 1.0952353477478027e-05, 1.2073665857315063e-05, 1.31949782371521e-05, 1.4316290616989136e-05, 1.5437602996826172e-05, 1.6558915376663208e-05, 1.7680227756500244e-05, 1.880154013633728e-05, 1.9922852516174316e-05, 2.1044164896011353e-05, 2.216547727584839e-05, 2.3286789655685425e-05, 2.440810203552246e-05, 2.5529414415359497e-05, 2.6650726795196533e-05, 2.777203917503357e-05, 2.8893351554870605e-05, 3.001466393470764e-05, 3.113597631454468e-05, 3.2257288694381714e-05, 3.337860107421875e-05]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 6.0, 3.0, 9.0, 13.0, 25.0, 20.0, 41.0, 53.0, 78.0, 71.0, 145.0, 192.0, 271.0, 389.0, 531.0, 789.0, 1101.0, 1693.0, 2559.0, 3993.0, 6826.0, 11763.0, 21910.0, 43226.0, 96342.0, 287944.0, 350819.0, 111805.0, 48496.0, 24185.0, 13003.0, 7278.0, 4439.0, 2732.0, 1750.0, 1275.0, 779.0, 595.0, 421.0, 283.0, 201.0, 134.0, 104.0, 73.0, 47.0, 40.0, 33.0, 23.0, 11.0, 11.0, 7.0, 9.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.02764892578125, -0.02678704261779785, -0.025925159454345703, -0.025063276290893555, -0.024201393127441406, -0.023339509963989258, -0.02247762680053711, -0.02161574363708496, -0.020753860473632812, -0.019891977310180664, -0.019030094146728516, -0.018168210983276367, -0.01730632781982422, -0.01644444465637207, -0.015582561492919922, -0.014720678329467773, -0.013858795166015625, -0.012996912002563477, -0.012135028839111328, -0.01127314567565918, -0.010411262512207031, -0.009549379348754883, -0.008687496185302734, -0.007825613021850586, -0.0069637298583984375, -0.006101846694946289, -0.005239963531494141, -0.004378080368041992, -0.0035161972045898438, -0.0026543140411376953, -0.0017924308776855469, -0.0009305477142333984, -6.866455078125e-05, 0.0007932186126708984, 0.0016551017761230469, 0.0025169849395751953, 0.0033788681030273438, 0.004240751266479492, 0.005102634429931641, 0.005964517593383789, 0.0068264007568359375, 0.007688283920288086, 0.008550167083740234, 0.009412050247192383, 0.010273933410644531, 0.01113581657409668, 0.011997699737548828, 0.012859582901000977, 0.013721466064453125, 0.014583349227905273, 0.015445232391357422, 0.01630711555480957, 0.01716899871826172, 0.018030881881713867, 0.018892765045166016, 0.019754648208618164, 0.020616531372070312, 0.02147841453552246, 0.02234029769897461, 0.023202180862426758, 0.024064064025878906, 0.024925947189331055, 0.025787830352783203, 0.02664971351623535, 0.0275115966796875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 11.0, 3.0, 8.0, 12.0, 11.0, 20.0, 25.0, 30.0, 32.0, 37.0, 46.0, 69.0, 72.0, 67.0, 76.0, 78.0, 69.0, 69.0, 63.0, 35.0, 35.0, 32.0, 21.0, 13.0, 15.0, 11.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00856781005859375, -0.008302688598632812, -0.008037567138671875, -0.0077724456787109375, -0.00750732421875, -0.0072422027587890625, -0.006977081298828125, -0.0067119598388671875, -0.00644683837890625, -0.0061817169189453125, -0.005916595458984375, -0.0056514739990234375, -0.0053863525390625, -0.0051212310791015625, -0.004856109619140625, -0.0045909881591796875, -0.00432586669921875, -0.0040607452392578125, -0.003795623779296875, -0.0035305023193359375, -0.003265380859375, -0.0030002593994140625, -0.002735137939453125, -0.0024700164794921875, -0.00220489501953125, -0.0019397735595703125, -0.001674652099609375, -0.0014095306396484375, -0.0011444091796875, -0.0008792877197265625, -0.000614166259765625, -0.0003490447998046875, -8.392333984375e-05, 0.0001811981201171875, 0.000446319580078125, 0.0007114410400390625, 0.0009765625, 0.0012416839599609375, 0.001506805419921875, 0.0017719268798828125, 0.00203704833984375, 0.0023021697998046875, 0.002567291259765625, 0.0028324127197265625, 0.0030975341796875, 0.0033626556396484375, 0.003627777099609375, 0.0038928985595703125, 0.00415802001953125, 0.0044231414794921875, 0.004688262939453125, 0.0049533843994140625, 0.005218505859375, 0.0054836273193359375, 0.005748748779296875, 0.0060138702392578125, 0.00627899169921875, 0.0065441131591796875, 0.006809234619140625, 0.0070743560791015625, 0.0073394775390625, 0.0076045989990234375, 0.007869720458984375, 0.008134841918945312, 0.00839996337890625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 17.0, 16.0, 23.0, 34.0, 38.0, 49.0, 88.0, 128.0, 146.0, 110.0, 85.0, 58.0, 43.0, 25.0, 17.0, 21.0, 19.0, 6.0, 16.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.39168548583984, -62.9315185546875, -60.471351623535156, -58.01118469238281, -55.5510139465332, -53.09084701538086, -50.630680084228516, -48.170509338378906, -45.71034240722656, -43.25017547607422, -40.790008544921875, -38.32984161376953, -35.86967086791992, -33.40950393676758, -30.949337005615234, -28.489168167114258, -26.029003143310547, -23.568836212158203, -21.108667373657227, -18.648500442504883, -16.188331604003906, -13.728164672851562, -11.267997741699219, -8.807828903198242, -6.347661972045898, -3.8874943256378174, -1.4273266792297363, 1.0328407287597656, 3.493008613586426, 5.953176498413086, 8.41334342956543, 10.873512268066406, 13.33367919921875, 15.79384708404541, 18.25401496887207, 20.714181900024414, 23.17435073852539, 25.634517669677734, 28.094684600830078, 30.554853439331055, 33.01502227783203, 35.475189208984375, 37.93535614013672, 40.39552307128906, 42.85569381713867, 45.315860748291016, 47.77602767944336, 50.23619842529297, 52.69636154174805, 55.15652847290039, 57.616695404052734, 60.076866149902344, 62.53703308105469, 64.99720001220703, 67.45736694335938, 69.91753387451172, 72.37770080566406, 74.8378677368164, 77.29803466796875, 79.7582015991211, 82.21836853027344, 84.67854309082031, 87.13870239257812, 89.598876953125, 92.05904388427734]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 11.0, 10.0, 12.0, 10.0, 14.0, 9.0, 23.0, 13.0, 19.0, 21.0, 25.0, 25.0, 38.0, 26.0, 33.0, 33.0, 34.0, 36.0, 38.0, 39.0, 39.0, 39.0, 44.0, 33.0, 46.0, 45.0, 41.0, 28.0, 21.0, 19.0, 17.0, 20.0, 29.0, 13.0, 13.0, 18.0, 10.0, 10.0, 7.0, 7.0, 8.0, 3.0, 3.0, 7.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.07429504394531, -37.827972412109375, -36.58164596557617, -35.335323333740234, -34.0890007019043, -32.84267807006836, -31.596351623535156, -30.35002899169922, -29.10370635986328, -27.85738182067871, -26.611059188842773, -25.364734649658203, -24.118412017822266, -22.872087478637695, -21.625762939453125, -20.379440307617188, -19.133115768432617, -17.886791229248047, -16.64046859741211, -15.394144058227539, -14.147821426391602, -12.901496887207031, -11.655173301696777, -10.408849716186523, -9.16252613067627, -7.916202545166016, -6.669878959655762, -5.42355489730835, -4.177231311798096, -2.930907726287842, -1.6845836639404297, -0.4382600784301758, 0.8080635070800781, 2.054387092590332, 3.300710916519165, 4.547034740447998, 5.793358325958252, 7.039681911468506, 8.286005973815918, 9.532329559326172, 10.778653144836426, 12.02497673034668, 13.271300315856934, 14.517623901367188, 15.763948440551758, 17.010271072387695, 18.256595611572266, 19.502918243408203, 20.749242782592773, 21.995567321777344, 23.24188995361328, 24.48821449279785, 25.73453712463379, 26.98086166381836, 28.227184295654297, 29.473508834838867, 30.719833374023438, 31.966157913208008, 33.21248245239258, 34.458805084228516, 35.70512771606445, 36.95145034790039, 38.197776794433594, 39.44409942626953, 40.69042205810547]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 5.0, 16.0, 28.0, 41.0, 61.0, 76.0, 113.0, 170.0, 232.0, 349.0, 519.0, 728.0, 990.0, 1515.0, 2036.0, 2868.0, 4317.0, 6022.0, 9043.0, 13435.0, 20526.0, 31842.0, 49683.0, 84932.0, 163216.0, 251354.0, 168659.0, 87959.0, 51218.0, 32037.0, 20839.0, 13741.0, 9295.0, 6370.0, 4509.0, 2932.0, 2020.0, 1483.0, 1002.0, 710.0, 469.0, 336.0, 257.0, 204.0, 105.0, 74.0, 59.0, 37.0, 41.0, 29.0, 14.0, 13.0, 8.0, 9.0, 3.0, 3.0, 1.0], "bins": [-71.5625, -69.3623046875, -67.162109375, -64.9619140625, -62.76171875, -60.5615234375, -58.361328125, -56.1611328125, -53.9609375, -51.7607421875, -49.560546875, -47.3603515625, -45.16015625, -42.9599609375, -40.759765625, -38.5595703125, -36.359375, -34.1591796875, -31.958984375, -29.7587890625, -27.55859375, -25.3583984375, -23.158203125, -20.9580078125, -18.7578125, -16.5576171875, -14.357421875, -12.1572265625, -9.95703125, -7.7568359375, -5.556640625, -3.3564453125, -1.15625, 1.0439453125, 3.244140625, 5.4443359375, 7.64453125, 9.8447265625, 12.044921875, 14.2451171875, 16.4453125, 18.6455078125, 20.845703125, 23.0458984375, 25.24609375, 27.4462890625, 29.646484375, 31.8466796875, 34.046875, 36.2470703125, 38.447265625, 40.6474609375, 42.84765625, 45.0478515625, 47.248046875, 49.4482421875, 51.6484375, 53.8486328125, 56.048828125, 58.2490234375, 60.44921875, 62.6494140625, 64.849609375, 67.0498046875, 69.25]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 7.0, 8.0, 12.0, 12.0, 3.0, 9.0, 16.0, 16.0, 23.0, 21.0, 25.0, 27.0, 31.0, 25.0, 29.0, 30.0, 35.0, 34.0, 38.0, 32.0, 54.0, 35.0, 41.0, 27.0, 41.0, 32.0, 33.0, 39.0, 38.0, 23.0, 25.0, 17.0, 16.0, 20.0, 18.0, 15.0, 11.0, 11.0, 11.0, 8.0, 10.0, 4.0, 5.0, 3.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0], "bins": [-35.625, -34.607666015625, -33.59033203125, -32.572998046875, -31.5556640625, -30.538330078125, -29.52099609375, -28.503662109375, -27.486328125, -26.468994140625, -25.45166015625, -24.434326171875, -23.4169921875, -22.399658203125, -21.38232421875, -20.364990234375, -19.34765625, -18.330322265625, -17.31298828125, -16.295654296875, -15.2783203125, -14.260986328125, -13.24365234375, -12.226318359375, -11.208984375, -10.191650390625, -9.17431640625, -8.156982421875, -7.1396484375, -6.122314453125, -5.10498046875, -4.087646484375, -3.0703125, -2.052978515625, -1.03564453125, -0.018310546875, 0.9990234375, 2.016357421875, 3.03369140625, 4.051025390625, 5.068359375, 6.085693359375, 7.10302734375, 8.120361328125, 9.1376953125, 10.155029296875, 11.17236328125, 12.189697265625, 13.20703125, 14.224365234375, 15.24169921875, 16.259033203125, 17.2763671875, 18.293701171875, 19.31103515625, 20.328369140625, 21.345703125, 22.363037109375, 23.38037109375, 24.397705078125, 25.4150390625, 26.432373046875, 27.44970703125, 28.467041015625, 29.484375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 13.0, 21.0, 45.0, 40.0, 69.0, 88.0, 119.0, 187.0, 291.0, 406.0, 635.0, 1039.0, 1441.0, 2241.0, 3266.0, 4811.0, 7262.0, 10982.0, 16687.0, 26658.0, 41324.0, 68058.0, 125142.0, 242830.0, 217732.0, 108226.0, 61643.0, 37536.0, 24108.0, 15393.0, 10087.0, 6633.0, 4419.0, 2986.0, 2001.0, 1364.0, 897.0, 613.0, 453.0, 262.0, 180.0, 135.0, 76.0, 62.0, 24.0, 24.0, 15.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-70.8125, -68.5205078125, -66.228515625, -63.9365234375, -61.64453125, -59.3525390625, -57.060546875, -54.7685546875, -52.4765625, -50.1845703125, -47.892578125, -45.6005859375, -43.30859375, -41.0166015625, -38.724609375, -36.4326171875, -34.140625, -31.8486328125, -29.556640625, -27.2646484375, -24.97265625, -22.6806640625, -20.388671875, -18.0966796875, -15.8046875, -13.5126953125, -11.220703125, -8.9287109375, -6.63671875, -4.3447265625, -2.052734375, 0.2392578125, 2.53125, 4.8232421875, 7.115234375, 9.4072265625, 11.69921875, 13.9912109375, 16.283203125, 18.5751953125, 20.8671875, 23.1591796875, 25.451171875, 27.7431640625, 30.03515625, 32.3271484375, 34.619140625, 36.9111328125, 39.203125, 41.4951171875, 43.787109375, 46.0791015625, 48.37109375, 50.6630859375, 52.955078125, 55.2470703125, 57.5390625, 59.8310546875, 62.123046875, 64.4150390625, 66.70703125, 68.9990234375, 71.291015625, 73.5830078125, 75.875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 10.0, 6.0, 4.0, 3.0, 9.0, 11.0, 9.0, 10.0, 13.0, 6.0, 21.0, 17.0, 21.0, 32.0, 32.0, 30.0, 34.0, 25.0, 33.0, 34.0, 42.0, 36.0, 26.0, 41.0, 43.0, 34.0, 36.0, 36.0, 30.0, 28.0, 23.0, 28.0, 35.0, 20.0, 22.0, 19.0, 19.0, 22.0, 22.0, 14.0, 8.0, 9.0, 7.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.40625, -16.775390625, -16.14453125, -15.513671875, -14.8828125, -14.251953125, -13.62109375, -12.990234375, -12.359375, -11.728515625, -11.09765625, -10.466796875, -9.8359375, -9.205078125, -8.57421875, -7.943359375, -7.3125, -6.681640625, -6.05078125, -5.419921875, -4.7890625, -4.158203125, -3.52734375, -2.896484375, -2.265625, -1.634765625, -1.00390625, -0.373046875, 0.2578125, 0.888671875, 1.51953125, 2.150390625, 2.78125, 3.412109375, 4.04296875, 4.673828125, 5.3046875, 5.935546875, 6.56640625, 7.197265625, 7.828125, 8.458984375, 9.08984375, 9.720703125, 10.3515625, 10.982421875, 11.61328125, 12.244140625, 12.875, 13.505859375, 14.13671875, 14.767578125, 15.3984375, 16.029296875, 16.66015625, 17.291015625, 17.921875, 18.552734375, 19.18359375, 19.814453125, 20.4453125, 21.076171875, 21.70703125, 22.337890625, 22.96875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 10.0, 19.0, 25.0, 33.0, 56.0, 74.0, 101.0, 191.0, 233.0, 358.0, 557.0, 828.0, 1183.0, 1808.0, 2682.0, 4320.0, 6952.0, 11649.0, 20487.0, 37289.0, 77008.0, 197931.0, 359107.0, 173301.0, 69938.0, 34458.0, 18677.0, 10914.0, 6577.0, 4100.0, 2484.0, 1735.0, 1122.0, 750.0, 516.0, 317.0, 270.0, 152.0, 121.0, 87.0, 41.0, 32.0, 15.0, 13.0, 15.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.39453125, -1.354034423828125, -1.31353759765625, -1.273040771484375, -1.2325439453125, -1.192047119140625, -1.15155029296875, -1.111053466796875, -1.070556640625, -1.030059814453125, -0.98956298828125, -0.949066162109375, -0.9085693359375, -0.868072509765625, -0.82757568359375, -0.787078857421875, -0.74658203125, -0.706085205078125, -0.66558837890625, -0.625091552734375, -0.5845947265625, -0.544097900390625, -0.50360107421875, -0.463104248046875, -0.422607421875, -0.382110595703125, -0.34161376953125, -0.301116943359375, -0.2606201171875, -0.220123291015625, -0.17962646484375, -0.139129638671875, -0.0986328125, -0.058135986328125, -0.01763916015625, 0.022857666015625, 0.0633544921875, 0.103851318359375, 0.14434814453125, 0.184844970703125, 0.225341796875, 0.265838623046875, 0.30633544921875, 0.346832275390625, 0.3873291015625, 0.427825927734375, 0.46832275390625, 0.508819580078125, 0.54931640625, 0.589813232421875, 0.63031005859375, 0.670806884765625, 0.7113037109375, 0.751800537109375, 0.79229736328125, 0.832794189453125, 0.873291015625, 0.913787841796875, 0.95428466796875, 0.994781494140625, 1.0352783203125, 1.075775146484375, 1.11627197265625, 1.156768798828125, 1.197265625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 15.0, 8.0, 16.0, 18.0, 15.0, 24.0, 28.0, 40.0, 38.0, 52.0, 71.0, 94.0, 106.0, 107.0, 71.0, 75.0, 47.0, 43.0, 24.0, 20.0, 16.0, 16.0, 14.0, 11.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0004019737243652344, -0.00039042532444000244, -0.0003788769245147705, -0.0003673285245895386, -0.00035578012466430664, -0.0003442317247390747, -0.0003326833248138428, -0.00032113492488861084, -0.0003095865249633789, -0.00029803812503814697, -0.00028648972511291504, -0.0002749413251876831, -0.00026339292526245117, -0.00025184452533721924, -0.0002402961254119873, -0.00022874772548675537, -0.00021719932556152344, -0.0002056509256362915, -0.00019410252571105957, -0.00018255412578582764, -0.0001710057258605957, -0.00015945732593536377, -0.00014790892601013184, -0.0001363605260848999, -0.00012481212615966797, -0.00011326372623443604, -0.0001017153263092041, -9.016692638397217e-05, -7.861852645874023e-05, -6.70701265335083e-05, -5.552172660827637e-05, -4.3973326683044434e-05, -3.24249267578125e-05, -2.0876526832580566e-05, -9.328126907348633e-06, 2.2202730178833008e-06, 1.3768672943115234e-05, 2.5317072868347168e-05, 3.68654727935791e-05, 4.8413872718811035e-05, 5.996227264404297e-05, 7.15106725692749e-05, 8.305907249450684e-05, 9.460747241973877e-05, 0.0001061558723449707, 0.00011770427227020264, 0.00012925267219543457, 0.0001408010721206665, 0.00015234947204589844, 0.00016389787197113037, 0.0001754462718963623, 0.00018699467182159424, 0.00019854307174682617, 0.0002100914716720581, 0.00022163987159729004, 0.00023318827152252197, 0.0002447366714477539, 0.00025628507137298584, 0.0002678334712982178, 0.0002793818712234497, 0.00029093027114868164, 0.0003024786710739136, 0.0003140270709991455, 0.00032557547092437744, 0.0003371238708496094]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 10.0, 12.0, 14.0, 18.0, 25.0, 35.0, 50.0, 84.0, 100.0, 123.0, 200.0, 255.0, 402.0, 576.0, 816.0, 1174.0, 1768.0, 2717.0, 4218.0, 6693.0, 10712.0, 18208.0, 31497.0, 59683.0, 131199.0, 304045.0, 252357.0, 103545.0, 49138.0, 26785.0, 15412.0, 9398.0, 5999.0, 3728.0, 2385.0, 1617.0, 1072.0, 728.0, 509.0, 402.0, 238.0, 158.0, 135.0, 93.0, 61.0, 45.0, 29.0, 27.0, 17.0, 15.0, 11.0, 10.0, 0.0, 3.0, 4.0, 1.0, 1.0], "bins": [-1.1376953125, -1.1030731201171875, -1.068450927734375, -1.0338287353515625, -0.99920654296875, -0.9645843505859375, -0.929962158203125, -0.8953399658203125, -0.8607177734375, -0.8260955810546875, -0.791473388671875, -0.7568511962890625, -0.72222900390625, -0.6876068115234375, -0.652984619140625, -0.6183624267578125, -0.583740234375, -0.5491180419921875, -0.514495849609375, -0.4798736572265625, -0.44525146484375, -0.4106292724609375, -0.376007080078125, -0.3413848876953125, -0.3067626953125, -0.2721405029296875, -0.237518310546875, -0.2028961181640625, -0.16827392578125, -0.1336517333984375, -0.099029541015625, -0.0644073486328125, -0.02978515625, 0.0048370361328125, 0.039459228515625, 0.0740814208984375, 0.10870361328125, 0.1433258056640625, 0.177947998046875, 0.2125701904296875, 0.2471923828125, 0.2818145751953125, 0.316436767578125, 0.3510589599609375, 0.38568115234375, 0.4203033447265625, 0.454925537109375, 0.4895477294921875, 0.524169921875, 0.5587921142578125, 0.593414306640625, 0.6280364990234375, 0.66265869140625, 0.6972808837890625, 0.731903076171875, 0.7665252685546875, 0.8011474609375, 0.8357696533203125, 0.870391845703125, 0.9050140380859375, 0.93963623046875, 0.9742584228515625, 1.008880615234375, 1.0435028076171875, 1.078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 8.0, 13.0, 18.0, 14.0, 11.0, 28.0, 29.0, 25.0, 45.0, 38.0, 59.0, 68.0, 61.0, 57.0, 66.0, 71.0, 48.0, 44.0, 45.0, 34.0, 37.0, 27.0, 24.0, 22.0, 17.0, 12.0, 13.0, 10.0, 8.0, 8.0, 6.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35546875, -0.3447761535644531, -0.33408355712890625, -0.3233909606933594, -0.3126983642578125, -0.3020057678222656, -0.29131317138671875, -0.2806205749511719, -0.269927978515625, -0.2592353820800781, -0.24854278564453125, -0.23785018920898438, -0.2271575927734375, -0.21646499633789062, -0.20577239990234375, -0.19507980346679688, -0.18438720703125, -0.17369461059570312, -0.16300201416015625, -0.15230941772460938, -0.1416168212890625, -0.13092422485351562, -0.12023162841796875, -0.10953903198242188, -0.098846435546875, -0.08815383911132812, -0.07746124267578125, -0.06676864624023438, -0.0560760498046875, -0.045383453369140625, -0.03469085693359375, -0.023998260498046875, -0.0133056640625, -0.002613067626953125, 0.00807952880859375, 0.018772125244140625, 0.0294647216796875, 0.040157318115234375, 0.05084991455078125, 0.061542510986328125, 0.072235107421875, 0.08292770385742188, 0.09362030029296875, 0.10431289672851562, 0.1150054931640625, 0.12569808959960938, 0.13639068603515625, 0.14708328247070312, 0.15777587890625, 0.16846847534179688, 0.17916107177734375, 0.18985366821289062, 0.2005462646484375, 0.21123886108398438, 0.22193145751953125, 0.23262405395507812, 0.243316650390625, 0.2540092468261719, 0.26470184326171875, 0.2753944396972656, 0.2860870361328125, 0.2967796325683594, 0.30747222900390625, 0.3181648254394531, 0.328857421875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 7.0, 15.0, 13.0, 6.0, 26.0, 18.0, 34.0, 53.0, 55.0, 88.0, 125.0, 135.0, 102.0, 92.0, 51.0, 40.0, 19.0, 22.0, 16.0, 16.0, 9.0, 15.0, 10.0, 7.0, 3.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.350677490234375, -47.32404708862305, -45.29741668701172, -43.270782470703125, -41.2441520690918, -39.21752166748047, -37.190887451171875, -35.16425704956055, -33.13762664794922, -31.11099624633789, -29.08436393737793, -27.05773162841797, -25.03110122680664, -23.004470825195312, -20.97783851623535, -18.95120620727539, -16.924575805664062, -14.897944450378418, -12.871313095092773, -10.844681739807129, -8.818050384521484, -6.79141902923584, -4.764787673950195, -2.738156318664551, -0.7115249633789062, 1.3151063919067383, 3.341737747192383, 5.368369102478027, 7.395000457763672, 9.421631813049316, 11.448263168334961, 13.474894523620605, 15.50152587890625, 17.528156280517578, 19.55478858947754, 21.5814208984375, 23.608051300048828, 25.634681701660156, 27.661314010620117, 29.687946319580078, 31.714576721191406, 33.741207122802734, 35.76783752441406, 37.794471740722656, 39.821102142333984, 41.84773254394531, 43.874366760253906, 45.900997161865234, 47.92762756347656, 49.95425796508789, 51.98088836669922, 54.00752258300781, 56.03415298461914, 58.06078338623047, 60.08741760253906, 62.11404800415039, 64.14067840576172, 66.16731262207031, 68.19393920898438, 70.22057342529297, 72.24720764160156, 74.27383422851562, 76.30046844482422, 78.32709503173828, 80.35372924804688]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 8.0, 12.0, 11.0, 20.0, 12.0, 19.0, 24.0, 24.0, 23.0, 32.0, 32.0, 32.0, 32.0, 31.0, 51.0, 40.0, 48.0, 38.0, 40.0, 34.0, 43.0, 52.0, 30.0, 45.0, 32.0, 34.0, 35.0, 23.0, 13.0, 22.0, 17.0, 19.0, 8.0, 13.0, 7.0, 6.0, 2.0, 5.0, 10.0, 6.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-41.59947204589844, -40.40892028808594, -39.21836853027344, -38.02781677246094, -36.83726501464844, -35.64671325683594, -34.45616149902344, -33.26560974121094, -32.07505798339844, -30.884506225585938, -29.693954467773438, -28.503402709960938, -27.312850952148438, -26.122299194335938, -24.931747436523438, -23.741195678710938, -22.55064582824707, -21.36009407043457, -20.16954231262207, -18.97899055480957, -17.78843879699707, -16.59788703918457, -15.407336235046387, -14.216784477233887, -13.026232719421387, -11.835680961608887, -10.645129203796387, -9.454578399658203, -8.264026641845703, -7.073474407196045, -5.882923126220703, -4.692371368408203, -3.501819610595703, -2.311267852783203, -1.1207163333892822, 0.06983518600463867, 1.2603869438171387, 2.4509387016296387, 3.6414899826049805, 4.8320417404174805, 6.0225934982299805, 7.2131452560424805, 8.40369701385498, 9.594247817993164, 10.784799575805664, 11.975351333618164, 13.165903091430664, 14.356454849243164, 15.547006607055664, 16.737558364868164, 17.928110122680664, 19.118661880493164, 20.309213638305664, 21.499765396118164, 22.69031524658203, 23.88086700439453, 25.07141876220703, 26.26197052001953, 27.45252227783203, 28.64307403564453, 29.83362579345703, 31.02417755126953, 32.21472930908203, 33.40528106689453, 34.59583282470703]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 10.0, 16.0, 16.0, 33.0, 34.0, 48.0, 74.0, 114.0, 148.0, 192.0, 322.0, 453.0, 584.0, 871.0, 1276.0, 1888.0, 2751.0, 3938.0, 5906.0, 9121.0, 13777.0, 21617.0, 34883.0, 58873.0, 110191.0, 324872.0, 1461104.0, 1522184.0, 341376.0, 115777.0, 60506.0, 35943.0, 22064.0, 14204.0, 9353.0, 6250.0, 4301.0, 2878.0, 1987.0, 1370.0, 914.0, 654.0, 439.0, 312.0, 209.0, 147.0, 100.0, 72.0, 44.0, 39.0, 16.0, 15.0, 5.0, 3.0, 2.0], "bins": [-68.1875, -66.29443359375, -64.4013671875, -62.50830078125, -60.615234375, -58.72216796875, -56.8291015625, -54.93603515625, -53.04296875, -51.14990234375, -49.2568359375, -47.36376953125, -45.470703125, -43.57763671875, -41.6845703125, -39.79150390625, -37.8984375, -36.00537109375, -34.1123046875, -32.21923828125, -30.326171875, -28.43310546875, -26.5400390625, -24.64697265625, -22.75390625, -20.86083984375, -18.9677734375, -17.07470703125, -15.181640625, -13.28857421875, -11.3955078125, -9.50244140625, -7.609375, -5.71630859375, -3.8232421875, -1.93017578125, -0.037109375, 1.85595703125, 3.7490234375, 5.64208984375, 7.53515625, 9.42822265625, 11.3212890625, 13.21435546875, 15.107421875, 17.00048828125, 18.8935546875, 20.78662109375, 22.6796875, 24.57275390625, 26.4658203125, 28.35888671875, 30.251953125, 32.14501953125, 34.0380859375, 35.93115234375, 37.82421875, 39.71728515625, 41.6103515625, 43.50341796875, 45.396484375, 47.28955078125, 49.1826171875, 51.07568359375, 52.96875]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 3.0, 7.0, 15.0, 14.0, 10.0, 19.0, 17.0, 30.0, 31.0, 35.0, 23.0, 38.0, 32.0, 47.0, 37.0, 43.0, 40.0, 44.0, 34.0, 46.0, 46.0, 48.0, 36.0, 39.0, 32.0, 36.0, 29.0, 22.0, 15.0, 22.0, 20.0, 9.0, 12.0, 14.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-34.375, -33.41162109375, -32.4482421875, -31.48486328125, -30.521484375, -29.55810546875, -28.5947265625, -27.63134765625, -26.66796875, -25.70458984375, -24.7412109375, -23.77783203125, -22.814453125, -21.85107421875, -20.8876953125, -19.92431640625, -18.9609375, -17.99755859375, -17.0341796875, -16.07080078125, -15.107421875, -14.14404296875, -13.1806640625, -12.21728515625, -11.25390625, -10.29052734375, -9.3271484375, -8.36376953125, -7.400390625, -6.43701171875, -5.4736328125, -4.51025390625, -3.546875, -2.58349609375, -1.6201171875, -0.65673828125, 0.306640625, 1.27001953125, 2.2333984375, 3.19677734375, 4.16015625, 5.12353515625, 6.0869140625, 7.05029296875, 8.013671875, 8.97705078125, 9.9404296875, 10.90380859375, 11.8671875, 12.83056640625, 13.7939453125, 14.75732421875, 15.720703125, 16.68408203125, 17.6474609375, 18.61083984375, 19.57421875, 20.53759765625, 21.5009765625, 22.46435546875, 23.427734375, 24.39111328125, 25.3544921875, 26.31787109375, 27.28125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 13.0, 30.0, 24.0, 45.0, 76.0, 87.0, 132.0, 181.0, 269.0, 444.0, 579.0, 908.0, 1284.0, 1922.0, 2686.0, 3979.0, 6167.0, 9102.0, 14366.0, 22233.0, 36077.0, 61171.0, 109768.0, 220913.0, 562192.0, 1945162.0, 658799.0, 244624.0, 118701.0, 65290.0, 38594.0, 23823.0, 15038.0, 9728.0, 6443.0, 4296.0, 2960.0, 1950.0, 1318.0, 920.0, 631.0, 427.0, 277.0, 222.0, 141.0, 95.0, 58.0, 48.0, 33.0, 13.0, 21.0, 15.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-55.9375, -54.2197265625, -52.501953125, -50.7841796875, -49.06640625, -47.3486328125, -45.630859375, -43.9130859375, -42.1953125, -40.4775390625, -38.759765625, -37.0419921875, -35.32421875, -33.6064453125, -31.888671875, -30.1708984375, -28.453125, -26.7353515625, -25.017578125, -23.2998046875, -21.58203125, -19.8642578125, -18.146484375, -16.4287109375, -14.7109375, -12.9931640625, -11.275390625, -9.5576171875, -7.83984375, -6.1220703125, -4.404296875, -2.6865234375, -0.96875, 0.7490234375, 2.466796875, 4.1845703125, 5.90234375, 7.6201171875, 9.337890625, 11.0556640625, 12.7734375, 14.4912109375, 16.208984375, 17.9267578125, 19.64453125, 21.3623046875, 23.080078125, 24.7978515625, 26.515625, 28.2333984375, 29.951171875, 31.6689453125, 33.38671875, 35.1044921875, 36.822265625, 38.5400390625, 40.2578125, 41.9755859375, 43.693359375, 45.4111328125, 47.12890625, 48.8466796875, 50.564453125, 52.2822265625, 54.0]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 4.0, 8.0, 12.0, 10.0, 9.0, 12.0, 12.0, 20.0, 22.0, 30.0, 39.0, 45.0, 44.0, 59.0, 76.0, 81.0, 114.0, 128.0, 164.0, 194.0, 293.0, 448.0, 554.0, 389.0, 227.0, 217.0, 149.0, 122.0, 121.0, 80.0, 67.0, 58.0, 36.0, 42.0, 32.0, 26.0, 27.0, 18.0, 18.0, 14.0, 9.0, 5.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0], "bins": [-16.8125, -16.2763671875, -15.740234375, -15.2041015625, -14.66796875, -14.1318359375, -13.595703125, -13.0595703125, -12.5234375, -11.9873046875, -11.451171875, -10.9150390625, -10.37890625, -9.8427734375, -9.306640625, -8.7705078125, -8.234375, -7.6982421875, -7.162109375, -6.6259765625, -6.08984375, -5.5537109375, -5.017578125, -4.4814453125, -3.9453125, -3.4091796875, -2.873046875, -2.3369140625, -1.80078125, -1.2646484375, -0.728515625, -0.1923828125, 0.34375, 0.8798828125, 1.416015625, 1.9521484375, 2.48828125, 3.0244140625, 3.560546875, 4.0966796875, 4.6328125, 5.1689453125, 5.705078125, 6.2412109375, 6.77734375, 7.3134765625, 7.849609375, 8.3857421875, 8.921875, 9.4580078125, 9.994140625, 10.5302734375, 11.06640625, 11.6025390625, 12.138671875, 12.6748046875, 13.2109375, 13.7470703125, 14.283203125, 14.8193359375, 15.35546875, 15.8916015625, 16.427734375, 16.9638671875, 17.5]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 6.0, 16.0, 10.0, 13.0, 16.0, 19.0, 25.0, 27.0, 48.0, 60.0, 110.0, 133.0, 131.0, 97.0, 73.0, 46.0, 37.0, 27.0, 28.0, 18.0, 12.0, 10.0, 10.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.24962615966797, -40.42340850830078, -38.597190856933594, -36.77096939086914, -34.94475173950195, -33.118534088134766, -31.292314529418945, -29.466094970703125, -27.639877319335938, -25.81365966796875, -23.98744010925293, -22.16122055053711, -20.335002899169922, -18.508785247802734, -16.682565689086914, -14.85634708404541, -13.030128479003906, -11.203909873962402, -9.377691268920898, -7.5514726638793945, -5.725254058837891, -3.8990354537963867, -2.072816848754883, -0.2465982437133789, 1.579620361328125, 3.405838966369629, 5.232057571411133, 7.058276176452637, 8.88449478149414, 10.710713386535645, 12.536931991577148, 14.363150596618652, 16.189369201660156, 18.015586853027344, 19.841806411743164, 21.668025970458984, 23.494243621826172, 25.32046127319336, 27.14668083190918, 28.972900390625, 30.799118041992188, 32.625335693359375, 34.45155334472656, 36.277774810791016, 38.1039924621582, 39.93021011352539, 41.756431579589844, 43.58264923095703, 45.40886688232422, 47.235084533691406, 49.061302185058594, 50.88752365112305, 52.713741302490234, 54.53995895385742, 56.366180419921875, 58.19239807128906, 60.01861572265625, 61.84483337402344, 63.671051025390625, 65.49726867675781, 67.323486328125, 69.14971160888672, 70.9759292602539, 72.8021469116211, 74.62836456298828]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 3.0, 8.0, 9.0, 15.0, 16.0, 14.0, 16.0, 14.0, 28.0, 22.0, 23.0, 31.0, 31.0, 32.0, 37.0, 31.0, 34.0, 34.0, 43.0, 34.0, 28.0, 37.0, 45.0, 32.0, 34.0, 38.0, 35.0, 32.0, 35.0, 20.0, 26.0, 20.0, 22.0, 18.0, 11.0, 12.0, 15.0, 8.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.16838264465332, -29.231956481933594, -28.295530319213867, -27.35910415649414, -26.422677993774414, -25.486251831054688, -24.54982566833496, -23.613399505615234, -22.676973342895508, -21.74054718017578, -20.804121017456055, -19.867694854736328, -18.9312686920166, -17.994842529296875, -17.05841636657715, -16.121990203857422, -15.185564041137695, -14.249137878417969, -13.312711715698242, -12.376285552978516, -11.439859390258789, -10.503433227539062, -9.567007064819336, -8.63058090209961, -7.694154739379883, -6.757728576660156, -5.82130241394043, -4.884876251220703, -3.9484500885009766, -3.01202392578125, -2.0755977630615234, -1.1391716003417969, -0.20274734497070312, 0.7336788177490234, 1.67010498046875, 2.6065311431884766, 3.542957305908203, 4.47938346862793, 5.415809631347656, 6.352235794067383, 7.288661956787109, 8.225088119506836, 9.161514282226562, 10.097940444946289, 11.034366607666016, 11.970792770385742, 12.907218933105469, 13.843645095825195, 14.780071258544922, 15.716497421264648, 16.652923583984375, 17.5893497467041, 18.525775909423828, 19.462202072143555, 20.39862823486328, 21.335054397583008, 22.271480560302734, 23.20790672302246, 24.144332885742188, 25.080759048461914, 26.01718521118164, 26.953611373901367, 27.890037536621094, 28.82646369934082, 29.762889862060547]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 10.0, 9.0, 7.0, 17.0, 20.0, 32.0, 35.0, 48.0, 76.0, 125.0, 148.0, 241.0, 343.0, 433.0, 594.0, 892.0, 1307.0, 1909.0, 2751.0, 3851.0, 5677.0, 8315.0, 12052.0, 17710.0, 26541.0, 41116.0, 64890.0, 114248.0, 266663.0, 209988.0, 98093.0, 57982.0, 36482.0, 24048.0, 16291.0, 10969.0, 7460.0, 5237.0, 3642.0, 2484.0, 1831.0, 1141.0, 826.0, 604.0, 417.0, 296.0, 192.0, 163.0, 110.0, 66.0, 42.0, 39.0, 32.0, 28.0, 8.0, 10.0, 8.0, 4.0, 6.0, 5.0, 2.0], "bins": [-8.28125, -8.021484375, -7.76171875, -7.501953125, -7.2421875, -6.982421875, -6.72265625, -6.462890625, -6.203125, -5.943359375, -5.68359375, -5.423828125, -5.1640625, -4.904296875, -4.64453125, -4.384765625, -4.125, -3.865234375, -3.60546875, -3.345703125, -3.0859375, -2.826171875, -2.56640625, -2.306640625, -2.046875, -1.787109375, -1.52734375, -1.267578125, -1.0078125, -0.748046875, -0.48828125, -0.228515625, 0.03125, 0.291015625, 0.55078125, 0.810546875, 1.0703125, 1.330078125, 1.58984375, 1.849609375, 2.109375, 2.369140625, 2.62890625, 2.888671875, 3.1484375, 3.408203125, 3.66796875, 3.927734375, 4.1875, 4.447265625, 4.70703125, 4.966796875, 5.2265625, 5.486328125, 5.74609375, 6.005859375, 6.265625, 6.525390625, 6.78515625, 7.044921875, 7.3046875, 7.564453125, 7.82421875, 8.083984375, 8.34375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 9.0, 15.0, 13.0, 8.0, 29.0, 14.0, 14.0, 23.0, 20.0, 24.0, 25.0, 26.0, 33.0, 45.0, 33.0, 34.0, 45.0, 28.0, 29.0, 30.0, 33.0, 55.0, 24.0, 37.0, 32.0, 30.0, 28.0, 30.0, 35.0, 25.0, 18.0, 23.0, 21.0, 16.0, 12.0, 9.0, 9.0, 5.0, 13.0, 7.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.078125, -28.169677734375, -27.26123046875, -26.352783203125, -25.4443359375, -24.535888671875, -23.62744140625, -22.718994140625, -21.810546875, -20.902099609375, -19.99365234375, -19.085205078125, -18.1767578125, -17.268310546875, -16.35986328125, -15.451416015625, -14.54296875, -13.634521484375, -12.72607421875, -11.817626953125, -10.9091796875, -10.000732421875, -9.09228515625, -8.183837890625, -7.275390625, -6.366943359375, -5.45849609375, -4.550048828125, -3.6416015625, -2.733154296875, -1.82470703125, -0.916259765625, -0.0078125, 0.900634765625, 1.80908203125, 2.717529296875, 3.6259765625, 4.534423828125, 5.44287109375, 6.351318359375, 7.259765625, 8.168212890625, 9.07666015625, 9.985107421875, 10.8935546875, 11.802001953125, 12.71044921875, 13.618896484375, 14.52734375, 15.435791015625, 16.34423828125, 17.252685546875, 18.1611328125, 19.069580078125, 19.97802734375, 20.886474609375, 21.794921875, 22.703369140625, 23.61181640625, 24.520263671875, 25.4287109375, 26.337158203125, 27.24560546875, 28.154052734375, 29.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 4.0, 9.0, 13.0, 20.0, 20.0, 27.0, 40.0, 53.0, 59.0, 96.0, 136.0, 187.0, 261.0, 368.0, 528.0, 661.0, 996.0, 1438.0, 2100.0, 2948.0, 4362.0, 6547.0, 9557.0, 14890.0, 22748.0, 36096.0, 58450.0, 105618.0, 255635.0, 256439.0, 105621.0, 58463.0, 35876.0, 23103.0, 14738.0, 9765.0, 6408.0, 4313.0, 2964.0, 2015.0, 1457.0, 1052.0, 694.0, 486.0, 350.0, 249.0, 208.0, 146.0, 100.0, 80.0, 47.0, 40.0, 27.0, 17.0, 12.0, 10.0, 7.0, 3.0, 7.0, 0.0, 2.0], "bins": [-8.359375, -8.09814453125, -7.8369140625, -7.57568359375, -7.314453125, -7.05322265625, -6.7919921875, -6.53076171875, -6.26953125, -6.00830078125, -5.7470703125, -5.48583984375, -5.224609375, -4.96337890625, -4.7021484375, -4.44091796875, -4.1796875, -3.91845703125, -3.6572265625, -3.39599609375, -3.134765625, -2.87353515625, -2.6123046875, -2.35107421875, -2.08984375, -1.82861328125, -1.5673828125, -1.30615234375, -1.044921875, -0.78369140625, -0.5224609375, -0.26123046875, 0.0, 0.26123046875, 0.5224609375, 0.78369140625, 1.044921875, 1.30615234375, 1.5673828125, 1.82861328125, 2.08984375, 2.35107421875, 2.6123046875, 2.87353515625, 3.134765625, 3.39599609375, 3.6572265625, 3.91845703125, 4.1796875, 4.44091796875, 4.7021484375, 4.96337890625, 5.224609375, 5.48583984375, 5.7470703125, 6.00830078125, 6.26953125, 6.53076171875, 6.7919921875, 7.05322265625, 7.314453125, 7.57568359375, 7.8369140625, 8.09814453125, 8.359375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 9.0, 11.0, 15.0, 16.0, 19.0, 27.0, 18.0, 26.0, 27.0, 24.0, 26.0, 36.0, 40.0, 47.0, 45.0, 49.0, 42.0, 39.0, 42.0, 36.0, 37.0, 40.0, 32.0, 34.0, 22.0, 35.0, 23.0, 29.0, 20.0, 13.0, 15.0, 14.0, 17.0, 11.0, 9.0, 5.0, 4.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.6875, -20.06640625, -19.4453125, -18.82421875, -18.203125, -17.58203125, -16.9609375, -16.33984375, -15.71875, -15.09765625, -14.4765625, -13.85546875, -13.234375, -12.61328125, -11.9921875, -11.37109375, -10.75, -10.12890625, -9.5078125, -8.88671875, -8.265625, -7.64453125, -7.0234375, -6.40234375, -5.78125, -5.16015625, -4.5390625, -3.91796875, -3.296875, -2.67578125, -2.0546875, -1.43359375, -0.8125, -0.19140625, 0.4296875, 1.05078125, 1.671875, 2.29296875, 2.9140625, 3.53515625, 4.15625, 4.77734375, 5.3984375, 6.01953125, 6.640625, 7.26171875, 7.8828125, 8.50390625, 9.125, 9.74609375, 10.3671875, 10.98828125, 11.609375, 12.23046875, 12.8515625, 13.47265625, 14.09375, 14.71484375, 15.3359375, 15.95703125, 16.578125, 17.19921875, 17.8203125, 18.44140625, 19.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 11.0, 10.0, 11.0, 13.0, 32.0, 33.0, 34.0, 55.0, 61.0, 98.0, 122.0, 138.0, 215.0, 280.0, 414.0, 542.0, 850.0, 1301.0, 1986.0, 2983.0, 4920.0, 8417.0, 15825.0, 34177.0, 89208.0, 359146.0, 364560.0, 90218.0, 34349.0, 16033.0, 8425.0, 4821.0, 3034.0, 1923.0, 1264.0, 888.0, 565.0, 420.0, 315.0, 222.0, 173.0, 134.0, 80.0, 72.0, 43.0, 37.0, 29.0, 18.0, 17.0, 9.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.027801513671875, -0.02695918083190918, -0.02611684799194336, -0.02527451515197754, -0.02443218231201172, -0.0235898494720459, -0.022747516632080078, -0.021905183792114258, -0.021062850952148438, -0.020220518112182617, -0.019378185272216797, -0.018535852432250977, -0.017693519592285156, -0.016851186752319336, -0.016008853912353516, -0.015166521072387695, -0.014324188232421875, -0.013481855392456055, -0.012639522552490234, -0.011797189712524414, -0.010954856872558594, -0.010112524032592773, -0.009270191192626953, -0.008427858352661133, -0.0075855255126953125, -0.006743192672729492, -0.005900859832763672, -0.0050585269927978516, -0.004216194152832031, -0.003373861312866211, -0.0025315284729003906, -0.0016891956329345703, -0.00084686279296875, -4.5299530029296875e-06, 0.0008378028869628906, 0.001680135726928711, 0.0025224685668945312, 0.0033648014068603516, 0.004207134246826172, 0.005049467086791992, 0.0058917999267578125, 0.006734132766723633, 0.007576465606689453, 0.008418798446655273, 0.009261131286621094, 0.010103464126586914, 0.010945796966552734, 0.011788129806518555, 0.012630462646484375, 0.013472795486450195, 0.014315128326416016, 0.015157461166381836, 0.015999794006347656, 0.016842126846313477, 0.017684459686279297, 0.018526792526245117, 0.019369125366210938, 0.020211458206176758, 0.021053791046142578, 0.0218961238861084, 0.02273845672607422, 0.02358078956604004, 0.02442312240600586, 0.02526545524597168, 0.0261077880859375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 6.0, 9.0, 6.0, 9.0, 14.0, 15.0, 13.0, 20.0, 40.0, 33.0, 59.0, 69.0, 73.0, 105.0, 84.0, 82.0, 83.0, 56.0, 40.0, 32.0, 31.0, 19.0, 20.0, 9.0, 7.0, 14.0, 7.0, 6.0, 10.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.8971972167491913e-05, -1.827441155910492e-05, -1.7576850950717926e-05, -1.6879290342330933e-05, -1.618172973394394e-05, -1.5484169125556946e-05, -1.4786608517169952e-05, -1.4089047908782959e-05, -1.3391487300395966e-05, -1.2693926692008972e-05, -1.1996366083621979e-05, -1.1298805475234985e-05, -1.0601244866847992e-05, -9.903684258460999e-06, -9.206123650074005e-06, -8.508563041687012e-06, -7.811002433300018e-06, -7.113441824913025e-06, -6.4158812165260315e-06, -5.718320608139038e-06, -5.020759999752045e-06, -4.323199391365051e-06, -3.625638782978058e-06, -2.9280781745910645e-06, -2.230517566204071e-06, -1.5329569578170776e-06, -8.353963494300842e-07, -1.3783574104309082e-07, 5.597248673439026e-07, 1.257285475730896e-06, 1.9548460841178894e-06, 2.652406692504883e-06, 3.3499673008918762e-06, 4.04752790927887e-06, 4.745088517665863e-06, 5.4426491260528564e-06, 6.14020973443985e-06, 6.837770342826843e-06, 7.535330951213837e-06, 8.23289155960083e-06, 8.930452167987823e-06, 9.628012776374817e-06, 1.032557338476181e-05, 1.1023133993148804e-05, 1.1720694601535797e-05, 1.241825520992279e-05, 1.3115815818309784e-05, 1.3813376426696777e-05, 1.451093703508377e-05, 1.5208497643470764e-05, 1.5906058251857758e-05, 1.660361886024475e-05, 1.7301179468631744e-05, 1.7998740077018738e-05, 1.869630068540573e-05, 1.9393861293792725e-05, 2.0091421902179718e-05, 2.078898251056671e-05, 2.1486543118953705e-05, 2.2184103727340698e-05, 2.288166433572769e-05, 2.3579224944114685e-05, 2.427678555250168e-05, 2.4974346160888672e-05]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 15.0, 12.0, 27.0, 34.0, 56.0, 61.0, 108.0, 149.0, 199.0, 273.0, 382.0, 610.0, 854.0, 1236.0, 1784.0, 2766.0, 4323.0, 7319.0, 12854.0, 24022.0, 50580.0, 129786.0, 439009.0, 225299.0, 72561.0, 32460.0, 16843.0, 9358.0, 5354.0, 3387.0, 2194.0, 1399.0, 998.0, 635.0, 490.0, 326.0, 223.0, 148.0, 121.0, 76.0, 61.0, 55.0, 24.0, 18.0, 18.0, 18.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0222625732421875, -0.02153778076171875, -0.02081298828125, -0.02008819580078125, -0.0193634033203125, -0.01863861083984375, -0.017913818359375, -0.01718902587890625, -0.0164642333984375, -0.01573944091796875, -0.0150146484375, -0.01428985595703125, -0.0135650634765625, -0.01284027099609375, -0.012115478515625, -0.01139068603515625, -0.0106658935546875, -0.00994110107421875, -0.00921630859375, -0.00849151611328125, -0.0077667236328125, -0.00704193115234375, -0.006317138671875, -0.00559234619140625, -0.0048675537109375, -0.00414276123046875, -0.00341796875, -0.00269317626953125, -0.0019683837890625, -0.00124359130859375, -0.000518798828125, 0.00020599365234375, 0.0009307861328125, 0.00165557861328125, 0.00238037109375, 0.00310516357421875, 0.0038299560546875, 0.00455474853515625, 0.005279541015625, 0.00600433349609375, 0.0067291259765625, 0.00745391845703125, 0.0081787109375, 0.00890350341796875, 0.0096282958984375, 0.01035308837890625, 0.011077880859375, 0.01180267333984375, 0.0125274658203125, 0.01325225830078125, 0.01397705078125, 0.01470184326171875, 0.0154266357421875, 0.01615142822265625, 0.016876220703125, 0.01760101318359375, 0.0183258056640625, 0.01905059814453125, 0.019775390625, 0.02050018310546875, 0.0212249755859375, 0.02194976806640625, 0.022674560546875, 0.02339935302734375, 0.0241241455078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 11.0, 11.0, 10.0, 13.0, 21.0, 11.0, 27.0, 38.0, 43.0, 53.0, 80.0, 73.0, 99.0, 93.0, 68.0, 80.0, 46.0, 39.0, 54.0, 20.0, 28.0, 10.0, 12.0, 10.0, 6.0, 7.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005985260009765625, -0.0057694315910339355, -0.005553603172302246, -0.005337774753570557, -0.005121946334838867, -0.004906117916107178, -0.004690289497375488, -0.004474461078643799, -0.004258632659912109, -0.00404280424118042, -0.0038269758224487305, -0.003611147403717041, -0.0033953189849853516, -0.003179490566253662, -0.0029636621475219727, -0.002747833728790283, -0.0025320053100585938, -0.0023161768913269043, -0.002100348472595215, -0.0018845200538635254, -0.001668691635131836, -0.0014528632164001465, -0.001237034797668457, -0.0010212063789367676, -0.0008053779602050781, -0.0005895495414733887, -0.0003737211227416992, -0.00015789270401000977, 5.793571472167969e-05, 0.00027376413345336914, 0.0004895925521850586, 0.000705420970916748, 0.0009212493896484375, 0.001137077808380127, 0.0013529062271118164, 0.0015687346458435059, 0.0017845630645751953, 0.0020003914833068848, 0.0022162199020385742, 0.0024320483207702637, 0.002647876739501953, 0.0028637051582336426, 0.003079533576965332, 0.0032953619956970215, 0.003511190414428711, 0.0037270188331604004, 0.00394284725189209, 0.004158675670623779, 0.004374504089355469, 0.004590332508087158, 0.004806160926818848, 0.005021989345550537, 0.0052378177642822266, 0.005453646183013916, 0.0056694746017456055, 0.005885303020477295, 0.006101131439208984, 0.006316959857940674, 0.006532788276672363, 0.006748616695404053, 0.006964445114135742, 0.007180273532867432, 0.007396101951599121, 0.0076119303703308105, 0.0078277587890625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 10.0, 12.0, 15.0, 19.0, 25.0, 23.0, 44.0, 56.0, 99.0, 137.0, 132.0, 112.0, 77.0, 48.0, 41.0, 26.0, 31.0, 17.0, 13.0, 7.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.989097595214844, -41.14594268798828, -39.30278778076172, -37.459632873535156, -35.616477966308594, -33.77332305908203, -31.930166244506836, -30.08700942993164, -28.243854522705078, -26.400699615478516, -24.557544708251953, -22.71438980102539, -20.871232986450195, -19.028078079223633, -17.18492317199707, -15.341767311096191, -13.498613357543945, -11.655458450317383, -9.812302589416504, -7.969147682189941, -6.125992298126221, -4.2828369140625, -2.4396820068359375, -0.5965261459350586, 1.246628761291504, 3.0897841453552246, 4.932939529418945, 6.776094436645508, 8.61924934387207, 10.46240520477295, 12.305560111999512, 14.14871597290039, 15.991870880126953, 17.835025787353516, 19.678180694580078, 21.52133560180664, 23.364492416381836, 25.2076473236084, 27.05080223083496, 28.893959045410156, 30.73711395263672, 32.58026885986328, 34.423423767089844, 36.266578674316406, 38.10973358154297, 39.95288848876953, 41.796043395996094, 43.63920211791992, 45.48235321044922, 47.32550811767578, 49.168663024902344, 51.011817932128906, 52.85497283935547, 54.69812774658203, 56.541282653808594, 58.38444137573242, 60.227596282958984, 62.07075119018555, 63.91390609741211, 65.75706481933594, 67.6002197265625, 69.44337463378906, 71.28652954101562, 73.12968444824219, 74.97283935546875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 3.0, 9.0, 8.0, 17.0, 15.0, 15.0, 15.0, 17.0, 24.0, 24.0, 21.0, 33.0, 30.0, 33.0, 38.0, 30.0, 33.0, 38.0, 39.0, 35.0, 29.0, 37.0, 43.0, 34.0, 33.0, 38.0, 34.0, 31.0, 35.0, 22.0, 25.0, 19.0, 23.0, 17.0, 12.0, 11.0, 15.0, 8.0, 9.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.347915649414062, -28.430574417114258, -27.513233184814453, -26.59589195251465, -25.678550720214844, -24.76120948791504, -23.843868255615234, -22.92652702331543, -22.009185791015625, -21.09184455871582, -20.174503326416016, -19.25716209411621, -18.339820861816406, -17.4224796295166, -16.505138397216797, -15.587797164916992, -14.670454978942871, -13.753113746643066, -12.835772514343262, -11.918431282043457, -11.001090049743652, -10.083747863769531, -9.166406631469727, -8.249065399169922, -7.331724643707275, -6.414383411407471, -5.497042179107666, -4.579700469970703, -3.6623594760894775, -2.7450180053710938, -1.827676773071289, -0.9103355407714844, 0.0070056915283203125, 0.9243469834327698, 1.8416882753372192, 2.7590296268463135, 3.676370859146118, 4.593712329864502, 5.511053562164307, 6.428394794464111, 7.345736026763916, 8.263077735900879, 9.180418968200684, 10.097760200500488, 11.015101432800293, 11.932442665100098, 12.849783897399902, 13.767125129699707, 14.684466361999512, 15.601807594299316, 16.519149780273438, 17.436491012573242, 18.353832244873047, 19.27117347717285, 20.188514709472656, 21.10585594177246, 22.023197174072266, 22.94053840637207, 23.857879638671875, 24.77522087097168, 25.692562103271484, 26.60990333557129, 27.527244567871094, 28.4445858001709, 29.361927032470703]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 10.0, 22.0, 22.0, 43.0, 70.0, 101.0, 138.0, 238.0, 346.0, 538.0, 757.0, 1181.0, 1847.0, 2738.0, 4371.0, 6549.0, 10171.0, 16339.0, 25516.0, 41286.0, 70920.0, 139051.0, 255012.0, 213828.0, 106109.0, 57082.0, 34538.0, 21408.0, 13493.0, 8752.0, 5549.0, 3697.0, 2379.0, 1477.0, 988.0, 692.0, 410.0, 315.0, 178.0, 144.0, 87.0, 51.0, 31.0, 33.0, 17.0, 7.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.0625, -58.17431640625, -56.2861328125, -54.39794921875, -52.509765625, -50.62158203125, -48.7333984375, -46.84521484375, -44.95703125, -43.06884765625, -41.1806640625, -39.29248046875, -37.404296875, -35.51611328125, -33.6279296875, -31.73974609375, -29.8515625, -27.96337890625, -26.0751953125, -24.18701171875, -22.298828125, -20.41064453125, -18.5224609375, -16.63427734375, -14.74609375, -12.85791015625, -10.9697265625, -9.08154296875, -7.193359375, -5.30517578125, -3.4169921875, -1.52880859375, 0.359375, 2.24755859375, 4.1357421875, 6.02392578125, 7.912109375, 9.80029296875, 11.6884765625, 13.57666015625, 15.46484375, 17.35302734375, 19.2412109375, 21.12939453125, 23.017578125, 24.90576171875, 26.7939453125, 28.68212890625, 30.5703125, 32.45849609375, 34.3466796875, 36.23486328125, 38.123046875, 40.01123046875, 41.8994140625, 43.78759765625, 45.67578125, 47.56396484375, 49.4521484375, 51.34033203125, 53.228515625, 55.11669921875, 57.0048828125, 58.89306640625, 60.78125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 4.0, 9.0, 2.0, 12.0, 11.0, 9.0, 15.0, 10.0, 19.0, 15.0, 21.0, 20.0, 29.0, 31.0, 31.0, 39.0, 37.0, 40.0, 49.0, 38.0, 32.0, 41.0, 38.0, 49.0, 45.0, 45.0, 28.0, 33.0, 24.0, 33.0, 20.0, 24.0, 28.0, 30.0, 22.0, 7.0, 16.0, 10.0, 8.0, 7.0, 8.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.671875, -25.81982421875, -24.9677734375, -24.11572265625, -23.263671875, -22.41162109375, -21.5595703125, -20.70751953125, -19.85546875, -19.00341796875, -18.1513671875, -17.29931640625, -16.447265625, -15.59521484375, -14.7431640625, -13.89111328125, -13.0390625, -12.18701171875, -11.3349609375, -10.48291015625, -9.630859375, -8.77880859375, -7.9267578125, -7.07470703125, -6.22265625, -5.37060546875, -4.5185546875, -3.66650390625, -2.814453125, -1.96240234375, -1.1103515625, -0.25830078125, 0.59375, 1.44580078125, 2.2978515625, 3.14990234375, 4.001953125, 4.85400390625, 5.7060546875, 6.55810546875, 7.41015625, 8.26220703125, 9.1142578125, 9.96630859375, 10.818359375, 11.67041015625, 12.5224609375, 13.37451171875, 14.2265625, 15.07861328125, 15.9306640625, 16.78271484375, 17.634765625, 18.48681640625, 19.3388671875, 20.19091796875, 21.04296875, 21.89501953125, 22.7470703125, 23.59912109375, 24.451171875, 25.30322265625, 26.1552734375, 27.00732421875, 27.859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 8.0, 11.0, 18.0, 18.0, 30.0, 58.0, 86.0, 90.0, 123.0, 200.0, 339.0, 544.0, 733.0, 996.0, 1612.0, 2331.0, 3508.0, 5162.0, 7555.0, 11528.0, 17047.0, 26072.0, 40607.0, 66562.0, 120995.0, 217688.0, 217486.0, 121566.0, 66817.0, 40695.0, 26104.0, 17139.0, 11296.0, 7679.0, 5167.0, 3511.0, 2310.0, 1537.0, 1099.0, 721.0, 516.0, 315.0, 210.0, 158.0, 106.0, 77.0, 49.0, 29.0, 27.0, 10.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-53.5625, -51.939453125, -50.31640625, -48.693359375, -47.0703125, -45.447265625, -43.82421875, -42.201171875, -40.578125, -38.955078125, -37.33203125, -35.708984375, -34.0859375, -32.462890625, -30.83984375, -29.216796875, -27.59375, -25.970703125, -24.34765625, -22.724609375, -21.1015625, -19.478515625, -17.85546875, -16.232421875, -14.609375, -12.986328125, -11.36328125, -9.740234375, -8.1171875, -6.494140625, -4.87109375, -3.248046875, -1.625, -0.001953125, 1.62109375, 3.244140625, 4.8671875, 6.490234375, 8.11328125, 9.736328125, 11.359375, 12.982421875, 14.60546875, 16.228515625, 17.8515625, 19.474609375, 21.09765625, 22.720703125, 24.34375, 25.966796875, 27.58984375, 29.212890625, 30.8359375, 32.458984375, 34.08203125, 35.705078125, 37.328125, 38.951171875, 40.57421875, 42.197265625, 43.8203125, 45.443359375, 47.06640625, 48.689453125, 50.3125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 11.0, 6.0, 6.0, 11.0, 7.0, 20.0, 19.0, 16.0, 14.0, 23.0, 23.0, 23.0, 27.0, 34.0, 43.0, 31.0, 39.0, 48.0, 39.0, 29.0, 45.0, 48.0, 49.0, 35.0, 43.0, 37.0, 28.0, 30.0, 34.0, 27.0, 21.0, 22.0, 9.0, 21.0, 18.0, 12.0, 14.0, 8.0, 9.0, 4.0, 3.0, 7.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-17.984375, -17.4576416015625, -16.930908203125, -16.4041748046875, -15.87744140625, -15.3507080078125, -14.823974609375, -14.2972412109375, -13.7705078125, -13.2437744140625, -12.717041015625, -12.1903076171875, -11.66357421875, -11.1368408203125, -10.610107421875, -10.0833740234375, -9.556640625, -9.0299072265625, -8.503173828125, -7.9764404296875, -7.44970703125, -6.9229736328125, -6.396240234375, -5.8695068359375, -5.3427734375, -4.8160400390625, -4.289306640625, -3.7625732421875, -3.23583984375, -2.7091064453125, -2.182373046875, -1.6556396484375, -1.12890625, -0.6021728515625, -0.075439453125, 0.4512939453125, 0.97802734375, 1.5047607421875, 2.031494140625, 2.5582275390625, 3.0849609375, 3.6116943359375, 4.138427734375, 4.6651611328125, 5.19189453125, 5.7186279296875, 6.245361328125, 6.7720947265625, 7.298828125, 7.8255615234375, 8.352294921875, 8.8790283203125, 9.40576171875, 9.9324951171875, 10.459228515625, 10.9859619140625, 11.5126953125, 12.0394287109375, 12.566162109375, 13.0928955078125, 13.61962890625, 14.1463623046875, 14.673095703125, 15.1998291015625, 15.7265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 19.0, 13.0, 28.0, 35.0, 57.0, 78.0, 125.0, 191.0, 337.0, 482.0, 789.0, 1275.0, 2072.0, 3492.0, 6160.0, 10684.0, 20269.0, 40065.0, 86109.0, 220953.0, 367510.0, 153883.0, 65056.0, 31278.0, 16121.0, 8750.0, 5086.0, 2978.0, 1702.0, 1101.0, 657.0, 406.0, 278.0, 165.0, 108.0, 71.0, 51.0, 27.0, 19.0, 17.0, 17.0, 6.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.748046875, -1.6939697265625, -1.639892578125, -1.5858154296875, -1.53173828125, -1.4776611328125, -1.423583984375, -1.3695068359375, -1.3154296875, -1.2613525390625, -1.207275390625, -1.1531982421875, -1.09912109375, -1.0450439453125, -0.990966796875, -0.9368896484375, -0.8828125, -0.8287353515625, -0.774658203125, -0.7205810546875, -0.66650390625, -0.6124267578125, -0.558349609375, -0.5042724609375, -0.4501953125, -0.3961181640625, -0.342041015625, -0.2879638671875, -0.23388671875, -0.1798095703125, -0.125732421875, -0.0716552734375, -0.017578125, 0.0364990234375, 0.090576171875, 0.1446533203125, 0.19873046875, 0.2528076171875, 0.306884765625, 0.3609619140625, 0.4150390625, 0.4691162109375, 0.523193359375, 0.5772705078125, 0.63134765625, 0.6854248046875, 0.739501953125, 0.7935791015625, 0.84765625, 0.9017333984375, 0.955810546875, 1.0098876953125, 1.06396484375, 1.1180419921875, 1.172119140625, 1.2261962890625, 1.2802734375, 1.3343505859375, 1.388427734375, 1.4425048828125, 1.49658203125, 1.5506591796875, 1.604736328125, 1.6588134765625, 1.712890625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 14.0, 11.0, 4.0, 9.0, 21.0, 27.0, 40.0, 44.0, 56.0, 89.0, 110.0, 122.0, 104.0, 83.0, 54.0, 49.0, 40.0, 24.0, 17.0, 14.0, 12.0, 14.0, 12.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003838539123535156, -0.00037334486842155457, -0.0003628358244895935, -0.00035232678055763245, -0.0003418177366256714, -0.00033130869269371033, -0.00032079964876174927, -0.0003102906048297882, -0.00029978156089782715, -0.0002892725169658661, -0.00027876347303390503, -0.00026825442910194397, -0.0002577453851699829, -0.00024723634123802185, -0.0002367272973060608, -0.00022621825337409973, -0.00021570920944213867, -0.0002052001655101776, -0.00019469112157821655, -0.0001841820776462555, -0.00017367303371429443, -0.00016316398978233337, -0.00015265494585037231, -0.00014214590191841125, -0.0001316368579864502, -0.00012112781405448914, -0.00011061877012252808, -0.00010010972619056702, -8.960068225860596e-05, -7.90916383266449e-05, -6.858259439468384e-05, -5.807355046272278e-05, -4.756450653076172e-05, -3.705546259880066e-05, -2.65464186668396e-05, -1.603737473487854e-05, -5.5283308029174805e-06, 4.980713129043579e-06, 1.548975706100464e-05, 2.5998800992965698e-05, 3.650784492492676e-05, 4.701688885688782e-05, 5.752593278884888e-05, 6.803497672080994e-05, 7.8544020652771e-05, 8.905306458473206e-05, 9.956210851669312e-05, 0.00011007115244865417, 0.00012058019638061523, 0.0001310892403125763, 0.00014159828424453735, 0.0001521073281764984, 0.00016261637210845947, 0.00017312541604042053, 0.0001836344599723816, 0.00019414350390434265, 0.0002046525478363037, 0.00021516159176826477, 0.00022567063570022583, 0.0002361796796321869, 0.00024668872356414795, 0.000257197767496109, 0.00026770681142807007, 0.00027821585536003113, 0.0002887248992919922]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 13.0, 12.0, 27.0, 25.0, 32.0, 32.0, 43.0, 70.0, 110.0, 153.0, 197.0, 261.0, 374.0, 468.0, 716.0, 1107.0, 1603.0, 2579.0, 4002.0, 6464.0, 10990.0, 18529.0, 32926.0, 62641.0, 138914.0, 348303.0, 225114.0, 87925.0, 43991.0, 24251.0, 13814.0, 8380.0, 5064.0, 3188.0, 1944.0, 1233.0, 882.0, 611.0, 447.0, 308.0, 215.0, 145.0, 120.0, 93.0, 65.0, 40.0, 39.0, 39.0, 19.0, 10.0, 13.0, 13.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.57421875, -1.5246124267578125, -1.475006103515625, -1.4253997802734375, -1.37579345703125, -1.3261871337890625, -1.276580810546875, -1.2269744873046875, -1.1773681640625, -1.1277618408203125, -1.078155517578125, -1.0285491943359375, -0.97894287109375, -0.9293365478515625, -0.879730224609375, -0.8301239013671875, -0.780517578125, -0.7309112548828125, -0.681304931640625, -0.6316986083984375, -0.58209228515625, -0.5324859619140625, -0.482879638671875, -0.4332733154296875, -0.3836669921875, -0.3340606689453125, -0.284454345703125, -0.2348480224609375, -0.18524169921875, -0.1356353759765625, -0.086029052734375, -0.0364227294921875, 0.01318359375, 0.0627899169921875, 0.112396240234375, 0.1620025634765625, 0.21160888671875, 0.2612152099609375, 0.310821533203125, 0.3604278564453125, 0.4100341796875, 0.4596405029296875, 0.509246826171875, 0.5588531494140625, 0.60845947265625, 0.6580657958984375, 0.707672119140625, 0.7572784423828125, 0.806884765625, 0.8564910888671875, 0.906097412109375, 0.9557037353515625, 1.00531005859375, 1.0549163818359375, 1.104522705078125, 1.1541290283203125, 1.2037353515625, 1.2533416748046875, 1.302947998046875, 1.3525543212890625, 1.40216064453125, 1.4517669677734375, 1.501373291015625, 1.5509796142578125, 1.6005859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 13.0, 13.0, 20.0, 16.0, 27.0, 27.0, 36.0, 46.0, 46.0, 51.0, 75.0, 74.0, 67.0, 58.0, 62.0, 49.0, 49.0, 44.0, 32.0, 31.0, 24.0, 28.0, 22.0, 15.0, 12.0, 10.0, 11.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.5107421875, -0.49472808837890625, -0.4787139892578125, -0.46269989013671875, -0.446685791015625, -0.43067169189453125, -0.4146575927734375, -0.39864349365234375, -0.38262939453125, -0.36661529541015625, -0.3506011962890625, -0.33458709716796875, -0.318572998046875, -0.30255889892578125, -0.2865447998046875, -0.27053070068359375, -0.2545166015625, -0.23850250244140625, -0.2224884033203125, -0.20647430419921875, -0.190460205078125, -0.17444610595703125, -0.1584320068359375, -0.14241790771484375, -0.12640380859375, -0.11038970947265625, -0.0943756103515625, -0.07836151123046875, -0.062347412109375, -0.04633331298828125, -0.0303192138671875, -0.01430511474609375, 0.001708984375, 0.01772308349609375, 0.0337371826171875, 0.04975128173828125, 0.065765380859375, 0.08177947998046875, 0.0977935791015625, 0.11380767822265625, 0.12982177734375, 0.14583587646484375, 0.1618499755859375, 0.17786407470703125, 0.193878173828125, 0.20989227294921875, 0.2259063720703125, 0.24192047119140625, 0.2579345703125, 0.27394866943359375, 0.2899627685546875, 0.30597686767578125, 0.321990966796875, 0.33800506591796875, 0.3540191650390625, 0.37003326416015625, 0.38604736328125, 0.40206146240234375, 0.4180755615234375, 0.43408966064453125, 0.450103759765625, 0.46611785888671875, 0.4821319580078125, 0.49814605712890625, 0.51416015625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 15.0, 21.0, 21.0, 30.0, 47.0, 57.0, 88.0, 113.0, 134.0, 108.0, 86.0, 56.0, 41.0, 37.0, 23.0, 24.0, 16.0, 11.0, 15.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.27523422241211, -34.67055130004883, -33.06587219238281, -31.46118927001953, -29.856508255004883, -28.251827239990234, -26.647144317626953, -25.042463302612305, -23.437782287597656, -21.833101272583008, -20.22842025756836, -18.623737335205078, -17.01905632019043, -15.414375305175781, -13.809693336486816, -12.205011367797852, -10.600330352783203, -8.995649337768555, -7.39096736907959, -5.786285877227783, -4.181604385375977, -2.576923370361328, -0.9722414016723633, 0.6324405670166016, 2.23712158203125, 3.8418030738830566, 5.446484565734863, 7.05116605758667, 8.655847549438477, 10.260528564453125, 11.86521053314209, 13.469892501831055, 15.074577331542969, 16.679258346557617, 18.283939361572266, 19.888622283935547, 21.493303298950195, 23.097984313964844, 24.702667236328125, 26.307348251342773, 27.912029266357422, 29.51671028137207, 31.12139129638672, 32.72607421875, 34.33075714111328, 35.9354362487793, 37.54011917114258, 39.144798278808594, 40.749481201171875, 42.354164123535156, 43.95884323120117, 45.56352615356445, 47.16820526123047, 48.77288818359375, 50.37757110595703, 51.98225402832031, 53.58693313598633, 55.19161605834961, 56.796295166015625, 58.400978088378906, 60.00566101074219, 61.6103401184082, 63.215023040771484, 64.8197021484375, 66.42438507080078]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 2.0, 5.0, 3.0, 7.0, 8.0, 9.0, 4.0, 10.0, 11.0, 18.0, 23.0, 17.0, 27.0, 26.0, 26.0, 21.0, 28.0, 34.0, 41.0, 33.0, 30.0, 42.0, 31.0, 49.0, 44.0, 25.0, 30.0, 34.0, 33.0, 32.0, 30.0, 29.0, 36.0, 26.0, 22.0, 18.0, 19.0, 22.0, 14.0, 9.0, 21.0, 15.0, 6.0, 4.0, 3.0, 5.0, 4.0, 7.0, 2.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.378782272338867, -23.571640014648438, -22.764497756958008, -21.957355499267578, -21.150211334228516, -20.343069076538086, -19.535926818847656, -18.728784561157227, -17.921642303466797, -17.114500045776367, -16.307357788085938, -15.500214576721191, -14.693071365356445, -13.885929107666016, -13.078786849975586, -12.271644592285156, -11.464500427246094, -10.657358169555664, -9.850214958190918, -9.043072700500488, -8.235929489135742, -7.4287872314453125, -6.621644973754883, -5.814502239227295, -5.007359504699707, -4.200216770172119, -3.3930742740631104, -2.5859317779541016, -1.7787890434265137, -0.9716463088989258, -0.1645040512084961, 0.6426386833190918, 1.4497795104980469, 2.2569222450256348, 3.0640647411346436, 3.8712072372436523, 4.67834997177124, 5.485492706298828, 6.292634963989258, 7.099777698516846, 7.906920433044434, 8.714062690734863, 9.52120590209961, 10.328348159790039, 11.135490417480469, 11.942633628845215, 12.749775886535645, 13.55691909790039, 14.36406135559082, 15.17120361328125, 15.978346824645996, 16.78548812866211, 17.592632293701172, 18.3997745513916, 19.20691680908203, 20.01405906677246, 20.82120132446289, 21.62834358215332, 22.43548583984375, 23.242630004882812, 24.049772262573242, 24.856914520263672, 25.6640567779541, 26.47119903564453, 27.278343200683594]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 6.0, 8.0, 4.0, 6.0, 19.0, 25.0, 35.0, 50.0, 98.0, 135.0, 201.0, 319.0, 410.0, 618.0, 903.0, 1418.0, 2094.0, 3133.0, 4788.0, 7191.0, 11077.0, 17356.0, 27142.0, 45164.0, 78837.0, 181602.0, 817176.0, 1965819.0, 678775.0, 156836.0, 73611.0, 42978.0, 26901.0, 17048.0, 10923.0, 7147.0, 4667.0, 3192.0, 2071.0, 1395.0, 990.0, 656.0, 460.0, 330.0, 229.0, 138.0, 95.0, 63.0, 57.0, 33.0, 23.0, 12.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-45.09375, -43.61279296875, -42.1318359375, -40.65087890625, -39.169921875, -37.68896484375, -36.2080078125, -34.72705078125, -33.24609375, -31.76513671875, -30.2841796875, -28.80322265625, -27.322265625, -25.84130859375, -24.3603515625, -22.87939453125, -21.3984375, -19.91748046875, -18.4365234375, -16.95556640625, -15.474609375, -13.99365234375, -12.5126953125, -11.03173828125, -9.55078125, -8.06982421875, -6.5888671875, -5.10791015625, -3.626953125, -2.14599609375, -0.6650390625, 0.81591796875, 2.296875, 3.77783203125, 5.2587890625, 6.73974609375, 8.220703125, 9.70166015625, 11.1826171875, 12.66357421875, 14.14453125, 15.62548828125, 17.1064453125, 18.58740234375, 20.068359375, 21.54931640625, 23.0302734375, 24.51123046875, 25.9921875, 27.47314453125, 28.9541015625, 30.43505859375, 31.916015625, 33.39697265625, 34.8779296875, 36.35888671875, 37.83984375, 39.32080078125, 40.8017578125, 42.28271484375, 43.763671875, 45.24462890625, 46.7255859375, 48.20654296875, 49.6875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 13.0, 11.0, 10.0, 14.0, 16.0, 17.0, 21.0, 16.0, 22.0, 29.0, 23.0, 30.0, 27.0, 39.0, 37.0, 35.0, 41.0, 30.0, 38.0, 34.0, 51.0, 32.0, 34.0, 27.0, 32.0, 25.0, 34.0, 21.0, 28.0, 30.0, 23.0, 22.0, 20.0, 19.0, 20.0, 13.0, 6.0, 9.0, 11.0, 3.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.234375, -18.6044921875, -17.974609375, -17.3447265625, -16.71484375, -16.0849609375, -15.455078125, -14.8251953125, -14.1953125, -13.5654296875, -12.935546875, -12.3056640625, -11.67578125, -11.0458984375, -10.416015625, -9.7861328125, -9.15625, -8.5263671875, -7.896484375, -7.2666015625, -6.63671875, -6.0068359375, -5.376953125, -4.7470703125, -4.1171875, -3.4873046875, -2.857421875, -2.2275390625, -1.59765625, -0.9677734375, -0.337890625, 0.2919921875, 0.921875, 1.5517578125, 2.181640625, 2.8115234375, 3.44140625, 4.0712890625, 4.701171875, 5.3310546875, 5.9609375, 6.5908203125, 7.220703125, 7.8505859375, 8.48046875, 9.1103515625, 9.740234375, 10.3701171875, 11.0, 11.6298828125, 12.259765625, 12.8896484375, 13.51953125, 14.1494140625, 14.779296875, 15.4091796875, 16.0390625, 16.6689453125, 17.298828125, 17.9287109375, 18.55859375, 19.1884765625, 19.818359375, 20.4482421875, 21.078125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 11.0, 20.0, 18.0, 33.0, 45.0, 55.0, 91.0, 133.0, 188.0, 268.0, 408.0, 595.0, 932.0, 1374.0, 2170.0, 3191.0, 5297.0, 8286.0, 13487.0, 22955.0, 38200.0, 68437.0, 130085.0, 285510.0, 877521.0, 1855490.0, 469133.0, 189826.0, 93290.0, 50946.0, 29546.0, 17541.0, 10683.0, 6666.0, 4161.0, 2634.0, 1714.0, 1068.0, 699.0, 521.0, 310.0, 226.0, 157.0, 114.0, 75.0, 56.0, 34.0, 28.0, 16.0, 14.0, 7.0, 2.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-43.78125, -42.38037109375, -40.9794921875, -39.57861328125, -38.177734375, -36.77685546875, -35.3759765625, -33.97509765625, -32.57421875, -31.17333984375, -29.7724609375, -28.37158203125, -26.970703125, -25.56982421875, -24.1689453125, -22.76806640625, -21.3671875, -19.96630859375, -18.5654296875, -17.16455078125, -15.763671875, -14.36279296875, -12.9619140625, -11.56103515625, -10.16015625, -8.75927734375, -7.3583984375, -5.95751953125, -4.556640625, -3.15576171875, -1.7548828125, -0.35400390625, 1.046875, 2.44775390625, 3.8486328125, 5.24951171875, 6.650390625, 8.05126953125, 9.4521484375, 10.85302734375, 12.25390625, 13.65478515625, 15.0556640625, 16.45654296875, 17.857421875, 19.25830078125, 20.6591796875, 22.06005859375, 23.4609375, 24.86181640625, 26.2626953125, 27.66357421875, 29.064453125, 30.46533203125, 31.8662109375, 33.26708984375, 34.66796875, 36.06884765625, 37.4697265625, 38.87060546875, 40.271484375, 41.67236328125, 43.0732421875, 44.47412109375, 45.875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 3.0, 4.0, 5.0, 7.0, 9.0, 15.0, 16.0, 22.0, 17.0, 35.0, 35.0, 58.0, 51.0, 56.0, 91.0, 96.0, 130.0, 159.0, 193.0, 284.0, 438.0, 604.0, 450.0, 317.0, 190.0, 151.0, 125.0, 104.0, 80.0, 57.0, 46.0, 56.0, 39.0, 29.0, 27.0, 24.0, 13.0, 7.0, 7.0, 7.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-16.203125, -15.7471923828125, -15.291259765625, -14.8353271484375, -14.37939453125, -13.9234619140625, -13.467529296875, -13.0115966796875, -12.5556640625, -12.0997314453125, -11.643798828125, -11.1878662109375, -10.73193359375, -10.2760009765625, -9.820068359375, -9.3641357421875, -8.908203125, -8.4522705078125, -7.996337890625, -7.5404052734375, -7.08447265625, -6.6285400390625, -6.172607421875, -5.7166748046875, -5.2607421875, -4.8048095703125, -4.348876953125, -3.8929443359375, -3.43701171875, -2.9810791015625, -2.525146484375, -2.0692138671875, -1.61328125, -1.1573486328125, -0.701416015625, -0.2454833984375, 0.21044921875, 0.6663818359375, 1.122314453125, 1.5782470703125, 2.0341796875, 2.4901123046875, 2.946044921875, 3.4019775390625, 3.85791015625, 4.3138427734375, 4.769775390625, 5.2257080078125, 5.681640625, 6.1375732421875, 6.593505859375, 7.0494384765625, 7.50537109375, 7.9613037109375, 8.417236328125, 8.8731689453125, 9.3291015625, 9.7850341796875, 10.240966796875, 10.6968994140625, 11.15283203125, 11.6087646484375, 12.064697265625, 12.5206298828125, 12.9765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 8.0, 8.0, 17.0, 15.0, 18.0, 22.0, 25.0, 34.0, 56.0, 81.0, 101.0, 98.0, 110.0, 90.0, 59.0, 54.0, 49.0, 21.0, 27.0, 18.0, 14.0, 16.0, 10.0, 8.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.41312026977539, -41.19807434082031, -39.983028411865234, -38.767982482910156, -37.55293655395508, -36.337890625, -35.12284469604492, -33.907798767089844, -32.692752838134766, -31.477706909179688, -30.26266098022461, -29.04761505126953, -27.832569122314453, -26.617523193359375, -25.402477264404297, -24.18743133544922, -22.97238540649414, -21.757339477539062, -20.542293548583984, -19.327247619628906, -18.112201690673828, -16.89715576171875, -15.682109832763672, -14.467063903808594, -13.252017974853516, -12.036972045898438, -10.82192611694336, -9.606880187988281, -8.391834259033203, -7.176788330078125, -5.961742401123047, -4.746696472167969, -3.5316505432128906, -2.3166046142578125, -1.1015586853027344, 0.11348724365234375, 1.3285331726074219, 2.5435791015625, 3.758625030517578, 4.973670959472656, 6.188716888427734, 7.4037628173828125, 8.61880874633789, 9.833854675292969, 11.048900604248047, 12.263946533203125, 13.478992462158203, 14.694038391113281, 15.90908432006836, 17.124130249023438, 18.339176177978516, 19.554222106933594, 20.769268035888672, 21.98431396484375, 23.199359893798828, 24.414405822753906, 25.629451751708984, 26.844497680664062, 28.05954360961914, 29.27458953857422, 30.489635467529297, 31.704681396484375, 32.91972732543945, 34.13477325439453, 35.34981918334961]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 10.0, 6.0, 14.0, 10.0, 11.0, 18.0, 17.0, 17.0, 18.0, 27.0, 30.0, 43.0, 32.0, 40.0, 37.0, 33.0, 32.0, 42.0, 49.0, 51.0, 45.0, 37.0, 48.0, 26.0, 38.0, 24.0, 30.0, 30.0, 24.0, 19.0, 18.0, 19.0, 22.0, 11.0, 11.0, 12.0, 16.0, 4.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.862255096435547, -22.088817596435547, -21.315380096435547, -20.541940689086914, -19.768503189086914, -18.995065689086914, -18.221628189086914, -17.44818878173828, -16.67475128173828, -15.901313781738281, -15.127875328063965, -14.354437828063965, -13.580999374389648, -12.807561874389648, -12.034124374389648, -11.260685920715332, -10.487248420715332, -9.713810920715332, -8.940372467041016, -8.166934967041016, -7.393496513366699, -6.620059013366699, -5.846621036529541, -5.073183059692383, -4.299745082855225, -3.5263071060180664, -2.752869129180908, -1.979431390762329, -1.205993413925171, -0.4325554370880127, 0.3408823013305664, 1.1143202781677246, 1.8877582550048828, 2.661196231842041, 3.434634208679199, 4.208071708679199, 4.981510162353516, 5.754947662353516, 6.528385639190674, 7.301823616027832, 8.075262069702148, 8.848699569702148, 9.622138023376465, 10.395575523376465, 11.169013977050781, 11.942451477050781, 12.715888977050781, 13.489327430725098, 14.262764930725098, 15.036202430725098, 15.809640884399414, 16.583078384399414, 17.356515884399414, 18.129955291748047, 18.903392791748047, 19.676830291748047, 20.450267791748047, 21.223705291748047, 21.997142791748047, 22.77058219909668, 23.54401969909668, 24.31745719909668, 25.09089469909668, 25.864334106445312, 26.637771606445312]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 11.0, 21.0, 18.0, 31.0, 54.0, 73.0, 102.0, 182.0, 246.0, 374.0, 518.0, 861.0, 1211.0, 1860.0, 2819.0, 4187.0, 6255.0, 9568.0, 15122.0, 23515.0, 38083.0, 62847.0, 116335.0, 317988.0, 207920.0, 93590.0, 53706.0, 32638.0, 20569.0, 12851.0, 8406.0, 5722.0, 3605.0, 2388.0, 1628.0, 1076.0, 768.0, 459.0, 297.0, 214.0, 142.0, 99.0, 65.0, 50.0, 22.0, 18.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.578125, -7.35418701171875, -7.1302490234375, -6.90631103515625, -6.682373046875, -6.45843505859375, -6.2344970703125, -6.01055908203125, -5.78662109375, -5.56268310546875, -5.3387451171875, -5.11480712890625, -4.890869140625, -4.66693115234375, -4.4429931640625, -4.21905517578125, -3.9951171875, -3.77117919921875, -3.5472412109375, -3.32330322265625, -3.099365234375, -2.87542724609375, -2.6514892578125, -2.42755126953125, -2.20361328125, -1.97967529296875, -1.7557373046875, -1.53179931640625, -1.307861328125, -1.08392333984375, -0.8599853515625, -0.63604736328125, -0.412109375, -0.18817138671875, 0.0357666015625, 0.25970458984375, 0.483642578125, 0.70758056640625, 0.9315185546875, 1.15545654296875, 1.37939453125, 1.60333251953125, 1.8272705078125, 2.05120849609375, 2.275146484375, 2.49908447265625, 2.7230224609375, 2.94696044921875, 3.1708984375, 3.39483642578125, 3.6187744140625, 3.84271240234375, 4.066650390625, 4.29058837890625, 4.5145263671875, 4.73846435546875, 4.96240234375, 5.18634033203125, 5.4102783203125, 5.63421630859375, 5.858154296875, 6.08209228515625, 6.3060302734375, 6.52996826171875, 6.75390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 11.0, 10.0, 11.0, 10.0, 15.0, 11.0, 12.0, 24.0, 28.0, 21.0, 36.0, 31.0, 26.0, 35.0, 31.0, 36.0, 34.0, 44.0, 43.0, 40.0, 45.0, 34.0, 43.0, 42.0, 38.0, 31.0, 25.0, 25.0, 35.0, 18.0, 21.0, 21.0, 12.0, 18.0, 14.0, 13.0, 12.0, 5.0, 8.0, 9.0, 7.0, 1.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.932861328125, -21.17822265625, -20.423583984375, -19.6689453125, -18.914306640625, -18.15966796875, -17.405029296875, -16.650390625, -15.895751953125, -15.14111328125, -14.386474609375, -13.6318359375, -12.877197265625, -12.12255859375, -11.367919921875, -10.61328125, -9.858642578125, -9.10400390625, -8.349365234375, -7.5947265625, -6.840087890625, -6.08544921875, -5.330810546875, -4.576171875, -3.821533203125, -3.06689453125, -2.312255859375, -1.5576171875, -0.802978515625, -0.04833984375, 0.706298828125, 1.4609375, 2.215576171875, 2.97021484375, 3.724853515625, 4.4794921875, 5.234130859375, 5.98876953125, 6.743408203125, 7.498046875, 8.252685546875, 9.00732421875, 9.761962890625, 10.5166015625, 11.271240234375, 12.02587890625, 12.780517578125, 13.53515625, 14.289794921875, 15.04443359375, 15.799072265625, 16.5537109375, 17.308349609375, 18.06298828125, 18.817626953125, 19.572265625, 20.326904296875, 21.08154296875, 21.836181640625, 22.5908203125, 23.345458984375, 24.10009765625, 24.854736328125, 25.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 1.0, 9.0, 11.0, 4.0, 8.0, 17.0, 15.0, 29.0, 59.0, 80.0, 116.0, 148.0, 222.0, 307.0, 460.0, 741.0, 1011.0, 1554.0, 2212.0, 3303.0, 5256.0, 8124.0, 13072.0, 21066.0, 34463.0, 58254.0, 106927.0, 257093.0, 271230.0, 109464.0, 59972.0, 34753.0, 21441.0, 13236.0, 8256.0, 5276.0, 3477.0, 2182.0, 1516.0, 989.0, 766.0, 413.0, 316.0, 227.0, 163.0, 89.0, 79.0, 35.0, 39.0, 21.0, 15.0, 15.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.08984375, -6.868408203125, -6.64697265625, -6.425537109375, -6.2041015625, -5.982666015625, -5.76123046875, -5.539794921875, -5.318359375, -5.096923828125, -4.87548828125, -4.654052734375, -4.4326171875, -4.211181640625, -3.98974609375, -3.768310546875, -3.546875, -3.325439453125, -3.10400390625, -2.882568359375, -2.6611328125, -2.439697265625, -2.21826171875, -1.996826171875, -1.775390625, -1.553955078125, -1.33251953125, -1.111083984375, -0.8896484375, -0.668212890625, -0.44677734375, -0.225341796875, -0.00390625, 0.217529296875, 0.43896484375, 0.660400390625, 0.8818359375, 1.103271484375, 1.32470703125, 1.546142578125, 1.767578125, 1.989013671875, 2.21044921875, 2.431884765625, 2.6533203125, 2.874755859375, 3.09619140625, 3.317626953125, 3.5390625, 3.760498046875, 3.98193359375, 4.203369140625, 4.4248046875, 4.646240234375, 4.86767578125, 5.089111328125, 5.310546875, 5.531982421875, 5.75341796875, 5.974853515625, 6.1962890625, 6.417724609375, 6.63916015625, 6.860595703125, 7.08203125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 3.0, 7.0, 10.0, 5.0, 20.0, 21.0, 21.0, 14.0, 15.0, 30.0, 22.0, 37.0, 47.0, 48.0, 42.0, 31.0, 51.0, 34.0, 34.0, 43.0, 66.0, 38.0, 47.0, 41.0, 38.0, 30.0, 34.0, 27.0, 24.0, 22.0, 20.0, 10.0, 18.0, 17.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.305419921875, -16.76708984375, -16.228759765625, -15.6904296875, -15.152099609375, -14.61376953125, -14.075439453125, -13.537109375, -12.998779296875, -12.46044921875, -11.922119140625, -11.3837890625, -10.845458984375, -10.30712890625, -9.768798828125, -9.23046875, -8.692138671875, -8.15380859375, -7.615478515625, -7.0771484375, -6.538818359375, -6.00048828125, -5.462158203125, -4.923828125, -4.385498046875, -3.84716796875, -3.308837890625, -2.7705078125, -2.232177734375, -1.69384765625, -1.155517578125, -0.6171875, -0.078857421875, 0.45947265625, 0.997802734375, 1.5361328125, 2.074462890625, 2.61279296875, 3.151123046875, 3.689453125, 4.227783203125, 4.76611328125, 5.304443359375, 5.8427734375, 6.381103515625, 6.91943359375, 7.457763671875, 7.99609375, 8.534423828125, 9.07275390625, 9.611083984375, 10.1494140625, 10.687744140625, 11.22607421875, 11.764404296875, 12.302734375, 12.841064453125, 13.37939453125, 13.917724609375, 14.4560546875, 14.994384765625, 15.53271484375, 16.071044921875, 16.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 13.0, 7.0, 17.0, 14.0, 30.0, 34.0, 42.0, 36.0, 94.0, 110.0, 178.0, 221.0, 417.0, 588.0, 974.0, 1563.0, 2594.0, 5006.0, 9728.0, 21618.0, 56288.0, 211411.0, 534976.0, 128485.0, 39869.0, 16546.0, 7707.0, 4012.0, 2234.0, 1295.0, 806.0, 529.0, 352.0, 212.0, 150.0, 118.0, 65.0, 58.0, 28.0, 32.0, 28.0, 16.0, 11.0, 6.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0264739990234375, -0.025679826736450195, -0.02488565444946289, -0.024091482162475586, -0.02329730987548828, -0.022503137588500977, -0.021708965301513672, -0.020914793014526367, -0.020120620727539062, -0.019326448440551758, -0.018532276153564453, -0.01773810386657715, -0.016943931579589844, -0.01614975929260254, -0.015355587005615234, -0.01456141471862793, -0.013767242431640625, -0.01297307014465332, -0.012178897857666016, -0.011384725570678711, -0.010590553283691406, -0.009796380996704102, -0.009002208709716797, -0.008208036422729492, -0.0074138641357421875, -0.006619691848754883, -0.005825519561767578, -0.0050313472747802734, -0.004237174987792969, -0.003443002700805664, -0.0026488304138183594, -0.0018546581268310547, -0.00106048583984375, -0.0002663135528564453, 0.0005278587341308594, 0.001322031021118164, 0.0021162033081054688, 0.0029103755950927734, 0.003704547882080078, 0.004498720169067383, 0.0052928924560546875, 0.006087064743041992, 0.006881237030029297, 0.0076754093170166016, 0.008469581604003906, 0.009263753890991211, 0.010057926177978516, 0.01085209846496582, 0.011646270751953125, 0.01244044303894043, 0.013234615325927734, 0.014028787612915039, 0.014822959899902344, 0.015617132186889648, 0.016411304473876953, 0.017205476760864258, 0.017999649047851562, 0.018793821334838867, 0.019587993621826172, 0.020382165908813477, 0.02117633819580078, 0.021970510482788086, 0.02276468276977539, 0.023558855056762695, 0.02435302734375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 11.0, 14.0, 20.0, 23.0, 46.0, 60.0, 88.0, 123.0, 141.0, 119.0, 114.0, 74.0, 43.0, 29.0, 22.0, 15.0, 7.0, 6.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-3.165006637573242e-05, -3.089196979999542e-05, -3.0133873224258423e-05, -2.9375776648521423e-05, -2.8617680072784424e-05, -2.7859583497047424e-05, -2.7101486921310425e-05, -2.6343390345573425e-05, -2.5585293769836426e-05, -2.4827197194099426e-05, -2.4069100618362427e-05, -2.3311004042625427e-05, -2.2552907466888428e-05, -2.1794810891151428e-05, -2.103671431541443e-05, -2.027861773967743e-05, -1.952052116394043e-05, -1.876242458820343e-05, -1.800432801246643e-05, -1.724623143672943e-05, -1.648813486099243e-05, -1.5730038285255432e-05, -1.4971941709518433e-05, -1.4213845133781433e-05, -1.3455748558044434e-05, -1.2697651982307434e-05, -1.1939555406570435e-05, -1.1181458830833435e-05, -1.0423362255096436e-05, -9.665265679359436e-06, -8.907169103622437e-06, -8.149072527885437e-06, -7.3909759521484375e-06, -6.632879376411438e-06, -5.8747828006744385e-06, -5.116686224937439e-06, -4.3585896492004395e-06, -3.60049307346344e-06, -2.8423964977264404e-06, -2.084299921989441e-06, -1.3262033462524414e-06, -5.681067705154419e-07, 1.8998980522155762e-07, 9.480863809585571e-07, 1.7061829566955566e-06, 2.464279532432556e-06, 3.2223761081695557e-06, 3.980472683906555e-06, 4.738569259643555e-06, 5.496665835380554e-06, 6.254762411117554e-06, 7.012858986854553e-06, 7.770955562591553e-06, 8.529052138328552e-06, 9.287148714065552e-06, 1.0045245289802551e-05, 1.080334186553955e-05, 1.156143844127655e-05, 1.231953501701355e-05, 1.307763159275055e-05, 1.3835728168487549e-05, 1.4593824744224548e-05, 1.5351921319961548e-05, 1.6110017895698547e-05, 1.6868114471435547e-05]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 8.0, 14.0, 16.0, 27.0, 30.0, 36.0, 66.0, 80.0, 117.0, 169.0, 255.0, 367.0, 501.0, 765.0, 1237.0, 2048.0, 3452.0, 6031.0, 10283.0, 18386.0, 34823.0, 74437.0, 203769.0, 428140.0, 140980.0, 57267.0, 28630.0, 15274.0, 8404.0, 5013.0, 2829.0, 1718.0, 1139.0, 695.0, 467.0, 323.0, 208.0, 165.0, 97.0, 83.0, 62.0, 47.0, 25.0, 12.0, 19.0, 8.0, 8.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.018157958984375, -0.017578601837158203, -0.016999244689941406, -0.01641988754272461, -0.015840530395507812, -0.015261173248291016, -0.014681816101074219, -0.014102458953857422, -0.013523101806640625, -0.012943744659423828, -0.012364387512207031, -0.011785030364990234, -0.011205673217773438, -0.01062631607055664, -0.010046958923339844, -0.009467601776123047, -0.00888824462890625, -0.008308887481689453, -0.007729530334472656, -0.007150173187255859, -0.0065708160400390625, -0.005991458892822266, -0.005412101745605469, -0.004832744598388672, -0.004253387451171875, -0.003674030303955078, -0.0030946731567382812, -0.0025153160095214844, -0.0019359588623046875, -0.0013566017150878906, -0.0007772445678710938, -0.00019788742065429688, 0.0003814697265625, 0.0009608268737792969, 0.0015401840209960938, 0.0021195411682128906, 0.0026988983154296875, 0.0032782554626464844, 0.0038576126098632812, 0.004436969757080078, 0.005016326904296875, 0.005595684051513672, 0.006175041198730469, 0.006754398345947266, 0.0073337554931640625, 0.00791311264038086, 0.008492469787597656, 0.009071826934814453, 0.00965118408203125, 0.010230541229248047, 0.010809898376464844, 0.01138925552368164, 0.011968612670898438, 0.012547969818115234, 0.013127326965332031, 0.013706684112548828, 0.014286041259765625, 0.014865398406982422, 0.015444755554199219, 0.016024112701416016, 0.016603469848632812, 0.01718282699584961, 0.017762184143066406, 0.018341541290283203, 0.0189208984375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 6.0, 10.0, 5.0, 15.0, 15.0, 12.0, 22.0, 27.0, 31.0, 42.0, 40.0, 53.0, 86.0, 87.0, 87.0, 76.0, 61.0, 66.0, 45.0, 34.0, 29.0, 32.0, 27.0, 17.0, 16.0, 17.0, 13.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006595611572265625, -0.006419122219085693, -0.006242632865905762, -0.00606614351272583, -0.0058896541595458984, -0.005713164806365967, -0.005536675453186035, -0.0053601861000061035, -0.005183696746826172, -0.00500720739364624, -0.004830718040466309, -0.004654228687286377, -0.004477739334106445, -0.004301249980926514, -0.004124760627746582, -0.00394827127456665, -0.0037717819213867188, -0.003595292568206787, -0.0034188032150268555, -0.003242313861846924, -0.003065824508666992, -0.0028893351554870605, -0.002712845802307129, -0.0025363564491271973, -0.0023598670959472656, -0.002183377742767334, -0.0020068883895874023, -0.0018303990364074707, -0.001653909683227539, -0.0014774203300476074, -0.0013009309768676758, -0.0011244416236877441, -0.0009479522705078125, -0.0007714629173278809, -0.0005949735641479492, -0.0004184842109680176, -0.00024199485778808594, -6.55055046081543e-05, 0.00011098384857177734, 0.000287473201751709, 0.0004639625549316406, 0.0006404519081115723, 0.0008169412612915039, 0.0009934306144714355, 0.0011699199676513672, 0.0013464093208312988, 0.0015228986740112305, 0.0016993880271911621, 0.0018758773803710938, 0.0020523667335510254, 0.002228856086730957, 0.0024053454399108887, 0.0025818347930908203, 0.002758324146270752, 0.0029348134994506836, 0.0031113028526306152, 0.003287792205810547, 0.0034642815589904785, 0.00364077091217041, 0.003817260265350342, 0.0039937496185302734, 0.004170238971710205, 0.004346728324890137, 0.004523217678070068, 0.00469970703125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 12.0, 17.0, 15.0, 19.0, 19.0, 29.0, 33.0, 47.0, 94.0, 96.0, 107.0, 107.0, 89.0, 57.0, 62.0, 42.0, 27.0, 22.0, 15.0, 15.0, 17.0, 9.0, 7.0, 7.0, 10.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.558509826660156, -41.33828353881836, -40.11806106567383, -38.89783477783203, -37.6776123046875, -36.4573860168457, -35.237159729003906, -34.016937255859375, -32.79671096801758, -31.576486587524414, -30.35626220703125, -29.136035919189453, -27.91581153869629, -26.695587158203125, -25.475360870361328, -24.255136489868164, -23.034912109375, -21.814687728881836, -20.594463348388672, -19.374237060546875, -18.15401268005371, -16.933788299560547, -15.713562965393066, -14.493337631225586, -13.273113250732422, -12.052888870239258, -10.832663536071777, -9.612438201904297, -8.392213821411133, -7.1719889640808105, -5.951764106750488, -4.731538772583008, -3.5113182067871094, -2.291093349456787, -1.0708684921264648, 0.14935636520385742, 1.3695812225341797, 2.589806079864502, 3.810030937194824, 5.030256271362305, 6.250480651855469, 7.470705509185791, 8.690930366516113, 9.911155700683594, 11.131380081176758, 12.351604461669922, 13.571829795837402, 14.792055130004883, 16.012279510498047, 17.23250389099121, 18.452728271484375, 19.672954559326172, 20.893178939819336, 22.1134033203125, 23.333629608154297, 24.55385398864746, 25.774078369140625, 26.99430274963379, 28.214527130126953, 29.43475341796875, 30.654977798461914, 31.875202178955078, 33.095428466796875, 34.315650939941406, 35.5358772277832]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 10.0, 6.0, 13.0, 11.0, 10.0, 19.0, 17.0, 17.0, 16.0, 29.0, 30.0, 43.0, 32.0, 40.0, 38.0, 32.0, 34.0, 39.0, 52.0, 49.0, 46.0, 35.0, 49.0, 24.0, 40.0, 24.0, 31.0, 30.0, 23.0, 19.0, 18.0, 19.0, 22.0, 11.0, 11.0, 13.0, 15.0, 4.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.49274444580078, -21.72866439819336, -20.964582443237305, -20.200502395629883, -19.436420440673828, -18.672340393066406, -17.908260345458984, -17.14417839050293, -16.380096435546875, -15.616015434265137, -14.851934432983398, -14.087854385375977, -13.323772430419922, -12.5596923828125, -11.795611381530762, -11.031530380249023, -10.267450332641602, -9.503369331359863, -8.739288330078125, -7.975207805633545, -7.211126804351807, -6.447045803070068, -5.682965278625488, -4.91888427734375, -4.154803276062012, -3.3907222747802734, -2.6266415119171143, -1.862560749053955, -1.0984797477722168, -0.3343987464904785, 0.42968177795410156, 1.1937627792358398, 1.9578418731689453, 2.7219228744506836, 3.4860036373138428, 4.250084400177002, 5.01416540145874, 5.7782464027404785, 6.542326927185059, 7.306407928466797, 8.070488929748535, 8.834569931030273, 9.598650932312012, 10.36273193359375, 11.126811981201172, 11.890893936157227, 12.654973983764648, 13.419054985046387, 14.183135986328125, 14.947216987609863, 15.711297988891602, 16.475378036499023, 17.239459991455078, 18.0035400390625, 18.767620086669922, 19.531702041625977, 20.29578399658203, 21.059864044189453, 21.823945999145508, 22.58802604675293, 23.352108001708984, 24.116188049316406, 24.880268096923828, 25.644350051879883, 26.408430099487305]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 9.0, 17.0, 14.0, 25.0, 32.0, 42.0, 66.0, 96.0, 147.0, 197.0, 321.0, 393.0, 565.0, 867.0, 1200.0, 1719.0, 2574.0, 3707.0, 5449.0, 8080.0, 12468.0, 18730.0, 29862.0, 48870.0, 86534.0, 166155.0, 248600.0, 178113.0, 91766.0, 51213.0, 31032.0, 19814.0, 12933.0, 8614.0, 5734.0, 3889.0, 2637.0, 1817.0, 1257.0, 919.0, 631.0, 443.0, 314.0, 189.0, 145.0, 112.0, 77.0, 51.0, 37.0, 24.0, 20.0, 17.0, 6.0, 7.0, 4.0, 2.0, 4.0, 1.0], "bins": [-45.0625, -43.67822265625, -42.2939453125, -40.90966796875, -39.525390625, -38.14111328125, -36.7568359375, -35.37255859375, -33.98828125, -32.60400390625, -31.2197265625, -29.83544921875, -28.451171875, -27.06689453125, -25.6826171875, -24.29833984375, -22.9140625, -21.52978515625, -20.1455078125, -18.76123046875, -17.376953125, -15.99267578125, -14.6083984375, -13.22412109375, -11.83984375, -10.45556640625, -9.0712890625, -7.68701171875, -6.302734375, -4.91845703125, -3.5341796875, -2.14990234375, -0.765625, 0.61865234375, 2.0029296875, 3.38720703125, 4.771484375, 6.15576171875, 7.5400390625, 8.92431640625, 10.30859375, 11.69287109375, 13.0771484375, 14.46142578125, 15.845703125, 17.22998046875, 18.6142578125, 19.99853515625, 21.3828125, 22.76708984375, 24.1513671875, 25.53564453125, 26.919921875, 28.30419921875, 29.6884765625, 31.07275390625, 32.45703125, 33.84130859375, 35.2255859375, 36.60986328125, 37.994140625, 39.37841796875, 40.7626953125, 42.14697265625, 43.53125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 9.0, 4.0, 6.0, 6.0, 12.0, 16.0, 11.0, 16.0, 20.0, 21.0, 22.0, 40.0, 37.0, 42.0, 28.0, 37.0, 52.0, 42.0, 50.0, 50.0, 47.0, 44.0, 34.0, 31.0, 31.0, 34.0, 27.0, 19.0, 30.0, 27.0, 24.0, 19.0, 16.0, 12.0, 14.0, 22.0, 12.0, 11.0, 6.0, 3.0, 1.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.421875, -19.741943359375, -19.06201171875, -18.382080078125, -17.7021484375, -17.022216796875, -16.34228515625, -15.662353515625, -14.982421875, -14.302490234375, -13.62255859375, -12.942626953125, -12.2626953125, -11.582763671875, -10.90283203125, -10.222900390625, -9.54296875, -8.863037109375, -8.18310546875, -7.503173828125, -6.8232421875, -6.143310546875, -5.46337890625, -4.783447265625, -4.103515625, -3.423583984375, -2.74365234375, -2.063720703125, -1.3837890625, -0.703857421875, -0.02392578125, 0.656005859375, 1.3359375, 2.015869140625, 2.69580078125, 3.375732421875, 4.0556640625, 4.735595703125, 5.41552734375, 6.095458984375, 6.775390625, 7.455322265625, 8.13525390625, 8.815185546875, 9.4951171875, 10.175048828125, 10.85498046875, 11.534912109375, 12.21484375, 12.894775390625, 13.57470703125, 14.254638671875, 14.9345703125, 15.614501953125, 16.29443359375, 16.974365234375, 17.654296875, 18.334228515625, 19.01416015625, 19.694091796875, 20.3740234375, 21.053955078125, 21.73388671875, 22.413818359375, 23.09375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 15.0, 12.0, 35.0, 53.0, 88.0, 130.0, 197.0, 312.0, 483.0, 716.0, 1047.0, 1607.0, 2415.0, 3386.0, 5137.0, 7456.0, 11032.0, 16323.0, 24604.0, 37421.0, 59004.0, 101468.0, 182286.0, 223443.0, 144838.0, 81336.0, 48701.0, 31322.0, 20830.0, 14049.0, 9326.0, 6389.0, 4330.0, 2802.0, 1920.0, 1330.0, 946.0, 620.0, 401.0, 268.0, 168.0, 109.0, 79.0, 33.0, 32.0, 17.0, 16.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0], "bins": [-43.1875, -41.92822265625, -40.6689453125, -39.40966796875, -38.150390625, -36.89111328125, -35.6318359375, -34.37255859375, -33.11328125, -31.85400390625, -30.5947265625, -29.33544921875, -28.076171875, -26.81689453125, -25.5576171875, -24.29833984375, -23.0390625, -21.77978515625, -20.5205078125, -19.26123046875, -18.001953125, -16.74267578125, -15.4833984375, -14.22412109375, -12.96484375, -11.70556640625, -10.4462890625, -9.18701171875, -7.927734375, -6.66845703125, -5.4091796875, -4.14990234375, -2.890625, -1.63134765625, -0.3720703125, 0.88720703125, 2.146484375, 3.40576171875, 4.6650390625, 5.92431640625, 7.18359375, 8.44287109375, 9.7021484375, 10.96142578125, 12.220703125, 13.47998046875, 14.7392578125, 15.99853515625, 17.2578125, 18.51708984375, 19.7763671875, 21.03564453125, 22.294921875, 23.55419921875, 24.8134765625, 26.07275390625, 27.33203125, 28.59130859375, 29.8505859375, 31.10986328125, 32.369140625, 33.62841796875, 34.8876953125, 36.14697265625, 37.40625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 8.0, 8.0, 5.0, 6.0, 11.0, 14.0, 15.0, 20.0, 20.0, 20.0, 29.0, 19.0, 35.0, 28.0, 30.0, 49.0, 48.0, 37.0, 39.0, 36.0, 41.0, 45.0, 43.0, 39.0, 35.0, 28.0, 28.0, 45.0, 28.0, 31.0, 13.0, 19.0, 18.0, 14.0, 21.0, 13.0, 18.0, 14.0, 11.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.109375, -14.681396484375, -14.25341796875, -13.825439453125, -13.3974609375, -12.969482421875, -12.54150390625, -12.113525390625, -11.685546875, -11.257568359375, -10.82958984375, -10.401611328125, -9.9736328125, -9.545654296875, -9.11767578125, -8.689697265625, -8.26171875, -7.833740234375, -7.40576171875, -6.977783203125, -6.5498046875, -6.121826171875, -5.69384765625, -5.265869140625, -4.837890625, -4.409912109375, -3.98193359375, -3.553955078125, -3.1259765625, -2.697998046875, -2.27001953125, -1.842041015625, -1.4140625, -0.986083984375, -0.55810546875, -0.130126953125, 0.2978515625, 0.725830078125, 1.15380859375, 1.581787109375, 2.009765625, 2.437744140625, 2.86572265625, 3.293701171875, 3.7216796875, 4.149658203125, 4.57763671875, 5.005615234375, 5.43359375, 5.861572265625, 6.28955078125, 6.717529296875, 7.1455078125, 7.573486328125, 8.00146484375, 8.429443359375, 8.857421875, 9.285400390625, 9.71337890625, 10.141357421875, 10.5693359375, 10.997314453125, 11.42529296875, 11.853271484375, 12.28125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 9.0, 10.0, 13.0, 21.0, 30.0, 62.0, 66.0, 110.0, 179.0, 186.0, 314.0, 425.0, 589.0, 889.0, 1258.0, 1728.0, 2436.0, 3610.0, 5003.0, 7626.0, 11481.0, 17931.0, 29030.0, 51302.0, 105585.0, 263785.0, 285863.0, 116701.0, 54866.0, 30824.0, 18715.0, 12264.0, 7974.0, 5341.0, 3702.0, 2545.0, 1808.0, 1264.0, 879.0, 627.0, 474.0, 325.0, 194.0, 149.0, 115.0, 86.0, 44.0, 26.0, 28.0, 32.0, 16.0, 8.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.1279296875, -1.089111328125, -1.05029296875, -1.011474609375, -0.97265625, -0.933837890625, -0.89501953125, -0.856201171875, -0.8173828125, -0.778564453125, -0.73974609375, -0.700927734375, -0.662109375, -0.623291015625, -0.58447265625, -0.545654296875, -0.5068359375, -0.468017578125, -0.42919921875, -0.390380859375, -0.3515625, -0.312744140625, -0.27392578125, -0.235107421875, -0.1962890625, -0.157470703125, -0.11865234375, -0.079833984375, -0.041015625, -0.002197265625, 0.03662109375, 0.075439453125, 0.1142578125, 0.153076171875, 0.19189453125, 0.230712890625, 0.26953125, 0.308349609375, 0.34716796875, 0.385986328125, 0.4248046875, 0.463623046875, 0.50244140625, 0.541259765625, 0.580078125, 0.618896484375, 0.65771484375, 0.696533203125, 0.7353515625, 0.774169921875, 0.81298828125, 0.851806640625, 0.890625, 0.929443359375, 0.96826171875, 1.007080078125, 1.0458984375, 1.084716796875, 1.12353515625, 1.162353515625, 1.201171875, 1.239990234375, 1.27880859375, 1.317626953125, 1.3564453125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 5.0, 13.0, 14.0, 12.0, 14.0, 25.0, 22.0, 26.0, 41.0, 59.0, 69.0, 87.0, 104.0, 78.0, 83.0, 69.0, 53.0, 42.0, 28.0, 36.0, 12.0, 14.0, 11.0, 9.0, 12.0, 9.0, 4.0, 7.0, 4.0, 1.0, 2.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00023937225341796875, -0.00023234263062477112, -0.00022531300783157349, -0.00021828338503837585, -0.00021125376224517822, -0.0002042241394519806, -0.00019719451665878296, -0.00019016489386558533, -0.0001831352710723877, -0.00017610564827919006, -0.00016907602548599243, -0.0001620464026927948, -0.00015501677989959717, -0.00014798715710639954, -0.0001409575343132019, -0.00013392791152000427, -0.00012689828872680664, -0.00011986866593360901, -0.00011283904314041138, -0.00010580942034721375, -9.877979755401611e-05, -9.175017476081848e-05, -8.472055196762085e-05, -7.769092917442322e-05, -7.066130638122559e-05, -6.363168358802795e-05, -5.660206079483032e-05, -4.957243800163269e-05, -4.254281520843506e-05, -3.551319241523743e-05, -2.8483569622039795e-05, -2.1453946828842163e-05, -1.4424324035644531e-05, -7.394701242446899e-06, -3.650784492492676e-07, 6.664544343948364e-06, 1.3694167137145996e-05, 2.0723789930343628e-05, 2.775341272354126e-05, 3.478303551673889e-05, 4.1812658309936523e-05, 4.8842281103134155e-05, 5.587190389633179e-05, 6.290152668952942e-05, 6.993114948272705e-05, 7.696077227592468e-05, 8.399039506912231e-05, 9.102001786231995e-05, 9.804964065551758e-05, 0.00010507926344871521, 0.00011210888624191284, 0.00011913850903511047, 0.0001261681318283081, 0.00013319775462150574, 0.00014022737741470337, 0.000147257000207901, 0.00015428662300109863, 0.00016131624579429626, 0.0001683458685874939, 0.00017537549138069153, 0.00018240511417388916, 0.0001894347369670868, 0.00019646435976028442, 0.00020349398255348206, 0.0002105236053466797]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 13.0, 23.0, 28.0, 37.0, 59.0, 78.0, 87.0, 137.0, 201.0, 300.0, 383.0, 585.0, 798.0, 1179.0, 1642.0, 2592.0, 3848.0, 6155.0, 10012.0, 17167.0, 31266.0, 64177.0, 166288.0, 396743.0, 191616.0, 70981.0, 34114.0, 18322.0, 10465.0, 6629.0, 4052.0, 2686.0, 1845.0, 1215.0, 849.0, 588.0, 397.0, 278.0, 216.0, 134.0, 102.0, 77.0, 41.0, 33.0, 37.0, 22.0, 16.0, 15.0, 5.0, 9.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.474609375, -1.427886962890625, -1.38116455078125, -1.334442138671875, -1.2877197265625, -1.240997314453125, -1.19427490234375, -1.147552490234375, -1.100830078125, -1.054107666015625, -1.00738525390625, -0.960662841796875, -0.9139404296875, -0.867218017578125, -0.82049560546875, -0.773773193359375, -0.72705078125, -0.680328369140625, -0.63360595703125, -0.586883544921875, -0.5401611328125, -0.493438720703125, -0.44671630859375, -0.399993896484375, -0.353271484375, -0.306549072265625, -0.25982666015625, -0.213104248046875, -0.1663818359375, -0.119659423828125, -0.07293701171875, -0.026214599609375, 0.0205078125, 0.067230224609375, 0.11395263671875, 0.160675048828125, 0.2073974609375, 0.254119873046875, 0.30084228515625, 0.347564697265625, 0.394287109375, 0.441009521484375, 0.48773193359375, 0.534454345703125, 0.5811767578125, 0.627899169921875, 0.67462158203125, 0.721343994140625, 0.76806640625, 0.814788818359375, 0.86151123046875, 0.908233642578125, 0.9549560546875, 1.001678466796875, 1.04840087890625, 1.095123291015625, 1.141845703125, 1.188568115234375, 1.23529052734375, 1.282012939453125, 1.3287353515625, 1.375457763671875, 1.42218017578125, 1.468902587890625, 1.515625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 11.0, 7.0, 8.0, 9.0, 16.0, 17.0, 26.0, 17.0, 33.0, 46.0, 49.0, 54.0, 63.0, 79.0, 92.0, 77.0, 75.0, 69.0, 52.0, 31.0, 35.0, 26.0, 21.0, 19.0, 8.0, 5.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43603515625, -0.42073822021484375, -0.4054412841796875, -0.39014434814453125, -0.374847412109375, -0.35955047607421875, -0.3442535400390625, -0.32895660400390625, -0.31365966796875, -0.29836273193359375, -0.2830657958984375, -0.26776885986328125, -0.252471923828125, -0.23717498779296875, -0.2218780517578125, -0.20658111572265625, -0.1912841796875, -0.17598724365234375, -0.1606903076171875, -0.14539337158203125, -0.130096435546875, -0.11479949951171875, -0.0995025634765625, -0.08420562744140625, -0.06890869140625, -0.05361175537109375, -0.0383148193359375, -0.02301788330078125, -0.007720947265625, 0.00757598876953125, 0.0228729248046875, 0.03816986083984375, 0.053466796875, 0.06876373291015625, 0.0840606689453125, 0.09935760498046875, 0.114654541015625, 0.12995147705078125, 0.1452484130859375, 0.16054534912109375, 0.17584228515625, 0.19113922119140625, 0.2064361572265625, 0.22173309326171875, 0.237030029296875, 0.25232696533203125, 0.2676239013671875, 0.28292083740234375, 0.2982177734375, 0.31351470947265625, 0.3288116455078125, 0.34410858154296875, 0.359405517578125, 0.37470245361328125, 0.3899993896484375, 0.40529632568359375, 0.42059326171875, 0.43589019775390625, 0.4511871337890625, 0.46648406982421875, 0.481781005859375, 0.49707794189453125, 0.5123748779296875, 0.5276718139648438, 0.54296875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 9.0, 10.0, 16.0, 20.0, 25.0, 32.0, 44.0, 75.0, 96.0, 104.0, 128.0, 114.0, 68.0, 58.0, 46.0, 24.0, 25.0, 25.0, 9.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.741722106933594, -43.50756072998047, -42.27340316772461, -41.039241790771484, -39.805084228515625, -38.5709228515625, -37.336761474609375, -36.102603912353516, -34.86844253540039, -33.634281158447266, -32.400123596191406, -31.16596221923828, -29.93180274963379, -28.697643280029297, -27.463483810424805, -26.229324340820312, -24.99516487121582, -23.761005401611328, -22.526845932006836, -21.292686462402344, -20.05852508544922, -18.824365615844727, -17.590206146240234, -16.35604476928711, -15.121886253356934, -13.887726783752441, -12.653566360473633, -11.41940689086914, -10.185247421264648, -8.95108699798584, -7.716927528381348, -6.482767105102539, -5.248607635498047, -4.0144476890563965, -2.780287981033325, -1.546128273010254, -0.3119683265686035, 0.9221916198730469, 2.156351089477539, 3.3905115127563477, 4.62467098236084, 5.85883092880249, 7.092990875244141, 8.327150344848633, 9.561309814453125, 10.795470237731934, 12.029629707336426, 13.263790130615234, 14.497949600219727, 15.732109069824219, 16.96626853942871, 18.200428009033203, 19.434589385986328, 20.66874885559082, 21.902908325195312, 23.137069702148438, 24.371227264404297, 25.60538673400879, 26.83954620361328, 28.073707580566406, 29.3078670501709, 30.54202651977539, 31.776185989379883, 33.010345458984375, 34.2445068359375]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 0.0, 2.0, 3.0, 8.0, 3.0, 6.0, 5.0, 6.0, 6.0, 7.0, 14.0, 26.0, 18.0, 20.0, 22.0, 26.0, 33.0, 30.0, 32.0, 28.0, 28.0, 34.0, 44.0, 22.0, 51.0, 42.0, 38.0, 43.0, 37.0, 37.0, 37.0, 26.0, 26.0, 27.0, 25.0, 20.0, 31.0, 14.0, 15.0, 12.0, 12.0, 13.0, 11.0, 17.0, 13.0, 8.0, 4.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.8291015625, -18.183231353759766, -17.537363052368164, -16.891494750976562, -16.245624542236328, -15.59975528717041, -14.953886032104492, -14.308016777038574, -13.662147521972656, -13.016278266906738, -12.37040901184082, -11.724539756774902, -11.078670501708984, -10.432801246643066, -9.786931991577148, -9.14106273651123, -8.495193481445312, -7.8493242263793945, -7.203454971313477, -6.557585716247559, -5.911716461181641, -5.265847206115723, -4.619977951049805, -3.9741086959838867, -3.3282394409179688, -2.682370185852051, -2.036500930786133, -1.3906316757202148, -0.7447624206542969, -0.0988931655883789, 0.5469760894775391, 1.192845344543457, 1.8387165069580078, 2.484585762023926, 3.1304550170898438, 3.7763242721557617, 4.42219352722168, 5.068062782287598, 5.713932037353516, 6.359801292419434, 7.005670547485352, 7.6515398025512695, 8.297409057617188, 8.943278312683105, 9.589147567749023, 10.235016822814941, 10.88088607788086, 11.526755332946777, 12.172624588012695, 12.818493843078613, 13.464363098144531, 14.11023235321045, 14.756101608276367, 15.401970863342285, 16.047840118408203, 16.693710327148438, 17.33957862854004, 17.98544692993164, 18.631317138671875, 19.27718734741211, 19.92305564880371, 20.568923950195312, 21.214794158935547, 21.86066436767578, 22.506532669067383]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 6.0, 4.0, 10.0, 21.0, 15.0, 47.0, 76.0, 108.0, 153.0, 239.0, 332.0, 546.0, 903.0, 1320.0, 2059.0, 3236.0, 5097.0, 8122.0, 13401.0, 22470.0, 39006.0, 72772.0, 166042.0, 724511.0, 2106957.0, 705354.0, 148422.0, 69428.0, 38075.0, 22913.0, 14162.0, 9383.0, 6057.0, 4171.0, 2759.0, 1827.0, 1347.0, 862.0, 649.0, 442.0, 314.0, 213.0, 147.0, 99.0, 55.0, 59.0, 35.0, 30.0, 10.0, 7.0, 6.0, 7.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.875, -34.5703125, -33.265625, -31.9609375, -30.65625, -29.3515625, -28.046875, -26.7421875, -25.4375, -24.1328125, -22.828125, -21.5234375, -20.21875, -18.9140625, -17.609375, -16.3046875, -15.0, -13.6953125, -12.390625, -11.0859375, -9.78125, -8.4765625, -7.171875, -5.8671875, -4.5625, -3.2578125, -1.953125, -0.6484375, 0.65625, 1.9609375, 3.265625, 4.5703125, 5.875, 7.1796875, 8.484375, 9.7890625, 11.09375, 12.3984375, 13.703125, 15.0078125, 16.3125, 17.6171875, 18.921875, 20.2265625, 21.53125, 22.8359375, 24.140625, 25.4453125, 26.75, 28.0546875, 29.359375, 30.6640625, 31.96875, 33.2734375, 34.578125, 35.8828125, 37.1875, 38.4921875, 39.796875, 41.1015625, 42.40625, 43.7109375, 45.015625, 46.3203125, 47.625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 5.0, 7.0, 5.0, 10.0, 11.0, 23.0, 17.0, 18.0, 28.0, 26.0, 29.0, 24.0, 35.0, 45.0, 37.0, 36.0, 39.0, 47.0, 35.0, 40.0, 55.0, 45.0, 34.0, 32.0, 36.0, 22.0, 36.0, 34.0, 25.0, 16.0, 18.0, 19.0, 12.0, 11.0, 9.0, 16.0, 11.0, 12.0, 9.0, 4.0, 9.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.40625, -14.846435546875, -14.28662109375, -13.726806640625, -13.1669921875, -12.607177734375, -12.04736328125, -11.487548828125, -10.927734375, -10.367919921875, -9.80810546875, -9.248291015625, -8.6884765625, -8.128662109375, -7.56884765625, -7.009033203125, -6.44921875, -5.889404296875, -5.32958984375, -4.769775390625, -4.2099609375, -3.650146484375, -3.09033203125, -2.530517578125, -1.970703125, -1.410888671875, -0.85107421875, -0.291259765625, 0.2685546875, 0.828369140625, 1.38818359375, 1.947998046875, 2.5078125, 3.067626953125, 3.62744140625, 4.187255859375, 4.7470703125, 5.306884765625, 5.86669921875, 6.426513671875, 6.986328125, 7.546142578125, 8.10595703125, 8.665771484375, 9.2255859375, 9.785400390625, 10.34521484375, 10.905029296875, 11.46484375, 12.024658203125, 12.58447265625, 13.144287109375, 13.7041015625, 14.263916015625, 14.82373046875, 15.383544921875, 15.943359375, 16.503173828125, 17.06298828125, 17.622802734375, 18.1826171875, 18.742431640625, 19.30224609375, 19.862060546875, 20.421875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 14.0, 20.0, 24.0, 35.0, 70.0, 102.0, 149.0, 234.0, 373.0, 556.0, 890.0, 1387.0, 2093.0, 3277.0, 5076.0, 8186.0, 13122.0, 22545.0, 38811.0, 70266.0, 136314.0, 298559.0, 853834.0, 1786663.0, 510383.0, 208967.0, 100940.0, 53946.0, 30373.0, 17833.0, 10772.0, 6667.0, 4186.0, 2675.0, 1741.0, 1124.0, 755.0, 455.0, 307.0, 206.0, 127.0, 77.0, 52.0, 28.0, 22.0, 13.0, 13.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.6875, -34.58203125, -33.4765625, -32.37109375, -31.265625, -30.16015625, -29.0546875, -27.94921875, -26.84375, -25.73828125, -24.6328125, -23.52734375, -22.421875, -21.31640625, -20.2109375, -19.10546875, -18.0, -16.89453125, -15.7890625, -14.68359375, -13.578125, -12.47265625, -11.3671875, -10.26171875, -9.15625, -8.05078125, -6.9453125, -5.83984375, -4.734375, -3.62890625, -2.5234375, -1.41796875, -0.3125, 0.79296875, 1.8984375, 3.00390625, 4.109375, 5.21484375, 6.3203125, 7.42578125, 8.53125, 9.63671875, 10.7421875, 11.84765625, 12.953125, 14.05859375, 15.1640625, 16.26953125, 17.375, 18.48046875, 19.5859375, 20.69140625, 21.796875, 22.90234375, 24.0078125, 25.11328125, 26.21875, 27.32421875, 28.4296875, 29.53515625, 30.640625, 31.74609375, 32.8515625, 33.95703125, 35.0625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 5.0, 15.0, 10.0, 11.0, 15.0, 15.0, 24.0, 23.0, 28.0, 43.0, 48.0, 61.0, 81.0, 93.0, 108.0, 147.0, 178.0, 263.0, 337.0, 511.0, 487.0, 361.0, 233.0, 190.0, 147.0, 130.0, 94.0, 87.0, 62.0, 50.0, 42.0, 41.0, 28.0, 23.0, 14.0, 11.0, 18.0, 14.0, 3.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-13.0703125, -12.717041015625, -12.36376953125, -12.010498046875, -11.6572265625, -11.303955078125, -10.95068359375, -10.597412109375, -10.244140625, -9.890869140625, -9.53759765625, -9.184326171875, -8.8310546875, -8.477783203125, -8.12451171875, -7.771240234375, -7.41796875, -7.064697265625, -6.71142578125, -6.358154296875, -6.0048828125, -5.651611328125, -5.29833984375, -4.945068359375, -4.591796875, -4.238525390625, -3.88525390625, -3.531982421875, -3.1787109375, -2.825439453125, -2.47216796875, -2.118896484375, -1.765625, -1.412353515625, -1.05908203125, -0.705810546875, -0.3525390625, 0.000732421875, 0.35400390625, 0.707275390625, 1.060546875, 1.413818359375, 1.76708984375, 2.120361328125, 2.4736328125, 2.826904296875, 3.18017578125, 3.533447265625, 3.88671875, 4.239990234375, 4.59326171875, 4.946533203125, 5.2998046875, 5.653076171875, 6.00634765625, 6.359619140625, 6.712890625, 7.066162109375, 7.41943359375, 7.772705078125, 8.1259765625, 8.479248046875, 8.83251953125, 9.185791015625, 9.5390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 7.0, 6.0, 12.0, 15.0, 12.0, 22.0, 28.0, 41.0, 47.0, 63.0, 92.0, 94.0, 113.0, 82.0, 61.0, 58.0, 43.0, 44.0, 24.0, 19.0, 22.0, 17.0, 11.0, 11.0, 8.0, 7.0, 10.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.87495803833008, -33.968265533447266, -33.06157302856445, -32.15488052368164, -31.248188018798828, -30.341495513916016, -29.434803009033203, -28.52811050415039, -27.621417999267578, -26.714725494384766, -25.808032989501953, -24.90134048461914, -23.994647979736328, -23.087955474853516, -22.181262969970703, -21.27457046508789, -20.36787986755371, -19.4611873626709, -18.554494857788086, -17.647802352905273, -16.74110984802246, -15.834417343139648, -14.927725791931152, -14.02103328704834, -13.114340782165527, -12.207648277282715, -11.300955772399902, -10.394264221191406, -9.487571716308594, -8.580879211425781, -7.674186706542969, -6.767494201660156, -5.860803604125977, -4.954111099243164, -4.047418594360352, -3.1407265663146973, -2.2340340614318848, -1.3273415565490723, -0.42064952850341797, 0.48604297637939453, 1.392735481262207, 2.2994279861450195, 3.206120252609253, 4.112812519073486, 5.019505023956299, 5.926197528839111, 6.832889556884766, 7.739582061767578, 8.64627456665039, 9.552967071533203, 10.459659576416016, 11.366352081298828, 12.27304458618164, 13.179737091064453, 14.08642864227295, 14.993121147155762, 15.899813652038574, 16.80650520324707, 17.713197708129883, 18.619890213012695, 19.526582717895508, 20.43327522277832, 21.339967727661133, 22.246660232543945, 23.153352737426758]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 14.0, 7.0, 8.0, 11.0, 17.0, 21.0, 13.0, 28.0, 23.0, 29.0, 26.0, 32.0, 32.0, 35.0, 42.0, 35.0, 46.0, 46.0, 49.0, 35.0, 43.0, 47.0, 24.0, 34.0, 29.0, 24.0, 31.0, 26.0, 21.0, 24.0, 27.0, 17.0, 14.0, 9.0, 17.0, 10.0, 13.0, 9.0, 2.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-19.713777542114258, -19.120346069335938, -18.526914596557617, -17.933483123779297, -17.340051651000977, -16.746620178222656, -16.153188705444336, -15.5597562789917, -14.966324806213379, -14.372893333435059, -13.779461860656738, -13.186030387878418, -12.592597961425781, -11.999166488647461, -11.40573501586914, -10.81230354309082, -10.2188720703125, -9.62544059753418, -9.03200912475586, -8.438577651977539, -7.8451457023620605, -7.25171422958374, -6.658282279968262, -6.064850807189941, -5.471419334411621, -4.877987861633301, -4.2845563888549805, -3.691124439239502, -3.0976929664611816, -2.5042614936828613, -1.910829782485962, -1.3173980712890625, -0.7239646911621094, -0.1305330991744995, 0.46289849281311035, 1.0563300848007202, 1.64976167678833, 2.2431931495666504, 2.83662486076355, 3.430056571960449, 4.0234880447387695, 4.61691951751709, 5.21035099029541, 5.803782939910889, 6.397214412689209, 6.990645885467529, 7.584077835083008, 8.177509307861328, 8.770940780639648, 9.364372253417969, 9.957803726196289, 10.55123519897461, 11.14466667175293, 11.73809814453125, 12.331530570983887, 12.924962043762207, 13.518393516540527, 14.111824989318848, 14.705256462097168, 15.298687934875488, 15.892120361328125, 16.485551834106445, 17.078983306884766, 17.672414779663086, 18.265846252441406]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 15.0, 17.0, 21.0, 33.0, 54.0, 81.0, 89.0, 155.0, 190.0, 298.0, 466.0, 658.0, 1013.0, 1510.0, 2313.0, 3530.0, 5254.0, 8234.0, 12295.0, 19556.0, 30745.0, 49747.0, 84300.0, 169108.0, 338107.0, 131093.0, 71177.0, 42867.0, 26837.0, 16934.0, 10873.0, 7161.0, 4642.0, 3136.0, 2023.0, 1328.0, 898.0, 591.0, 381.0, 265.0, 175.0, 115.0, 81.0, 66.0, 32.0, 28.0, 22.0, 15.0, 8.0, 7.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.6640625, -5.48895263671875, -5.3138427734375, -5.13873291015625, -4.963623046875, -4.78851318359375, -4.6134033203125, -4.43829345703125, -4.26318359375, -4.08807373046875, -3.9129638671875, -3.73785400390625, -3.562744140625, -3.38763427734375, -3.2125244140625, -3.03741455078125, -2.8623046875, -2.68719482421875, -2.5120849609375, -2.33697509765625, -2.161865234375, -1.98675537109375, -1.8116455078125, -1.63653564453125, -1.46142578125, -1.28631591796875, -1.1112060546875, -0.93609619140625, -0.760986328125, -0.58587646484375, -0.4107666015625, -0.23565673828125, -0.060546875, 0.11456298828125, 0.2896728515625, 0.46478271484375, 0.639892578125, 0.81500244140625, 0.9901123046875, 1.16522216796875, 1.34033203125, 1.51544189453125, 1.6905517578125, 1.86566162109375, 2.040771484375, 2.21588134765625, 2.3909912109375, 2.56610107421875, 2.7412109375, 2.91632080078125, 3.0914306640625, 3.26654052734375, 3.441650390625, 3.61676025390625, 3.7918701171875, 3.96697998046875, 4.14208984375, 4.31719970703125, 4.4923095703125, 4.66741943359375, 4.842529296875, 5.01763916015625, 5.1927490234375, 5.36785888671875, 5.54296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 8.0, 10.0, 10.0, 12.0, 13.0, 19.0, 18.0, 17.0, 18.0, 16.0, 34.0, 21.0, 34.0, 34.0, 38.0, 43.0, 36.0, 37.0, 53.0, 37.0, 41.0, 43.0, 36.0, 36.0, 28.0, 33.0, 27.0, 28.0, 22.0, 29.0, 34.0, 14.0, 13.0, 18.0, 16.0, 14.0, 8.0, 12.0, 4.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.8125, -19.21142578125, -18.6103515625, -18.00927734375, -17.408203125, -16.80712890625, -16.2060546875, -15.60498046875, -15.00390625, -14.40283203125, -13.8017578125, -13.20068359375, -12.599609375, -11.99853515625, -11.3974609375, -10.79638671875, -10.1953125, -9.59423828125, -8.9931640625, -8.39208984375, -7.791015625, -7.18994140625, -6.5888671875, -5.98779296875, -5.38671875, -4.78564453125, -4.1845703125, -3.58349609375, -2.982421875, -2.38134765625, -1.7802734375, -1.17919921875, -0.578125, 0.02294921875, 0.6240234375, 1.22509765625, 1.826171875, 2.42724609375, 3.0283203125, 3.62939453125, 4.23046875, 4.83154296875, 5.4326171875, 6.03369140625, 6.634765625, 7.23583984375, 7.8369140625, 8.43798828125, 9.0390625, 9.64013671875, 10.2412109375, 10.84228515625, 11.443359375, 12.04443359375, 12.6455078125, 13.24658203125, 13.84765625, 14.44873046875, 15.0498046875, 15.65087890625, 16.251953125, 16.85302734375, 17.4541015625, 18.05517578125, 18.65625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 13.0, 17.0, 27.0, 27.0, 44.0, 62.0, 85.0, 140.0, 180.0, 232.0, 335.0, 487.0, 691.0, 994.0, 1446.0, 2014.0, 2903.0, 4462.0, 6621.0, 10075.0, 15413.0, 23627.0, 37333.0, 59258.0, 104149.0, 241919.0, 258378.0, 107016.0, 61225.0, 37787.0, 24247.0, 15849.0, 10112.0, 6855.0, 4579.0, 3013.0, 2077.0, 1493.0, 1001.0, 710.0, 507.0, 335.0, 241.0, 171.0, 126.0, 82.0, 64.0, 46.0, 32.0, 18.0, 16.0, 12.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.15625, -4.9952392578125, -4.834228515625, -4.6732177734375, -4.51220703125, -4.3511962890625, -4.190185546875, -4.0291748046875, -3.8681640625, -3.7071533203125, -3.546142578125, -3.3851318359375, -3.22412109375, -3.0631103515625, -2.902099609375, -2.7410888671875, -2.580078125, -2.4190673828125, -2.258056640625, -2.0970458984375, -1.93603515625, -1.7750244140625, -1.614013671875, -1.4530029296875, -1.2919921875, -1.1309814453125, -0.969970703125, -0.8089599609375, -0.64794921875, -0.4869384765625, -0.325927734375, -0.1649169921875, -0.00390625, 0.1571044921875, 0.318115234375, 0.4791259765625, 0.64013671875, 0.8011474609375, 0.962158203125, 1.1231689453125, 1.2841796875, 1.4451904296875, 1.606201171875, 1.7672119140625, 1.92822265625, 2.0892333984375, 2.250244140625, 2.4112548828125, 2.572265625, 2.7332763671875, 2.894287109375, 3.0552978515625, 3.21630859375, 3.3773193359375, 3.538330078125, 3.6993408203125, 3.8603515625, 4.0213623046875, 4.182373046875, 4.3433837890625, 4.50439453125, 4.6654052734375, 4.826416015625, 4.9874267578125, 5.1484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 9.0, 13.0, 17.0, 18.0, 14.0, 17.0, 25.0, 21.0, 31.0, 30.0, 32.0, 32.0, 33.0, 37.0, 40.0, 38.0, 36.0, 41.0, 43.0, 33.0, 45.0, 40.0, 36.0, 22.0, 25.0, 30.0, 28.0, 29.0, 29.0, 15.0, 22.0, 16.0, 17.0, 17.0, 6.0, 7.0, 10.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-12.8828125, -12.50830078125, -12.1337890625, -11.75927734375, -11.384765625, -11.01025390625, -10.6357421875, -10.26123046875, -9.88671875, -9.51220703125, -9.1376953125, -8.76318359375, -8.388671875, -8.01416015625, -7.6396484375, -7.26513671875, -6.890625, -6.51611328125, -6.1416015625, -5.76708984375, -5.392578125, -5.01806640625, -4.6435546875, -4.26904296875, -3.89453125, -3.52001953125, -3.1455078125, -2.77099609375, -2.396484375, -2.02197265625, -1.6474609375, -1.27294921875, -0.8984375, -0.52392578125, -0.1494140625, 0.22509765625, 0.599609375, 0.97412109375, 1.3486328125, 1.72314453125, 2.09765625, 2.47216796875, 2.8466796875, 3.22119140625, 3.595703125, 3.97021484375, 4.3447265625, 4.71923828125, 5.09375, 5.46826171875, 5.8427734375, 6.21728515625, 6.591796875, 6.96630859375, 7.3408203125, 7.71533203125, 8.08984375, 8.46435546875, 8.8388671875, 9.21337890625, 9.587890625, 9.96240234375, 10.3369140625, 10.71142578125, 11.0859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 0.0, 5.0, 4.0, 7.0, 10.0, 12.0, 18.0, 25.0, 48.0, 71.0, 104.0, 125.0, 203.0, 285.0, 374.0, 557.0, 828.0, 1266.0, 1798.0, 2705.0, 4161.0, 6648.0, 10786.0, 18534.0, 33327.0, 66305.0, 157757.0, 368055.0, 201080.0, 80044.0, 38789.0, 21099.0, 12219.0, 7368.0, 4709.0, 3081.0, 1995.0, 1334.0, 882.0, 595.0, 403.0, 284.0, 208.0, 152.0, 95.0, 65.0, 42.0, 26.0, 23.0, 17.0, 11.0, 7.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0117034912109375, -0.011333346366882324, -0.010963201522827148, -0.010593056678771973, -0.010222911834716797, -0.009852766990661621, -0.009482622146606445, -0.00911247730255127, -0.008742332458496094, -0.008372187614440918, -0.008002042770385742, -0.007631897926330566, -0.007261753082275391, -0.006891608238220215, -0.006521463394165039, -0.006151318550109863, -0.0057811737060546875, -0.005411028861999512, -0.005040884017944336, -0.00467073917388916, -0.004300594329833984, -0.003930449485778809, -0.003560304641723633, -0.003190159797668457, -0.0028200149536132812, -0.0024498701095581055, -0.0020797252655029297, -0.001709580421447754, -0.0013394355773925781, -0.0009692907333374023, -0.0005991458892822266, -0.00022900104522705078, 0.000141143798828125, 0.0005112886428833008, 0.0008814334869384766, 0.0012515783309936523, 0.0016217231750488281, 0.001991868019104004, 0.0023620128631591797, 0.0027321577072143555, 0.0031023025512695312, 0.003472447395324707, 0.003842592239379883, 0.004212737083435059, 0.004582881927490234, 0.00495302677154541, 0.005323171615600586, 0.005693316459655762, 0.0060634613037109375, 0.006433606147766113, 0.006803750991821289, 0.007173895835876465, 0.007544040679931641, 0.007914185523986816, 0.008284330368041992, 0.008654475212097168, 0.009024620056152344, 0.00939476490020752, 0.009764909744262695, 0.010135054588317871, 0.010505199432373047, 0.010875344276428223, 0.011245489120483398, 0.011615633964538574, 0.01198577880859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 6.0, 6.0, 8.0, 11.0, 11.0, 18.0, 18.0, 25.0, 34.0, 48.0, 51.0, 61.0, 76.0, 75.0, 82.0, 76.0, 68.0, 63.0, 57.0, 29.0, 34.0, 24.0, 19.0, 19.0, 9.0, 8.0, 8.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1742115020751953e-05, -1.1389143764972687e-05, -1.103617250919342e-05, -1.0683201253414154e-05, -1.0330229997634888e-05, -9.977258741855621e-06, -9.624287486076355e-06, -9.271316230297089e-06, -8.918344974517822e-06, -8.565373718738556e-06, -8.21240246295929e-06, -7.859431207180023e-06, -7.506459951400757e-06, -7.1534886956214905e-06, -6.800517439842224e-06, -6.447546184062958e-06, -6.094574928283691e-06, -5.741603672504425e-06, -5.388632416725159e-06, -5.035661160945892e-06, -4.682689905166626e-06, -4.32971864938736e-06, -3.976747393608093e-06, -3.623776137828827e-06, -3.2708048820495605e-06, -2.917833626270294e-06, -2.564862370491028e-06, -2.2118911147117615e-06, -1.8589198589324951e-06, -1.5059486031532288e-06, -1.1529773473739624e-06, -8.00006091594696e-07, -4.470348358154297e-07, -9.406358003616333e-08, 2.5890767574310303e-07, 6.118789315223694e-07, 9.648501873016357e-07, 1.317821443080902e-06, 1.6707926988601685e-06, 2.023763954639435e-06, 2.376735210418701e-06, 2.7297064661979675e-06, 3.082677721977234e-06, 3.4356489777565002e-06, 3.7886202335357666e-06, 4.141591489315033e-06, 4.494562745094299e-06, 4.847534000873566e-06, 5.200505256652832e-06, 5.553476512432098e-06, 5.906447768211365e-06, 6.259419023990631e-06, 6.6123902797698975e-06, 6.965361535549164e-06, 7.31833279132843e-06, 7.671304047107697e-06, 8.024275302886963e-06, 8.37724655866623e-06, 8.730217814445496e-06, 9.083189070224762e-06, 9.436160326004028e-06, 9.789131581783295e-06, 1.0142102837562561e-05, 1.0495074093341827e-05, 1.0848045349121094e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 9.0, 1.0, 11.0, 14.0, 22.0, 24.0, 33.0, 58.0, 73.0, 111.0, 152.0, 221.0, 337.0, 527.0, 704.0, 1134.0, 1628.0, 2447.0, 3451.0, 5288.0, 8045.0, 12280.0, 19670.0, 31589.0, 55860.0, 111173.0, 265815.0, 269252.0, 113363.0, 56661.0, 32095.0, 19641.0, 12551.0, 8073.0, 5187.0, 3599.0, 2322.0, 1631.0, 1119.0, 777.0, 497.0, 355.0, 229.0, 149.0, 118.0, 74.0, 67.0, 35.0, 25.0, 18.0, 14.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.009918212890625, -0.009598374366760254, -0.009278535842895508, -0.008958697319030762, -0.008638858795166016, -0.00831902027130127, -0.007999181747436523, -0.007679343223571777, -0.007359504699707031, -0.007039666175842285, -0.006719827651977539, -0.006399989128112793, -0.006080150604248047, -0.005760312080383301, -0.005440473556518555, -0.005120635032653809, -0.0048007965087890625, -0.004480957984924316, -0.00416111946105957, -0.0038412809371948242, -0.003521442413330078, -0.003201603889465332, -0.002881765365600586, -0.00256192684173584, -0.0022420883178710938, -0.0019222497940063477, -0.0016024112701416016, -0.0012825727462768555, -0.0009627342224121094, -0.0006428956985473633, -0.0003230571746826172, -3.2186508178710938e-06, 0.000316619873046875, 0.0006364583969116211, 0.0009562969207763672, 0.0012761354446411133, 0.0015959739685058594, 0.0019158124923706055, 0.0022356510162353516, 0.0025554895401000977, 0.0028753280639648438, 0.00319516658782959, 0.003515005111694336, 0.003834843635559082, 0.004154682159423828, 0.004474520683288574, 0.00479435920715332, 0.005114197731018066, 0.0054340362548828125, 0.005753874778747559, 0.006073713302612305, 0.006393551826477051, 0.006713390350341797, 0.007033228874206543, 0.007353067398071289, 0.007672905921936035, 0.007992744445800781, 0.008312582969665527, 0.008632421493530273, 0.00895226001739502, 0.009272098541259766, 0.009591937065124512, 0.009911775588989258, 0.010231614112854004, 0.01055145263671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 9.0, 12.0, 7.0, 10.0, 13.0, 10.0, 17.0, 14.0, 22.0, 26.0, 23.0, 27.0, 38.0, 52.0, 71.0, 63.0, 81.0, 86.0, 57.0, 51.0, 56.0, 31.0, 43.0, 36.0, 18.0, 28.0, 24.0, 12.0, 12.0, 8.0, 8.0, 11.0, 6.0, 6.0, 2.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034961700439453125, -0.0033806264400482178, -0.003265082836151123, -0.0031495392322540283, -0.0030339956283569336, -0.002918452024459839, -0.002802908420562744, -0.0026873648166656494, -0.0025718212127685547, -0.00245627760887146, -0.0023407340049743652, -0.0022251904010772705, -0.0021096467971801758, -0.001994103193283081, -0.0018785595893859863, -0.0017630159854888916, -0.0016474723815917969, -0.0015319287776947021, -0.0014163851737976074, -0.0013008415699005127, -0.001185297966003418, -0.0010697543621063232, -0.0009542107582092285, -0.0008386671543121338, -0.0007231235504150391, -0.0006075799465179443, -0.0004920363426208496, -0.0003764927387237549, -0.00026094913482666016, -0.00014540553092956543, -2.9861927032470703e-05, 8.568167686462402e-05, 0.00020122528076171875, 0.0003167688846588135, 0.0004323124885559082, 0.0005478560924530029, 0.0006633996963500977, 0.0007789433002471924, 0.0008944869041442871, 0.0010100305080413818, 0.0011255741119384766, 0.0012411177158355713, 0.001356661319732666, 0.0014722049236297607, 0.0015877485275268555, 0.0017032921314239502, 0.001818835735321045, 0.0019343793392181396, 0.0020499229431152344, 0.002165466547012329, 0.002281010150909424, 0.0023965537548065186, 0.0025120973587036133, 0.002627640962600708, 0.0027431845664978027, 0.0028587281703948975, 0.002974271774291992, 0.003089815378189087, 0.0032053589820861816, 0.0033209025859832764, 0.003436446189880371, 0.003551989793777466, 0.0036675333976745605, 0.0037830770015716553, 0.00389862060546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 6.0, 9.0, 5.0, 8.0, 10.0, 17.0, 13.0, 20.0, 34.0, 43.0, 52.0, 67.0, 85.0, 96.0, 115.0, 81.0, 72.0, 42.0, 51.0, 32.0, 25.0, 18.0, 23.0, 13.0, 10.0, 15.0, 4.0, 11.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-34.47951889038086, -33.57868576049805, -32.677852630615234, -31.777019500732422, -30.876188278198242, -29.97535514831543, -29.074522018432617, -28.173688888549805, -27.272857666015625, -26.372024536132812, -25.47119140625, -24.570358276367188, -23.669527053833008, -22.768693923950195, -21.867860794067383, -20.96702766418457, -20.066194534301758, -19.165361404418945, -18.264528274536133, -17.363697052001953, -16.46286392211914, -15.562030792236328, -14.661197662353516, -13.760364532470703, -12.859532356262207, -11.958699226379395, -11.057867050170898, -10.157033920288086, -9.256200790405273, -8.355368614196777, -7.454535484313965, -6.5537028312683105, -5.652872085571289, -4.752039432525635, -3.8512065410614014, -2.950373649597168, -2.0495409965515137, -1.1487083435058594, -0.24787521362304688, 0.6529574394226074, 1.5537900924682617, 2.454622745513916, 3.3554556369781494, 4.256288528442383, 5.157121181488037, 6.057953834533691, 6.958786964416504, 7.859619617462158, 8.760452270507812, 9.661285400390625, 10.562117576599121, 11.462950706481934, 12.36378288269043, 13.264616012573242, 14.165449142456055, 15.066282272338867, 15.967114448547363, 16.86794662475586, 17.768779754638672, 18.669612884521484, 19.570446014404297, 20.47127914428711, 21.372112274169922, 22.2729434967041, 23.173776626586914]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 14.0, 6.0, 9.0, 11.0, 17.0, 20.0, 15.0, 27.0, 23.0, 29.0, 26.0, 31.0, 33.0, 35.0, 41.0, 37.0, 45.0, 46.0, 49.0, 36.0, 43.0, 45.0, 25.0, 33.0, 31.0, 23.0, 30.0, 27.0, 21.0, 24.0, 27.0, 17.0, 14.0, 9.0, 18.0, 9.0, 13.0, 9.0, 2.0, 9.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-19.327342987060547, -18.740453720092773, -18.153562545776367, -17.566673278808594, -16.97978401184082, -16.392894744873047, -15.80600357055664, -15.219114303588867, -14.632225036621094, -14.045334815979004, -13.45844554901123, -12.87155532836914, -12.284666061401367, -11.697775840759277, -11.110885620117188, -10.523996353149414, -9.937106132507324, -9.350215911865234, -8.763326644897461, -8.176436424255371, -7.589547157287598, -7.002656936645508, -6.415767192840576, -5.8288774490356445, -5.241987705230713, -4.655097961425781, -4.06820821762085, -3.481318235397339, -2.8944284915924072, -2.3075387477874756, -1.7206487655639648, -1.1337590217590332, -0.5468692779541016, 0.040020525455474854, 0.6269103288650513, 1.2138001918792725, 1.800689935684204, 2.3875796794891357, 2.9744696617126465, 3.561359405517578, 4.14824914932251, 4.735138893127441, 5.322028636932373, 5.908918380737305, 6.4958086013793945, 7.082697868347168, 7.669588088989258, 8.256477355957031, 8.843367576599121, 9.430257797241211, 10.017147064208984, 10.604037284851074, 11.190926551818848, 11.777816772460938, 12.364706039428711, 12.9515962600708, 13.53848648071289, 14.12537670135498, 14.712265968322754, 15.299156188964844, 15.886045455932617, 16.47293472290039, 17.059825897216797, 17.64671516418457, 18.233604431152344]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 13.0, 12.0, 22.0, 33.0, 59.0, 86.0, 112.0, 161.0, 242.0, 370.0, 466.0, 783.0, 1180.0, 1663.0, 2475.0, 3778.0, 5738.0, 8964.0, 13965.0, 22575.0, 37217.0, 65325.0, 125963.0, 224513.0, 230909.0, 131351.0, 67730.0, 38304.0, 23176.0, 14485.0, 9100.0, 5963.0, 3952.0, 2525.0, 1659.0, 1156.0, 801.0, 530.0, 372.0, 268.0, 189.0, 126.0, 85.0, 55.0, 37.0, 24.0, 13.0, 11.0, 9.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.0625, -34.900390625, -33.73828125, -32.576171875, -31.4140625, -30.251953125, -29.08984375, -27.927734375, -26.765625, -25.603515625, -24.44140625, -23.279296875, -22.1171875, -20.955078125, -19.79296875, -18.630859375, -17.46875, -16.306640625, -15.14453125, -13.982421875, -12.8203125, -11.658203125, -10.49609375, -9.333984375, -8.171875, -7.009765625, -5.84765625, -4.685546875, -3.5234375, -2.361328125, -1.19921875, -0.037109375, 1.125, 2.287109375, 3.44921875, 4.611328125, 5.7734375, 6.935546875, 8.09765625, 9.259765625, 10.421875, 11.583984375, 12.74609375, 13.908203125, 15.0703125, 16.232421875, 17.39453125, 18.556640625, 19.71875, 20.880859375, 22.04296875, 23.205078125, 24.3671875, 25.529296875, 26.69140625, 27.853515625, 29.015625, 30.177734375, 31.33984375, 32.501953125, 33.6640625, 34.826171875, 35.98828125, 37.150390625, 38.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 2.0, 3.0, 9.0, 10.0, 3.0, 11.0, 14.0, 13.0, 18.0, 23.0, 24.0, 18.0, 22.0, 27.0, 30.0, 29.0, 25.0, 41.0, 26.0, 46.0, 38.0, 40.0, 48.0, 49.0, 29.0, 43.0, 30.0, 42.0, 31.0, 24.0, 36.0, 25.0, 14.0, 19.0, 23.0, 20.0, 9.0, 12.0, 13.0, 11.0, 3.0, 17.0, 3.0, 5.0, 10.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.4375, -15.93408203125, -15.4306640625, -14.92724609375, -14.423828125, -13.92041015625, -13.4169921875, -12.91357421875, -12.41015625, -11.90673828125, -11.4033203125, -10.89990234375, -10.396484375, -9.89306640625, -9.3896484375, -8.88623046875, -8.3828125, -7.87939453125, -7.3759765625, -6.87255859375, -6.369140625, -5.86572265625, -5.3623046875, -4.85888671875, -4.35546875, -3.85205078125, -3.3486328125, -2.84521484375, -2.341796875, -1.83837890625, -1.3349609375, -0.83154296875, -0.328125, 0.17529296875, 0.6787109375, 1.18212890625, 1.685546875, 2.18896484375, 2.6923828125, 3.19580078125, 3.69921875, 4.20263671875, 4.7060546875, 5.20947265625, 5.712890625, 6.21630859375, 6.7197265625, 7.22314453125, 7.7265625, 8.22998046875, 8.7333984375, 9.23681640625, 9.740234375, 10.24365234375, 10.7470703125, 11.25048828125, 11.75390625, 12.25732421875, 12.7607421875, 13.26416015625, 13.767578125, 14.27099609375, 14.7744140625, 15.27783203125, 15.78125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 15.0, 28.0, 36.0, 66.0, 104.0, 140.0, 238.0, 305.0, 453.0, 632.0, 1031.0, 1462.0, 2086.0, 3061.0, 4538.0, 6448.0, 9513.0, 13497.0, 19257.0, 28027.0, 41794.0, 63747.0, 101466.0, 156918.0, 183330.0, 142606.0, 90231.0, 56938.0, 37633.0, 25707.0, 17347.0, 12482.0, 8531.0, 5855.0, 4131.0, 2825.0, 1952.0, 1283.0, 955.0, 604.0, 416.0, 289.0, 193.0, 114.0, 92.0, 57.0, 34.0, 35.0, 15.0, 13.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.796875, -26.910888671875, -26.02490234375, -25.138916015625, -24.2529296875, -23.366943359375, -22.48095703125, -21.594970703125, -20.708984375, -19.822998046875, -18.93701171875, -18.051025390625, -17.1650390625, -16.279052734375, -15.39306640625, -14.507080078125, -13.62109375, -12.735107421875, -11.84912109375, -10.963134765625, -10.0771484375, -9.191162109375, -8.30517578125, -7.419189453125, -6.533203125, -5.647216796875, -4.76123046875, -3.875244140625, -2.9892578125, -2.103271484375, -1.21728515625, -0.331298828125, 0.5546875, 1.440673828125, 2.32666015625, 3.212646484375, 4.0986328125, 4.984619140625, 5.87060546875, 6.756591796875, 7.642578125, 8.528564453125, 9.41455078125, 10.300537109375, 11.1865234375, 12.072509765625, 12.95849609375, 13.844482421875, 14.73046875, 15.616455078125, 16.50244140625, 17.388427734375, 18.2744140625, 19.160400390625, 20.04638671875, 20.932373046875, 21.818359375, 22.704345703125, 23.59033203125, 24.476318359375, 25.3623046875, 26.248291015625, 27.13427734375, 28.020263671875, 28.90625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 3.0, 8.0, 7.0, 8.0, 8.0, 11.0, 15.0, 19.0, 15.0, 22.0, 21.0, 21.0, 28.0, 32.0, 30.0, 29.0, 33.0, 34.0, 29.0, 42.0, 42.0, 42.0, 34.0, 36.0, 33.0, 41.0, 23.0, 30.0, 36.0, 31.0, 28.0, 23.0, 26.0, 23.0, 17.0, 18.0, 18.0, 17.0, 18.0, 11.0, 7.0, 6.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0234375, -9.7099609375, -9.396484375, -9.0830078125, -8.76953125, -8.4560546875, -8.142578125, -7.8291015625, -7.515625, -7.2021484375, -6.888671875, -6.5751953125, -6.26171875, -5.9482421875, -5.634765625, -5.3212890625, -5.0078125, -4.6943359375, -4.380859375, -4.0673828125, -3.75390625, -3.4404296875, -3.126953125, -2.8134765625, -2.5, -2.1865234375, -1.873046875, -1.5595703125, -1.24609375, -0.9326171875, -0.619140625, -0.3056640625, 0.0078125, 0.3212890625, 0.634765625, 0.9482421875, 1.26171875, 1.5751953125, 1.888671875, 2.2021484375, 2.515625, 2.8291015625, 3.142578125, 3.4560546875, 3.76953125, 4.0830078125, 4.396484375, 4.7099609375, 5.0234375, 5.3369140625, 5.650390625, 5.9638671875, 6.27734375, 6.5908203125, 6.904296875, 7.2177734375, 7.53125, 7.8447265625, 8.158203125, 8.4716796875, 8.78515625, 9.0986328125, 9.412109375, 9.7255859375, 10.0390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 0.0, 10.0, 11.0, 10.0, 24.0, 31.0, 61.0, 76.0, 100.0, 156.0, 234.0, 312.0, 484.0, 732.0, 1109.0, 1639.0, 2437.0, 3856.0, 6264.0, 9885.0, 16156.0, 27092.0, 49512.0, 104451.0, 253708.0, 300720.0, 129872.0, 59390.0, 31304.0, 18153.0, 11131.0, 6961.0, 4275.0, 2806.0, 1864.0, 1163.0, 849.0, 521.0, 394.0, 261.0, 169.0, 125.0, 70.0, 52.0, 41.0, 31.0, 15.0, 15.0, 9.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.228515625, -1.190277099609375, -1.15203857421875, -1.113800048828125, -1.0755615234375, -1.037322998046875, -0.99908447265625, -0.960845947265625, -0.922607421875, -0.884368896484375, -0.84613037109375, -0.807891845703125, -0.7696533203125, -0.731414794921875, -0.69317626953125, -0.654937744140625, -0.61669921875, -0.578460693359375, -0.54022216796875, -0.501983642578125, -0.4637451171875, -0.425506591796875, -0.38726806640625, -0.349029541015625, -0.310791015625, -0.272552490234375, -0.23431396484375, -0.196075439453125, -0.1578369140625, -0.119598388671875, -0.08135986328125, -0.043121337890625, -0.0048828125, 0.033355712890625, 0.07159423828125, 0.109832763671875, 0.1480712890625, 0.186309814453125, 0.22454833984375, 0.262786865234375, 0.301025390625, 0.339263916015625, 0.37750244140625, 0.415740966796875, 0.4539794921875, 0.492218017578125, 0.53045654296875, 0.568695068359375, 0.60693359375, 0.645172119140625, 0.68341064453125, 0.721649169921875, 0.7598876953125, 0.798126220703125, 0.83636474609375, 0.874603271484375, 0.912841796875, 0.951080322265625, 0.98931884765625, 1.027557373046875, 1.0657958984375, 1.104034423828125, 1.14227294921875, 1.180511474609375, 1.21875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 9.0, 9.0, 11.0, 12.0, 16.0, 17.0, 24.0, 32.0, 30.0, 84.0, 68.0, 80.0, 73.0, 103.0, 90.0, 63.0, 54.0, 45.0, 34.0, 20.0, 23.0, 12.0, 17.0, 15.0, 9.0, 9.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0001697540283203125, -0.00016408413648605347, -0.00015841424465179443, -0.0001527443528175354, -0.00014707446098327637, -0.00014140456914901733, -0.0001357346773147583, -0.00013006478548049927, -0.00012439489364624023, -0.0001187250018119812, -0.00011305510997772217, -0.00010738521814346313, -0.0001017153263092041, -9.604543447494507e-05, -9.037554264068604e-05, -8.4705650806427e-05, -7.903575897216797e-05, -7.336586713790894e-05, -6.76959753036499e-05, -6.202608346939087e-05, -5.6356191635131836e-05, -5.06862998008728e-05, -4.501640796661377e-05, -3.9346516132354736e-05, -3.36766242980957e-05, -2.800673246383667e-05, -2.2336840629577637e-05, -1.6666948795318604e-05, -1.099705696105957e-05, -5.327165126800537e-06, 3.427267074584961e-07, 6.012618541717529e-06, 1.1682510375976562e-05, 1.7352402210235596e-05, 2.302229404449463e-05, 2.8692185878753662e-05, 3.4362077713012695e-05, 4.003196954727173e-05, 4.570186138153076e-05, 5.1371753215789795e-05, 5.704164505004883e-05, 6.271153688430786e-05, 6.83814287185669e-05, 7.405132055282593e-05, 7.972121238708496e-05, 8.5391104221344e-05, 9.106099605560303e-05, 9.673088788986206e-05, 0.0001024007797241211, 0.00010807067155838013, 0.00011374056339263916, 0.0001194104552268982, 0.00012508034706115723, 0.00013075023889541626, 0.0001364201307296753, 0.00014209002256393433, 0.00014775991439819336, 0.0001534298062324524, 0.00015909969806671143, 0.00016476958990097046, 0.0001704394817352295, 0.00017610937356948853, 0.00018177926540374756, 0.0001874491572380066, 0.00019311904907226562]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 4.0, 4.0, 3.0, 9.0, 8.0, 9.0, 13.0, 23.0, 23.0, 63.0, 75.0, 96.0, 134.0, 191.0, 320.0, 476.0, 718.0, 1073.0, 1629.0, 2571.0, 4005.0, 6627.0, 10949.0, 18207.0, 32311.0, 60450.0, 127194.0, 288358.0, 256732.0, 110566.0, 53563.0, 28911.0, 16840.0, 9730.0, 6007.0, 3713.0, 2410.0, 1538.0, 1029.0, 655.0, 431.0, 273.0, 190.0, 132.0, 89.0, 68.0, 42.0, 31.0, 24.0, 6.0, 12.0, 12.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2199554443359375, -1.179168701171875, -1.1383819580078125, -1.09759521484375, -1.0568084716796875, -1.016021728515625, -0.9752349853515625, -0.9344482421875, -0.8936614990234375, -0.852874755859375, -0.8120880126953125, -0.77130126953125, -0.7305145263671875, -0.689727783203125, -0.6489410400390625, -0.608154296875, -0.5673675537109375, -0.526580810546875, -0.4857940673828125, -0.44500732421875, -0.4042205810546875, -0.363433837890625, -0.3226470947265625, -0.2818603515625, -0.2410736083984375, -0.200286865234375, -0.1595001220703125, -0.11871337890625, -0.0779266357421875, -0.037139892578125, 0.0036468505859375, 0.04443359375, 0.0852203369140625, 0.126007080078125, 0.1667938232421875, 0.20758056640625, 0.2483673095703125, 0.289154052734375, 0.3299407958984375, 0.3707275390625, 0.4115142822265625, 0.452301025390625, 0.4930877685546875, 0.53387451171875, 0.5746612548828125, 0.615447998046875, 0.6562347412109375, 0.697021484375, 0.7378082275390625, 0.778594970703125, 0.8193817138671875, 0.86016845703125, 0.9009552001953125, 0.941741943359375, 0.9825286865234375, 1.0233154296875, 1.0641021728515625, 1.104888916015625, 1.1456756591796875, 1.18646240234375, 1.2272491455078125, 1.268035888671875, 1.3088226318359375, 1.349609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 1.0, 3.0, 7.0, 10.0, 12.0, 21.0, 17.0, 21.0, 22.0, 43.0, 43.0, 47.0, 52.0, 54.0, 44.0, 55.0, 72.0, 68.0, 80.0, 63.0, 49.0, 29.0, 33.0, 31.0, 26.0, 20.0, 17.0, 16.0, 8.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41015625, -0.3960380554199219, -0.38191986083984375, -0.3678016662597656, -0.3536834716796875, -0.3395652770996094, -0.32544708251953125, -0.3113288879394531, -0.297210693359375, -0.2830924987792969, -0.26897430419921875, -0.2548561096191406, -0.2407379150390625, -0.22661972045898438, -0.21250152587890625, -0.19838333129882812, -0.18426513671875, -0.17014694213867188, -0.15602874755859375, -0.14191055297851562, -0.1277923583984375, -0.11367416381835938, -0.09955596923828125, -0.08543777465820312, -0.071319580078125, -0.057201385498046875, -0.04308319091796875, -0.028964996337890625, -0.0148468017578125, -0.000728607177734375, 0.01338958740234375, 0.027507781982421875, 0.0416259765625, 0.055744171142578125, 0.06986236572265625, 0.08398056030273438, 0.0980987548828125, 0.11221694946289062, 0.12633514404296875, 0.14045333862304688, 0.154571533203125, 0.16868972778320312, 0.18280792236328125, 0.19692611694335938, 0.2110443115234375, 0.22516250610351562, 0.23928070068359375, 0.2533988952636719, 0.26751708984375, 0.2816352844238281, 0.29575347900390625, 0.3098716735839844, 0.3239898681640625, 0.3381080627441406, 0.35222625732421875, 0.3663444519042969, 0.380462646484375, 0.3945808410644531, 0.40869903564453125, 0.4228172302246094, 0.4369354248046875, 0.4510536193847656, 0.46517181396484375, 0.4792900085449219, 0.493408203125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 7.0, 9.0, 10.0, 9.0, 21.0, 27.0, 35.0, 35.0, 53.0, 60.0, 71.0, 81.0, 80.0, 90.0, 69.0, 65.0, 49.0, 35.0, 30.0, 32.0, 22.0, 17.0, 17.0, 13.0, 10.0, 5.0, 8.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.57021141052246, -25.787111282348633, -25.004011154174805, -24.220911026000977, -23.43781280517578, -22.654712677001953, -21.871612548828125, -21.088512420654297, -20.30541229248047, -19.52231216430664, -18.739212036132812, -17.956111907958984, -17.173011779785156, -16.38991355895996, -15.606813430786133, -14.823713302612305, -14.040613174438477, -13.257513046264648, -12.47441291809082, -11.691313743591309, -10.90821361541748, -10.125113487243652, -9.34201431274414, -8.558914184570312, -7.775814056396484, -6.992713928222656, -6.209614276885986, -5.426514625549316, -4.643414497375488, -3.8603146076202393, -3.0772147178649902, -2.2941150665283203, -1.5110149383544922, -0.7279150485992432, 0.05518484115600586, 0.8382847309112549, 1.621384620666504, 2.404484510421753, 3.187584400177002, 3.970684051513672, 4.7537841796875, 5.536884307861328, 6.319983959197998, 7.103083610534668, 7.886183738708496, 8.669283866882324, 9.452383041381836, 10.235483169555664, 11.018583297729492, 11.80168342590332, 12.584783554077148, 13.36788272857666, 14.150982856750488, 14.934082984924316, 15.717182159423828, 16.500282287597656, 17.283382415771484, 18.066482543945312, 18.84958267211914, 19.63268280029297, 20.415782928466797, 21.198881149291992, 21.98198127746582, 22.76508140563965, 23.548181533813477]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 5.0, 14.0, 9.0, 23.0, 23.0, 18.0, 26.0, 22.0, 30.0, 23.0, 28.0, 30.0, 37.0, 34.0, 37.0, 36.0, 42.0, 46.0, 33.0, 35.0, 38.0, 34.0, 37.0, 24.0, 34.0, 19.0, 30.0, 31.0, 25.0, 17.0, 23.0, 27.0, 14.0, 14.0, 9.0, 10.0, 10.0, 7.0, 7.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-17.002159118652344, -16.475196838378906, -15.948235511779785, -15.421273231506348, -14.89431095123291, -14.367349624633789, -13.840387344360352, -13.313425064086914, -12.786462783813477, -12.259500503540039, -11.732539176940918, -11.20557689666748, -10.678614616394043, -10.151653289794922, -9.624691009521484, -9.097728729248047, -8.570767402648926, -8.043805122375488, -7.516843318939209, -6.98988151550293, -6.462919235229492, -5.935957431793213, -5.408995628356934, -4.882033348083496, -4.355071544647217, -3.8281095027923584, -3.3011474609375, -2.7741856575012207, -2.2472236156463623, -1.720261573791504, -1.1932997703552246, -0.6663377285003662, -0.1393756866455078, 0.3875862956047058, 0.9145482778549194, 1.4415102005004883, 1.9684722423553467, 2.495434284210205, 3.0223960876464844, 3.5493581295013428, 4.076320171356201, 4.6032819747924805, 5.130244255065918, 5.657206058502197, 6.184167861938477, 6.711130142211914, 7.238091945648193, 7.765053749084473, 8.29201602935791, 8.818978309631348, 9.345939636230469, 9.872901916503906, 10.399864196777344, 10.926826477050781, 11.453787803649902, 11.98075008392334, 12.507711410522461, 13.034673690795898, 13.56163501739502, 14.088597297668457, 14.615559577941895, 15.142520904541016, 15.669483184814453, 16.19644546508789, 16.723407745361328]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 11.0, 25.0, 29.0, 48.0, 61.0, 85.0, 136.0, 209.0, 298.0, 447.0, 666.0, 873.0, 1277.0, 1974.0, 2876.0, 4443.0, 6832.0, 10493.0, 16497.0, 26677.0, 44329.0, 78055.0, 157144.0, 528367.0, 1683805.0, 1125590.0, 257094.0, 99798.0, 54853.0, 32546.0, 20124.0, 12846.0, 8357.0, 5620.0, 3718.0, 2528.0, 1716.0, 1180.0, 835.0, 596.0, 354.0, 267.0, 183.0, 116.0, 83.0, 61.0, 53.0, 31.0, 18.0, 20.0, 8.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-29.859375, -28.919189453125, -27.97900390625, -27.038818359375, -26.0986328125, -25.158447265625, -24.21826171875, -23.278076171875, -22.337890625, -21.397705078125, -20.45751953125, -19.517333984375, -18.5771484375, -17.636962890625, -16.69677734375, -15.756591796875, -14.81640625, -13.876220703125, -12.93603515625, -11.995849609375, -11.0556640625, -10.115478515625, -9.17529296875, -8.235107421875, -7.294921875, -6.354736328125, -5.41455078125, -4.474365234375, -3.5341796875, -2.593994140625, -1.65380859375, -0.713623046875, 0.2265625, 1.166748046875, 2.10693359375, 3.047119140625, 3.9873046875, 4.927490234375, 5.86767578125, 6.807861328125, 7.748046875, 8.688232421875, 9.62841796875, 10.568603515625, 11.5087890625, 12.448974609375, 13.38916015625, 14.329345703125, 15.26953125, 16.209716796875, 17.14990234375, 18.090087890625, 19.0302734375, 19.970458984375, 20.91064453125, 21.850830078125, 22.791015625, 23.731201171875, 24.67138671875, 25.611572265625, 26.5517578125, 27.491943359375, 28.43212890625, 29.372314453125, 30.3125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 4.0, 8.0, 7.0, 12.0, 13.0, 12.0, 17.0, 20.0, 20.0, 12.0, 31.0, 18.0, 33.0, 36.0, 30.0, 43.0, 39.0, 31.0, 32.0, 33.0, 36.0, 37.0, 35.0, 33.0, 44.0, 27.0, 36.0, 33.0, 34.0, 24.0, 20.0, 23.0, 17.0, 27.0, 12.0, 22.0, 10.0, 14.0, 9.0, 9.0, 9.0, 8.0, 6.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-13.1875, -12.7674560546875, -12.347412109375, -11.9273681640625, -11.50732421875, -11.0872802734375, -10.667236328125, -10.2471923828125, -9.8271484375, -9.4071044921875, -8.987060546875, -8.5670166015625, -8.14697265625, -7.7269287109375, -7.306884765625, -6.8868408203125, -6.466796875, -6.0467529296875, -5.626708984375, -5.2066650390625, -4.78662109375, -4.3665771484375, -3.946533203125, -3.5264892578125, -3.1064453125, -2.6864013671875, -2.266357421875, -1.8463134765625, -1.42626953125, -1.0062255859375, -0.586181640625, -0.1661376953125, 0.25390625, 0.6739501953125, 1.093994140625, 1.5140380859375, 1.93408203125, 2.3541259765625, 2.774169921875, 3.1942138671875, 3.6142578125, 4.0343017578125, 4.454345703125, 4.8743896484375, 5.29443359375, 5.7144775390625, 6.134521484375, 6.5545654296875, 6.974609375, 7.3946533203125, 7.814697265625, 8.2347412109375, 8.65478515625, 9.0748291015625, 9.494873046875, 9.9149169921875, 10.3349609375, 10.7550048828125, 11.175048828125, 11.5950927734375, 12.01513671875, 12.4351806640625, 12.855224609375, 13.2752685546875, 13.6953125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 9.0, 17.0, 16.0, 30.0, 45.0, 53.0, 110.0, 130.0, 178.0, 235.0, 408.0, 571.0, 833.0, 1169.0, 1804.0, 2637.0, 4250.0, 6424.0, 9927.0, 15479.0, 23894.0, 38926.0, 65264.0, 116067.0, 221591.0, 487986.0, 1513298.0, 931592.0, 348171.0, 169973.0, 91105.0, 52728.0, 32022.0, 20155.0, 12714.0, 8381.0, 5393.0, 3494.0, 2330.0, 1525.0, 1060.0, 703.0, 486.0, 329.0, 244.0, 164.0, 116.0, 66.0, 54.0, 40.0, 29.0, 23.0, 11.0, 6.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0], "bins": [-23.5, -22.71142578125, -21.9228515625, -21.13427734375, -20.345703125, -19.55712890625, -18.7685546875, -17.97998046875, -17.19140625, -16.40283203125, -15.6142578125, -14.82568359375, -14.037109375, -13.24853515625, -12.4599609375, -11.67138671875, -10.8828125, -10.09423828125, -9.3056640625, -8.51708984375, -7.728515625, -6.93994140625, -6.1513671875, -5.36279296875, -4.57421875, -3.78564453125, -2.9970703125, -2.20849609375, -1.419921875, -0.63134765625, 0.1572265625, 0.94580078125, 1.734375, 2.52294921875, 3.3115234375, 4.10009765625, 4.888671875, 5.67724609375, 6.4658203125, 7.25439453125, 8.04296875, 8.83154296875, 9.6201171875, 10.40869140625, 11.197265625, 11.98583984375, 12.7744140625, 13.56298828125, 14.3515625, 15.14013671875, 15.9287109375, 16.71728515625, 17.505859375, 18.29443359375, 19.0830078125, 19.87158203125, 20.66015625, 21.44873046875, 22.2373046875, 23.02587890625, 23.814453125, 24.60302734375, 25.3916015625, 26.18017578125, 26.96875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 2.0, 7.0, 7.0, 15.0, 15.0, 21.0, 19.0, 37.0, 40.0, 45.0, 62.0, 47.0, 65.0, 94.0, 109.0, 152.0, 159.0, 211.0, 300.0, 424.0, 515.0, 378.0, 253.0, 216.0, 163.0, 136.0, 108.0, 82.0, 74.0, 48.0, 50.0, 36.0, 41.0, 32.0, 23.0, 16.0, 15.0, 13.0, 7.0, 6.0, 5.0, 6.0, 2.0, 3.0, 8.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.92578125, -7.64581298828125, -7.3658447265625, -7.08587646484375, -6.805908203125, -6.52593994140625, -6.2459716796875, -5.96600341796875, -5.68603515625, -5.40606689453125, -5.1260986328125, -4.84613037109375, -4.566162109375, -4.28619384765625, -4.0062255859375, -3.72625732421875, -3.4462890625, -3.16632080078125, -2.8863525390625, -2.60638427734375, -2.326416015625, -2.04644775390625, -1.7664794921875, -1.48651123046875, -1.20654296875, -0.92657470703125, -0.6466064453125, -0.36663818359375, -0.086669921875, 0.19329833984375, 0.4732666015625, 0.75323486328125, 1.033203125, 1.31317138671875, 1.5931396484375, 1.87310791015625, 2.153076171875, 2.43304443359375, 2.7130126953125, 2.99298095703125, 3.27294921875, 3.55291748046875, 3.8328857421875, 4.11285400390625, 4.392822265625, 4.67279052734375, 4.9527587890625, 5.23272705078125, 5.5126953125, 5.79266357421875, 6.0726318359375, 6.35260009765625, 6.632568359375, 6.91253662109375, 7.1925048828125, 7.47247314453125, 7.75244140625, 8.03240966796875, 8.3123779296875, 8.59234619140625, 8.872314453125, 9.15228271484375, 9.4322509765625, 9.71221923828125, 9.9921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 9.0, 12.0, 5.0, 8.0, 16.0, 16.0, 19.0, 25.0, 32.0, 42.0, 42.0, 70.0, 62.0, 87.0, 89.0, 60.0, 62.0, 61.0, 53.0, 40.0, 24.0, 37.0, 13.0, 24.0, 14.0, 11.0, 11.0, 8.0, 10.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.668960571289062, -20.013935089111328, -19.35890769958496, -18.703882217407227, -18.048856735229492, -17.393829345703125, -16.73880386352539, -16.083778381347656, -15.428751945495605, -14.773725509643555, -14.11870002746582, -13.46367359161377, -12.808647155761719, -12.153621673583984, -11.498595237731934, -10.843568801879883, -10.188543319702148, -9.533516883850098, -8.878491401672363, -8.223464965820312, -7.56843900680542, -6.913413047790527, -6.258386611938477, -5.603360652923584, -4.948334693908691, -4.293308734893799, -3.638282537460327, -2.9832563400268555, -2.328230381011963, -1.6732044219970703, -1.0181782245635986, -0.36315202713012695, 0.29187583923339844, 0.9469019174575806, 1.6019279956817627, 2.2569541931152344, 2.911980152130127, 3.5670061111450195, 4.22203254699707, 4.877058506011963, 5.5320844650268555, 6.187110424041748, 6.842136383056641, 7.497162818908691, 8.152189254760742, 8.807214736938477, 9.462241172790527, 10.117267608642578, 10.772293090820312, 11.427319526672363, 12.082345008850098, 12.737371444702148, 13.392396926879883, 14.047423362731934, 14.702449798583984, 15.357475280761719, 16.012500762939453, 16.667526245117188, 17.322553634643555, 17.97757911682129, 18.632604598999023, 19.28763198852539, 19.942657470703125, 20.59768295288086, 21.252710342407227]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 8.0, 2.0, 3.0, 6.0, 11.0, 15.0, 10.0, 9.0, 21.0, 25.0, 20.0, 14.0, 14.0, 35.0, 28.0, 35.0, 33.0, 26.0, 36.0, 28.0, 34.0, 36.0, 34.0, 30.0, 35.0, 42.0, 35.0, 30.0, 32.0, 32.0, 22.0, 32.0, 20.0, 18.0, 27.0, 26.0, 21.0, 16.0, 21.0, 9.0, 12.0, 9.0, 6.0, 10.0, 12.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-14.787582397460938, -14.345206260681152, -13.902830123901367, -13.460453987121582, -13.018077850341797, -12.575701713562012, -12.133325576782227, -11.690948486328125, -11.248573303222656, -10.806197166442871, -10.363821029663086, -9.9214448928833, -9.479068756103516, -9.03669261932373, -8.594316482543945, -8.151939392089844, -7.709563255310059, -7.267187118530273, -6.824810981750488, -6.382434844970703, -5.940058708190918, -5.497682571411133, -5.0553059577941895, -4.612929821014404, -4.170553684234619, -3.728177547454834, -3.285801410675049, -2.8434250354766846, -2.4010488986968994, -1.9586727619171143, -1.51629638671875, -1.0739202499389648, -0.6315441131591797, -0.18916791677474976, 0.2532082796096802, 0.6955845355987549, 1.13796067237854, 1.5803368091583252, 2.0227131843566895, 2.4650893211364746, 2.9074654579162598, 3.349841594696045, 3.79221773147583, 4.234594345092773, 4.676970481872559, 5.119346618652344, 5.561722755432129, 6.004098892211914, 6.446475028991699, 6.888851165771484, 7.3312273025512695, 7.773603439331055, 8.21597957611084, 8.658355712890625, 9.100732803344727, 9.543107986450195, 9.985485076904297, 10.427861213684082, 10.870237350463867, 11.312613487243652, 11.754989624023438, 12.197365760803223, 12.639741897583008, 13.08211898803711, 13.524494171142578]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 8.0, 12.0, 12.0, 46.0, 54.0, 73.0, 107.0, 162.0, 220.0, 292.0, 370.0, 559.0, 797.0, 1084.0, 1583.0, 2265.0, 3373.0, 4601.0, 6499.0, 9607.0, 13875.0, 20652.0, 30547.0, 46004.0, 72433.0, 120881.0, 297813.0, 159673.0, 87264.0, 54850.0, 35963.0, 23835.0, 16486.0, 10875.0, 7732.0, 5422.0, 3667.0, 2587.0, 1790.0, 1378.0, 896.0, 605.0, 461.0, 368.0, 248.0, 153.0, 111.0, 76.0, 53.0, 42.0, 35.0, 21.0, 15.0, 12.0, 2.0, 3.0, 3.0], "bins": [-4.08984375, -3.968475341796875, -3.84710693359375, -3.725738525390625, -3.6043701171875, -3.483001708984375, -3.36163330078125, -3.240264892578125, -3.118896484375, -2.997528076171875, -2.87615966796875, -2.754791259765625, -2.6334228515625, -2.512054443359375, -2.39068603515625, -2.269317626953125, -2.14794921875, -2.026580810546875, -1.90521240234375, -1.783843994140625, -1.6624755859375, -1.541107177734375, -1.41973876953125, -1.298370361328125, -1.177001953125, -1.055633544921875, -0.93426513671875, -0.812896728515625, -0.6915283203125, -0.570159912109375, -0.44879150390625, -0.327423095703125, -0.2060546875, -0.084686279296875, 0.03668212890625, 0.158050537109375, 0.2794189453125, 0.400787353515625, 0.52215576171875, 0.643524169921875, 0.764892578125, 0.886260986328125, 1.00762939453125, 1.128997802734375, 1.2503662109375, 1.371734619140625, 1.49310302734375, 1.614471435546875, 1.73583984375, 1.857208251953125, 1.97857666015625, 2.099945068359375, 2.2213134765625, 2.342681884765625, 2.46405029296875, 2.585418701171875, 2.706787109375, 2.828155517578125, 2.94952392578125, 3.070892333984375, 3.1922607421875, 3.313629150390625, 3.43499755859375, 3.556365966796875, 3.677734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 1.0, 3.0, 4.0, 13.0, 8.0, 7.0, 18.0, 14.0, 15.0, 19.0, 23.0, 25.0, 22.0, 19.0, 34.0, 25.0, 27.0, 39.0, 32.0, 34.0, 36.0, 20.0, 30.0, 42.0, 43.0, 33.0, 39.0, 31.0, 27.0, 22.0, 24.0, 29.0, 29.0, 25.0, 24.0, 26.0, 17.0, 18.0, 21.0, 10.0, 10.0, 11.0, 7.0, 11.0, 6.0, 3.0, 10.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.5234375, -13.0777587890625, -12.632080078125, -12.1864013671875, -11.74072265625, -11.2950439453125, -10.849365234375, -10.4036865234375, -9.9580078125, -9.5123291015625, -9.066650390625, -8.6209716796875, -8.17529296875, -7.7296142578125, -7.283935546875, -6.8382568359375, -6.392578125, -5.9468994140625, -5.501220703125, -5.0555419921875, -4.60986328125, -4.1641845703125, -3.718505859375, -3.2728271484375, -2.8271484375, -2.3814697265625, -1.935791015625, -1.4901123046875, -1.04443359375, -0.5987548828125, -0.153076171875, 0.2926025390625, 0.73828125, 1.1839599609375, 1.629638671875, 2.0753173828125, 2.52099609375, 2.9666748046875, 3.412353515625, 3.8580322265625, 4.3037109375, 4.7493896484375, 5.195068359375, 5.6407470703125, 6.08642578125, 6.5321044921875, 6.977783203125, 7.4234619140625, 7.869140625, 8.3148193359375, 8.760498046875, 9.2061767578125, 9.65185546875, 10.0975341796875, 10.543212890625, 10.9888916015625, 11.4345703125, 11.8802490234375, 12.325927734375, 12.7716064453125, 13.21728515625, 13.6629638671875, 14.108642578125, 14.5543212890625, 15.0]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 11.0, 9.0, 15.0, 34.0, 46.0, 65.0, 129.0, 158.0, 241.0, 314.0, 469.0, 619.0, 968.0, 1438.0, 2062.0, 2976.0, 4292.0, 6595.0, 10297.0, 15354.0, 23975.0, 37034.0, 60633.0, 106959.0, 256501.0, 246345.0, 105300.0, 59909.0, 36627.0, 23707.0, 15322.0, 10069.0, 6586.0, 4284.0, 2902.0, 1910.0, 1447.0, 869.0, 643.0, 494.0, 294.0, 207.0, 152.0, 98.0, 76.0, 37.0, 33.0, 19.0, 14.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.46484375, -4.32525634765625, -4.1856689453125, -4.04608154296875, -3.906494140625, -3.76690673828125, -3.6273193359375, -3.48773193359375, -3.34814453125, -3.20855712890625, -3.0689697265625, -2.92938232421875, -2.789794921875, -2.65020751953125, -2.5106201171875, -2.37103271484375, -2.2314453125, -2.09185791015625, -1.9522705078125, -1.81268310546875, -1.673095703125, -1.53350830078125, -1.3939208984375, -1.25433349609375, -1.11474609375, -0.97515869140625, -0.8355712890625, -0.69598388671875, -0.556396484375, -0.41680908203125, -0.2772216796875, -0.13763427734375, 0.001953125, 0.14154052734375, 0.2811279296875, 0.42071533203125, 0.560302734375, 0.69989013671875, 0.8394775390625, 0.97906494140625, 1.11865234375, 1.25823974609375, 1.3978271484375, 1.53741455078125, 1.677001953125, 1.81658935546875, 1.9561767578125, 2.09576416015625, 2.2353515625, 2.37493896484375, 2.5145263671875, 2.65411376953125, 2.793701171875, 2.93328857421875, 3.0728759765625, 3.21246337890625, 3.35205078125, 3.49163818359375, 3.6312255859375, 3.77081298828125, 3.910400390625, 4.04998779296875, 4.1895751953125, 4.32916259765625, 4.46875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 13.0, 5.0, 8.0, 7.0, 13.0, 10.0, 12.0, 30.0, 11.0, 24.0, 17.0, 19.0, 25.0, 31.0, 26.0, 32.0, 21.0, 39.0, 39.0, 35.0, 34.0, 43.0, 39.0, 36.0, 40.0, 32.0, 41.0, 28.0, 35.0, 42.0, 23.0, 29.0, 17.0, 18.0, 19.0, 22.0, 13.0, 13.0, 12.0, 11.0, 9.0, 4.0, 10.0, 7.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.408447265625, -8.09814453125, -7.787841796875, -7.4775390625, -7.167236328125, -6.85693359375, -6.546630859375, -6.236328125, -5.926025390625, -5.61572265625, -5.305419921875, -4.9951171875, -4.684814453125, -4.37451171875, -4.064208984375, -3.75390625, -3.443603515625, -3.13330078125, -2.822998046875, -2.5126953125, -2.202392578125, -1.89208984375, -1.581787109375, -1.271484375, -0.961181640625, -0.65087890625, -0.340576171875, -0.0302734375, 0.280029296875, 0.59033203125, 0.900634765625, 1.2109375, 1.521240234375, 1.83154296875, 2.141845703125, 2.4521484375, 2.762451171875, 3.07275390625, 3.383056640625, 3.693359375, 4.003662109375, 4.31396484375, 4.624267578125, 4.9345703125, 5.244873046875, 5.55517578125, 5.865478515625, 6.17578125, 6.486083984375, 6.79638671875, 7.106689453125, 7.4169921875, 7.727294921875, 8.03759765625, 8.347900390625, 8.658203125, 8.968505859375, 9.27880859375, 9.589111328125, 9.8994140625, 10.209716796875, 10.52001953125, 10.830322265625, 11.140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 9.0, 12.0, 13.0, 15.0, 18.0, 21.0, 52.0, 51.0, 77.0, 93.0, 131.0, 172.0, 246.0, 278.0, 422.0, 534.0, 800.0, 1124.0, 1708.0, 2626.0, 4422.0, 7689.0, 14632.0, 29881.0, 70520.0, 205961.0, 423231.0, 166850.0, 59593.0, 25750.0, 12821.0, 6789.0, 4031.0, 2536.0, 1596.0, 1100.0, 743.0, 507.0, 389.0, 274.0, 203.0, 181.0, 123.0, 69.0, 74.0, 60.0, 38.0, 23.0, 18.0, 10.0, 12.0, 8.0, 9.0, 6.0, 1.0, 0.0, 5.0, 1.0], "bins": [-0.0112152099609375, -0.010869145393371582, -0.010523080825805664, -0.010177016258239746, -0.009830951690673828, -0.00948488712310791, -0.009138822555541992, -0.008792757987976074, -0.008446693420410156, -0.008100628852844238, -0.00775456428527832, -0.007408499717712402, -0.007062435150146484, -0.006716370582580566, -0.0063703060150146484, -0.0060242414474487305, -0.0056781768798828125, -0.0053321123123168945, -0.0049860477447509766, -0.004639983177185059, -0.004293918609619141, -0.003947854042053223, -0.0036017894744873047, -0.0032557249069213867, -0.0029096603393554688, -0.0025635957717895508, -0.002217531204223633, -0.0018714666366577148, -0.0015254020690917969, -0.001179337501525879, -0.0008332729339599609, -0.00048720836639404297, -0.000141143798828125, 0.00020492076873779297, 0.0005509853363037109, 0.0008970499038696289, 0.0012431144714355469, 0.0015891790390014648, 0.0019352436065673828, 0.0022813081741333008, 0.0026273727416992188, 0.0029734373092651367, 0.0033195018768310547, 0.0036655664443969727, 0.004011631011962891, 0.004357695579528809, 0.0047037601470947266, 0.0050498247146606445, 0.0053958892822265625, 0.0057419538497924805, 0.0060880184173583984, 0.006434082984924316, 0.006780147552490234, 0.007126212120056152, 0.00747227668762207, 0.007818341255187988, 0.008164405822753906, 0.008510470390319824, 0.008856534957885742, 0.00920259952545166, 0.009548664093017578, 0.009894728660583496, 0.010240793228149414, 0.010586857795715332, 0.01093292236328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 13.0, 12.0, 16.0, 22.0, 35.0, 50.0, 61.0, 74.0, 108.0, 103.0, 103.0, 114.0, 62.0, 42.0, 41.0, 34.0, 15.0, 21.0, 12.0, 11.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0609626770019531e-05, -1.0166317224502563e-05, -9.723007678985596e-06, -9.279698133468628e-06, -8.83638858795166e-06, -8.393079042434692e-06, -7.949769496917725e-06, -7.506459951400757e-06, -7.063150405883789e-06, -6.619840860366821e-06, -6.1765313148498535e-06, -5.733221769332886e-06, -5.289912223815918e-06, -4.84660267829895e-06, -4.403293132781982e-06, -3.959983587265015e-06, -3.516674041748047e-06, -3.073364496231079e-06, -2.6300549507141113e-06, -2.1867454051971436e-06, -1.7434358596801758e-06, -1.300126314163208e-06, -8.568167686462402e-07, -4.1350722312927246e-07, 2.9802322387695312e-08, 4.731118679046631e-07, 9.164214134216309e-07, 1.3597309589385986e-06, 1.8030405044555664e-06, 2.246350049972534e-06, 2.689659595489502e-06, 3.1329691410064697e-06, 3.5762786865234375e-06, 4.019588232040405e-06, 4.462897777557373e-06, 4.906207323074341e-06, 5.349516868591309e-06, 5.792826414108276e-06, 6.236135959625244e-06, 6.679445505142212e-06, 7.12275505065918e-06, 7.5660645961761475e-06, 8.009374141693115e-06, 8.452683687210083e-06, 8.89599323272705e-06, 9.339302778244019e-06, 9.782612323760986e-06, 1.0225921869277954e-05, 1.0669231414794922e-05, 1.111254096031189e-05, 1.1555850505828857e-05, 1.1999160051345825e-05, 1.2442469596862793e-05, 1.288577914237976e-05, 1.3329088687896729e-05, 1.3772398233413696e-05, 1.4215707778930664e-05, 1.4659017324447632e-05, 1.51023268699646e-05, 1.5545636415481567e-05, 1.5988945960998535e-05, 1.6432255506515503e-05, 1.687556505203247e-05, 1.731887459754944e-05, 1.7762184143066406e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 10.0, 7.0, 9.0, 12.0, 24.0, 32.0, 52.0, 80.0, 108.0, 158.0, 207.0, 294.0, 484.0, 637.0, 919.0, 1369.0, 2128.0, 3288.0, 5359.0, 8618.0, 14831.0, 27916.0, 57652.0, 141387.0, 375246.0, 233597.0, 85723.0, 38937.0, 19862.0, 11170.0, 6511.0, 4072.0, 2587.0, 1659.0, 1220.0, 697.0, 542.0, 349.0, 256.0, 150.0, 126.0, 79.0, 46.0, 42.0, 36.0, 23.0, 18.0, 11.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0102081298828125, -0.009896278381347656, -0.009584426879882812, -0.009272575378417969, -0.008960723876953125, -0.008648872375488281, -0.008337020874023438, -0.008025169372558594, -0.00771331787109375, -0.007401466369628906, -0.0070896148681640625, -0.006777763366699219, -0.006465911865234375, -0.006154060363769531, -0.0058422088623046875, -0.005530357360839844, -0.005218505859375, -0.004906654357910156, -0.0045948028564453125, -0.004282951354980469, -0.003971099853515625, -0.0036592483520507812, -0.0033473968505859375, -0.0030355453491210938, -0.00272369384765625, -0.0024118423461914062, -0.0020999908447265625, -0.0017881393432617188, -0.001476287841796875, -0.0011644363403320312, -0.0008525848388671875, -0.0005407333374023438, -0.0002288818359375, 8.296966552734375e-05, 0.0003948211669921875, 0.0007066726684570312, 0.001018524169921875, 0.0013303756713867188, 0.0016422271728515625, 0.0019540786743164062, 0.00226593017578125, 0.0025777816772460938, 0.0028896331787109375, 0.0032014846801757812, 0.003513336181640625, 0.0038251876831054688, 0.0041370391845703125, 0.004448890686035156, 0.0047607421875, 0.005072593688964844, 0.0053844451904296875, 0.005696296691894531, 0.006008148193359375, 0.006319999694824219, 0.0066318511962890625, 0.006943702697753906, 0.00725555419921875, 0.007567405700683594, 0.007879257202148438, 0.008191108703613281, 0.008502960205078125, 0.008814811706542969, 0.009126663208007812, 0.009438514709472656, 0.0097503662109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 7.0, 1.0, 5.0, 8.0, 6.0, 14.0, 13.0, 10.0, 15.0, 19.0, 20.0, 36.0, 54.0, 52.0, 95.0, 122.0, 122.0, 106.0, 71.0, 47.0, 36.0, 29.0, 27.0, 13.0, 18.0, 14.0, 4.0, 8.0, 8.0, 5.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00386810302734375, -0.0037619173526763916, -0.003655731678009033, -0.003549546003341675, -0.0034433603286743164, -0.003337174654006958, -0.0032309889793395996, -0.003124803304672241, -0.003018617630004883, -0.0029124319553375244, -0.002806246280670166, -0.0027000606060028076, -0.0025938749313354492, -0.002487689256668091, -0.0023815035820007324, -0.002275317907333374, -0.0021691322326660156, -0.0020629465579986572, -0.001956760883331299, -0.0018505752086639404, -0.001744389533996582, -0.0016382038593292236, -0.0015320181846618652, -0.0014258325099945068, -0.0013196468353271484, -0.00121346116065979, -0.0011072754859924316, -0.0010010898113250732, -0.0008949041366577148, -0.0007887184619903564, -0.000682532787322998, -0.0005763471126556396, -0.00047016143798828125, -0.00036397576332092285, -0.00025779008865356445, -0.00015160441398620605, -4.5418739318847656e-05, 6.076693534851074e-05, 0.00016695261001586914, 0.00027313828468322754, 0.00037932395935058594, 0.00048550963401794434, 0.0005916953086853027, 0.0006978809833526611, 0.0008040666580200195, 0.0009102523326873779, 0.0010164380073547363, 0.0011226236820220947, 0.0012288093566894531, 0.0013349950313568115, 0.00144118070602417, 0.0015473663806915283, 0.0016535520553588867, 0.0017597377300262451, 0.0018659234046936035, 0.001972109079360962, 0.0020782947540283203, 0.0021844804286956787, 0.002290666103363037, 0.0023968517780303955, 0.002503037452697754, 0.0026092231273651123, 0.0027154088020324707, 0.002821594476699829, 0.0029277801513671875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 5.0, 9.0, 11.0, 10.0, 12.0, 16.0, 20.0, 24.0, 37.0, 44.0, 41.0, 67.0, 80.0, 69.0, 92.0, 56.0, 66.0, 47.0, 63.0, 37.0, 29.0, 32.0, 15.0, 24.0, 11.0, 14.0, 11.0, 8.0, 3.0, 12.0, 2.0, 8.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40215301513672, -19.755403518676758, -19.108652114868164, -18.461902618408203, -17.81515121459961, -17.16840171813965, -16.521650314331055, -15.874900817871094, -15.228150367736816, -14.581399917602539, -13.934649467468262, -13.287899017333984, -12.641149520874023, -11.99439811706543, -11.347648620605469, -10.700898170471191, -10.054147720336914, -9.407397270202637, -8.76064682006836, -8.113896369934082, -7.467146396636963, -6.8203959465026855, -6.173645973205566, -5.526895523071289, -4.880145072937012, -4.233394622802734, -3.586644411087036, -2.939894199371338, -2.2931437492370605, -1.6463932991027832, -0.999643087387085, -0.3528928756713867, 0.2938556671142578, 0.9406059980392456, 1.5873563289642334, 2.2341065406799316, 2.880856990814209, 3.5276074409484863, 4.1743574142456055, 4.821107864379883, 5.46785831451416, 6.1146087646484375, 6.761359214782715, 7.408109188079834, 8.054859161376953, 8.701610565185547, 9.348360061645508, 9.995110511779785, 10.641860961914062, 11.28861141204834, 11.935361862182617, 12.582112312316895, 13.228862762451172, 13.875612258911133, 14.52236270904541, 15.169113159179688, 15.815863609313965, 16.462614059448242, 17.109363555908203, 17.756114959716797, 18.402864456176758, 19.04961585998535, 19.696365356445312, 20.343116760253906, 20.989866256713867]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 2.0, 3.0, 7.0, 10.0, 15.0, 10.0, 11.0, 19.0, 24.0, 21.0, 15.0, 12.0, 35.0, 33.0, 31.0, 33.0, 28.0, 34.0, 28.0, 37.0, 32.0, 37.0, 29.0, 34.0, 43.0, 33.0, 31.0, 32.0, 33.0, 20.0, 32.0, 21.0, 18.0, 26.0, 26.0, 22.0, 16.0, 21.0, 10.0, 9.0, 12.0, 5.0, 9.0, 13.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-14.600467681884766, -14.163003921508789, -13.725541114807129, -13.288077354431152, -12.850613594055176, -12.413150787353516, -11.975687026977539, -11.538223266601562, -11.100759506225586, -10.66329574584961, -10.22583293914795, -9.788369178771973, -9.350905418395996, -8.913442611694336, -8.47597885131836, -8.038515090942383, -7.601052284240723, -7.163589000701904, -6.726125240325928, -6.288661956787109, -5.851198196411133, -5.4137349128723145, -4.976271629333496, -4.5388078689575195, -4.101344585418701, -3.6638810634613037, -3.2264175415039062, -2.788954257965088, -2.3514907360076904, -1.914027214050293, -1.4765639305114746, -1.0391004085540771, -0.6016368865966797, -0.164173424243927, 0.2732900381088257, 0.7107534408569336, 1.148216962814331, 1.5856804847717285, 2.023143768310547, 2.4606072902679443, 2.898070812225342, 3.3355343341827393, 3.7729978561401367, 4.210461139678955, 4.647924423217773, 5.08538818359375, 5.522851467132568, 5.960314750671387, 6.397778511047363, 6.835241794586182, 7.272705554962158, 7.710168838500977, 8.147632598876953, 8.58509635925293, 9.02255916595459, 9.460022926330566, 9.897485733032227, 10.334949493408203, 10.772412300109863, 11.20987606048584, 11.647339820861816, 12.084802627563477, 12.522266387939453, 12.95973014831543, 13.397193908691406]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 8.0, 16.0, 20.0, 24.0, 34.0, 86.0, 107.0, 171.0, 240.0, 351.0, 537.0, 781.0, 1096.0, 1528.0, 2176.0, 3044.0, 4333.0, 5993.0, 8450.0, 11906.0, 17472.0, 25027.0, 38677.0, 59931.0, 97632.0, 149320.0, 180462.0, 151989.0, 100460.0, 61913.0, 39402.0, 26015.0, 17790.0, 12103.0, 8518.0, 6144.0, 4287.0, 3181.0, 2197.0, 1596.0, 1081.0, 780.0, 505.0, 428.0, 272.0, 188.0, 92.0, 54.0, 61.0, 38.0, 24.0, 12.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -22.110595703125, -21.36181640625, -20.613037109375, -19.8642578125, -19.115478515625, -18.36669921875, -17.617919921875, -16.869140625, -16.120361328125, -15.37158203125, -14.622802734375, -13.8740234375, -13.125244140625, -12.37646484375, -11.627685546875, -10.87890625, -10.130126953125, -9.38134765625, -8.632568359375, -7.8837890625, -7.135009765625, -6.38623046875, -5.637451171875, -4.888671875, -4.139892578125, -3.39111328125, -2.642333984375, -1.8935546875, -1.144775390625, -0.39599609375, 0.352783203125, 1.1015625, 1.850341796875, 2.59912109375, 3.347900390625, 4.0966796875, 4.845458984375, 5.59423828125, 6.343017578125, 7.091796875, 7.840576171875, 8.58935546875, 9.338134765625, 10.0869140625, 10.835693359375, 11.58447265625, 12.333251953125, 13.08203125, 13.830810546875, 14.57958984375, 15.328369140625, 16.0771484375, 16.825927734375, 17.57470703125, 18.323486328125, 19.072265625, 19.821044921875, 20.56982421875, 21.318603515625, 22.0673828125, 22.816162109375, 23.56494140625, 24.313720703125, 25.0625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 8.0, 4.0, 9.0, 7.0, 10.0, 17.0, 11.0, 13.0, 10.0, 19.0, 16.0, 20.0, 28.0, 26.0, 35.0, 29.0, 28.0, 37.0, 34.0, 33.0, 36.0, 31.0, 29.0, 32.0, 34.0, 36.0, 30.0, 37.0, 30.0, 32.0, 28.0, 21.0, 28.0, 29.0, 29.0, 18.0, 15.0, 15.0, 18.0, 7.0, 14.0, 8.0, 9.0, 10.0, 12.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 4.0], "bins": [-13.8046875, -13.4119873046875, -13.019287109375, -12.6265869140625, -12.23388671875, -11.8411865234375, -11.448486328125, -11.0557861328125, -10.6630859375, -10.2703857421875, -9.877685546875, -9.4849853515625, -9.09228515625, -8.6995849609375, -8.306884765625, -7.9141845703125, -7.521484375, -7.1287841796875, -6.736083984375, -6.3433837890625, -5.95068359375, -5.5579833984375, -5.165283203125, -4.7725830078125, -4.3798828125, -3.9871826171875, -3.594482421875, -3.2017822265625, -2.80908203125, -2.4163818359375, -2.023681640625, -1.6309814453125, -1.23828125, -0.8455810546875, -0.452880859375, -0.0601806640625, 0.33251953125, 0.7252197265625, 1.117919921875, 1.5106201171875, 1.9033203125, 2.2960205078125, 2.688720703125, 3.0814208984375, 3.47412109375, 3.8668212890625, 4.259521484375, 4.6522216796875, 5.044921875, 5.4376220703125, 5.830322265625, 6.2230224609375, 6.61572265625, 7.0084228515625, 7.401123046875, 7.7938232421875, 8.1865234375, 8.5792236328125, 8.971923828125, 9.3646240234375, 9.75732421875, 10.1500244140625, 10.542724609375, 10.9354248046875, 11.328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 17.0, 22.0, 29.0, 46.0, 60.0, 103.0, 128.0, 197.0, 283.0, 442.0, 688.0, 1011.0, 1590.0, 2499.0, 3821.0, 6093.0, 9662.0, 15127.0, 23869.0, 37912.0, 63817.0, 114081.0, 196701.0, 221363.0, 144668.0, 79335.0, 46451.0, 28621.0, 18011.0, 11464.0, 7216.0, 4671.0, 2945.0, 1944.0, 1245.0, 755.0, 520.0, 351.0, 224.0, 189.0, 115.0, 72.0, 81.0, 40.0, 28.0, 13.0, 9.0, 4.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.1875, -30.248046875, -29.30859375, -28.369140625, -27.4296875, -26.490234375, -25.55078125, -24.611328125, -23.671875, -22.732421875, -21.79296875, -20.853515625, -19.9140625, -18.974609375, -18.03515625, -17.095703125, -16.15625, -15.216796875, -14.27734375, -13.337890625, -12.3984375, -11.458984375, -10.51953125, -9.580078125, -8.640625, -7.701171875, -6.76171875, -5.822265625, -4.8828125, -3.943359375, -3.00390625, -2.064453125, -1.125, -0.185546875, 0.75390625, 1.693359375, 2.6328125, 3.572265625, 4.51171875, 5.451171875, 6.390625, 7.330078125, 8.26953125, 9.208984375, 10.1484375, 11.087890625, 12.02734375, 12.966796875, 13.90625, 14.845703125, 15.78515625, 16.724609375, 17.6640625, 18.603515625, 19.54296875, 20.482421875, 21.421875, 22.361328125, 23.30078125, 24.240234375, 25.1796875, 26.119140625, 27.05859375, 27.998046875, 28.9375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 9.0, 25.0, 17.0, 13.0, 24.0, 15.0, 35.0, 23.0, 33.0, 27.0, 45.0, 27.0, 37.0, 52.0, 49.0, 57.0, 42.0, 43.0, 39.0, 52.0, 40.0, 37.0, 26.0, 21.0, 28.0, 31.0, 28.0, 25.0, 15.0, 19.0, 22.0, 5.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3671875, -10.0457763671875, -9.724365234375, -9.4029541015625, -9.08154296875, -8.7601318359375, -8.438720703125, -8.1173095703125, -7.7958984375, -7.4744873046875, -7.153076171875, -6.8316650390625, -6.51025390625, -6.1888427734375, -5.867431640625, -5.5460205078125, -5.224609375, -4.9031982421875, -4.581787109375, -4.2603759765625, -3.93896484375, -3.6175537109375, -3.296142578125, -2.9747314453125, -2.6533203125, -2.3319091796875, -2.010498046875, -1.6890869140625, -1.36767578125, -1.0462646484375, -0.724853515625, -0.4034423828125, -0.08203125, 0.2393798828125, 0.560791015625, 0.8822021484375, 1.20361328125, 1.5250244140625, 1.846435546875, 2.1678466796875, 2.4892578125, 2.8106689453125, 3.132080078125, 3.4534912109375, 3.77490234375, 4.0963134765625, 4.417724609375, 4.7391357421875, 5.060546875, 5.3819580078125, 5.703369140625, 6.0247802734375, 6.34619140625, 6.6676025390625, 6.989013671875, 7.3104248046875, 7.6318359375, 7.9532470703125, 8.274658203125, 8.5960693359375, 8.91748046875, 9.2388916015625, 9.560302734375, 9.8817138671875, 10.203125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 2.0, 5.0, 9.0, 9.0, 16.0, 39.0, 30.0, 51.0, 99.0, 95.0, 146.0, 197.0, 299.0, 421.0, 616.0, 930.0, 1345.0, 2066.0, 3308.0, 5361.0, 8880.0, 15862.0, 30091.0, 69581.0, 224058.0, 434130.0, 143072.0, 50760.0, 23964.0, 12612.0, 7486.0, 4452.0, 2878.0, 1866.0, 1229.0, 811.0, 506.0, 363.0, 288.0, 172.0, 137.0, 89.0, 75.0, 38.0, 33.0, 20.0, 19.0, 14.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7734375, -1.7185821533203125, -1.663726806640625, -1.6088714599609375, -1.55401611328125, -1.4991607666015625, -1.444305419921875, -1.3894500732421875, -1.3345947265625, -1.2797393798828125, -1.224884033203125, -1.1700286865234375, -1.11517333984375, -1.0603179931640625, -1.005462646484375, -0.9506072998046875, -0.895751953125, -0.8408966064453125, -0.786041259765625, -0.7311859130859375, -0.67633056640625, -0.6214752197265625, -0.566619873046875, -0.5117645263671875, -0.4569091796875, -0.4020538330078125, -0.347198486328125, -0.2923431396484375, -0.23748779296875, -0.1826324462890625, -0.127777099609375, -0.0729217529296875, -0.01806640625, 0.0367889404296875, 0.091644287109375, 0.1464996337890625, 0.20135498046875, 0.2562103271484375, 0.311065673828125, 0.3659210205078125, 0.4207763671875, 0.4756317138671875, 0.530487060546875, 0.5853424072265625, 0.64019775390625, 0.6950531005859375, 0.749908447265625, 0.8047637939453125, 0.859619140625, 0.9144744873046875, 0.969329833984375, 1.0241851806640625, 1.07904052734375, 1.1338958740234375, 1.188751220703125, 1.2436065673828125, 1.2984619140625, 1.3533172607421875, 1.408172607421875, 1.4630279541015625, 1.51788330078125, 1.5727386474609375, 1.627593994140625, 1.6824493408203125, 1.7373046875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 9.0, 4.0, 8.0, 6.0, 11.0, 17.0, 14.0, 18.0, 23.0, 41.0, 58.0, 56.0, 74.0, 81.0, 95.0, 93.0, 85.0, 60.0, 58.0, 34.0, 29.0, 22.0, 21.0, 19.0, 13.0, 10.0, 9.0, 11.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014543533325195312, -0.00014054030179977417, -0.00013564527034759521, -0.00013075023889541626, -0.0001258552074432373, -0.00012096017599105835, -0.0001160651445388794, -0.00011117011308670044, -0.00010627508163452148, -0.00010138005018234253, -9.648501873016357e-05, -9.158998727798462e-05, -8.669495582580566e-05, -8.179992437362671e-05, -7.690489292144775e-05, -7.20098614692688e-05, -6.711483001708984e-05, -6.221979856491089e-05, -5.7324767112731934e-05, -5.242973566055298e-05, -4.7534704208374023e-05, -4.263967275619507e-05, -3.774464130401611e-05, -3.284960985183716e-05, -2.7954578399658203e-05, -2.3059546947479248e-05, -1.8164515495300293e-05, -1.3269484043121338e-05, -8.374452590942383e-06, -3.4794211387634277e-06, 1.4156103134155273e-06, 6.310641765594482e-06, 1.1205673217773438e-05, 1.6100704669952393e-05, 2.0995736122131348e-05, 2.5890767574310303e-05, 3.078579902648926e-05, 3.568083047866821e-05, 4.057586193084717e-05, 4.547089338302612e-05, 5.036592483520508e-05, 5.526095628738403e-05, 6.015598773956299e-05, 6.505101919174194e-05, 6.99460506439209e-05, 7.484108209609985e-05, 7.973611354827881e-05, 8.463114500045776e-05, 8.952617645263672e-05, 9.442120790481567e-05, 9.931623935699463e-05, 0.00010421127080917358, 0.00010910630226135254, 0.0001140013337135315, 0.00011889636516571045, 0.0001237913966178894, 0.00012868642807006836, 0.00013358145952224731, 0.00013847649097442627, 0.00014337152242660522, 0.00014826655387878418, 0.00015316158533096313, 0.0001580566167831421, 0.00016295164823532104, 0.0001678466796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 10.0, 20.0, 24.0, 31.0, 53.0, 79.0, 117.0, 158.0, 242.0, 383.0, 497.0, 823.0, 1103.0, 1718.0, 2443.0, 3547.0, 5386.0, 8272.0, 12888.0, 20955.0, 35806.0, 70294.0, 183740.0, 382464.0, 163343.0, 64514.0, 33644.0, 19776.0, 12262.0, 7822.0, 5196.0, 3487.0, 2387.0, 1628.0, 1099.0, 788.0, 526.0, 358.0, 220.0, 152.0, 101.0, 63.0, 52.0, 23.0, 17.0, 11.0, 12.0, 9.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3974609375, -1.3515625, -1.3056640625, -1.259765625, -1.2138671875, -1.16796875, -1.1220703125, -1.076171875, -1.0302734375, -0.984375, -0.9384765625, -0.892578125, -0.8466796875, -0.80078125, -0.7548828125, -0.708984375, -0.6630859375, -0.6171875, -0.5712890625, -0.525390625, -0.4794921875, -0.43359375, -0.3876953125, -0.341796875, -0.2958984375, -0.25, -0.2041015625, -0.158203125, -0.1123046875, -0.06640625, -0.0205078125, 0.025390625, 0.0712890625, 0.1171875, 0.1630859375, 0.208984375, 0.2548828125, 0.30078125, 0.3466796875, 0.392578125, 0.4384765625, 0.484375, 0.5302734375, 0.576171875, 0.6220703125, 0.66796875, 0.7138671875, 0.759765625, 0.8056640625, 0.8515625, 0.8974609375, 0.943359375, 0.9892578125, 1.03515625, 1.0810546875, 1.126953125, 1.1728515625, 1.21875, 1.2646484375, 1.310546875, 1.3564453125, 1.40234375, 1.4482421875, 1.494140625, 1.5400390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 4.0, 6.0, 7.0, 6.0, 9.0, 6.0, 10.0, 15.0, 11.0, 17.0, 16.0, 30.0, 23.0, 33.0, 21.0, 71.0, 48.0, 86.0, 69.0, 91.0, 63.0, 49.0, 60.0, 33.0, 31.0, 28.0, 31.0, 22.0, 13.0, 17.0, 11.0, 13.0, 8.0, 4.0, 2.0, 11.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4070625305175781, -0.39249420166015625, -0.3779258728027344, -0.3633575439453125, -0.3487892150878906, -0.33422088623046875, -0.3196525573730469, -0.305084228515625, -0.2905158996582031, -0.27594757080078125, -0.2613792419433594, -0.2468109130859375, -0.23224258422851562, -0.21767425537109375, -0.20310592651367188, -0.18853759765625, -0.17396926879882812, -0.15940093994140625, -0.14483261108398438, -0.1302642822265625, -0.11569595336914062, -0.10112762451171875, -0.08655929565429688, -0.071990966796875, -0.057422637939453125, -0.04285430908203125, -0.028285980224609375, -0.0137176513671875, 0.000850677490234375, 0.01541900634765625, 0.029987335205078125, 0.0445556640625, 0.059123992919921875, 0.07369232177734375, 0.08826065063476562, 0.1028289794921875, 0.11739730834960938, 0.13196563720703125, 0.14653396606445312, 0.161102294921875, 0.17567062377929688, 0.19023895263671875, 0.20480728149414062, 0.2193756103515625, 0.23394393920898438, 0.24851226806640625, 0.2630805969238281, 0.27764892578125, 0.2922172546386719, 0.30678558349609375, 0.3213539123535156, 0.3359222412109375, 0.3504905700683594, 0.36505889892578125, 0.3796272277832031, 0.394195556640625, 0.4087638854980469, 0.42333221435546875, 0.4379005432128906, 0.4524688720703125, 0.4670372009277344, 0.48160552978515625, 0.4961738586425781, 0.5107421875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 7.0, 12.0, 12.0, 15.0, 21.0, 29.0, 33.0, 46.0, 61.0, 65.0, 87.0, 76.0, 84.0, 84.0, 56.0, 51.0, 48.0, 32.0, 33.0, 23.0, 18.0, 12.0, 13.0, 13.0, 11.0, 6.0, 5.0, 1.0, 9.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.365304946899414, -20.722469329833984, -20.079633712768555, -19.436798095703125, -18.793960571289062, -18.151124954223633, -17.508289337158203, -16.865453720092773, -16.222618103027344, -15.579782485961914, -14.936946868896484, -14.294110298156738, -13.651274681091309, -13.008439064025879, -12.365602493286133, -11.722766876220703, -11.079931259155273, -10.437095642089844, -9.794260025024414, -9.151423454284668, -8.508587837219238, -7.865752220153809, -7.222916126251221, -6.580080032348633, -5.937244415283203, -5.294408798217773, -4.6515727043151855, -4.008736610412598, -3.365900993347168, -2.723065137863159, -2.0802292823791504, -1.4373931884765625, -0.7945575714111328, -0.15172171592712402, 0.49111413955688477, 1.1339499950408936, 1.7767858505249023, 2.419621706008911, 3.06245756149292, 3.705293655395508, 4.3481292724609375, 4.990964889526367, 5.633800983428955, 6.276637077331543, 6.919472694396973, 7.562308311462402, 8.205144882202148, 8.847980499267578, 9.490816116333008, 10.133651733398438, 10.776487350463867, 11.419323921203613, 12.062159538269043, 12.704995155334473, 13.347831726074219, 13.990667343139648, 14.633502960205078, 15.276338577270508, 15.919174194335938, 16.562009811401367, 17.204845428466797, 17.84768295288086, 18.49051856994629, 19.13335418701172, 19.77618980407715]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 10.0, 11.0, 16.0, 10.0, 14.0, 17.0, 18.0, 21.0, 18.0, 29.0, 26.0, 26.0, 27.0, 28.0, 45.0, 42.0, 34.0, 34.0, 25.0, 28.0, 36.0, 34.0, 42.0, 36.0, 39.0, 31.0, 39.0, 21.0, 31.0, 29.0, 22.0, 24.0, 22.0, 9.0, 11.0, 14.0, 14.0, 9.0, 8.0, 9.0, 5.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.79038143157959, -13.354720115661621, -12.919058799743652, -12.483397483825684, -12.047736167907715, -11.612074851989746, -11.176413536071777, -10.740752220153809, -10.30509090423584, -9.869429588317871, -9.433768272399902, -8.998106956481934, -8.562445640563965, -8.126784324645996, -7.691123008728027, -7.255461692810059, -6.81980037689209, -6.384139060974121, -5.948477745056152, -5.512816429138184, -5.077155113220215, -4.641493797302246, -4.205832481384277, -3.7701711654663086, -3.33450984954834, -2.898848533630371, -2.4631872177124023, -2.0275259017944336, -1.5918645858764648, -1.156203269958496, -0.7205419540405273, -0.2848806381225586, 0.15077972412109375, 0.5864410400390625, 1.0221023559570312, 1.457763671875, 1.8934249877929688, 2.3290863037109375, 2.7647476196289062, 3.200408935546875, 3.6360702514648438, 4.0717315673828125, 4.507392883300781, 4.94305419921875, 5.378715515136719, 5.8143768310546875, 6.250038146972656, 6.685699462890625, 7.121360778808594, 7.5570220947265625, 7.992683410644531, 8.4283447265625, 8.864006042480469, 9.299667358398438, 9.735328674316406, 10.170989990234375, 10.606651306152344, 11.042312622070312, 11.477973937988281, 11.91363525390625, 12.349296569824219, 12.784957885742188, 13.220619201660156, 13.656280517578125, 14.091941833496094]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 13.0, 15.0, 28.0, 67.0, 86.0, 120.0, 184.0, 290.0, 357.0, 568.0, 820.0, 1209.0, 1758.0, 2453.0, 3548.0, 5262.0, 7853.0, 11815.0, 18151.0, 28738.0, 48005.0, 82419.0, 165524.0, 555010.0, 1598721.0, 1097769.0, 288944.0, 110797.0, 61421.0, 36198.0, 22375.0, 14381.0, 9370.0, 6178.0, 4229.0, 2977.0, 2090.0, 1401.0, 977.0, 685.0, 483.0, 339.0, 219.0, 161.0, 102.0, 65.0, 37.0, 27.0, 12.0, 10.0, 4.0, 7.0, 9.0, 3.0, 0.0, 2.0], "bins": [-24.671875, -23.918701171875, -23.16552734375, -22.412353515625, -21.6591796875, -20.906005859375, -20.15283203125, -19.399658203125, -18.646484375, -17.893310546875, -17.14013671875, -16.386962890625, -15.6337890625, -14.880615234375, -14.12744140625, -13.374267578125, -12.62109375, -11.867919921875, -11.11474609375, -10.361572265625, -9.6083984375, -8.855224609375, -8.10205078125, -7.348876953125, -6.595703125, -5.842529296875, -5.08935546875, -4.336181640625, -3.5830078125, -2.829833984375, -2.07666015625, -1.323486328125, -0.5703125, 0.182861328125, 0.93603515625, 1.689208984375, 2.4423828125, 3.195556640625, 3.94873046875, 4.701904296875, 5.455078125, 6.208251953125, 6.96142578125, 7.714599609375, 8.4677734375, 9.220947265625, 9.97412109375, 10.727294921875, 11.48046875, 12.233642578125, 12.98681640625, 13.739990234375, 14.4931640625, 15.246337890625, 15.99951171875, 16.752685546875, 17.505859375, 18.259033203125, 19.01220703125, 19.765380859375, 20.5185546875, 21.271728515625, 22.02490234375, 22.778076171875, 23.53125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 10.0, 8.0, 8.0, 4.0, 10.0, 11.0, 13.0, 13.0, 17.0, 15.0, 24.0, 9.0, 22.0, 33.0, 26.0, 29.0, 22.0, 36.0, 22.0, 39.0, 27.0, 32.0, 28.0, 28.0, 28.0, 37.0, 31.0, 28.0, 34.0, 36.0, 27.0, 32.0, 31.0, 23.0, 23.0, 16.0, 24.0, 23.0, 13.0, 16.0, 18.0, 12.0, 7.0, 8.0, 7.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.0546875, -9.73046875, -9.40625, -9.08203125, -8.7578125, -8.43359375, -8.109375, -7.78515625, -7.4609375, -7.13671875, -6.8125, -6.48828125, -6.1640625, -5.83984375, -5.515625, -5.19140625, -4.8671875, -4.54296875, -4.21875, -3.89453125, -3.5703125, -3.24609375, -2.921875, -2.59765625, -2.2734375, -1.94921875, -1.625, -1.30078125, -0.9765625, -0.65234375, -0.328125, -0.00390625, 0.3203125, 0.64453125, 0.96875, 1.29296875, 1.6171875, 1.94140625, 2.265625, 2.58984375, 2.9140625, 3.23828125, 3.5625, 3.88671875, 4.2109375, 4.53515625, 4.859375, 5.18359375, 5.5078125, 5.83203125, 6.15625, 6.48046875, 6.8046875, 7.12890625, 7.453125, 7.77734375, 8.1015625, 8.42578125, 8.75, 9.07421875, 9.3984375, 9.72265625, 10.046875, 10.37109375, 10.6953125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 2.0, 9.0, 10.0, 12.0, 14.0, 24.0, 26.0, 56.0, 85.0, 116.0, 172.0, 265.0, 409.0, 626.0, 895.0, 1329.0, 2067.0, 3235.0, 4946.0, 7835.0, 12902.0, 21366.0, 36599.0, 64735.0, 120876.0, 245609.0, 576733.0, 1659496.0, 792425.0, 308942.0, 147140.0, 76961.0, 42894.0, 25044.0, 14918.0, 9210.0, 5704.0, 3650.0, 2336.0, 1562.0, 997.0, 659.0, 425.0, 323.0, 203.0, 138.0, 100.0, 66.0, 45.0, 29.0, 22.0, 15.0, 8.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-23.140625, -22.409423828125, -21.67822265625, -20.947021484375, -20.2158203125, -19.484619140625, -18.75341796875, -18.022216796875, -17.291015625, -16.559814453125, -15.82861328125, -15.097412109375, -14.3662109375, -13.635009765625, -12.90380859375, -12.172607421875, -11.44140625, -10.710205078125, -9.97900390625, -9.247802734375, -8.5166015625, -7.785400390625, -7.05419921875, -6.322998046875, -5.591796875, -4.860595703125, -4.12939453125, -3.398193359375, -2.6669921875, -1.935791015625, -1.20458984375, -0.473388671875, 0.2578125, 0.989013671875, 1.72021484375, 2.451416015625, 3.1826171875, 3.913818359375, 4.64501953125, 5.376220703125, 6.107421875, 6.838623046875, 7.56982421875, 8.301025390625, 9.0322265625, 9.763427734375, 10.49462890625, 11.225830078125, 11.95703125, 12.688232421875, 13.41943359375, 14.150634765625, 14.8818359375, 15.613037109375, 16.34423828125, 17.075439453125, 17.806640625, 18.537841796875, 19.26904296875, 20.000244140625, 20.7314453125, 21.462646484375, 22.19384765625, 22.925048828125, 23.65625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 9.0, 11.0, 14.0, 25.0, 25.0, 36.0, 26.0, 56.0, 69.0, 66.0, 89.0, 111.0, 131.0, 163.0, 184.0, 259.0, 396.0, 512.0, 418.0, 299.0, 225.0, 191.0, 154.0, 110.0, 84.0, 82.0, 52.0, 56.0, 40.0, 30.0, 29.0, 20.0, 22.0, 16.0, 18.0, 6.0, 3.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.3125, -8.06536865234375, -7.8182373046875, -7.57110595703125, -7.323974609375, -7.07684326171875, -6.8297119140625, -6.58258056640625, -6.33544921875, -6.08831787109375, -5.8411865234375, -5.59405517578125, -5.346923828125, -5.09979248046875, -4.8526611328125, -4.60552978515625, -4.3583984375, -4.11126708984375, -3.8641357421875, -3.61700439453125, -3.369873046875, -3.12274169921875, -2.8756103515625, -2.62847900390625, -2.38134765625, -2.13421630859375, -1.8870849609375, -1.63995361328125, -1.392822265625, -1.14569091796875, -0.8985595703125, -0.65142822265625, -0.404296875, -0.15716552734375, 0.0899658203125, 0.33709716796875, 0.584228515625, 0.83135986328125, 1.0784912109375, 1.32562255859375, 1.57275390625, 1.81988525390625, 2.0670166015625, 2.31414794921875, 2.561279296875, 2.80841064453125, 3.0555419921875, 3.30267333984375, 3.5498046875, 3.79693603515625, 4.0440673828125, 4.29119873046875, 4.538330078125, 4.78546142578125, 5.0325927734375, 5.27972412109375, 5.52685546875, 5.77398681640625, 6.0211181640625, 6.26824951171875, 6.515380859375, 6.76251220703125, 7.0096435546875, 7.25677490234375, 7.50390625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 15.0, 12.0, 10.0, 7.0, 21.0, 24.0, 34.0, 49.0, 35.0, 58.0, 78.0, 72.0, 81.0, 84.0, 61.0, 64.0, 54.0, 42.0, 35.0, 31.0, 27.0, 19.0, 10.0, 8.0, 10.0, 10.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.844694137573242, -20.244922637939453, -19.64514923095703, -19.04537582397461, -18.44560432434082, -17.84583282470703, -17.24605941772461, -16.646286010742188, -16.0465145111084, -15.446742057800293, -14.846969604492188, -14.247197151184082, -13.647424697875977, -13.047652244567871, -12.447879791259766, -11.84810733795166, -11.248334884643555, -10.64856243133545, -10.048789978027344, -9.449017524719238, -8.849245071411133, -8.249472618103027, -7.649700164794922, -7.049927711486816, -6.450155258178711, -5.8503828048706055, -5.2506103515625, -4.6508378982543945, -4.051065444946289, -3.4512929916381836, -2.851520538330078, -2.2517480850219727, -1.6519756317138672, -1.0522031784057617, -0.45243072509765625, 0.14734172821044922, 0.7471141815185547, 1.3468866348266602, 1.9466590881347656, 2.546431541442871, 3.1462039947509766, 3.745976448059082, 4.3457489013671875, 4.945521354675293, 5.545293807983398, 6.145066261291504, 6.744838714599609, 7.344611167907715, 7.94438362121582, 8.544156074523926, 9.143928527832031, 9.743700981140137, 10.343473434448242, 10.943245887756348, 11.543018341064453, 12.142790794372559, 12.742563247680664, 13.34233570098877, 13.942108154296875, 14.54188060760498, 15.141653060913086, 15.741425514221191, 16.341197967529297, 16.94097137451172, 17.540742874145508]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 9.0, 8.0, 10.0, 13.0, 17.0, 15.0, 20.0, 38.0, 24.0, 40.0, 34.0, 27.0, 30.0, 32.0, 39.0, 32.0, 36.0, 36.0, 46.0, 37.0, 43.0, 24.0, 32.0, 49.0, 35.0, 32.0, 28.0, 31.0, 29.0, 18.0, 11.0, 15.0, 11.0, 16.0, 14.0, 13.0, 6.0, 9.0, 9.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-13.738736152648926, -13.312158584594727, -12.885580062866211, -12.459002494812012, -12.032424926757812, -11.605846405029297, -11.179268836975098, -10.752691268920898, -10.3261137008667, -9.8995361328125, -9.472957611083984, -9.046380043029785, -8.619802474975586, -8.19322395324707, -7.766646385192871, -7.340068817138672, -6.9134907722473145, -6.486912727355957, -6.060335159301758, -5.6337571144104, -5.207179546356201, -4.780601501464844, -4.3540239334106445, -3.927445888519287, -3.500868082046509, -3.0742902755737305, -2.647712469100952, -2.221134662628174, -1.794556736946106, -1.367978811264038, -0.9414010047912598, -0.5148231983184814, -0.08824539184570312, 0.3383324444293976, 0.7649102807044983, 1.1914881467819214, 1.6180659532546997, 2.0446438789367676, 2.471221685409546, 2.897799491882324, 3.3243772983551025, 3.750955104827881, 4.177533149719238, 4.6041107177734375, 5.030688762664795, 5.457266807556152, 5.883844375610352, 6.310421943664551, 6.736999988555908, 7.163578033447266, 7.590155601501465, 8.016733169555664, 8.44331169128418, 8.869889259338379, 9.296466827392578, 9.723045349121094, 10.149622917175293, 10.576200485229492, 11.002779006958008, 11.429356575012207, 11.855934143066406, 12.282512664794922, 12.709090232849121, 13.13566780090332, 13.56224536895752]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 9.0, 8.0, 15.0, 14.0, 34.0, 45.0, 71.0, 100.0, 140.0, 212.0, 323.0, 464.0, 712.0, 1111.0, 1658.0, 2588.0, 3971.0, 6166.0, 9717.0, 15420.0, 24509.0, 40364.0, 68308.0, 121321.0, 307657.0, 198624.0, 97381.0, 56533.0, 33908.0, 20826.0, 12931.0, 8318.0, 5262.0, 3444.0, 2165.0, 1439.0, 926.0, 613.0, 414.0, 289.0, 180.0, 123.0, 72.0, 62.0, 35.0, 28.0, 15.0, 18.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.16015625, -4.0294189453125, -3.898681640625, -3.7679443359375, -3.63720703125, -3.5064697265625, -3.375732421875, -3.2449951171875, -3.1142578125, -2.9835205078125, -2.852783203125, -2.7220458984375, -2.59130859375, -2.4605712890625, -2.329833984375, -2.1990966796875, -2.068359375, -1.9376220703125, -1.806884765625, -1.6761474609375, -1.54541015625, -1.4146728515625, -1.283935546875, -1.1531982421875, -1.0224609375, -0.8917236328125, -0.760986328125, -0.6302490234375, -0.49951171875, -0.3687744140625, -0.238037109375, -0.1072998046875, 0.0234375, 0.1541748046875, 0.284912109375, 0.4156494140625, 0.54638671875, 0.6771240234375, 0.807861328125, 0.9385986328125, 1.0693359375, 1.2000732421875, 1.330810546875, 1.4615478515625, 1.59228515625, 1.7230224609375, 1.853759765625, 1.9844970703125, 2.115234375, 2.2459716796875, 2.376708984375, 2.5074462890625, 2.63818359375, 2.7689208984375, 2.899658203125, 3.0303955078125, 3.1611328125, 3.2918701171875, 3.422607421875, 3.5533447265625, 3.68408203125, 3.8148193359375, 3.945556640625, 4.0762939453125, 4.20703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 3.0, 3.0, 2.0, 4.0, 8.0, 9.0, 16.0, 10.0, 16.0, 21.0, 28.0, 26.0, 30.0, 35.0, 42.0, 36.0, 39.0, 41.0, 40.0, 34.0, 42.0, 40.0, 57.0, 38.0, 46.0, 36.0, 45.0, 41.0, 26.0, 30.0, 29.0, 26.0, 18.0, 19.0, 17.0, 14.0, 9.0, 10.0, 9.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.265625, -15.760986328125, -15.25634765625, -14.751708984375, -14.2470703125, -13.742431640625, -13.23779296875, -12.733154296875, -12.228515625, -11.723876953125, -11.21923828125, -10.714599609375, -10.2099609375, -9.705322265625, -9.20068359375, -8.696044921875, -8.19140625, -7.686767578125, -7.18212890625, -6.677490234375, -6.1728515625, -5.668212890625, -5.16357421875, -4.658935546875, -4.154296875, -3.649658203125, -3.14501953125, -2.640380859375, -2.1357421875, -1.631103515625, -1.12646484375, -0.621826171875, -0.1171875, 0.387451171875, 0.89208984375, 1.396728515625, 1.9013671875, 2.406005859375, 2.91064453125, 3.415283203125, 3.919921875, 4.424560546875, 4.92919921875, 5.433837890625, 5.9384765625, 6.443115234375, 6.94775390625, 7.452392578125, 7.95703125, 8.461669921875, 8.96630859375, 9.470947265625, 9.9755859375, 10.480224609375, 10.98486328125, 11.489501953125, 11.994140625, 12.498779296875, 13.00341796875, 13.508056640625, 14.0126953125, 14.517333984375, 15.02197265625, 15.526611328125, 16.03125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 16.0, 18.0, 34.0, 32.0, 54.0, 85.0, 114.0, 145.0, 195.0, 286.0, 390.0, 581.0, 744.0, 1075.0, 1505.0, 2217.0, 3106.0, 4607.0, 6698.0, 10123.0, 14952.0, 23405.0, 36578.0, 59810.0, 107337.0, 245791.0, 251801.0, 108771.0, 60140.0, 36992.0, 23515.0, 15302.0, 10189.0, 6768.0, 4583.0, 3153.0, 2204.0, 1499.0, 1071.0, 742.0, 509.0, 418.0, 303.0, 193.0, 145.0, 98.0, 71.0, 47.0, 43.0, 32.0, 18.0, 14.0, 12.0, 8.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.951171875, -3.827728271484375, -3.70428466796875, -3.580841064453125, -3.4573974609375, -3.333953857421875, -3.21051025390625, -3.087066650390625, -2.963623046875, -2.840179443359375, -2.71673583984375, -2.593292236328125, -2.4698486328125, -2.346405029296875, -2.22296142578125, -2.099517822265625, -1.97607421875, -1.852630615234375, -1.72918701171875, -1.605743408203125, -1.4822998046875, -1.358856201171875, -1.23541259765625, -1.111968994140625, -0.988525390625, -0.865081787109375, -0.74163818359375, -0.618194580078125, -0.4947509765625, -0.371307373046875, -0.24786376953125, -0.124420166015625, -0.0009765625, 0.122467041015625, 0.24591064453125, 0.369354248046875, 0.4927978515625, 0.616241455078125, 0.73968505859375, 0.863128662109375, 0.986572265625, 1.110015869140625, 1.23345947265625, 1.356903076171875, 1.4803466796875, 1.603790283203125, 1.72723388671875, 1.850677490234375, 1.97412109375, 2.097564697265625, 2.22100830078125, 2.344451904296875, 2.4678955078125, 2.591339111328125, 2.71478271484375, 2.838226318359375, 2.961669921875, 3.085113525390625, 3.20855712890625, 3.332000732421875, 3.4554443359375, 3.578887939453125, 3.70233154296875, 3.825775146484375, 3.94921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 9.0, 11.0, 10.0, 10.0, 15.0, 17.0, 17.0, 24.0, 19.0, 22.0, 26.0, 24.0, 17.0, 36.0, 42.0, 43.0, 36.0, 40.0, 43.0, 47.0, 28.0, 32.0, 38.0, 47.0, 41.0, 41.0, 34.0, 29.0, 25.0, 27.0, 21.0, 22.0, 14.0, 18.0, 8.0, 8.0, 7.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.84375, -9.550048828125, -9.25634765625, -8.962646484375, -8.6689453125, -8.375244140625, -8.08154296875, -7.787841796875, -7.494140625, -7.200439453125, -6.90673828125, -6.613037109375, -6.3193359375, -6.025634765625, -5.73193359375, -5.438232421875, -5.14453125, -4.850830078125, -4.55712890625, -4.263427734375, -3.9697265625, -3.676025390625, -3.38232421875, -3.088623046875, -2.794921875, -2.501220703125, -2.20751953125, -1.913818359375, -1.6201171875, -1.326416015625, -1.03271484375, -0.739013671875, -0.4453125, -0.151611328125, 0.14208984375, 0.435791015625, 0.7294921875, 1.023193359375, 1.31689453125, 1.610595703125, 1.904296875, 2.197998046875, 2.49169921875, 2.785400390625, 3.0791015625, 3.372802734375, 3.66650390625, 3.960205078125, 4.25390625, 4.547607421875, 4.84130859375, 5.135009765625, 5.4287109375, 5.722412109375, 6.01611328125, 6.309814453125, 6.603515625, 6.897216796875, 7.19091796875, 7.484619140625, 7.7783203125, 8.072021484375, 8.36572265625, 8.659423828125, 8.953125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 4.0, 5.0, 5.0, 7.0, 10.0, 17.0, 31.0, 44.0, 71.0, 81.0, 116.0, 164.0, 272.0, 395.0, 577.0, 773.0, 1087.0, 1535.0, 2134.0, 3293.0, 4810.0, 7174.0, 11483.0, 18585.0, 32505.0, 63731.0, 148147.0, 348172.0, 213296.0, 85790.0, 41637.0, 22656.0, 13497.0, 8577.0, 5705.0, 3689.0, 2556.0, 1729.0, 1232.0, 873.0, 615.0, 445.0, 297.0, 226.0, 140.0, 116.0, 95.0, 56.0, 37.0, 25.0, 22.0, 15.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.007549285888671875, -0.007303297519683838, -0.007057309150695801, -0.006811320781707764, -0.0065653324127197266, -0.0063193440437316895, -0.006073355674743652, -0.005827367305755615, -0.005581378936767578, -0.005335390567779541, -0.005089402198791504, -0.004843413829803467, -0.00459742546081543, -0.004351437091827393, -0.0041054487228393555, -0.0038594603538513184, -0.0036134719848632812, -0.003367483615875244, -0.003121495246887207, -0.00287550687789917, -0.002629518508911133, -0.0023835301399230957, -0.0021375417709350586, -0.0018915534019470215, -0.0016455650329589844, -0.0013995766639709473, -0.0011535882949829102, -0.000907599925994873, -0.0006616115570068359, -0.00041562318801879883, -0.00016963481903076172, 7.635354995727539e-05, 0.0003223419189453125, 0.0005683302879333496, 0.0008143186569213867, 0.0010603070259094238, 0.001306295394897461, 0.001552283763885498, 0.0017982721328735352, 0.0020442605018615723, 0.0022902488708496094, 0.0025362372398376465, 0.0027822256088256836, 0.0030282139778137207, 0.003274202346801758, 0.003520190715789795, 0.003766179084777832, 0.004012167453765869, 0.004258155822753906, 0.004504144191741943, 0.0047501325607299805, 0.004996120929718018, 0.005242109298706055, 0.005488097667694092, 0.005734086036682129, 0.005980074405670166, 0.006226062774658203, 0.00647205114364624, 0.006718039512634277, 0.0069640278816223145, 0.0072100162506103516, 0.007456004619598389, 0.007701992988586426, 0.007947981357574463, 0.0081939697265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 7.0, 11.0, 7.0, 9.0, 14.0, 7.0, 18.0, 26.0, 22.0, 30.0, 44.0, 41.0, 60.0, 54.0, 62.0, 77.0, 72.0, 57.0, 57.0, 50.0, 47.0, 41.0, 32.0, 22.0, 21.0, 17.0, 16.0, 7.0, 9.0, 15.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.046627044677734e-06, -7.80448317527771e-06, -7.5623393058776855e-06, -7.320195436477661e-06, -7.078051567077637e-06, -6.835907697677612e-06, -6.593763828277588e-06, -6.3516199588775635e-06, -6.109476089477539e-06, -5.867332220077515e-06, -5.62518835067749e-06, -5.383044481277466e-06, -5.140900611877441e-06, -4.898756742477417e-06, -4.656612873077393e-06, -4.414469003677368e-06, -4.172325134277344e-06, -3.930181264877319e-06, -3.688037395477295e-06, -3.4458935260772705e-06, -3.203749656677246e-06, -2.9616057872772217e-06, -2.7194619178771973e-06, -2.477318048477173e-06, -2.2351741790771484e-06, -1.993030309677124e-06, -1.7508864402770996e-06, -1.5087425708770752e-06, -1.2665987014770508e-06, -1.0244548320770264e-06, -7.82310962677002e-07, -5.401670932769775e-07, -2.980232238769531e-07, -5.587935447692871e-08, 1.862645149230957e-07, 4.284083843231201e-07, 6.705522537231445e-07, 9.126961231231689e-07, 1.1548399925231934e-06, 1.3969838619232178e-06, 1.6391277313232422e-06, 1.8812716007232666e-06, 2.123415470123291e-06, 2.3655593395233154e-06, 2.60770320892334e-06, 2.8498470783233643e-06, 3.0919909477233887e-06, 3.334134817123413e-06, 3.5762786865234375e-06, 3.818422555923462e-06, 4.060566425323486e-06, 4.302710294723511e-06, 4.544854164123535e-06, 4.7869980335235596e-06, 5.029141902923584e-06, 5.271285772323608e-06, 5.513429641723633e-06, 5.755573511123657e-06, 5.997717380523682e-06, 6.239861249923706e-06, 6.4820051193237305e-06, 6.724148988723755e-06, 6.966292858123779e-06, 7.208436727523804e-06, 7.450580596923828e-06]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 4.0, 14.0, 23.0, 31.0, 39.0, 59.0, 94.0, 142.0, 162.0, 270.0, 364.0, 534.0, 856.0, 1293.0, 2085.0, 3364.0, 5340.0, 8508.0, 14495.0, 25654.0, 48109.0, 99857.0, 232755.0, 319176.0, 140516.0, 64808.0, 33162.0, 18323.0, 10653.0, 6497.0, 4104.0, 2551.0, 1595.0, 1005.0, 676.0, 429.0, 274.0, 219.0, 166.0, 82.0, 86.0, 53.0, 37.0, 27.0, 19.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.00814056396484375, -0.007887840270996094, -0.0076351165771484375, -0.007382392883300781, -0.007129669189453125, -0.006876945495605469, -0.0066242218017578125, -0.006371498107910156, -0.0061187744140625, -0.005866050720214844, -0.0056133270263671875, -0.005360603332519531, -0.005107879638671875, -0.004855155944824219, -0.0046024322509765625, -0.004349708557128906, -0.00409698486328125, -0.0038442611694335938, -0.0035915374755859375, -0.0033388137817382812, -0.003086090087890625, -0.0028333663940429688, -0.0025806427001953125, -0.0023279190063476562, -0.0020751953125, -0.0018224716186523438, -0.0015697479248046875, -0.0013170242309570312, -0.001064300537109375, -0.0008115768432617188, -0.0005588531494140625, -0.00030612945556640625, -5.340576171875e-05, 0.00019931793212890625, 0.0004520416259765625, 0.0007047653198242188, 0.000957489013671875, 0.0012102127075195312, 0.0014629364013671875, 0.0017156600952148438, 0.0019683837890625, 0.0022211074829101562, 0.0024738311767578125, 0.0027265548706054688, 0.002979278564453125, 0.0032320022583007812, 0.0034847259521484375, 0.0037374496459960938, 0.00399017333984375, 0.004242897033691406, 0.0044956207275390625, 0.004748344421386719, 0.005001068115234375, 0.005253791809082031, 0.0055065155029296875, 0.005759239196777344, 0.006011962890625, 0.006264686584472656, 0.0065174102783203125, 0.006770133972167969, 0.007022857666015625, 0.007275581359863281, 0.0075283050537109375, 0.007781028747558594, 0.00803375244140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 7.0, 7.0, 13.0, 13.0, 11.0, 16.0, 18.0, 13.0, 17.0, 30.0, 39.0, 56.0, 53.0, 56.0, 76.0, 96.0, 77.0, 55.0, 55.0, 33.0, 35.0, 35.0, 33.0, 22.0, 19.0, 18.0, 25.0, 3.0, 19.0, 4.0, 10.0, 0.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0024623870849609375, -0.0023846328258514404, -0.0023068785667419434, -0.0022291243076324463, -0.0021513700485229492, -0.002073615789413452, -0.001995861530303955, -0.001918107271194458, -0.001840353012084961, -0.0017625987529754639, -0.0016848444938659668, -0.0016070902347564697, -0.0015293359756469727, -0.0014515817165374756, -0.0013738274574279785, -0.0012960731983184814, -0.0012183189392089844, -0.0011405646800994873, -0.0010628104209899902, -0.0009850561618804932, -0.0009073019027709961, -0.000829547643661499, -0.000751793384552002, -0.0006740391254425049, -0.0005962848663330078, -0.0005185306072235107, -0.00044077634811401367, -0.0003630220890045166, -0.00028526782989501953, -0.00020751357078552246, -0.0001297593116760254, -5.200505256652832e-05, 2.574920654296875e-05, 0.00010350346565246582, 0.0001812577247619629, 0.00025901198387145996, 0.00033676624298095703, 0.0004145205020904541, 0.0004922747611999512, 0.0005700290203094482, 0.0006477832794189453, 0.0007255375385284424, 0.0008032917976379395, 0.0008810460567474365, 0.0009588003158569336, 0.0010365545749664307, 0.0011143088340759277, 0.0011920630931854248, 0.0012698173522949219, 0.001347571611404419, 0.001425325870513916, 0.001503080129623413, 0.0015808343887329102, 0.0016585886478424072, 0.0017363429069519043, 0.0018140971660614014, 0.0018918514251708984, 0.0019696056842803955, 0.0020473599433898926, 0.0021251142024993896, 0.0022028684616088867, 0.002280622720718384, 0.002358376979827881, 0.002436131238937378, 0.002513885498046875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 13.0, 13.0, 8.0, 10.0, 25.0, 21.0, 27.0, 51.0, 37.0, 54.0, 84.0, 69.0, 84.0, 88.0, 56.0, 64.0, 58.0, 41.0, 36.0, 34.0, 22.0, 17.0, 10.0, 14.0, 7.0, 11.0, 5.0, 8.0, 1.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-20.903148651123047, -20.30223274230957, -19.701318740844727, -19.10040283203125, -18.499488830566406, -17.89857292175293, -17.297658920288086, -16.69674301147461, -16.095829010009766, -15.494914054870605, -14.893999099731445, -14.293084144592285, -13.692169189453125, -13.091254234313965, -12.490339279174805, -11.889423370361328, -11.288508415222168, -10.687593460083008, -10.086678504943848, -9.485763549804688, -8.884848594665527, -8.283933639526367, -7.683018207550049, -7.082103252410889, -6.4811882972717285, -5.880273342132568, -5.279358386993408, -4.67844295501709, -4.07752799987793, -3.4766132831573486, -2.8756980895996094, -2.274783134460449, -1.673868179321289, -1.072953224182129, -0.4720381498336792, 0.1288769245147705, 0.7297918796539307, 1.3307068347930908, 1.93162202835083, 2.5325369834899902, 3.1334519386291504, 3.7343668937683105, 4.335281848907471, 4.936197280883789, 5.537112236022949, 6.138027191162109, 6.7389421463012695, 7.33985710144043, 7.94077205657959, 8.54168701171875, 9.14260196685791, 9.74351692199707, 10.34443187713623, 10.94534683227539, 11.546262741088867, 12.147176742553711, 12.748092651367188, 13.349007606506348, 13.949922561645508, 14.550837516784668, 15.151752471923828, 15.752667427062988, 16.35358238220215, 16.954498291015625, 17.55541229248047]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 7.0, 11.0, 13.0, 16.0, 16.0, 19.0, 38.0, 25.0, 39.0, 36.0, 26.0, 30.0, 33.0, 36.0, 34.0, 34.0, 37.0, 47.0, 35.0, 44.0, 26.0, 31.0, 47.0, 33.0, 36.0, 30.0, 29.0, 30.0, 17.0, 11.0, 15.0, 12.0, 15.0, 16.0, 11.0, 6.0, 9.0, 9.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-13.66439437866211, -13.24014949798584, -12.81590461730957, -12.3916597366333, -11.967414855957031, -11.543169975280762, -11.118925094604492, -10.694681167602539, -10.270435333251953, -9.846190452575684, -9.421945571899414, -8.997700691223145, -8.573455810546875, -8.149210929870605, -7.724966526031494, -7.300721645355225, -6.876477241516113, -6.452232360839844, -6.027987480163574, -5.603742599487305, -5.179497718811035, -4.755252838134766, -4.331008434295654, -3.9067635536193848, -3.4825186729431152, -3.0582737922668457, -2.634028911590576, -2.2097842693328857, -1.7855393886566162, -1.3612945079803467, -0.9370498657226562, -0.5128049850463867, -0.0885610580444336, 0.33568376302719116, 0.7599285840988159, 1.184173345565796, 1.6084182262420654, 2.032663106918335, 2.4569077491760254, 2.881152629852295, 3.3053975105285645, 3.729642391204834, 4.1538872718811035, 4.578131675720215, 5.002376556396484, 5.426621437072754, 5.850866317749023, 6.275111198425293, 6.6993560791015625, 7.123600959777832, 7.547845840454102, 7.972090721130371, 8.39633560180664, 8.82058048248291, 9.24482536315918, 9.669069290161133, 10.093315124511719, 10.517560005187988, 10.941804885864258, 11.366049766540527, 11.790294647216797, 12.214539527893066, 12.638784408569336, 13.063028335571289, 13.487273216247559]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 10.0, 14.0, 28.0, 37.0, 63.0, 91.0, 120.0, 195.0, 277.0, 478.0, 766.0, 1202.0, 1867.0, 2911.0, 4732.0, 7389.0, 12242.0, 20062.0, 34003.0, 60930.0, 115368.0, 207599.0, 237756.0, 152065.0, 79526.0, 43480.0, 25387.0, 14910.0, 9368.0, 5810.0, 3595.0, 2293.0, 1426.0, 917.0, 577.0, 378.0, 250.0, 145.0, 101.0, 62.0, 43.0, 26.0, 20.0, 9.0, 9.0, 10.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.265625, -26.36328125, -25.4609375, -24.55859375, -23.65625, -22.75390625, -21.8515625, -20.94921875, -20.046875, -19.14453125, -18.2421875, -17.33984375, -16.4375, -15.53515625, -14.6328125, -13.73046875, -12.828125, -11.92578125, -11.0234375, -10.12109375, -9.21875, -8.31640625, -7.4140625, -6.51171875, -5.609375, -4.70703125, -3.8046875, -2.90234375, -2.0, -1.09765625, -0.1953125, 0.70703125, 1.609375, 2.51171875, 3.4140625, 4.31640625, 5.21875, 6.12109375, 7.0234375, 7.92578125, 8.828125, 9.73046875, 10.6328125, 11.53515625, 12.4375, 13.33984375, 14.2421875, 15.14453125, 16.046875, 16.94921875, 17.8515625, 18.75390625, 19.65625, 20.55859375, 21.4609375, 22.36328125, 23.265625, 24.16796875, 25.0703125, 25.97265625, 26.875, 27.77734375, 28.6796875, 29.58203125, 30.484375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 3.0, 15.0, 11.0, 19.0, 21.0, 20.0, 34.0, 45.0, 31.0, 37.0, 27.0, 45.0, 27.0, 47.0, 38.0, 51.0, 43.0, 40.0, 31.0, 34.0, 42.0, 37.0, 23.0, 40.0, 28.0, 20.0, 24.0, 26.0, 14.0, 17.0, 20.0, 12.0, 11.0, 7.0, 12.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.484375, -13.08935546875, -12.6943359375, -12.29931640625, -11.904296875, -11.50927734375, -11.1142578125, -10.71923828125, -10.32421875, -9.92919921875, -9.5341796875, -9.13916015625, -8.744140625, -8.34912109375, -7.9541015625, -7.55908203125, -7.1640625, -6.76904296875, -6.3740234375, -5.97900390625, -5.583984375, -5.18896484375, -4.7939453125, -4.39892578125, -4.00390625, -3.60888671875, -3.2138671875, -2.81884765625, -2.423828125, -2.02880859375, -1.6337890625, -1.23876953125, -0.84375, -0.44873046875, -0.0537109375, 0.34130859375, 0.736328125, 1.13134765625, 1.5263671875, 1.92138671875, 2.31640625, 2.71142578125, 3.1064453125, 3.50146484375, 3.896484375, 4.29150390625, 4.6865234375, 5.08154296875, 5.4765625, 5.87158203125, 6.2666015625, 6.66162109375, 7.056640625, 7.45166015625, 7.8466796875, 8.24169921875, 8.63671875, 9.03173828125, 9.4267578125, 9.82177734375, 10.216796875, 10.61181640625, 11.0068359375, 11.40185546875, 11.796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 8.0, 11.0, 11.0, 19.0, 23.0, 28.0, 48.0, 60.0, 106.0, 159.0, 225.0, 311.0, 524.0, 780.0, 1193.0, 1757.0, 2706.0, 4167.0, 6613.0, 10389.0, 16478.0, 26469.0, 44627.0, 77422.0, 135160.0, 200993.0, 197633.0, 131677.0, 75040.0, 43592.0, 26007.0, 16221.0, 10022.0, 6293.0, 4012.0, 2677.0, 1728.0, 1144.0, 725.0, 485.0, 357.0, 198.0, 159.0, 90.0, 58.0, 44.0, 52.0, 20.0, 16.0, 9.0, 5.0, 6.0, 6.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.765625, -22.006103515625, -21.24658203125, -20.487060546875, -19.7275390625, -18.968017578125, -18.20849609375, -17.448974609375, -16.689453125, -15.929931640625, -15.17041015625, -14.410888671875, -13.6513671875, -12.891845703125, -12.13232421875, -11.372802734375, -10.61328125, -9.853759765625, -9.09423828125, -8.334716796875, -7.5751953125, -6.815673828125, -6.05615234375, -5.296630859375, -4.537109375, -3.777587890625, -3.01806640625, -2.258544921875, -1.4990234375, -0.739501953125, 0.02001953125, 0.779541015625, 1.5390625, 2.298583984375, 3.05810546875, 3.817626953125, 4.5771484375, 5.336669921875, 6.09619140625, 6.855712890625, 7.615234375, 8.374755859375, 9.13427734375, 9.893798828125, 10.6533203125, 11.412841796875, 12.17236328125, 12.931884765625, 13.69140625, 14.450927734375, 15.21044921875, 15.969970703125, 16.7294921875, 17.489013671875, 18.24853515625, 19.008056640625, 19.767578125, 20.527099609375, 21.28662109375, 22.046142578125, 22.8056640625, 23.565185546875, 24.32470703125, 25.084228515625, 25.84375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 4.0, 7.0, 13.0, 10.0, 7.0, 22.0, 24.0, 21.0, 23.0, 20.0, 19.0, 28.0, 22.0, 31.0, 35.0, 36.0, 33.0, 30.0, 46.0, 49.0, 31.0, 36.0, 34.0, 39.0, 43.0, 35.0, 40.0, 34.0, 40.0, 18.0, 23.0, 20.0, 15.0, 20.0, 18.0, 8.0, 8.0, 11.0, 10.0, 11.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3336181640625, -6.104736328125, -5.8758544921875, -5.64697265625, -5.4180908203125, -5.189208984375, -4.9603271484375, -4.7314453125, -4.5025634765625, -4.273681640625, -4.0447998046875, -3.81591796875, -3.5870361328125, -3.358154296875, -3.1292724609375, -2.900390625, -2.6715087890625, -2.442626953125, -2.2137451171875, -1.98486328125, -1.7559814453125, -1.527099609375, -1.2982177734375, -1.0693359375, -0.8404541015625, -0.611572265625, -0.3826904296875, -0.15380859375, 0.0750732421875, 0.303955078125, 0.5328369140625, 0.76171875, 0.9906005859375, 1.219482421875, 1.4483642578125, 1.67724609375, 1.9061279296875, 2.135009765625, 2.3638916015625, 2.5927734375, 2.8216552734375, 3.050537109375, 3.2794189453125, 3.50830078125, 3.7371826171875, 3.966064453125, 4.1949462890625, 4.423828125, 4.6527099609375, 4.881591796875, 5.1104736328125, 5.33935546875, 5.5682373046875, 5.797119140625, 6.0260009765625, 6.2548828125, 6.4837646484375, 6.712646484375, 6.9415283203125, 7.17041015625, 7.3992919921875, 7.628173828125, 7.8570556640625, 8.0859375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 7.0, 13.0, 9.0, 14.0, 16.0, 38.0, 63.0, 56.0, 95.0, 136.0, 195.0, 287.0, 403.0, 628.0, 1038.0, 1599.0, 2432.0, 4052.0, 6897.0, 12695.0, 26713.0, 69762.0, 275354.0, 451572.0, 116452.0, 38524.0, 17207.0, 8744.0, 5066.0, 2994.0, 1918.0, 1155.0, 801.0, 505.0, 334.0, 235.0, 148.0, 125.0, 78.0, 50.0, 37.0, 29.0, 24.0, 13.0, 11.0, 12.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0], "bins": [-2.1640625, -2.10260009765625, -2.0411376953125, -1.97967529296875, -1.918212890625, -1.85675048828125, -1.7952880859375, -1.73382568359375, -1.67236328125, -1.61090087890625, -1.5494384765625, -1.48797607421875, -1.426513671875, -1.36505126953125, -1.3035888671875, -1.24212646484375, -1.1806640625, -1.11920166015625, -1.0577392578125, -0.99627685546875, -0.934814453125, -0.87335205078125, -0.8118896484375, -0.75042724609375, -0.68896484375, -0.62750244140625, -0.5660400390625, -0.50457763671875, -0.443115234375, -0.38165283203125, -0.3201904296875, -0.25872802734375, -0.197265625, -0.13580322265625, -0.0743408203125, -0.01287841796875, 0.048583984375, 0.11004638671875, 0.1715087890625, 0.23297119140625, 0.29443359375, 0.35589599609375, 0.4173583984375, 0.47882080078125, 0.540283203125, 0.60174560546875, 0.6632080078125, 0.72467041015625, 0.7861328125, 0.84759521484375, 0.9090576171875, 0.97052001953125, 1.031982421875, 1.09344482421875, 1.1549072265625, 1.21636962890625, 1.27783203125, 1.33929443359375, 1.4007568359375, 1.46221923828125, 1.523681640625, 1.58514404296875, 1.6466064453125, 1.70806884765625, 1.76953125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 6.0, 12.0, 16.0, 15.0, 23.0, 26.0, 55.0, 52.0, 75.0, 78.0, 104.0, 110.0, 81.0, 68.0, 65.0, 47.0, 34.0, 21.0, 19.0, 17.0, 19.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00017976760864257812, -0.00017493776977062225, -0.00017010793089866638, -0.0001652780920267105, -0.00016044825315475464, -0.00015561841428279877, -0.0001507885754108429, -0.00014595873653888702, -0.00014112889766693115, -0.00013629905879497528, -0.0001314692199230194, -0.00012663938105106354, -0.00012180954217910767, -0.0001169797033071518, -0.00011214986443519592, -0.00010732002556324005, -0.00010249018669128418, -9.766034781932831e-05, -9.283050894737244e-05, -8.800067007541656e-05, -8.31708312034607e-05, -7.834099233150482e-05, -7.351115345954895e-05, -6.868131458759308e-05, -6.385147571563721e-05, -5.9021636843681335e-05, -5.4191797971725464e-05, -4.936195909976959e-05, -4.453212022781372e-05, -3.970228135585785e-05, -3.487244248390198e-05, -3.0042603611946106e-05, -2.5212764739990234e-05, -2.0382925868034363e-05, -1.555308699607849e-05, -1.072324812412262e-05, -5.893409252166748e-06, -1.0635703802108765e-06, 3.766268491744995e-06, 8.596107363700867e-06, 1.3425946235656738e-05, 1.825578510761261e-05, 2.308562397956848e-05, 2.7915462851524353e-05, 3.2745301723480225e-05, 3.7575140595436096e-05, 4.240497946739197e-05, 4.723481833934784e-05, 5.206465721130371e-05, 5.689449608325958e-05, 6.172433495521545e-05, 6.655417382717133e-05, 7.13840126991272e-05, 7.621385157108307e-05, 8.104369044303894e-05, 8.587352931499481e-05, 9.070336818695068e-05, 9.553320705890656e-05, 0.00010036304593086243, 0.0001051928848028183, 0.00011002272367477417, 0.00011485256254673004, 0.00011968240141868591, 0.00012451224029064178, 0.00012934207916259766]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 13.0, 11.0, 11.0, 22.0, 30.0, 48.0, 64.0, 87.0, 130.0, 209.0, 320.0, 457.0, 784.0, 1172.0, 1889.0, 3247.0, 5232.0, 9331.0, 17577.0, 37463.0, 98051.0, 361329.0, 342185.0, 93374.0, 35929.0, 16891.0, 9159.0, 5222.0, 3146.0, 1864.0, 1172.0, 726.0, 488.0, 303.0, 198.0, 146.0, 78.0, 60.0, 46.0, 24.0, 24.0, 10.0, 11.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.076171875, -2.018463134765625, -1.96075439453125, -1.903045654296875, -1.8453369140625, -1.787628173828125, -1.72991943359375, -1.672210693359375, -1.614501953125, -1.556793212890625, -1.49908447265625, -1.441375732421875, -1.3836669921875, -1.325958251953125, -1.26824951171875, -1.210540771484375, -1.15283203125, -1.095123291015625, -1.03741455078125, -0.979705810546875, -0.9219970703125, -0.864288330078125, -0.80657958984375, -0.748870849609375, -0.691162109375, -0.633453369140625, -0.57574462890625, -0.518035888671875, -0.4603271484375, -0.402618408203125, -0.34490966796875, -0.287200927734375, -0.2294921875, -0.171783447265625, -0.11407470703125, -0.056365966796875, 0.0013427734375, 0.059051513671875, 0.11676025390625, 0.174468994140625, 0.232177734375, 0.289886474609375, 0.34759521484375, 0.405303955078125, 0.4630126953125, 0.520721435546875, 0.57843017578125, 0.636138916015625, 0.69384765625, 0.751556396484375, 0.80926513671875, 0.866973876953125, 0.9246826171875, 0.982391357421875, 1.04010009765625, 1.097808837890625, 1.155517578125, 1.213226318359375, 1.27093505859375, 1.328643798828125, 1.3863525390625, 1.444061279296875, 1.50177001953125, 1.559478759765625, 1.6171875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 4.0, 9.0, 6.0, 6.0, 9.0, 7.0, 20.0, 14.0, 16.0, 25.0, 51.0, 45.0, 53.0, 64.0, 97.0, 97.0, 90.0, 88.0, 62.0, 55.0, 41.0, 31.0, 23.0, 13.0, 9.0, 10.0, 13.0, 10.0, 6.0, 8.0, 7.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6123046875, -0.5955810546875, -0.578857421875, -0.5621337890625, -0.54541015625, -0.5286865234375, -0.511962890625, -0.4952392578125, -0.478515625, -0.4617919921875, -0.445068359375, -0.4283447265625, -0.41162109375, -0.3948974609375, -0.378173828125, -0.3614501953125, -0.3447265625, -0.3280029296875, -0.311279296875, -0.2945556640625, -0.27783203125, -0.2611083984375, -0.244384765625, -0.2276611328125, -0.2109375, -0.1942138671875, -0.177490234375, -0.1607666015625, -0.14404296875, -0.1273193359375, -0.110595703125, -0.0938720703125, -0.0771484375, -0.0604248046875, -0.043701171875, -0.0269775390625, -0.01025390625, 0.0064697265625, 0.023193359375, 0.0399169921875, 0.056640625, 0.0733642578125, 0.090087890625, 0.1068115234375, 0.12353515625, 0.1402587890625, 0.156982421875, 0.1737060546875, 0.1904296875, 0.2071533203125, 0.223876953125, 0.2406005859375, 0.25732421875, 0.2740478515625, 0.290771484375, 0.3074951171875, 0.32421875, 0.3409423828125, 0.357666015625, 0.3743896484375, 0.39111328125, 0.4078369140625, 0.424560546875, 0.4412841796875, 0.4580078125]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 1.0, 6.0, 12.0, 11.0, 16.0, 25.0, 23.0, 32.0, 54.0, 70.0, 115.0, 118.0, 97.0, 110.0, 88.0, 63.0, 33.0, 25.0, 25.0, 20.0, 16.0, 19.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.48492431640625, -18.68439292907715, -17.883861541748047, -17.083328247070312, -16.28279685974121, -15.48226547241211, -14.681734085083008, -13.881202697753906, -13.080670356750488, -12.280138969421387, -11.479606628417969, -10.679075241088867, -9.878543853759766, -9.078011512756348, -8.277480125427246, -7.476948261260986, -6.676416397094727, -5.875884532928467, -5.075352668762207, -4.2748212814331055, -3.4742894172668457, -2.673757553100586, -1.8732261657714844, -1.0726943016052246, -0.27216243743896484, 0.5283693075180054, 1.3289010524749756, 2.1294326782226562, 2.929964542388916, 3.730496406555176, 4.531027793884277, 5.331559658050537, 6.132091522216797, 6.932623386383057, 7.733155250549316, 8.533686637878418, 9.334218978881836, 10.134750366210938, 10.935281753540039, 11.73581314086914, 12.536345481872559, 13.33687686920166, 14.137409210205078, 14.93794059753418, 15.738471984863281, 16.539005279541016, 17.339534759521484, 18.14006805419922, 18.94059944152832, 19.741130828857422, 20.541662216186523, 21.342193603515625, 22.14272689819336, 22.94325828552246, 23.743789672851562, 24.544321060180664, 25.344852447509766, 26.145383834838867, 26.94591522216797, 27.746448516845703, 28.546979904174805, 29.347511291503906, 30.148042678833008, 30.94857406616211, 31.749107360839844]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 7.0, 11.0, 11.0, 18.0, 19.0, 18.0, 28.0, 28.0, 32.0, 34.0, 38.0, 27.0, 41.0, 38.0, 37.0, 39.0, 35.0, 53.0, 44.0, 55.0, 31.0, 41.0, 45.0, 36.0, 26.0, 34.0, 28.0, 24.0, 13.0, 24.0, 10.0, 14.0, 9.0, 7.0, 10.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.426748275756836, -12.977045059204102, -12.52734088897705, -12.077637672424316, -11.627934455871582, -11.178230285644531, -10.728527069091797, -10.278823852539062, -9.829119682312012, -9.379416465759277, -8.929712295532227, -8.480009078979492, -8.030305862426758, -7.580601692199707, -7.130898475646973, -6.68119478225708, -6.231491565704346, -5.781787872314453, -5.332084655761719, -4.882380962371826, -4.432677268981934, -3.98297381401062, -3.5332703590393066, -3.083566665649414, -2.6338632106781006, -2.184159755706787, -1.7344560623168945, -1.284752607345581, -0.835049033164978, -0.385345458984375, 0.06435799598693848, 0.514061689376831, 0.9637651443481445, 1.4134687185287476, 1.8631722927093506, 2.312875747680664, 2.7625794410705566, 3.21228289604187, 3.6619863510131836, 4.111690044403076, 4.561393737792969, 5.011097431182861, 5.460800647735596, 5.910504341125488, 6.360208034515381, 6.809911727905273, 7.259614944458008, 7.7093186378479, 8.159021377563477, 8.608724594116211, 9.058428764343262, 9.508131980895996, 9.95783519744873, 10.407539367675781, 10.857242584228516, 11.30694580078125, 11.7566499710083, 12.206353187561035, 12.656057357788086, 13.10576057434082, 13.555463790893555, 14.005167961120605, 14.45487117767334, 14.90457534790039, 15.354278564453125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 12.0, 16.0, 18.0, 22.0, 47.0, 57.0, 82.0, 121.0, 139.0, 208.0, 287.0, 405.0, 584.0, 854.0, 1094.0, 1594.0, 2309.0, 3417.0, 4842.0, 7370.0, 10862.0, 16859.0, 26166.0, 41398.0, 69195.0, 127728.0, 319638.0, 1088037.0, 1490315.0, 568091.0, 181801.0, 88005.0, 51515.0, 31161.0, 19695.0, 12817.0, 8546.0, 5883.0, 3856.0, 2777.0, 1930.0, 1337.0, 930.0, 705.0, 472.0, 318.0, 221.0, 155.0, 117.0, 74.0, 56.0, 52.0, 29.0, 30.0, 20.0, 7.0, 6.0, 9.0, 2.0, 1.0, 1.0], "bins": [-19.453125, -18.830078125, -18.20703125, -17.583984375, -16.9609375, -16.337890625, -15.71484375, -15.091796875, -14.46875, -13.845703125, -13.22265625, -12.599609375, -11.9765625, -11.353515625, -10.73046875, -10.107421875, -9.484375, -8.861328125, -8.23828125, -7.615234375, -6.9921875, -6.369140625, -5.74609375, -5.123046875, -4.5, -3.876953125, -3.25390625, -2.630859375, -2.0078125, -1.384765625, -0.76171875, -0.138671875, 0.484375, 1.107421875, 1.73046875, 2.353515625, 2.9765625, 3.599609375, 4.22265625, 4.845703125, 5.46875, 6.091796875, 6.71484375, 7.337890625, 7.9609375, 8.583984375, 9.20703125, 9.830078125, 10.453125, 11.076171875, 11.69921875, 12.322265625, 12.9453125, 13.568359375, 14.19140625, 14.814453125, 15.4375, 16.060546875, 16.68359375, 17.306640625, 17.9296875, 18.552734375, 19.17578125, 19.798828125, 20.421875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 2.0, 9.0, 9.0, 10.0, 9.0, 17.0, 18.0, 26.0, 29.0, 24.0, 30.0, 18.0, 35.0, 32.0, 26.0, 33.0, 40.0, 30.0, 30.0, 42.0, 42.0, 46.0, 45.0, 42.0, 41.0, 29.0, 27.0, 37.0, 29.0, 29.0, 21.0, 16.0, 16.0, 18.0, 17.0, 13.0, 8.0, 9.0, 7.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.4765625, -10.1378173828125, -9.799072265625, -9.4603271484375, -9.12158203125, -8.7828369140625, -8.444091796875, -8.1053466796875, -7.7666015625, -7.4278564453125, -7.089111328125, -6.7503662109375, -6.41162109375, -6.0728759765625, -5.734130859375, -5.3953857421875, -5.056640625, -4.7178955078125, -4.379150390625, -4.0404052734375, -3.70166015625, -3.3629150390625, -3.024169921875, -2.6854248046875, -2.3466796875, -2.0079345703125, -1.669189453125, -1.3304443359375, -0.99169921875, -0.6529541015625, -0.314208984375, 0.0245361328125, 0.36328125, 0.7020263671875, 1.040771484375, 1.3795166015625, 1.71826171875, 2.0570068359375, 2.395751953125, 2.7344970703125, 3.0732421875, 3.4119873046875, 3.750732421875, 4.0894775390625, 4.42822265625, 4.7669677734375, 5.105712890625, 5.4444580078125, 5.783203125, 6.1219482421875, 6.460693359375, 6.7994384765625, 7.13818359375, 7.4769287109375, 7.815673828125, 8.1544189453125, 8.4931640625, 8.8319091796875, 9.170654296875, 9.5093994140625, 9.84814453125, 10.1868896484375, 10.525634765625, 10.8643798828125, 11.203125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 9.0, 12.0, 12.0, 30.0, 28.0, 63.0, 100.0, 184.0, 287.0, 459.0, 794.0, 1355.0, 2295.0, 4014.0, 7069.0, 12687.0, 24008.0, 46662.0, 96541.0, 218810.0, 597511.0, 1895259.0, 786441.0, 269612.0, 114319.0, 54345.0, 27728.0, 14716.0, 8055.0, 4608.0, 2572.0, 1560.0, 864.0, 495.0, 292.0, 177.0, 110.0, 65.0, 40.0, 35.0, 20.0, 15.0, 8.0, 11.0, 7.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.484375, -24.67822265625, -23.8720703125, -23.06591796875, -22.259765625, -21.45361328125, -20.6474609375, -19.84130859375, -19.03515625, -18.22900390625, -17.4228515625, -16.61669921875, -15.810546875, -15.00439453125, -14.1982421875, -13.39208984375, -12.5859375, -11.77978515625, -10.9736328125, -10.16748046875, -9.361328125, -8.55517578125, -7.7490234375, -6.94287109375, -6.13671875, -5.33056640625, -4.5244140625, -3.71826171875, -2.912109375, -2.10595703125, -1.2998046875, -0.49365234375, 0.3125, 1.11865234375, 1.9248046875, 2.73095703125, 3.537109375, 4.34326171875, 5.1494140625, 5.95556640625, 6.76171875, 7.56787109375, 8.3740234375, 9.18017578125, 9.986328125, 10.79248046875, 11.5986328125, 12.40478515625, 13.2109375, 14.01708984375, 14.8232421875, 15.62939453125, 16.435546875, 17.24169921875, 18.0478515625, 18.85400390625, 19.66015625, 20.46630859375, 21.2724609375, 22.07861328125, 22.884765625, 23.69091796875, 24.4970703125, 25.30322265625, 26.109375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 8.0, 3.0, 8.0, 10.0, 23.0, 14.0, 24.0, 25.0, 38.0, 50.0, 54.0, 57.0, 67.0, 83.0, 86.0, 120.0, 175.0, 174.0, 215.0, 328.0, 421.0, 440.0, 327.0, 254.0, 223.0, 171.0, 104.0, 86.0, 87.0, 67.0, 64.0, 55.0, 32.0, 35.0, 29.0, 18.0, 10.0, 17.0, 15.0, 12.0, 7.0, 12.0, 6.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-6.5703125, -6.365234375, -6.16015625, -5.955078125, -5.75, -5.544921875, -5.33984375, -5.134765625, -4.9296875, -4.724609375, -4.51953125, -4.314453125, -4.109375, -3.904296875, -3.69921875, -3.494140625, -3.2890625, -3.083984375, -2.87890625, -2.673828125, -2.46875, -2.263671875, -2.05859375, -1.853515625, -1.6484375, -1.443359375, -1.23828125, -1.033203125, -0.828125, -0.623046875, -0.41796875, -0.212890625, -0.0078125, 0.197265625, 0.40234375, 0.607421875, 0.8125, 1.017578125, 1.22265625, 1.427734375, 1.6328125, 1.837890625, 2.04296875, 2.248046875, 2.453125, 2.658203125, 2.86328125, 3.068359375, 3.2734375, 3.478515625, 3.68359375, 3.888671875, 4.09375, 4.298828125, 4.50390625, 4.708984375, 4.9140625, 5.119140625, 5.32421875, 5.529296875, 5.734375, 5.939453125, 6.14453125, 6.349609375, 6.5546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 7.0, 6.0, 11.0, 11.0, 13.0, 18.0, 30.0, 27.0, 54.0, 58.0, 79.0, 83.0, 104.0, 85.0, 104.0, 67.0, 39.0, 45.0, 31.0, 20.0, 21.0, 16.0, 17.0, 12.0, 11.0, 10.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.623504638671875, -16.973432540893555, -16.323360443115234, -15.67328929901123, -15.023218154907227, -14.373146057128906, -13.723073959350586, -13.073002815246582, -12.422931671142578, -11.772859573364258, -11.122788429260254, -10.472716331481934, -9.82264518737793, -9.17257308959961, -8.522500991821289, -7.872429847717285, -7.222357749938965, -6.572286128997803, -5.922214508056641, -5.27214241027832, -4.622071266174316, -3.971999406814575, -3.321927547454834, -2.671855926513672, -2.0217843055725098, -1.3717126846313477, -0.721640944480896, -0.07156920433044434, 0.5785024166107178, 1.2285740375518799, 1.878645896911621, 2.528717517852783, 3.1787891387939453, 3.8288607597351074, 4.4789323806762695, 5.12900447845459, 5.779075622558594, 6.429147720336914, 7.079219341278076, 7.729290962219238, 8.379362106323242, 9.029434204101562, 9.679505348205566, 10.329577445983887, 10.97964859008789, 11.629720687866211, 12.279792785644531, 12.929863929748535, 13.579936027526855, 14.230008125305176, 14.88007926940918, 15.5301513671875, 16.18022346496582, 16.830293655395508, 17.480365753173828, 18.13043785095215, 18.78050994873047, 19.43058204650879, 20.08065414428711, 20.730724334716797, 21.380796432495117, 22.030868530273438, 22.680940628051758, 23.331012725830078, 23.981082916259766]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 13.0, 16.0, 11.0, 16.0, 12.0, 18.0, 23.0, 21.0, 20.0, 28.0, 31.0, 27.0, 38.0, 39.0, 34.0, 35.0, 34.0, 51.0, 51.0, 32.0, 33.0, 27.0, 31.0, 24.0, 27.0, 35.0, 34.0, 28.0, 31.0, 27.0, 27.0, 19.0, 18.0, 15.0, 11.0, 9.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.096494674682617, -11.71364974975586, -11.330803871154785, -10.947958946228027, -10.56511402130127, -10.182268142700195, -9.799423217773438, -9.41657829284668, -9.033733367919922, -8.650888442993164, -8.26804256439209, -7.885197639465332, -7.502352714538574, -7.119507312774658, -6.736661911010742, -6.353816986083984, -5.97097110748291, -5.588125705718994, -5.205280780792236, -4.82243537902832, -4.4395904541015625, -4.0567450523376465, -3.6738996505737305, -3.2910544872283936, -2.9082093238830566, -2.5253641605377197, -2.142518997192383, -1.7596735954284668, -1.3768284320831299, -0.993983268737793, -0.611137866973877, -0.22829270362854004, 0.15455150604248047, 0.5373967289924622, 0.9202419519424438, 1.3030872344970703, 1.6859323978424072, 2.068777561187744, 2.45162296295166, 2.834468126296997, 3.217313289642334, 3.600158452987671, 3.983003616333008, 4.365849018096924, 4.74869441986084, 5.131539344787598, 5.514384746551514, 5.89723014831543, 6.2800750732421875, 6.6629204750061035, 7.045765399932861, 7.428610801696777, 7.811455726623535, 8.19430160522461, 8.577146530151367, 8.959991455078125, 9.342836380004883, 9.72568130493164, 10.108527183532715, 10.491372108459473, 10.87421703338623, 11.257062911987305, 11.639907836914062, 12.02275276184082, 12.405598640441895]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 11.0, 8.0, 26.0, 39.0, 31.0, 55.0, 66.0, 136.0, 183.0, 263.0, 437.0, 674.0, 894.0, 1408.0, 2191.0, 3059.0, 4666.0, 6919.0, 10504.0, 16166.0, 24674.0, 38365.0, 62036.0, 109776.0, 253452.0, 237494.0, 106661.0, 60319.0, 37338.0, 23663.0, 15813.0, 10484.0, 7015.0, 4617.0, 2982.0, 2057.0, 1257.0, 908.0, 619.0, 412.0, 282.0, 199.0, 137.0, 91.0, 46.0, 45.0, 29.0, 19.0, 13.0, 11.0, 0.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.505859375, -3.396209716796875, -3.28656005859375, -3.176910400390625, -3.0672607421875, -2.957611083984375, -2.84796142578125, -2.738311767578125, -2.628662109375, -2.519012451171875, -2.40936279296875, -2.299713134765625, -2.1900634765625, -2.080413818359375, -1.97076416015625, -1.861114501953125, -1.75146484375, -1.641815185546875, -1.53216552734375, -1.422515869140625, -1.3128662109375, -1.203216552734375, -1.09356689453125, -0.983917236328125, -0.874267578125, -0.764617919921875, -0.65496826171875, -0.545318603515625, -0.4356689453125, -0.326019287109375, -0.21636962890625, -0.106719970703125, 0.0029296875, 0.112579345703125, 0.22222900390625, 0.331878662109375, 0.4415283203125, 0.551177978515625, 0.66082763671875, 0.770477294921875, 0.880126953125, 0.989776611328125, 1.09942626953125, 1.209075927734375, 1.3187255859375, 1.428375244140625, 1.53802490234375, 1.647674560546875, 1.75732421875, 1.866973876953125, 1.97662353515625, 2.086273193359375, 2.1959228515625, 2.305572509765625, 2.41522216796875, 2.524871826171875, 2.634521484375, 2.744171142578125, 2.85382080078125, 2.963470458984375, 3.0731201171875, 3.182769775390625, 3.29241943359375, 3.402069091796875, 3.51171875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 8.0, 6.0, 12.0, 17.0, 13.0, 19.0, 14.0, 24.0, 21.0, 30.0, 23.0, 39.0, 38.0, 38.0, 41.0, 46.0, 44.0, 36.0, 31.0, 45.0, 40.0, 37.0, 42.0, 23.0, 34.0, 41.0, 18.0, 33.0, 22.0, 30.0, 19.0, 20.0, 23.0, 20.0, 7.0, 6.0, 6.0, 2.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.0390625, -12.6256103515625, -12.212158203125, -11.7987060546875, -11.38525390625, -10.9718017578125, -10.558349609375, -10.1448974609375, -9.7314453125, -9.3179931640625, -8.904541015625, -8.4910888671875, -8.07763671875, -7.6641845703125, -7.250732421875, -6.8372802734375, -6.423828125, -6.0103759765625, -5.596923828125, -5.1834716796875, -4.77001953125, -4.3565673828125, -3.943115234375, -3.5296630859375, -3.1162109375, -2.7027587890625, -2.289306640625, -1.8758544921875, -1.46240234375, -1.0489501953125, -0.635498046875, -0.2220458984375, 0.19140625, 0.6048583984375, 1.018310546875, 1.4317626953125, 1.84521484375, 2.2586669921875, 2.672119140625, 3.0855712890625, 3.4990234375, 3.9124755859375, 4.325927734375, 4.7393798828125, 5.15283203125, 5.5662841796875, 5.979736328125, 6.3931884765625, 6.806640625, 7.2200927734375, 7.633544921875, 8.0469970703125, 8.46044921875, 8.8739013671875, 9.287353515625, 9.7008056640625, 10.1142578125, 10.5277099609375, 10.941162109375, 11.3546142578125, 11.76806640625, 12.1815185546875, 12.594970703125, 13.0084228515625, 13.421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 11.0, 13.0, 39.0, 41.0, 58.0, 95.0, 154.0, 207.0, 299.0, 362.0, 528.0, 741.0, 1098.0, 1623.0, 2228.0, 3166.0, 4658.0, 7014.0, 10546.0, 15598.0, 24035.0, 36944.0, 59850.0, 105333.0, 244618.0, 251719.0, 106722.0, 60571.0, 37177.0, 24181.0, 15836.0, 10562.0, 7187.0, 4626.0, 3271.0, 2259.0, 1555.0, 1049.0, 770.0, 514.0, 387.0, 276.0, 209.0, 142.0, 88.0, 72.0, 31.0, 31.0, 17.0, 10.0, 12.0, 7.0, 2.0, 6.0, 3.0, 1.0, 1.0], "bins": [-3.376953125, -3.271453857421875, -3.16595458984375, -3.060455322265625, -2.9549560546875, -2.849456787109375, -2.74395751953125, -2.638458251953125, -2.532958984375, -2.427459716796875, -2.32196044921875, -2.216461181640625, -2.1109619140625, -2.005462646484375, -1.89996337890625, -1.794464111328125, -1.68896484375, -1.583465576171875, -1.47796630859375, -1.372467041015625, -1.2669677734375, -1.161468505859375, -1.05596923828125, -0.950469970703125, -0.844970703125, -0.739471435546875, -0.63397216796875, -0.528472900390625, -0.4229736328125, -0.317474365234375, -0.21197509765625, -0.106475830078125, -0.0009765625, 0.104522705078125, 0.21002197265625, 0.315521240234375, 0.4210205078125, 0.526519775390625, 0.63201904296875, 0.737518310546875, 0.843017578125, 0.948516845703125, 1.05401611328125, 1.159515380859375, 1.2650146484375, 1.370513916015625, 1.47601318359375, 1.581512451171875, 1.68701171875, 1.792510986328125, 1.89801025390625, 2.003509521484375, 2.1090087890625, 2.214508056640625, 2.32000732421875, 2.425506591796875, 2.531005859375, 2.636505126953125, 2.74200439453125, 2.847503662109375, 2.9530029296875, 3.058502197265625, 3.16400146484375, 3.269500732421875, 3.375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 9.0, 5.0, 12.0, 8.0, 6.0, 11.0, 10.0, 13.0, 26.0, 15.0, 19.0, 26.0, 18.0, 18.0, 34.0, 32.0, 30.0, 43.0, 34.0, 43.0, 41.0, 42.0, 36.0, 36.0, 47.0, 31.0, 37.0, 39.0, 33.0, 32.0, 33.0, 20.0, 24.0, 21.0, 22.0, 20.0, 9.0, 14.0, 11.0, 8.0, 7.0, 11.0, 8.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.6328125, -7.3814697265625, -7.130126953125, -6.8787841796875, -6.62744140625, -6.3760986328125, -6.124755859375, -5.8734130859375, -5.6220703125, -5.3707275390625, -5.119384765625, -4.8680419921875, -4.61669921875, -4.3653564453125, -4.114013671875, -3.8626708984375, -3.611328125, -3.3599853515625, -3.108642578125, -2.8572998046875, -2.60595703125, -2.3546142578125, -2.103271484375, -1.8519287109375, -1.6005859375, -1.3492431640625, -1.097900390625, -0.8465576171875, -0.59521484375, -0.3438720703125, -0.092529296875, 0.1588134765625, 0.41015625, 0.6614990234375, 0.912841796875, 1.1641845703125, 1.41552734375, 1.6668701171875, 1.918212890625, 2.1695556640625, 2.4208984375, 2.6722412109375, 2.923583984375, 3.1749267578125, 3.42626953125, 3.6776123046875, 3.928955078125, 4.1802978515625, 4.431640625, 4.6829833984375, 4.934326171875, 5.1856689453125, 5.43701171875, 5.6883544921875, 5.939697265625, 6.1910400390625, 6.4423828125, 6.6937255859375, 6.945068359375, 7.1964111328125, 7.44775390625, 7.6990966796875, 7.950439453125, 8.2017822265625, 8.453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 8.0, 10.0, 13.0, 19.0, 21.0, 47.0, 59.0, 58.0, 119.0, 166.0, 245.0, 347.0, 503.0, 717.0, 1017.0, 1523.0, 2422.0, 3654.0, 5758.0, 9712.0, 16236.0, 28855.0, 54477.0, 116425.0, 277594.0, 282004.0, 118885.0, 55507.0, 29000.0, 16446.0, 9787.0, 5811.0, 3705.0, 2418.0, 1580.0, 1004.0, 687.0, 500.0, 391.0, 237.0, 175.0, 136.0, 73.0, 50.0, 39.0, 30.0, 23.0, 11.0, 14.0, 9.0, 9.0, 1.0, 6.0, 3.0, 0.0, 3.0], "bins": [-0.00634765625, -0.00615537166595459, -0.00596308708190918, -0.0057708024978637695, -0.005578517913818359, -0.005386233329772949, -0.005193948745727539, -0.005001664161682129, -0.004809379577636719, -0.004617094993591309, -0.0044248104095458984, -0.004232525825500488, -0.004040241241455078, -0.003847956657409668, -0.003655672073364258, -0.0034633874893188477, -0.0032711029052734375, -0.0030788183212280273, -0.002886533737182617, -0.002694249153137207, -0.002501964569091797, -0.0023096799850463867, -0.0021173954010009766, -0.0019251108169555664, -0.0017328262329101562, -0.001540541648864746, -0.001348257064819336, -0.0011559724807739258, -0.0009636878967285156, -0.0007714033126831055, -0.0005791187286376953, -0.00038683414459228516, -0.000194549560546875, -2.2649765014648438e-06, 0.0001900196075439453, 0.00038230419158935547, 0.0005745887756347656, 0.0007668733596801758, 0.0009591579437255859, 0.001151442527770996, 0.0013437271118164062, 0.0015360116958618164, 0.0017282962799072266, 0.0019205808639526367, 0.002112865447998047, 0.002305150032043457, 0.002497434616088867, 0.0026897192001342773, 0.0028820037841796875, 0.0030742883682250977, 0.003266572952270508, 0.003458857536315918, 0.003651142120361328, 0.0038434267044067383, 0.0040357112884521484, 0.004227995872497559, 0.004420280456542969, 0.004612565040588379, 0.004804849624633789, 0.004997134208679199, 0.005189418792724609, 0.0053817033767700195, 0.00557398796081543, 0.00576627254486084, 0.00595855712890625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 9.0, 16.0, 17.0, 30.0, 26.0, 64.0, 49.0, 54.0, 79.0, 91.0, 108.0, 80.0, 67.0, 56.0, 52.0, 50.0, 26.0, 21.0, 12.0, 20.0, 13.0, 10.0, 4.0, 5.0, 1.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.095296263694763e-06, -8.773058652877808e-06, -8.450821042060852e-06, -8.128583431243896e-06, -7.806345820426941e-06, -7.484108209609985e-06, -7.16187059879303e-06, -6.839632987976074e-06, -6.517395377159119e-06, -6.195157766342163e-06, -5.8729201555252075e-06, -5.550682544708252e-06, -5.228444933891296e-06, -4.906207323074341e-06, -4.583969712257385e-06, -4.26173210144043e-06, -3.939494490623474e-06, -3.6172568798065186e-06, -3.295019268989563e-06, -2.9727816581726074e-06, -2.650544047355652e-06, -2.3283064365386963e-06, -2.0060688257217407e-06, -1.6838312149047852e-06, -1.3615936040878296e-06, -1.039355993270874e-06, -7.171183824539185e-07, -3.948807716369629e-07, -7.264316082000732e-08, 2.4959444999694824e-07, 5.718320608139038e-07, 8.940696716308594e-07, 1.216307282447815e-06, 1.5385448932647705e-06, 1.860782504081726e-06, 2.1830201148986816e-06, 2.505257725715637e-06, 2.8274953365325928e-06, 3.1497329473495483e-06, 3.471970558166504e-06, 3.7942081689834595e-06, 4.116445779800415e-06, 4.438683390617371e-06, 4.760921001434326e-06, 5.083158612251282e-06, 5.405396223068237e-06, 5.727633833885193e-06, 6.0498714447021484e-06, 6.372109055519104e-06, 6.6943466663360596e-06, 7.016584277153015e-06, 7.338821887969971e-06, 7.661059498786926e-06, 7.983297109603882e-06, 8.305534720420837e-06, 8.627772331237793e-06, 8.950009942054749e-06, 9.272247552871704e-06, 9.59448516368866e-06, 9.916722774505615e-06, 1.023896038532257e-05, 1.0561197996139526e-05, 1.0883435606956482e-05, 1.1205673217773438e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 9.0, 28.0, 30.0, 36.0, 65.0, 85.0, 148.0, 235.0, 397.0, 703.0, 1147.0, 2005.0, 3494.0, 6411.0, 12320.0, 25208.0, 54445.0, 133836.0, 364338.0, 265345.0, 95908.0, 40919.0, 19644.0, 9646.0, 5173.0, 2837.0, 1609.0, 986.0, 602.0, 362.0, 215.0, 132.0, 79.0, 50.0, 39.0, 19.0, 12.0, 8.0, 11.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006198883056640625, -0.005958855152130127, -0.005718827247619629, -0.005478799343109131, -0.005238771438598633, -0.004998743534088135, -0.004758715629577637, -0.004518687725067139, -0.004278659820556641, -0.004038631916046143, -0.0037986040115356445, -0.0035585761070251465, -0.0033185482025146484, -0.0030785202980041504, -0.0028384923934936523, -0.0025984644889831543, -0.0023584365844726562, -0.002118408679962158, -0.0018783807754516602, -0.0016383528709411621, -0.001398324966430664, -0.001158297061920166, -0.000918269157409668, -0.0006782412528991699, -0.0004382133483886719, -0.00019818544387817383, 4.184246063232422e-05, 0.00028187036514282227, 0.0005218982696533203, 0.0007619261741638184, 0.0010019540786743164, 0.0012419819831848145, 0.0014820098876953125, 0.0017220377922058105, 0.0019620656967163086, 0.0022020936012268066, 0.0024421215057373047, 0.0026821494102478027, 0.0029221773147583008, 0.003162205219268799, 0.003402233123779297, 0.003642261028289795, 0.003882288932800293, 0.004122316837310791, 0.004362344741821289, 0.004602372646331787, 0.004842400550842285, 0.005082428455352783, 0.005322456359863281, 0.005562484264373779, 0.005802512168884277, 0.006042540073394775, 0.0062825679779052734, 0.0065225958824157715, 0.0067626237869262695, 0.007002651691436768, 0.007242679595947266, 0.007482707500457764, 0.007722735404968262, 0.00796276330947876, 0.008202791213989258, 0.008442819118499756, 0.008682847023010254, 0.008922874927520752, 0.00916290283203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 7.0, 8.0, 6.0, 9.0, 8.0, 18.0, 18.0, 20.0, 28.0, 28.0, 41.0, 33.0, 39.0, 66.0, 60.0, 75.0, 74.0, 68.0, 65.0, 51.0, 53.0, 31.0, 40.0, 26.0, 27.0, 18.0, 13.0, 16.0, 13.0, 11.0, 6.0, 1.0, 5.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00156402587890625, -0.0015059709548950195, -0.001447916030883789, -0.0013898611068725586, -0.0013318061828613281, -0.0012737512588500977, -0.0012156963348388672, -0.0011576414108276367, -0.0010995864868164062, -0.0010415315628051758, -0.0009834766387939453, -0.0009254217147827148, -0.0008673667907714844, -0.0008093118667602539, -0.0007512569427490234, -0.000693202018737793, -0.0006351470947265625, -0.000577092170715332, -0.0005190372467041016, -0.0004609823226928711, -0.0004029273986816406, -0.00034487247467041016, -0.0002868175506591797, -0.00022876262664794922, -0.00017070770263671875, -0.00011265277862548828, -5.459785461425781e-05, 3.4570693969726562e-06, 6.151199340820312e-05, 0.0001195669174194336, 0.00017762184143066406, 0.00023567676544189453, 0.000293731689453125, 0.00035178661346435547, 0.00040984153747558594, 0.0004678964614868164, 0.0005259513854980469, 0.0005840063095092773, 0.0006420612335205078, 0.0007001161575317383, 0.0007581710815429688, 0.0008162260055541992, 0.0008742809295654297, 0.0009323358535766602, 0.0009903907775878906, 0.001048445701599121, 0.0011065006256103516, 0.001164555549621582, 0.0012226104736328125, 0.001280665397644043, 0.0013387203216552734, 0.001396775245666504, 0.0014548301696777344, 0.0015128850936889648, 0.0015709400177001953, 0.0016289949417114258, 0.0016870498657226562, 0.0017451047897338867, 0.0018031597137451172, 0.0018612146377563477, 0.0019192695617675781, 0.0019773244857788086, 0.002035379409790039, 0.0020934343338012695, 0.0021514892578125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 13.0, 10.0, 13.0, 15.0, 30.0, 36.0, 45.0, 60.0, 73.0, 94.0, 100.0, 86.0, 104.0, 64.0, 46.0, 37.0, 31.0, 21.0, 24.0, 16.0, 16.0, 12.0, 10.0, 8.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.597755432128906, -16.94927978515625, -16.300806045532227, -15.652331352233887, -15.003856658935547, -14.355381965637207, -13.706907272338867, -13.058431625366211, -12.409957885742188, -11.761483192443848, -11.113008499145508, -10.464533805847168, -9.816059112548828, -9.167584419250488, -8.519109725952148, -7.87063455581665, -7.222159385681152, -6.5736846923828125, -5.925209999084473, -5.276735305786133, -4.628260612487793, -3.979785680770874, -3.331310749053955, -2.6828360557556152, -2.0343613624572754, -1.3858866691589355, -0.7374118566513062, -0.08893704414367676, 0.5595376491546631, 1.208012342453003, 1.8564872741699219, 2.5049619674682617, 3.1534366607666016, 3.8019113540649414, 4.450386047363281, 5.098860740661621, 5.747335433959961, 6.395810127258301, 7.044285297393799, 7.692759990692139, 8.34123420715332, 8.98970890045166, 9.63818359375, 10.28665828704834, 10.93513298034668, 11.58360767364502, 12.23208236694336, 12.880558013916016, 13.529032707214355, 14.177507400512695, 14.825982093811035, 15.474456787109375, 16.12293243408203, 16.771406173706055, 17.41988182067871, 18.068355560302734, 18.71683120727539, 19.365306854248047, 20.01378059387207, 20.662256240844727, 21.31072998046875, 21.959205627441406, 22.60767936706543, 23.256155014038086, 23.90462875366211]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 13.0, 16.0, 11.0, 16.0, 12.0, 18.0, 24.0, 20.0, 19.0, 29.0, 29.0, 29.0, 38.0, 37.0, 34.0, 36.0, 35.0, 51.0, 51.0, 31.0, 34.0, 27.0, 31.0, 23.0, 26.0, 36.0, 35.0, 27.0, 32.0, 26.0, 27.0, 19.0, 19.0, 15.0, 11.0, 9.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.099799156188965, -11.718282699584961, -11.33676528930664, -10.955248832702637, -10.573731422424316, -10.192214965820312, -9.810697555541992, -9.429181098937988, -9.047663688659668, -8.666147232055664, -8.284629821777344, -7.903112888336182, -7.5215959548950195, -7.140079021453857, -6.758562088012695, -6.377045631408691, -5.995528697967529, -5.614011764526367, -5.232494831085205, -4.850977897644043, -4.469460964202881, -4.087944030761719, -3.7064273357391357, -3.3249104022979736, -2.9433934688568115, -2.5618765354156494, -2.1803596019744873, -1.7988427877426147, -1.4173258543014526, -1.0358089208602905, -0.654292106628418, -0.27277517318725586, 0.10874176025390625, 0.49025866389274597, 0.8717755675315857, 1.253292441368103, 1.6348093748092651, 2.016326427459717, 2.3978431224823, 2.779360055923462, 3.160876989364624, 3.542393922805786, 3.9239108562469482, 4.305427551269531, 4.686944484710693, 5.0684614181518555, 5.449978351593018, 5.83149528503418, 6.213012218475342, 6.594529151916504, 6.976046085357666, 7.357563018798828, 7.73907995223999, 8.120596885681152, 8.502113342285156, 8.883630752563477, 9.26514720916748, 9.646663665771484, 10.028181076049805, 10.409697532653809, 10.791214942932129, 11.172731399536133, 11.554248809814453, 11.935765266418457, 12.317282676696777]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 10.0, 6.0, 7.0, 25.0, 18.0, 30.0, 53.0, 90.0, 170.0, 241.0, 319.0, 484.0, 767.0, 1210.0, 1967.0, 3100.0, 4926.0, 7967.0, 13646.0, 22778.0, 40127.0, 75179.0, 142512.0, 230018.0, 218723.0, 127646.0, 67180.0, 36422.0, 20675.0, 12303.0, 7545.0, 4536.0, 2816.0, 1850.0, 1199.0, 774.0, 448.0, 279.0, 178.0, 106.0, 79.0, 53.0, 37.0, 23.0, 9.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.203125, -25.382080078125, -24.56103515625, -23.739990234375, -22.9189453125, -22.097900390625, -21.27685546875, -20.455810546875, -19.634765625, -18.813720703125, -17.99267578125, -17.171630859375, -16.3505859375, -15.529541015625, -14.70849609375, -13.887451171875, -13.06640625, -12.245361328125, -11.42431640625, -10.603271484375, -9.7822265625, -8.961181640625, -8.14013671875, -7.319091796875, -6.498046875, -5.677001953125, -4.85595703125, -4.034912109375, -3.2138671875, -2.392822265625, -1.57177734375, -0.750732421875, 0.0703125, 0.891357421875, 1.71240234375, 2.533447265625, 3.3544921875, 4.175537109375, 4.99658203125, 5.817626953125, 6.638671875, 7.459716796875, 8.28076171875, 9.101806640625, 9.9228515625, 10.743896484375, 11.56494140625, 12.385986328125, 13.20703125, 14.028076171875, 14.84912109375, 15.670166015625, 16.4912109375, 17.312255859375, 18.13330078125, 18.954345703125, 19.775390625, 20.596435546875, 21.41748046875, 22.238525390625, 23.0595703125, 23.880615234375, 24.70166015625, 25.522705078125, 26.34375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 10.0, 9.0, 6.0, 16.0, 15.0, 20.0, 20.0, 21.0, 28.0, 25.0, 36.0, 28.0, 32.0, 36.0, 43.0, 36.0, 34.0, 51.0, 42.0, 37.0, 39.0, 40.0, 27.0, 35.0, 21.0, 36.0, 34.0, 37.0, 25.0, 23.0, 36.0, 19.0, 8.0, 15.0, 12.0, 12.0, 5.0, 6.0, 7.0, 4.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.765625, -11.3983154296875, -11.031005859375, -10.6636962890625, -10.29638671875, -9.9290771484375, -9.561767578125, -9.1944580078125, -8.8271484375, -8.4598388671875, -8.092529296875, -7.7252197265625, -7.35791015625, -6.9906005859375, -6.623291015625, -6.2559814453125, -5.888671875, -5.5213623046875, -5.154052734375, -4.7867431640625, -4.41943359375, -4.0521240234375, -3.684814453125, -3.3175048828125, -2.9501953125, -2.5828857421875, -2.215576171875, -1.8482666015625, -1.48095703125, -1.1136474609375, -0.746337890625, -0.3790283203125, -0.01171875, 0.3555908203125, 0.722900390625, 1.0902099609375, 1.45751953125, 1.8248291015625, 2.192138671875, 2.5594482421875, 2.9267578125, 3.2940673828125, 3.661376953125, 4.0286865234375, 4.39599609375, 4.7633056640625, 5.130615234375, 5.4979248046875, 5.865234375, 6.2325439453125, 6.599853515625, 6.9671630859375, 7.33447265625, 7.7017822265625, 8.069091796875, 8.4364013671875, 8.8037109375, 9.1710205078125, 9.538330078125, 9.9056396484375, 10.27294921875, 10.6402587890625, 11.007568359375, 11.3748779296875, 11.7421875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 10.0, 20.0, 13.0, 22.0, 37.0, 69.0, 122.0, 197.0, 365.0, 578.0, 1027.0, 1719.0, 2928.0, 5114.0, 9234.0, 16879.0, 30323.0, 58415.0, 120423.0, 241294.0, 267307.0, 144212.0, 69154.0, 35126.0, 19169.0, 10748.0, 5947.0, 3396.0, 1994.0, 1118.0, 646.0, 366.0, 240.0, 117.0, 75.0, 51.0, 37.0, 22.0, 9.0, 15.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5625, -25.5830078125, -24.603515625, -23.6240234375, -22.64453125, -21.6650390625, -20.685546875, -19.7060546875, -18.7265625, -17.7470703125, -16.767578125, -15.7880859375, -14.80859375, -13.8291015625, -12.849609375, -11.8701171875, -10.890625, -9.9111328125, -8.931640625, -7.9521484375, -6.97265625, -5.9931640625, -5.013671875, -4.0341796875, -3.0546875, -2.0751953125, -1.095703125, -0.1162109375, 0.86328125, 1.8427734375, 2.822265625, 3.8017578125, 4.78125, 5.7607421875, 6.740234375, 7.7197265625, 8.69921875, 9.6787109375, 10.658203125, 11.6376953125, 12.6171875, 13.5966796875, 14.576171875, 15.5556640625, 16.53515625, 17.5146484375, 18.494140625, 19.4736328125, 20.453125, 21.4326171875, 22.412109375, 23.3916015625, 24.37109375, 25.3505859375, 26.330078125, 27.3095703125, 28.2890625, 29.2685546875, 30.248046875, 31.2275390625, 32.20703125, 33.1865234375, 34.166015625, 35.1455078125, 36.125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 10.0, 6.0, 11.0, 8.0, 14.0, 20.0, 15.0, 26.0, 35.0, 32.0, 38.0, 25.0, 45.0, 41.0, 36.0, 40.0, 42.0, 53.0, 43.0, 50.0, 44.0, 42.0, 49.0, 46.0, 31.0, 24.0, 19.0, 23.0, 32.0, 23.0, 14.0, 11.0, 10.0, 11.0, 8.0, 2.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5390625, -7.2662353515625, -6.993408203125, -6.7205810546875, -6.44775390625, -6.1749267578125, -5.902099609375, -5.6292724609375, -5.3564453125, -5.0836181640625, -4.810791015625, -4.5379638671875, -4.26513671875, -3.9923095703125, -3.719482421875, -3.4466552734375, -3.173828125, -2.9010009765625, -2.628173828125, -2.3553466796875, -2.08251953125, -1.8096923828125, -1.536865234375, -1.2640380859375, -0.9912109375, -0.7183837890625, -0.445556640625, -0.1727294921875, 0.10009765625, 0.3729248046875, 0.645751953125, 0.9185791015625, 1.19140625, 1.4642333984375, 1.737060546875, 2.0098876953125, 2.28271484375, 2.5555419921875, 2.828369140625, 3.1011962890625, 3.3740234375, 3.6468505859375, 3.919677734375, 4.1925048828125, 4.46533203125, 4.7381591796875, 5.010986328125, 5.2838134765625, 5.556640625, 5.8294677734375, 6.102294921875, 6.3751220703125, 6.64794921875, 6.9207763671875, 7.193603515625, 7.4664306640625, 7.7392578125, 8.0120849609375, 8.284912109375, 8.5577392578125, 8.83056640625, 9.1033935546875, 9.376220703125, 9.6490478515625, 9.921875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 16.0, 11.0, 24.0, 23.0, 27.0, 34.0, 72.0, 84.0, 132.0, 176.0, 264.0, 326.0, 515.0, 809.0, 1177.0, 1723.0, 2629.0, 4190.0, 6930.0, 11925.0, 21827.0, 46097.0, 117066.0, 367554.0, 290496.0, 90117.0, 37796.0, 18934.0, 10430.0, 6051.0, 3701.0, 2421.0, 1492.0, 1097.0, 724.0, 504.0, 340.0, 249.0, 161.0, 101.0, 74.0, 68.0, 56.0, 30.0, 21.0, 23.0, 12.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7744140625, -1.716949462890625, -1.65948486328125, -1.602020263671875, -1.5445556640625, -1.487091064453125, -1.42962646484375, -1.372161865234375, -1.314697265625, -1.257232666015625, -1.19976806640625, -1.142303466796875, -1.0848388671875, -1.027374267578125, -0.96990966796875, -0.912445068359375, -0.85498046875, -0.797515869140625, -0.74005126953125, -0.682586669921875, -0.6251220703125, -0.567657470703125, -0.51019287109375, -0.452728271484375, -0.395263671875, -0.337799072265625, -0.28033447265625, -0.222869873046875, -0.1654052734375, -0.107940673828125, -0.05047607421875, 0.006988525390625, 0.064453125, 0.121917724609375, 0.17938232421875, 0.236846923828125, 0.2943115234375, 0.351776123046875, 0.40924072265625, 0.466705322265625, 0.524169921875, 0.581634521484375, 0.63909912109375, 0.696563720703125, 0.7540283203125, 0.811492919921875, 0.86895751953125, 0.926422119140625, 0.98388671875, 1.041351318359375, 1.09881591796875, 1.156280517578125, 1.2137451171875, 1.271209716796875, 1.32867431640625, 1.386138916015625, 1.443603515625, 1.501068115234375, 1.55853271484375, 1.615997314453125, 1.6734619140625, 1.730926513671875, 1.78839111328125, 1.845855712890625, 1.9033203125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 8.0, 10.0, 9.0, 15.0, 14.0, 21.0, 28.0, 42.0, 40.0, 63.0, 69.0, 96.0, 90.0, 92.0, 71.0, 65.0, 57.0, 47.0, 36.0, 29.0, 13.0, 14.0, 16.0, 12.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001380443572998047, -0.0001336894929409027, -0.00012933462858200073, -0.00012497976422309875, -0.00012062489986419678, -0.0001162700355052948, -0.00011191517114639282, -0.00010756030678749084, -0.00010320544242858887, -9.885057806968689e-05, -9.449571371078491e-05, -9.014084935188293e-05, -8.578598499298096e-05, -8.143112063407898e-05, -7.7076256275177e-05, -7.272139191627502e-05, -6.836652755737305e-05, -6.401166319847107e-05, -5.965679883956909e-05, -5.5301934480667114e-05, -5.094707012176514e-05, -4.659220576286316e-05, -4.223734140396118e-05, -3.7882477045059204e-05, -3.3527612686157227e-05, -2.917274832725525e-05, -2.481788396835327e-05, -2.0463019609451294e-05, -1.6108155250549316e-05, -1.1753290891647339e-05, -7.398426532745361e-06, -3.043562173843384e-06, 1.3113021850585938e-06, 5.666166543960571e-06, 1.0021030902862549e-05, 1.4375895261764526e-05, 1.8730759620666504e-05, 2.308562397956848e-05, 2.744048833847046e-05, 3.1795352697372437e-05, 3.6150217056274414e-05, 4.050508141517639e-05, 4.485994577407837e-05, 4.921481013298035e-05, 5.3569674491882324e-05, 5.79245388507843e-05, 6.227940320968628e-05, 6.663426756858826e-05, 7.098913192749023e-05, 7.534399628639221e-05, 7.969886064529419e-05, 8.405372500419617e-05, 8.840858936309814e-05, 9.276345372200012e-05, 9.71183180809021e-05, 0.00010147318243980408, 0.00010582804679870605, 0.00011018291115760803, 0.00011453777551651001, 0.00011889263987541199, 0.00012324750423431396, 0.00012760236859321594, 0.00013195723295211792, 0.0001363120973110199, 0.00014066696166992188]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 15.0, 11.0, 21.0, 33.0, 37.0, 56.0, 86.0, 132.0, 175.0, 308.0, 412.0, 645.0, 1041.0, 1549.0, 2439.0, 4017.0, 6744.0, 11759.0, 21653.0, 43847.0, 106388.0, 351381.0, 312556.0, 95392.0, 39895.0, 20148.0, 11070.0, 6307.0, 3836.0, 2373.0, 1412.0, 931.0, 639.0, 428.0, 254.0, 175.0, 130.0, 87.0, 63.0, 37.0, 26.0, 20.0, 7.0, 10.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.9951171875, -1.93634033203125, -1.8775634765625, -1.81878662109375, -1.760009765625, -1.70123291015625, -1.6424560546875, -1.58367919921875, -1.52490234375, -1.46612548828125, -1.4073486328125, -1.34857177734375, -1.289794921875, -1.23101806640625, -1.1722412109375, -1.11346435546875, -1.0546875, -0.99591064453125, -0.9371337890625, -0.87835693359375, -0.819580078125, -0.76080322265625, -0.7020263671875, -0.64324951171875, -0.58447265625, -0.52569580078125, -0.4669189453125, -0.40814208984375, -0.349365234375, -0.29058837890625, -0.2318115234375, -0.17303466796875, -0.1142578125, -0.05548095703125, 0.0032958984375, 0.06207275390625, 0.120849609375, 0.17962646484375, 0.2384033203125, 0.29718017578125, 0.35595703125, 0.41473388671875, 0.4735107421875, 0.53228759765625, 0.591064453125, 0.64984130859375, 0.7086181640625, 0.76739501953125, 0.826171875, 0.88494873046875, 0.9437255859375, 1.00250244140625, 1.061279296875, 1.12005615234375, 1.1788330078125, 1.23760986328125, 1.29638671875, 1.35516357421875, 1.4139404296875, 1.47271728515625, 1.531494140625, 1.59027099609375, 1.6490478515625, 1.70782470703125, 1.7666015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 8.0, 9.0, 20.0, 18.0, 20.0, 18.0, 29.0, 28.0, 39.0, 56.0, 53.0, 68.0, 71.0, 72.0, 71.0, 77.0, 60.0, 46.0, 42.0, 29.0, 16.0, 22.0, 19.0, 17.0, 11.0, 10.0, 8.0, 11.0, 7.0, 2.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.55810546875, -0.5419998168945312, -0.5258941650390625, -0.5097885131835938, -0.493682861328125, -0.47757720947265625, -0.4614715576171875, -0.44536590576171875, -0.42926025390625, -0.41315460205078125, -0.3970489501953125, -0.38094329833984375, -0.364837646484375, -0.34873199462890625, -0.3326263427734375, -0.31652069091796875, -0.3004150390625, -0.28430938720703125, -0.2682037353515625, -0.25209808349609375, -0.235992431640625, -0.21988677978515625, -0.2037811279296875, -0.18767547607421875, -0.17156982421875, -0.15546417236328125, -0.1393585205078125, -0.12325286865234375, -0.107147216796875, -0.09104156494140625, -0.0749359130859375, -0.05883026123046875, -0.042724609375, -0.02661895751953125, -0.0105133056640625, 0.00559234619140625, 0.021697998046875, 0.03780364990234375, 0.0539093017578125, 0.07001495361328125, 0.08612060546875, 0.10222625732421875, 0.1183319091796875, 0.13443756103515625, 0.150543212890625, 0.16664886474609375, 0.1827545166015625, 0.19886016845703125, 0.2149658203125, 0.23107147216796875, 0.2471771240234375, 0.26328277587890625, 0.279388427734375, 0.29549407958984375, 0.3115997314453125, 0.32770538330078125, 0.34381103515625, 0.35991668701171875, 0.3760223388671875, 0.39212799072265625, 0.408233642578125, 0.42433929443359375, 0.4404449462890625, 0.45655059814453125, 0.47265625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 14.0, 10.0, 13.0, 21.0, 27.0, 48.0, 35.0, 67.0, 86.0, 89.0, 89.0, 104.0, 80.0, 64.0, 60.0, 27.0, 30.0, 18.0, 23.0, 12.0, 9.0, 9.0, 7.0, 1.0, 8.0, 3.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.81728744506836, -19.21150779724121, -18.605728149414062, -17.999950408935547, -17.3941707611084, -16.78839111328125, -16.182613372802734, -15.576833724975586, -14.971054077148438, -14.365274429321289, -13.759495735168457, -13.153717041015625, -12.547937393188477, -11.942157745361328, -11.336379051208496, -10.730600357055664, -10.124820709228516, -9.519041061401367, -8.913262367248535, -8.307483673095703, -7.701704025268555, -7.0959248542785645, -6.490145683288574, -5.884366512298584, -5.278587341308594, -4.6728081703186035, -4.067028999328613, -3.461249828338623, -2.855470657348633, -2.2496914863586426, -1.6439123153686523, -1.038133144378662, -0.4323558807373047, 0.17342329025268555, 0.7792024612426758, 1.384981632232666, 1.9907608032226562, 2.5965399742126465, 3.2023191452026367, 3.808098316192627, 4.413877487182617, 5.019656658172607, 5.625435829162598, 6.231215000152588, 6.836994171142578, 7.442773342132568, 8.048552513122559, 8.65433120727539, 9.260110855102539, 9.865890502929688, 10.47166919708252, 11.077447891235352, 11.6832275390625, 12.289007186889648, 12.89478588104248, 13.500564575195312, 14.106344223022461, 14.71212387084961, 15.317902565002441, 15.923681259155273, 16.529460906982422, 17.13524055480957, 17.74102020263672, 18.346797943115234, 18.952577590942383]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 9.0, 7.0, 4.0, 9.0, 13.0, 7.0, 17.0, 22.0, 12.0, 22.0, 26.0, 26.0, 32.0, 24.0, 29.0, 42.0, 36.0, 41.0, 43.0, 36.0, 47.0, 39.0, 35.0, 27.0, 28.0, 38.0, 29.0, 28.0, 29.0, 26.0, 29.0, 25.0, 25.0, 22.0, 25.0, 15.0, 12.0, 9.0, 13.0, 10.0, 11.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.936172485351562, -11.564640998840332, -11.193109512329102, -10.821577072143555, -10.450045585632324, -10.078514099121094, -9.706981658935547, -9.335450172424316, -8.963918685913086, -8.592387199401855, -8.220855712890625, -7.849323272705078, -7.477791786193848, -7.106260299682617, -6.7347283363342285, -6.36319637298584, -5.991664886474609, -5.620133399963379, -5.24860143661499, -4.877069473266602, -4.505537986755371, -4.134006500244141, -3.762474536895752, -3.3909428119659424, -3.019411087036133, -2.6478793621063232, -2.2763476371765137, -1.904815912246704, -1.5332841873168945, -1.161752462387085, -0.7902207374572754, -0.4186890125274658, -0.047158241271972656, 0.3243734836578369, 0.6959052085876465, 1.067436933517456, 1.4389686584472656, 1.8105003833770752, 2.1820321083068848, 2.5535638332366943, 2.925095558166504, 3.2966272830963135, 3.668159008026123, 4.039690971374512, 4.411222457885742, 4.782753944396973, 5.154285907745361, 5.52581787109375, 5.8973493576049805, 6.268880844116211, 6.6404128074646, 7.011944770812988, 7.383476257324219, 7.755007743835449, 8.12653923034668, 8.498071670532227, 8.869603157043457, 9.241134643554688, 9.612667083740234, 9.984198570251465, 10.355730056762695, 10.727261543273926, 11.098793029785156, 11.470325469970703, 11.841856956481934]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 7.0, 12.0, 8.0, 9.0, 24.0, 40.0, 39.0, 74.0, 91.0, 143.0, 200.0, 258.0, 373.0, 580.0, 765.0, 1155.0, 1653.0, 2268.0, 3437.0, 4943.0, 7342.0, 11011.0, 16392.0, 24643.0, 39963.0, 65697.0, 114703.0, 272877.0, 908898.0, 1522075.0, 704740.0, 215140.0, 101814.0, 60645.0, 37837.0, 24315.0, 16004.0, 10786.0, 7198.0, 4962.0, 3434.0, 2330.0, 1638.0, 1202.0, 758.0, 573.0, 383.0, 254.0, 197.0, 132.0, 95.0, 62.0, 43.0, 30.0, 12.0, 10.0, 12.0, 2.0, 10.0], "bins": [-19.265625, -18.70556640625, -18.1455078125, -17.58544921875, -17.025390625, -16.46533203125, -15.9052734375, -15.34521484375, -14.78515625, -14.22509765625, -13.6650390625, -13.10498046875, -12.544921875, -11.98486328125, -11.4248046875, -10.86474609375, -10.3046875, -9.74462890625, -9.1845703125, -8.62451171875, -8.064453125, -7.50439453125, -6.9443359375, -6.38427734375, -5.82421875, -5.26416015625, -4.7041015625, -4.14404296875, -3.583984375, -3.02392578125, -2.4638671875, -1.90380859375, -1.34375, -0.78369140625, -0.2236328125, 0.33642578125, 0.896484375, 1.45654296875, 2.0166015625, 2.57666015625, 3.13671875, 3.69677734375, 4.2568359375, 4.81689453125, 5.376953125, 5.93701171875, 6.4970703125, 7.05712890625, 7.6171875, 8.17724609375, 8.7373046875, 9.29736328125, 9.857421875, 10.41748046875, 10.9775390625, 11.53759765625, 12.09765625, 12.65771484375, 13.2177734375, 13.77783203125, 14.337890625, 14.89794921875, 15.4580078125, 16.01806640625, 16.578125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 8.0, 6.0, 8.0, 9.0, 9.0, 12.0, 19.0, 21.0, 17.0, 20.0, 25.0, 28.0, 22.0, 32.0, 37.0, 36.0, 49.0, 42.0, 39.0, 26.0, 46.0, 35.0, 33.0, 29.0, 35.0, 29.0, 26.0, 32.0, 33.0, 25.0, 27.0, 27.0, 31.0, 17.0, 14.0, 17.0, 10.0, 16.0, 10.0, 10.0, 6.0, 7.0, 4.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-10.4609375, -10.1514892578125, -9.842041015625, -9.5325927734375, -9.22314453125, -8.9136962890625, -8.604248046875, -8.2947998046875, -7.9853515625, -7.6759033203125, -7.366455078125, -7.0570068359375, -6.74755859375, -6.4381103515625, -6.128662109375, -5.8192138671875, -5.509765625, -5.2003173828125, -4.890869140625, -4.5814208984375, -4.27197265625, -3.9625244140625, -3.653076171875, -3.3436279296875, -3.0341796875, -2.7247314453125, -2.415283203125, -2.1058349609375, -1.79638671875, -1.4869384765625, -1.177490234375, -0.8680419921875, -0.55859375, -0.2491455078125, 0.060302734375, 0.3697509765625, 0.67919921875, 0.9886474609375, 1.298095703125, 1.6075439453125, 1.9169921875, 2.2264404296875, 2.535888671875, 2.8453369140625, 3.15478515625, 3.4642333984375, 3.773681640625, 4.0831298828125, 4.392578125, 4.7020263671875, 5.011474609375, 5.3209228515625, 5.63037109375, 5.9398193359375, 6.249267578125, 6.5587158203125, 6.8681640625, 7.1776123046875, 7.487060546875, 7.7965087890625, 8.10595703125, 8.4154052734375, 8.724853515625, 9.0343017578125, 9.34375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 5.0, 13.0, 15.0, 23.0, 43.0, 55.0, 82.0, 132.0, 167.0, 226.0, 382.0, 638.0, 1001.0, 1572.0, 2699.0, 4470.0, 7494.0, 13132.0, 23087.0, 41520.0, 80082.0, 165720.0, 392506.0, 1222417.0, 1424848.0, 439397.0, 181997.0, 86626.0, 45433.0, 24555.0, 13690.0, 7994.0, 4700.0, 2825.0, 1754.0, 1037.0, 659.0, 423.0, 279.0, 185.0, 138.0, 82.0, 63.0, 38.0, 24.0, 15.0, 14.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.328125, -20.662841796875, -19.99755859375, -19.332275390625, -18.6669921875, -18.001708984375, -17.33642578125, -16.671142578125, -16.005859375, -15.340576171875, -14.67529296875, -14.010009765625, -13.3447265625, -12.679443359375, -12.01416015625, -11.348876953125, -10.68359375, -10.018310546875, -9.35302734375, -8.687744140625, -8.0224609375, -7.357177734375, -6.69189453125, -6.026611328125, -5.361328125, -4.696044921875, -4.03076171875, -3.365478515625, -2.7001953125, -2.034912109375, -1.36962890625, -0.704345703125, -0.0390625, 0.626220703125, 1.29150390625, 1.956787109375, 2.6220703125, 3.287353515625, 3.95263671875, 4.617919921875, 5.283203125, 5.948486328125, 6.61376953125, 7.279052734375, 7.9443359375, 8.609619140625, 9.27490234375, 9.940185546875, 10.60546875, 11.270751953125, 11.93603515625, 12.601318359375, 13.2666015625, 13.931884765625, 14.59716796875, 15.262451171875, 15.927734375, 16.593017578125, 17.25830078125, 17.923583984375, 18.5888671875, 19.254150390625, 19.91943359375, 20.584716796875, 21.25]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 12.0, 11.0, 15.0, 27.0, 26.0, 35.0, 43.0, 51.0, 66.0, 96.0, 102.0, 133.0, 178.0, 204.0, 267.0, 377.0, 523.0, 440.0, 333.0, 227.0, 185.0, 124.0, 124.0, 81.0, 83.0, 54.0, 53.0, 43.0, 38.0, 22.0, 23.0, 25.0, 12.0, 11.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.18359375, -6.96331787109375, -6.7430419921875, -6.52276611328125, -6.302490234375, -6.08221435546875, -5.8619384765625, -5.64166259765625, -5.42138671875, -5.20111083984375, -4.9808349609375, -4.76055908203125, -4.540283203125, -4.32000732421875, -4.0997314453125, -3.87945556640625, -3.6591796875, -3.43890380859375, -3.2186279296875, -2.99835205078125, -2.778076171875, -2.55780029296875, -2.3375244140625, -2.11724853515625, -1.89697265625, -1.67669677734375, -1.4564208984375, -1.23614501953125, -1.015869140625, -0.79559326171875, -0.5753173828125, -0.35504150390625, -0.134765625, 0.08551025390625, 0.3057861328125, 0.52606201171875, 0.746337890625, 0.96661376953125, 1.1868896484375, 1.40716552734375, 1.62744140625, 1.84771728515625, 2.0679931640625, 2.28826904296875, 2.508544921875, 2.72882080078125, 2.9490966796875, 3.16937255859375, 3.3896484375, 3.60992431640625, 3.8302001953125, 4.05047607421875, 4.270751953125, 4.49102783203125, 4.7113037109375, 4.93157958984375, 5.15185546875, 5.37213134765625, 5.5924072265625, 5.81268310546875, 6.032958984375, 6.25323486328125, 6.4735107421875, 6.69378662109375, 6.9140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 5.0, 8.0, 10.0, 10.0, 9.0, 22.0, 23.0, 26.0, 31.0, 46.0, 65.0, 71.0, 72.0, 86.0, 74.0, 82.0, 70.0, 63.0, 33.0, 29.0, 25.0, 18.0, 23.0, 14.0, 10.0, 10.0, 10.0, 8.0, 8.0, 4.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.028542518615723, -14.546941757202148, -14.06534194946289, -13.583741188049316, -13.102141380310059, -12.620540618896484, -12.138940811157227, -11.657340049743652, -11.175740242004395, -10.69413948059082, -10.212539672851562, -9.730938911437988, -9.24933910369873, -8.767738342285156, -8.286138534545898, -7.804537773132324, -7.322937488555908, -6.841337203979492, -6.359736919403076, -5.87813663482666, -5.396536350250244, -4.914936065673828, -4.433335304260254, -3.951735258102417, -3.470134973526001, -2.988534688949585, -2.506934404373169, -2.025333881378174, -1.5437337160110474, -1.0621333122253418, -0.5805330276489258, -0.09893274307250977, 0.38266754150390625, 0.8642678260803223, 1.3458681106567383, 1.8274685144424438, 2.3090686798095703, 2.7906692028045654, 3.2722694873809814, 3.7538697719573975, 4.235469818115234, 4.71707010269165, 5.198670387268066, 5.680270671844482, 6.161870956420898, 6.643471717834473, 7.1250715255737305, 7.606672286987305, 8.088272094726562, 8.569872856140137, 9.051472663879395, 9.533073425292969, 10.014673233032227, 10.4962739944458, 10.977873802185059, 11.459474563598633, 11.941075325012207, 12.422676086425781, 12.904275894165039, 13.385876655578613, 13.867476463317871, 14.349077224731445, 14.830677032470703, 15.312277793884277, 15.793877601623535]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 8.0, 17.0, 16.0, 15.0, 21.0, 13.0, 25.0, 24.0, 29.0, 33.0, 26.0, 39.0, 39.0, 37.0, 38.0, 50.0, 40.0, 38.0, 42.0, 38.0, 35.0, 44.0, 33.0, 33.0, 25.0, 32.0, 31.0, 21.0, 21.0, 18.0, 21.0, 14.0, 14.0, 9.0, 7.0, 9.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.370262145996094, -11.004057884216309, -10.63785457611084, -10.271650314331055, -9.905447006225586, -9.5392427444458, -9.173038482666016, -8.806835174560547, -8.440630912780762, -8.074426651000977, -7.708223342895508, -7.342019081115723, -6.975815296173096, -6.609611511230469, -6.243407249450684, -5.877203464508057, -5.51099967956543, -5.144795894622803, -4.778592109680176, -4.412387847900391, -4.046184062957764, -3.6799802780151367, -3.3137762546539307, -2.9475722312927246, -2.5813684463500977, -2.2151646614074707, -1.8489606380462646, -1.4827567338943481, -1.1165528297424316, -0.7503489255905151, -0.38414502143859863, -0.017940998077392578, 0.34826183319091797, 0.7144657373428345, 1.080669641494751, 1.4468735456466675, 1.813077449798584, 2.179281234741211, 2.545485258102417, 2.911689281463623, 3.27789306640625, 3.644096851348877, 4.010300636291504, 4.376504898071289, 4.742708683013916, 5.108912467956543, 5.475116729736328, 5.841320514678955, 6.207524299621582, 6.573728084564209, 6.939931869506836, 7.306136131286621, 7.672339916229248, 8.038543701171875, 8.40474796295166, 8.770952224731445, 9.137155532836914, 9.5033597946167, 9.869563102722168, 10.235767364501953, 10.601970672607422, 10.968174934387207, 11.334379196166992, 11.700582504272461, 12.066786766052246]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 8.0, 14.0, 6.0, 26.0, 41.0, 43.0, 84.0, 110.0, 171.0, 266.0, 464.0, 666.0, 1048.0, 1720.0, 2712.0, 4333.0, 7028.0, 11548.0, 19385.0, 32983.0, 58264.0, 110766.0, 280791.0, 268103.0, 109122.0, 57268.0, 32577.0, 19181.0, 11366.0, 7014.0, 4199.0, 2659.0, 1631.0, 1047.0, 675.0, 436.0, 290.0, 174.0, 136.0, 68.0, 53.0, 31.0, 17.0, 11.0, 11.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.94921875, -3.829498291015625, -3.70977783203125, -3.590057373046875, -3.4703369140625, -3.350616455078125, -3.23089599609375, -3.111175537109375, -2.991455078125, -2.871734619140625, -2.75201416015625, -2.632293701171875, -2.5125732421875, -2.392852783203125, -2.27313232421875, -2.153411865234375, -2.03369140625, -1.913970947265625, -1.79425048828125, -1.674530029296875, -1.5548095703125, -1.435089111328125, -1.31536865234375, -1.195648193359375, -1.075927734375, -0.956207275390625, -0.83648681640625, -0.716766357421875, -0.5970458984375, -0.477325439453125, -0.35760498046875, -0.237884521484375, -0.1181640625, 0.001556396484375, 0.12127685546875, 0.240997314453125, 0.3607177734375, 0.480438232421875, 0.60015869140625, 0.719879150390625, 0.839599609375, 0.959320068359375, 1.07904052734375, 1.198760986328125, 1.3184814453125, 1.438201904296875, 1.55792236328125, 1.677642822265625, 1.79736328125, 1.917083740234375, 2.03680419921875, 2.156524658203125, 2.2762451171875, 2.395965576171875, 2.51568603515625, 2.635406494140625, 2.755126953125, 2.874847412109375, 2.99456787109375, 3.114288330078125, 3.2340087890625, 3.353729248046875, 3.47344970703125, 3.593170166015625, 3.712890625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 10.0, 10.0, 11.0, 10.0, 13.0, 14.0, 23.0, 18.0, 26.0, 29.0, 28.0, 27.0, 33.0, 30.0, 26.0, 54.0, 40.0, 45.0, 40.0, 36.0, 29.0, 44.0, 40.0, 36.0, 47.0, 32.0, 24.0, 27.0, 22.0, 25.0, 20.0, 24.0, 13.0, 14.0, 19.0, 11.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.9609375, -11.5986328125, -11.236328125, -10.8740234375, -10.51171875, -10.1494140625, -9.787109375, -9.4248046875, -9.0625, -8.7001953125, -8.337890625, -7.9755859375, -7.61328125, -7.2509765625, -6.888671875, -6.5263671875, -6.1640625, -5.8017578125, -5.439453125, -5.0771484375, -4.71484375, -4.3525390625, -3.990234375, -3.6279296875, -3.265625, -2.9033203125, -2.541015625, -2.1787109375, -1.81640625, -1.4541015625, -1.091796875, -0.7294921875, -0.3671875, -0.0048828125, 0.357421875, 0.7197265625, 1.08203125, 1.4443359375, 1.806640625, 2.1689453125, 2.53125, 2.8935546875, 3.255859375, 3.6181640625, 3.98046875, 4.3427734375, 4.705078125, 5.0673828125, 5.4296875, 5.7919921875, 6.154296875, 6.5166015625, 6.87890625, 7.2412109375, 7.603515625, 7.9658203125, 8.328125, 8.6904296875, 9.052734375, 9.4150390625, 9.77734375, 10.1396484375, 10.501953125, 10.8642578125, 11.2265625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 12.0, 12.0, 30.0, 29.0, 42.0, 72.0, 74.0, 130.0, 198.0, 293.0, 410.0, 591.0, 852.0, 1202.0, 1822.0, 2647.0, 3835.0, 5972.0, 9204.0, 14240.0, 22348.0, 35928.0, 59283.0, 106867.0, 268423.0, 253169.0, 104739.0, 58443.0, 34856.0, 22063.0, 14004.0, 9066.0, 5763.0, 3816.0, 2554.0, 1755.0, 1142.0, 802.0, 594.0, 376.0, 292.0, 179.0, 134.0, 71.0, 77.0, 48.0, 27.0, 23.0, 17.0, 9.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.259765625, -3.1578369140625, -3.055908203125, -2.9539794921875, -2.85205078125, -2.7501220703125, -2.648193359375, -2.5462646484375, -2.4443359375, -2.3424072265625, -2.240478515625, -2.1385498046875, -2.03662109375, -1.9346923828125, -1.832763671875, -1.7308349609375, -1.62890625, -1.5269775390625, -1.425048828125, -1.3231201171875, -1.22119140625, -1.1192626953125, -1.017333984375, -0.9154052734375, -0.8134765625, -0.7115478515625, -0.609619140625, -0.5076904296875, -0.40576171875, -0.3038330078125, -0.201904296875, -0.0999755859375, 0.001953125, 0.1038818359375, 0.205810546875, 0.3077392578125, 0.40966796875, 0.5115966796875, 0.613525390625, 0.7154541015625, 0.8173828125, 0.9193115234375, 1.021240234375, 1.1231689453125, 1.22509765625, 1.3270263671875, 1.428955078125, 1.5308837890625, 1.6328125, 1.7347412109375, 1.836669921875, 1.9385986328125, 2.04052734375, 2.1424560546875, 2.244384765625, 2.3463134765625, 2.4482421875, 2.5501708984375, 2.652099609375, 2.7540283203125, 2.85595703125, 2.9578857421875, 3.059814453125, 3.1617431640625, 3.263671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 9.0, 16.0, 9.0, 17.0, 20.0, 20.0, 17.0, 22.0, 21.0, 31.0, 43.0, 27.0, 32.0, 44.0, 41.0, 40.0, 42.0, 38.0, 42.0, 48.0, 43.0, 33.0, 38.0, 34.0, 32.0, 23.0, 32.0, 29.0, 20.0, 20.0, 17.0, 13.0, 11.0, 14.0, 10.0, 9.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.625, -6.390625, -6.15625, -5.921875, -5.6875, -5.453125, -5.21875, -4.984375, -4.75, -4.515625, -4.28125, -4.046875, -3.8125, -3.578125, -3.34375, -3.109375, -2.875, -2.640625, -2.40625, -2.171875, -1.9375, -1.703125, -1.46875, -1.234375, -1.0, -0.765625, -0.53125, -0.296875, -0.0625, 0.171875, 0.40625, 0.640625, 0.875, 1.109375, 1.34375, 1.578125, 1.8125, 2.046875, 2.28125, 2.515625, 2.75, 2.984375, 3.21875, 3.453125, 3.6875, 3.921875, 4.15625, 4.390625, 4.625, 4.859375, 5.09375, 5.328125, 5.5625, 5.796875, 6.03125, 6.265625, 6.5, 6.734375, 6.96875, 7.203125, 7.4375, 7.671875, 7.90625, 8.140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 8.0, 6.0, 16.0, 19.0, 24.0, 34.0, 48.0, 59.0, 90.0, 104.0, 152.0, 216.0, 267.0, 381.0, 571.0, 860.0, 1232.0, 1764.0, 2582.0, 4124.0, 6755.0, 11934.0, 22872.0, 49726.0, 132396.0, 409220.0, 248854.0, 79583.0, 33264.0, 16747.0, 9032.0, 5312.0, 3225.0, 2129.0, 1419.0, 997.0, 713.0, 478.0, 372.0, 246.0, 186.0, 144.0, 98.0, 74.0, 74.0, 31.0, 32.0, 23.0, 20.0, 18.0, 5.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00804901123046875, -0.007778525352478027, -0.007508039474487305, -0.007237553596496582, -0.006967067718505859, -0.006696581840515137, -0.006426095962524414, -0.006155610084533691, -0.005885124206542969, -0.005614638328552246, -0.0053441524505615234, -0.005073666572570801, -0.004803180694580078, -0.0045326948165893555, -0.004262208938598633, -0.00399172306060791, -0.0037212371826171875, -0.003450751304626465, -0.003180265426635742, -0.0029097795486450195, -0.002639293670654297, -0.0023688077926635742, -0.0020983219146728516, -0.001827836036682129, -0.0015573501586914062, -0.0012868642807006836, -0.001016378402709961, -0.0007458925247192383, -0.0004754066467285156, -0.00020492076873779297, 6.556510925292969e-05, 0.00033605098724365234, 0.000606536865234375, 0.0008770227432250977, 0.0011475086212158203, 0.001417994499206543, 0.0016884803771972656, 0.0019589662551879883, 0.002229452133178711, 0.0024999380111694336, 0.0027704238891601562, 0.003040909767150879, 0.0033113956451416016, 0.0035818815231323242, 0.003852367401123047, 0.0041228532791137695, 0.004393339157104492, 0.004663825035095215, 0.0049343109130859375, 0.00520479679107666, 0.005475282669067383, 0.0057457685470581055, 0.006016254425048828, 0.006286740303039551, 0.0065572261810302734, 0.006827712059020996, 0.007098197937011719, 0.007368683815002441, 0.007639169692993164, 0.007909655570983887, 0.00818014144897461, 0.008450627326965332, 0.008721113204956055, 0.008991599082946777, 0.0092620849609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 9.0, 4.0, 6.0, 14.0, 16.0, 13.0, 16.0, 49.0, 44.0, 70.0, 82.0, 85.0, 107.0, 103.0, 89.0, 65.0, 63.0, 38.0, 34.0, 26.0, 11.0, 11.0, 11.0, 5.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.408671081066132e-06, -7.1283429861068726e-06, -6.8480148911476135e-06, -6.5676867961883545e-06, -6.2873587012290955e-06, -6.0070306062698364e-06, -5.726702511310577e-06, -5.446374416351318e-06, -5.166046321392059e-06, -4.8857182264328e-06, -4.605390131473541e-06, -4.325062036514282e-06, -4.044733941555023e-06, -3.764405846595764e-06, -3.484077751636505e-06, -3.203749656677246e-06, -2.923421561717987e-06, -2.643093466758728e-06, -2.362765371799469e-06, -2.08243727684021e-06, -1.802109181880951e-06, -1.521781086921692e-06, -1.2414529919624329e-06, -9.611248970031738e-07, -6.807968020439148e-07, -4.0046870708465576e-07, -1.2014061212539673e-07, 1.601874828338623e-07, 4.4051557779312134e-07, 7.208436727523804e-07, 1.0011717677116394e-06, 1.2814998626708984e-06, 1.5618279576301575e-06, 1.8421560525894165e-06, 2.1224841475486755e-06, 2.4028122425079346e-06, 2.6831403374671936e-06, 2.9634684324264526e-06, 3.2437965273857117e-06, 3.5241246223449707e-06, 3.8044527173042297e-06, 4.084780812263489e-06, 4.365108907222748e-06, 4.645437002182007e-06, 4.925765097141266e-06, 5.206093192100525e-06, 5.486421287059784e-06, 5.766749382019043e-06, 6.047077476978302e-06, 6.327405571937561e-06, 6.60773366689682e-06, 6.888061761856079e-06, 7.168389856815338e-06, 7.448717951774597e-06, 7.729046046733856e-06, 8.009374141693115e-06, 8.289702236652374e-06, 8.570030331611633e-06, 8.850358426570892e-06, 9.130686521530151e-06, 9.41101461648941e-06, 9.69134271144867e-06, 9.971670806407928e-06, 1.0251998901367188e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 10.0, 5.0, 20.0, 14.0, 24.0, 50.0, 67.0, 93.0, 110.0, 170.0, 238.0, 373.0, 537.0, 891.0, 1339.0, 2040.0, 3338.0, 5466.0, 9279.0, 17094.0, 32900.0, 71558.0, 186968.0, 404956.0, 172695.0, 67420.0, 31205.0, 16307.0, 8976.0, 5467.0, 3150.0, 1996.0, 1353.0, 813.0, 526.0, 382.0, 207.0, 171.0, 106.0, 66.0, 52.0, 48.0, 23.0, 15.0, 14.0, 10.0, 9.0, 6.0, 2.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.009124755859375, -0.008859992027282715, -0.00859522819519043, -0.008330464363098145, -0.00806570053100586, -0.007800936698913574, -0.007536172866821289, -0.007271409034729004, -0.007006645202636719, -0.006741881370544434, -0.0064771175384521484, -0.006212353706359863, -0.005947589874267578, -0.005682826042175293, -0.005418062210083008, -0.005153298377990723, -0.0048885345458984375, -0.004623770713806152, -0.004359006881713867, -0.004094243049621582, -0.003829479217529297, -0.0035647153854370117, -0.0032999515533447266, -0.0030351877212524414, -0.0027704238891601562, -0.002505660057067871, -0.002240896224975586, -0.0019761323928833008, -0.0017113685607910156, -0.0014466047286987305, -0.0011818408966064453, -0.0009170770645141602, -0.000652313232421875, -0.00038754940032958984, -0.0001227855682373047, 0.00014197826385498047, 0.0004067420959472656, 0.0006715059280395508, 0.0009362697601318359, 0.001201033592224121, 0.0014657974243164062, 0.0017305612564086914, 0.0019953250885009766, 0.0022600889205932617, 0.002524852752685547, 0.002789616584777832, 0.003054380416870117, 0.0033191442489624023, 0.0035839080810546875, 0.0038486719131469727, 0.004113435745239258, 0.004378199577331543, 0.004642963409423828, 0.004907727241516113, 0.0051724910736083984, 0.005437254905700684, 0.005702018737792969, 0.005966782569885254, 0.006231546401977539, 0.006496310234069824, 0.006761074066162109, 0.0070258378982543945, 0.00729060173034668, 0.007555365562438965, 0.00782012939453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 6.0, 8.0, 10.0, 17.0, 14.0, 23.0, 31.0, 42.0, 27.0, 60.0, 81.0, 80.0, 81.0, 95.0, 68.0, 64.0, 55.0, 47.0, 38.0, 23.0, 26.0, 17.0, 16.0, 14.0, 12.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0030651092529296875, -0.0029747188091278076, -0.0028843283653259277, -0.002793937921524048, -0.002703547477722168, -0.002613157033920288, -0.002522766590118408, -0.0024323761463165283, -0.0023419857025146484, -0.0022515952587127686, -0.0021612048149108887, -0.002070814371109009, -0.001980423927307129, -0.001890033483505249, -0.0017996430397033691, -0.0017092525959014893, -0.0016188621520996094, -0.0015284717082977295, -0.0014380812644958496, -0.0013476908206939697, -0.0012573003768920898, -0.00116690993309021, -0.00107651948928833, -0.0009861290454864502, -0.0008957386016845703, -0.0008053481578826904, -0.0007149577140808105, -0.0006245672702789307, -0.0005341768264770508, -0.0004437863826751709, -0.000353395938873291, -0.00026300549507141113, -0.00017261505126953125, -8.222460746765137e-05, 8.165836334228516e-06, 9.85562801361084e-05, 0.00018894672393798828, 0.00027933716773986816, 0.00036972761154174805, 0.00046011805534362793, 0.0005505084991455078, 0.0006408989429473877, 0.0007312893867492676, 0.0008216798305511475, 0.0009120702743530273, 0.0010024607181549072, 0.0010928511619567871, 0.001183241605758667, 0.0012736320495605469, 0.0013640224933624268, 0.0014544129371643066, 0.0015448033809661865, 0.0016351938247680664, 0.0017255842685699463, 0.0018159747123718262, 0.001906365156173706, 0.001996755599975586, 0.002087146043777466, 0.0021775364875793457, 0.0022679269313812256, 0.0023583173751831055, 0.0024487078189849854, 0.0025390982627868652, 0.002629488706588745, 0.002719879150390625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 4.0, 14.0, 9.0, 7.0, 14.0, 24.0, 15.0, 38.0, 41.0, 45.0, 72.0, 67.0, 80.0, 76.0, 75.0, 77.0, 67.0, 45.0, 33.0, 33.0, 17.0, 23.0, 19.0, 19.0, 7.0, 10.0, 12.0, 7.0, 6.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.807815551757812, -14.343450546264648, -13.879085540771484, -13.41472053527832, -12.950355529785156, -12.485990524291992, -12.021625518798828, -11.557260513305664, -11.0928955078125, -10.628530502319336, -10.164165496826172, -9.699800491333008, -9.235435485839844, -8.77107048034668, -8.306705474853516, -7.842339992523193, -7.377974510192871, -6.913609504699707, -6.449244499206543, -5.984879493713379, -5.520514488220215, -5.056149482727051, -4.5917840003967285, -4.1274189949035645, -3.6630539894104004, -3.1986889839172363, -2.7343239784240723, -2.269958734512329, -1.805593729019165, -1.341228723526001, -0.8768634796142578, -0.41249847412109375, 0.05186653137207031, 0.5162315964698792, 0.980596661567688, 1.4449617862701416, 1.9093267917633057, 2.3736917972564697, 2.838057041168213, 3.302422046661377, 3.766787052154541, 4.231152057647705, 4.695517063140869, 5.159882545471191, 5.6242475509643555, 6.0886125564575195, 6.552977561950684, 7.017342567443848, 7.481707572937012, 7.946072578430176, 8.41043758392334, 8.874802589416504, 9.339167594909668, 9.803532600402832, 10.267898559570312, 10.732263565063477, 11.19662857055664, 11.660993576049805, 12.125358581542969, 12.589723587036133, 13.054088592529297, 13.518453598022461, 13.982818603515625, 14.447183609008789, 14.911548614501953]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 10.0, 8.0, 17.0, 16.0, 16.0, 21.0, 12.0, 26.0, 23.0, 29.0, 33.0, 26.0, 39.0, 40.0, 37.0, 37.0, 50.0, 39.0, 40.0, 40.0, 40.0, 36.0, 43.0, 33.0, 33.0, 25.0, 32.0, 31.0, 20.0, 21.0, 18.0, 21.0, 14.0, 13.0, 10.0, 8.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.3160982131958, -10.952568054199219, -10.589038848876953, -10.225508689880371, -9.861978530883789, -9.498449325561523, -9.134919166564941, -8.77138900756836, -8.407859802246094, -8.044329643249512, -7.680799961090088, -7.317270278930664, -6.953740119934082, -6.590210437774658, -6.226680755615234, -5.863150596618652, -5.49962043762207, -5.1360907554626465, -4.7725605964660645, -4.409030914306641, -4.045500755310059, -3.6819710731506348, -3.318441390991211, -2.954911470413208, -2.591381549835205, -2.227851629257202, -1.8643218278884888, -1.5007920265197754, -1.1372621059417725, -0.7737321853637695, -0.4102025032043457, -0.04667258262634277, 0.31685733795166016, 0.6803871989250183, 1.0439170598983765, 1.4074468612670898, 1.7709767818450928, 2.1345067024230957, 2.4980363845825195, 2.8615663051605225, 3.2250962257385254, 3.5886261463165283, 3.9521560668945312, 4.315685749053955, 4.679215431213379, 5.042745590209961, 5.406275272369385, 5.769804954528809, 6.133335113525391, 6.4968647956848145, 6.8603949546813965, 7.22392463684082, 7.587454795837402, 7.950984477996826, 8.31451416015625, 8.678044319152832, 9.041574478149414, 9.405104637145996, 9.768633842468262, 10.132164001464844, 10.495694160461426, 10.859224319458008, 11.222753524780273, 11.586283683776855, 11.949812889099121]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 6.0, 10.0, 19.0, 23.0, 39.0, 53.0, 73.0, 105.0, 153.0, 263.0, 398.0, 594.0, 837.0, 1249.0, 1877.0, 2902.0, 4340.0, 6742.0, 10502.0, 16265.0, 26322.0, 44224.0, 78201.0, 135782.0, 201792.0, 197688.0, 130503.0, 74570.0, 42712.0, 25352.0, 15779.0, 10122.0, 6581.0, 4275.0, 2794.0, 1729.0, 1191.0, 865.0, 523.0, 340.0, 239.0, 174.0, 110.0, 76.0, 63.0, 31.0, 21.0, 12.0, 14.0, 5.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.172607421875, -18.53271484375, -17.892822265625, -17.2529296875, -16.613037109375, -15.97314453125, -15.333251953125, -14.693359375, -14.053466796875, -13.41357421875, -12.773681640625, -12.1337890625, -11.493896484375, -10.85400390625, -10.214111328125, -9.57421875, -8.934326171875, -8.29443359375, -7.654541015625, -7.0146484375, -6.374755859375, -5.73486328125, -5.094970703125, -4.455078125, -3.815185546875, -3.17529296875, -2.535400390625, -1.8955078125, -1.255615234375, -0.61572265625, 0.024169921875, 0.6640625, 1.303955078125, 1.94384765625, 2.583740234375, 3.2236328125, 3.863525390625, 4.50341796875, 5.143310546875, 5.783203125, 6.423095703125, 7.06298828125, 7.702880859375, 8.3427734375, 8.982666015625, 9.62255859375, 10.262451171875, 10.90234375, 11.542236328125, 12.18212890625, 12.822021484375, 13.4619140625, 14.101806640625, 14.74169921875, 15.381591796875, 16.021484375, 16.661376953125, 17.30126953125, 17.941162109375, 18.5810546875, 19.220947265625, 19.86083984375, 20.500732421875, 21.140625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 12.0, 12.0, 22.0, 19.0, 20.0, 21.0, 19.0, 24.0, 26.0, 28.0, 44.0, 44.0, 34.0, 32.0, 47.0, 40.0, 38.0, 41.0, 41.0, 46.0, 41.0, 35.0, 27.0, 35.0, 27.0, 29.0, 25.0, 22.0, 20.0, 19.0, 17.0, 11.0, 16.0, 10.0, 7.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.5859375, -10.261962890625, -9.93798828125, -9.614013671875, -9.2900390625, -8.966064453125, -8.64208984375, -8.318115234375, -7.994140625, -7.670166015625, -7.34619140625, -7.022216796875, -6.6982421875, -6.374267578125, -6.05029296875, -5.726318359375, -5.40234375, -5.078369140625, -4.75439453125, -4.430419921875, -4.1064453125, -3.782470703125, -3.45849609375, -3.134521484375, -2.810546875, -2.486572265625, -2.16259765625, -1.838623046875, -1.5146484375, -1.190673828125, -0.86669921875, -0.542724609375, -0.21875, 0.105224609375, 0.42919921875, 0.753173828125, 1.0771484375, 1.401123046875, 1.72509765625, 2.049072265625, 2.373046875, 2.697021484375, 3.02099609375, 3.344970703125, 3.6689453125, 3.992919921875, 4.31689453125, 4.640869140625, 4.96484375, 5.288818359375, 5.61279296875, 5.936767578125, 6.2607421875, 6.584716796875, 6.90869140625, 7.232666015625, 7.556640625, 7.880615234375, 8.20458984375, 8.528564453125, 8.8525390625, 9.176513671875, 9.50048828125, 9.824462890625, 10.1484375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 14.0, 10.0, 22.0, 38.0, 49.0, 62.0, 107.0, 167.0, 274.0, 455.0, 733.0, 1213.0, 1929.0, 3199.0, 5351.0, 8949.0, 15352.0, 26182.0, 46817.0, 86140.0, 158361.0, 230706.0, 199723.0, 116664.0, 62944.0, 34634.0, 19676.0, 11615.0, 6843.0, 4017.0, 2468.0, 1485.0, 897.0, 543.0, 336.0, 202.0, 135.0, 90.0, 50.0, 39.0, 17.0, 14.0, 16.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.875, -20.173095703125, -19.47119140625, -18.769287109375, -18.0673828125, -17.365478515625, -16.66357421875, -15.961669921875, -15.259765625, -14.557861328125, -13.85595703125, -13.154052734375, -12.4521484375, -11.750244140625, -11.04833984375, -10.346435546875, -9.64453125, -8.942626953125, -8.24072265625, -7.538818359375, -6.8369140625, -6.135009765625, -5.43310546875, -4.731201171875, -4.029296875, -3.327392578125, -2.62548828125, -1.923583984375, -1.2216796875, -0.519775390625, 0.18212890625, 0.884033203125, 1.5859375, 2.287841796875, 2.98974609375, 3.691650390625, 4.3935546875, 5.095458984375, 5.79736328125, 6.499267578125, 7.201171875, 7.903076171875, 8.60498046875, 9.306884765625, 10.0087890625, 10.710693359375, 11.41259765625, 12.114501953125, 12.81640625, 13.518310546875, 14.22021484375, 14.922119140625, 15.6240234375, 16.325927734375, 17.02783203125, 17.729736328125, 18.431640625, 19.133544921875, 19.83544921875, 20.537353515625, 21.2392578125, 21.941162109375, 22.64306640625, 23.344970703125, 24.046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 22.0, 22.0, 20.0, 27.0, 24.0, 36.0, 38.0, 35.0, 34.0, 34.0, 35.0, 28.0, 42.0, 44.0, 43.0, 40.0, 43.0, 51.0, 36.0, 43.0, 37.0, 26.0, 26.0, 21.0, 26.0, 17.0, 28.0, 5.0, 11.0, 10.0, 14.0, 5.0, 3.0, 3.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.74603271484375, -5.5389404296875, -5.33184814453125, -5.124755859375, -4.91766357421875, -4.7105712890625, -4.50347900390625, -4.29638671875, -4.08929443359375, -3.8822021484375, -3.67510986328125, -3.468017578125, -3.26092529296875, -3.0538330078125, -2.84674072265625, -2.6396484375, -2.43255615234375, -2.2254638671875, -2.01837158203125, -1.811279296875, -1.60418701171875, -1.3970947265625, -1.19000244140625, -0.98291015625, -0.77581787109375, -0.5687255859375, -0.36163330078125, -0.154541015625, 0.05255126953125, 0.2596435546875, 0.46673583984375, 0.673828125, 0.88092041015625, 1.0880126953125, 1.29510498046875, 1.502197265625, 1.70928955078125, 1.9163818359375, 2.12347412109375, 2.33056640625, 2.53765869140625, 2.7447509765625, 2.95184326171875, 3.158935546875, 3.36602783203125, 3.5731201171875, 3.78021240234375, 3.9873046875, 4.19439697265625, 4.4014892578125, 4.60858154296875, 4.815673828125, 5.02276611328125, 5.2298583984375, 5.43695068359375, 5.64404296875, 5.85113525390625, 6.0582275390625, 6.26531982421875, 6.472412109375, 6.67950439453125, 6.8865966796875, 7.09368896484375, 7.30078125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 13.0, 5.0, 24.0, 21.0, 35.0, 53.0, 81.0, 101.0, 166.0, 248.0, 351.0, 470.0, 665.0, 1093.0, 1685.0, 2585.0, 4079.0, 6557.0, 10867.0, 18687.0, 35313.0, 75000.0, 203414.0, 379434.0, 168024.0, 64701.0, 31058.0, 17063.0, 9887.0, 5945.0, 3734.0, 2387.0, 1607.0, 999.0, 711.0, 485.0, 315.0, 207.0, 154.0, 93.0, 68.0, 45.0, 41.0, 22.0, 16.0, 17.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.6865234375, -1.63604736328125, -1.5855712890625, -1.53509521484375, -1.484619140625, -1.43414306640625, -1.3836669921875, -1.33319091796875, -1.28271484375, -1.23223876953125, -1.1817626953125, -1.13128662109375, -1.080810546875, -1.03033447265625, -0.9798583984375, -0.92938232421875, -0.87890625, -0.82843017578125, -0.7779541015625, -0.72747802734375, -0.677001953125, -0.62652587890625, -0.5760498046875, -0.52557373046875, -0.47509765625, -0.42462158203125, -0.3741455078125, -0.32366943359375, -0.273193359375, -0.22271728515625, -0.1722412109375, -0.12176513671875, -0.0712890625, -0.02081298828125, 0.0296630859375, 0.08013916015625, 0.130615234375, 0.18109130859375, 0.2315673828125, 0.28204345703125, 0.33251953125, 0.38299560546875, 0.4334716796875, 0.48394775390625, 0.534423828125, 0.58489990234375, 0.6353759765625, 0.68585205078125, 0.736328125, 0.78680419921875, 0.8372802734375, 0.88775634765625, 0.938232421875, 0.98870849609375, 1.0391845703125, 1.08966064453125, 1.14013671875, 1.19061279296875, 1.2410888671875, 1.29156494140625, 1.342041015625, 1.39251708984375, 1.4429931640625, 1.49346923828125, 1.5439453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 10.0, 8.0, 8.0, 11.0, 14.0, 24.0, 28.0, 34.0, 37.0, 56.0, 41.0, 76.0, 78.0, 74.0, 75.0, 74.0, 76.0, 67.0, 35.0, 35.0, 21.0, 26.0, 20.0, 10.0, 10.0, 9.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001289844512939453, -0.00012502819299697876, -0.00012107193470001221, -0.00011711567640304565, -0.0001131594181060791, -0.00010920315980911255, -0.000105246901512146, -0.00010129064321517944, -9.733438491821289e-05, -9.337812662124634e-05, -8.942186832427979e-05, -8.546561002731323e-05, -8.150935173034668e-05, -7.755309343338013e-05, -7.359683513641357e-05, -6.964057683944702e-05, -6.568431854248047e-05, -6.172806024551392e-05, -5.777180194854736e-05, -5.381554365158081e-05, -4.985928535461426e-05, -4.5903027057647705e-05, -4.194676876068115e-05, -3.79905104637146e-05, -3.403425216674805e-05, -3.0077993869781494e-05, -2.612173557281494e-05, -2.216547727584839e-05, -1.8209218978881836e-05, -1.4252960681915283e-05, -1.029670238494873e-05, -6.340444087982178e-06, -2.384185791015625e-06, 1.5720725059509277e-06, 5.5283308029174805e-06, 9.484589099884033e-06, 1.3440847396850586e-05, 1.739710569381714e-05, 2.135336399078369e-05, 2.5309622287750244e-05, 2.9265880584716797e-05, 3.322213888168335e-05, 3.71783971786499e-05, 4.1134655475616455e-05, 4.509091377258301e-05, 4.904717206954956e-05, 5.300343036651611e-05, 5.6959688663482666e-05, 6.091594696044922e-05, 6.487220525741577e-05, 6.882846355438232e-05, 7.278472185134888e-05, 7.674098014831543e-05, 8.069723844528198e-05, 8.465349674224854e-05, 8.860975503921509e-05, 9.256601333618164e-05, 9.65222716331482e-05, 0.00010047852993011475, 0.0001044347882270813, 0.00010839104652404785, 0.0001123473048210144, 0.00011630356311798096, 0.00012025982141494751, 0.00012421607971191406]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 5.0, 10.0, 14.0, 15.0, 24.0, 38.0, 53.0, 69.0, 121.0, 163.0, 224.0, 412.0, 590.0, 864.0, 1238.0, 1998.0, 2939.0, 4710.0, 7735.0, 13057.0, 22344.0, 41589.0, 85172.0, 217226.0, 353134.0, 149831.0, 64946.0, 33029.0, 18278.0, 10787.0, 6456.0, 3972.0, 2555.0, 1699.0, 1044.0, 720.0, 529.0, 333.0, 202.0, 134.0, 100.0, 58.0, 49.0, 35.0, 16.0, 13.0, 11.0, 9.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.662109375, -1.613677978515625, -1.56524658203125, -1.516815185546875, -1.4683837890625, -1.419952392578125, -1.37152099609375, -1.323089599609375, -1.274658203125, -1.226226806640625, -1.17779541015625, -1.129364013671875, -1.0809326171875, -1.032501220703125, -0.98406982421875, -0.935638427734375, -0.88720703125, -0.838775634765625, -0.79034423828125, -0.741912841796875, -0.6934814453125, -0.645050048828125, -0.59661865234375, -0.548187255859375, -0.499755859375, -0.451324462890625, -0.40289306640625, -0.354461669921875, -0.3060302734375, -0.257598876953125, -0.20916748046875, -0.160736083984375, -0.1123046875, -0.063873291015625, -0.01544189453125, 0.032989501953125, 0.0814208984375, 0.129852294921875, 0.17828369140625, 0.226715087890625, 0.275146484375, 0.323577880859375, 0.37200927734375, 0.420440673828125, 0.4688720703125, 0.517303466796875, 0.56573486328125, 0.614166259765625, 0.66259765625, 0.711029052734375, 0.75946044921875, 0.807891845703125, 0.8563232421875, 0.904754638671875, 0.95318603515625, 1.001617431640625, 1.050048828125, 1.098480224609375, 1.14691162109375, 1.195343017578125, 1.2437744140625, 1.292205810546875, 1.34063720703125, 1.389068603515625, 1.4375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 8.0, 8.0, 11.0, 12.0, 12.0, 10.0, 25.0, 29.0, 22.0, 38.0, 48.0, 41.0, 55.0, 54.0, 45.0, 69.0, 57.0, 57.0, 47.0, 44.0, 41.0, 33.0, 32.0, 24.0, 24.0, 24.0, 21.0, 22.0, 15.0, 8.0, 9.0, 5.0, 8.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3935546875, -0.37939453125, -0.365234375, -0.35107421875, -0.3369140625, -0.32275390625, -0.30859375, -0.29443359375, -0.2802734375, -0.26611328125, -0.251953125, -0.23779296875, -0.2236328125, -0.20947265625, -0.1953125, -0.18115234375, -0.1669921875, -0.15283203125, -0.138671875, -0.12451171875, -0.1103515625, -0.09619140625, -0.08203125, -0.06787109375, -0.0537109375, -0.03955078125, -0.025390625, -0.01123046875, 0.0029296875, 0.01708984375, 0.03125, 0.04541015625, 0.0595703125, 0.07373046875, 0.087890625, 0.10205078125, 0.1162109375, 0.13037109375, 0.14453125, 0.15869140625, 0.1728515625, 0.18701171875, 0.201171875, 0.21533203125, 0.2294921875, 0.24365234375, 0.2578125, 0.27197265625, 0.2861328125, 0.30029296875, 0.314453125, 0.32861328125, 0.3427734375, 0.35693359375, 0.37109375, 0.38525390625, 0.3994140625, 0.41357421875, 0.427734375, 0.44189453125, 0.4560546875, 0.47021484375, 0.484375, 0.49853515625, 0.5126953125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 7.0, 6.0, 7.0, 14.0, 20.0, 17.0, 22.0, 31.0, 27.0, 49.0, 51.0, 72.0, 64.0, 77.0, 91.0, 62.0, 76.0, 55.0, 37.0, 38.0, 28.0, 18.0, 23.0, 19.0, 12.0, 12.0, 5.0, 9.0, 10.0, 11.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.077596664428711, -12.632695198059082, -12.187792778015137, -11.742891311645508, -11.297989845275879, -10.85308837890625, -10.408185958862305, -9.963284492492676, -9.518383026123047, -9.073481559753418, -8.628579139709473, -8.183677673339844, -7.738776206970215, -7.293874263763428, -6.848972320556641, -6.404070854187012, -5.959168434143066, -5.514266490936279, -5.06936502456665, -4.624463081359863, -4.179561614990234, -3.7346596717834473, -3.28975772857666, -2.844856023788452, -2.399954319000244, -1.9550526142120361, -1.5101507902145386, -1.065248966217041, -0.620347261428833, -0.175445556640625, 0.2694563865661621, 0.7143580913543701, 1.1592607498168945, 1.6041624546051025, 2.0490641593933105, 2.4939661026000977, 2.9388678073883057, 3.3837695121765137, 3.828671455383301, 4.27357292175293, 4.718474864959717, 5.163376808166504, 5.608278274536133, 6.05318021774292, 6.498082160949707, 6.942983627319336, 7.387885570526123, 7.83278751373291, 8.277688980102539, 8.722590446472168, 9.167492866516113, 9.612394332885742, 10.057295799255371, 10.502197265625, 10.947099685668945, 11.392001152038574, 11.836902618408203, 12.281804084777832, 12.726706504821777, 13.171607971191406, 13.616509437561035, 14.061410903930664, 14.50631332397461, 14.951214790344238, 15.396117210388184]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 5.0, 12.0, 13.0, 15.0, 13.0, 18.0, 20.0, 26.0, 17.0, 23.0, 35.0, 32.0, 34.0, 38.0, 31.0, 35.0, 37.0, 32.0, 41.0, 30.0, 20.0, 39.0, 40.0, 24.0, 43.0, 23.0, 32.0, 33.0, 25.0, 26.0, 28.0, 17.0, 23.0, 16.0, 13.0, 15.0, 5.0, 12.0, 10.0, 8.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.616646766662598, -9.303574562072754, -8.99050235748291, -8.677431106567383, -8.364358901977539, -8.051286697387695, -7.738214492797852, -7.425142288208008, -7.112070560455322, -6.7989983558654785, -6.485926628112793, -6.172854423522949, -5.8597822189331055, -5.54671049118042, -5.233638286590576, -4.920566558837891, -4.607494354248047, -4.294422149658203, -3.9813504219055176, -3.668278217315674, -3.355206251144409, -3.0421342849731445, -2.729062080383301, -2.415990114212036, -2.1029181480407715, -1.7898461818695068, -1.4767740964889526, -1.1637020111083984, -0.8506300449371338, -0.5375580787658691, -0.22448599338531494, 0.08858609199523926, 0.4016571044921875, 0.7147291302680969, 1.0278011560440063, 1.3408732414245605, 1.6539452075958252, 1.9670171737670898, 2.2800893783569336, 2.5931613445281982, 2.906233310699463, 3.2193052768707275, 3.532377243041992, 3.845449447631836, 4.15852165222168, 4.471593379974365, 4.784665584564209, 5.0977373123168945, 5.410809516906738, 5.723881721496582, 6.036953449249268, 6.350025653839111, 6.663097381591797, 6.976169586181641, 7.289241790771484, 7.602313995361328, 7.915385723114014, 8.2284574508667, 8.541529655456543, 8.854601860046387, 9.16767406463623, 9.480745315551758, 9.793817520141602, 10.106889724731445, 10.419961929321289]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 12.0, 25.0, 30.0, 38.0, 68.0, 103.0, 133.0, 191.0, 274.0, 458.0, 670.0, 960.0, 1448.0, 2120.0, 3159.0, 4810.0, 7285.0, 11356.0, 17775.0, 28367.0, 45671.0, 77837.0, 142755.0, 374136.0, 1184751.0, 1392878.0, 499017.0, 169141.0, 87518.0, 51515.0, 31501.0, 19920.0, 12997.0, 8512.0, 5623.0, 3734.0, 2538.0, 1570.0, 1120.0, 770.0, 511.0, 317.0, 251.0, 153.0, 99.0, 51.0, 38.0, 23.0, 19.0, 11.0, 3.0, 6.0, 2.0, 2.0], "bins": [-17.828125, -17.3204345703125, -16.812744140625, -16.3050537109375, -15.79736328125, -15.2896728515625, -14.781982421875, -14.2742919921875, -13.7666015625, -13.2589111328125, -12.751220703125, -12.2435302734375, -11.73583984375, -11.2281494140625, -10.720458984375, -10.2127685546875, -9.705078125, -9.1973876953125, -8.689697265625, -8.1820068359375, -7.67431640625, -7.1666259765625, -6.658935546875, -6.1512451171875, -5.6435546875, -5.1358642578125, -4.628173828125, -4.1204833984375, -3.61279296875, -3.1051025390625, -2.597412109375, -2.0897216796875, -1.58203125, -1.0743408203125, -0.566650390625, -0.0589599609375, 0.44873046875, 0.9564208984375, 1.464111328125, 1.9718017578125, 2.4794921875, 2.9871826171875, 3.494873046875, 4.0025634765625, 4.51025390625, 5.0179443359375, 5.525634765625, 6.0333251953125, 6.541015625, 7.0487060546875, 7.556396484375, 8.0640869140625, 8.57177734375, 9.0794677734375, 9.587158203125, 10.0948486328125, 10.6025390625, 11.1102294921875, 11.617919921875, 12.1256103515625, 12.63330078125, 13.1409912109375, 13.648681640625, 14.1563720703125, 14.6640625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 11.0, 8.0, 11.0, 17.0, 12.0, 21.0, 22.0, 29.0, 24.0, 23.0, 23.0, 29.0, 36.0, 31.0, 41.0, 26.0, 42.0, 36.0, 41.0, 36.0, 29.0, 47.0, 38.0, 33.0, 36.0, 36.0, 23.0, 17.0, 23.0, 36.0, 29.0, 15.0, 14.0, 12.0, 17.0, 15.0, 9.0, 13.0, 4.0, 7.0, 4.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.9609375, -8.6893310546875, -8.417724609375, -8.1461181640625, -7.87451171875, -7.6029052734375, -7.331298828125, -7.0596923828125, -6.7880859375, -6.5164794921875, -6.244873046875, -5.9732666015625, -5.70166015625, -5.4300537109375, -5.158447265625, -4.8868408203125, -4.615234375, -4.3436279296875, -4.072021484375, -3.8004150390625, -3.52880859375, -3.2572021484375, -2.985595703125, -2.7139892578125, -2.4423828125, -2.1707763671875, -1.899169921875, -1.6275634765625, -1.35595703125, -1.0843505859375, -0.812744140625, -0.5411376953125, -0.26953125, 0.0020751953125, 0.273681640625, 0.5452880859375, 0.81689453125, 1.0885009765625, 1.360107421875, 1.6317138671875, 1.9033203125, 2.1749267578125, 2.446533203125, 2.7181396484375, 2.98974609375, 3.2613525390625, 3.532958984375, 3.8045654296875, 4.076171875, 4.3477783203125, 4.619384765625, 4.8909912109375, 5.16259765625, 5.4342041015625, 5.705810546875, 5.9774169921875, 6.2490234375, 6.5206298828125, 6.792236328125, 7.0638427734375, 7.33544921875, 7.6070556640625, 7.878662109375, 8.1502685546875, 8.421875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 7.0, 7.0, 7.0, 21.0, 15.0, 41.0, 48.0, 96.0, 123.0, 182.0, 282.0, 441.0, 630.0, 942.0, 1445.0, 2174.0, 3210.0, 4927.0, 7713.0, 12211.0, 19584.0, 31950.0, 54122.0, 94849.0, 177601.0, 359981.0, 852665.0, 1402148.0, 577250.0, 265163.0, 136125.0, 74693.0, 43079.0, 25804.0, 16010.0, 10092.0, 6464.0, 4158.0, 2616.0, 1790.0, 1162.0, 807.0, 553.0, 368.0, 242.0, 168.0, 129.0, 61.0, 54.0, 28.0, 24.0, 9.0, 13.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.390625, -12.9334716796875, -12.476318359375, -12.0191650390625, -11.56201171875, -11.1048583984375, -10.647705078125, -10.1905517578125, -9.7333984375, -9.2762451171875, -8.819091796875, -8.3619384765625, -7.90478515625, -7.4476318359375, -6.990478515625, -6.5333251953125, -6.076171875, -5.6190185546875, -5.161865234375, -4.7047119140625, -4.24755859375, -3.7904052734375, -3.333251953125, -2.8760986328125, -2.4189453125, -1.9617919921875, -1.504638671875, -1.0474853515625, -0.59033203125, -0.1331787109375, 0.323974609375, 0.7811279296875, 1.23828125, 1.6954345703125, 2.152587890625, 2.6097412109375, 3.06689453125, 3.5240478515625, 3.981201171875, 4.4383544921875, 4.8955078125, 5.3526611328125, 5.809814453125, 6.2669677734375, 6.72412109375, 7.1812744140625, 7.638427734375, 8.0955810546875, 8.552734375, 9.0098876953125, 9.467041015625, 9.9241943359375, 10.38134765625, 10.8385009765625, 11.295654296875, 11.7528076171875, 12.2099609375, 12.6671142578125, 13.124267578125, 13.5814208984375, 14.03857421875, 14.4957275390625, 14.952880859375, 15.4100341796875, 15.8671875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 7.0, 6.0, 8.0, 12.0, 10.0, 14.0, 18.0, 21.0, 27.0, 28.0, 20.0, 46.0, 52.0, 58.0, 72.0, 88.0, 94.0, 128.0, 176.0, 208.0, 225.0, 304.0, 359.0, 377.0, 319.0, 239.0, 183.0, 156.0, 130.0, 118.0, 96.0, 76.0, 60.0, 50.0, 59.0, 45.0, 38.0, 27.0, 22.0, 22.0, 11.0, 13.0, 9.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-5.00390625, -4.8529052734375, -4.701904296875, -4.5509033203125, -4.39990234375, -4.2489013671875, -4.097900390625, -3.9468994140625, -3.7958984375, -3.6448974609375, -3.493896484375, -3.3428955078125, -3.19189453125, -3.0408935546875, -2.889892578125, -2.7388916015625, -2.587890625, -2.4368896484375, -2.285888671875, -2.1348876953125, -1.98388671875, -1.8328857421875, -1.681884765625, -1.5308837890625, -1.3798828125, -1.2288818359375, -1.077880859375, -0.9268798828125, -0.77587890625, -0.6248779296875, -0.473876953125, -0.3228759765625, -0.171875, -0.0208740234375, 0.130126953125, 0.2811279296875, 0.43212890625, 0.5831298828125, 0.734130859375, 0.8851318359375, 1.0361328125, 1.1871337890625, 1.338134765625, 1.4891357421875, 1.64013671875, 1.7911376953125, 1.942138671875, 2.0931396484375, 2.244140625, 2.3951416015625, 2.546142578125, 2.6971435546875, 2.84814453125, 2.9991455078125, 3.150146484375, 3.3011474609375, 3.4521484375, 3.6031494140625, 3.754150390625, 3.9051513671875, 4.05615234375, 4.2071533203125, 4.358154296875, 4.5091552734375, 4.66015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 12.0, 14.0, 13.0, 26.0, 20.0, 31.0, 34.0, 49.0, 74.0, 83.0, 72.0, 100.0, 78.0, 72.0, 51.0, 46.0, 41.0, 35.0, 17.0, 25.0, 23.0, 11.0, 10.0, 11.0, 9.0, 9.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.018756866455078, -14.571734428405762, -14.124711990356445, -13.677689552307129, -13.230667114257812, -12.78364372253418, -12.336621284484863, -11.889598846435547, -11.44257640838623, -10.995553970336914, -10.548531532287598, -10.101509094238281, -9.654485702514648, -9.207464218139648, -8.760440826416016, -8.3134183883667, -7.866395950317383, -7.419373512268066, -6.97235107421875, -6.525328159332275, -6.078305721282959, -5.631283283233643, -5.184260368347168, -4.737237930297852, -4.290215492248535, -3.8431930541992188, -3.3961703777313232, -2.9491477012634277, -2.5021252632141113, -2.055102825164795, -1.6080801486968994, -1.161057472229004, -0.7140359878540039, -0.26701343059539795, 0.180009126663208, 0.627031683921814, 1.07405424118042, 1.5210766792297363, 1.9680993556976318, 2.4151220321655273, 2.8621444702148438, 3.30916690826416, 3.7561895847320557, 4.203212261199951, 4.650234699249268, 5.097257137298584, 5.544280052185059, 5.991302490234375, 6.438324928283691, 6.885347366333008, 7.332369804382324, 7.779392719268799, 8.226415634155273, 8.673437118530273, 9.120460510253906, 9.567482948303223, 10.014505386352539, 10.461527824401855, 10.908550262451172, 11.355572700500488, 11.802595138549805, 12.249618530273438, 12.696640968322754, 13.14366340637207, 13.590685844421387]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 10.0, 11.0, 14.0, 9.0, 13.0, 17.0, 26.0, 19.0, 27.0, 17.0, 32.0, 33.0, 31.0, 41.0, 36.0, 29.0, 33.0, 41.0, 31.0, 41.0, 36.0, 36.0, 32.0, 39.0, 30.0, 38.0, 32.0, 26.0, 21.0, 32.0, 25.0, 17.0, 15.0, 16.0, 14.0, 7.0, 13.0, 4.0, 9.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.870312690734863, -8.57164478302002, -8.272976875305176, -7.974308967590332, -7.675641059875488, -7.3769731521606445, -7.078305244445801, -6.779637336730957, -6.480969429016113, -6.1823015213012695, -5.883633613586426, -5.584965705871582, -5.286297798156738, -4.9876298904418945, -4.688961982727051, -4.390294075012207, -4.091626167297363, -3.7929582595825195, -3.494290351867676, -3.195622444152832, -2.8969545364379883, -2.5982866287231445, -2.299618721008301, -2.000950813293457, -1.7022829055786133, -1.4036149978637695, -1.1049470901489258, -0.806279182434082, -0.5076112747192383, -0.20894336700439453, 0.08972454071044922, 0.38839244842529297, 0.6870603561401367, 0.9857282638549805, 1.2843961715698242, 1.583064079284668, 1.8817319869995117, 2.1803998947143555, 2.479067802429199, 2.777735710144043, 3.0764036178588867, 3.3750715255737305, 3.673739433288574, 3.972407341003418, 4.271075248718262, 4.5697431564331055, 4.868411064147949, 5.167078971862793, 5.465746879577637, 5.7644147872924805, 6.063082695007324, 6.361750602722168, 6.660418510437012, 6.9590864181518555, 7.257754325866699, 7.556422233581543, 7.855090141296387, 8.15375804901123, 8.452425956726074, 8.751093864440918, 9.049761772155762, 9.348429679870605, 9.64709758758545, 9.945765495300293, 10.244433403015137]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 9.0, 6.0, 11.0, 16.0, 26.0, 51.0, 44.0, 57.0, 103.0, 171.0, 219.0, 303.0, 409.0, 644.0, 890.0, 1312.0, 1764.0, 2592.0, 3841.0, 5632.0, 8344.0, 12533.0, 19035.0, 29678.0, 47044.0, 76706.0, 137741.0, 316108.0, 154918.0, 83477.0, 50798.0, 32184.0, 20412.0, 13425.0, 8841.0, 5980.0, 4087.0, 2789.0, 1937.0, 1347.0, 918.0, 640.0, 452.0, 294.0, 224.0, 186.0, 119.0, 71.0, 56.0, 36.0, 34.0, 22.0, 13.0, 13.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.900390625, -2.811370849609375, -2.72235107421875, -2.633331298828125, -2.5443115234375, -2.455291748046875, -2.36627197265625, -2.277252197265625, -2.188232421875, -2.099212646484375, -2.01019287109375, -1.921173095703125, -1.8321533203125, -1.743133544921875, -1.65411376953125, -1.565093994140625, -1.47607421875, -1.387054443359375, -1.29803466796875, -1.209014892578125, -1.1199951171875, -1.030975341796875, -0.94195556640625, -0.852935791015625, -0.763916015625, -0.674896240234375, -0.58587646484375, -0.496856689453125, -0.4078369140625, -0.318817138671875, -0.22979736328125, -0.140777587890625, -0.0517578125, 0.037261962890625, 0.12628173828125, 0.215301513671875, 0.3043212890625, 0.393341064453125, 0.48236083984375, 0.571380615234375, 0.660400390625, 0.749420166015625, 0.83843994140625, 0.927459716796875, 1.0164794921875, 1.105499267578125, 1.19451904296875, 1.283538818359375, 1.37255859375, 1.461578369140625, 1.55059814453125, 1.639617919921875, 1.7286376953125, 1.817657470703125, 1.90667724609375, 1.995697021484375, 2.084716796875, 2.173736572265625, 2.26275634765625, 2.351776123046875, 2.4407958984375, 2.529815673828125, 2.61883544921875, 2.707855224609375, 2.796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 7.0, 6.0, 4.0, 12.0, 10.0, 7.0, 5.0, 20.0, 11.0, 18.0, 21.0, 27.0, 18.0, 38.0, 28.0, 40.0, 32.0, 30.0, 33.0, 37.0, 32.0, 43.0, 48.0, 32.0, 51.0, 36.0, 28.0, 36.0, 35.0, 27.0, 36.0, 28.0, 20.0, 20.0, 18.0, 22.0, 13.0, 12.0, 14.0, 9.0, 8.0, 8.0, 5.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.987548828125, -8.67041015625, -8.353271484375, -8.0361328125, -7.718994140625, -7.40185546875, -7.084716796875, -6.767578125, -6.450439453125, -6.13330078125, -5.816162109375, -5.4990234375, -5.181884765625, -4.86474609375, -4.547607421875, -4.23046875, -3.913330078125, -3.59619140625, -3.279052734375, -2.9619140625, -2.644775390625, -2.32763671875, -2.010498046875, -1.693359375, -1.376220703125, -1.05908203125, -0.741943359375, -0.4248046875, -0.107666015625, 0.20947265625, 0.526611328125, 0.84375, 1.160888671875, 1.47802734375, 1.795166015625, 2.1123046875, 2.429443359375, 2.74658203125, 3.063720703125, 3.380859375, 3.697998046875, 4.01513671875, 4.332275390625, 4.6494140625, 4.966552734375, 5.28369140625, 5.600830078125, 5.91796875, 6.235107421875, 6.55224609375, 6.869384765625, 7.1865234375, 7.503662109375, 7.82080078125, 8.137939453125, 8.455078125, 8.772216796875, 9.08935546875, 9.406494140625, 9.7236328125, 10.040771484375, 10.35791015625, 10.675048828125, 10.9921875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 5.0, 5.0, 4.0, 8.0, 13.0, 15.0, 22.0, 37.0, 39.0, 60.0, 66.0, 120.0, 169.0, 224.0, 297.0, 416.0, 580.0, 754.0, 1101.0, 1644.0, 2315.0, 3179.0, 4689.0, 6891.0, 10462.0, 15662.0, 23806.0, 36750.0, 59804.0, 105786.0, 237609.0, 254376.0, 108753.0, 61323.0, 37539.0, 24477.0, 15830.0, 10490.0, 7219.0, 4799.0, 3319.0, 2303.0, 1608.0, 1176.0, 789.0, 595.0, 410.0, 290.0, 213.0, 154.0, 113.0, 71.0, 53.0, 42.0, 28.0, 24.0, 19.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0], "bins": [-2.689453125, -2.60546875, -2.521484375, -2.4375, -2.353515625, -2.26953125, -2.185546875, -2.1015625, -2.017578125, -1.93359375, -1.849609375, -1.765625, -1.681640625, -1.59765625, -1.513671875, -1.4296875, -1.345703125, -1.26171875, -1.177734375, -1.09375, -1.009765625, -0.92578125, -0.841796875, -0.7578125, -0.673828125, -0.58984375, -0.505859375, -0.421875, -0.337890625, -0.25390625, -0.169921875, -0.0859375, -0.001953125, 0.08203125, 0.166015625, 0.25, 0.333984375, 0.41796875, 0.501953125, 0.5859375, 0.669921875, 0.75390625, 0.837890625, 0.921875, 1.005859375, 1.08984375, 1.173828125, 1.2578125, 1.341796875, 1.42578125, 1.509765625, 1.59375, 1.677734375, 1.76171875, 1.845703125, 1.9296875, 2.013671875, 2.09765625, 2.181640625, 2.265625, 2.349609375, 2.43359375, 2.517578125, 2.6015625, 2.685546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 9.0, 9.0, 9.0, 7.0, 13.0, 14.0, 16.0, 25.0, 20.0, 21.0, 22.0, 36.0, 24.0, 45.0, 38.0, 37.0, 39.0, 43.0, 30.0, 48.0, 42.0, 27.0, 47.0, 38.0, 40.0, 38.0, 26.0, 29.0, 24.0, 26.0, 16.0, 20.0, 25.0, 13.0, 15.0, 13.0, 11.0, 8.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.70703125, -6.50128173828125, -6.2955322265625, -6.08978271484375, -5.884033203125, -5.67828369140625, -5.4725341796875, -5.26678466796875, -5.06103515625, -4.85528564453125, -4.6495361328125, -4.44378662109375, -4.238037109375, -4.03228759765625, -3.8265380859375, -3.62078857421875, -3.4150390625, -3.20928955078125, -3.0035400390625, -2.79779052734375, -2.592041015625, -2.38629150390625, -2.1805419921875, -1.97479248046875, -1.76904296875, -1.56329345703125, -1.3575439453125, -1.15179443359375, -0.946044921875, -0.74029541015625, -0.5345458984375, -0.32879638671875, -0.123046875, 0.08270263671875, 0.2884521484375, 0.49420166015625, 0.699951171875, 0.90570068359375, 1.1114501953125, 1.31719970703125, 1.52294921875, 1.72869873046875, 1.9344482421875, 2.14019775390625, 2.345947265625, 2.55169677734375, 2.7574462890625, 2.96319580078125, 3.1689453125, 3.37469482421875, 3.5804443359375, 3.78619384765625, 3.991943359375, 4.19769287109375, 4.4034423828125, 4.60919189453125, 4.81494140625, 5.02069091796875, 5.2264404296875, 5.43218994140625, 5.637939453125, 5.84368896484375, 6.0494384765625, 6.25518798828125, 6.4609375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 8.0, 6.0, 13.0, 16.0, 22.0, 25.0, 27.0, 57.0, 68.0, 65.0, 96.0, 129.0, 176.0, 240.0, 293.0, 499.0, 607.0, 922.0, 1357.0, 1952.0, 3030.0, 4803.0, 7752.0, 13214.0, 23656.0, 46941.0, 104977.0, 267620.0, 318799.0, 128565.0, 55376.0, 27425.0, 15027.0, 8646.0, 5346.0, 3388.0, 2280.0, 1517.0, 1040.0, 653.0, 546.0, 354.0, 295.0, 172.0, 161.0, 95.0, 85.0, 55.0, 44.0, 27.0, 26.0, 21.0, 15.0, 17.0, 9.0, 1.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.00514984130859375, -0.00498431921005249, -0.0048187971115112305, -0.004653275012969971, -0.004487752914428711, -0.004322230815887451, -0.004156708717346191, -0.003991186618804932, -0.003825664520263672, -0.003660142421722412, -0.0034946203231811523, -0.0033290982246398926, -0.003163576126098633, -0.002998054027557373, -0.0028325319290161133, -0.0026670098304748535, -0.0025014877319335938, -0.002335965633392334, -0.0021704435348510742, -0.0020049214363098145, -0.0018393993377685547, -0.001673877239227295, -0.0015083551406860352, -0.0013428330421447754, -0.0011773109436035156, -0.0010117888450622559, -0.0008462667465209961, -0.0006807446479797363, -0.0005152225494384766, -0.0003497004508972168, -0.00018417835235595703, -1.8656253814697266e-05, 0.0001468658447265625, 0.00031238794326782227, 0.00047791004180908203, 0.0006434321403503418, 0.0008089542388916016, 0.0009744763374328613, 0.001139998435974121, 0.0013055205345153809, 0.0014710426330566406, 0.0016365647315979004, 0.0018020868301391602, 0.00196760892868042, 0.0021331310272216797, 0.0022986531257629395, 0.0024641752243041992, 0.002629697322845459, 0.0027952194213867188, 0.0029607415199279785, 0.0031262636184692383, 0.003291785717010498, 0.003457307815551758, 0.0036228299140930176, 0.0037883520126342773, 0.003953874111175537, 0.004119396209716797, 0.004284918308258057, 0.004450440406799316, 0.004615962505340576, 0.004781484603881836, 0.004947006702423096, 0.0051125288009643555, 0.005278050899505615, 0.005443572998046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 14.0, 9.0, 17.0, 12.0, 28.0, 18.0, 34.0, 38.0, 45.0, 35.0, 92.0, 57.0, 98.0, 69.0, 89.0, 78.0, 43.0, 48.0, 32.0, 29.0, 26.0, 15.0, 9.0, 12.0, 9.0, 5.0, 7.0, 5.0, 1.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.226822733879089e-06, -6.016343832015991e-06, -5.805864930152893e-06, -5.595386028289795e-06, -5.384907126426697e-06, -5.174428224563599e-06, -4.9639493227005005e-06, -4.753470420837402e-06, -4.542991518974304e-06, -4.332512617111206e-06, -4.122033715248108e-06, -3.91155481338501e-06, -3.7010759115219116e-06, -3.4905970096588135e-06, -3.2801181077957153e-06, -3.069639205932617e-06, -2.859160304069519e-06, -2.648681402206421e-06, -2.4382025003433228e-06, -2.2277235984802246e-06, -2.0172446966171265e-06, -1.8067657947540283e-06, -1.5962868928909302e-06, -1.385807991027832e-06, -1.1753290891647339e-06, -9.648501873016357e-07, -7.543712854385376e-07, -5.438923835754395e-07, -3.334134817123413e-07, -1.2293457984924316e-07, 8.754432201385498e-08, 2.980232238769531e-07, 5.085021257400513e-07, 7.189810276031494e-07, 9.294599294662476e-07, 1.1399388313293457e-06, 1.3504177331924438e-06, 1.560896635055542e-06, 1.7713755369186401e-06, 1.9818544387817383e-06, 2.1923333406448364e-06, 2.4028122425079346e-06, 2.6132911443710327e-06, 2.823770046234131e-06, 3.034248948097229e-06, 3.244727849960327e-06, 3.4552067518234253e-06, 3.6656856536865234e-06, 3.876164555549622e-06, 4.08664345741272e-06, 4.297122359275818e-06, 4.507601261138916e-06, 4.718080163002014e-06, 4.928559064865112e-06, 5.1390379667282104e-06, 5.349516868591309e-06, 5.559995770454407e-06, 5.770474672317505e-06, 5.980953574180603e-06, 6.191432476043701e-06, 6.401911377906799e-06, 6.6123902797698975e-06, 6.822869181632996e-06, 7.033348083496094e-06]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 7.0, 12.0, 9.0, 6.0, 16.0, 27.0, 34.0, 44.0, 52.0, 67.0, 100.0, 118.0, 208.0, 267.0, 392.0, 615.0, 893.0, 1485.0, 2511.0, 4216.0, 7435.0, 13726.0, 26760.0, 56760.0, 137621.0, 357455.0, 254841.0, 94795.0, 42067.0, 20309.0, 10646.0, 5834.0, 3456.0, 2039.0, 1251.0, 766.0, 497.0, 338.0, 227.0, 157.0, 143.0, 87.0, 64.0, 36.0, 49.0, 30.0, 37.0, 16.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0], "bins": [-0.0065460205078125, -0.006352365016937256, -0.006158709526062012, -0.005965054035186768, -0.0057713985443115234, -0.005577743053436279, -0.005384087562561035, -0.005190432071685791, -0.004996776580810547, -0.004803121089935303, -0.004609465599060059, -0.0044158101081848145, -0.00422215461730957, -0.004028499126434326, -0.003834843635559082, -0.003641188144683838, -0.0034475326538085938, -0.0032538771629333496, -0.0030602216720581055, -0.0028665661811828613, -0.002672910690307617, -0.002479255199432373, -0.002285599708557129, -0.0020919442176818848, -0.0018982887268066406, -0.0017046332359313965, -0.0015109777450561523, -0.0013173222541809082, -0.001123666763305664, -0.0009300112724304199, -0.0007363557815551758, -0.0005427002906799316, -0.0003490447998046875, -0.00015538930892944336, 3.826618194580078e-05, 0.00023192167282104492, 0.00042557716369628906, 0.0006192326545715332, 0.0008128881454467773, 0.0010065436363220215, 0.0012001991271972656, 0.0013938546180725098, 0.001587510108947754, 0.001781165599822998, 0.001974821090698242, 0.0021684765815734863, 0.0023621320724487305, 0.0025557875633239746, 0.0027494430541992188, 0.002943098545074463, 0.003136754035949707, 0.003330409526824951, 0.0035240650177001953, 0.0037177205085754395, 0.003911375999450684, 0.004105031490325928, 0.004298686981201172, 0.004492342472076416, 0.00468599796295166, 0.004879653453826904, 0.0050733089447021484, 0.005266964435577393, 0.005460619926452637, 0.005654275417327881, 0.005847930908203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 12.0, 6.0, 19.0, 21.0, 15.0, 20.0, 28.0, 46.0, 52.0, 60.0, 92.0, 77.0, 72.0, 76.0, 59.0, 64.0, 66.0, 48.0, 37.0, 27.0, 25.0, 15.0, 12.0, 8.0, 8.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0023651123046875, -0.002302318811416626, -0.002239525318145752, -0.002176731824874878, -0.002113938331604004, -0.00205114483833313, -0.001988351345062256, -0.0019255578517913818, -0.0018627643585205078, -0.0017999708652496338, -0.0017371773719787598, -0.0016743838787078857, -0.0016115903854370117, -0.0015487968921661377, -0.0014860033988952637, -0.0014232099056243896, -0.0013604164123535156, -0.0012976229190826416, -0.0012348294258117676, -0.0011720359325408936, -0.0011092424392700195, -0.0010464489459991455, -0.0009836554527282715, -0.0009208619594573975, -0.0008580684661865234, -0.0007952749729156494, -0.0007324814796447754, -0.0006696879863739014, -0.0006068944931030273, -0.0005441009998321533, -0.0004813075065612793, -0.0004185140132904053, -0.00035572052001953125, -0.0002929270267486572, -0.0002301335334777832, -0.00016734004020690918, -0.00010454654693603516, -4.175305366516113e-05, 2.104043960571289e-05, 8.383393287658691e-05, 0.00014662742614746094, 0.00020942091941833496, 0.000272214412689209, 0.000335007905960083, 0.00039780139923095703, 0.00046059489250183105, 0.0005233883857727051, 0.0005861818790435791, 0.0006489753723144531, 0.0007117688655853271, 0.0007745623588562012, 0.0008373558521270752, 0.0009001493453979492, 0.0009629428386688232, 0.0010257363319396973, 0.0010885298252105713, 0.0011513233184814453, 0.0012141168117523193, 0.0012769103050231934, 0.0013397037982940674, 0.0014024972915649414, 0.0014652907848358154, 0.0015280842781066895, 0.0015908777713775635, 0.0016536712646484375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 6.0, 15.0, 15.0, 24.0, 26.0, 21.0, 33.0, 45.0, 54.0, 93.0, 68.0, 86.0, 78.0, 83.0, 58.0, 54.0, 45.0, 31.0, 23.0, 21.0, 27.0, 13.0, 13.0, 13.0, 9.0, 11.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.538301467895508, -14.098468780517578, -13.658635139465332, -13.218802452087402, -12.778969764709473, -12.339136123657227, -11.899303436279297, -11.459470748901367, -11.019638061523438, -10.579805374145508, -10.139971733093262, -9.700139045715332, -9.260306358337402, -8.820472717285156, -8.380640029907227, -7.940807342529297, -7.500974178314209, -7.061141014099121, -6.621308326721191, -6.1814751625061035, -5.741642475128174, -5.301809310913086, -4.861976623535156, -4.422143459320068, -3.9823105335235596, -3.542477607727051, -3.102644681930542, -2.662811756134033, -2.2229785919189453, -1.7831456661224365, -1.3433127403259277, -0.903479814529419, -0.46364688873291016, -0.02381393313407898, 0.4160190224647522, 0.8558520078659058, 1.2956849336624146, 1.735517978668213, 2.1753509044647217, 2.6151838302612305, 3.0550167560577393, 3.494849681854248, 3.934682607650757, 4.374515533447266, 4.8143486976623535, 5.254181861877441, 5.694014549255371, 6.133847236633301, 6.573680400848389, 7.013513565063477, 7.453346252441406, 7.893179416656494, 8.333012580871582, 8.772845268249512, 9.212677955627441, 9.652511596679688, 10.092344284057617, 10.532176971435547, 10.972010612487793, 11.411843299865723, 11.851675987243652, 12.291509628295898, 12.731342315673828, 13.171175003051758, 13.611007690429688]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 6.0, 11.0, 10.0, 14.0, 9.0, 13.0, 18.0, 25.0, 20.0, 26.0, 18.0, 31.0, 33.0, 31.0, 41.0, 37.0, 26.0, 37.0, 39.0, 32.0, 44.0, 32.0, 36.0, 32.0, 39.0, 29.0, 39.0, 33.0, 25.0, 22.0, 31.0, 25.0, 17.0, 15.0, 16.0, 14.0, 7.0, 13.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.90501880645752, -8.60777473449707, -8.310529708862305, -8.013285636901855, -7.716041564941406, -7.418797016143799, -7.121552467346191, -6.824308395385742, -6.527063846588135, -6.229819297790527, -5.932575225830078, -5.635330677032471, -5.338086128234863, -5.040842056274414, -4.743597507476807, -4.446352958679199, -4.14910888671875, -3.8518645763397217, -3.5546202659606934, -3.257375717163086, -2.9601314067840576, -2.6628870964050293, -2.365642547607422, -2.0683982372283936, -1.7711539268493652, -1.473909616470337, -1.176665186882019, -0.879420816898346, -0.5821764469146729, -0.28493213653564453, 0.01231229305267334, 0.3095567226409912, 0.6068000793457031, 0.9040444493293762, 1.2012888193130493, 1.4985332489013672, 1.7957775592803955, 2.093021869659424, 2.3902664184570312, 2.6875107288360596, 2.984755039215088, 3.281999349594116, 3.5792436599731445, 3.876488208770752, 4.173732757568359, 4.470976829528809, 4.768221378326416, 5.065465927124023, 5.362709999084473, 5.65995454788208, 5.957198619842529, 6.254443168640137, 6.551687240600586, 6.848931789398193, 7.146176338195801, 7.44342041015625, 7.740664958953857, 8.037909507751465, 8.335153579711914, 8.632397651672363, 8.929642677307129, 9.226886749267578, 9.524130821228027, 9.821375846862793, 10.118619918823242]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 9.0, 9.0, 7.0, 16.0, 26.0, 39.0, 66.0, 74.0, 107.0, 160.0, 235.0, 349.0, 529.0, 777.0, 1155.0, 1661.0, 2554.0, 3885.0, 5827.0, 9080.0, 14013.0, 22033.0, 35660.0, 60630.0, 104329.0, 168473.0, 202736.0, 162681.0, 99797.0, 57730.0, 33890.0, 21110.0, 13449.0, 8731.0, 5570.0, 3713.0, 2453.0, 1630.0, 1029.0, 742.0, 519.0, 330.0, 229.0, 141.0, 119.0, 99.0, 40.0, 40.0, 30.0, 22.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-17.984375, -17.41259765625, -16.8408203125, -16.26904296875, -15.697265625, -15.12548828125, -14.5537109375, -13.98193359375, -13.41015625, -12.83837890625, -12.2666015625, -11.69482421875, -11.123046875, -10.55126953125, -9.9794921875, -9.40771484375, -8.8359375, -8.26416015625, -7.6923828125, -7.12060546875, -6.548828125, -5.97705078125, -5.4052734375, -4.83349609375, -4.26171875, -3.68994140625, -3.1181640625, -2.54638671875, -1.974609375, -1.40283203125, -0.8310546875, -0.25927734375, 0.3125, 0.88427734375, 1.4560546875, 2.02783203125, 2.599609375, 3.17138671875, 3.7431640625, 4.31494140625, 4.88671875, 5.45849609375, 6.0302734375, 6.60205078125, 7.173828125, 7.74560546875, 8.3173828125, 8.88916015625, 9.4609375, 10.03271484375, 10.6044921875, 11.17626953125, 11.748046875, 12.31982421875, 12.8916015625, 13.46337890625, 14.03515625, 14.60693359375, 15.1787109375, 15.75048828125, 16.322265625, 16.89404296875, 17.4658203125, 18.03759765625, 18.609375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 6.0, 8.0, 13.0, 8.0, 14.0, 13.0, 16.0, 20.0, 17.0, 21.0, 31.0, 18.0, 31.0, 31.0, 36.0, 30.0, 26.0, 37.0, 34.0, 41.0, 36.0, 41.0, 30.0, 38.0, 39.0, 26.0, 38.0, 36.0, 23.0, 21.0, 24.0, 21.0, 27.0, 20.0, 15.0, 11.0, 14.0, 9.0, 11.0, 13.0, 13.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-8.3203125, -8.056884765625, -7.79345703125, -7.530029296875, -7.2666015625, -7.003173828125, -6.73974609375, -6.476318359375, -6.212890625, -5.949462890625, -5.68603515625, -5.422607421875, -5.1591796875, -4.895751953125, -4.63232421875, -4.368896484375, -4.10546875, -3.842041015625, -3.57861328125, -3.315185546875, -3.0517578125, -2.788330078125, -2.52490234375, -2.261474609375, -1.998046875, -1.734619140625, -1.47119140625, -1.207763671875, -0.9443359375, -0.680908203125, -0.41748046875, -0.154052734375, 0.109375, 0.372802734375, 0.63623046875, 0.899658203125, 1.1630859375, 1.426513671875, 1.68994140625, 1.953369140625, 2.216796875, 2.480224609375, 2.74365234375, 3.007080078125, 3.2705078125, 3.533935546875, 3.79736328125, 4.060791015625, 4.32421875, 4.587646484375, 4.85107421875, 5.114501953125, 5.3779296875, 5.641357421875, 5.90478515625, 6.168212890625, 6.431640625, 6.695068359375, 6.95849609375, 7.221923828125, 7.4853515625, 7.748779296875, 8.01220703125, 8.275634765625, 8.5390625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 5.0, 9.0, 13.0, 27.0, 35.0, 52.0, 75.0, 101.0, 146.0, 222.0, 354.0, 468.0, 710.0, 1024.0, 1533.0, 2203.0, 3176.0, 4597.0, 6814.0, 10464.0, 15376.0, 23580.0, 38049.0, 62870.0, 104261.0, 163127.0, 191773.0, 155520.0, 99035.0, 58784.0, 36186.0, 22618.0, 14681.0, 9777.0, 6671.0, 4544.0, 3012.0, 2111.0, 1384.0, 1018.0, 700.0, 481.0, 304.0, 232.0, 118.0, 108.0, 64.0, 41.0, 35.0, 22.0, 15.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0], "bins": [-17.15625, -16.62744140625, -16.0986328125, -15.56982421875, -15.041015625, -14.51220703125, -13.9833984375, -13.45458984375, -12.92578125, -12.39697265625, -11.8681640625, -11.33935546875, -10.810546875, -10.28173828125, -9.7529296875, -9.22412109375, -8.6953125, -8.16650390625, -7.6376953125, -7.10888671875, -6.580078125, -6.05126953125, -5.5224609375, -4.99365234375, -4.46484375, -3.93603515625, -3.4072265625, -2.87841796875, -2.349609375, -1.82080078125, -1.2919921875, -0.76318359375, -0.234375, 0.29443359375, 0.8232421875, 1.35205078125, 1.880859375, 2.40966796875, 2.9384765625, 3.46728515625, 3.99609375, 4.52490234375, 5.0537109375, 5.58251953125, 6.111328125, 6.64013671875, 7.1689453125, 7.69775390625, 8.2265625, 8.75537109375, 9.2841796875, 9.81298828125, 10.341796875, 10.87060546875, 11.3994140625, 11.92822265625, 12.45703125, 12.98583984375, 13.5146484375, 14.04345703125, 14.572265625, 15.10107421875, 15.6298828125, 16.15869140625, 16.6875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 9.0, 10.0, 13.0, 11.0, 11.0, 18.0, 19.0, 16.0, 21.0, 23.0, 27.0, 26.0, 34.0, 41.0, 43.0, 36.0, 26.0, 50.0, 31.0, 40.0, 43.0, 35.0, 42.0, 44.0, 27.0, 35.0, 41.0, 26.0, 20.0, 22.0, 15.0, 11.0, 18.0, 17.0, 9.0, 11.0, 16.0, 10.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0], "bins": [-6.0078125, -5.8232421875, -5.638671875, -5.4541015625, -5.26953125, -5.0849609375, -4.900390625, -4.7158203125, -4.53125, -4.3466796875, -4.162109375, -3.9775390625, -3.79296875, -3.6083984375, -3.423828125, -3.2392578125, -3.0546875, -2.8701171875, -2.685546875, -2.5009765625, -2.31640625, -2.1318359375, -1.947265625, -1.7626953125, -1.578125, -1.3935546875, -1.208984375, -1.0244140625, -0.83984375, -0.6552734375, -0.470703125, -0.2861328125, -0.1015625, 0.0830078125, 0.267578125, 0.4521484375, 0.63671875, 0.8212890625, 1.005859375, 1.1904296875, 1.375, 1.5595703125, 1.744140625, 1.9287109375, 2.11328125, 2.2978515625, 2.482421875, 2.6669921875, 2.8515625, 3.0361328125, 3.220703125, 3.4052734375, 3.58984375, 3.7744140625, 3.958984375, 4.1435546875, 4.328125, 4.5126953125, 4.697265625, 4.8818359375, 5.06640625, 5.2509765625, 5.435546875, 5.6201171875, 5.8046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 11.0, 13.0, 22.0, 31.0, 43.0, 89.0, 101.0, 154.0, 248.0, 337.0, 502.0, 800.0, 1333.0, 2096.0, 3429.0, 5932.0, 11183.0, 22077.0, 51945.0, 164150.0, 480763.0, 193015.0, 57712.0, 24222.0, 12211.0, 6408.0, 3753.0, 2157.0, 1326.0, 846.0, 527.0, 381.0, 233.0, 154.0, 109.0, 68.0, 53.0, 34.0, 26.0, 16.0, 15.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.7747650146484375, -1.712615966796875, -1.6504669189453125, -1.58831787109375, -1.5261688232421875, -1.464019775390625, -1.4018707275390625, -1.3397216796875, -1.2775726318359375, -1.215423583984375, -1.1532745361328125, -1.09112548828125, -1.0289764404296875, -0.966827392578125, -0.9046783447265625, -0.842529296875, -0.7803802490234375, -0.718231201171875, -0.6560821533203125, -0.59393310546875, -0.5317840576171875, -0.469635009765625, -0.4074859619140625, -0.3453369140625, -0.2831878662109375, -0.221038818359375, -0.1588897705078125, -0.09674072265625, -0.0345916748046875, 0.027557373046875, 0.0897064208984375, 0.15185546875, 0.2140045166015625, 0.276153564453125, 0.3383026123046875, 0.40045166015625, 0.4626007080078125, 0.524749755859375, 0.5868988037109375, 0.6490478515625, 0.7111968994140625, 0.773345947265625, 0.8354949951171875, 0.89764404296875, 0.9597930908203125, 1.021942138671875, 1.0840911865234375, 1.146240234375, 1.2083892822265625, 1.270538330078125, 1.3326873779296875, 1.39483642578125, 1.4569854736328125, 1.519134521484375, 1.5812835693359375, 1.6434326171875, 1.7055816650390625, 1.767730712890625, 1.8298797607421875, 1.89202880859375, 1.9541778564453125, 2.016326904296875, 2.0784759521484375, 2.140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 10.0, 7.0, 12.0, 11.0, 14.0, 14.0, 21.0, 39.0, 28.0, 39.0, 58.0, 61.0, 45.0, 75.0, 77.0, 80.0, 65.0, 57.0, 51.0, 50.0, 41.0, 24.0, 27.0, 19.0, 9.0, 11.0, 9.0, 9.0, 0.0, 6.0, 10.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00011271238327026367, -0.00010979268699884415, -0.00010687299072742462, -0.0001039532944560051, -0.00010103359818458557, -9.811390191316605e-05, -9.519420564174652e-05, -9.2274509370327e-05, -8.935481309890747e-05, -8.643511682748795e-05, -8.351542055606842e-05, -8.05957242846489e-05, -7.767602801322937e-05, -7.475633174180984e-05, -7.183663547039032e-05, -6.89169391989708e-05, -6.599724292755127e-05, -6.307754665613174e-05, -6.015785038471222e-05, -5.7238154113292694e-05, -5.431845784187317e-05, -5.1398761570453644e-05, -4.847906529903412e-05, -4.5559369027614594e-05, -4.263967275619507e-05, -3.971997648477554e-05, -3.680028021335602e-05, -3.388058394193649e-05, -3.096088767051697e-05, -2.8041191399097443e-05, -2.5121495127677917e-05, -2.2201798856258392e-05, -1.9282102584838867e-05, -1.6362406313419342e-05, -1.3442710041999817e-05, -1.0523013770580292e-05, -7.603317499160767e-06, -4.6836212277412415e-06, -1.7639249563217163e-06, 1.1557713150978088e-06, 4.075467586517334e-06, 6.995163857936859e-06, 9.914860129356384e-06, 1.283455640077591e-05, 1.5754252672195435e-05, 1.867394894361496e-05, 2.1593645215034485e-05, 2.451334148645401e-05, 2.7433037757873535e-05, 3.035273402929306e-05, 3.3272430300712585e-05, 3.619212657213211e-05, 3.9111822843551636e-05, 4.203151911497116e-05, 4.4951215386390686e-05, 4.787091165781021e-05, 5.0790607929229736e-05, 5.371030420064926e-05, 5.663000047206879e-05, 5.954969674348831e-05, 6.246939301490784e-05, 6.538908928632736e-05, 6.830878555774689e-05, 7.122848182916641e-05, 7.414817810058594e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 11.0, 20.0, 24.0, 57.0, 49.0, 106.0, 123.0, 186.0, 271.0, 454.0, 652.0, 1157.0, 1740.0, 2937.0, 5287.0, 10289.0, 21665.0, 51318.0, 175135.0, 519651.0, 163876.0, 49620.0, 20753.0, 10229.0, 5139.0, 2927.0, 1833.0, 1087.0, 668.0, 423.0, 291.0, 178.0, 134.0, 94.0, 56.0, 28.0, 18.0, 21.0, 15.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9482421875, -1.8798370361328125, -1.811431884765625, -1.7430267333984375, -1.67462158203125, -1.6062164306640625, -1.537811279296875, -1.4694061279296875, -1.4010009765625, -1.3325958251953125, -1.264190673828125, -1.1957855224609375, -1.12738037109375, -1.0589752197265625, -0.990570068359375, -0.9221649169921875, -0.853759765625, -0.7853546142578125, -0.716949462890625, -0.6485443115234375, -0.58013916015625, -0.5117340087890625, -0.443328857421875, -0.3749237060546875, -0.3065185546875, -0.2381134033203125, -0.169708251953125, -0.1013031005859375, -0.03289794921875, 0.0355072021484375, 0.103912353515625, 0.1723175048828125, 0.24072265625, 0.3091278076171875, 0.377532958984375, 0.4459381103515625, 0.51434326171875, 0.5827484130859375, 0.651153564453125, 0.7195587158203125, 0.7879638671875, 0.8563690185546875, 0.924774169921875, 0.9931793212890625, 1.06158447265625, 1.1299896240234375, 1.198394775390625, 1.2667999267578125, 1.335205078125, 1.4036102294921875, 1.472015380859375, 1.5404205322265625, 1.60882568359375, 1.6772308349609375, 1.745635986328125, 1.8140411376953125, 1.8824462890625, 1.9508514404296875, 2.019256591796875, 2.0876617431640625, 2.15606689453125, 2.2244720458984375, 2.292877197265625, 2.3612823486328125, 2.4296875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 5.0, 11.0, 11.0, 11.0, 17.0, 17.0, 29.0, 33.0, 46.0, 29.0, 53.0, 78.0, 82.0, 106.0, 84.0, 97.0, 65.0, 51.0, 40.0, 17.0, 27.0, 14.0, 16.0, 17.0, 8.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0], "bins": [-0.689453125, -0.670806884765625, -0.65216064453125, -0.633514404296875, -0.6148681640625, -0.596221923828125, -0.57757568359375, -0.558929443359375, -0.540283203125, -0.521636962890625, -0.50299072265625, -0.484344482421875, -0.4656982421875, -0.447052001953125, -0.42840576171875, -0.409759521484375, -0.39111328125, -0.372467041015625, -0.35382080078125, -0.335174560546875, -0.3165283203125, -0.297882080078125, -0.27923583984375, -0.260589599609375, -0.241943359375, -0.223297119140625, -0.20465087890625, -0.186004638671875, -0.1673583984375, -0.148712158203125, -0.13006591796875, -0.111419677734375, -0.0927734375, -0.074127197265625, -0.05548095703125, -0.036834716796875, -0.0181884765625, 0.000457763671875, 0.01910400390625, 0.037750244140625, 0.056396484375, 0.075042724609375, 0.09368896484375, 0.112335205078125, 0.1309814453125, 0.149627685546875, 0.16827392578125, 0.186920166015625, 0.20556640625, 0.224212646484375, 0.24285888671875, 0.261505126953125, 0.2801513671875, 0.298797607421875, 0.31744384765625, 0.336090087890625, 0.354736328125, 0.373382568359375, 0.39202880859375, 0.410675048828125, 0.4293212890625, 0.447967529296875, 0.46661376953125, 0.485260009765625, 0.50390625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 8.0, 6.0, 12.0, 11.0, 15.0, 18.0, 32.0, 38.0, 39.0, 46.0, 61.0, 64.0, 76.0, 96.0, 72.0, 74.0, 61.0, 52.0, 29.0, 36.0, 30.0, 19.0, 16.0, 13.0, 12.0, 10.0, 11.0, 4.0, 8.0, 3.0, 1.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.847840309143066, -12.455244064331055, -12.062647819519043, -11.670051574707031, -11.27745532989502, -10.884859085083008, -10.492262840270996, -10.099666595458984, -9.707070350646973, -9.314474105834961, -8.92187786102295, -8.529281616210938, -8.136685371398926, -7.744089126586914, -7.351492881774902, -6.958896636962891, -6.566300868988037, -6.173704624176025, -5.781108379364014, -5.388512134552002, -4.99591588973999, -4.6033196449279785, -4.210723876953125, -3.818127393722534, -3.4255311489105225, -3.0329349040985107, -2.640338659286499, -2.2477426528930664, -1.8551462888717651, -1.4625500440597534, -1.0699539184570312, -0.6773576736450195, -0.2847614288330078, 0.10783478617668152, 0.5004310011863708, 0.8930271863937378, 1.2856234312057495, 1.6782196760177612, 2.0708158016204834, 2.463412046432495, 2.856008291244507, 3.2486045360565186, 3.6412007808685303, 4.033796787261963, 4.426393032073975, 4.818989276885986, 5.211585521697998, 5.60418176651001, 5.9967780113220215, 6.389374256134033, 6.781970500946045, 7.174566745758057, 7.567162990570068, 7.95975923538208, 8.352355003356934, 8.744951248168945, 9.137547492980957, 9.530143737792969, 9.92273998260498, 10.315336227416992, 10.707932472229004, 11.100528717041016, 11.493124961853027, 11.885721206665039, 12.27831745147705]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 10.0, 14.0, 10.0, 11.0, 21.0, 22.0, 16.0, 26.0, 24.0, 31.0, 33.0, 34.0, 37.0, 33.0, 40.0, 38.0, 44.0, 43.0, 39.0, 40.0, 44.0, 37.0, 46.0, 33.0, 30.0, 35.0, 29.0, 29.0, 22.0, 20.0, 19.0, 16.0, 15.0, 10.0, 9.0, 9.0, 4.0, 2.0, 4.0, 3.0, 0.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.92446231842041, -9.59310531616211, -9.261749267578125, -8.930392265319824, -8.59903621673584, -8.267679214477539, -7.9363226890563965, -7.604966163635254, -7.273609161376953, -6.9422526359558105, -6.610896110534668, -6.279539108276367, -5.948182582855225, -5.616826057434082, -5.2854695320129395, -4.954113006591797, -4.622756481170654, -4.291399955749512, -3.96004319190979, -3.6286866664886475, -3.297329902648926, -2.965973377227783, -2.6346168518066406, -2.303260087966919, -1.9719035625457764, -1.6405469179153442, -1.309190273284912, -0.9778337478637695, -0.6464771032333374, -0.3151204586029053, 0.016236066818237305, 0.347592830657959, 0.6789493560791016, 1.0103060007095337, 1.3416626453399658, 1.6730191707611084, 2.00437593460083, 2.3357324600219727, 2.6670889854431152, 2.998445749282837, 3.3298022747039795, 3.661158800125122, 3.9925155639648438, 4.323872089385986, 4.655228614807129, 4.98658561706543, 5.317941665649414, 5.649298667907715, 5.980655193328857, 6.31201171875, 6.643368244171143, 6.974724769592285, 7.306081771850586, 7.6374382972717285, 7.968794822692871, 8.300151824951172, 8.631507873535156, 8.962864875793457, 9.294220924377441, 9.625577926635742, 9.956933975219727, 10.288290977478027, 10.619647979736328, 10.951004028320312, 11.282361030578613]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 17.0, 16.0, 31.0, 42.0, 69.0, 90.0, 183.0, 259.0, 354.0, 583.0, 933.0, 1506.0, 2495.0, 4102.0, 6710.0, 11990.0, 20483.0, 36744.0, 69612.0, 146827.0, 445327.0, 1657713.0, 1249680.0, 294611.0, 113013.0, 55984.0, 30433.0, 17371.0, 10155.0, 6147.0, 3673.0, 2382.0, 1574.0, 1022.0, 685.0, 460.0, 305.0, 211.0, 133.0, 89.0, 69.0, 49.0, 49.0, 32.0, 15.0, 13.0, 17.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-16.828125, -16.244873046875, -15.66162109375, -15.078369140625, -14.4951171875, -13.911865234375, -13.32861328125, -12.745361328125, -12.162109375, -11.578857421875, -10.99560546875, -10.412353515625, -9.8291015625, -9.245849609375, -8.66259765625, -8.079345703125, -7.49609375, -6.912841796875, -6.32958984375, -5.746337890625, -5.1630859375, -4.579833984375, -3.99658203125, -3.413330078125, -2.830078125, -2.246826171875, -1.66357421875, -1.080322265625, -0.4970703125, 0.086181640625, 0.66943359375, 1.252685546875, 1.8359375, 2.419189453125, 3.00244140625, 3.585693359375, 4.1689453125, 4.752197265625, 5.33544921875, 5.918701171875, 6.501953125, 7.085205078125, 7.66845703125, 8.251708984375, 8.8349609375, 9.418212890625, 10.00146484375, 10.584716796875, 11.16796875, 11.751220703125, 12.33447265625, 12.917724609375, 13.5009765625, 14.084228515625, 14.66748046875, 15.250732421875, 15.833984375, 16.417236328125, 17.00048828125, 17.583740234375, 18.1669921875, 18.750244140625, 19.33349609375, 19.916748046875, 20.5]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 18.0, 10.0, 13.0, 16.0, 21.0, 30.0, 24.0, 34.0, 33.0, 33.0, 32.0, 42.0, 37.0, 31.0, 58.0, 48.0, 32.0, 43.0, 49.0, 45.0, 38.0, 33.0, 32.0, 32.0, 31.0, 27.0, 26.0, 26.0, 12.0, 12.0, 14.0, 11.0, 10.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.4375, -8.147216796875, -7.85693359375, -7.566650390625, -7.2763671875, -6.986083984375, -6.69580078125, -6.405517578125, -6.115234375, -5.824951171875, -5.53466796875, -5.244384765625, -4.9541015625, -4.663818359375, -4.37353515625, -4.083251953125, -3.79296875, -3.502685546875, -3.21240234375, -2.922119140625, -2.6318359375, -2.341552734375, -2.05126953125, -1.760986328125, -1.470703125, -1.180419921875, -0.89013671875, -0.599853515625, -0.3095703125, -0.019287109375, 0.27099609375, 0.561279296875, 0.8515625, 1.141845703125, 1.43212890625, 1.722412109375, 2.0126953125, 2.302978515625, 2.59326171875, 2.883544921875, 3.173828125, 3.464111328125, 3.75439453125, 4.044677734375, 4.3349609375, 4.625244140625, 4.91552734375, 5.205810546875, 5.49609375, 5.786376953125, 6.07666015625, 6.366943359375, 6.6572265625, 6.947509765625, 7.23779296875, 7.528076171875, 7.818359375, 8.108642578125, 8.39892578125, 8.689208984375, 8.9794921875, 9.269775390625, 9.56005859375, 9.850341796875, 10.140625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 15.0, 27.0, 37.0, 71.0, 97.0, 186.0, 264.0, 441.0, 752.0, 1229.0, 2224.0, 3916.0, 6770.0, 12344.0, 22555.0, 42746.0, 86214.0, 188220.0, 463307.0, 1452821.0, 1190652.0, 394644.0, 163428.0, 76769.0, 38406.0, 20446.0, 11101.0, 6165.0, 3522.0, 2073.0, 1139.0, 668.0, 418.0, 233.0, 134.0, 98.0, 58.0, 32.0, 17.0, 15.0, 11.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.89599609375, -18.3388671875, -17.78173828125, -17.224609375, -16.66748046875, -16.1103515625, -15.55322265625, -14.99609375, -14.43896484375, -13.8818359375, -13.32470703125, -12.767578125, -12.21044921875, -11.6533203125, -11.09619140625, -10.5390625, -9.98193359375, -9.4248046875, -8.86767578125, -8.310546875, -7.75341796875, -7.1962890625, -6.63916015625, -6.08203125, -5.52490234375, -4.9677734375, -4.41064453125, -3.853515625, -3.29638671875, -2.7392578125, -2.18212890625, -1.625, -1.06787109375, -0.5107421875, 0.04638671875, 0.603515625, 1.16064453125, 1.7177734375, 2.27490234375, 2.83203125, 3.38916015625, 3.9462890625, 4.50341796875, 5.060546875, 5.61767578125, 6.1748046875, 6.73193359375, 7.2890625, 7.84619140625, 8.4033203125, 8.96044921875, 9.517578125, 10.07470703125, 10.6318359375, 11.18896484375, 11.74609375, 12.30322265625, 12.8603515625, 13.41748046875, 13.974609375, 14.53173828125, 15.0888671875, 15.64599609375, 16.203125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 10.0, 8.0, 11.0, 28.0, 27.0, 38.0, 33.0, 53.0, 55.0, 76.0, 107.0, 112.0, 124.0, 177.0, 224.0, 282.0, 360.0, 437.0, 388.0, 271.0, 236.0, 194.0, 148.0, 127.0, 100.0, 80.0, 67.0, 51.0, 40.0, 44.0, 35.0, 29.0, 17.0, 20.0, 12.0, 10.0, 5.0, 5.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.271240234375, -4.10498046875, -3.938720703125, -3.7724609375, -3.606201171875, -3.43994140625, -3.273681640625, -3.107421875, -2.941162109375, -2.77490234375, -2.608642578125, -2.4423828125, -2.276123046875, -2.10986328125, -1.943603515625, -1.77734375, -1.611083984375, -1.44482421875, -1.278564453125, -1.1123046875, -0.946044921875, -0.77978515625, -0.613525390625, -0.447265625, -0.281005859375, -0.11474609375, 0.051513671875, 0.2177734375, 0.384033203125, 0.55029296875, 0.716552734375, 0.8828125, 1.049072265625, 1.21533203125, 1.381591796875, 1.5478515625, 1.714111328125, 1.88037109375, 2.046630859375, 2.212890625, 2.379150390625, 2.54541015625, 2.711669921875, 2.8779296875, 3.044189453125, 3.21044921875, 3.376708984375, 3.54296875, 3.709228515625, 3.87548828125, 4.041748046875, 4.2080078125, 4.374267578125, 4.54052734375, 4.706787109375, 4.873046875, 5.039306640625, 5.20556640625, 5.371826171875, 5.5380859375, 5.704345703125, 5.87060546875, 6.036865234375, 6.203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 4.0, 8.0, 8.0, 14.0, 13.0, 24.0, 22.0, 38.0, 45.0, 51.0, 56.0, 77.0, 79.0, 75.0, 75.0, 60.0, 62.0, 56.0, 46.0, 32.0, 20.0, 17.0, 16.0, 14.0, 9.0, 12.0, 7.0, 11.0, 3.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.02506160736084, -9.650896072387695, -9.27673053741455, -8.902565002441406, -8.528399467468262, -8.154233932495117, -7.780068874359131, -7.405903339385986, -7.031737804412842, -6.657572269439697, -6.283406734466553, -5.909241676330566, -5.535076141357422, -5.160910606384277, -4.786745071411133, -4.412579536437988, -4.038414001464844, -3.664248466491699, -3.2900829315185547, -2.9159176349639893, -2.5417520999908447, -2.1675865650177, -1.7934212684631348, -1.4192557334899902, -1.0450901985168457, -0.670924723148346, -0.2967592477798462, 0.07740616798400879, 0.4515717029571533, 0.8257372379302979, 1.1999025344848633, 1.5740680694580078, 1.948232650756836, 2.3223981857299805, 2.696563720703125, 3.0707290172576904, 3.444894552230835, 3.8190600872039795, 4.193225383758545, 4.5673909187316895, 4.941556453704834, 5.3157219886779785, 5.689887523651123, 6.064052581787109, 6.438218116760254, 6.812383651733398, 7.186549186706543, 7.5607147216796875, 7.934880256652832, 8.309045791625977, 8.683211326599121, 9.057376861572266, 9.43154239654541, 9.805707931518555, 10.179872512817383, 10.554039001464844, 10.928203582763672, 11.302369117736816, 11.676534652709961, 12.050700187683105, 12.42486572265625, 12.799031257629395, 13.173196792602539, 13.547361373901367, 13.921527862548828]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 0.0, 3.0, 7.0, 12.0, 11.0, 13.0, 10.0, 19.0, 14.0, 16.0, 20.0, 30.0, 24.0, 32.0, 31.0, 29.0, 35.0, 41.0, 32.0, 38.0, 42.0, 39.0, 33.0, 42.0, 41.0, 41.0, 43.0, 40.0, 26.0, 27.0, 34.0, 30.0, 17.0, 15.0, 25.0, 14.0, 15.0, 11.0, 8.0, 5.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.709293365478516, -8.406293869018555, -8.103294372558594, -7.800293922424316, -7.4972944259643555, -7.1942949295043945, -6.891294956207275, -6.588294982910156, -6.285295486450195, -5.982295989990234, -5.679296016693115, -5.376296043395996, -5.073296546936035, -4.770297050476074, -4.467297077178955, -4.164297103881836, -3.861297607421875, -3.558297872543335, -3.255298137664795, -2.952298402786255, -2.649298667907715, -2.346298933029175, -2.0432991981506348, -1.7402994632720947, -1.4372997283935547, -1.1342999935150146, -0.8313002586364746, -0.5283005237579346, -0.22530078887939453, 0.07769894599914551, 0.38069868087768555, 0.6836984157562256, 0.9866971969604492, 1.2896969318389893, 1.5926966667175293, 1.8956964015960693, 2.1986961364746094, 2.5016958713531494, 2.8046956062316895, 3.1076953411102295, 3.4106950759887695, 3.7136948108673096, 4.01669454574585, 4.319694519042969, 4.62269401550293, 4.925693511962891, 5.22869348526001, 5.531693458557129, 5.83469295501709, 6.137692451477051, 6.44069242477417, 6.743692398071289, 7.04669189453125, 7.349691390991211, 7.65269136428833, 7.955691337585449, 8.25869083404541, 8.561690330505371, 8.864690780639648, 9.16769027709961, 9.47068977355957, 9.773689270019531, 10.076688766479492, 10.37968921661377, 10.68268871307373]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 11.0, 14.0, 20.0, 25.0, 46.0, 72.0, 73.0, 113.0, 166.0, 231.0, 328.0, 498.0, 703.0, 1051.0, 1413.0, 2034.0, 2986.0, 4381.0, 6214.0, 9110.0, 13424.0, 20090.0, 30071.0, 47165.0, 76730.0, 140433.0, 309143.0, 152610.0, 81714.0, 49914.0, 32005.0, 20900.0, 14042.0, 9534.0, 6515.0, 4588.0, 3100.0, 2197.0, 1483.0, 1032.0, 726.0, 533.0, 376.0, 216.0, 178.0, 107.0, 80.0, 60.0, 35.0, 26.0, 17.0, 11.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.6953125, -2.614990234375, -2.53466796875, -2.454345703125, -2.3740234375, -2.293701171875, -2.21337890625, -2.133056640625, -2.052734375, -1.972412109375, -1.89208984375, -1.811767578125, -1.7314453125, -1.651123046875, -1.57080078125, -1.490478515625, -1.41015625, -1.329833984375, -1.24951171875, -1.169189453125, -1.0888671875, -1.008544921875, -0.92822265625, -0.847900390625, -0.767578125, -0.687255859375, -0.60693359375, -0.526611328125, -0.4462890625, -0.365966796875, -0.28564453125, -0.205322265625, -0.125, -0.044677734375, 0.03564453125, 0.115966796875, 0.1962890625, 0.276611328125, 0.35693359375, 0.437255859375, 0.517578125, 0.597900390625, 0.67822265625, 0.758544921875, 0.8388671875, 0.919189453125, 0.99951171875, 1.079833984375, 1.16015625, 1.240478515625, 1.32080078125, 1.401123046875, 1.4814453125, 1.561767578125, 1.64208984375, 1.722412109375, 1.802734375, 1.883056640625, 1.96337890625, 2.043701171875, 2.1240234375, 2.204345703125, 2.28466796875, 2.364990234375, 2.4453125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 6.0, 13.0, 13.0, 14.0, 13.0, 13.0, 12.0, 25.0, 20.0, 25.0, 24.0, 32.0, 34.0, 37.0, 37.0, 32.0, 44.0, 32.0, 39.0, 41.0, 32.0, 39.0, 54.0, 28.0, 41.0, 30.0, 23.0, 26.0, 36.0, 28.0, 21.0, 12.0, 18.0, 21.0, 16.0, 9.0, 10.0, 8.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.0865478515625, -7.782470703125, -7.4783935546875, -7.17431640625, -6.8702392578125, -6.566162109375, -6.2620849609375, -5.9580078125, -5.6539306640625, -5.349853515625, -5.0457763671875, -4.74169921875, -4.4376220703125, -4.133544921875, -3.8294677734375, -3.525390625, -3.2213134765625, -2.917236328125, -2.6131591796875, -2.30908203125, -2.0050048828125, -1.700927734375, -1.3968505859375, -1.0927734375, -0.7886962890625, -0.484619140625, -0.1805419921875, 0.12353515625, 0.4276123046875, 0.731689453125, 1.0357666015625, 1.33984375, 1.6439208984375, 1.947998046875, 2.2520751953125, 2.55615234375, 2.8602294921875, 3.164306640625, 3.4683837890625, 3.7724609375, 4.0765380859375, 4.380615234375, 4.6846923828125, 4.98876953125, 5.2928466796875, 5.596923828125, 5.9010009765625, 6.205078125, 6.5091552734375, 6.813232421875, 7.1173095703125, 7.42138671875, 7.7254638671875, 8.029541015625, 8.3336181640625, 8.6376953125, 8.9417724609375, 9.245849609375, 9.5499267578125, 9.85400390625, 10.1580810546875, 10.462158203125, 10.7662353515625, 11.0703125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 7.0, 14.0, 12.0, 20.0, 42.0, 46.0, 69.0, 110.0, 124.0, 166.0, 250.0, 330.0, 454.0, 584.0, 790.0, 1114.0, 1484.0, 2218.0, 3038.0, 4173.0, 6023.0, 8594.0, 12689.0, 18606.0, 27125.0, 41808.0, 65812.0, 110030.0, 253144.0, 206016.0, 100706.0, 61163.0, 38851.0, 25671.0, 17280.0, 11815.0, 8207.0, 5799.0, 3945.0, 2836.0, 1991.0, 1416.0, 1095.0, 796.0, 556.0, 423.0, 315.0, 242.0, 143.0, 114.0, 102.0, 57.0, 47.0, 36.0, 25.0, 16.0, 12.0, 9.0, 6.0, 1.0, 1.0], "bins": [-2.390625, -2.31573486328125, -2.2408447265625, -2.16595458984375, -2.091064453125, -2.01617431640625, -1.9412841796875, -1.86639404296875, -1.79150390625, -1.71661376953125, -1.6417236328125, -1.56683349609375, -1.491943359375, -1.41705322265625, -1.3421630859375, -1.26727294921875, -1.1923828125, -1.11749267578125, -1.0426025390625, -0.96771240234375, -0.892822265625, -0.81793212890625, -0.7430419921875, -0.66815185546875, -0.59326171875, -0.51837158203125, -0.4434814453125, -0.36859130859375, -0.293701171875, -0.21881103515625, -0.1439208984375, -0.06903076171875, 0.005859375, 0.08074951171875, 0.1556396484375, 0.23052978515625, 0.305419921875, 0.38031005859375, 0.4552001953125, 0.53009033203125, 0.60498046875, 0.67987060546875, 0.7547607421875, 0.82965087890625, 0.904541015625, 0.97943115234375, 1.0543212890625, 1.12921142578125, 1.2041015625, 1.27899169921875, 1.3538818359375, 1.42877197265625, 1.503662109375, 1.57855224609375, 1.6534423828125, 1.72833251953125, 1.80322265625, 1.87811279296875, 1.9530029296875, 2.02789306640625, 2.102783203125, 2.17767333984375, 2.2525634765625, 2.32745361328125, 2.40234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 11.0, 7.0, 9.0, 9.0, 7.0, 12.0, 9.0, 12.0, 18.0, 18.0, 20.0, 30.0, 21.0, 28.0, 28.0, 41.0, 44.0, 31.0, 32.0, 37.0, 42.0, 25.0, 38.0, 34.0, 35.0, 30.0, 29.0, 27.0, 33.0, 32.0, 27.0, 28.0, 24.0, 19.0, 20.0, 14.0, 13.0, 17.0, 15.0, 16.0, 8.0, 12.0, 7.0, 5.0, 4.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.51171875, -5.33203125, -5.15234375, -4.97265625, -4.79296875, -4.61328125, -4.43359375, -4.25390625, -4.07421875, -3.89453125, -3.71484375, -3.53515625, -3.35546875, -3.17578125, -2.99609375, -2.81640625, -2.63671875, -2.45703125, -2.27734375, -2.09765625, -1.91796875, -1.73828125, -1.55859375, -1.37890625, -1.19921875, -1.01953125, -0.83984375, -0.66015625, -0.48046875, -0.30078125, -0.12109375, 0.05859375, 0.23828125, 0.41796875, 0.59765625, 0.77734375, 0.95703125, 1.13671875, 1.31640625, 1.49609375, 1.67578125, 1.85546875, 2.03515625, 2.21484375, 2.39453125, 2.57421875, 2.75390625, 2.93359375, 3.11328125, 3.29296875, 3.47265625, 3.65234375, 3.83203125, 4.01171875, 4.19140625, 4.37109375, 4.55078125, 4.73046875, 4.91015625, 5.08984375, 5.26953125, 5.44921875, 5.62890625, 5.80859375, 5.98828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 5.0, 7.0, 14.0, 16.0, 29.0, 28.0, 49.0, 43.0, 76.0, 114.0, 142.0, 211.0, 269.0, 377.0, 476.0, 669.0, 996.0, 1436.0, 2062.0, 3076.0, 4756.0, 7661.0, 13012.0, 22852.0, 44191.0, 99507.0, 264781.0, 333073.0, 127183.0, 54289.0, 26872.0, 14879.0, 8861.0, 5435.0, 3408.0, 2311.0, 1539.0, 1059.0, 754.0, 548.0, 386.0, 274.0, 219.0, 161.0, 105.0, 106.0, 69.0, 37.0, 43.0, 29.0, 23.0, 12.0, 10.0, 12.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005878448486328125, -0.0056833624839782715, -0.005488276481628418, -0.0052931904792785645, -0.005098104476928711, -0.004903018474578857, -0.004707932472229004, -0.00451284646987915, -0.004317760467529297, -0.004122674465179443, -0.00392758846282959, -0.0037325024604797363, -0.003537416458129883, -0.0033423304557800293, -0.0031472444534301758, -0.0029521584510803223, -0.0027570724487304688, -0.0025619864463806152, -0.0023669004440307617, -0.002171814441680908, -0.0019767284393310547, -0.0017816424369812012, -0.0015865564346313477, -0.0013914704322814941, -0.0011963844299316406, -0.0010012984275817871, -0.0008062124252319336, -0.0006111264228820801, -0.00041604042053222656, -0.00022095441818237305, -2.586841583251953e-05, 0.00016921758651733398, 0.0003643035888671875, 0.000559389591217041, 0.0007544755935668945, 0.000949561595916748, 0.0011446475982666016, 0.001339733600616455, 0.0015348196029663086, 0.0017299056053161621, 0.0019249916076660156, 0.002120077610015869, 0.0023151636123657227, 0.002510249614715576, 0.0027053356170654297, 0.002900421619415283, 0.0030955076217651367, 0.0032905936241149902, 0.0034856796264648438, 0.0036807656288146973, 0.0038758516311645508, 0.004070937633514404, 0.004266023635864258, 0.004461109638214111, 0.004656195640563965, 0.004851281642913818, 0.005046367645263672, 0.005241453647613525, 0.005436539649963379, 0.005631625652313232, 0.005826711654663086, 0.0060217976570129395, 0.006216883659362793, 0.0064119696617126465, 0.0066070556640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 1.0, 5.0, 8.0, 9.0, 8.0, 19.0, 16.0, 17.0, 27.0, 29.0, 34.0, 69.0, 47.0, 45.0, 102.0, 56.0, 110.0, 65.0, 67.0, 65.0, 43.0, 25.0, 42.0, 14.0, 6.0, 14.0, 16.0, 10.0, 5.0, 8.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.536021828651428e-06, -6.336718797683716e-06, -6.137415766716003e-06, -5.938112735748291e-06, -5.738809704780579e-06, -5.539506673812866e-06, -5.340203642845154e-06, -5.140900611877441e-06, -4.941597580909729e-06, -4.742294549942017e-06, -4.542991518974304e-06, -4.343688488006592e-06, -4.144385457038879e-06, -3.945082426071167e-06, -3.7457793951034546e-06, -3.546476364135742e-06, -3.3471733331680298e-06, -3.1478703022003174e-06, -2.948567271232605e-06, -2.7492642402648926e-06, -2.54996120929718e-06, -2.3506581783294678e-06, -2.1513551473617554e-06, -1.952052116394043e-06, -1.7527490854263306e-06, -1.5534460544586182e-06, -1.3541430234909058e-06, -1.1548399925231934e-06, -9.55536961555481e-07, -7.562339305877686e-07, -5.569308996200562e-07, -3.5762786865234375e-07, -1.5832483768463135e-07, 4.0978193283081055e-08, 2.4028122425079346e-07, 4.3958425521850586e-07, 6.388872861862183e-07, 8.381903171539307e-07, 1.037493348121643e-06, 1.2367963790893555e-06, 1.4360994100570679e-06, 1.6354024410247803e-06, 1.8347054719924927e-06, 2.034008502960205e-06, 2.2333115339279175e-06, 2.43261456489563e-06, 2.6319175958633423e-06, 2.8312206268310547e-06, 3.030523657798767e-06, 3.2298266887664795e-06, 3.429129719734192e-06, 3.6284327507019043e-06, 3.827735781669617e-06, 4.027038812637329e-06, 4.2263418436050415e-06, 4.425644874572754e-06, 4.624947905540466e-06, 4.824250936508179e-06, 5.023553967475891e-06, 5.2228569984436035e-06, 5.422160029411316e-06, 5.621463060379028e-06, 5.820766091346741e-06, 6.020069122314453e-06]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 14.0, 16.0, 26.0, 40.0, 48.0, 84.0, 117.0, 161.0, 218.0, 307.0, 480.0, 790.0, 1223.0, 2050.0, 3503.0, 6305.0, 12102.0, 24890.0, 56714.0, 150149.0, 408904.0, 231671.0, 80222.0, 33833.0, 15696.0, 7970.0, 4315.0, 2460.0, 1506.0, 918.0, 552.0, 405.0, 249.0, 173.0, 142.0, 95.0, 59.0, 45.0, 35.0, 17.0, 10.0, 14.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0078125, -0.007565975189208984, -0.007319450378417969, -0.007072925567626953, -0.0068264007568359375, -0.006579875946044922, -0.006333351135253906, -0.006086826324462891, -0.005840301513671875, -0.005593776702880859, -0.005347251892089844, -0.005100727081298828, -0.0048542022705078125, -0.004607677459716797, -0.004361152648925781, -0.004114627838134766, -0.00386810302734375, -0.0036215782165527344, -0.0033750534057617188, -0.003128528594970703, -0.0028820037841796875, -0.002635478973388672, -0.0023889541625976562, -0.0021424293518066406, -0.001895904541015625, -0.0016493797302246094, -0.0014028549194335938, -0.0011563301086425781, -0.0009098052978515625, -0.0006632804870605469, -0.00041675567626953125, -0.00017023086547851562, 7.62939453125e-05, 0.0003228187561035156, 0.0005693435668945312, 0.0008158683776855469, 0.0010623931884765625, 0.0013089179992675781, 0.0015554428100585938, 0.0018019676208496094, 0.002048492431640625, 0.0022950172424316406, 0.0025415420532226562, 0.002788066864013672, 0.0030345916748046875, 0.003281116485595703, 0.0035276412963867188, 0.0037741661071777344, 0.00402069091796875, 0.004267215728759766, 0.004513740539550781, 0.004760265350341797, 0.0050067901611328125, 0.005253314971923828, 0.005499839782714844, 0.005746364593505859, 0.005992889404296875, 0.006239414215087891, 0.006485939025878906, 0.006732463836669922, 0.0069789886474609375, 0.007225513458251953, 0.007472038269042969, 0.007718563079833984, 0.007965087890625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 6.0, 4.0, 8.0, 18.0, 14.0, 21.0, 30.0, 25.0, 42.0, 53.0, 72.0, 91.0, 81.0, 76.0, 69.0, 75.0, 66.0, 44.0, 40.0, 35.0, 24.0, 22.0, 11.0, 18.0, 8.0, 9.0, 9.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.002529144287109375, -0.0024555325508117676, -0.00238192081451416, -0.0023083090782165527, -0.0022346973419189453, -0.002161085605621338, -0.0020874738693237305, -0.002013862133026123, -0.0019402503967285156, -0.0018666386604309082, -0.0017930269241333008, -0.0017194151878356934, -0.001645803451538086, -0.0015721917152404785, -0.001498579978942871, -0.0014249682426452637, -0.0013513565063476562, -0.0012777447700500488, -0.0012041330337524414, -0.001130521297454834, -0.0010569095611572266, -0.0009832978248596191, -0.0009096860885620117, -0.0008360743522644043, -0.0007624626159667969, -0.0006888508796691895, -0.000615239143371582, -0.0005416274070739746, -0.0004680156707763672, -0.00039440393447875977, -0.00032079219818115234, -0.0002471804618835449, -0.0001735687255859375, -9.995698928833008e-05, -2.6345252990722656e-05, 4.7266483306884766e-05, 0.00012087821960449219, 0.0001944899559020996, 0.00026810169219970703, 0.00034171342849731445, 0.0004153251647949219, 0.0004889369010925293, 0.0005625486373901367, 0.0006361603736877441, 0.0007097721099853516, 0.000783383846282959, 0.0008569955825805664, 0.0009306073188781738, 0.0010042190551757812, 0.0010778307914733887, 0.001151442527770996, 0.0012250542640686035, 0.001298666000366211, 0.0013722777366638184, 0.0014458894729614258, 0.0015195012092590332, 0.0015931129455566406, 0.001666724681854248, 0.0017403364181518555, 0.0018139481544494629, 0.0018875598907470703, 0.0019611716270446777, 0.002034783363342285, 0.0021083950996398926, 0.0021820068359375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 7.0, 8.0, 3.0, 9.0, 5.0, 9.0, 19.0, 14.0, 24.0, 24.0, 41.0, 43.0, 54.0, 47.0, 75.0, 82.0, 72.0, 69.0, 59.0, 62.0, 60.0, 38.0, 36.0, 19.0, 21.0, 15.0, 10.0, 16.0, 6.0, 14.0, 6.0, 3.0, 2.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.00634765625, -9.646516799926758, -9.286685943603516, -8.926855087280273, -8.567024230957031, -8.207194328308105, -7.847363471984863, -7.487532615661621, -7.127701759338379, -6.767870903015137, -6.4080400466918945, -6.0482096672058105, -5.688378810882568, -5.328547954559326, -4.968717575073242, -4.60888671875, -4.249055862426758, -3.8892250061035156, -3.5293943881988525, -3.1695637702941895, -2.8097329139709473, -2.449902057647705, -2.090071439743042, -1.730240821838379, -1.3704099655151367, -1.010579228401184, -0.6507484912872314, -0.2909177541732788, 0.06891298294067383, 0.42874372005462646, 0.7885744571685791, 1.1484050750732422, 1.508234977722168, 1.8680657148361206, 2.2278964519500732, 2.5877270698547363, 2.9475579261779785, 3.3073887825012207, 3.667219400405884, 4.027050018310547, 4.386880874633789, 4.746711730957031, 5.106542587280273, 5.466372966766357, 5.8262038230896, 6.186034679412842, 6.545865058898926, 6.905695915222168, 7.26552677154541, 7.625357627868652, 7.9851884841918945, 8.345019340515137, 8.704849243164062, 9.064680099487305, 9.424510955810547, 9.784341812133789, 10.144172668457031, 10.504003524780273, 10.863834381103516, 11.223665237426758, 11.58349609375, 11.943325996398926, 12.303156852722168, 12.66298770904541, 13.022818565368652]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 13.0, 13.0, 7.0, 22.0, 15.0, 15.0, 20.0, 29.0, 23.0, 31.0, 33.0, 27.0, 39.0, 37.0, 34.0, 35.0, 42.0, 40.0, 34.0, 41.0, 43.0, 38.0, 44.0, 37.0, 32.0, 28.0, 33.0, 29.0, 18.0, 18.0, 23.0, 13.0, 14.0, 13.0, 8.0, 4.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.749335289001465, -8.447405815124512, -8.145476341247559, -7.843547344207764, -7.5416178703308105, -7.239688396453857, -6.9377593994140625, -6.635829925537109, -6.333900451660156, -6.031970977783203, -5.73004150390625, -5.428112506866455, -5.126183032989502, -4.824253559112549, -4.522324562072754, -4.220395088195801, -3.9184656143188477, -3.6165361404418945, -3.3146069049835205, -3.0126776695251465, -2.7107481956481934, -2.4088187217712402, -2.106889486312866, -1.8049602508544922, -1.503030776977539, -1.2011014223098755, -0.8991720676422119, -0.5972427129745483, -0.29531335830688477, 0.006615996360778809, 0.3085453510284424, 0.6104745864868164, 0.9124031066894531, 1.2143324613571167, 1.5162618160247803, 1.8181911706924438, 2.1201205253601074, 2.4220499992370605, 2.7239792346954346, 3.0259084701538086, 3.3278379440307617, 3.629767417907715, 3.931696653366089, 4.233625888824463, 4.535555362701416, 4.837484836578369, 5.139413833618164, 5.441343307495117, 5.74327278137207, 6.045202255249023, 6.347131729125977, 6.6490607261657715, 6.950990200042725, 7.252919673919678, 7.554848670959473, 7.856778144836426, 8.158707618713379, 8.460637092590332, 8.762566566467285, 9.064496040344238, 9.366424560546875, 9.668354034423828, 9.970283508300781, 10.272212982177734, 10.574142456054688]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 9.0, 12.0, 27.0, 28.0, 40.0, 75.0, 88.0, 178.0, 284.0, 362.0, 684.0, 1089.0, 1741.0, 2886.0, 4429.0, 7719.0, 13032.0, 22386.0, 41477.0, 80141.0, 151204.0, 233093.0, 213511.0, 126961.0, 65577.0, 34498.0, 19026.0, 11058.0, 6516.0, 3942.0, 2441.0, 1485.0, 925.0, 595.0, 352.0, 234.0, 164.0, 107.0, 56.0, 36.0, 25.0, 22.0, 12.0, 8.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-22.8125, -22.157958984375, -21.50341796875, -20.848876953125, -20.1943359375, -19.539794921875, -18.88525390625, -18.230712890625, -17.576171875, -16.921630859375, -16.26708984375, -15.612548828125, -14.9580078125, -14.303466796875, -13.64892578125, -12.994384765625, -12.33984375, -11.685302734375, -11.03076171875, -10.376220703125, -9.7216796875, -9.067138671875, -8.41259765625, -7.758056640625, -7.103515625, -6.448974609375, -5.79443359375, -5.139892578125, -4.4853515625, -3.830810546875, -3.17626953125, -2.521728515625, -1.8671875, -1.212646484375, -0.55810546875, 0.096435546875, 0.7509765625, 1.405517578125, 2.06005859375, 2.714599609375, 3.369140625, 4.023681640625, 4.67822265625, 5.332763671875, 5.9873046875, 6.641845703125, 7.29638671875, 7.950927734375, 8.60546875, 9.260009765625, 9.91455078125, 10.569091796875, 11.2236328125, 11.878173828125, 12.53271484375, 13.187255859375, 13.841796875, 14.496337890625, 15.15087890625, 15.805419921875, 16.4599609375, 17.114501953125, 17.76904296875, 18.423583984375, 19.078125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 0.0, 3.0, 6.0, 6.0, 13.0, 6.0, 12.0, 9.0, 17.0, 16.0, 26.0, 24.0, 24.0, 21.0, 37.0, 34.0, 26.0, 37.0, 24.0, 41.0, 39.0, 34.0, 44.0, 43.0, 38.0, 39.0, 44.0, 44.0, 34.0, 36.0, 35.0, 24.0, 20.0, 28.0, 13.0, 18.0, 14.0, 16.0, 8.0, 7.0, 11.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.8863525390625, -7.600830078125, -7.3153076171875, -7.02978515625, -6.7442626953125, -6.458740234375, -6.1732177734375, -5.8876953125, -5.6021728515625, -5.316650390625, -5.0311279296875, -4.74560546875, -4.4600830078125, -4.174560546875, -3.8890380859375, -3.603515625, -3.3179931640625, -3.032470703125, -2.7469482421875, -2.46142578125, -2.1759033203125, -1.890380859375, -1.6048583984375, -1.3193359375, -1.0338134765625, -0.748291015625, -0.4627685546875, -0.17724609375, 0.1082763671875, 0.393798828125, 0.6793212890625, 0.96484375, 1.2503662109375, 1.535888671875, 1.8214111328125, 2.10693359375, 2.3924560546875, 2.677978515625, 2.9635009765625, 3.2490234375, 3.5345458984375, 3.820068359375, 4.1055908203125, 4.39111328125, 4.6766357421875, 4.962158203125, 5.2476806640625, 5.533203125, 5.8187255859375, 6.104248046875, 6.3897705078125, 6.67529296875, 6.9608154296875, 7.246337890625, 7.5318603515625, 7.8173828125, 8.1029052734375, 8.388427734375, 8.6739501953125, 8.95947265625, 9.2449951171875, 9.530517578125, 9.8160400390625, 10.1015625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 19.0, 18.0, 34.0, 46.0, 84.0, 109.0, 152.0, 241.0, 325.0, 446.0, 725.0, 993.0, 1460.0, 2146.0, 3280.0, 4868.0, 7214.0, 10895.0, 16614.0, 25204.0, 39286.0, 61913.0, 96166.0, 140769.0, 172062.0, 153907.0, 109085.0, 70697.0, 44717.0, 28902.0, 18636.0, 12413.0, 8242.0, 5619.0, 3609.0, 2372.0, 1668.0, 1145.0, 844.0, 500.0, 319.0, 266.0, 160.0, 122.0, 70.0, 56.0, 47.0, 22.0, 19.0, 18.0, 10.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-14.1328125, -13.686279296875, -13.23974609375, -12.793212890625, -12.3466796875, -11.900146484375, -11.45361328125, -11.007080078125, -10.560546875, -10.114013671875, -9.66748046875, -9.220947265625, -8.7744140625, -8.327880859375, -7.88134765625, -7.434814453125, -6.98828125, -6.541748046875, -6.09521484375, -5.648681640625, -5.2021484375, -4.755615234375, -4.30908203125, -3.862548828125, -3.416015625, -2.969482421875, -2.52294921875, -2.076416015625, -1.6298828125, -1.183349609375, -0.73681640625, -0.290283203125, 0.15625, 0.602783203125, 1.04931640625, 1.495849609375, 1.9423828125, 2.388916015625, 2.83544921875, 3.281982421875, 3.728515625, 4.175048828125, 4.62158203125, 5.068115234375, 5.5146484375, 5.961181640625, 6.40771484375, 6.854248046875, 7.30078125, 7.747314453125, 8.19384765625, 8.640380859375, 9.0869140625, 9.533447265625, 9.97998046875, 10.426513671875, 10.873046875, 11.319580078125, 11.76611328125, 12.212646484375, 12.6591796875, 13.105712890625, 13.55224609375, 13.998779296875, 14.4453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 7.0, 12.0, 12.0, 15.0, 15.0, 17.0, 36.0, 24.0, 23.0, 38.0, 35.0, 46.0, 30.0, 30.0, 31.0, 44.0, 37.0, 22.0, 37.0, 33.0, 40.0, 47.0, 43.0, 42.0, 35.0, 34.0, 25.0, 26.0, 30.0, 21.0, 20.0, 17.0, 19.0, 8.0, 7.0, 6.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.24554443359375, -5.0653076171875, -4.88507080078125, -4.704833984375, -4.52459716796875, -4.3443603515625, -4.16412353515625, -3.98388671875, -3.80364990234375, -3.6234130859375, -3.44317626953125, -3.262939453125, -3.08270263671875, -2.9024658203125, -2.72222900390625, -2.5419921875, -2.36175537109375, -2.1815185546875, -2.00128173828125, -1.821044921875, -1.64080810546875, -1.4605712890625, -1.28033447265625, -1.10009765625, -0.91986083984375, -0.7396240234375, -0.55938720703125, -0.379150390625, -0.19891357421875, -0.0186767578125, 0.16156005859375, 0.341796875, 0.52203369140625, 0.7022705078125, 0.88250732421875, 1.062744140625, 1.24298095703125, 1.4232177734375, 1.60345458984375, 1.78369140625, 1.96392822265625, 2.1441650390625, 2.32440185546875, 2.504638671875, 2.68487548828125, 2.8651123046875, 3.04534912109375, 3.2255859375, 3.40582275390625, 3.5860595703125, 3.76629638671875, 3.946533203125, 4.12677001953125, 4.3070068359375, 4.48724365234375, 4.66748046875, 4.84771728515625, 5.0279541015625, 5.20819091796875, 5.388427734375, 5.56866455078125, 5.7489013671875, 5.92913818359375, 6.109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 11.0, 8.0, 13.0, 29.0, 44.0, 53.0, 62.0, 92.0, 129.0, 213.0, 309.0, 445.0, 636.0, 1017.0, 1606.0, 2574.0, 4428.0, 7887.0, 14822.0, 32792.0, 94291.0, 392055.0, 348799.0, 83905.0, 29938.0, 13856.0, 7425.0, 4132.0, 2533.0, 1452.0, 1007.0, 657.0, 395.0, 302.0, 200.0, 141.0, 86.0, 72.0, 38.0, 38.0, 28.0, 20.0, 11.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.232421875, -2.1646728515625, -2.096923828125, -2.0291748046875, -1.96142578125, -1.8936767578125, -1.825927734375, -1.7581787109375, -1.6904296875, -1.6226806640625, -1.554931640625, -1.4871826171875, -1.41943359375, -1.3516845703125, -1.283935546875, -1.2161865234375, -1.1484375, -1.0806884765625, -1.012939453125, -0.9451904296875, -0.87744140625, -0.8096923828125, -0.741943359375, -0.6741943359375, -0.6064453125, -0.5386962890625, -0.470947265625, -0.4031982421875, -0.33544921875, -0.2677001953125, -0.199951171875, -0.1322021484375, -0.064453125, 0.0032958984375, 0.071044921875, 0.1387939453125, 0.20654296875, 0.2742919921875, 0.342041015625, 0.4097900390625, 0.4775390625, 0.5452880859375, 0.613037109375, 0.6807861328125, 0.74853515625, 0.8162841796875, 0.884033203125, 0.9517822265625, 1.01953125, 1.0872802734375, 1.155029296875, 1.2227783203125, 1.29052734375, 1.3582763671875, 1.426025390625, 1.4937744140625, 1.5615234375, 1.6292724609375, 1.697021484375, 1.7647705078125, 1.83251953125, 1.9002685546875, 1.968017578125, 2.0357666015625, 2.103515625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 8.0, 8.0, 8.0, 8.0, 18.0, 26.0, 34.0, 41.0, 48.0, 69.0, 74.0, 88.0, 89.0, 92.0, 83.0, 64.0, 56.0, 42.0, 29.0, 24.0, 18.0, 15.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012731552124023438, -0.00012340396642684937, -0.00011949241161346436, -0.00011558085680007935, -0.00011166930198669434, -0.00010775774717330933, -0.00010384619235992432, -9.99346375465393e-05, -9.60230827331543e-05, -9.211152791976929e-05, -8.819997310638428e-05, -8.428841829299927e-05, -8.037686347961426e-05, -7.646530866622925e-05, -7.255375385284424e-05, -6.864219903945923e-05, -6.473064422607422e-05, -6.081908941268921e-05, -5.69075345993042e-05, -5.299597978591919e-05, -4.908442497253418e-05, -4.517287015914917e-05, -4.126131534576416e-05, -3.734976053237915e-05, -3.343820571899414e-05, -2.952665090560913e-05, -2.561509609222412e-05, -2.170354127883911e-05, -1.77919864654541e-05, -1.3880431652069092e-05, -9.968876838684082e-06, -6.057322025299072e-06, -2.1457672119140625e-06, 1.7657876014709473e-06, 5.677342414855957e-06, 9.588897228240967e-06, 1.3500452041625977e-05, 1.7412006855010986e-05, 2.1323561668395996e-05, 2.5235116481781006e-05, 2.9146671295166016e-05, 3.3058226108551025e-05, 3.6969780921936035e-05, 4.0881335735321045e-05, 4.4792890548706055e-05, 4.8704445362091064e-05, 5.2616000175476074e-05, 5.6527554988861084e-05, 6.0439109802246094e-05, 6.43506646156311e-05, 6.826221942901611e-05, 7.217377424240112e-05, 7.608532905578613e-05, 7.999688386917114e-05, 8.390843868255615e-05, 8.781999349594116e-05, 9.173154830932617e-05, 9.564310312271118e-05, 9.955465793609619e-05, 0.0001034662127494812, 0.00010737776756286621, 0.00011128932237625122, 0.00011520087718963623, 0.00011911243200302124, 0.00012302398681640625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 4.0, 8.0, 21.0, 19.0, 29.0, 40.0, 49.0, 98.0, 122.0, 163.0, 228.0, 389.0, 549.0, 759.0, 1119.0, 1605.0, 2445.0, 3742.0, 6009.0, 9845.0, 17474.0, 33882.0, 76594.0, 238122.0, 401538.0, 139987.0, 52556.0, 25206.0, 13589.0, 7795.0, 4816.0, 3139.0, 2055.0, 1436.0, 970.0, 647.0, 450.0, 334.0, 233.0, 149.0, 114.0, 76.0, 48.0, 27.0, 27.0, 22.0, 9.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.70703125, -1.6541595458984375, -1.601287841796875, -1.5484161376953125, -1.49554443359375, -1.4426727294921875, -1.389801025390625, -1.3369293212890625, -1.2840576171875, -1.2311859130859375, -1.178314208984375, -1.1254425048828125, -1.07257080078125, -1.0196990966796875, -0.966827392578125, -0.9139556884765625, -0.861083984375, -0.8082122802734375, -0.755340576171875, -0.7024688720703125, -0.64959716796875, -0.5967254638671875, -0.543853759765625, -0.4909820556640625, -0.4381103515625, -0.3852386474609375, -0.332366943359375, -0.2794952392578125, -0.22662353515625, -0.1737518310546875, -0.120880126953125, -0.0680084228515625, -0.01513671875, 0.0377349853515625, 0.090606689453125, 0.1434783935546875, 0.19635009765625, 0.2492218017578125, 0.302093505859375, 0.3549652099609375, 0.4078369140625, 0.4607086181640625, 0.513580322265625, 0.5664520263671875, 0.61932373046875, 0.6721954345703125, 0.725067138671875, 0.7779388427734375, 0.830810546875, 0.8836822509765625, 0.936553955078125, 0.9894256591796875, 1.04229736328125, 1.0951690673828125, 1.148040771484375, 1.2009124755859375, 1.2537841796875, 1.3066558837890625, 1.359527587890625, 1.4123992919921875, 1.46527099609375, 1.5181427001953125, 1.571014404296875, 1.6238861083984375, 1.6767578125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 5.0, 4.0, 6.0, 12.0, 16.0, 26.0, 21.0, 23.0, 33.0, 42.0, 40.0, 62.0, 71.0, 77.0, 87.0, 79.0, 74.0, 55.0, 54.0, 34.0, 30.0, 24.0, 21.0, 14.0, 14.0, 8.0, 9.0, 3.0, 6.0, 5.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5090484619140625, -0.492218017578125, -0.4753875732421875, -0.45855712890625, -0.4417266845703125, -0.424896240234375, -0.4080657958984375, -0.3912353515625, -0.3744049072265625, -0.357574462890625, -0.3407440185546875, -0.32391357421875, -0.3070831298828125, -0.290252685546875, -0.2734222412109375, -0.256591796875, -0.2397613525390625, -0.222930908203125, -0.2061004638671875, -0.18927001953125, -0.1724395751953125, -0.155609130859375, -0.1387786865234375, -0.1219482421875, -0.1051177978515625, -0.088287353515625, -0.0714569091796875, -0.05462646484375, -0.0377960205078125, -0.020965576171875, -0.0041351318359375, 0.0126953125, 0.0295257568359375, 0.046356201171875, 0.0631866455078125, 0.08001708984375, 0.0968475341796875, 0.113677978515625, 0.1305084228515625, 0.1473388671875, 0.1641693115234375, 0.180999755859375, 0.1978302001953125, 0.21466064453125, 0.2314910888671875, 0.248321533203125, 0.2651519775390625, 0.281982421875, 0.2988128662109375, 0.315643310546875, 0.3324737548828125, 0.34930419921875, 0.3661346435546875, 0.382965087890625, 0.3997955322265625, 0.4166259765625, 0.4334564208984375, 0.450286865234375, 0.4671173095703125, 0.48394775390625, 0.5007781982421875, 0.517608642578125, 0.5344390869140625, 0.55126953125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 13.0, 3.0, 5.0, 15.0, 10.0, 18.0, 14.0, 25.0, 37.0, 48.0, 49.0, 61.0, 61.0, 74.0, 77.0, 73.0, 61.0, 57.0, 50.0, 48.0, 38.0, 21.0, 15.0, 31.0, 13.0, 18.0, 13.0, 3.0, 6.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-10.960943222045898, -10.617575645446777, -10.27420711517334, -9.930839538574219, -9.587471008300781, -9.24410343170166, -8.900735855102539, -8.557367324829102, -8.213998794555664, -7.870630741119385, -7.5272626876831055, -7.183895111083984, -6.840526580810547, -6.497159004211426, -6.1537909507751465, -5.810422897338867, -5.467055320739746, -5.123687267303467, -4.7803192138671875, -4.436951637268066, -4.093583106994629, -3.7502152919769287, -3.4068474769592285, -3.063479423522949, -2.72011137008667, -2.3767433166503906, -2.0333752632141113, -1.6900074481964111, -1.3466393947601318, -1.0032713413238525, -0.6599035263061523, -0.31653547286987305, 0.026831626892089844, 0.37019962072372437, 0.7135676145553589, 1.0569355487823486, 1.400303602218628, 1.7436716556549072, 2.0870394706726074, 2.4304075241088867, 2.773775577545166, 3.1171436309814453, 3.4605116844177246, 3.803879499435425, 4.147247314453125, 4.4906158447265625, 4.833983421325684, 5.177351474761963, 5.520719528198242, 5.8640875816345215, 6.207455635070801, 6.550823211669922, 6.894191741943359, 7.2375593185424805, 7.58092737197876, 7.924295425415039, 8.267663955688477, 8.611031532287598, 8.954400062561035, 9.297767639160156, 9.641136169433594, 9.984503746032715, 10.327871322631836, 10.671239852905273, 11.014607429504395]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 8.0, 8.0, 7.0, 6.0, 10.0, 11.0, 18.0, 13.0, 26.0, 23.0, 25.0, 27.0, 26.0, 32.0, 38.0, 38.0, 35.0, 27.0, 43.0, 34.0, 39.0, 36.0, 37.0, 40.0, 34.0, 40.0, 38.0, 32.0, 30.0, 32.0, 27.0, 26.0, 19.0, 17.0, 18.0, 9.0, 15.0, 12.0, 9.0, 8.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.053244590759277, -8.761343002319336, -8.469441413879395, -8.177539825439453, -7.885638236999512, -7.59373664855957, -7.301835060119629, -7.0099334716796875, -6.718031883239746, -6.426130294799805, -6.134228706359863, -5.842327117919922, -5.5504255294799805, -5.258523941040039, -4.966622352600098, -4.674720764160156, -4.382819175720215, -4.090917587280273, -3.799015998840332, -3.5071144104003906, -3.215212821960449, -2.923311233520508, -2.6314096450805664, -2.339508056640625, -2.0476064682006836, -1.7557048797607422, -1.4638032913208008, -1.1719017028808594, -0.880000114440918, -0.5880985260009766, -0.29619693756103516, -0.00429534912109375, 0.28760623931884766, 0.5795078277587891, 0.8714094161987305, 1.1633110046386719, 1.4552125930786133, 1.7471141815185547, 2.039015769958496, 2.3309173583984375, 2.622818946838379, 2.9147205352783203, 3.2066221237182617, 3.498523712158203, 3.7904253005981445, 4.082326889038086, 4.374228477478027, 4.666130065917969, 4.95803165435791, 5.249933242797852, 5.541834831237793, 5.833736419677734, 6.125638008117676, 6.417539596557617, 6.709441184997559, 7.0013427734375, 7.293244361877441, 7.585145950317383, 7.877047538757324, 8.168949127197266, 8.460850715637207, 8.752752304077148, 9.04465389251709, 9.336555480957031, 9.628457069396973]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 13.0, 9.0, 19.0, 34.0, 49.0, 73.0, 96.0, 148.0, 238.0, 407.0, 547.0, 959.0, 1456.0, 2397.0, 4074.0, 6847.0, 11500.0, 20101.0, 36043.0, 67012.0, 133089.0, 343586.0, 1292142.0, 1510907.0, 443926.0, 150816.0, 73742.0, 39472.0, 22317.0, 12657.0, 7489.0, 4613.0, 2742.0, 1634.0, 1118.0, 678.0, 450.0, 294.0, 192.0, 152.0, 66.0, 57.0, 30.0, 28.0, 21.0, 21.0, 6.0, 5.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-15.828125, -15.319091796875, -14.81005859375, -14.301025390625, -13.7919921875, -13.282958984375, -12.77392578125, -12.264892578125, -11.755859375, -11.246826171875, -10.73779296875, -10.228759765625, -9.7197265625, -9.210693359375, -8.70166015625, -8.192626953125, -7.68359375, -7.174560546875, -6.66552734375, -6.156494140625, -5.6474609375, -5.138427734375, -4.62939453125, -4.120361328125, -3.611328125, -3.102294921875, -2.59326171875, -2.084228515625, -1.5751953125, -1.066162109375, -0.55712890625, -0.048095703125, 0.4609375, 0.969970703125, 1.47900390625, 1.988037109375, 2.4970703125, 3.006103515625, 3.51513671875, 4.024169921875, 4.533203125, 5.042236328125, 5.55126953125, 6.060302734375, 6.5693359375, 7.078369140625, 7.58740234375, 8.096435546875, 8.60546875, 9.114501953125, 9.62353515625, 10.132568359375, 10.6416015625, 11.150634765625, 11.65966796875, 12.168701171875, 12.677734375, 13.186767578125, 13.69580078125, 14.204833984375, 14.7138671875, 15.222900390625, 15.73193359375, 16.240966796875, 16.75]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 10.0, 6.0, 15.0, 10.0, 16.0, 21.0, 21.0, 25.0, 29.0, 22.0, 39.0, 41.0, 33.0, 36.0, 24.0, 41.0, 36.0, 36.0, 39.0, 44.0, 46.0, 44.0, 40.0, 24.0, 43.0, 30.0, 28.0, 29.0, 32.0, 25.0, 15.0, 9.0, 12.0, 13.0, 9.0, 16.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.54278564453125, -7.2847900390625, -7.02679443359375, -6.768798828125, -6.51080322265625, -6.2528076171875, -5.99481201171875, -5.73681640625, -5.47882080078125, -5.2208251953125, -4.96282958984375, -4.704833984375, -4.44683837890625, -4.1888427734375, -3.93084716796875, -3.6728515625, -3.41485595703125, -3.1568603515625, -2.89886474609375, -2.640869140625, -2.38287353515625, -2.1248779296875, -1.86688232421875, -1.60888671875, -1.35089111328125, -1.0928955078125, -0.83489990234375, -0.576904296875, -0.31890869140625, -0.0609130859375, 0.19708251953125, 0.455078125, 0.71307373046875, 0.9710693359375, 1.22906494140625, 1.487060546875, 1.74505615234375, 2.0030517578125, 2.26104736328125, 2.51904296875, 2.77703857421875, 3.0350341796875, 3.29302978515625, 3.551025390625, 3.80902099609375, 4.0670166015625, 4.32501220703125, 4.5830078125, 4.84100341796875, 5.0989990234375, 5.35699462890625, 5.614990234375, 5.87298583984375, 6.1309814453125, 6.38897705078125, 6.64697265625, 6.90496826171875, 7.1629638671875, 7.42095947265625, 7.678955078125, 7.93695068359375, 8.1949462890625, 8.45294189453125, 8.7109375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 10.0, 17.0, 14.0, 28.0, 48.0, 77.0, 129.0, 230.0, 296.0, 575.0, 897.0, 1507.0, 2590.0, 4295.0, 7352.0, 12737.0, 23153.0, 43965.0, 85350.0, 178654.0, 410358.0, 1161161.0, 1376615.0, 477837.0, 202140.0, 95752.0, 48817.0, 25929.0, 14248.0, 8112.0, 4545.0, 2772.0, 1549.0, 988.0, 571.0, 373.0, 201.0, 141.0, 80.0, 76.0, 36.0, 22.0, 13.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-15.8984375, -15.4178466796875, -14.937255859375, -14.4566650390625, -13.97607421875, -13.4954833984375, -13.014892578125, -12.5343017578125, -12.0537109375, -11.5731201171875, -11.092529296875, -10.6119384765625, -10.13134765625, -9.6507568359375, -9.170166015625, -8.6895751953125, -8.208984375, -7.7283935546875, -7.247802734375, -6.7672119140625, -6.28662109375, -5.8060302734375, -5.325439453125, -4.8448486328125, -4.3642578125, -3.8836669921875, -3.403076171875, -2.9224853515625, -2.44189453125, -1.9613037109375, -1.480712890625, -1.0001220703125, -0.51953125, -0.0389404296875, 0.441650390625, 0.9222412109375, 1.40283203125, 1.8834228515625, 2.364013671875, 2.8446044921875, 3.3251953125, 3.8057861328125, 4.286376953125, 4.7669677734375, 5.24755859375, 5.7281494140625, 6.208740234375, 6.6893310546875, 7.169921875, 7.6505126953125, 8.131103515625, 8.6116943359375, 9.09228515625, 9.5728759765625, 10.053466796875, 10.5340576171875, 11.0146484375, 11.4952392578125, 11.975830078125, 12.4564208984375, 12.93701171875, 13.4176025390625, 13.898193359375, 14.3787841796875, 14.859375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 10.0, 16.0, 19.0, 20.0, 38.0, 32.0, 53.0, 63.0, 81.0, 90.0, 127.0, 145.0, 150.0, 208.0, 261.0, 376.0, 443.0, 413.0, 312.0, 240.0, 211.0, 135.0, 127.0, 98.0, 61.0, 74.0, 62.0, 30.0, 39.0, 35.0, 22.0, 20.0, 5.0, 12.0, 4.0, 5.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.97265625, -5.81011962890625, -5.6475830078125, -5.48504638671875, -5.322509765625, -5.15997314453125, -4.9974365234375, -4.83489990234375, -4.67236328125, -4.50982666015625, -4.3472900390625, -4.18475341796875, -4.022216796875, -3.85968017578125, -3.6971435546875, -3.53460693359375, -3.3720703125, -3.20953369140625, -3.0469970703125, -2.88446044921875, -2.721923828125, -2.55938720703125, -2.3968505859375, -2.23431396484375, -2.07177734375, -1.90924072265625, -1.7467041015625, -1.58416748046875, -1.421630859375, -1.25909423828125, -1.0965576171875, -0.93402099609375, -0.771484375, -0.60894775390625, -0.4464111328125, -0.28387451171875, -0.121337890625, 0.04119873046875, 0.2037353515625, 0.36627197265625, 0.52880859375, 0.69134521484375, 0.8538818359375, 1.01641845703125, 1.178955078125, 1.34149169921875, 1.5040283203125, 1.66656494140625, 1.8291015625, 1.99163818359375, 2.1541748046875, 2.31671142578125, 2.479248046875, 2.64178466796875, 2.8043212890625, 2.96685791015625, 3.12939453125, 3.29193115234375, 3.4544677734375, 3.61700439453125, 3.779541015625, 3.94207763671875, 4.1046142578125, 4.26715087890625, 4.4296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 7.0, 16.0, 14.0, 14.0, 20.0, 33.0, 42.0, 32.0, 51.0, 46.0, 64.0, 77.0, 68.0, 75.0, 58.0, 56.0, 42.0, 41.0, 46.0, 32.0, 31.0, 22.0, 17.0, 17.0, 11.0, 10.0, 5.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.66112995147705, -8.33098316192627, -8.000835418701172, -7.670688629150391, -7.340541839599609, -7.010395050048828, -6.680247783660889, -6.350100517272949, -6.019953727722168, -5.689806938171387, -5.359659671783447, -5.029512405395508, -4.699365615844727, -4.369218826293945, -4.039071559906006, -3.7089245319366455, -3.378777503967285, -3.048630475997925, -2.7184834480285645, -2.388336420059204, -2.0581893920898438, -1.7280423641204834, -1.397895336151123, -1.0677483081817627, -0.7376012802124023, -0.407454252243042, -0.07730722427368164, 0.2528398036956787, 0.5829868316650391, 0.9131338596343994, 1.2432808876037598, 1.5734279155731201, 1.903573989868164, 2.2337210178375244, 2.5638680458068848, 2.894015073776245, 3.2241621017456055, 3.554309129714966, 3.884456157684326, 4.214603424072266, 4.544750213623047, 4.874897003173828, 5.205044269561768, 5.535191535949707, 5.865338325500488, 6.1954851150512695, 6.525632381439209, 6.855779647827148, 7.18592643737793, 7.516073226928711, 7.84622049331665, 8.17636775970459, 8.506514549255371, 8.836661338806152, 9.16680908203125, 9.496955871582031, 9.827102661132812, 10.157249450683594, 10.487396240234375, 10.817543983459473, 11.147690773010254, 11.477837562561035, 11.807985305786133, 12.138132095336914, 12.468278884887695]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 8.0, 5.0, 7.0, 9.0, 7.0, 14.0, 22.0, 20.0, 28.0, 32.0, 16.0, 29.0, 24.0, 37.0, 30.0, 33.0, 40.0, 41.0, 31.0, 29.0, 38.0, 35.0, 39.0, 35.0, 27.0, 34.0, 36.0, 29.0, 34.0, 29.0, 24.0, 26.0, 25.0, 19.0, 18.0, 13.0, 20.0, 11.0, 8.0, 10.0, 9.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.781655788421631, -7.5052056312561035, -7.228755950927734, -6.952305793762207, -6.675856113433838, -6.3994059562683105, -6.122956275939941, -5.846506118774414, -5.570055961608887, -5.293605804443359, -5.01715612411499, -4.740705966949463, -4.464256286621094, -4.187806129455566, -3.911356210708618, -3.63490629196167, -3.358456611633301, -3.0820066928863525, -2.8055567741394043, -2.529106616973877, -2.252656936645508, -1.97620689868927, -1.6997568607330322, -1.423306941986084, -1.1468570232391357, -0.8704071044921875, -0.5939571261405945, -0.31750714778900146, -0.04105722904205322, 0.23539268970489502, 0.5118427276611328, 0.788292646408081, 1.0647430419921875, 1.3411929607391357, 1.617642879486084, 1.8940929174423218, 2.1705427169799805, 2.446992874145508, 2.723442792892456, 2.9998927116394043, 3.2763426303863525, 3.552792549133301, 3.829242467880249, 4.105692386627197, 4.382142543792725, 4.658592224121094, 4.935042381286621, 5.211492538452148, 5.487942218780518, 5.764392375946045, 6.040842056274414, 6.317292213439941, 6.5937418937683105, 6.870192050933838, 7.146641731262207, 7.423091888427734, 7.699542045593262, 7.975992202758789, 8.252442359924316, 8.528891563415527, 8.805341720581055, 9.081791877746582, 9.35824203491211, 9.63469123840332, 9.911141395568848]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 9.0, 14.0, 10.0, 20.0, 31.0, 22.0, 73.0, 82.0, 153.0, 203.0, 321.0, 446.0, 708.0, 959.0, 1517.0, 2309.0, 3438.0, 5423.0, 8439.0, 13160.0, 20547.0, 32909.0, 52219.0, 88145.0, 165095.0, 305110.0, 140744.0, 77672.0, 46965.0, 29089.0, 18672.0, 11961.0, 7617.0, 4819.0, 3262.0, 2142.0, 1409.0, 928.0, 604.0, 430.0, 298.0, 204.0, 114.0, 85.0, 50.0, 40.0, 26.0, 16.0, 16.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0], "bins": [-2.828125, -2.745880126953125, -2.66363525390625, -2.581390380859375, -2.4991455078125, -2.416900634765625, -2.33465576171875, -2.252410888671875, -2.170166015625, -2.087921142578125, -2.00567626953125, -1.923431396484375, -1.8411865234375, -1.758941650390625, -1.67669677734375, -1.594451904296875, -1.51220703125, -1.429962158203125, -1.34771728515625, -1.265472412109375, -1.1832275390625, -1.100982666015625, -1.01873779296875, -0.936492919921875, -0.854248046875, -0.772003173828125, -0.68975830078125, -0.607513427734375, -0.5252685546875, -0.443023681640625, -0.36077880859375, -0.278533935546875, -0.1962890625, -0.114044189453125, -0.03179931640625, 0.050445556640625, 0.1326904296875, 0.214935302734375, 0.29718017578125, 0.379425048828125, 0.461669921875, 0.543914794921875, 0.62615966796875, 0.708404541015625, 0.7906494140625, 0.872894287109375, 0.95513916015625, 1.037384033203125, 1.11962890625, 1.201873779296875, 1.28411865234375, 1.366363525390625, 1.4486083984375, 1.530853271484375, 1.61309814453125, 1.695343017578125, 1.777587890625, 1.859832763671875, 1.94207763671875, 2.024322509765625, 2.1065673828125, 2.188812255859375, 2.27105712890625, 2.353302001953125, 2.435546875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 9.0, 9.0, 12.0, 18.0, 15.0, 24.0, 23.0, 29.0, 29.0, 35.0, 29.0, 25.0, 39.0, 34.0, 41.0, 38.0, 30.0, 28.0, 37.0, 30.0, 37.0, 48.0, 35.0, 30.0, 36.0, 27.0, 31.0, 34.0, 25.0, 16.0, 20.0, 12.0, 16.0, 24.0, 14.0, 12.0, 8.0, 6.0, 5.0, 3.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.47265625, -7.18975830078125, -6.9068603515625, -6.62396240234375, -6.341064453125, -6.05816650390625, -5.7752685546875, -5.49237060546875, -5.20947265625, -4.92657470703125, -4.6436767578125, -4.36077880859375, -4.077880859375, -3.79498291015625, -3.5120849609375, -3.22918701171875, -2.9462890625, -2.66339111328125, -2.3804931640625, -2.09759521484375, -1.814697265625, -1.53179931640625, -1.2489013671875, -0.96600341796875, -0.68310546875, -0.40020751953125, -0.1173095703125, 0.16558837890625, 0.448486328125, 0.73138427734375, 1.0142822265625, 1.29718017578125, 1.580078125, 1.86297607421875, 2.1458740234375, 2.42877197265625, 2.711669921875, 2.99456787109375, 3.2774658203125, 3.56036376953125, 3.84326171875, 4.12615966796875, 4.4090576171875, 4.69195556640625, 4.974853515625, 5.25775146484375, 5.5406494140625, 5.82354736328125, 6.1064453125, 6.38934326171875, 6.6722412109375, 6.95513916015625, 7.238037109375, 7.52093505859375, 7.8038330078125, 8.08673095703125, 8.36962890625, 8.65252685546875, 8.9354248046875, 9.21832275390625, 9.501220703125, 9.78411865234375, 10.0670166015625, 10.34991455078125, 10.6328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 9.0, 21.0, 26.0, 50.0, 60.0, 108.0, 123.0, 239.0, 313.0, 497.0, 659.0, 1002.0, 1668.0, 2422.0, 3559.0, 5564.0, 8703.0, 14110.0, 22553.0, 36219.0, 59468.0, 106559.0, 253603.0, 263707.0, 107839.0, 60392.0, 36583.0, 22784.0, 14033.0, 9044.0, 5594.0, 3695.0, 2382.0, 1598.0, 1120.0, 750.0, 465.0, 339.0, 210.0, 147.0, 98.0, 54.0, 51.0, 33.0, 30.0, 22.0, 11.0, 14.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.662109375, -2.578948974609375, -2.49578857421875, -2.412628173828125, -2.3294677734375, -2.246307373046875, -2.16314697265625, -2.079986572265625, -1.996826171875, -1.913665771484375, -1.83050537109375, -1.747344970703125, -1.6641845703125, -1.581024169921875, -1.49786376953125, -1.414703369140625, -1.33154296875, -1.248382568359375, -1.16522216796875, -1.082061767578125, -0.9989013671875, -0.915740966796875, -0.83258056640625, -0.749420166015625, -0.666259765625, -0.583099365234375, -0.49993896484375, -0.416778564453125, -0.3336181640625, -0.250457763671875, -0.16729736328125, -0.084136962890625, -0.0009765625, 0.082183837890625, 0.16534423828125, 0.248504638671875, 0.3316650390625, 0.414825439453125, 0.49798583984375, 0.581146240234375, 0.664306640625, 0.747467041015625, 0.83062744140625, 0.913787841796875, 0.9969482421875, 1.080108642578125, 1.16326904296875, 1.246429443359375, 1.32958984375, 1.412750244140625, 1.49591064453125, 1.579071044921875, 1.6622314453125, 1.745391845703125, 1.82855224609375, 1.911712646484375, 1.994873046875, 2.078033447265625, 2.16119384765625, 2.244354248046875, 2.3275146484375, 2.410675048828125, 2.49383544921875, 2.576995849609375, 2.66015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 12.0, 8.0, 9.0, 9.0, 15.0, 18.0, 28.0, 14.0, 25.0, 23.0, 32.0, 28.0, 35.0, 33.0, 49.0, 33.0, 39.0, 38.0, 53.0, 42.0, 33.0, 44.0, 32.0, 43.0, 31.0, 38.0, 25.0, 26.0, 29.0, 24.0, 20.0, 26.0, 19.0, 21.0, 14.0, 10.0, 4.0, 10.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-6.6875, -6.4949951171875, -6.302490234375, -6.1099853515625, -5.91748046875, -5.7249755859375, -5.532470703125, -5.3399658203125, -5.1474609375, -4.9549560546875, -4.762451171875, -4.5699462890625, -4.37744140625, -4.1849365234375, -3.992431640625, -3.7999267578125, -3.607421875, -3.4149169921875, -3.222412109375, -3.0299072265625, -2.83740234375, -2.6448974609375, -2.452392578125, -2.2598876953125, -2.0673828125, -1.8748779296875, -1.682373046875, -1.4898681640625, -1.29736328125, -1.1048583984375, -0.912353515625, -0.7198486328125, -0.52734375, -0.3348388671875, -0.142333984375, 0.0501708984375, 0.24267578125, 0.4351806640625, 0.627685546875, 0.8201904296875, 1.0126953125, 1.2052001953125, 1.397705078125, 1.5902099609375, 1.78271484375, 1.9752197265625, 2.167724609375, 2.3602294921875, 2.552734375, 2.7452392578125, 2.937744140625, 3.1302490234375, 3.32275390625, 3.5152587890625, 3.707763671875, 3.9002685546875, 4.0927734375, 4.2852783203125, 4.477783203125, 4.6702880859375, 4.86279296875, 5.0552978515625, 5.247802734375, 5.4403076171875, 5.6328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 14.0, 21.0, 30.0, 41.0, 47.0, 70.0, 84.0, 140.0, 170.0, 232.0, 309.0, 490.0, 699.0, 971.0, 1457.0, 2159.0, 3409.0, 5231.0, 8354.0, 13362.0, 23423.0, 43028.0, 90359.0, 221620.0, 339251.0, 147554.0, 64480.0, 32862.0, 18178.0, 10705.0, 6651.0, 4353.0, 2807.0, 1870.0, 1246.0, 842.0, 593.0, 401.0, 289.0, 189.0, 159.0, 109.0, 94.0, 52.0, 42.0, 31.0, 19.0, 19.0, 9.0, 8.0, 9.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.004528045654296875, -0.004387795925140381, -0.004247546195983887, -0.004107296466827393, -0.0039670467376708984, -0.0038267970085144043, -0.00368654727935791, -0.003546297550201416, -0.003406047821044922, -0.0032657980918884277, -0.0031255483627319336, -0.0029852986335754395, -0.0028450489044189453, -0.002704799175262451, -0.002564549446105957, -0.002424299716949463, -0.0022840499877929688, -0.0021438002586364746, -0.0020035505294799805, -0.0018633008003234863, -0.0017230510711669922, -0.001582801342010498, -0.001442551612854004, -0.0013023018836975098, -0.0011620521545410156, -0.0010218024253845215, -0.0008815526962280273, -0.0007413029670715332, -0.0006010532379150391, -0.0004608035087585449, -0.0003205537796020508, -0.00018030405044555664, -4.00543212890625e-05, 0.00010019540786743164, 0.00024044513702392578, 0.0003806948661804199, 0.0005209445953369141, 0.0006611943244934082, 0.0008014440536499023, 0.0009416937828063965, 0.0010819435119628906, 0.0012221932411193848, 0.001362442970275879, 0.001502692699432373, 0.0016429424285888672, 0.0017831921577453613, 0.0019234418869018555, 0.0020636916160583496, 0.0022039413452148438, 0.002344191074371338, 0.002484440803527832, 0.002624690532684326, 0.0027649402618408203, 0.0029051899909973145, 0.0030454397201538086, 0.0031856894493103027, 0.003325939178466797, 0.003466188907623291, 0.003606438636779785, 0.0037466883659362793, 0.0038869380950927734, 0.004027187824249268, 0.004167437553405762, 0.004307687282562256, 0.00444793701171875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 1.0, 4.0, 10.0, 6.0, 7.0, 14.0, 16.0, 20.0, 30.0, 22.0, 23.0, 58.0, 34.0, 38.0, 79.0, 44.0, 55.0, 96.0, 46.0, 50.0, 62.0, 33.0, 26.0, 68.0, 17.0, 26.0, 20.0, 10.0, 11.0, 15.0, 6.0, 8.0, 10.0, 7.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.589557647705078e-06, -4.450790584087372e-06, -4.3120235204696655e-06, -4.173256456851959e-06, -4.034489393234253e-06, -3.895722329616547e-06, -3.7569552659988403e-06, -3.618188202381134e-06, -3.4794211387634277e-06, -3.3406540751457214e-06, -3.201887011528015e-06, -3.063119947910309e-06, -2.9243528842926025e-06, -2.7855858206748962e-06, -2.64681875705719e-06, -2.5080516934394836e-06, -2.3692846298217773e-06, -2.230517566204071e-06, -2.0917505025863647e-06, -1.9529834389686584e-06, -1.8142163753509521e-06, -1.6754493117332458e-06, -1.5366822481155396e-06, -1.3979151844978333e-06, -1.259148120880127e-06, -1.1203810572624207e-06, -9.816139936447144e-07, -8.428469300270081e-07, -7.040798664093018e-07, -5.653128027915955e-07, -4.2654573917388916e-07, -2.8777867555618286e-07, -1.4901161193847656e-07, -1.0244548320770264e-08, 1.2852251529693604e-07, 2.6728957891464233e-07, 4.0605664253234863e-07, 5.448237061500549e-07, 6.835907697677612e-07, 8.223578333854675e-07, 9.611248970031738e-07, 1.0998919606208801e-06, 1.2386590242385864e-06, 1.3774260878562927e-06, 1.516193151473999e-06, 1.6549602150917053e-06, 1.7937272787094116e-06, 1.932494342327118e-06, 2.0712614059448242e-06, 2.2100284695625305e-06, 2.348795533180237e-06, 2.487562596797943e-06, 2.6263296604156494e-06, 2.7650967240333557e-06, 2.903863787651062e-06, 3.0426308512687683e-06, 3.1813979148864746e-06, 3.320164978504181e-06, 3.458932042121887e-06, 3.5976991057395935e-06, 3.7364661693573e-06, 3.875233232975006e-06, 4.014000296592712e-06, 4.152767360210419e-06, 4.291534423828125e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 9.0, 5.0, 13.0, 12.0, 23.0, 22.0, 42.0, 58.0, 71.0, 130.0, 182.0, 239.0, 367.0, 546.0, 721.0, 1099.0, 1555.0, 2400.0, 3489.0, 5578.0, 8462.0, 13597.0, 23067.0, 41238.0, 80221.0, 177044.0, 325407.0, 178877.0, 80829.0, 41210.0, 23191.0, 13982.0, 8533.0, 5348.0, 3471.0, 2412.0, 1590.0, 1069.0, 763.0, 500.0, 373.0, 243.0, 182.0, 124.0, 78.0, 57.0, 50.0, 34.0, 14.0, 9.0, 10.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00396728515625, -0.0038328170776367188, -0.0036983489990234375, -0.0035638809204101562, -0.003429412841796875, -0.0032949447631835938, -0.0031604766845703125, -0.0030260086059570312, -0.00289154052734375, -0.0027570724487304688, -0.0026226043701171875, -0.0024881362915039062, -0.002353668212890625, -0.0022192001342773438, -0.0020847320556640625, -0.0019502639770507812, -0.0018157958984375, -0.0016813278198242188, -0.0015468597412109375, -0.0014123916625976562, -0.001277923583984375, -0.0011434555053710938, -0.0010089874267578125, -0.0008745193481445312, -0.00074005126953125, -0.0006055831909179688, -0.0004711151123046875, -0.00033664703369140625, -0.000202178955078125, -6.771087646484375e-05, 6.67572021484375e-05, 0.00020122528076171875, 0.000335693359375, 0.00047016143798828125, 0.0006046295166015625, 0.0007390975952148438, 0.000873565673828125, 0.0010080337524414062, 0.0011425018310546875, 0.0012769699096679688, 0.00141143798828125, 0.0015459060668945312, 0.0016803741455078125, 0.0018148422241210938, 0.001949310302734375, 0.0020837783813476562, 0.0022182464599609375, 0.0023527145385742188, 0.0024871826171875, 0.0026216506958007812, 0.0027561187744140625, 0.0028905868530273438, 0.003025054931640625, 0.0031595230102539062, 0.0032939910888671875, 0.0034284591674804688, 0.00356292724609375, 0.0036973953247070312, 0.0038318634033203125, 0.003966331481933594, 0.004100799560546875, 0.004235267639160156, 0.0043697357177734375, 0.004504203796386719, 0.004638671875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 12.0, 8.0, 9.0, 15.0, 16.0, 21.0, 24.0, 30.0, 37.0, 38.0, 48.0, 70.0, 70.0, 83.0, 72.0, 73.0, 78.0, 39.0, 44.0, 24.0, 32.0, 18.0, 19.0, 14.0, 18.0, 6.0, 12.0, 9.0, 9.0, 9.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0014810562133789062, -0.0014330297708511353, -0.0013850033283233643, -0.0013369768857955933, -0.0012889504432678223, -0.0012409240007400513, -0.0011928975582122803, -0.0011448711156845093, -0.0010968446731567383, -0.0010488182306289673, -0.0010007917881011963, -0.0009527653455734253, -0.0009047389030456543, -0.0008567124605178833, -0.0008086860179901123, -0.0007606595754623413, -0.0007126331329345703, -0.0006646066904067993, -0.0006165802478790283, -0.0005685538053512573, -0.0005205273628234863, -0.00047250092029571533, -0.00042447447776794434, -0.00037644803524017334, -0.00032842159271240234, -0.00028039515018463135, -0.00023236870765686035, -0.00018434226512908936, -0.00013631582260131836, -8.828938007354736e-05, -4.026293754577637e-05, 7.763504981994629e-06, 5.5789947509765625e-05, 0.00010381639003753662, 0.00015184283256530762, 0.0001998692750930786, 0.0002478957176208496, 0.0002959221601486206, 0.0003439486026763916, 0.0003919750452041626, 0.0004400014877319336, 0.0004880279302597046, 0.0005360543727874756, 0.0005840808153152466, 0.0006321072578430176, 0.0006801337003707886, 0.0007281601428985596, 0.0007761865854263306, 0.0008242130279541016, 0.0008722394704818726, 0.0009202659130096436, 0.0009682923555374146, 0.0010163187980651855, 0.0010643452405929565, 0.0011123716831207275, 0.0011603981256484985, 0.0012084245681762695, 0.0012564510107040405, 0.0013044774532318115, 0.0013525038957595825, 0.0014005303382873535, 0.0014485567808151245, 0.0014965832233428955, 0.0015446096658706665, 0.0015926361083984375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 3.0, 2.0, 9.0, 12.0, 15.0, 15.0, 20.0, 24.0, 37.0, 37.0, 42.0, 46.0, 56.0, 72.0, 83.0, 65.0, 70.0, 48.0, 52.0, 43.0, 45.0, 34.0, 38.0, 23.0, 20.0, 16.0, 11.0, 12.0, 8.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.119053840637207, -8.788862228393555, -8.458671569824219, -8.128480911254883, -7.7982892990112305, -7.468098163604736, -7.137907028198242, -6.807715892791748, -6.477524757385254, -6.14733362197876, -5.817142486572266, -5.4869513511657715, -5.156760215759277, -4.826569080352783, -4.496377944946289, -4.166186809539795, -3.835995674133301, -3.5058045387268066, -3.1756134033203125, -2.8454222679138184, -2.515231132507324, -2.18503999710083, -1.854848861694336, -1.5246577262878418, -1.1944665908813477, -0.8642754554748535, -0.5340843200683594, -0.20389318466186523, 0.1262979507446289, 0.45648908615112305, 0.7866802215576172, 1.1168713569641113, 1.4470634460449219, 1.777254581451416, 2.10744571685791, 2.4376368522644043, 2.7678279876708984, 3.0980191230773926, 3.4282102584838867, 3.758401393890381, 4.088592529296875, 4.418783664703369, 4.748974800109863, 5.079165935516357, 5.409357070922852, 5.739548206329346, 6.06973934173584, 6.399930477142334, 6.730121612548828, 7.060312747955322, 7.390503883361816, 7.7206950187683105, 8.050886154174805, 8.38107681274414, 8.711268424987793, 9.041460037231445, 9.371650695800781, 9.701841354370117, 10.03203296661377, 10.362224578857422, 10.692415237426758, 11.022605895996094, 11.352797508239746, 11.682989120483398, 12.013179779052734]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 9.0, 4.0, 7.0, 10.0, 7.0, 14.0, 24.0, 18.0, 28.0, 32.0, 19.0, 26.0, 27.0, 33.0, 31.0, 34.0, 41.0, 38.0, 33.0, 32.0, 36.0, 32.0, 43.0, 31.0, 29.0, 33.0, 39.0, 30.0, 29.0, 30.0, 24.0, 25.0, 26.0, 18.0, 19.0, 13.0, 20.0, 10.0, 8.0, 10.0, 9.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.700148582458496, -7.4252190589904785, -7.150289535522461, -6.875360012054443, -6.600430488586426, -6.325500965118408, -6.050571441650391, -5.775641918182373, -5.5007123947143555, -5.225782871246338, -4.95085334777832, -4.675923824310303, -4.400994300842285, -4.126064777374268, -3.85113525390625, -3.5762057304382324, -3.301276206970215, -3.0263466835021973, -2.7514171600341797, -2.476487636566162, -2.2015581130981445, -1.926628589630127, -1.6516990661621094, -1.3767695426940918, -1.1018400192260742, -0.8269104957580566, -0.5519809722900391, -0.2770514488220215, -0.0021219253540039062, 0.27280759811401367, 0.5477371215820312, 0.8226666450500488, 1.0975961685180664, 1.372525691986084, 1.6474552154541016, 1.9223847389221191, 2.1973142623901367, 2.4722437858581543, 2.747173309326172, 3.0221028327941895, 3.297032356262207, 3.5719618797302246, 3.846891403198242, 4.12182092666626, 4.396750450134277, 4.671679973602295, 4.9466094970703125, 5.22153902053833, 5.496468544006348, 5.771398067474365, 6.046327590942383, 6.3212571144104, 6.596186637878418, 6.8711161613464355, 7.146045684814453, 7.420975208282471, 7.695904731750488, 7.970834255218506, 8.245763778686523, 8.520692825317383, 8.795622825622559, 9.070552825927734, 9.345481872558594, 9.620410919189453, 9.895340919494629]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 20.0, 28.0, 40.0, 77.0, 101.0, 159.0, 200.0, 327.0, 509.0, 771.0, 1096.0, 1785.0, 2604.0, 3968.0, 6200.0, 9463.0, 14398.0, 22387.0, 35501.0, 56317.0, 90984.0, 141117.0, 177926.0, 165774.0, 117189.0, 73229.0, 45191.0, 28851.0, 18197.0, 11730.0, 7782.0, 4944.0, 3335.0, 2110.0, 1411.0, 949.0, 583.0, 457.0, 268.0, 174.0, 143.0, 83.0, 45.0, 26.0, 31.0, 17.0, 23.0, 5.0, 6.0, 6.0, 1.0, 1.0, 2.0], "bins": [-14.84375, -14.4041748046875, -13.964599609375, -13.5250244140625, -13.08544921875, -12.6458740234375, -12.206298828125, -11.7667236328125, -11.3271484375, -10.8875732421875, -10.447998046875, -10.0084228515625, -9.56884765625, -9.1292724609375, -8.689697265625, -8.2501220703125, -7.810546875, -7.3709716796875, -6.931396484375, -6.4918212890625, -6.05224609375, -5.6126708984375, -5.173095703125, -4.7335205078125, -4.2939453125, -3.8543701171875, -3.414794921875, -2.9752197265625, -2.53564453125, -2.0960693359375, -1.656494140625, -1.2169189453125, -0.77734375, -0.3377685546875, 0.101806640625, 0.5413818359375, 0.98095703125, 1.4205322265625, 1.860107421875, 2.2996826171875, 2.7392578125, 3.1788330078125, 3.618408203125, 4.0579833984375, 4.49755859375, 4.9371337890625, 5.376708984375, 5.8162841796875, 6.255859375, 6.6954345703125, 7.135009765625, 7.5745849609375, 8.01416015625, 8.4537353515625, 8.893310546875, 9.3328857421875, 9.7724609375, 10.2120361328125, 10.651611328125, 11.0911865234375, 11.53076171875, 11.9703369140625, 12.409912109375, 12.8494873046875, 13.2890625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 13.0, 9.0, 12.0, 14.0, 19.0, 18.0, 39.0, 22.0, 18.0, 29.0, 27.0, 35.0, 39.0, 35.0, 34.0, 32.0, 33.0, 39.0, 40.0, 34.0, 35.0, 36.0, 30.0, 36.0, 34.0, 27.0, 29.0, 33.0, 29.0, 30.0, 20.0, 10.0, 13.0, 13.0, 8.0, 17.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.53125, -7.277587890625, -7.02392578125, -6.770263671875, -6.5166015625, -6.262939453125, -6.00927734375, -5.755615234375, -5.501953125, -5.248291015625, -4.99462890625, -4.740966796875, -4.4873046875, -4.233642578125, -3.97998046875, -3.726318359375, -3.47265625, -3.218994140625, -2.96533203125, -2.711669921875, -2.4580078125, -2.204345703125, -1.95068359375, -1.697021484375, -1.443359375, -1.189697265625, -0.93603515625, -0.682373046875, -0.4287109375, -0.175048828125, 0.07861328125, 0.332275390625, 0.5859375, 0.839599609375, 1.09326171875, 1.346923828125, 1.6005859375, 1.854248046875, 2.10791015625, 2.361572265625, 2.615234375, 2.868896484375, 3.12255859375, 3.376220703125, 3.6298828125, 3.883544921875, 4.13720703125, 4.390869140625, 4.64453125, 4.898193359375, 5.15185546875, 5.405517578125, 5.6591796875, 5.912841796875, 6.16650390625, 6.420166015625, 6.673828125, 6.927490234375, 7.18115234375, 7.434814453125, 7.6884765625, 7.942138671875, 8.19580078125, 8.449462890625, 8.703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 4.0, 9.0, 11.0, 29.0, 28.0, 45.0, 80.0, 99.0, 144.0, 179.0, 257.0, 353.0, 535.0, 704.0, 989.0, 1374.0, 1859.0, 2677.0, 3599.0, 5227.0, 7235.0, 10487.0, 15112.0, 21964.0, 33201.0, 51251.0, 80286.0, 122548.0, 160351.0, 161604.0, 124502.0, 82350.0, 51968.0, 33479.0, 22183.0, 15287.0, 10597.0, 7330.0, 5285.0, 3846.0, 2594.0, 1949.0, 1405.0, 1026.0, 762.0, 494.0, 385.0, 252.0, 190.0, 141.0, 90.0, 78.0, 56.0, 35.0, 20.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-12.171875, -11.791748046875, -11.41162109375, -11.031494140625, -10.6513671875, -10.271240234375, -9.89111328125, -9.510986328125, -9.130859375, -8.750732421875, -8.37060546875, -7.990478515625, -7.6103515625, -7.230224609375, -6.85009765625, -6.469970703125, -6.08984375, -5.709716796875, -5.32958984375, -4.949462890625, -4.5693359375, -4.189208984375, -3.80908203125, -3.428955078125, -3.048828125, -2.668701171875, -2.28857421875, -1.908447265625, -1.5283203125, -1.148193359375, -0.76806640625, -0.387939453125, -0.0078125, 0.372314453125, 0.75244140625, 1.132568359375, 1.5126953125, 1.892822265625, 2.27294921875, 2.653076171875, 3.033203125, 3.413330078125, 3.79345703125, 4.173583984375, 4.5537109375, 4.933837890625, 5.31396484375, 5.694091796875, 6.07421875, 6.454345703125, 6.83447265625, 7.214599609375, 7.5947265625, 7.974853515625, 8.35498046875, 8.735107421875, 9.115234375, 9.495361328125, 9.87548828125, 10.255615234375, 10.6357421875, 11.015869140625, 11.39599609375, 11.776123046875, 12.15625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 11.0, 10.0, 8.0, 7.0, 9.0, 10.0, 20.0, 27.0, 22.0, 25.0, 28.0, 35.0, 25.0, 39.0, 39.0, 37.0, 44.0, 41.0, 49.0, 44.0, 35.0, 33.0, 39.0, 33.0, 35.0, 30.0, 22.0, 19.0, 26.0, 21.0, 18.0, 13.0, 20.0, 18.0, 19.0, 18.0, 13.0, 8.0, 9.0, 5.0, 4.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-4.98828125, -4.83282470703125, -4.6773681640625, -4.52191162109375, -4.366455078125, -4.21099853515625, -4.0555419921875, -3.90008544921875, -3.74462890625, -3.58917236328125, -3.4337158203125, -3.27825927734375, -3.122802734375, -2.96734619140625, -2.8118896484375, -2.65643310546875, -2.5009765625, -2.34552001953125, -2.1900634765625, -2.03460693359375, -1.879150390625, -1.72369384765625, -1.5682373046875, -1.41278076171875, -1.25732421875, -1.10186767578125, -0.9464111328125, -0.79095458984375, -0.635498046875, -0.48004150390625, -0.3245849609375, -0.16912841796875, -0.013671875, 0.14178466796875, 0.2972412109375, 0.45269775390625, 0.608154296875, 0.76361083984375, 0.9190673828125, 1.07452392578125, 1.22998046875, 1.38543701171875, 1.5408935546875, 1.69635009765625, 1.851806640625, 2.00726318359375, 2.1627197265625, 2.31817626953125, 2.4736328125, 2.62908935546875, 2.7845458984375, 2.94000244140625, 3.095458984375, 3.25091552734375, 3.4063720703125, 3.56182861328125, 3.71728515625, 3.87274169921875, 4.0281982421875, 4.18365478515625, 4.339111328125, 4.49456787109375, 4.6500244140625, 4.80548095703125, 4.9609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 11.0, 9.0, 12.0, 23.0, 26.0, 45.0, 60.0, 79.0, 117.0, 167.0, 218.0, 276.0, 364.0, 576.0, 770.0, 1115.0, 1608.0, 2246.0, 3246.0, 4784.0, 7400.0, 11741.0, 20551.0, 38635.0, 82312.0, 228416.0, 367569.0, 142887.0, 58786.0, 28881.0, 16236.0, 9616.0, 6267.0, 4017.0, 2642.0, 1940.0, 1395.0, 960.0, 709.0, 544.0, 382.0, 275.0, 181.0, 140.0, 103.0, 61.0, 57.0, 37.0, 19.0, 17.0, 11.0, 4.0, 6.0, 4.0, 1.0, 4.0, 4.0], "bins": [-1.80078125, -1.7466888427734375, -1.692596435546875, -1.6385040283203125, -1.58441162109375, -1.5303192138671875, -1.476226806640625, -1.4221343994140625, -1.3680419921875, -1.3139495849609375, -1.259857177734375, -1.2057647705078125, -1.15167236328125, -1.0975799560546875, -1.043487548828125, -0.9893951416015625, -0.935302734375, -0.8812103271484375, -0.827117919921875, -0.7730255126953125, -0.71893310546875, -0.6648406982421875, -0.610748291015625, -0.5566558837890625, -0.5025634765625, -0.4484710693359375, -0.394378662109375, -0.3402862548828125, -0.28619384765625, -0.2321014404296875, -0.178009033203125, -0.1239166259765625, -0.06982421875, -0.0157318115234375, 0.038360595703125, 0.0924530029296875, 0.14654541015625, 0.2006378173828125, 0.254730224609375, 0.3088226318359375, 0.3629150390625, 0.4170074462890625, 0.471099853515625, 0.5251922607421875, 0.57928466796875, 0.6333770751953125, 0.687469482421875, 0.7415618896484375, 0.795654296875, 0.8497467041015625, 0.903839111328125, 0.9579315185546875, 1.01202392578125, 1.0661163330078125, 1.120208740234375, 1.1743011474609375, 1.2283935546875, 1.2824859619140625, 1.336578369140625, 1.3906707763671875, 1.44476318359375, 1.4988555908203125, 1.552947998046875, 1.6070404052734375, 1.6611328125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 3.0, 6.0, 7.0, 7.0, 17.0, 23.0, 27.0, 34.0, 42.0, 49.0, 61.0, 70.0, 63.0, 88.0, 78.0, 82.0, 68.0, 49.0, 45.0, 38.0, 34.0, 17.0, 17.0, 12.0, 15.0, 6.0, 8.0, 4.0, 4.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000102996826171875, -9.964406490325928e-05, -9.629130363464355e-05, -9.293854236602783e-05, -8.958578109741211e-05, -8.623301982879639e-05, -8.288025856018066e-05, -7.952749729156494e-05, -7.617473602294922e-05, -7.28219747543335e-05, -6.946921348571777e-05, -6.611645221710205e-05, -6.276369094848633e-05, -5.9410929679870605e-05, -5.605816841125488e-05, -5.270540714263916e-05, -4.935264587402344e-05, -4.5999884605407715e-05, -4.264712333679199e-05, -3.929436206817627e-05, -3.594160079956055e-05, -3.2588839530944824e-05, -2.92360782623291e-05, -2.588331699371338e-05, -2.2530555725097656e-05, -1.9177794456481934e-05, -1.582503318786621e-05, -1.2472271919250488e-05, -9.119510650634766e-06, -5.766749382019043e-06, -2.4139881134033203e-06, 9.387731552124023e-07, 4.291534423828125e-06, 7.644295692443848e-06, 1.099705696105957e-05, 1.4349818229675293e-05, 1.7702579498291016e-05, 2.1055340766906738e-05, 2.440810203552246e-05, 2.7760863304138184e-05, 3.1113624572753906e-05, 3.446638584136963e-05, 3.781914710998535e-05, 4.1171908378601074e-05, 4.45246696472168e-05, 4.787743091583252e-05, 5.123019218444824e-05, 5.4582953453063965e-05, 5.793571472167969e-05, 6.128847599029541e-05, 6.464123725891113e-05, 6.799399852752686e-05, 7.134675979614258e-05, 7.46995210647583e-05, 7.805228233337402e-05, 8.140504360198975e-05, 8.475780487060547e-05, 8.811056613922119e-05, 9.146332740783691e-05, 9.481608867645264e-05, 9.816884994506836e-05, 0.00010152161121368408, 0.0001048743724822998, 0.00010822713375091553, 0.00011157989501953125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 7.0, 6.0, 15.0, 24.0, 25.0, 39.0, 52.0, 91.0, 139.0, 234.0, 348.0, 573.0, 846.0, 1275.0, 2021.0, 3212.0, 4960.0, 7920.0, 13466.0, 23729.0, 47817.0, 114670.0, 362010.0, 283531.0, 90313.0, 39848.0, 20501.0, 11474.0, 7121.0, 4305.0, 2863.0, 1833.0, 1169.0, 763.0, 502.0, 305.0, 191.0, 124.0, 86.0, 47.0, 49.0, 22.0, 10.0, 11.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8828125, -1.819793701171875, -1.75677490234375, -1.693756103515625, -1.6307373046875, -1.567718505859375, -1.50469970703125, -1.441680908203125, -1.378662109375, -1.315643310546875, -1.25262451171875, -1.189605712890625, -1.1265869140625, -1.063568115234375, -1.00054931640625, -0.937530517578125, -0.87451171875, -0.811492919921875, -0.74847412109375, -0.685455322265625, -0.6224365234375, -0.559417724609375, -0.49639892578125, -0.433380126953125, -0.370361328125, -0.307342529296875, -0.24432373046875, -0.181304931640625, -0.1182861328125, -0.055267333984375, 0.00775146484375, 0.070770263671875, 0.1337890625, 0.196807861328125, 0.25982666015625, 0.322845458984375, 0.3858642578125, 0.448883056640625, 0.51190185546875, 0.574920654296875, 0.637939453125, 0.700958251953125, 0.76397705078125, 0.826995849609375, 0.8900146484375, 0.953033447265625, 1.01605224609375, 1.079071044921875, 1.14208984375, 1.205108642578125, 1.26812744140625, 1.331146240234375, 1.3941650390625, 1.457183837890625, 1.52020263671875, 1.583221435546875, 1.646240234375, 1.709259033203125, 1.77227783203125, 1.835296630859375, 1.8983154296875, 1.961334228515625, 2.02435302734375, 2.087371826171875, 2.150390625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 3.0, 5.0, 3.0, 3.0, 11.0, 5.0, 7.0, 7.0, 13.0, 13.0, 19.0, 31.0, 31.0, 36.0, 39.0, 53.0, 58.0, 80.0, 87.0, 64.0, 61.0, 70.0, 50.0, 48.0, 39.0, 26.0, 21.0, 19.0, 12.0, 14.0, 10.0, 19.0, 6.0, 7.0, 3.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5833511352539062, -0.5631866455078125, -0.5430221557617188, -0.522857666015625, -0.5026931762695312, -0.4825286865234375, -0.46236419677734375, -0.44219970703125, -0.42203521728515625, -0.4018707275390625, -0.38170623779296875, -0.361541748046875, -0.34137725830078125, -0.3212127685546875, -0.30104827880859375, -0.2808837890625, -0.26071929931640625, -0.2405548095703125, -0.22039031982421875, -0.200225830078125, -0.18006134033203125, -0.1598968505859375, -0.13973236083984375, -0.11956787109375, -0.09940338134765625, -0.0792388916015625, -0.05907440185546875, -0.038909912109375, -0.01874542236328125, 0.0014190673828125, 0.02158355712890625, 0.041748046875, 0.06191253662109375, 0.0820770263671875, 0.10224151611328125, 0.122406005859375, 0.14257049560546875, 0.1627349853515625, 0.18289947509765625, 0.20306396484375, 0.22322845458984375, 0.2433929443359375, 0.26355743408203125, 0.283721923828125, 0.30388641357421875, 0.3240509033203125, 0.34421539306640625, 0.3643798828125, 0.38454437255859375, 0.4047088623046875, 0.42487335205078125, 0.445037841796875, 0.46520233154296875, 0.4853668212890625, 0.5055313110351562, 0.52569580078125, 0.5458602905273438, 0.5660247802734375, 0.5861892700195312, 0.606353759765625, 0.6265182495117188, 0.6466827392578125, 0.6668472290039062, 0.68701171875]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 3.0, 6.0, 10.0, 12.0, 13.0, 12.0, 31.0, 29.0, 28.0, 38.0, 52.0, 53.0, 72.0, 65.0, 77.0, 59.0, 49.0, 45.0, 54.0, 55.0, 30.0, 45.0, 31.0, 19.0, 17.0, 13.0, 9.0, 4.0, 13.0, 7.0, 7.0, 6.0, 3.0, 10.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.717090606689453, -9.41574478149414, -9.114398956298828, -8.8130521774292, -8.511706352233887, -8.210360527038574, -7.9090142250061035, -7.607667922973633, -7.30632209777832, -7.004976272583008, -6.703629970550537, -6.402283668518066, -6.100937843322754, -5.799592018127441, -5.498245716094971, -5.1968994140625, -4.8955535888671875, -4.594207763671875, -4.292861461639404, -3.9915153980255127, -3.690169334411621, -3.3888232707977295, -3.087477207183838, -2.7861311435699463, -2.4847850799560547, -2.183439016342163, -1.8820929527282715, -1.5807468891143799, -1.2794008255004883, -0.9780547618865967, -0.6767086982727051, -0.3753626346588135, -0.07401752471923828, 0.22732853889465332, 0.5286746025085449, 0.8300206661224365, 1.1313667297363281, 1.4327127933502197, 1.7340588569641113, 2.035404920578003, 2.3367509841918945, 2.638097047805786, 2.9394431114196777, 3.2407891750335693, 3.542135238647461, 3.8434813022613525, 4.144827365875244, 4.446173667907715, 4.747519493103027, 5.04886531829834, 5.3502116203308105, 5.651557922363281, 5.952903747558594, 6.254249572753906, 6.555595874786377, 6.856942176818848, 7.15828800201416, 7.459633827209473, 7.760980129241943, 8.062326431274414, 8.363672256469727, 8.665018081665039, 8.966363906860352, 9.26771068572998, 9.569056510925293]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 4.0, 4.0, 8.0, 4.0, 14.0, 13.0, 21.0, 22.0, 24.0, 27.0, 38.0, 39.0, 30.0, 40.0, 45.0, 37.0, 39.0, 42.0, 40.0, 34.0, 38.0, 32.0, 45.0, 31.0, 28.0, 44.0, 27.0, 30.0, 29.0, 23.0, 29.0, 17.0, 14.0, 20.0, 14.0, 15.0, 12.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.089173316955566, -8.791877746582031, -8.494582176208496, -8.197286605834961, -7.899991512298584, -7.602695941925049, -7.305400371551514, -7.008105278015137, -6.710809707641602, -6.413514137268066, -6.116218566894531, -5.818922996520996, -5.521627902984619, -5.224332332611084, -4.927036762237549, -4.629741668701172, -4.3324456214904785, -4.035150051116943, -3.7378547191619873, -3.440559148788452, -3.143263816833496, -2.845968246459961, -2.548672676086426, -2.2513773441314697, -1.9540817737579346, -1.656786322593689, -1.3594908714294434, -1.0621953010559082, -0.7648998498916626, -0.467604398727417, -0.17030882835388184, 0.12698650360107422, 0.4242820739746094, 0.721577525138855, 1.0188729763031006, 1.3161685466766357, 1.6134639978408813, 1.910759449005127, 2.208055019378662, 2.505350351333618, 2.8026459217071533, 3.0999414920806885, 3.3972368240356445, 3.6945323944091797, 3.991827964782715, 4.28912353515625, 4.586419105529785, 4.883714199066162, 5.181009769439697, 5.478305339813232, 5.775600910186768, 6.0728960037231445, 6.37019157409668, 6.667487144470215, 6.96478271484375, 7.262078285217285, 7.55937385559082, 7.8566694259643555, 8.15396499633789, 8.451260566711426, 8.748556137084961, 9.04585075378418, 9.343147277832031, 9.64044189453125, 9.937737464904785]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 11.0, 15.0, 27.0, 35.0, 53.0, 97.0, 148.0, 195.0, 338.0, 470.0, 788.0, 1172.0, 1917.0, 3078.0, 4964.0, 7739.0, 12808.0, 21150.0, 35646.0, 61414.0, 111499.0, 230664.0, 689567.0, 1469903.0, 936164.0, 287226.0, 130883.0, 73169.0, 42882.0, 25897.0, 16174.0, 10170.0, 6408.0, 4133.0, 2579.0, 1658.0, 1155.0, 700.0, 460.0, 306.0, 219.0, 135.0, 75.0, 74.0, 43.0, 28.0, 18.0, 9.0, 4.0, 8.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-13.1328125, -12.7177734375, -12.302734375, -11.8876953125, -11.47265625, -11.0576171875, -10.642578125, -10.2275390625, -9.8125, -9.3974609375, -8.982421875, -8.5673828125, -8.15234375, -7.7373046875, -7.322265625, -6.9072265625, -6.4921875, -6.0771484375, -5.662109375, -5.2470703125, -4.83203125, -4.4169921875, -4.001953125, -3.5869140625, -3.171875, -2.7568359375, -2.341796875, -1.9267578125, -1.51171875, -1.0966796875, -0.681640625, -0.2666015625, 0.1484375, 0.5634765625, 0.978515625, 1.3935546875, 1.80859375, 2.2236328125, 2.638671875, 3.0537109375, 3.46875, 3.8837890625, 4.298828125, 4.7138671875, 5.12890625, 5.5439453125, 5.958984375, 6.3740234375, 6.7890625, 7.2041015625, 7.619140625, 8.0341796875, 8.44921875, 8.8642578125, 9.279296875, 9.6943359375, 10.109375, 10.5244140625, 10.939453125, 11.3544921875, 11.76953125, 12.1845703125, 12.599609375, 13.0146484375, 13.4296875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 2.0, 11.0, 12.0, 10.0, 15.0, 22.0, 13.0, 22.0, 34.0, 28.0, 32.0, 44.0, 36.0, 36.0, 42.0, 40.0, 42.0, 32.0, 29.0, 40.0, 32.0, 49.0, 29.0, 33.0, 36.0, 30.0, 22.0, 25.0, 36.0, 23.0, 30.0, 16.0, 15.0, 14.0, 17.0, 10.0, 9.0, 11.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4375, -7.1883544921875, -6.939208984375, -6.6900634765625, -6.44091796875, -6.1917724609375, -5.942626953125, -5.6934814453125, -5.4443359375, -5.1951904296875, -4.946044921875, -4.6968994140625, -4.44775390625, -4.1986083984375, -3.949462890625, -3.7003173828125, -3.451171875, -3.2020263671875, -2.952880859375, -2.7037353515625, -2.45458984375, -2.2054443359375, -1.956298828125, -1.7071533203125, -1.4580078125, -1.2088623046875, -0.959716796875, -0.7105712890625, -0.46142578125, -0.2122802734375, 0.036865234375, 0.2860107421875, 0.53515625, 0.7843017578125, 1.033447265625, 1.2825927734375, 1.53173828125, 1.7808837890625, 2.030029296875, 2.2791748046875, 2.5283203125, 2.7774658203125, 3.026611328125, 3.2757568359375, 3.52490234375, 3.7740478515625, 4.023193359375, 4.2723388671875, 4.521484375, 4.7706298828125, 5.019775390625, 5.2689208984375, 5.51806640625, 5.7672119140625, 6.016357421875, 6.2655029296875, 6.5146484375, 6.7637939453125, 7.012939453125, 7.2620849609375, 7.51123046875, 7.7603759765625, 8.009521484375, 8.2586669921875, 8.5078125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 12.0, 17.0, 22.0, 39.0, 47.0, 92.0, 122.0, 173.0, 277.0, 446.0, 672.0, 1099.0, 1636.0, 2544.0, 4128.0, 6645.0, 10823.0, 17822.0, 30028.0, 53048.0, 94531.0, 179252.0, 362607.0, 832590.0, 1383822.0, 606219.0, 279078.0, 142080.0, 76594.0, 43082.0, 25202.0, 14924.0, 9066.0, 5795.0, 3502.0, 2271.0, 1362.0, 891.0, 564.0, 389.0, 268.0, 166.0, 106.0, 70.0, 51.0, 44.0, 22.0, 12.0, 12.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.33984375, -10.953125, -10.56640625, -10.1796875, -9.79296875, -9.40625, -9.01953125, -8.6328125, -8.24609375, -7.859375, -7.47265625, -7.0859375, -6.69921875, -6.3125, -5.92578125, -5.5390625, -5.15234375, -4.765625, -4.37890625, -3.9921875, -3.60546875, -3.21875, -2.83203125, -2.4453125, -2.05859375, -1.671875, -1.28515625, -0.8984375, -0.51171875, -0.125, 0.26171875, 0.6484375, 1.03515625, 1.421875, 1.80859375, 2.1953125, 2.58203125, 2.96875, 3.35546875, 3.7421875, 4.12890625, 4.515625, 4.90234375, 5.2890625, 5.67578125, 6.0625, 6.44921875, 6.8359375, 7.22265625, 7.609375, 7.99609375, 8.3828125, 8.76953125, 9.15625, 9.54296875, 9.9296875, 10.31640625, 10.703125, 11.08984375, 11.4765625, 11.86328125, 12.25, 12.63671875, 13.0234375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 9.0, 10.0, 16.0, 9.0, 27.0, 18.0, 35.0, 27.0, 47.0, 51.0, 75.0, 77.0, 110.0, 141.0, 184.0, 188.0, 237.0, 293.0, 386.0, 417.0, 335.0, 266.0, 219.0, 157.0, 161.0, 102.0, 109.0, 80.0, 59.0, 40.0, 37.0, 31.0, 26.0, 29.0, 12.0, 13.0, 9.0, 7.0, 3.0, 4.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.06640625, -4.913330078125, -4.76025390625, -4.607177734375, -4.4541015625, -4.301025390625, -4.14794921875, -3.994873046875, -3.841796875, -3.688720703125, -3.53564453125, -3.382568359375, -3.2294921875, -3.076416015625, -2.92333984375, -2.770263671875, -2.6171875, -2.464111328125, -2.31103515625, -2.157958984375, -2.0048828125, -1.851806640625, -1.69873046875, -1.545654296875, -1.392578125, -1.239501953125, -1.08642578125, -0.933349609375, -0.7802734375, -0.627197265625, -0.47412109375, -0.321044921875, -0.16796875, -0.014892578125, 0.13818359375, 0.291259765625, 0.4443359375, 0.597412109375, 0.75048828125, 0.903564453125, 1.056640625, 1.209716796875, 1.36279296875, 1.515869140625, 1.6689453125, 1.822021484375, 1.97509765625, 2.128173828125, 2.28125, 2.434326171875, 2.58740234375, 2.740478515625, 2.8935546875, 3.046630859375, 3.19970703125, 3.352783203125, 3.505859375, 3.658935546875, 3.81201171875, 3.965087890625, 4.1181640625, 4.271240234375, 4.42431640625, 4.577392578125, 4.73046875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 6.0, 14.0, 19.0, 17.0, 25.0, 38.0, 38.0, 54.0, 67.0, 73.0, 59.0, 87.0, 75.0, 67.0, 62.0, 48.0, 35.0, 32.0, 35.0, 34.0, 24.0, 15.0, 10.0, 7.0, 12.0, 4.0, 2.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.494048118591309, -11.164051055908203, -10.834053039550781, -10.504055976867676, -10.17405891418457, -9.844061851501465, -9.51406478881836, -9.184066772460938, -8.854069709777832, -8.524072647094727, -8.194074630737305, -7.864077568054199, -7.534080505371094, -7.204083442687988, -6.874085903167725, -6.544088363647461, -6.2140913009643555, -5.88409423828125, -5.554096698760986, -5.224099159240723, -4.894102096557617, -4.564105033874512, -4.234107494354248, -3.9041101932525635, -3.574112892150879, -3.2441155910491943, -2.9141182899475098, -2.584120988845825, -2.2541236877441406, -1.924126386642456, -1.5941290855407715, -1.264131784439087, -0.9341354370117188, -0.6041381359100342, -0.2741408348083496, 0.05585646629333496, 0.38585376739501953, 0.7158510684967041, 1.0458483695983887, 1.3758456707000732, 1.7058429718017578, 2.0358402729034424, 2.365837574005127, 2.6958348751068115, 3.025832176208496, 3.3558294773101807, 3.6858267784118652, 4.015824317932129, 4.345821380615234, 4.67581844329834, 5.0058159828186035, 5.335813522338867, 5.665810585021973, 5.995807647705078, 6.325805187225342, 6.6558027267456055, 6.985799789428711, 7.315796852111816, 7.64579439163208, 7.975791931152344, 8.30578899383545, 8.635786056518555, 8.965784072875977, 9.295781135559082, 9.625778198242188]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 10.0, 6.0, 6.0, 11.0, 10.0, 20.0, 14.0, 19.0, 30.0, 34.0, 33.0, 40.0, 40.0, 46.0, 40.0, 50.0, 56.0, 47.0, 32.0, 42.0, 43.0, 43.0, 30.0, 31.0, 33.0, 44.0, 34.0, 26.0, 19.0, 18.0, 24.0, 17.0, 11.0, 11.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.334036827087402, -8.020307540893555, -7.706579208374023, -7.392850399017334, -7.0791215896606445, -6.765392303466797, -6.451663494110107, -6.137934684753418, -5.8242058753967285, -5.510477066040039, -5.19674825668335, -4.88301944732666, -4.5692901611328125, -4.255561828613281, -3.9418325424194336, -3.628103733062744, -3.3143749237060547, -3.0006461143493652, -2.686917304992676, -2.3731882572174072, -2.0594594478607178, -1.7457306385040283, -1.4320017099380493, -1.1182727813720703, -0.8045439720153809, -0.49081510305404663, -0.1770862340927124, 0.13664263486862183, 0.45037150382995605, 0.7641003131866455, 1.0778292417526245, 1.3915581703186035, 1.7052860260009766, 2.019014835357666, 2.3327436447143555, 2.646472692489624, 2.9602015018463135, 3.273930311203003, 3.5876593589782715, 3.901388168334961, 4.21511697769165, 4.52884578704834, 4.842574596405029, 5.156303405761719, 5.470032691955566, 5.783761024475098, 6.097490310668945, 6.411219120025635, 6.724947929382324, 7.038676738739014, 7.352405548095703, 7.666134357452393, 7.979863166809082, 8.29359245300293, 8.607320785522461, 8.921050071716309, 9.234779357910156, 9.548508644104004, 9.862236976623535, 10.175966262817383, 10.489694595336914, 10.803423881530762, 11.117152214050293, 11.43088150024414, 11.744609832763672]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 18.0, 15.0, 39.0, 38.0, 60.0, 75.0, 162.0, 233.0, 347.0, 602.0, 998.0, 1678.0, 2833.0, 5002.0, 9064.0, 16755.0, 31923.0, 62689.0, 131348.0, 402235.0, 201857.0, 87268.0, 43103.0, 22551.0, 11887.0, 6607.0, 3740.0, 2129.0, 1299.0, 725.0, 476.0, 288.0, 199.0, 107.0, 73.0, 44.0, 33.0, 17.0, 8.0, 14.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0], "bins": [-3.8046875, -3.698211669921875, -3.59173583984375, -3.485260009765625, -3.3787841796875, -3.272308349609375, -3.16583251953125, -3.059356689453125, -2.952880859375, -2.846405029296875, -2.73992919921875, -2.633453369140625, -2.5269775390625, -2.420501708984375, -2.31402587890625, -2.207550048828125, -2.10107421875, -1.994598388671875, -1.88812255859375, -1.781646728515625, -1.6751708984375, -1.568695068359375, -1.46221923828125, -1.355743408203125, -1.249267578125, -1.142791748046875, -1.03631591796875, -0.929840087890625, -0.8233642578125, -0.716888427734375, -0.61041259765625, -0.503936767578125, -0.3974609375, -0.290985107421875, -0.18450927734375, -0.078033447265625, 0.0284423828125, 0.134918212890625, 0.24139404296875, 0.347869873046875, 0.454345703125, 0.560821533203125, 0.66729736328125, 0.773773193359375, 0.8802490234375, 0.986724853515625, 1.09320068359375, 1.199676513671875, 1.30615234375, 1.412628173828125, 1.51910400390625, 1.625579833984375, 1.7320556640625, 1.838531494140625, 1.94500732421875, 2.051483154296875, 2.157958984375, 2.264434814453125, 2.37091064453125, 2.477386474609375, 2.5838623046875, 2.690338134765625, 2.79681396484375, 2.903289794921875, 3.009765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 6.0, 10.0, 15.0, 19.0, 20.0, 19.0, 26.0, 31.0, 41.0, 34.0, 41.0, 50.0, 52.0, 39.0, 47.0, 42.0, 52.0, 50.0, 32.0, 32.0, 46.0, 30.0, 40.0, 34.0, 30.0, 27.0, 20.0, 25.0, 15.0, 14.0, 10.0, 11.0, 11.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.10498046875, -7.7802734375, -7.45556640625, -7.130859375, -6.80615234375, -6.4814453125, -6.15673828125, -5.83203125, -5.50732421875, -5.1826171875, -4.85791015625, -4.533203125, -4.20849609375, -3.8837890625, -3.55908203125, -3.234375, -2.90966796875, -2.5849609375, -2.26025390625, -1.935546875, -1.61083984375, -1.2861328125, -0.96142578125, -0.63671875, -0.31201171875, 0.0126953125, 0.33740234375, 0.662109375, 0.98681640625, 1.3115234375, 1.63623046875, 1.9609375, 2.28564453125, 2.6103515625, 2.93505859375, 3.259765625, 3.58447265625, 3.9091796875, 4.23388671875, 4.55859375, 4.88330078125, 5.2080078125, 5.53271484375, 5.857421875, 6.18212890625, 6.5068359375, 6.83154296875, 7.15625, 7.48095703125, 7.8056640625, 8.13037109375, 8.455078125, 8.77978515625, 9.1044921875, 9.42919921875, 9.75390625, 10.07861328125, 10.4033203125, 10.72802734375, 11.052734375, 11.37744140625, 11.7021484375, 12.02685546875, 12.3515625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 17.0, 14.0, 34.0, 39.0, 59.0, 81.0, 103.0, 154.0, 212.0, 308.0, 468.0, 690.0, 940.0, 1316.0, 2016.0, 2934.0, 4260.0, 6457.0, 9913.0, 15135.0, 23766.0, 36999.0, 59223.0, 105127.0, 253514.0, 255152.0, 104493.0, 59475.0, 36856.0, 23517.0, 15256.0, 9895.0, 6435.0, 4296.0, 2909.0, 2014.0, 1357.0, 932.0, 633.0, 440.0, 336.0, 228.0, 178.0, 102.0, 75.0, 50.0, 37.0, 31.0, 25.0, 16.0, 13.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0], "bins": [-2.529296875, -2.45025634765625, -2.3712158203125, -2.29217529296875, -2.213134765625, -2.13409423828125, -2.0550537109375, -1.97601318359375, -1.89697265625, -1.81793212890625, -1.7388916015625, -1.65985107421875, -1.580810546875, -1.50177001953125, -1.4227294921875, -1.34368896484375, -1.2646484375, -1.18560791015625, -1.1065673828125, -1.02752685546875, -0.948486328125, -0.86944580078125, -0.7904052734375, -0.71136474609375, -0.63232421875, -0.55328369140625, -0.4742431640625, -0.39520263671875, -0.316162109375, -0.23712158203125, -0.1580810546875, -0.07904052734375, 0.0, 0.07904052734375, 0.1580810546875, 0.23712158203125, 0.316162109375, 0.39520263671875, 0.4742431640625, 0.55328369140625, 0.63232421875, 0.71136474609375, 0.7904052734375, 0.86944580078125, 0.948486328125, 1.02752685546875, 1.1065673828125, 1.18560791015625, 1.2646484375, 1.34368896484375, 1.4227294921875, 1.50177001953125, 1.580810546875, 1.65985107421875, 1.7388916015625, 1.81793212890625, 1.89697265625, 1.97601318359375, 2.0550537109375, 2.13409423828125, 2.213134765625, 2.29217529296875, 2.3712158203125, 2.45025634765625, 2.529296875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 7.0, 14.0, 17.0, 9.0, 13.0, 17.0, 18.0, 18.0, 32.0, 22.0, 25.0, 26.0, 31.0, 40.0, 32.0, 50.0, 37.0, 51.0, 39.0, 48.0, 43.0, 30.0, 26.0, 34.0, 38.0, 21.0, 26.0, 28.0, 27.0, 28.0, 16.0, 17.0, 25.0, 24.0, 11.0, 12.0, 7.0, 9.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.3984375, -5.21588134765625, -5.0333251953125, -4.85076904296875, -4.668212890625, -4.48565673828125, -4.3031005859375, -4.12054443359375, -3.93798828125, -3.75543212890625, -3.5728759765625, -3.39031982421875, -3.207763671875, -3.02520751953125, -2.8426513671875, -2.66009521484375, -2.4775390625, -2.29498291015625, -2.1124267578125, -1.92987060546875, -1.747314453125, -1.56475830078125, -1.3822021484375, -1.19964599609375, -1.01708984375, -0.83453369140625, -0.6519775390625, -0.46942138671875, -0.286865234375, -0.10430908203125, 0.0782470703125, 0.26080322265625, 0.443359375, 0.62591552734375, 0.8084716796875, 0.99102783203125, 1.173583984375, 1.35614013671875, 1.5386962890625, 1.72125244140625, 1.90380859375, 2.08636474609375, 2.2689208984375, 2.45147705078125, 2.634033203125, 2.81658935546875, 2.9991455078125, 3.18170166015625, 3.3642578125, 3.54681396484375, 3.7293701171875, 3.91192626953125, 4.094482421875, 4.27703857421875, 4.4595947265625, 4.64215087890625, 4.82470703125, 5.00726318359375, 5.1898193359375, 5.37237548828125, 5.554931640625, 5.73748779296875, 5.9200439453125, 6.10260009765625, 6.28515625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 21.0, 22.0, 36.0, 55.0, 62.0, 101.0, 141.0, 158.0, 226.0, 337.0, 451.0, 623.0, 951.0, 1256.0, 1833.0, 2847.0, 4483.0, 6923.0, 11097.0, 19113.0, 35137.0, 69317.0, 157417.0, 334579.0, 209720.0, 89013.0, 42845.0, 22988.0, 13099.0, 8023.0, 5160.0, 3376.0, 2194.0, 1520.0, 1013.0, 720.0, 492.0, 375.0, 262.0, 154.0, 111.0, 85.0, 65.0, 47.0, 27.0, 26.0, 16.0, 3.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.00433349609375, -0.004204750061035156, -0.0040760040283203125, -0.003947257995605469, -0.003818511962890625, -0.0036897659301757812, -0.0035610198974609375, -0.0034322738647460938, -0.00330352783203125, -0.0031747817993164062, -0.0030460357666015625, -0.0029172897338867188, -0.002788543701171875, -0.0026597976684570312, -0.0025310516357421875, -0.0024023056030273438, -0.0022735595703125, -0.0021448135375976562, -0.0020160675048828125, -0.0018873214721679688, -0.001758575439453125, -0.0016298294067382812, -0.0015010833740234375, -0.0013723373413085938, -0.00124359130859375, -0.0011148452758789062, -0.0009860992431640625, -0.0008573532104492188, -0.000728607177734375, -0.0005998611450195312, -0.0004711151123046875, -0.00034236907958984375, -0.000213623046875, -8.487701416015625e-05, 4.38690185546875e-05, 0.00017261505126953125, 0.000301361083984375, 0.00043010711669921875, 0.0005588531494140625, 0.0006875991821289062, 0.00081634521484375, 0.0009450912475585938, 0.0010738372802734375, 0.0012025833129882812, 0.001331329345703125, 0.0014600753784179688, 0.0015888214111328125, 0.0017175674438476562, 0.0018463134765625, 0.0019750595092773438, 0.0021038055419921875, 0.0022325515747070312, 0.002361297607421875, 0.0024900436401367188, 0.0026187896728515625, 0.0027475357055664062, 0.00287628173828125, 0.0030050277709960938, 0.0031337738037109375, 0.0032625198364257812, 0.003391265869140625, 0.0035200119018554688, 0.0036487579345703125, 0.0037775039672851562, 0.00390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 11.0, 5.0, 11.0, 11.0, 20.0, 28.0, 19.0, 35.0, 41.0, 53.0, 58.0, 85.0, 77.0, 84.0, 83.0, 60.0, 64.0, 63.0, 49.0, 26.0, 33.0, 20.0, 14.0, 13.0, 9.0, 4.0, 6.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.075017154216766e-06, -5.891546607017517e-06, -5.708076059818268e-06, -5.5246055126190186e-06, -5.341134965419769e-06, -5.15766441822052e-06, -4.974193871021271e-06, -4.7907233238220215e-06, -4.607252776622772e-06, -4.423782229423523e-06, -4.240311682224274e-06, -4.056841135025024e-06, -3.873370587825775e-06, -3.689900040626526e-06, -3.5064294934272766e-06, -3.3229589462280273e-06, -3.139488399028778e-06, -2.956017851829529e-06, -2.7725473046302795e-06, -2.5890767574310303e-06, -2.405606210231781e-06, -2.2221356630325317e-06, -2.0386651158332825e-06, -1.8551945686340332e-06, -1.671724021434784e-06, -1.4882534742355347e-06, -1.3047829270362854e-06, -1.1213123798370361e-06, -9.378418326377869e-07, -7.543712854385376e-07, -5.709007382392883e-07, -3.8743019104003906e-07, -2.039596438407898e-07, -2.0489096641540527e-08, 1.6298145055770874e-07, 3.46451997756958e-07, 5.299225449562073e-07, 7.133930921554565e-07, 8.968636393547058e-07, 1.080334186553955e-06, 1.2638047337532043e-06, 1.4472752809524536e-06, 1.6307458281517029e-06, 1.8142163753509521e-06, 1.9976869225502014e-06, 2.1811574697494507e-06, 2.3646280169487e-06, 2.5480985641479492e-06, 2.7315691113471985e-06, 2.9150396585464478e-06, 3.098510205745697e-06, 3.2819807529449463e-06, 3.4654513001441956e-06, 3.648921847343445e-06, 3.832392394542694e-06, 4.015862941741943e-06, 4.199333488941193e-06, 4.382804036140442e-06, 4.566274583339691e-06, 4.7497451305389404e-06, 4.93321567773819e-06, 5.116686224937439e-06, 5.300156772136688e-06, 5.4836273193359375e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 9.0, 10.0, 7.0, 5.0, 21.0, 33.0, 40.0, 41.0, 70.0, 114.0, 173.0, 247.0, 377.0, 611.0, 989.0, 1580.0, 2595.0, 4459.0, 8162.0, 15313.0, 33700.0, 82469.0, 251279.0, 409678.0, 137862.0, 50746.0, 22313.0, 10859.0, 5839.0, 3456.0, 2039.0, 1235.0, 816.0, 474.0, 295.0, 209.0, 123.0, 81.0, 78.0, 40.0, 24.0, 18.0, 29.0, 8.0, 7.0, 11.0, 1.0, 5.0, 3.0, 2.0, 3.0, 3.0], "bins": [-0.006465911865234375, -0.006282448768615723, -0.00609898567199707, -0.005915522575378418, -0.005732059478759766, -0.005548596382141113, -0.005365133285522461, -0.005181670188903809, -0.004998207092285156, -0.004814743995666504, -0.0046312808990478516, -0.004447817802429199, -0.004264354705810547, -0.0040808916091918945, -0.003897428512573242, -0.00371396541595459, -0.0035305023193359375, -0.003347039222717285, -0.003163576126098633, -0.0029801130294799805, -0.002796649932861328, -0.0026131868362426758, -0.0024297237396240234, -0.002246260643005371, -0.0020627975463867188, -0.0018793344497680664, -0.001695871353149414, -0.0015124082565307617, -0.0013289451599121094, -0.001145482063293457, -0.0009620189666748047, -0.0007785558700561523, -0.0005950927734375, -0.00041162967681884766, -0.0002281665802001953, -4.470348358154297e-05, 0.00013875961303710938, 0.0003222227096557617, 0.0005056858062744141, 0.0006891489028930664, 0.0008726119995117188, 0.001056075096130371, 0.0012395381927490234, 0.0014230012893676758, 0.0016064643859863281, 0.0017899274826049805, 0.001973390579223633, 0.002156853675842285, 0.0023403167724609375, 0.00252377986907959, 0.002707242965698242, 0.0028907060623168945, 0.003074169158935547, 0.0032576322555541992, 0.0034410953521728516, 0.003624558448791504, 0.0038080215454101562, 0.003991484642028809, 0.004174947738647461, 0.004358410835266113, 0.004541873931884766, 0.004725337028503418, 0.00490880012512207, 0.005092263221740723, 0.005275726318359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 3.0, 12.0, 10.0, 20.0, 16.0, 39.0, 58.0, 67.0, 97.0, 84.0, 111.0, 111.0, 87.0, 68.0, 59.0, 40.0, 30.0, 17.0, 7.0, 15.0, 8.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002010345458984375, -0.0019395947456359863, -0.0018688440322875977, -0.001798093318939209, -0.0017273426055908203, -0.0016565918922424316, -0.001585841178894043, -0.0015150904655456543, -0.0014443397521972656, -0.001373589038848877, -0.0013028383255004883, -0.0012320876121520996, -0.001161336898803711, -0.0010905861854553223, -0.0010198354721069336, -0.0009490847587585449, -0.0008783340454101562, -0.0008075833320617676, -0.0007368326187133789, -0.0006660819053649902, -0.0005953311920166016, -0.0005245804786682129, -0.0004538297653198242, -0.00038307905197143555, -0.0003123283386230469, -0.0002415776252746582, -0.00017082691192626953, -0.00010007619857788086, -2.9325485229492188e-05, 4.1425228118896484e-05, 0.00011217594146728516, 0.00018292665481567383, 0.0002536773681640625, 0.00032442808151245117, 0.00039517879486083984, 0.0004659295082092285, 0.0005366802215576172, 0.0006074309349060059, 0.0006781816482543945, 0.0007489323616027832, 0.0008196830749511719, 0.0008904337882995605, 0.0009611845016479492, 0.0010319352149963379, 0.0011026859283447266, 0.0011734366416931152, 0.001244187355041504, 0.0013149380683898926, 0.0013856887817382812, 0.00145643949508667, 0.0015271902084350586, 0.0015979409217834473, 0.001668691635131836, 0.0017394423484802246, 0.0018101930618286133, 0.001880943775177002, 0.0019516944885253906, 0.0020224452018737793, 0.002093195915222168, 0.0021639466285705566, 0.0022346973419189453, 0.002305448055267334, 0.0023761987686157227, 0.0024469494819641113, 0.0025177001953125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 3.0, 6.0, 7.0, 4.0, 13.0, 16.0, 23.0, 25.0, 33.0, 36.0, 45.0, 64.0, 76.0, 53.0, 78.0, 82.0, 62.0, 59.0, 57.0, 38.0, 27.0, 31.0, 35.0, 33.0, 19.0, 17.0, 9.0, 7.0, 7.0, 4.0, 3.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.720723152160645, -10.407450675964355, -10.094179153442383, -9.780906677246094, -9.467634201049805, -9.154361724853516, -8.841089248657227, -8.527817726135254, -8.214545249938965, -7.901272773742676, -7.588000774383545, -7.274728775024414, -6.961456298828125, -6.648183822631836, -6.334911823272705, -6.021639823913574, -5.708367347717285, -5.395094871520996, -5.081822872161865, -4.768550872802734, -4.455278396606445, -4.142005920410156, -3.8287339210510254, -3.5154616832733154, -3.2021894454956055, -2.8889172077178955, -2.5756449699401855, -2.2623727321624756, -1.9491004943847656, -1.6358282566070557, -1.3225560188293457, -1.0092837810516357, -0.6960105895996094, -0.3827383518218994, -0.06946611404418945, 0.2438061237335205, 0.5570783615112305, 0.8703505992889404, 1.1836228370666504, 1.4968950748443604, 1.8101673126220703, 2.1234395503997803, 2.4367117881774902, 2.7499840259552, 3.06325626373291, 3.37652850151062, 3.68980073928833, 4.003072738647461, 4.31634521484375, 4.629617691040039, 4.94288969039917, 5.256161689758301, 5.56943416595459, 5.882706642150879, 6.19597864151001, 6.509250640869141, 6.82252311706543, 7.135795593261719, 7.44906759262085, 7.7623395919799805, 8.07561206817627, 8.388884544372559, 8.702156066894531, 9.01542854309082, 9.32870101928711]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 11.0, 5.0, 6.0, 11.0, 10.0, 20.0, 14.0, 18.0, 31.0, 33.0, 32.0, 41.0, 42.0, 44.0, 41.0, 48.0, 56.0, 49.0, 32.0, 39.0, 44.0, 43.0, 31.0, 33.0, 31.0, 44.0, 35.0, 26.0, 18.0, 19.0, 23.0, 17.0, 11.0, 12.0, 9.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.194217681884766, -7.8819260597229, -7.569634437561035, -7.25734281539917, -6.945051193237305, -6.632760047912598, -6.320468425750732, -6.008176803588867, -5.695885181427002, -5.383593559265137, -5.0713019371032715, -4.759010314941406, -4.446719169616699, -4.134427070617676, -3.8221359252929688, -3.5098443031311035, -3.1975526809692383, -2.885261058807373, -2.572969436645508, -2.2606780529022217, -1.9483864307403564, -1.6360948085784912, -1.3238033056259155, -1.0115118026733398, -0.6992201805114746, -0.38692861795425415, -0.07463705539703369, 0.23765450716018677, 0.5499460697174072, 0.8622376918792725, 1.1745291948318481, 1.4868206977844238, 1.799112319946289, 2.1114039421081543, 2.4236955642700195, 2.7359869480133057, 3.048278570175171, 3.360570192337036, 3.6728615760803223, 3.9851531982421875, 4.297444820404053, 4.609736442565918, 4.922028064727783, 5.234319686889648, 5.5466108322143555, 5.858902931213379, 6.171194076538086, 6.483485698699951, 6.795777320861816, 7.108068943023682, 7.420360565185547, 7.732652187347412, 8.044943809509277, 8.357234954833984, 8.669527053833008, 8.981818199157715, 9.294109344482422, 9.606400489807129, 9.918692588806152, 10.23098373413086, 10.543275833129883, 10.85556697845459, 11.167859077453613, 11.48015022277832, 11.792442321777344]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 23.0, 17.0, 38.0, 48.0, 70.0, 88.0, 149.0, 258.0, 388.0, 586.0, 951.0, 1485.0, 2373.0, 3766.0, 6435.0, 10428.0, 17793.0, 31351.0, 57077.0, 106643.0, 183982.0, 227085.0, 173941.0, 98686.0, 52924.0, 29360.0, 16944.0, 9961.0, 5895.0, 3703.0, 2197.0, 1338.0, 915.0, 546.0, 372.0, 250.0, 159.0, 113.0, 64.0, 46.0, 29.0, 14.0, 21.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.25, -16.71826171875, -16.1865234375, -15.65478515625, -15.123046875, -14.59130859375, -14.0595703125, -13.52783203125, -12.99609375, -12.46435546875, -11.9326171875, -11.40087890625, -10.869140625, -10.33740234375, -9.8056640625, -9.27392578125, -8.7421875, -8.21044921875, -7.6787109375, -7.14697265625, -6.615234375, -6.08349609375, -5.5517578125, -5.02001953125, -4.48828125, -3.95654296875, -3.4248046875, -2.89306640625, -2.361328125, -1.82958984375, -1.2978515625, -0.76611328125, -0.234375, 0.29736328125, 0.8291015625, 1.36083984375, 1.892578125, 2.42431640625, 2.9560546875, 3.48779296875, 4.01953125, 4.55126953125, 5.0830078125, 5.61474609375, 6.146484375, 6.67822265625, 7.2099609375, 7.74169921875, 8.2734375, 8.80517578125, 9.3369140625, 9.86865234375, 10.400390625, 10.93212890625, 11.4638671875, 11.99560546875, 12.52734375, 13.05908203125, 13.5908203125, 14.12255859375, 14.654296875, 15.18603515625, 15.7177734375, 16.24951171875, 16.78125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 9.0, 12.0, 14.0, 21.0, 22.0, 19.0, 30.0, 24.0, 35.0, 41.0, 39.0, 46.0, 42.0, 45.0, 38.0, 43.0, 46.0, 39.0, 31.0, 35.0, 32.0, 35.0, 39.0, 34.0, 27.0, 25.0, 23.0, 25.0, 11.0, 20.0, 17.0, 13.0, 13.0, 7.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.46875, -7.203369140625, -6.93798828125, -6.672607421875, -6.4072265625, -6.141845703125, -5.87646484375, -5.611083984375, -5.345703125, -5.080322265625, -4.81494140625, -4.549560546875, -4.2841796875, -4.018798828125, -3.75341796875, -3.488037109375, -3.22265625, -2.957275390625, -2.69189453125, -2.426513671875, -2.1611328125, -1.895751953125, -1.63037109375, -1.364990234375, -1.099609375, -0.834228515625, -0.56884765625, -0.303466796875, -0.0380859375, 0.227294921875, 0.49267578125, 0.758056640625, 1.0234375, 1.288818359375, 1.55419921875, 1.819580078125, 2.0849609375, 2.350341796875, 2.61572265625, 2.881103515625, 3.146484375, 3.411865234375, 3.67724609375, 3.942626953125, 4.2080078125, 4.473388671875, 4.73876953125, 5.004150390625, 5.26953125, 5.534912109375, 5.80029296875, 6.065673828125, 6.3310546875, 6.596435546875, 6.86181640625, 7.127197265625, 7.392578125, 7.657958984375, 7.92333984375, 8.188720703125, 8.4541015625, 8.719482421875, 8.98486328125, 9.250244140625, 9.515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 6.0, 7.0, 9.0, 8.0, 15.0, 21.0, 28.0, 40.0, 92.0, 116.0, 178.0, 257.0, 388.0, 507.0, 719.0, 1117.0, 1538.0, 2302.0, 3181.0, 4787.0, 7017.0, 10334.0, 15680.0, 23831.0, 36732.0, 57270.0, 89608.0, 131782.0, 166517.0, 158217.0, 116072.0, 76427.0, 49333.0, 31666.0, 20539.0, 13649.0, 9062.0, 6085.0, 4067.0, 2994.0, 1923.0, 1341.0, 1005.0, 665.0, 468.0, 310.0, 196.0, 149.0, 105.0, 80.0, 37.0, 33.0, 22.0, 17.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.4140625, -11.0313720703125, -10.648681640625, -10.2659912109375, -9.88330078125, -9.5006103515625, -9.117919921875, -8.7352294921875, -8.3525390625, -7.9698486328125, -7.587158203125, -7.2044677734375, -6.82177734375, -6.4390869140625, -6.056396484375, -5.6737060546875, -5.291015625, -4.9083251953125, -4.525634765625, -4.1429443359375, -3.76025390625, -3.3775634765625, -2.994873046875, -2.6121826171875, -2.2294921875, -1.8468017578125, -1.464111328125, -1.0814208984375, -0.69873046875, -0.3160400390625, 0.066650390625, 0.4493408203125, 0.83203125, 1.2147216796875, 1.597412109375, 1.9801025390625, 2.36279296875, 2.7454833984375, 3.128173828125, 3.5108642578125, 3.8935546875, 4.2762451171875, 4.658935546875, 5.0416259765625, 5.42431640625, 5.8070068359375, 6.189697265625, 6.5723876953125, 6.955078125, 7.3377685546875, 7.720458984375, 8.1031494140625, 8.48583984375, 8.8685302734375, 9.251220703125, 9.6339111328125, 10.0166015625, 10.3992919921875, 10.781982421875, 11.1646728515625, 11.54736328125, 11.9300537109375, 12.312744140625, 12.6954345703125, 13.078125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 7.0, 9.0, 11.0, 8.0, 18.0, 13.0, 16.0, 27.0, 20.0, 26.0, 31.0, 31.0, 32.0, 37.0, 42.0, 31.0, 30.0, 42.0, 37.0, 36.0, 47.0, 34.0, 16.0, 42.0, 40.0, 25.0, 28.0, 32.0, 33.0, 19.0, 28.0, 26.0, 14.0, 18.0, 17.0, 8.0, 6.0, 5.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.7578125, -4.60546875, -4.453125, -4.30078125, -4.1484375, -3.99609375, -3.84375, -3.69140625, -3.5390625, -3.38671875, -3.234375, -3.08203125, -2.9296875, -2.77734375, -2.625, -2.47265625, -2.3203125, -2.16796875, -2.015625, -1.86328125, -1.7109375, -1.55859375, -1.40625, -1.25390625, -1.1015625, -0.94921875, -0.796875, -0.64453125, -0.4921875, -0.33984375, -0.1875, -0.03515625, 0.1171875, 0.26953125, 0.421875, 0.57421875, 0.7265625, 0.87890625, 1.03125, 1.18359375, 1.3359375, 1.48828125, 1.640625, 1.79296875, 1.9453125, 2.09765625, 2.25, 2.40234375, 2.5546875, 2.70703125, 2.859375, 3.01171875, 3.1640625, 3.31640625, 3.46875, 3.62109375, 3.7734375, 3.92578125, 4.078125, 4.23046875, 4.3828125, 4.53515625, 4.6875, 4.83984375, 4.9921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 8.0, 14.0, 23.0, 23.0, 26.0, 47.0, 48.0, 71.0, 112.0, 150.0, 222.0, 351.0, 485.0, 698.0, 977.0, 1488.0, 2261.0, 3400.0, 5829.0, 9721.0, 17433.0, 32982.0, 70291.0, 186613.0, 399561.0, 174497.0, 67322.0, 31851.0, 16711.0, 9600.0, 5483.0, 3462.0, 2177.0, 1458.0, 955.0, 684.0, 452.0, 308.0, 218.0, 155.0, 107.0, 93.0, 53.0, 34.0, 20.0, 21.0, 17.0, 12.0, 8.0, 10.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.083984375, -2.019805908203125, -1.95562744140625, -1.891448974609375, -1.8272705078125, -1.763092041015625, -1.69891357421875, -1.634735107421875, -1.570556640625, -1.506378173828125, -1.44219970703125, -1.378021240234375, -1.3138427734375, -1.249664306640625, -1.18548583984375, -1.121307373046875, -1.05712890625, -0.992950439453125, -0.92877197265625, -0.864593505859375, -0.8004150390625, -0.736236572265625, -0.67205810546875, -0.607879638671875, -0.543701171875, -0.479522705078125, -0.41534423828125, -0.351165771484375, -0.2869873046875, -0.222808837890625, -0.15863037109375, -0.094451904296875, -0.0302734375, 0.033905029296875, 0.09808349609375, 0.162261962890625, 0.2264404296875, 0.290618896484375, 0.35479736328125, 0.418975830078125, 0.483154296875, 0.547332763671875, 0.61151123046875, 0.675689697265625, 0.7398681640625, 0.804046630859375, 0.86822509765625, 0.932403564453125, 0.99658203125, 1.060760498046875, 1.12493896484375, 1.189117431640625, 1.2532958984375, 1.317474365234375, 1.38165283203125, 1.445831298828125, 1.510009765625, 1.574188232421875, 1.63836669921875, 1.702545166015625, 1.7667236328125, 1.830902099609375, 1.89508056640625, 1.959259033203125, 2.0234375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 17.0, 16.0, 25.0, 37.0, 48.0, 72.0, 73.0, 96.0, 96.0, 104.0, 86.0, 80.0, 54.0, 48.0, 20.0, 25.0, 21.0, 11.0, 12.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001385211944580078, -0.0001342911273241043, -0.0001300610601902008, -0.0001258309930562973, -0.0001216009259223938, -0.0001173708587884903, -0.00011314079165458679, -0.00010891072452068329, -0.00010468065738677979, -0.00010045059025287628, -9.622052311897278e-05, -9.199045598506927e-05, -8.776038885116577e-05, -8.353032171726227e-05, -7.930025458335876e-05, -7.507018744945526e-05, -7.084012031555176e-05, -6.661005318164825e-05, -6.237998604774475e-05, -5.814991891384125e-05, -5.3919851779937744e-05, -4.968978464603424e-05, -4.545971751213074e-05, -4.1229650378227234e-05, -3.699958324432373e-05, -3.276951611042023e-05, -2.8539448976516724e-05, -2.430938184261322e-05, -2.0079314708709717e-05, -1.5849247574806213e-05, -1.161918044090271e-05, -7.3891133069992065e-06, -3.159046173095703e-06, 1.0710209608078003e-06, 5.301088094711304e-06, 9.531155228614807e-06, 1.376122236251831e-05, 1.7991289496421814e-05, 2.2221356630325317e-05, 2.645142376422882e-05, 3.0681490898132324e-05, 3.491155803203583e-05, 3.914162516593933e-05, 4.3371692299842834e-05, 4.760175943374634e-05, 5.183182656764984e-05, 5.6061893701553345e-05, 6.029196083545685e-05, 6.452202796936035e-05, 6.875209510326385e-05, 7.298216223716736e-05, 7.721222937107086e-05, 8.144229650497437e-05, 8.567236363887787e-05, 8.990243077278137e-05, 9.413249790668488e-05, 9.836256504058838e-05, 0.00010259263217449188, 0.00010682269930839539, 0.00011105276644229889, 0.00011528283357620239, 0.0001195129007101059, 0.0001237429678440094, 0.0001279730349779129, 0.0001322031021118164]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 17.0, 27.0, 51.0, 55.0, 61.0, 120.0, 164.0, 189.0, 275.0, 456.0, 554.0, 858.0, 1249.0, 1807.0, 2695.0, 4333.0, 6913.0, 11339.0, 20089.0, 36418.0, 73978.0, 183742.0, 370462.0, 175870.0, 71375.0, 35670.0, 19249.0, 11101.0, 6601.0, 4228.0, 2809.0, 1764.0, 1193.0, 799.0, 618.0, 410.0, 287.0, 200.0, 158.0, 102.0, 63.0, 59.0, 34.0, 30.0, 20.0, 12.0, 8.0, 11.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.927734375, -1.868377685546875, -1.80902099609375, -1.749664306640625, -1.6903076171875, -1.630950927734375, -1.57159423828125, -1.512237548828125, -1.452880859375, -1.393524169921875, -1.33416748046875, -1.274810791015625, -1.2154541015625, -1.156097412109375, -1.09674072265625, -1.037384033203125, -0.97802734375, -0.918670654296875, -0.85931396484375, -0.799957275390625, -0.7406005859375, -0.681243896484375, -0.62188720703125, -0.562530517578125, -0.503173828125, -0.443817138671875, -0.38446044921875, -0.325103759765625, -0.2657470703125, -0.206390380859375, -0.14703369140625, -0.087677001953125, -0.0283203125, 0.031036376953125, 0.09039306640625, 0.149749755859375, 0.2091064453125, 0.268463134765625, 0.32781982421875, 0.387176513671875, 0.446533203125, 0.505889892578125, 0.56524658203125, 0.624603271484375, 0.6839599609375, 0.743316650390625, 0.80267333984375, 0.862030029296875, 0.92138671875, 0.980743408203125, 1.04010009765625, 1.099456787109375, 1.1588134765625, 1.218170166015625, 1.27752685546875, 1.336883544921875, 1.396240234375, 1.455596923828125, 1.51495361328125, 1.574310302734375, 1.6336669921875, 1.693023681640625, 1.75238037109375, 1.811737060546875, 1.87109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 10.0, 12.0, 14.0, 16.0, 18.0, 14.0, 35.0, 30.0, 48.0, 34.0, 63.0, 62.0, 81.0, 80.0, 71.0, 66.0, 57.0, 55.0, 52.0, 27.0, 29.0, 30.0, 18.0, 18.0, 7.0, 5.0, 8.0, 5.0, 9.0, 5.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.755859375, -0.7325363159179688, -0.7092132568359375, -0.6858901977539062, -0.662567138671875, -0.6392440795898438, -0.6159210205078125, -0.5925979614257812, -0.56927490234375, -0.5459518432617188, -0.5226287841796875, -0.49930572509765625, -0.475982666015625, -0.45265960693359375, -0.4293365478515625, -0.40601348876953125, -0.3826904296875, -0.35936737060546875, -0.3360443115234375, -0.31272125244140625, -0.289398193359375, -0.26607513427734375, -0.2427520751953125, -0.21942901611328125, -0.19610595703125, -0.17278289794921875, -0.1494598388671875, -0.12613677978515625, -0.102813720703125, -0.07949066162109375, -0.0561676025390625, -0.03284454345703125, -0.009521484375, 0.01380157470703125, 0.0371246337890625, 0.06044769287109375, 0.083770751953125, 0.10709381103515625, 0.1304168701171875, 0.15373992919921875, 0.17706298828125, 0.20038604736328125, 0.2237091064453125, 0.24703216552734375, 0.270355224609375, 0.29367828369140625, 0.3170013427734375, 0.34032440185546875, 0.3636474609375, 0.38697052001953125, 0.4102935791015625, 0.43361663818359375, 0.456939697265625, 0.48026275634765625, 0.5035858154296875, 0.5269088745117188, 0.55023193359375, 0.5735549926757812, 0.5968780517578125, 0.6202011108398438, 0.643524169921875, 0.6668472290039062, 0.6901702880859375, 0.7134933471679688, 0.73681640625]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 7.0, 8.0, 16.0, 18.0, 20.0, 20.0, 19.0, 36.0, 35.0, 53.0, 58.0, 73.0, 73.0, 57.0, 65.0, 63.0, 58.0, 53.0, 40.0, 35.0, 29.0, 26.0, 30.0, 18.0, 16.0, 9.0, 10.0, 9.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.26874828338623, -8.986112594604492, -8.703476905822754, -8.420841217041016, -8.138205528259277, -7.855569839477539, -7.572934150695801, -7.2902984619140625, -7.007662773132324, -6.725027084350586, -6.442391395568848, -6.159755706787109, -5.877120018005371, -5.594484329223633, -5.3118486404418945, -5.029212951660156, -4.746577262878418, -4.46394157409668, -4.181305885314941, -3.898670196533203, -3.616034507751465, -3.3333988189697266, -3.0507631301879883, -2.76812744140625, -2.4854917526245117, -2.2028560638427734, -1.9202203750610352, -1.6375846862792969, -1.3549489974975586, -1.0723133087158203, -0.789677619934082, -0.5070419311523438, -0.22440624237060547, 0.05822944641113281, 0.3408651351928711, 0.6235008239746094, 0.9061365127563477, 1.188772201538086, 1.4714078903198242, 1.7540435791015625, 2.036679267883301, 2.319314956665039, 2.6019506454467773, 2.8845863342285156, 3.167222023010254, 3.449857711791992, 3.7324934005737305, 4.015129089355469, 4.297764778137207, 4.580400466918945, 4.863036155700684, 5.145671844482422, 5.42830753326416, 5.710943222045898, 5.993578910827637, 6.276214599609375, 6.558850288391113, 6.841485977172852, 7.12412166595459, 7.406757354736328, 7.689393043518066, 7.972028732299805, 8.254664421081543, 8.537300109863281, 8.81993579864502]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 12.0, 11.0, 10.0, 14.0, 12.0, 16.0, 12.0, 22.0, 19.0, 33.0, 37.0, 50.0, 26.0, 38.0, 41.0, 37.0, 41.0, 32.0, 47.0, 35.0, 37.0, 38.0, 40.0, 29.0, 28.0, 40.0, 28.0, 29.0, 20.0, 26.0, 25.0, 16.0, 14.0, 15.0, 13.0, 7.0, 14.0, 3.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.518990516662598, -7.2486162185668945, -6.97824239730835, -6.7078680992126465, -6.437494277954102, -6.167119979858398, -5.896745681762695, -5.626371383666992, -5.355997562408447, -5.085623264312744, -4.815249443054199, -4.544875144958496, -4.274500846862793, -4.004127025604248, -3.733752727508545, -3.463378667831421, -3.193004608154297, -2.922630548477173, -2.652256488800049, -2.3818821907043457, -2.1115081310272217, -1.8411340713500977, -1.570759892463684, -1.3003857135772705, -1.0300116539001465, -0.7596375346183777, -0.4892634153366089, -0.2188892960548401, 0.05148482322692871, 0.32185888290405273, 0.5922330617904663, 0.8626072406768799, 1.1329803466796875, 1.4033544063568115, 1.673728585243225, 1.9441027641296387, 2.2144768238067627, 2.4848508834838867, 2.75522518157959, 3.025599241256714, 3.295973300933838, 3.566347360610962, 3.836721420288086, 4.107095718383789, 4.377470016479492, 4.647843837738037, 4.91821813583374, 5.188591957092285, 5.458966255187988, 5.729340553283691, 5.999714374542236, 6.2700886726379395, 6.540462493896484, 6.8108367919921875, 7.081211090087891, 7.351585388183594, 7.621959209442139, 7.892333507537842, 8.162707328796387, 8.43308162689209, 8.703455924987793, 8.97382926940918, 9.244203567504883, 9.514577865600586, 9.784952163696289]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 11.0, 9.0, 16.0, 23.0, 30.0, 53.0, 69.0, 97.0, 154.0, 265.0, 421.0, 596.0, 1001.0, 1506.0, 2309.0, 3614.0, 5724.0, 8759.0, 13996.0, 22865.0, 38236.0, 65763.0, 122550.0, 278498.0, 908460.0, 1545270.0, 699800.0, 218016.0, 104541.0, 58683.0, 34675.0, 21158.0, 13211.0, 8318.0, 5419.0, 3484.0, 2295.0, 1504.0, 973.0, 617.0, 400.0, 272.0, 205.0, 127.0, 103.0, 60.0, 38.0, 33.0, 20.0, 16.0, 6.0, 10.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.984375, -10.5833740234375, -10.182373046875, -9.7813720703125, -9.38037109375, -8.9793701171875, -8.578369140625, -8.1773681640625, -7.7763671875, -7.3753662109375, -6.974365234375, -6.5733642578125, -6.17236328125, -5.7713623046875, -5.370361328125, -4.9693603515625, -4.568359375, -4.1673583984375, -3.766357421875, -3.3653564453125, -2.96435546875, -2.5633544921875, -2.162353515625, -1.7613525390625, -1.3603515625, -0.9593505859375, -0.558349609375, -0.1573486328125, 0.24365234375, 0.6446533203125, 1.045654296875, 1.4466552734375, 1.84765625, 2.2486572265625, 2.649658203125, 3.0506591796875, 3.45166015625, 3.8526611328125, 4.253662109375, 4.6546630859375, 5.0556640625, 5.4566650390625, 5.857666015625, 6.2586669921875, 6.65966796875, 7.0606689453125, 7.461669921875, 7.8626708984375, 8.263671875, 8.6646728515625, 9.065673828125, 9.4666748046875, 9.86767578125, 10.2686767578125, 10.669677734375, 11.0706787109375, 11.4716796875, 11.8726806640625, 12.273681640625, 12.6746826171875, 13.07568359375, 13.4766845703125, 13.877685546875, 14.2786865234375, 14.6796875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 3.0, 10.0, 12.0, 14.0, 15.0, 16.0, 18.0, 12.0, 21.0, 32.0, 28.0, 40.0, 32.0, 41.0, 37.0, 31.0, 36.0, 52.0, 37.0, 35.0, 44.0, 39.0, 29.0, 35.0, 27.0, 35.0, 26.0, 27.0, 23.0, 22.0, 34.0, 23.0, 20.0, 12.0, 10.0, 11.0, 14.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.75213623046875, -5.5238037109375, -5.29547119140625, -5.067138671875, -4.83880615234375, -4.6104736328125, -4.38214111328125, -4.15380859375, -3.92547607421875, -3.6971435546875, -3.46881103515625, -3.240478515625, -3.01214599609375, -2.7838134765625, -2.55548095703125, -2.3271484375, -2.09881591796875, -1.8704833984375, -1.64215087890625, -1.413818359375, -1.18548583984375, -0.9571533203125, -0.72882080078125, -0.50048828125, -0.27215576171875, -0.0438232421875, 0.18450927734375, 0.412841796875, 0.64117431640625, 0.8695068359375, 1.09783935546875, 1.326171875, 1.55450439453125, 1.7828369140625, 2.01116943359375, 2.239501953125, 2.46783447265625, 2.6961669921875, 2.92449951171875, 3.15283203125, 3.38116455078125, 3.6094970703125, 3.83782958984375, 4.066162109375, 4.29449462890625, 4.5228271484375, 4.75115966796875, 4.9794921875, 5.20782470703125, 5.4361572265625, 5.66448974609375, 5.892822265625, 6.12115478515625, 6.3494873046875, 6.57781982421875, 6.80615234375, 7.03448486328125, 7.2628173828125, 7.49114990234375, 7.719482421875, 7.94781494140625, 8.1761474609375, 8.40447998046875, 8.6328125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 13.0, 22.0, 34.0, 46.0, 61.0, 98.0, 158.0, 253.0, 355.0, 578.0, 930.0, 1443.0, 2227.0, 3503.0, 5505.0, 9353.0, 15485.0, 26399.0, 45349.0, 80448.0, 152388.0, 308720.0, 688611.0, 1387098.0, 759626.0, 336379.0, 164518.0, 86651.0, 47768.0, 27800.0, 16421.0, 9777.0, 6026.0, 3705.0, 2367.0, 1467.0, 960.0, 556.0, 418.0, 242.0, 185.0, 117.0, 75.0, 54.0, 30.0, 25.0, 13.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-11.671875, -11.3133544921875, -10.954833984375, -10.5963134765625, -10.23779296875, -9.8792724609375, -9.520751953125, -9.1622314453125, -8.8037109375, -8.4451904296875, -8.086669921875, -7.7281494140625, -7.36962890625, -7.0111083984375, -6.652587890625, -6.2940673828125, -5.935546875, -5.5770263671875, -5.218505859375, -4.8599853515625, -4.50146484375, -4.1429443359375, -3.784423828125, -3.4259033203125, -3.0673828125, -2.7088623046875, -2.350341796875, -1.9918212890625, -1.63330078125, -1.2747802734375, -0.916259765625, -0.5577392578125, -0.19921875, 0.1593017578125, 0.517822265625, 0.8763427734375, 1.23486328125, 1.5933837890625, 1.951904296875, 2.3104248046875, 2.6689453125, 3.0274658203125, 3.385986328125, 3.7445068359375, 4.10302734375, 4.4615478515625, 4.820068359375, 5.1785888671875, 5.537109375, 5.8956298828125, 6.254150390625, 6.6126708984375, 6.97119140625, 7.3297119140625, 7.688232421875, 8.0467529296875, 8.4052734375, 8.7637939453125, 9.122314453125, 9.4808349609375, 9.83935546875, 10.1978759765625, 10.556396484375, 10.9149169921875, 11.2734375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 7.0, 17.0, 15.0, 23.0, 25.0, 26.0, 39.0, 50.0, 58.0, 72.0, 84.0, 100.0, 121.0, 166.0, 199.0, 237.0, 322.0, 362.0, 394.0, 349.0, 248.0, 209.0, 191.0, 142.0, 116.0, 111.0, 78.0, 58.0, 51.0, 35.0, 35.0, 26.0, 22.0, 15.0, 10.0, 11.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.05291748046875, -3.9144287109375, -3.77593994140625, -3.637451171875, -3.49896240234375, -3.3604736328125, -3.22198486328125, -3.08349609375, -2.94500732421875, -2.8065185546875, -2.66802978515625, -2.529541015625, -2.39105224609375, -2.2525634765625, -2.11407470703125, -1.9755859375, -1.83709716796875, -1.6986083984375, -1.56011962890625, -1.421630859375, -1.28314208984375, -1.1446533203125, -1.00616455078125, -0.86767578125, -0.72918701171875, -0.5906982421875, -0.45220947265625, -0.313720703125, -0.17523193359375, -0.0367431640625, 0.10174560546875, 0.240234375, 0.37872314453125, 0.5172119140625, 0.65570068359375, 0.794189453125, 0.93267822265625, 1.0711669921875, 1.20965576171875, 1.34814453125, 1.48663330078125, 1.6251220703125, 1.76361083984375, 1.902099609375, 2.04058837890625, 2.1790771484375, 2.31756591796875, 2.4560546875, 2.59454345703125, 2.7330322265625, 2.87152099609375, 3.010009765625, 3.14849853515625, 3.2869873046875, 3.42547607421875, 3.56396484375, 3.70245361328125, 3.8409423828125, 3.97943115234375, 4.117919921875, 4.25640869140625, 4.3948974609375, 4.53338623046875, 4.671875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 11.0, 9.0, 15.0, 18.0, 26.0, 22.0, 27.0, 54.0, 73.0, 78.0, 85.0, 74.0, 74.0, 79.0, 78.0, 52.0, 45.0, 38.0, 21.0, 26.0, 16.0, 16.0, 8.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.14832592010498, -8.830744743347168, -8.513163566589355, -8.195581436157227, -7.878000259399414, -7.560419082641602, -7.242837905883789, -6.925256729125977, -6.607675075531006, -6.290093898773193, -5.972512245178223, -5.65493106842041, -5.337349891662598, -5.019768238067627, -4.7021870613098145, -4.384605407714844, -4.067024230957031, -3.7494428157806396, -3.431861400604248, -3.1142802238464355, -2.796698808670044, -2.4791173934936523, -2.16153621673584, -1.8439548015594482, -1.5263733863830566, -1.208791971206665, -0.891210675239563, -0.5736293196678162, -0.25604796409606934, 0.061533451080322266, 0.3791147470474243, 0.6966960430145264, 1.0142765045166016, 1.3318579196929932, 1.6494392156600952, 1.9670205116271973, 2.284601926803589, 2.6021833419799805, 2.919764518737793, 3.2373459339141846, 3.554927349090576, 3.8725087642669678, 4.190090179443359, 4.507671356201172, 4.825252532958984, 5.142834186553955, 5.460415363311768, 5.777997016906738, 6.095578193664551, 6.413159370422363, 6.730741024017334, 7.0483222007751465, 7.365903854370117, 7.68348503112793, 8.001066207885742, 8.318647384643555, 8.636228561401367, 8.95380973815918, 9.271390914916992, 9.588973045349121, 9.906554222106934, 10.224135398864746, 10.541716575622559, 10.859297752380371, 11.1768798828125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 12.0, 2.0, 5.0, 7.0, 17.0, 9.0, 15.0, 30.0, 34.0, 32.0, 36.0, 36.0, 45.0, 44.0, 34.0, 52.0, 47.0, 67.0, 42.0, 45.0, 48.0, 51.0, 36.0, 38.0, 45.0, 30.0, 27.0, 31.0, 19.0, 13.0, 16.0, 11.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.935747146606445, -9.604849815368652, -9.273953437805176, -8.943056106567383, -8.61215877532959, -8.281261444091797, -7.95036506652832, -7.619467735290527, -7.288570880889893, -6.957674026489258, -6.626776695251465, -6.29587984085083, -5.964982986450195, -5.634085655212402, -5.303188800811768, -4.972291946411133, -4.64139461517334, -4.310497760772705, -3.979600429534912, -3.6487035751342773, -3.3178064823150635, -2.9869093894958496, -2.656012535095215, -2.325115442276001, -1.994218349456787, -1.6633212566375732, -1.332424283027649, -1.0015273094177246, -0.6706302165985107, -0.3397331237792969, -0.008836150169372559, 0.32206082344055176, 0.6529569625854492, 0.9838539958000183, 1.3147510290145874, 1.6456480026245117, 1.9765450954437256, 2.3074421882629395, 2.638339042663574, 2.969236135482788, 3.300133228302002, 3.631030321121216, 3.9619274139404297, 4.2928242683410645, 4.623721122741699, 4.954618453979492, 5.285515308380127, 5.616412162780762, 5.947309494018555, 6.2782063484191895, 6.609103679656982, 6.940000534057617, 7.27089786529541, 7.601794719696045, 7.93269157409668, 8.263588905334473, 8.594486236572266, 8.925383567810059, 9.256279945373535, 9.587177276611328, 9.918074607849121, 10.248971939086914, 10.57986831665039, 10.910765647888184, 11.24166202545166]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 11.0, 13.0, 14.0, 15.0, 22.0, 32.0, 40.0, 65.0, 132.0, 198.0, 348.0, 522.0, 838.0, 1307.0, 2113.0, 3507.0, 5622.0, 9309.0, 15926.0, 27006.0, 49402.0, 96869.0, 241062.0, 341296.0, 118360.0, 57590.0, 31750.0, 17689.0, 10809.0, 6468.0, 3810.0, 2345.0, 1514.0, 998.0, 575.0, 354.0, 207.0, 151.0, 89.0, 56.0, 32.0, 26.0, 19.0, 16.0, 7.0, 4.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.873046875, -2.777679443359375, -2.68231201171875, -2.586944580078125, -2.4915771484375, -2.396209716796875, -2.30084228515625, -2.205474853515625, -2.110107421875, -2.014739990234375, -1.91937255859375, -1.824005126953125, -1.7286376953125, -1.633270263671875, -1.53790283203125, -1.442535400390625, -1.34716796875, -1.251800537109375, -1.15643310546875, -1.061065673828125, -0.9656982421875, -0.870330810546875, -0.77496337890625, -0.679595947265625, -0.584228515625, -0.488861083984375, -0.39349365234375, -0.298126220703125, -0.2027587890625, -0.107391357421875, -0.01202392578125, 0.083343505859375, 0.1787109375, 0.274078369140625, 0.36944580078125, 0.464813232421875, 0.5601806640625, 0.655548095703125, 0.75091552734375, 0.846282958984375, 0.941650390625, 1.037017822265625, 1.13238525390625, 1.227752685546875, 1.3231201171875, 1.418487548828125, 1.51385498046875, 1.609222412109375, 1.70458984375, 1.799957275390625, 1.89532470703125, 1.990692138671875, 2.0860595703125, 2.181427001953125, 2.27679443359375, 2.372161865234375, 2.467529296875, 2.562896728515625, 2.65826416015625, 2.753631591796875, 2.8489990234375, 2.944366455078125, 3.03973388671875, 3.135101318359375, 3.23046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 10.0, 7.0, 8.0, 15.0, 21.0, 32.0, 34.0, 28.0, 33.0, 50.0, 44.0, 52.0, 49.0, 43.0, 49.0, 50.0, 57.0, 50.0, 56.0, 40.0, 37.0, 39.0, 39.0, 31.0, 26.0, 24.0, 16.0, 11.0, 14.0, 14.0, 1.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.29541015625, -9.9423828125, -9.58935546875, -9.236328125, -8.88330078125, -8.5302734375, -8.17724609375, -7.82421875, -7.47119140625, -7.1181640625, -6.76513671875, -6.412109375, -6.05908203125, -5.7060546875, -5.35302734375, -5.0, -4.64697265625, -4.2939453125, -3.94091796875, -3.587890625, -3.23486328125, -2.8818359375, -2.52880859375, -2.17578125, -1.82275390625, -1.4697265625, -1.11669921875, -0.763671875, -0.41064453125, -0.0576171875, 0.29541015625, 0.6484375, 1.00146484375, 1.3544921875, 1.70751953125, 2.060546875, 2.41357421875, 2.7666015625, 3.11962890625, 3.47265625, 3.82568359375, 4.1787109375, 4.53173828125, 4.884765625, 5.23779296875, 5.5908203125, 5.94384765625, 6.296875, 6.64990234375, 7.0029296875, 7.35595703125, 7.708984375, 8.06201171875, 8.4150390625, 8.76806640625, 9.12109375, 9.47412109375, 9.8271484375, 10.18017578125, 10.533203125, 10.88623046875, 11.2392578125, 11.59228515625, 11.9453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 11.0, 12.0, 21.0, 28.0, 36.0, 42.0, 65.0, 74.0, 95.0, 149.0, 203.0, 273.0, 373.0, 497.0, 708.0, 949.0, 1278.0, 1893.0, 2581.0, 3632.0, 5509.0, 7619.0, 11614.0, 17015.0, 25892.0, 39521.0, 61492.0, 104205.0, 231086.0, 241483.0, 106050.0, 62683.0, 40136.0, 25945.0, 17514.0, 11531.0, 7893.0, 5360.0, 3833.0, 2629.0, 1861.0, 1310.0, 928.0, 706.0, 494.0, 377.0, 251.0, 196.0, 128.0, 105.0, 85.0, 51.0, 44.0, 42.0, 14.0, 13.0, 14.0, 9.0, 1.0, 2.0, 4.0], "bins": [-2.068359375, -2.003753662109375, -1.93914794921875, -1.874542236328125, -1.8099365234375, -1.745330810546875, -1.68072509765625, -1.616119384765625, -1.551513671875, -1.486907958984375, -1.42230224609375, -1.357696533203125, -1.2930908203125, -1.228485107421875, -1.16387939453125, -1.099273681640625, -1.03466796875, -0.970062255859375, -0.90545654296875, -0.840850830078125, -0.7762451171875, -0.711639404296875, -0.64703369140625, -0.582427978515625, -0.517822265625, -0.453216552734375, -0.38861083984375, -0.324005126953125, -0.2593994140625, -0.194793701171875, -0.13018798828125, -0.065582275390625, -0.0009765625, 0.063629150390625, 0.12823486328125, 0.192840576171875, 0.2574462890625, 0.322052001953125, 0.38665771484375, 0.451263427734375, 0.515869140625, 0.580474853515625, 0.64508056640625, 0.709686279296875, 0.7742919921875, 0.838897705078125, 0.90350341796875, 0.968109130859375, 1.03271484375, 1.097320556640625, 1.16192626953125, 1.226531982421875, 1.2911376953125, 1.355743408203125, 1.42034912109375, 1.484954833984375, 1.549560546875, 1.614166259765625, 1.67877197265625, 1.743377685546875, 1.8079833984375, 1.872589111328125, 1.93719482421875, 2.001800537109375, 2.06640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 4.0, 11.0, 10.0, 8.0, 9.0, 14.0, 24.0, 16.0, 14.0, 19.0, 24.0, 27.0, 27.0, 35.0, 32.0, 28.0, 29.0, 34.0, 43.0, 44.0, 28.0, 33.0, 42.0, 36.0, 29.0, 31.0, 34.0, 38.0, 22.0, 29.0, 35.0, 20.0, 25.0, 29.0, 15.0, 16.0, 12.0, 13.0, 10.0, 10.0, 9.0, 5.0, 1.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-5.14453125, -4.989990234375, -4.83544921875, -4.680908203125, -4.5263671875, -4.371826171875, -4.21728515625, -4.062744140625, -3.908203125, -3.753662109375, -3.59912109375, -3.444580078125, -3.2900390625, -3.135498046875, -2.98095703125, -2.826416015625, -2.671875, -2.517333984375, -2.36279296875, -2.208251953125, -2.0537109375, -1.899169921875, -1.74462890625, -1.590087890625, -1.435546875, -1.281005859375, -1.12646484375, -0.971923828125, -0.8173828125, -0.662841796875, -0.50830078125, -0.353759765625, -0.19921875, -0.044677734375, 0.10986328125, 0.264404296875, 0.4189453125, 0.573486328125, 0.72802734375, 0.882568359375, 1.037109375, 1.191650390625, 1.34619140625, 1.500732421875, 1.6552734375, 1.809814453125, 1.96435546875, 2.118896484375, 2.2734375, 2.427978515625, 2.58251953125, 2.737060546875, 2.8916015625, 3.046142578125, 3.20068359375, 3.355224609375, 3.509765625, 3.664306640625, 3.81884765625, 3.973388671875, 4.1279296875, 4.282470703125, 4.43701171875, 4.591552734375, 4.74609375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 16.0, 16.0, 12.0, 19.0, 28.0, 45.0, 44.0, 56.0, 65.0, 88.0, 118.0, 150.0, 193.0, 291.0, 425.0, 612.0, 978.0, 1594.0, 2637.0, 4675.0, 8913.0, 17847.0, 39193.0, 99136.0, 314816.0, 358452.0, 113137.0, 43054.0, 19410.0, 9726.0, 5094.0, 2813.0, 1693.0, 1034.0, 651.0, 422.0, 297.0, 184.0, 161.0, 112.0, 72.0, 54.0, 47.0, 50.0, 33.0, 21.0, 13.0, 11.0, 16.0, 11.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.005290985107421875, -0.005130946636199951, -0.004970908164978027, -0.0048108696937561035, -0.00465083122253418, -0.004490792751312256, -0.004330754280090332, -0.004170715808868408, -0.004010677337646484, -0.0038506388664245605, -0.0036906003952026367, -0.003530561923980713, -0.003370523452758789, -0.0032104849815368652, -0.0030504465103149414, -0.0028904080390930176, -0.0027303695678710938, -0.00257033109664917, -0.002410292625427246, -0.0022502541542053223, -0.0020902156829833984, -0.0019301772117614746, -0.0017701387405395508, -0.001610100269317627, -0.0014500617980957031, -0.0012900233268737793, -0.0011299848556518555, -0.0009699463844299316, -0.0008099079132080078, -0.000649869441986084, -0.0004898309707641602, -0.00032979249954223633, -0.0001697540283203125, -9.715557098388672e-06, 0.00015032291412353516, 0.000310361385345459, 0.0004703998565673828, 0.0006304383277893066, 0.0007904767990112305, 0.0009505152702331543, 0.0011105537414550781, 0.001270592212677002, 0.0014306306838989258, 0.0015906691551208496, 0.0017507076263427734, 0.0019107460975646973, 0.002070784568786621, 0.002230823040008545, 0.0023908615112304688, 0.0025508999824523926, 0.0027109384536743164, 0.0028709769248962402, 0.003031015396118164, 0.003191053867340088, 0.0033510923385620117, 0.0035111308097839355, 0.0036711692810058594, 0.003831207752227783, 0.003991246223449707, 0.004151284694671631, 0.004311323165893555, 0.0044713616371154785, 0.004631400108337402, 0.004791438579559326, 0.00495147705078125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 3.0, 9.0, 12.0, 21.0, 13.0, 23.0, 21.0, 30.0, 35.0, 60.0, 24.0, 70.0, 41.0, 65.0, 73.0, 59.0, 72.0, 53.0, 66.0, 25.0, 49.0, 26.0, 32.0, 20.0, 30.0, 11.0, 14.0, 9.0, 12.0, 5.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0067901611328125e-06, -4.858709871768951e-06, -4.71062958240509e-06, -4.562549293041229e-06, -4.414469003677368e-06, -4.266388714313507e-06, -4.118308424949646e-06, -3.970228135585785e-06, -3.822147846221924e-06, -3.6740675568580627e-06, -3.5259872674942017e-06, -3.3779069781303406e-06, -3.2298266887664795e-06, -3.0817463994026184e-06, -2.9336661100387573e-06, -2.7855858206748962e-06, -2.637505531311035e-06, -2.489425241947174e-06, -2.341344952583313e-06, -2.193264663219452e-06, -2.045184373855591e-06, -1.8971040844917297e-06, -1.7490237951278687e-06, -1.6009435057640076e-06, -1.4528632164001465e-06, -1.3047829270362854e-06, -1.1567026376724243e-06, -1.0086223483085632e-06, -8.605420589447021e-07, -7.124617695808411e-07, -5.6438148021698e-07, -4.163011908531189e-07, -2.682209014892578e-07, -1.2014061212539673e-07, 2.7939677238464355e-08, 1.7601996660232544e-07, 3.241002559661865e-07, 4.721805453300476e-07, 6.202608346939087e-07, 7.683411240577698e-07, 9.164214134216309e-07, 1.064501702785492e-06, 1.212581992149353e-06, 1.3606622815132141e-06, 1.5087425708770752e-06, 1.6568228602409363e-06, 1.8049031496047974e-06, 1.9529834389686584e-06, 2.1010637283325195e-06, 2.2491440176963806e-06, 2.3972243070602417e-06, 2.5453045964241028e-06, 2.693384885787964e-06, 2.841465175151825e-06, 2.989545464515686e-06, 3.137625753879547e-06, 3.285706043243408e-06, 3.4337863326072693e-06, 3.5818666219711304e-06, 3.7299469113349915e-06, 3.8780272006988525e-06, 4.026107490062714e-06, 4.174187779426575e-06, 4.322268068790436e-06, 4.470348358154297e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 11.0, 18.0, 24.0, 31.0, 29.0, 56.0, 60.0, 80.0, 80.0, 146.0, 184.0, 285.0, 305.0, 479.0, 685.0, 934.0, 1401.0, 2185.0, 3676.0, 6374.0, 11815.0, 23336.0, 47067.0, 107744.0, 272901.0, 322738.0, 130637.0, 55874.0, 26689.0, 13558.0, 7360.0, 4128.0, 2455.0, 1527.0, 1026.0, 694.0, 553.0, 357.0, 250.0, 175.0, 178.0, 120.0, 80.0, 58.0, 65.0, 35.0, 15.0, 19.0, 10.0, 6.0, 16.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.004184722900390625, -0.004050195217132568, -0.003915667533874512, -0.003781139850616455, -0.0036466121673583984, -0.003512084484100342, -0.003377556800842285, -0.0032430291175842285, -0.003108501434326172, -0.0029739737510681152, -0.0028394460678100586, -0.002704918384552002, -0.0025703907012939453, -0.0024358630180358887, -0.002301335334777832, -0.0021668076515197754, -0.0020322799682617188, -0.0018977522850036621, -0.0017632246017456055, -0.0016286969184875488, -0.0014941692352294922, -0.0013596415519714355, -0.001225113868713379, -0.0010905861854553223, -0.0009560585021972656, -0.000821530818939209, -0.0006870031356811523, -0.0005524754524230957, -0.00041794776916503906, -0.0002834200859069824, -0.00014889240264892578, -1.436471939086914e-05, 0.0001201629638671875, 0.00025469064712524414, 0.0003892183303833008, 0.0005237460136413574, 0.0006582736968994141, 0.0007928013801574707, 0.0009273290634155273, 0.001061856746673584, 0.0011963844299316406, 0.0013309121131896973, 0.001465439796447754, 0.0015999674797058105, 0.0017344951629638672, 0.0018690228462219238, 0.0020035505294799805, 0.002138078212738037, 0.0022726058959960938, 0.0024071335792541504, 0.002541661262512207, 0.0026761889457702637, 0.0028107166290283203, 0.002945244312286377, 0.0030797719955444336, 0.0032142996788024902, 0.003348827362060547, 0.0034833550453186035, 0.00361788272857666, 0.003752410411834717, 0.0038869380950927734, 0.00402146577835083, 0.004155993461608887, 0.004290521144866943, 0.004425048828125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 6.0, 13.0, 12.0, 21.0, 23.0, 40.0, 49.0, 67.0, 86.0, 129.0, 130.0, 96.0, 83.0, 49.0, 53.0, 43.0, 28.0, 25.0, 20.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001712799072265625, -0.0016578733921051025, -0.00160294771194458, -0.0015480220317840576, -0.0014930963516235352, -0.0014381706714630127, -0.0013832449913024902, -0.0013283193111419678, -0.0012733936309814453, -0.0012184679508209229, -0.0011635422706604004, -0.001108616590499878, -0.0010536909103393555, -0.000998765230178833, -0.0009438395500183105, -0.0008889138698577881, -0.0008339881896972656, -0.0007790625095367432, -0.0007241368293762207, -0.0006692111492156982, -0.0006142854690551758, -0.0005593597888946533, -0.0005044341087341309, -0.0004495084285736084, -0.00039458274841308594, -0.0003396570682525635, -0.000284731388092041, -0.00022980570793151855, -0.0001748800277709961, -0.00011995434761047363, -6.502866744995117e-05, -1.0102987289428711e-05, 4.482269287109375e-05, 9.974837303161621e-05, 0.00015467405319213867, 0.00020959973335266113, 0.0002645254135131836, 0.00031945109367370605, 0.0003743767738342285, 0.000429302453994751, 0.00048422813415527344, 0.0005391538143157959, 0.0005940794944763184, 0.0006490051746368408, 0.0007039308547973633, 0.0007588565349578857, 0.0008137822151184082, 0.0008687078952789307, 0.0009236335754394531, 0.0009785592555999756, 0.001033484935760498, 0.0010884106159210205, 0.001143336296081543, 0.0011982619762420654, 0.0012531876564025879, 0.0013081133365631104, 0.0013630390167236328, 0.0014179646968841553, 0.0014728903770446777, 0.0015278160572052002, 0.0015827417373657227, 0.0016376674175262451, 0.0016925930976867676, 0.00174751877784729, 0.0018024444580078125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 10.0, 5.0, 23.0, 19.0, 23.0, 27.0, 34.0, 60.0, 76.0, 70.0, 92.0, 73.0, 84.0, 74.0, 69.0, 52.0, 46.0, 26.0, 26.0, 24.0, 10.0, 15.0, 9.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.434188842773438, -9.114850044250488, -8.795511245727539, -8.47617244720459, -8.15683364868164, -7.837494373321533, -7.518155097961426, -7.198816299438477, -6.879477500915527, -6.560138702392578, -6.240799903869629, -5.9214606285095215, -5.602121829986572, -5.282783031463623, -4.963443756103516, -4.644104957580566, -4.324766159057617, -4.005427360534668, -3.6860883235931396, -3.3667492866516113, -3.047410488128662, -2.728071689605713, -2.4087326526641846, -2.0893936157226562, -1.770054817199707, -1.4507158994674683, -1.1313769817352295, -0.8120380640029907, -0.49269914627075195, -0.17336022853851318, 0.14597868919372559, 0.4653177261352539, 0.7846565246582031, 1.103995442390442, 1.4233343601226807, 1.7426732778549194, 2.062012195587158, 2.3813509941101074, 2.7006900310516357, 3.020029067993164, 3.3393678665161133, 3.6587066650390625, 3.978045701980591, 4.297384738922119, 4.616723537445068, 4.936062335968018, 5.255401611328125, 5.574740409851074, 5.894079208374023, 6.213418006896973, 6.532756805419922, 6.852096080780029, 7.1714348793029785, 7.490773677825928, 7.810112953186035, 8.129451751708984, 8.448790550231934, 8.768129348754883, 9.087468147277832, 9.406806945800781, 9.726146697998047, 10.045485496520996, 10.364824295043945, 10.684163093566895, 11.003501892089844]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 12.0, 1.0, 6.0, 7.0, 17.0, 9.0, 15.0, 30.0, 32.0, 33.0, 37.0, 35.0, 45.0, 42.0, 37.0, 50.0, 49.0, 66.0, 42.0, 44.0, 49.0, 52.0, 36.0, 38.0, 45.0, 30.0, 25.0, 31.0, 21.0, 13.0, 16.0, 11.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.857563018798828, -9.527534484863281, -9.197505950927734, -8.867476463317871, -8.537447929382324, -8.207419395446777, -7.8773908615112305, -7.547362327575684, -7.2173333168029785, -6.887304782867432, -6.557275772094727, -6.22724723815918, -5.897218704223633, -5.567189693450928, -5.237161159515381, -4.907132148742676, -4.577103614807129, -4.247075080871582, -3.917046070098877, -3.58701753616333, -3.256988763809204, -2.926959991455078, -2.5969314575195312, -2.2669026851654053, -1.9368739128112793, -1.6068451404571533, -1.276816487312317, -0.9467877745628357, -0.6167590618133545, -0.2867302894592285, 0.04329836368560791, 0.37332701683044434, 0.7033567428588867, 1.0333855152130127, 1.3634141683578491, 1.6934428215026855, 2.0234715938568115, 2.3535003662109375, 2.6835289001464844, 3.0135576725006104, 3.3435864448547363, 3.6736152172088623, 4.003643989562988, 4.333672523498535, 4.663701057434082, 4.993730068206787, 5.323758602142334, 5.653787612915039, 5.983816146850586, 6.313844680786133, 6.643873691558838, 6.973902225494385, 7.30393123626709, 7.633959770202637, 7.963988304138184, 8.29401683807373, 8.624046325683594, 8.95407485961914, 9.284103393554688, 9.61413288116455, 9.944161415100098, 10.274189949035645, 10.604218482971191, 10.934247016906738, 11.264275550842285]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 9.0, 20.0, 21.0, 42.0, 58.0, 86.0, 147.0, 206.0, 338.0, 542.0, 891.0, 1466.0, 2374.0, 4041.0, 6760.0, 12044.0, 20787.0, 37642.0, 70129.0, 132482.0, 217315.0, 224683.0, 144376.0, 76934.0, 41204.0, 22648.0, 12729.0, 7380.0, 4464.0, 2629.0, 1555.0, 948.0, 575.0, 383.0, 201.0, 144.0, 89.0, 66.0, 54.0, 21.0, 14.0, 12.0, 11.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-17.28125, -16.7740478515625, -16.266845703125, -15.7596435546875, -15.25244140625, -14.7452392578125, -14.238037109375, -13.7308349609375, -13.2236328125, -12.7164306640625, -12.209228515625, -11.7020263671875, -11.19482421875, -10.6876220703125, -10.180419921875, -9.6732177734375, -9.166015625, -8.6588134765625, -8.151611328125, -7.6444091796875, -7.13720703125, -6.6300048828125, -6.122802734375, -5.6156005859375, -5.1083984375, -4.6011962890625, -4.093994140625, -3.5867919921875, -3.07958984375, -2.5723876953125, -2.065185546875, -1.5579833984375, -1.05078125, -0.5435791015625, -0.036376953125, 0.4708251953125, 0.97802734375, 1.4852294921875, 1.992431640625, 2.4996337890625, 3.0068359375, 3.5140380859375, 4.021240234375, 4.5284423828125, 5.03564453125, 5.5428466796875, 6.050048828125, 6.5572509765625, 7.064453125, 7.5716552734375, 8.078857421875, 8.5860595703125, 9.09326171875, 9.6004638671875, 10.107666015625, 10.6148681640625, 11.1220703125, 11.6292724609375, 12.136474609375, 12.6436767578125, 13.15087890625, 13.6580810546875, 14.165283203125, 14.6724853515625, 15.1796875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 8.0, 9.0, 11.0, 19.0, 19.0, 20.0, 29.0, 40.0, 33.0, 30.0, 43.0, 44.0, 49.0, 55.0, 53.0, 51.0, 46.0, 53.0, 49.0, 41.0, 37.0, 25.0, 52.0, 38.0, 28.0, 17.0, 21.0, 24.0, 10.0, 12.0, 9.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.06396484375, -7.7607421875, -7.45751953125, -7.154296875, -6.85107421875, -6.5478515625, -6.24462890625, -5.94140625, -5.63818359375, -5.3349609375, -5.03173828125, -4.728515625, -4.42529296875, -4.1220703125, -3.81884765625, -3.515625, -3.21240234375, -2.9091796875, -2.60595703125, -2.302734375, -1.99951171875, -1.6962890625, -1.39306640625, -1.08984375, -0.78662109375, -0.4833984375, -0.18017578125, 0.123046875, 0.42626953125, 0.7294921875, 1.03271484375, 1.3359375, 1.63916015625, 1.9423828125, 2.24560546875, 2.548828125, 2.85205078125, 3.1552734375, 3.45849609375, 3.76171875, 4.06494140625, 4.3681640625, 4.67138671875, 4.974609375, 5.27783203125, 5.5810546875, 5.88427734375, 6.1875, 6.49072265625, 6.7939453125, 7.09716796875, 7.400390625, 7.70361328125, 8.0068359375, 8.31005859375, 8.61328125, 8.91650390625, 9.2197265625, 9.52294921875, 9.826171875, 10.12939453125, 10.4326171875, 10.73583984375, 11.0390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 8.0, 9.0, 13.0, 16.0, 24.0, 39.0, 62.0, 101.0, 153.0, 254.0, 364.0, 550.0, 867.0, 1248.0, 1966.0, 2773.0, 4264.0, 6383.0, 9681.0, 15127.0, 22730.0, 35441.0, 54846.0, 87236.0, 132321.0, 172092.0, 164415.0, 119292.0, 76644.0, 49008.0, 31310.0, 20105.0, 13350.0, 8646.0, 5698.0, 3931.0, 2623.0, 1694.0, 1130.0, 735.0, 484.0, 345.0, 192.0, 135.0, 94.0, 65.0, 38.0, 26.0, 15.0, 7.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-12.78125, -12.392333984375, -12.00341796875, -11.614501953125, -11.2255859375, -10.836669921875, -10.44775390625, -10.058837890625, -9.669921875, -9.281005859375, -8.89208984375, -8.503173828125, -8.1142578125, -7.725341796875, -7.33642578125, -6.947509765625, -6.55859375, -6.169677734375, -5.78076171875, -5.391845703125, -5.0029296875, -4.614013671875, -4.22509765625, -3.836181640625, -3.447265625, -3.058349609375, -2.66943359375, -2.280517578125, -1.8916015625, -1.502685546875, -1.11376953125, -0.724853515625, -0.3359375, 0.052978515625, 0.44189453125, 0.830810546875, 1.2197265625, 1.608642578125, 1.99755859375, 2.386474609375, 2.775390625, 3.164306640625, 3.55322265625, 3.942138671875, 4.3310546875, 4.719970703125, 5.10888671875, 5.497802734375, 5.88671875, 6.275634765625, 6.66455078125, 7.053466796875, 7.4423828125, 7.831298828125, 8.22021484375, 8.609130859375, 8.998046875, 9.386962890625, 9.77587890625, 10.164794921875, 10.5537109375, 10.942626953125, 11.33154296875, 11.720458984375, 12.109375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 6.0, 9.0, 6.0, 10.0, 10.0, 12.0, 11.0, 16.0, 18.0, 15.0, 28.0, 28.0, 24.0, 31.0, 29.0, 21.0, 28.0, 29.0, 37.0, 34.0, 33.0, 31.0, 31.0, 32.0, 41.0, 27.0, 26.0, 29.0, 30.0, 26.0, 29.0, 29.0, 28.0, 28.0, 25.0, 18.0, 28.0, 12.0, 21.0, 14.0, 10.0, 10.0, 9.0, 4.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.484375, -4.343994140625, -4.20361328125, -4.063232421875, -3.9228515625, -3.782470703125, -3.64208984375, -3.501708984375, -3.361328125, -3.220947265625, -3.08056640625, -2.940185546875, -2.7998046875, -2.659423828125, -2.51904296875, -2.378662109375, -2.23828125, -2.097900390625, -1.95751953125, -1.817138671875, -1.6767578125, -1.536376953125, -1.39599609375, -1.255615234375, -1.115234375, -0.974853515625, -0.83447265625, -0.694091796875, -0.5537109375, -0.413330078125, -0.27294921875, -0.132568359375, 0.0078125, 0.148193359375, 0.28857421875, 0.428955078125, 0.5693359375, 0.709716796875, 0.85009765625, 0.990478515625, 1.130859375, 1.271240234375, 1.41162109375, 1.552001953125, 1.6923828125, 1.832763671875, 1.97314453125, 2.113525390625, 2.25390625, 2.394287109375, 2.53466796875, 2.675048828125, 2.8154296875, 2.955810546875, 3.09619140625, 3.236572265625, 3.376953125, 3.517333984375, 3.65771484375, 3.798095703125, 3.9384765625, 4.078857421875, 4.21923828125, 4.359619140625, 4.5]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 12.0, 12.0, 18.0, 26.0, 30.0, 55.0, 60.0, 83.0, 135.0, 210.0, 289.0, 430.0, 594.0, 918.0, 1470.0, 2347.0, 3704.0, 6189.0, 10590.0, 19435.0, 38249.0, 85697.0, 259075.0, 381003.0, 127188.0, 51903.0, 25085.0, 13589.0, 7656.0, 4470.0, 2874.0, 1746.0, 1119.0, 732.0, 484.0, 296.0, 240.0, 166.0, 106.0, 96.0, 47.0, 34.0, 29.0, 12.0, 10.0, 15.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-2.197265625, -2.1290283203125, -2.060791015625, -1.9925537109375, -1.92431640625, -1.8560791015625, -1.787841796875, -1.7196044921875, -1.6513671875, -1.5831298828125, -1.514892578125, -1.4466552734375, -1.37841796875, -1.3101806640625, -1.241943359375, -1.1737060546875, -1.10546875, -1.0372314453125, -0.968994140625, -0.9007568359375, -0.83251953125, -0.7642822265625, -0.696044921875, -0.6278076171875, -0.5595703125, -0.4913330078125, -0.423095703125, -0.3548583984375, -0.28662109375, -0.2183837890625, -0.150146484375, -0.0819091796875, -0.013671875, 0.0545654296875, 0.122802734375, 0.1910400390625, 0.25927734375, 0.3275146484375, 0.395751953125, 0.4639892578125, 0.5322265625, 0.6004638671875, 0.668701171875, 0.7369384765625, 0.80517578125, 0.8734130859375, 0.941650390625, 1.0098876953125, 1.078125, 1.1463623046875, 1.214599609375, 1.2828369140625, 1.35107421875, 1.4193115234375, 1.487548828125, 1.5557861328125, 1.6240234375, 1.6922607421875, 1.760498046875, 1.8287353515625, 1.89697265625, 1.9652099609375, 2.033447265625, 2.1016845703125, 2.169921875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 0.0, 5.0, 6.0, 8.0, 13.0, 11.0, 10.0, 30.0, 21.0, 39.0, 46.0, 74.0, 79.0, 86.0, 84.0, 83.0, 87.0, 74.0, 58.0, 44.0, 33.0, 25.0, 25.0, 14.0, 10.0, 9.0, 11.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00012934207916259766, -0.00012591015547513962, -0.00012247823178768158, -0.00011904630810022354, -0.0001156143844127655, -0.00011218246072530746, -0.00010875053703784943, -0.00010531861335039139, -0.00010188668966293335, -9.845476597547531e-05, -9.502284228801727e-05, -9.159091860055923e-05, -8.81589949131012e-05, -8.472707122564316e-05, -8.129514753818512e-05, -7.786322385072708e-05, -7.443130016326904e-05, -7.0999376475811e-05, -6.756745278835297e-05, -6.413552910089493e-05, -6.070360541343689e-05, -5.727168172597885e-05, -5.383975803852081e-05, -5.0407834351062775e-05, -4.6975910663604736e-05, -4.35439869761467e-05, -4.011206328868866e-05, -3.668013960123062e-05, -3.324821591377258e-05, -2.9816292226314545e-05, -2.6384368538856506e-05, -2.2952444851398468e-05, -1.952052116394043e-05, -1.608859747648239e-05, -1.2656673789024353e-05, -9.224750101566315e-06, -5.792826414108276e-06, -2.360902726650238e-06, 1.0710209608078003e-06, 4.502944648265839e-06, 7.934868335723877e-06, 1.1366792023181915e-05, 1.4798715710639954e-05, 1.8230639398097992e-05, 2.166256308555603e-05, 2.509448677301407e-05, 2.8526410460472107e-05, 3.1958334147930145e-05, 3.5390257835388184e-05, 3.882218152284622e-05, 4.225410521030426e-05, 4.56860288977623e-05, 4.911795258522034e-05, 5.2549876272678375e-05, 5.5981799960136414e-05, 5.941372364759445e-05, 6.284564733505249e-05, 6.627757102251053e-05, 6.970949470996857e-05, 7.31414183974266e-05, 7.657334208488464e-05, 8.000526577234268e-05, 8.343718945980072e-05, 8.686911314725876e-05, 9.03010368347168e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 12.0, 10.0, 27.0, 33.0, 62.0, 78.0, 138.0, 170.0, 287.0, 437.0, 695.0, 1124.0, 1904.0, 3210.0, 5801.0, 10594.0, 19917.0, 41741.0, 111277.0, 401540.0, 295347.0, 82291.0, 34259.0, 16721.0, 8817.0, 4832.0, 2773.0, 1610.0, 1061.0, 649.0, 400.0, 253.0, 159.0, 89.0, 73.0, 58.0, 27.0, 19.0, 16.0, 10.0, 6.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.640625, -2.562652587890625, -2.48468017578125, -2.406707763671875, -2.3287353515625, -2.250762939453125, -2.17279052734375, -2.094818115234375, -2.016845703125, -1.938873291015625, -1.86090087890625, -1.782928466796875, -1.7049560546875, -1.626983642578125, -1.54901123046875, -1.471038818359375, -1.39306640625, -1.315093994140625, -1.23712158203125, -1.159149169921875, -1.0811767578125, -1.003204345703125, -0.92523193359375, -0.847259521484375, -0.769287109375, -0.691314697265625, -0.61334228515625, -0.535369873046875, -0.4573974609375, -0.379425048828125, -0.30145263671875, -0.223480224609375, -0.1455078125, -0.067535400390625, 0.01043701171875, 0.088409423828125, 0.1663818359375, 0.244354248046875, 0.32232666015625, 0.400299072265625, 0.478271484375, 0.556243896484375, 0.63421630859375, 0.712188720703125, 0.7901611328125, 0.868133544921875, 0.94610595703125, 1.024078369140625, 1.10205078125, 1.180023193359375, 1.25799560546875, 1.335968017578125, 1.4139404296875, 1.491912841796875, 1.56988525390625, 1.647857666015625, 1.725830078125, 1.803802490234375, 1.88177490234375, 1.959747314453125, 2.0377197265625, 2.115692138671875, 2.19366455078125, 2.271636962890625, 2.349609375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 2.0, 3.0, 9.0, 8.0, 11.0, 4.0, 17.0, 10.0, 22.0, 25.0, 25.0, 41.0, 54.0, 77.0, 87.0, 78.0, 90.0, 90.0, 73.0, 60.0, 43.0, 32.0, 20.0, 25.0, 30.0, 23.0, 12.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.8973464965820312, -0.8703765869140625, -0.8434066772460938, -0.816436767578125, -0.7894668579101562, -0.7624969482421875, -0.7355270385742188, -0.70855712890625, -0.6815872192382812, -0.6546173095703125, -0.6276473999023438, -0.600677490234375, -0.5737075805664062, -0.5467376708984375, -0.5197677612304688, -0.4927978515625, -0.46582794189453125, -0.4388580322265625, -0.41188812255859375, -0.384918212890625, -0.35794830322265625, -0.3309783935546875, -0.30400848388671875, -0.27703857421875, -0.25006866455078125, -0.2230987548828125, -0.19612884521484375, -0.169158935546875, -0.14218902587890625, -0.1152191162109375, -0.08824920654296875, -0.061279296875, -0.03430938720703125, -0.0073394775390625, 0.01963043212890625, 0.046600341796875, 0.07357025146484375, 0.1005401611328125, 0.12751007080078125, 0.15447998046875, 0.18144989013671875, 0.2084197998046875, 0.23538970947265625, 0.262359619140625, 0.28932952880859375, 0.3162994384765625, 0.34326934814453125, 0.3702392578125, 0.39720916748046875, 0.4241790771484375, 0.45114898681640625, 0.478118896484375, 0.5050888061523438, 0.5320587158203125, 0.5590286254882812, 0.58599853515625, 0.6129684448242188, 0.6399383544921875, 0.6669082641601562, 0.693878173828125, 0.7208480834960938, 0.7478179931640625, 0.7747879028320312, 0.8017578125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 5.0, 8.0, 12.0, 13.0, 10.0, 24.0, 31.0, 35.0, 43.0, 72.0, 61.0, 77.0, 108.0, 88.0, 90.0, 61.0, 52.0, 39.0, 38.0, 30.0, 18.0, 16.0, 14.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.078577995300293, -11.740821838378906, -11.403064727783203, -11.065308570861816, -10.72755241394043, -10.389795303344727, -10.05203914642334, -9.714282989501953, -9.37652587890625, -9.038769721984863, -8.70101261138916, -8.363256454467773, -8.02549934387207, -7.687743186950684, -7.349987030029297, -7.012230396270752, -6.674473762512207, -6.336717128753662, -5.998960494995117, -5.6612043380737305, -5.3234477043151855, -4.985691070556641, -4.647934913635254, -4.310178279876709, -3.972421646118164, -3.634665012359619, -3.2969086170196533, -2.9591522216796875, -2.6213955879211426, -2.2836389541625977, -1.9458825588226318, -1.608126163482666, -1.270369529724121, -0.9326130151748657, -0.5948565006256104, -0.257099986076355, 0.08065652847290039, 0.41841304302215576, 0.7561695575714111, 1.093925952911377, 1.4316825866699219, 1.7694391012191772, 2.1071956157684326, 2.4449520111083984, 2.7827086448669434, 3.1204652786254883, 3.458221673965454, 3.79597806930542, 4.133734703063965, 4.47149133682251, 4.809247970581055, 5.147004127502441, 5.484760761260986, 5.822517395019531, 6.160273551940918, 6.498030185699463, 6.835786819458008, 7.173543453216553, 7.511300086975098, 7.849056243896484, 8.186813354492188, 8.524569511413574, 8.862325668334961, 9.200082778930664, 9.53783893585205]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 9.0, 8.0, 11.0, 21.0, 16.0, 23.0, 23.0, 30.0, 40.0, 36.0, 44.0, 38.0, 32.0, 57.0, 48.0, 43.0, 45.0, 35.0, 42.0, 44.0, 49.0, 34.0, 37.0, 40.0, 23.0, 33.0, 26.0, 19.0, 25.0, 14.0, 12.0, 12.0, 9.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.963143348693848, -9.6455078125, -9.327871322631836, -9.010235786437988, -8.69260025024414, -8.374964714050293, -8.057329177856445, -7.739692687988281, -7.422057151794434, -7.104421615600586, -6.78678560256958, -6.469149589538574, -6.151514053344727, -5.833878517150879, -5.516242504119873, -5.198606491088867, -4.8809709548950195, -4.563335418701172, -4.245699405670166, -3.9280636310577393, -3.6104278564453125, -3.2927920818328857, -2.975156307220459, -2.6575205326080322, -2.3398847579956055, -2.0222489833831787, -1.704613208770752, -1.3869774341583252, -1.0693416595458984, -0.7517058849334717, -0.4340701103210449, -0.11643433570861816, 0.2012014389038086, 0.5188372135162354, 0.8364729881286621, 1.1541087627410889, 1.4717445373535156, 1.7893803119659424, 2.107016086578369, 2.424651861190796, 2.7422876358032227, 3.0599234104156494, 3.377559185028076, 3.695194959640503, 4.01283073425293, 4.330466270446777, 4.648102283477783, 4.965738296508789, 5.283373832702637, 5.601009368896484, 5.91864538192749, 6.236281394958496, 6.553916931152344, 6.871552467346191, 7.189188480377197, 7.506824493408203, 7.824460029602051, 8.142095565795898, 8.459732055664062, 8.77736759185791, 9.095003128051758, 9.412638664245605, 9.730274200439453, 10.047910690307617, 10.365546226501465]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 14.0, 23.0, 24.0, 40.0, 61.0, 106.0, 185.0, 259.0, 518.0, 766.0, 1353.0, 2193.0, 3701.0, 6927.0, 12307.0, 23566.0, 45464.0, 91752.0, 221772.0, 868851.0, 1886234.0, 672044.0, 185477.0, 81719.0, 40658.0, 21216.0, 11536.0, 6421.0, 3635.0, 2141.0, 1256.0, 802.0, 453.0, 279.0, 179.0, 131.0, 68.0, 53.0, 28.0, 19.0, 16.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.046875, -15.5518798828125, -15.056884765625, -14.5618896484375, -14.06689453125, -13.5718994140625, -13.076904296875, -12.5819091796875, -12.0869140625, -11.5919189453125, -11.096923828125, -10.6019287109375, -10.10693359375, -9.6119384765625, -9.116943359375, -8.6219482421875, -8.126953125, -7.6319580078125, -7.136962890625, -6.6419677734375, -6.14697265625, -5.6519775390625, -5.156982421875, -4.6619873046875, -4.1669921875, -3.6719970703125, -3.177001953125, -2.6820068359375, -2.18701171875, -1.6920166015625, -1.197021484375, -0.7020263671875, -0.20703125, 0.2879638671875, 0.782958984375, 1.2779541015625, 1.77294921875, 2.2679443359375, 2.762939453125, 3.2579345703125, 3.7529296875, 4.2479248046875, 4.742919921875, 5.2379150390625, 5.73291015625, 6.2279052734375, 6.722900390625, 7.2178955078125, 7.712890625, 8.2078857421875, 8.702880859375, 9.1978759765625, 9.69287109375, 10.1878662109375, 10.682861328125, 11.1778564453125, 11.6728515625, 12.1678466796875, 12.662841796875, 13.1578369140625, 13.65283203125, 14.1478271484375, 14.642822265625, 15.1378173828125, 15.6328125]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 9.0, 9.0, 17.0, 12.0, 21.0, 13.0, 26.0, 34.0, 43.0, 33.0, 26.0, 46.0, 42.0, 56.0, 50.0, 42.0, 55.0, 49.0, 36.0, 39.0, 43.0, 33.0, 40.0, 37.0, 32.0, 32.0, 26.0, 19.0, 16.0, 17.0, 15.0, 10.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1640625, -8.8814697265625, -8.598876953125, -8.3162841796875, -8.03369140625, -7.7510986328125, -7.468505859375, -7.1859130859375, -6.9033203125, -6.6207275390625, -6.338134765625, -6.0555419921875, -5.77294921875, -5.4903564453125, -5.207763671875, -4.9251708984375, -4.642578125, -4.3599853515625, -4.077392578125, -3.7947998046875, -3.51220703125, -3.2296142578125, -2.947021484375, -2.6644287109375, -2.3818359375, -2.0992431640625, -1.816650390625, -1.5340576171875, -1.25146484375, -0.9688720703125, -0.686279296875, -0.4036865234375, -0.12109375, 0.1614990234375, 0.444091796875, 0.7266845703125, 1.00927734375, 1.2918701171875, 1.574462890625, 1.8570556640625, 2.1396484375, 2.4222412109375, 2.704833984375, 2.9874267578125, 3.27001953125, 3.5526123046875, 3.835205078125, 4.1177978515625, 4.400390625, 4.6829833984375, 4.965576171875, 5.2481689453125, 5.53076171875, 5.8133544921875, 6.095947265625, 6.3785400390625, 6.6611328125, 6.9437255859375, 7.226318359375, 7.5089111328125, 7.79150390625, 8.0740966796875, 8.356689453125, 8.6392822265625, 8.921875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 16.0, 24.0, 41.0, 43.0, 82.0, 142.0, 236.0, 390.0, 715.0, 1148.0, 1811.0, 2952.0, 4932.0, 7960.0, 12732.0, 21649.0, 36813.0, 66332.0, 123667.0, 245910.0, 537847.0, 1247056.0, 1012055.0, 429115.0, 202285.0, 103624.0, 55503.0, 31556.0, 18698.0, 11337.0, 6874.0, 4148.0, 2643.0, 1507.0, 932.0, 591.0, 366.0, 212.0, 112.0, 83.0, 52.0, 35.0, 19.0, 11.0, 7.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.271240234375, -10.91748046875, -10.563720703125, -10.2099609375, -9.856201171875, -9.50244140625, -9.148681640625, -8.794921875, -8.441162109375, -8.08740234375, -7.733642578125, -7.3798828125, -7.026123046875, -6.67236328125, -6.318603515625, -5.96484375, -5.611083984375, -5.25732421875, -4.903564453125, -4.5498046875, -4.196044921875, -3.84228515625, -3.488525390625, -3.134765625, -2.781005859375, -2.42724609375, -2.073486328125, -1.7197265625, -1.365966796875, -1.01220703125, -0.658447265625, -0.3046875, 0.049072265625, 0.40283203125, 0.756591796875, 1.1103515625, 1.464111328125, 1.81787109375, 2.171630859375, 2.525390625, 2.879150390625, 3.23291015625, 3.586669921875, 3.9404296875, 4.294189453125, 4.64794921875, 5.001708984375, 5.35546875, 5.709228515625, 6.06298828125, 6.416748046875, 6.7705078125, 7.124267578125, 7.47802734375, 7.831787109375, 8.185546875, 8.539306640625, 8.89306640625, 9.246826171875, 9.6005859375, 9.954345703125, 10.30810546875, 10.661865234375, 11.015625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 9.0, 6.0, 8.0, 11.0, 25.0, 27.0, 33.0, 31.0, 34.0, 49.0, 72.0, 80.0, 91.0, 114.0, 147.0, 184.0, 235.0, 246.0, 330.0, 380.0, 341.0, 335.0, 268.0, 194.0, 161.0, 137.0, 96.0, 94.0, 59.0, 50.0, 50.0, 34.0, 32.0, 16.0, 20.0, 17.0, 12.0, 16.0, 10.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.53515625, -4.39666748046875, -4.2581787109375, -4.11968994140625, -3.981201171875, -3.84271240234375, -3.7042236328125, -3.56573486328125, -3.42724609375, -3.28875732421875, -3.1502685546875, -3.01177978515625, -2.873291015625, -2.73480224609375, -2.5963134765625, -2.45782470703125, -2.3193359375, -2.18084716796875, -2.0423583984375, -1.90386962890625, -1.765380859375, -1.62689208984375, -1.4884033203125, -1.34991455078125, -1.21142578125, -1.07293701171875, -0.9344482421875, -0.79595947265625, -0.657470703125, -0.51898193359375, -0.3804931640625, -0.24200439453125, -0.103515625, 0.03497314453125, 0.1734619140625, 0.31195068359375, 0.450439453125, 0.58892822265625, 0.7274169921875, 0.86590576171875, 1.00439453125, 1.14288330078125, 1.2813720703125, 1.41986083984375, 1.558349609375, 1.69683837890625, 1.8353271484375, 1.97381591796875, 2.1123046875, 2.25079345703125, 2.3892822265625, 2.52777099609375, 2.666259765625, 2.80474853515625, 2.9432373046875, 3.08172607421875, 3.22021484375, 3.35870361328125, 3.4971923828125, 3.63568115234375, 3.774169921875, 3.91265869140625, 4.0511474609375, 4.18963623046875, 4.328125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 10.0, 10.0, 9.0, 29.0, 18.0, 33.0, 42.0, 55.0, 59.0, 64.0, 92.0, 102.0, 100.0, 85.0, 65.0, 53.0, 41.0, 29.0, 21.0, 14.0, 11.0, 16.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.589468955993652, -12.235082626342773, -11.880695343017578, -11.5263090133667, -11.17192268371582, -10.817535400390625, -10.463149070739746, -10.108762741088867, -9.754375457763672, -9.399989128112793, -9.045601844787598, -8.691215515136719, -8.336828231811523, -7.9824419021606445, -7.628055572509766, -7.2736687660217285, -6.919281959533691, -6.564895153045654, -6.210508346557617, -5.856122016906738, -5.501735210418701, -5.147348403930664, -4.792962074279785, -4.438575267791748, -4.084188461303711, -3.729801654815674, -3.375415086746216, -3.021028518676758, -2.6666417121887207, -2.3122549057006836, -1.9578683376312256, -1.6034817695617676, -1.2490949630737305, -0.8947082757949829, -0.5403215885162354, -0.1859349012374878, 0.16845178604125977, 0.5228384733200073, 0.8772251605987549, 1.231611728668213, 1.58599853515625, 1.9403852224349976, 2.294771909713745, 2.649158477783203, 3.0035452842712402, 3.3579320907592773, 3.7123186588287354, 4.066705226898193, 4.4210920333862305, 4.775478839874268, 5.129865646362305, 5.484251976013184, 5.838638782501221, 6.193025588989258, 6.547411918640137, 6.901798725128174, 7.256185531616211, 7.610572338104248, 7.964959144592285, 8.319345474243164, 8.67373275756836, 9.028119087219238, 9.382505416870117, 9.736892700195312, 10.091279029846191]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 7.0, 15.0, 13.0, 16.0, 24.0, 26.0, 23.0, 33.0, 38.0, 40.0, 31.0, 44.0, 34.0, 44.0, 44.0, 37.0, 25.0, 47.0, 44.0, 48.0, 37.0, 39.0, 37.0, 32.0, 21.0, 30.0, 21.0, 21.0, 25.0, 22.0, 17.0, 7.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.862984657287598, -8.572951316833496, -8.282917022705078, -7.992883682250977, -7.702850341796875, -7.412816524505615, -7.1227827072143555, -6.832749366760254, -6.542716026306152, -6.252682209014893, -5.962648868560791, -5.672615051269531, -5.38258171081543, -5.09254789352417, -4.80251407623291, -4.512480735778809, -4.222446918487549, -3.932413339614868, -3.6423797607421875, -3.3523459434509277, -3.062312602996826, -2.7722787857055664, -2.4822452068328857, -2.192211627960205, -1.9021780490875244, -1.6121444702148438, -1.322110891342163, -1.0320771932601929, -0.7420436143875122, -0.45201003551483154, -0.16197633743286133, 0.12805724143981934, 0.4180908203125, 0.7081243991851807, 0.9981580376625061, 1.2881916761398315, 1.5782252550125122, 1.8682588338851929, 2.158292531967163, 2.4483261108398438, 2.7383596897125244, 3.028393268585205, 3.3184268474578857, 3.6084604263305664, 3.898494243621826, 4.188527584075928, 4.4785614013671875, 4.768594741821289, 5.058628559112549, 5.348662376403809, 5.63869571685791, 5.92872953414917, 6.2187628746032715, 6.508796691894531, 6.798830032348633, 7.088863849639893, 7.378897666931152, 7.668931484222412, 7.958964824676514, 8.248998641967773, 8.539031982421875, 8.829065322875977, 9.119099617004395, 9.409132957458496, 9.699166297912598]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 9.0, 4.0, 15.0, 17.0, 26.0, 38.0, 49.0, 87.0, 143.0, 185.0, 330.0, 517.0, 761.0, 1206.0, 1762.0, 2881.0, 4528.0, 7170.0, 11149.0, 17954.0, 29125.0, 48220.0, 83093.0, 165573.0, 349747.0, 137469.0, 72812.0, 43237.0, 25977.0, 16415.0, 10279.0, 6325.0, 4142.0, 2613.0, 1638.0, 1100.0, 685.0, 419.0, 282.0, 190.0, 120.0, 98.0, 63.0, 35.0, 27.0, 14.0, 8.0, 11.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.810546875, -2.72882080078125, -2.6470947265625, -2.56536865234375, -2.483642578125, -2.40191650390625, -2.3201904296875, -2.23846435546875, -2.15673828125, -2.07501220703125, -1.9932861328125, -1.91156005859375, -1.829833984375, -1.74810791015625, -1.6663818359375, -1.58465576171875, -1.5029296875, -1.42120361328125, -1.3394775390625, -1.25775146484375, -1.176025390625, -1.09429931640625, -1.0125732421875, -0.93084716796875, -0.84912109375, -0.76739501953125, -0.6856689453125, -0.60394287109375, -0.522216796875, -0.44049072265625, -0.3587646484375, -0.27703857421875, -0.1953125, -0.11358642578125, -0.0318603515625, 0.04986572265625, 0.131591796875, 0.21331787109375, 0.2950439453125, 0.37677001953125, 0.45849609375, 0.54022216796875, 0.6219482421875, 0.70367431640625, 0.785400390625, 0.86712646484375, 0.9488525390625, 1.03057861328125, 1.1123046875, 1.19403076171875, 1.2757568359375, 1.35748291015625, 1.439208984375, 1.52093505859375, 1.6026611328125, 1.68438720703125, 1.76611328125, 1.84783935546875, 1.9295654296875, 2.01129150390625, 2.093017578125, 2.17474365234375, 2.2564697265625, 2.33819580078125, 2.419921875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 11.0, 11.0, 9.0, 10.0, 18.0, 25.0, 23.0, 35.0, 26.0, 27.0, 37.0, 31.0, 43.0, 37.0, 53.0, 40.0, 33.0, 44.0, 47.0, 39.0, 38.0, 42.0, 38.0, 30.0, 42.0, 22.0, 26.0, 28.0, 18.0, 29.0, 17.0, 16.0, 12.0, 9.0, 9.0, 5.0, 2.0, 7.0, 2.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7578125, -8.462158203125, -8.16650390625, -7.870849609375, -7.5751953125, -7.279541015625, -6.98388671875, -6.688232421875, -6.392578125, -6.096923828125, -5.80126953125, -5.505615234375, -5.2099609375, -4.914306640625, -4.61865234375, -4.322998046875, -4.02734375, -3.731689453125, -3.43603515625, -3.140380859375, -2.8447265625, -2.549072265625, -2.25341796875, -1.957763671875, -1.662109375, -1.366455078125, -1.07080078125, -0.775146484375, -0.4794921875, -0.183837890625, 0.11181640625, 0.407470703125, 0.703125, 0.998779296875, 1.29443359375, 1.590087890625, 1.8857421875, 2.181396484375, 2.47705078125, 2.772705078125, 3.068359375, 3.364013671875, 3.65966796875, 3.955322265625, 4.2509765625, 4.546630859375, 4.84228515625, 5.137939453125, 5.43359375, 5.729248046875, 6.02490234375, 6.320556640625, 6.6162109375, 6.911865234375, 7.20751953125, 7.503173828125, 7.798828125, 8.094482421875, 8.39013671875, 8.685791015625, 8.9814453125, 9.277099609375, 9.57275390625, 9.868408203125, 10.1640625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 15.0, 18.0, 21.0, 30.0, 63.0, 86.0, 135.0, 188.0, 264.0, 364.0, 490.0, 752.0, 1177.0, 1581.0, 2440.0, 3826.0, 5642.0, 8887.0, 13900.0, 22633.0, 36661.0, 62411.0, 110389.0, 258648.0, 249502.0, 109049.0, 61335.0, 36568.0, 22111.0, 13850.0, 8716.0, 5615.0, 3595.0, 2391.0, 1648.0, 1096.0, 739.0, 515.0, 395.0, 230.0, 167.0, 104.0, 104.0, 67.0, 41.0, 37.0, 18.0, 13.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.5234375, -2.444549560546875, -2.36566162109375, -2.286773681640625, -2.2078857421875, -2.128997802734375, -2.05010986328125, -1.971221923828125, -1.892333984375, -1.813446044921875, -1.73455810546875, -1.655670166015625, -1.5767822265625, -1.497894287109375, -1.41900634765625, -1.340118408203125, -1.26123046875, -1.182342529296875, -1.10345458984375, -1.024566650390625, -0.9456787109375, -0.866790771484375, -0.78790283203125, -0.709014892578125, -0.630126953125, -0.551239013671875, -0.47235107421875, -0.393463134765625, -0.3145751953125, -0.235687255859375, -0.15679931640625, -0.077911376953125, 0.0009765625, 0.079864501953125, 0.15875244140625, 0.237640380859375, 0.3165283203125, 0.395416259765625, 0.47430419921875, 0.553192138671875, 0.632080078125, 0.710968017578125, 0.78985595703125, 0.868743896484375, 0.9476318359375, 1.026519775390625, 1.10540771484375, 1.184295654296875, 1.26318359375, 1.342071533203125, 1.42095947265625, 1.499847412109375, 1.5787353515625, 1.657623291015625, 1.73651123046875, 1.815399169921875, 1.894287109375, 1.973175048828125, 2.05206298828125, 2.130950927734375, 2.2098388671875, 2.288726806640625, 2.36761474609375, 2.446502685546875, 2.525390625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 4.0, 7.0, 12.0, 12.0, 11.0, 12.0, 21.0, 21.0, 23.0, 30.0, 33.0, 40.0, 34.0, 34.0, 37.0, 31.0, 33.0, 45.0, 34.0, 32.0, 40.0, 38.0, 41.0, 35.0, 35.0, 41.0, 33.0, 34.0, 30.0, 21.0, 16.0, 17.0, 29.0, 14.0, 10.0, 9.0, 7.0, 10.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0], "bins": [-6.29296875, -6.1163330078125, -5.939697265625, -5.7630615234375, -5.58642578125, -5.4097900390625, -5.233154296875, -5.0565185546875, -4.8798828125, -4.7032470703125, -4.526611328125, -4.3499755859375, -4.17333984375, -3.9967041015625, -3.820068359375, -3.6434326171875, -3.466796875, -3.2901611328125, -3.113525390625, -2.9368896484375, -2.76025390625, -2.5836181640625, -2.406982421875, -2.2303466796875, -2.0537109375, -1.8770751953125, -1.700439453125, -1.5238037109375, -1.34716796875, -1.1705322265625, -0.993896484375, -0.8172607421875, -0.640625, -0.4639892578125, -0.287353515625, -0.1107177734375, 0.06591796875, 0.2425537109375, 0.419189453125, 0.5958251953125, 0.7724609375, 0.9490966796875, 1.125732421875, 1.3023681640625, 1.47900390625, 1.6556396484375, 1.832275390625, 2.0089111328125, 2.185546875, 2.3621826171875, 2.538818359375, 2.7154541015625, 2.89208984375, 3.0687255859375, 3.245361328125, 3.4219970703125, 3.5986328125, 3.7752685546875, 3.951904296875, 4.1285400390625, 4.30517578125, 4.4818115234375, 4.658447265625, 4.8350830078125, 5.01171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 12.0, 12.0, 16.0, 21.0, 24.0, 35.0, 42.0, 64.0, 110.0, 114.0, 162.0, 185.0, 272.0, 341.0, 535.0, 739.0, 991.0, 1500.0, 2390.0, 3608.0, 5863.0, 9718.0, 17271.0, 33571.0, 72531.0, 181013.0, 362651.0, 195574.0, 77318.0, 35693.0, 18322.0, 10295.0, 5953.0, 3743.0, 2391.0, 1576.0, 1092.0, 779.0, 530.0, 387.0, 288.0, 217.0, 172.0, 127.0, 96.0, 56.0, 44.0, 28.0, 27.0, 23.0, 13.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.004360198974609375, -0.004230201244354248, -0.004100203514099121, -0.003970205783843994, -0.003840208053588867, -0.0037102103233337402, -0.0035802125930786133, -0.0034502148628234863, -0.0033202171325683594, -0.0031902194023132324, -0.0030602216720581055, -0.0029302239418029785, -0.0028002262115478516, -0.0026702284812927246, -0.0025402307510375977, -0.0024102330207824707, -0.0022802352905273438, -0.002150237560272217, -0.00202023983001709, -0.0018902420997619629, -0.001760244369506836, -0.001630246639251709, -0.001500248908996582, -0.001370251178741455, -0.0012402534484863281, -0.0011102557182312012, -0.0009802579879760742, -0.0008502602577209473, -0.0007202625274658203, -0.0005902647972106934, -0.0004602670669555664, -0.00033026933670043945, -0.0002002716064453125, -7.027387619018555e-05, 5.9723854064941406e-05, 0.00018972158432006836, 0.0003197193145751953, 0.00044971704483032227, 0.0005797147750854492, 0.0007097125053405762, 0.0008397102355957031, 0.0009697079658508301, 0.001099705696105957, 0.001229703426361084, 0.001359701156616211, 0.0014896988868713379, 0.0016196966171264648, 0.0017496943473815918, 0.0018796920776367188, 0.0020096898078918457, 0.0021396875381469727, 0.0022696852684020996, 0.0023996829986572266, 0.0025296807289123535, 0.0026596784591674805, 0.0027896761894226074, 0.0029196739196777344, 0.0030496716499328613, 0.0031796693801879883, 0.0033096671104431152, 0.003439664840698242, 0.003569662570953369, 0.003699660301208496, 0.003829658031463623, 0.00395965576171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 10.0, 4.0, 6.0, 9.0, 16.0, 17.0, 20.0, 37.0, 45.0, 48.0, 75.0, 51.0, 96.0, 69.0, 95.0, 54.0, 60.0, 82.0, 43.0, 35.0, 21.0, 28.0, 9.0, 14.0, 15.0, 16.0, 8.0, 1.0, 4.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-06, -4.147179424762726e-06, -4.002824425697327e-06, -3.8584694266319275e-06, -3.7141144275665283e-06, -3.569759428501129e-06, -3.42540442943573e-06, -3.281049430370331e-06, -3.1366944313049316e-06, -2.9923394322395325e-06, -2.8479844331741333e-06, -2.703629434108734e-06, -2.559274435043335e-06, -2.414919435977936e-06, -2.2705644369125366e-06, -2.1262094378471375e-06, -1.9818544387817383e-06, -1.8374994397163391e-06, -1.69314444065094e-06, -1.5487894415855408e-06, -1.4044344425201416e-06, -1.2600794434547424e-06, -1.1157244443893433e-06, -9.71369445323944e-07, -8.270144462585449e-07, -6.826594471931458e-07, -5.383044481277466e-07, -3.939494490623474e-07, -2.4959444999694824e-07, -1.0523945093154907e-07, 3.91155481338501e-08, 1.8347054719924927e-07, 3.2782554626464844e-07, 4.721805453300476e-07, 6.165355443954468e-07, 7.60890543460846e-07, 9.052455425262451e-07, 1.0496005415916443e-06, 1.1939555406570435e-06, 1.3383105397224426e-06, 1.4826655387878418e-06, 1.627020537853241e-06, 1.7713755369186401e-06, 1.9157305359840393e-06, 2.0600855350494385e-06, 2.2044405341148376e-06, 2.348795533180237e-06, 2.493150532245636e-06, 2.637505531311035e-06, 2.7818605303764343e-06, 2.9262155294418335e-06, 3.0705705285072327e-06, 3.214925527572632e-06, 3.359280526638031e-06, 3.50363552570343e-06, 3.6479905247688293e-06, 3.7923455238342285e-06, 3.936700522899628e-06, 4.081055521965027e-06, 4.225410521030426e-06, 4.369765520095825e-06, 4.514120519161224e-06, 4.6584755182266235e-06, 4.802830517292023e-06, 4.947185516357422e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 10.0, 13.0, 12.0, 30.0, 41.0, 59.0, 71.0, 103.0, 174.0, 199.0, 360.0, 540.0, 801.0, 1310.0, 2139.0, 3777.0, 7136.0, 15151.0, 35880.0, 100682.0, 341771.0, 360677.0, 106944.0, 37762.0, 15577.0, 7466.0, 3827.0, 2163.0, 1400.0, 810.0, 527.0, 372.0, 242.0, 176.0, 99.0, 82.0, 55.0, 36.0, 25.0, 13.0, 14.0, 2.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005779266357421875, -0.005604267120361328, -0.005429267883300781, -0.005254268646240234, -0.0050792694091796875, -0.004904270172119141, -0.004729270935058594, -0.004554271697998047, -0.0043792724609375, -0.004204273223876953, -0.004029273986816406, -0.0038542747497558594, -0.0036792755126953125, -0.0035042762756347656, -0.0033292770385742188, -0.003154277801513672, -0.002979278564453125, -0.002804279327392578, -0.0026292800903320312, -0.0024542808532714844, -0.0022792816162109375, -0.0021042823791503906, -0.0019292831420898438, -0.0017542839050292969, -0.00157928466796875, -0.0014042854309082031, -0.0012292861938476562, -0.0010542869567871094, -0.0008792877197265625, -0.0007042884826660156, -0.0005292892456054688, -0.0003542900085449219, -0.000179290771484375, -4.291534423828125e-06, 0.00017070770263671875, 0.0003457069396972656, 0.0005207061767578125, 0.0006957054138183594, 0.0008707046508789062, 0.0010457038879394531, 0.001220703125, 0.0013957023620605469, 0.0015707015991210938, 0.0017457008361816406, 0.0019207000732421875, 0.0020956993103027344, 0.0022706985473632812, 0.002445697784423828, 0.002620697021484375, 0.002795696258544922, 0.0029706954956054688, 0.0031456947326660156, 0.0033206939697265625, 0.0034956932067871094, 0.0036706924438476562, 0.003845691680908203, 0.00402069091796875, 0.004195690155029297, 0.004370689392089844, 0.004545688629150391, 0.0047206878662109375, 0.004895687103271484, 0.005070686340332031, 0.005245685577392578, 0.005420684814453125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 8.0, 7.0, 4.0, 12.0, 16.0, 24.0, 25.0, 35.0, 59.0, 82.0, 112.0, 114.0, 124.0, 82.0, 85.0, 54.0, 33.0, 34.0, 23.0, 17.0, 10.0, 8.0, 8.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0023288726806640625, -0.0022660642862319946, -0.0022032558917999268, -0.002140447497367859, -0.002077639102935791, -0.002014830708503723, -0.0019520223140716553, -0.0018892139196395874, -0.0018264055252075195, -0.0017635971307754517, -0.0017007887363433838, -0.001637980341911316, -0.001575171947479248, -0.0015123635530471802, -0.0014495551586151123, -0.0013867467641830444, -0.0013239383697509766, -0.0012611299753189087, -0.0011983215808868408, -0.001135513186454773, -0.001072704792022705, -0.0010098963975906372, -0.0009470880031585693, -0.0008842796087265015, -0.0008214712142944336, -0.0007586628198623657, -0.0006958544254302979, -0.00063304603099823, -0.0005702376365661621, -0.0005074292421340942, -0.00044462084770202637, -0.0003818124532699585, -0.0003190040588378906, -0.00025619566440582275, -0.00019338726997375488, -0.000130578875541687, -6.777048110961914e-05, -4.9620866775512695e-06, 5.78463077545166e-05, 0.00012065470218658447, 0.00018346309661865234, 0.0002462714910507202, 0.0003090798854827881, 0.00037188827991485596, 0.00043469667434692383, 0.0004975050687789917, 0.0005603134632110596, 0.0006231218576431274, 0.0006859302520751953, 0.0007487386465072632, 0.0008115470409393311, 0.0008743554353713989, 0.0009371638298034668, 0.0009999722242355347, 0.0010627806186676025, 0.0011255890130996704, 0.0011883974075317383, 0.0012512058019638062, 0.001314014196395874, 0.001376822590827942, 0.0014396309852600098, 0.0015024393796920776, 0.0015652477741241455, 0.0016280561685562134, 0.0016908645629882812]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 12.0, 10.0, 14.0, 25.0, 17.0, 34.0, 55.0, 53.0, 55.0, 83.0, 92.0, 110.0, 91.0, 76.0, 69.0, 51.0, 33.0, 22.0, 26.0, 12.0, 11.0, 11.0, 7.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.359190940856934, -11.998172760009766, -11.637155532836914, -11.276138305664062, -10.915120124816895, -10.554101943969727, -10.193084716796875, -9.832067489624023, -9.471049308776855, -9.110031127929688, -8.749013900756836, -8.387996673583984, -8.026978492736816, -7.665960788726807, -7.304943084716797, -6.943925380706787, -6.582907676696777, -6.221889972686768, -5.860872268676758, -5.499854564666748, -5.138836860656738, -4.7778191566467285, -4.416801452636719, -4.055783748626709, -3.694766044616699, -3.3337483406066895, -2.9727306365966797, -2.61171293258667, -2.25069522857666, -1.8896775245666504, -1.5286598205566406, -1.1676421165466309, -0.8066253662109375, -0.44560766220092773, -0.08458995819091797, 0.2764277458190918, 0.6374454498291016, 0.9984631538391113, 1.359480857849121, 1.7204985618591309, 2.0815162658691406, 2.4425339698791504, 2.80355167388916, 3.16456937789917, 3.5255870819091797, 3.8866047859191895, 4.247622489929199, 4.608640193939209, 4.969657897949219, 5.3306756019592285, 5.691693305969238, 6.052711009979248, 6.413728713989258, 6.774746417999268, 7.135764122009277, 7.496781826019287, 7.857799530029297, 8.218816757202148, 8.579834938049316, 8.940853118896484, 9.301870346069336, 9.662887573242188, 10.023905754089355, 10.384923934936523, 10.745941162109375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 7.0, 15.0, 12.0, 17.0, 24.0, 28.0, 21.0, 32.0, 40.0, 38.0, 33.0, 44.0, 34.0, 44.0, 41.0, 41.0, 24.0, 47.0, 44.0, 48.0, 37.0, 42.0, 34.0, 30.0, 24.0, 28.0, 20.0, 22.0, 25.0, 23.0, 16.0, 7.0, 11.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.806563377380371, -8.517349243164062, -8.228134155273438, -7.938919544219971, -7.649704933166504, -7.360490322113037, -7.07127571105957, -6.7820611000061035, -6.492846488952637, -6.20363187789917, -5.914417266845703, -5.625202655792236, -5.3359880447387695, -5.046773433685303, -4.757558822631836, -4.468344211578369, -4.179129600524902, -3.8899149894714355, -3.6007003784179688, -3.311485767364502, -3.022271156311035, -2.7330565452575684, -2.4438419342041016, -2.1546273231506348, -1.865412712097168, -1.5761981010437012, -1.2869834899902344, -0.9977688789367676, -0.7085542678833008, -0.419339656829834, -0.1301250457763672, 0.1590895652770996, 0.44830322265625, 0.7375178337097168, 1.0267324447631836, 1.3159470558166504, 1.6051616668701172, 1.894376277923584, 2.183590888977051, 2.4728055000305176, 2.7620201110839844, 3.051234722137451, 3.340449333190918, 3.6296639442443848, 3.9188785552978516, 4.208093166351318, 4.497307777404785, 4.786522388458252, 5.075736999511719, 5.3649516105651855, 5.654166221618652, 5.943380832672119, 6.232595443725586, 6.521810054779053, 6.8110246658325195, 7.100239276885986, 7.389453887939453, 7.67866849899292, 7.967883110046387, 8.257097244262695, 8.54631233215332, 8.835527420043945, 9.124741554260254, 9.413955688476562, 9.703170776367188]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 7.0, 13.0, 13.0, 23.0, 19.0, 38.0, 74.0, 106.0, 116.0, 194.0, 274.0, 439.0, 633.0, 930.0, 1438.0, 2340.0, 3584.0, 5711.0, 9007.0, 14337.0, 23027.0, 37795.0, 63604.0, 106437.0, 165770.0, 196704.0, 159477.0, 101109.0, 60121.0, 35771.0, 21992.0, 13532.0, 8665.0, 5352.0, 3465.0, 2215.0, 1427.0, 939.0, 661.0, 378.0, 257.0, 173.0, 117.0, 90.0, 62.0, 48.0, 25.0, 13.0, 7.0, 9.0, 7.0, 3.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.6849365234375, -12.268310546875, -11.8516845703125, -11.43505859375, -11.0184326171875, -10.601806640625, -10.1851806640625, -9.7685546875, -9.3519287109375, -8.935302734375, -8.5186767578125, -8.10205078125, -7.6854248046875, -7.268798828125, -6.8521728515625, -6.435546875, -6.0189208984375, -5.602294921875, -5.1856689453125, -4.76904296875, -4.3524169921875, -3.935791015625, -3.5191650390625, -3.1025390625, -2.6859130859375, -2.269287109375, -1.8526611328125, -1.43603515625, -1.0194091796875, -0.602783203125, -0.1861572265625, 0.23046875, 0.6470947265625, 1.063720703125, 1.4803466796875, 1.89697265625, 2.3135986328125, 2.730224609375, 3.1468505859375, 3.5634765625, 3.9801025390625, 4.396728515625, 4.8133544921875, 5.22998046875, 5.6466064453125, 6.063232421875, 6.4798583984375, 6.896484375, 7.3131103515625, 7.729736328125, 8.1463623046875, 8.56298828125, 8.9796142578125, 9.396240234375, 9.8128662109375, 10.2294921875, 10.6461181640625, 11.062744140625, 11.4793701171875, 11.89599609375, 12.3126220703125, 12.729248046875, 13.1458740234375, 13.5625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 5.0, 16.0, 20.0, 10.0, 22.0, 32.0, 18.0, 30.0, 41.0, 37.0, 29.0, 38.0, 44.0, 50.0, 24.0, 43.0, 37.0, 36.0, 37.0, 55.0, 45.0, 37.0, 36.0, 33.0, 26.0, 23.0, 20.0, 24.0, 29.0, 10.0, 19.0, 15.0, 10.0, 6.0, 10.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.9296875, -7.6634521484375, -7.397216796875, -7.1309814453125, -6.86474609375, -6.5985107421875, -6.332275390625, -6.0660400390625, -5.7998046875, -5.5335693359375, -5.267333984375, -5.0010986328125, -4.73486328125, -4.4686279296875, -4.202392578125, -3.9361572265625, -3.669921875, -3.4036865234375, -3.137451171875, -2.8712158203125, -2.60498046875, -2.3387451171875, -2.072509765625, -1.8062744140625, -1.5400390625, -1.2738037109375, -1.007568359375, -0.7413330078125, -0.47509765625, -0.2088623046875, 0.057373046875, 0.3236083984375, 0.58984375, 0.8560791015625, 1.122314453125, 1.3885498046875, 1.65478515625, 1.9210205078125, 2.187255859375, 2.4534912109375, 2.7197265625, 2.9859619140625, 3.252197265625, 3.5184326171875, 3.78466796875, 4.0509033203125, 4.317138671875, 4.5833740234375, 4.849609375, 5.1158447265625, 5.382080078125, 5.6483154296875, 5.91455078125, 6.1807861328125, 6.447021484375, 6.7132568359375, 6.9794921875, 7.2457275390625, 7.511962890625, 7.7781982421875, 8.04443359375, 8.3106689453125, 8.576904296875, 8.8431396484375, 9.109375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 19.0, 31.0, 32.0, 53.0, 78.0, 121.0, 212.0, 356.0, 522.0, 803.0, 1280.0, 1949.0, 2927.0, 4510.0, 6855.0, 10837.0, 16879.0, 26747.0, 43362.0, 71526.0, 116441.0, 171131.0, 188351.0, 144186.0, 91285.0, 55245.0, 34094.0, 20856.0, 13360.0, 8534.0, 5668.0, 3516.0, 2400.0, 1544.0, 1031.0, 626.0, 442.0, 263.0, 160.0, 123.0, 74.0, 43.0, 32.0, 16.0, 12.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -12.998046875, -12.58203125, -12.166015625, -11.75, -11.333984375, -10.91796875, -10.501953125, -10.0859375, -9.669921875, -9.25390625, -8.837890625, -8.421875, -8.005859375, -7.58984375, -7.173828125, -6.7578125, -6.341796875, -5.92578125, -5.509765625, -5.09375, -4.677734375, -4.26171875, -3.845703125, -3.4296875, -3.013671875, -2.59765625, -2.181640625, -1.765625, -1.349609375, -0.93359375, -0.517578125, -0.1015625, 0.314453125, 0.73046875, 1.146484375, 1.5625, 1.978515625, 2.39453125, 2.810546875, 3.2265625, 3.642578125, 4.05859375, 4.474609375, 4.890625, 5.306640625, 5.72265625, 6.138671875, 6.5546875, 6.970703125, 7.38671875, 7.802734375, 8.21875, 8.634765625, 9.05078125, 9.466796875, 9.8828125, 10.298828125, 10.71484375, 11.130859375, 11.546875, 11.962890625, 12.37890625, 12.794921875, 13.2109375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 7.0, 8.0, 13.0, 14.0, 14.0, 20.0, 22.0, 20.0, 18.0, 25.0, 34.0, 33.0, 39.0, 39.0, 32.0, 44.0, 41.0, 45.0, 41.0, 41.0, 41.0, 37.0, 33.0, 41.0, 39.0, 39.0, 28.0, 28.0, 22.0, 30.0, 19.0, 17.0, 6.0, 14.0, 12.0, 6.0, 10.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.63720703125, -4.4658203125, -4.29443359375, -4.123046875, -3.95166015625, -3.7802734375, -3.60888671875, -3.4375, -3.26611328125, -3.0947265625, -2.92333984375, -2.751953125, -2.58056640625, -2.4091796875, -2.23779296875, -2.06640625, -1.89501953125, -1.7236328125, -1.55224609375, -1.380859375, -1.20947265625, -1.0380859375, -0.86669921875, -0.6953125, -0.52392578125, -0.3525390625, -0.18115234375, -0.009765625, 0.16162109375, 0.3330078125, 0.50439453125, 0.67578125, 0.84716796875, 1.0185546875, 1.18994140625, 1.361328125, 1.53271484375, 1.7041015625, 1.87548828125, 2.046875, 2.21826171875, 2.3896484375, 2.56103515625, 2.732421875, 2.90380859375, 3.0751953125, 3.24658203125, 3.41796875, 3.58935546875, 3.7607421875, 3.93212890625, 4.103515625, 4.27490234375, 4.4462890625, 4.61767578125, 4.7890625, 4.96044921875, 5.1318359375, 5.30322265625, 5.474609375, 5.64599609375, 5.8173828125, 5.98876953125, 6.16015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 10.0, 20.0, 15.0, 23.0, 36.0, 49.0, 78.0, 110.0, 157.0, 247.0, 353.0, 563.0, 824.0, 1278.0, 1859.0, 3062.0, 4858.0, 7820.0, 13262.0, 23873.0, 46271.0, 108445.0, 331365.0, 305041.0, 99491.0, 43654.0, 22694.0, 12585.0, 7508.0, 4612.0, 2898.0, 1902.0, 1182.0, 816.0, 493.0, 380.0, 232.0, 169.0, 101.0, 76.0, 48.0, 26.0, 21.0, 14.0, 9.0, 8.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-2.677734375, -2.598876953125, -2.52001953125, -2.441162109375, -2.3623046875, -2.283447265625, -2.20458984375, -2.125732421875, -2.046875, -1.968017578125, -1.88916015625, -1.810302734375, -1.7314453125, -1.652587890625, -1.57373046875, -1.494873046875, -1.416015625, -1.337158203125, -1.25830078125, -1.179443359375, -1.1005859375, -1.021728515625, -0.94287109375, -0.864013671875, -0.78515625, -0.706298828125, -0.62744140625, -0.548583984375, -0.4697265625, -0.390869140625, -0.31201171875, -0.233154296875, -0.154296875, -0.075439453125, 0.00341796875, 0.082275390625, 0.1611328125, 0.239990234375, 0.31884765625, 0.397705078125, 0.4765625, 0.555419921875, 0.63427734375, 0.713134765625, 0.7919921875, 0.870849609375, 0.94970703125, 1.028564453125, 1.107421875, 1.186279296875, 1.26513671875, 1.343994140625, 1.4228515625, 1.501708984375, 1.58056640625, 1.659423828125, 1.73828125, 1.817138671875, 1.89599609375, 1.974853515625, 2.0537109375, 2.132568359375, 2.21142578125, 2.290283203125, 2.369140625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 19.0, 16.0, 20.0, 25.0, 31.0, 50.0, 43.0, 51.0, 59.0, 59.0, 64.0, 58.0, 63.0, 68.0, 54.0, 65.0, 39.0, 28.0, 27.0, 23.0, 18.0, 19.0, 16.0, 8.0, 8.0, 3.0, 4.0, 7.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.679794311523438e-05, -9.389221668243408e-05, -9.098649024963379e-05, -8.80807638168335e-05, -8.51750373840332e-05, -8.226931095123291e-05, -7.936358451843262e-05, -7.645785808563232e-05, -7.355213165283203e-05, -7.064640522003174e-05, -6.774067878723145e-05, -6.483495235443115e-05, -6.192922592163086e-05, -5.9023499488830566e-05, -5.6117773056030273e-05, -5.321204662322998e-05, -5.030632019042969e-05, -4.7400593757629395e-05, -4.44948673248291e-05, -4.158914089202881e-05, -3.8683414459228516e-05, -3.577768802642822e-05, -3.287196159362793e-05, -2.9966235160827637e-05, -2.7060508728027344e-05, -2.415478229522705e-05, -2.1249055862426758e-05, -1.8343329429626465e-05, -1.5437602996826172e-05, -1.2531876564025879e-05, -9.626150131225586e-06, -6.720423698425293e-06, -3.814697265625e-06, -9.08970832824707e-07, 1.996755599975586e-06, 4.902482032775879e-06, 7.808208465576172e-06, 1.0713934898376465e-05, 1.3619661331176758e-05, 1.652538776397705e-05, 1.9431114196777344e-05, 2.2336840629577637e-05, 2.524256706237793e-05, 2.8148293495178223e-05, 3.1054019927978516e-05, 3.395974636077881e-05, 3.68654727935791e-05, 3.9771199226379395e-05, 4.267692565917969e-05, 4.558265209197998e-05, 4.8488378524780273e-05, 5.1394104957580566e-05, 5.429983139038086e-05, 5.720555782318115e-05, 6.0111284255981445e-05, 6.301701068878174e-05, 6.592273712158203e-05, 6.882846355438232e-05, 7.173418998718262e-05, 7.463991641998291e-05, 7.75456428527832e-05, 8.04513692855835e-05, 8.335709571838379e-05, 8.626282215118408e-05, 8.916854858398438e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 9.0, 19.0, 21.0, 25.0, 58.0, 60.0, 108.0, 174.0, 244.0, 370.0, 608.0, 887.0, 1358.0, 2229.0, 3572.0, 5886.0, 9882.0, 17597.0, 33070.0, 68154.0, 173391.0, 393002.0, 187044.0, 71383.0, 34882.0, 18175.0, 10192.0, 6056.0, 3644.0, 2282.0, 1477.0, 968.0, 563.0, 409.0, 263.0, 175.0, 109.0, 71.0, 47.0, 22.0, 21.0, 15.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.5078125, -2.43072509765625, -2.3536376953125, -2.27655029296875, -2.199462890625, -2.12237548828125, -2.0452880859375, -1.96820068359375, -1.89111328125, -1.81402587890625, -1.7369384765625, -1.65985107421875, -1.582763671875, -1.50567626953125, -1.4285888671875, -1.35150146484375, -1.2744140625, -1.19732666015625, -1.1202392578125, -1.04315185546875, -0.966064453125, -0.88897705078125, -0.8118896484375, -0.73480224609375, -0.65771484375, -0.58062744140625, -0.5035400390625, -0.42645263671875, -0.349365234375, -0.27227783203125, -0.1951904296875, -0.11810302734375, -0.041015625, 0.03607177734375, 0.1131591796875, 0.19024658203125, 0.267333984375, 0.34442138671875, 0.4215087890625, 0.49859619140625, 0.57568359375, 0.65277099609375, 0.7298583984375, 0.80694580078125, 0.884033203125, 0.96112060546875, 1.0382080078125, 1.11529541015625, 1.1923828125, 1.26947021484375, 1.3465576171875, 1.42364501953125, 1.500732421875, 1.57781982421875, 1.6549072265625, 1.73199462890625, 1.80908203125, 1.88616943359375, 1.9632568359375, 2.04034423828125, 2.117431640625, 2.19451904296875, 2.2716064453125, 2.34869384765625, 2.42578125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 10.0, 6.0, 13.0, 11.0, 15.0, 21.0, 32.0, 21.0, 44.0, 49.0, 41.0, 41.0, 63.0, 72.0, 61.0, 68.0, 56.0, 52.0, 49.0, 41.0, 38.0, 38.0, 13.0, 27.0, 16.0, 15.0, 11.0, 11.0, 4.0, 10.0, 13.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.70068359375, -0.6751251220703125, -0.649566650390625, -0.6240081787109375, -0.59844970703125, -0.5728912353515625, -0.547332763671875, -0.5217742919921875, -0.4962158203125, -0.4706573486328125, -0.445098876953125, -0.4195404052734375, -0.39398193359375, -0.3684234619140625, -0.342864990234375, -0.3173065185546875, -0.291748046875, -0.2661895751953125, -0.240631103515625, -0.2150726318359375, -0.18951416015625, -0.1639556884765625, -0.138397216796875, -0.1128387451171875, -0.0872802734375, -0.0617218017578125, -0.036163330078125, -0.0106048583984375, 0.01495361328125, 0.0405120849609375, 0.066070556640625, 0.0916290283203125, 0.1171875, 0.1427459716796875, 0.168304443359375, 0.1938629150390625, 0.21942138671875, 0.2449798583984375, 0.270538330078125, 0.2960968017578125, 0.3216552734375, 0.3472137451171875, 0.372772216796875, 0.3983306884765625, 0.42388916015625, 0.4494476318359375, 0.475006103515625, 0.5005645751953125, 0.526123046875, 0.5516815185546875, 0.577239990234375, 0.6027984619140625, 0.62835693359375, 0.6539154052734375, 0.679473876953125, 0.7050323486328125, 0.7305908203125, 0.7561492919921875, 0.781707763671875, 0.8072662353515625, 0.83282470703125, 0.8583831787109375, 0.883941650390625, 0.9095001220703125, 0.93505859375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 11.0, 17.0, 18.0, 30.0, 27.0, 43.0, 48.0, 57.0, 67.0, 90.0, 102.0, 87.0, 71.0, 61.0, 58.0, 46.0, 38.0, 24.0, 22.0, 16.0, 12.0, 6.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.092114448547363, -9.752225875854492, -9.412338256835938, -9.072449684143066, -8.732561111450195, -8.392672538757324, -8.052783966064453, -7.712896347045898, -7.373007774353027, -7.033119201660156, -6.693231105804443, -6.3533430099487305, -6.013454437255859, -5.673565864562988, -5.333677768707275, -4.9937896728515625, -4.653901100158691, -4.31401252746582, -3.9741244316101074, -3.6342360973358154, -3.2943477630615234, -2.9544594287872314, -2.6145710945129395, -2.2746827602386475, -1.9347944259643555, -1.5949060916900635, -1.2550177574157715, -0.9151294231414795, -0.5752410888671875, -0.2353527545928955, 0.10453557968139648, 0.4444239139556885, 0.7843132019042969, 1.1242015361785889, 1.4640898704528809, 1.8039782047271729, 2.143866539001465, 2.483754873275757, 2.823643207550049, 3.163531541824341, 3.503419876098633, 3.843308210372925, 4.183196544647217, 4.52308464050293, 4.862973213195801, 5.202861785888672, 5.542749881744385, 5.882637977600098, 6.222526550292969, 6.56241512298584, 6.902303218841553, 7.242191314697266, 7.582079887390137, 7.921968460083008, 8.261856079101562, 8.601744651794434, 8.941633224487305, 9.281521797180176, 9.621410369873047, 9.961297988891602, 10.301186561584473, 10.641075134277344, 10.980962753295898, 11.32085132598877, 11.66073989868164]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 5.0, 10.0, 17.0, 10.0, 21.0, 17.0, 22.0, 30.0, 23.0, 31.0, 31.0, 36.0, 32.0, 38.0, 27.0, 37.0, 45.0, 45.0, 33.0, 30.0, 33.0, 43.0, 30.0, 34.0, 26.0, 35.0, 25.0, 35.0, 24.0, 20.0, 16.0, 19.0, 21.0, 10.0, 15.0, 12.0, 13.0, 8.0, 6.0, 6.0, 10.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-8.51307487487793, -8.24659252166748, -7.980109214782715, -7.713626384735107, -7.4471435546875, -7.180661201477051, -6.914178371429443, -6.647695541381836, -6.3812127113342285, -6.114729881286621, -5.848247051239014, -5.581764221191406, -5.315281867980957, -5.048798561096191, -4.782316207885742, -4.515833377838135, -4.249350547790527, -3.98286771774292, -3.7163848876953125, -3.449902296066284, -3.1834194660186768, -2.9169366359710693, -2.650454044342041, -2.3839712142944336, -2.117488384246826, -1.8510055541992188, -1.5845228433609009, -1.318040132522583, -1.0515573024749756, -0.7850744724273682, -0.5185917615890503, -0.2521090507507324, 0.014372825622558594, 0.28085559606552124, 0.5473383665084839, 0.8138211369514465, 1.0803039073944092, 1.3467867374420166, 1.6132694482803345, 1.8797521591186523, 2.1462349891662598, 2.412717819213867, 2.6792006492614746, 2.945683240890503, 3.2121660709381104, 3.4786489009857178, 3.745131492614746, 4.0116143226623535, 4.278097152709961, 4.544579982757568, 4.811062812805176, 5.077545642852783, 5.344028472900391, 5.61051082611084, 5.876993656158447, 6.143476486206055, 6.409959316253662, 6.6764421463012695, 6.942924976348877, 7.209407806396484, 7.475890159606934, 7.742373466491699, 8.008855819702148, 8.275339126586914, 8.541821479797363]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 14.0, 19.0, 28.0, 45.0, 72.0, 91.0, 170.0, 229.0, 398.0, 574.0, 820.0, 1279.0, 1929.0, 2983.0, 4411.0, 6824.0, 10640.0, 16715.0, 26711.0, 43314.0, 72768.0, 131096.0, 286071.0, 830839.0, 1428478.0, 765480.0, 258326.0, 120590.0, 68887.0, 41324.0, 25512.0, 16275.0, 10631.0, 6820.0, 4455.0, 3227.0, 2024.0, 1333.0, 904.0, 639.0, 413.0, 307.0, 191.0, 145.0, 92.0, 76.0, 36.0, 30.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0], "bins": [-11.6015625, -11.244140625, -10.88671875, -10.529296875, -10.171875, -9.814453125, -9.45703125, -9.099609375, -8.7421875, -8.384765625, -8.02734375, -7.669921875, -7.3125, -6.955078125, -6.59765625, -6.240234375, -5.8828125, -5.525390625, -5.16796875, -4.810546875, -4.453125, -4.095703125, -3.73828125, -3.380859375, -3.0234375, -2.666015625, -2.30859375, -1.951171875, -1.59375, -1.236328125, -0.87890625, -0.521484375, -0.1640625, 0.193359375, 0.55078125, 0.908203125, 1.265625, 1.623046875, 1.98046875, 2.337890625, 2.6953125, 3.052734375, 3.41015625, 3.767578125, 4.125, 4.482421875, 4.83984375, 5.197265625, 5.5546875, 5.912109375, 6.26953125, 6.626953125, 6.984375, 7.341796875, 7.69921875, 8.056640625, 8.4140625, 8.771484375, 9.12890625, 9.486328125, 9.84375, 10.201171875, 10.55859375, 10.916015625, 11.2734375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 1.0, 5.0, 15.0, 11.0, 13.0, 10.0, 16.0, 20.0, 21.0, 28.0, 26.0, 33.0, 19.0, 29.0, 37.0, 30.0, 38.0, 55.0, 38.0, 26.0, 46.0, 34.0, 33.0, 33.0, 37.0, 38.0, 34.0, 22.0, 30.0, 32.0, 26.0, 25.0, 22.0, 20.0, 17.0, 15.0, 11.0, 15.0, 8.0, 11.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.41796875, -7.1846923828125, -6.951416015625, -6.7181396484375, -6.48486328125, -6.2515869140625, -6.018310546875, -5.7850341796875, -5.5517578125, -5.3184814453125, -5.085205078125, -4.8519287109375, -4.61865234375, -4.3853759765625, -4.152099609375, -3.9188232421875, -3.685546875, -3.4522705078125, -3.218994140625, -2.9857177734375, -2.75244140625, -2.5191650390625, -2.285888671875, -2.0526123046875, -1.8193359375, -1.5860595703125, -1.352783203125, -1.1195068359375, -0.88623046875, -0.6529541015625, -0.419677734375, -0.1864013671875, 0.046875, 0.2801513671875, 0.513427734375, 0.7467041015625, 0.97998046875, 1.2132568359375, 1.446533203125, 1.6798095703125, 1.9130859375, 2.1463623046875, 2.379638671875, 2.6129150390625, 2.84619140625, 3.0794677734375, 3.312744140625, 3.5460205078125, 3.779296875, 4.0125732421875, 4.245849609375, 4.4791259765625, 4.71240234375, 4.9456787109375, 5.178955078125, 5.4122314453125, 5.6455078125, 5.8787841796875, 6.112060546875, 6.3453369140625, 6.57861328125, 6.8118896484375, 7.045166015625, 7.2784423828125, 7.51171875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 3.0, 5.0, 3.0, 7.0, 20.0, 21.0, 44.0, 62.0, 97.0, 134.0, 183.0, 246.0, 363.0, 585.0, 901.0, 1279.0, 1995.0, 3063.0, 4575.0, 7312.0, 11550.0, 19406.0, 32415.0, 55059.0, 97948.0, 178728.0, 341916.0, 717864.0, 1275546.0, 700064.0, 334918.0, 174688.0, 96034.0, 54416.0, 31690.0, 19107.0, 11590.0, 7245.0, 4439.0, 2926.0, 1927.0, 1342.0, 783.0, 564.0, 375.0, 267.0, 198.0, 128.0, 87.0, 68.0, 31.0, 24.0, 14.0, 10.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-10.0, -9.682373046875, -9.36474609375, -9.047119140625, -8.7294921875, -8.411865234375, -8.09423828125, -7.776611328125, -7.458984375, -7.141357421875, -6.82373046875, -6.506103515625, -6.1884765625, -5.870849609375, -5.55322265625, -5.235595703125, -4.91796875, -4.600341796875, -4.28271484375, -3.965087890625, -3.6474609375, -3.329833984375, -3.01220703125, -2.694580078125, -2.376953125, -2.059326171875, -1.74169921875, -1.424072265625, -1.1064453125, -0.788818359375, -0.47119140625, -0.153564453125, 0.1640625, 0.481689453125, 0.79931640625, 1.116943359375, 1.4345703125, 1.752197265625, 2.06982421875, 2.387451171875, 2.705078125, 3.022705078125, 3.34033203125, 3.657958984375, 3.9755859375, 4.293212890625, 4.61083984375, 4.928466796875, 5.24609375, 5.563720703125, 5.88134765625, 6.198974609375, 6.5166015625, 6.834228515625, 7.15185546875, 7.469482421875, 7.787109375, 8.104736328125, 8.42236328125, 8.739990234375, 9.0576171875, 9.375244140625, 9.69287109375, 10.010498046875, 10.328125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 11.0, 6.0, 8.0, 17.0, 16.0, 20.0, 18.0, 36.0, 35.0, 59.0, 52.0, 94.0, 81.0, 109.0, 117.0, 152.0, 205.0, 218.0, 261.0, 331.0, 383.0, 359.0, 254.0, 225.0, 185.0, 147.0, 127.0, 104.0, 91.0, 74.0, 42.0, 48.0, 46.0, 44.0, 15.0, 12.0, 11.0, 12.0, 10.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.27734375, -4.14556884765625, -4.0137939453125, -3.88201904296875, -3.750244140625, -3.61846923828125, -3.4866943359375, -3.35491943359375, -3.22314453125, -3.09136962890625, -2.9595947265625, -2.82781982421875, -2.696044921875, -2.56427001953125, -2.4324951171875, -2.30072021484375, -2.1689453125, -2.03717041015625, -1.9053955078125, -1.77362060546875, -1.641845703125, -1.51007080078125, -1.3782958984375, -1.24652099609375, -1.11474609375, -0.98297119140625, -0.8511962890625, -0.71942138671875, -0.587646484375, -0.45587158203125, -0.3240966796875, -0.19232177734375, -0.060546875, 0.07122802734375, 0.2030029296875, 0.33477783203125, 0.466552734375, 0.59832763671875, 0.7301025390625, 0.86187744140625, 0.99365234375, 1.12542724609375, 1.2572021484375, 1.38897705078125, 1.520751953125, 1.65252685546875, 1.7843017578125, 1.91607666015625, 2.0478515625, 2.17962646484375, 2.3114013671875, 2.44317626953125, 2.574951171875, 2.70672607421875, 2.8385009765625, 2.97027587890625, 3.10205078125, 3.23382568359375, 3.3656005859375, 3.49737548828125, 3.629150390625, 3.76092529296875, 3.8927001953125, 4.02447509765625, 4.15625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 4.0, 5.0, 9.0, 8.0, 15.0, 11.0, 18.0, 22.0, 16.0, 29.0, 37.0, 37.0, 55.0, 59.0, 65.0, 66.0, 87.0, 77.0, 72.0, 55.0, 44.0, 37.0, 27.0, 25.0, 24.0, 19.0, 15.0, 9.0, 7.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.999770164489746, -8.709814071655273, -8.4198579788208, -8.129901885986328, -7.839945316314697, -7.549988746643066, -7.260032653808594, -6.970076560974121, -6.680120468139648, -6.390164375305176, -6.100207805633545, -5.810251712799072, -5.5202956199646, -5.230339050292969, -4.940382957458496, -4.650426864624023, -4.360470294952393, -4.07051420211792, -3.780557870864868, -3.4906015396118164, -3.2006454467773438, -2.910689115524292, -2.6207327842712402, -2.3307766914367676, -2.040820360183716, -1.7508641481399536, -1.4609079360961914, -1.1709516048431396, -0.8809953927993774, -0.5910391807556152, -0.3010828495025635, -0.01112675666809082, 0.27882957458496094, 0.5687857866287231, 0.8587420582771301, 1.148698329925537, 1.4386545419692993, 1.7286107540130615, 2.0185670852661133, 2.308523178100586, 2.5984795093536377, 2.8884358406066895, 3.178391933441162, 3.468348264694214, 3.7583045959472656, 4.048260688781738, 4.338216781616211, 4.628172874450684, 4.9181294441223145, 5.208085536956787, 5.498042106628418, 5.787998199462891, 6.077954292297363, 6.367910385131836, 6.657866954803467, 6.9478230476379395, 7.23777961730957, 7.527735710144043, 7.817692279815674, 8.107648849487305, 8.397604942321777, 8.68756103515625, 8.977517127990723, 9.267473220825195, 9.557429313659668]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 9.0, 10.0, 6.0, 15.0, 16.0, 13.0, 16.0, 27.0, 33.0, 26.0, 20.0, 29.0, 31.0, 41.0, 35.0, 35.0, 47.0, 52.0, 33.0, 31.0, 27.0, 37.0, 18.0, 41.0, 37.0, 39.0, 23.0, 33.0, 29.0, 25.0, 21.0, 23.0, 22.0, 18.0, 15.0, 16.0, 11.0, 10.0, 6.0, 2.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.155181884765625, -7.882974147796631, -7.610766887664795, -7.338559150695801, -7.066351413726807, -6.7941436767578125, -6.521936416625977, -6.249728679656982, -5.977520942687988, -5.705313205718994, -5.433105945587158, -5.160898208618164, -4.88869047164917, -4.616482734680176, -4.34427547454834, -4.072067737579346, -3.7998604774475098, -3.5276529788970947, -3.2554452419281006, -2.9832377433776855, -2.7110300064086914, -2.4388225078582764, -2.1666150093078613, -1.8944073915481567, -1.6221997737884521, -1.3499921560287476, -1.077784538269043, -0.8055770397186279, -0.5333694219589233, -0.26116180419921875, 0.011045694351196289, 0.2832533121109009, 0.5554609298706055, 0.8276685476303101, 1.0998761653900146, 1.3720836639404297, 1.6442912817001343, 1.9164988994598389, 2.188706398010254, 2.460914134979248, 2.733121633529663, 3.005329132080078, 3.2775368690490723, 3.5497443675994873, 3.8219518661499023, 4.0941596031188965, 4.366367340087891, 4.638574600219727, 4.910782337188721, 5.182990074157715, 5.455197334289551, 5.727405071258545, 5.999612808227539, 6.271820068359375, 6.544027805328369, 6.816235542297363, 7.088442802429199, 7.360650539398193, 7.632857799530029, 7.905065536499023, 8.17727279663086, 8.449481010437012, 8.721688270568848, 8.993895530700684, 9.266103744506836]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 10.0, 10.0, 16.0, 14.0, 26.0, 54.0, 74.0, 108.0, 134.0, 263.0, 420.0, 626.0, 992.0, 1720.0, 2670.0, 4510.0, 7329.0, 12017.0, 19657.0, 31652.0, 54538.0, 101286.0, 224013.0, 304670.0, 122941.0, 64127.0, 36900.0, 22274.0, 13690.0, 8350.0, 5181.0, 3150.0, 1905.0, 1211.0, 762.0, 460.0, 280.0, 176.0, 116.0, 58.0, 50.0, 42.0, 24.0, 19.0, 9.0, 14.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.689453125, -2.60308837890625, -2.5167236328125, -2.43035888671875, -2.343994140625, -2.25762939453125, -2.1712646484375, -2.08489990234375, -1.99853515625, -1.91217041015625, -1.8258056640625, -1.73944091796875, -1.653076171875, -1.56671142578125, -1.4803466796875, -1.39398193359375, -1.3076171875, -1.22125244140625, -1.1348876953125, -1.04852294921875, -0.962158203125, -0.87579345703125, -0.7894287109375, -0.70306396484375, -0.61669921875, -0.53033447265625, -0.4439697265625, -0.35760498046875, -0.271240234375, -0.18487548828125, -0.0985107421875, -0.01214599609375, 0.07421875, 0.16058349609375, 0.2469482421875, 0.33331298828125, 0.419677734375, 0.50604248046875, 0.5924072265625, 0.67877197265625, 0.76513671875, 0.85150146484375, 0.9378662109375, 1.02423095703125, 1.110595703125, 1.19696044921875, 1.2833251953125, 1.36968994140625, 1.4560546875, 1.54241943359375, 1.6287841796875, 1.71514892578125, 1.801513671875, 1.88787841796875, 1.9742431640625, 2.06060791015625, 2.14697265625, 2.23333740234375, 2.3197021484375, 2.40606689453125, 2.492431640625, 2.57879638671875, 2.6651611328125, 2.75152587890625, 2.837890625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 13.0, 15.0, 12.0, 23.0, 22.0, 21.0, 22.0, 32.0, 32.0, 29.0, 24.0, 40.0, 47.0, 41.0, 44.0, 36.0, 39.0, 26.0, 40.0, 29.0, 37.0, 39.0, 39.0, 30.0, 34.0, 31.0, 23.0, 22.0, 16.0, 24.0, 19.0, 18.0, 13.0, 7.0, 9.0, 11.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5369873046875, -8.253662109375, -7.9703369140625, -7.68701171875, -7.4036865234375, -7.120361328125, -6.8370361328125, -6.5537109375, -6.2703857421875, -5.987060546875, -5.7037353515625, -5.42041015625, -5.1370849609375, -4.853759765625, -4.5704345703125, -4.287109375, -4.0037841796875, -3.720458984375, -3.4371337890625, -3.15380859375, -2.8704833984375, -2.587158203125, -2.3038330078125, -2.0205078125, -1.7371826171875, -1.453857421875, -1.1705322265625, -0.88720703125, -0.6038818359375, -0.320556640625, -0.0372314453125, 0.24609375, 0.5294189453125, 0.812744140625, 1.0960693359375, 1.37939453125, 1.6627197265625, 1.946044921875, 2.2293701171875, 2.5126953125, 2.7960205078125, 3.079345703125, 3.3626708984375, 3.64599609375, 3.9293212890625, 4.212646484375, 4.4959716796875, 4.779296875, 5.0626220703125, 5.345947265625, 5.6292724609375, 5.91259765625, 6.1959228515625, 6.479248046875, 6.7625732421875, 7.0458984375, 7.3292236328125, 7.612548828125, 7.8958740234375, 8.17919921875, 8.4625244140625, 8.745849609375, 9.0291748046875, 9.3125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 2.0, 13.0, 7.0, 8.0, 26.0, 26.0, 44.0, 53.0, 73.0, 128.0, 134.0, 203.0, 295.0, 396.0, 551.0, 734.0, 1029.0, 1506.0, 2077.0, 2994.0, 4305.0, 6565.0, 9428.0, 14544.0, 22766.0, 36365.0, 60520.0, 108151.0, 279586.0, 237950.0, 100670.0, 57454.0, 34527.0, 21575.0, 14152.0, 9223.0, 6306.0, 4145.0, 2873.0, 2032.0, 1442.0, 1014.0, 710.0, 528.0, 366.0, 290.0, 212.0, 155.0, 119.0, 83.0, 56.0, 36.0, 35.0, 28.0, 16.0, 18.0, 9.0, 5.0, 5.0, 3.0, 3.0], "bins": [-2.419921875, -2.34417724609375, -2.2684326171875, -2.19268798828125, -2.116943359375, -2.04119873046875, -1.9654541015625, -1.88970947265625, -1.81396484375, -1.73822021484375, -1.6624755859375, -1.58673095703125, -1.510986328125, -1.43524169921875, -1.3594970703125, -1.28375244140625, -1.2080078125, -1.13226318359375, -1.0565185546875, -0.98077392578125, -0.905029296875, -0.82928466796875, -0.7535400390625, -0.67779541015625, -0.60205078125, -0.52630615234375, -0.4505615234375, -0.37481689453125, -0.299072265625, -0.22332763671875, -0.1475830078125, -0.07183837890625, 0.00390625, 0.07965087890625, 0.1553955078125, 0.23114013671875, 0.306884765625, 0.38262939453125, 0.4583740234375, 0.53411865234375, 0.60986328125, 0.68560791015625, 0.7613525390625, 0.83709716796875, 0.912841796875, 0.98858642578125, 1.0643310546875, 1.14007568359375, 1.2158203125, 1.29156494140625, 1.3673095703125, 1.44305419921875, 1.518798828125, 1.59454345703125, 1.6702880859375, 1.74603271484375, 1.82177734375, 1.89752197265625, 1.9732666015625, 2.04901123046875, 2.124755859375, 2.20050048828125, 2.2762451171875, 2.35198974609375, 2.427734375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 9.0, 6.0, 6.0, 7.0, 12.0, 15.0, 8.0, 13.0, 12.0, 8.0, 21.0, 22.0, 29.0, 25.0, 40.0, 27.0, 33.0, 32.0, 48.0, 33.0, 49.0, 42.0, 47.0, 43.0, 34.0, 30.0, 39.0, 42.0, 32.0, 36.0, 25.0, 33.0, 17.0, 17.0, 21.0, 18.0, 9.0, 14.0, 7.0, 2.0, 7.0, 5.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.15625, -4.98101806640625, -4.8057861328125, -4.63055419921875, -4.455322265625, -4.28009033203125, -4.1048583984375, -3.92962646484375, -3.75439453125, -3.57916259765625, -3.4039306640625, -3.22869873046875, -3.053466796875, -2.87823486328125, -2.7030029296875, -2.52777099609375, -2.3525390625, -2.17730712890625, -2.0020751953125, -1.82684326171875, -1.651611328125, -1.47637939453125, -1.3011474609375, -1.12591552734375, -0.95068359375, -0.77545166015625, -0.6002197265625, -0.42498779296875, -0.249755859375, -0.07452392578125, 0.1007080078125, 0.27593994140625, 0.451171875, 0.62640380859375, 0.8016357421875, 0.97686767578125, 1.152099609375, 1.32733154296875, 1.5025634765625, 1.67779541015625, 1.85302734375, 2.02825927734375, 2.2034912109375, 2.37872314453125, 2.553955078125, 2.72918701171875, 2.9044189453125, 3.07965087890625, 3.2548828125, 3.43011474609375, 3.6053466796875, 3.78057861328125, 3.955810546875, 4.13104248046875, 4.3062744140625, 4.48150634765625, 4.65673828125, 4.83197021484375, 5.0072021484375, 5.18243408203125, 5.357666015625, 5.53289794921875, 5.7081298828125, 5.88336181640625, 6.05859375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 9.0, 7.0, 13.0, 19.0, 23.0, 34.0, 36.0, 51.0, 67.0, 97.0, 135.0, 217.0, 251.0, 391.0, 630.0, 1019.0, 1629.0, 2612.0, 4347.0, 7861.0, 14538.0, 29558.0, 66244.0, 166484.0, 372695.0, 218909.0, 83796.0, 36888.0, 17359.0, 9158.0, 5143.0, 3014.0, 1905.0, 1130.0, 744.0, 482.0, 302.0, 220.0, 164.0, 114.0, 65.0, 55.0, 36.0, 29.0, 20.0, 16.0, 15.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.004154205322265625, -0.004030704498291016, -0.003907203674316406, -0.003783702850341797, -0.0036602020263671875, -0.003536701202392578, -0.0034132003784179688, -0.0032896995544433594, -0.00316619873046875, -0.0030426979064941406, -0.0029191970825195312, -0.002795696258544922, -0.0026721954345703125, -0.002548694610595703, -0.0024251937866210938, -0.0023016929626464844, -0.002178192138671875, -0.0020546913146972656, -0.0019311904907226562, -0.0018076896667480469, -0.0016841888427734375, -0.0015606880187988281, -0.0014371871948242188, -0.0013136863708496094, -0.001190185546875, -0.0010666847229003906, -0.0009431838989257812, -0.0008196830749511719, -0.0006961822509765625, -0.0005726814270019531, -0.00044918060302734375, -0.0003256797790527344, -0.000202178955078125, -7.867813110351562e-05, 4.482269287109375e-05, 0.00016832351684570312, 0.0002918243408203125, 0.0004153251647949219, 0.0005388259887695312, 0.0006623268127441406, 0.00078582763671875, 0.0009093284606933594, 0.0010328292846679688, 0.0011563301086425781, 0.0012798309326171875, 0.0014033317565917969, 0.0015268325805664062, 0.0016503334045410156, 0.001773834228515625, 0.0018973350524902344, 0.0020208358764648438, 0.002144336700439453, 0.0022678375244140625, 0.002391338348388672, 0.0025148391723632812, 0.0026383399963378906, 0.0027618408203125, 0.0028853416442871094, 0.0030088424682617188, 0.003132343292236328, 0.0032558441162109375, 0.003379344940185547, 0.0035028457641601562, 0.0036263465881347656, 0.003749847412109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 11.0, 13.0, 18.0, 23.0, 27.0, 32.0, 38.0, 41.0, 53.0, 58.0, 55.0, 112.0, 66.0, 71.0, 58.0, 52.0, 33.0, 36.0, 46.0, 34.0, 22.0, 26.0, 13.0, 10.0, 4.0, 2.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.993511199951172e-06, -3.87243926525116e-06, -3.7513673305511475e-06, -3.6302953958511353e-06, -3.509223461151123e-06, -3.388151526451111e-06, -3.2670795917510986e-06, -3.1460076570510864e-06, -3.0249357223510742e-06, -2.903863787651062e-06, -2.78279185295105e-06, -2.6617199182510376e-06, -2.5406479835510254e-06, -2.419576048851013e-06, -2.298504114151001e-06, -2.1774321794509888e-06, -2.0563602447509766e-06, -1.9352883100509644e-06, -1.8142163753509521e-06, -1.69314444065094e-06, -1.5720725059509277e-06, -1.4510005712509155e-06, -1.3299286365509033e-06, -1.2088567018508911e-06, -1.087784767150879e-06, -9.667128324508667e-07, -8.456408977508545e-07, -7.245689630508423e-07, -6.034970283508301e-07, -4.824250936508179e-07, -3.6135315895080566e-07, -2.4028122425079346e-07, -1.1920928955078125e-07, 1.862645149230957e-09, 1.2293457984924316e-07, 2.4400651454925537e-07, 3.650784492492676e-07, 4.861503839492798e-07, 6.07222318649292e-07, 7.282942533493042e-07, 8.493661880493164e-07, 9.704381227493286e-07, 1.0915100574493408e-06, 1.212581992149353e-06, 1.3336539268493652e-06, 1.4547258615493774e-06, 1.5757977962493896e-06, 1.6968697309494019e-06, 1.817941665649414e-06, 1.9390136003494263e-06, 2.0600855350494385e-06, 2.1811574697494507e-06, 2.302229404449463e-06, 2.423301339149475e-06, 2.5443732738494873e-06, 2.6654452085494995e-06, 2.7865171432495117e-06, 2.907589077949524e-06, 3.028661012649536e-06, 3.1497329473495483e-06, 3.2708048820495605e-06, 3.3918768167495728e-06, 3.512948751449585e-06, 3.634020686149597e-06, 3.7550926208496094e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 21.0, 20.0, 27.0, 44.0, 72.0, 143.0, 170.0, 226.0, 307.0, 499.0, 732.0, 964.0, 1555.0, 2398.0, 3853.0, 5891.0, 9839.0, 17299.0, 31408.0, 62185.0, 131044.0, 286367.0, 255234.0, 114445.0, 55253.0, 28180.0, 15378.0, 9111.0, 5580.0, 3523.0, 2264.0, 1414.0, 1031.0, 636.0, 442.0, 296.0, 196.0, 162.0, 101.0, 81.0, 41.0, 29.0, 24.0, 21.0, 14.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0], "bins": [-0.003803253173828125, -0.0036943256855010986, -0.0035853981971740723, -0.003476470708847046, -0.0033675432205200195, -0.003258615732192993, -0.003149688243865967, -0.0030407607555389404, -0.002931833267211914, -0.0028229057788848877, -0.0027139782905578613, -0.002605050802230835, -0.0024961233139038086, -0.0023871958255767822, -0.002278268337249756, -0.0021693408489227295, -0.002060413360595703, -0.0019514858722686768, -0.0018425583839416504, -0.001733630895614624, -0.0016247034072875977, -0.0015157759189605713, -0.001406848430633545, -0.0012979209423065186, -0.0011889934539794922, -0.0010800659656524658, -0.0009711384773254395, -0.0008622109889984131, -0.0007532835006713867, -0.0006443560123443604, -0.000535428524017334, -0.0004265010356903076, -0.00031757354736328125, -0.00020864605903625488, -9.971857070922852e-05, 9.208917617797852e-06, 0.00011813640594482422, 0.00022706389427185059, 0.00033599138259887695, 0.0004449188709259033, 0.0005538463592529297, 0.0006627738475799561, 0.0007717013359069824, 0.0008806288242340088, 0.0009895563125610352, 0.0010984838008880615, 0.0012074112892150879, 0.0013163387775421143, 0.0014252662658691406, 0.001534193754196167, 0.0016431212425231934, 0.0017520487308502197, 0.001860976219177246, 0.0019699037075042725, 0.002078831195831299, 0.002187758684158325, 0.0022966861724853516, 0.002405613660812378, 0.0025145411491394043, 0.0026234686374664307, 0.002732396125793457, 0.0028413236141204834, 0.0029502511024475098, 0.003059178590774536, 0.0031681060791015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 10.0, 10.0, 6.0, 14.0, 8.0, 8.0, 15.0, 21.0, 33.0, 46.0, 43.0, 49.0, 87.0, 119.0, 106.0, 95.0, 82.0, 56.0, 42.0, 31.0, 23.0, 16.0, 15.0, 13.0, 13.0, 7.0, 8.0, 1.0, 2.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001590728759765625, -0.0015457719564437866, -0.0015008151531219482, -0.0014558583498001099, -0.0014109015464782715, -0.001365944743156433, -0.0013209879398345947, -0.0012760311365127563, -0.001231074333190918, -0.0011861175298690796, -0.0011411607265472412, -0.0010962039232254028, -0.0010512471199035645, -0.001006290316581726, -0.0009613335132598877, -0.0009163767099380493, -0.0008714199066162109, -0.0008264631032943726, -0.0007815062999725342, -0.0007365494966506958, -0.0006915926933288574, -0.000646635890007019, -0.0006016790866851807, -0.0005567222833633423, -0.0005117654800415039, -0.00046680867671966553, -0.00042185187339782715, -0.00037689507007598877, -0.0003319382667541504, -0.000286981463432312, -0.00024202466011047363, -0.00019706785678863525, -0.00015211105346679688, -0.0001071542501449585, -6.219744682312012e-05, -1.7240643501281738e-05, 2.771615982055664e-05, 7.267296314239502e-05, 0.0001176297664642334, 0.00016258656978607178, 0.00020754337310791016, 0.00025250017642974854, 0.0002974569797515869, 0.0003424137830734253, 0.00038737058639526367, 0.00043232738971710205, 0.00047728419303894043, 0.0005222409963607788, 0.0005671977996826172, 0.0006121546030044556, 0.0006571114063262939, 0.0007020682096481323, 0.0007470250129699707, 0.0007919818162918091, 0.0008369386196136475, 0.0008818954229354858, 0.0009268522262573242, 0.0009718090295791626, 0.001016765832901001, 0.0010617226362228394, 0.0011066794395446777, 0.0011516362428665161, 0.0011965930461883545, 0.0012415498495101929, 0.0012865066528320312]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 6.0, 5.0, 12.0, 15.0, 8.0, 20.0, 15.0, 19.0, 31.0, 32.0, 41.0, 45.0, 63.0, 65.0, 59.0, 88.0, 81.0, 74.0, 52.0, 44.0, 37.0, 31.0, 25.0, 22.0, 20.0, 21.0, 9.0, 7.0, 8.0, 11.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.897679328918457, -8.612547874450684, -8.327417373657227, -8.042285919189453, -7.757155418395996, -7.472023963928223, -7.186892986297607, -6.901762008666992, -6.616631031036377, -6.331500053405762, -6.0463690757751465, -5.761238098144531, -5.476106643676758, -5.190976142883301, -4.905844688415527, -4.620713710784912, -4.335582733154297, -4.050451755523682, -3.7653207778930664, -3.480189561843872, -3.195058584213257, -2.9099276065826416, -2.6247963905334473, -2.339665412902832, -2.054534435272217, -1.7694034576416016, -1.4842723608016968, -1.199141263961792, -0.9140102863311768, -0.6288793087005615, -0.34374821186065674, -0.05861711502075195, 0.22651290893554688, 0.5116439461708069, 0.7967749834060669, 1.0819060802459717, 1.367037057876587, 1.6521680355072021, 1.937299132347107, 2.2224302291870117, 2.507561206817627, 2.792692184448242, 3.0778231620788574, 3.3629543781280518, 3.648085355758667, 3.9332163333892822, 4.218347549438477, 4.503478527069092, 4.788609504699707, 5.073740482330322, 5.3588714599609375, 5.644002437591553, 5.929133415222168, 6.214264869689941, 6.499395847320557, 6.784526824951172, 7.069657802581787, 7.354788780212402, 7.639919757843018, 7.925050735473633, 8.210182189941406, 8.495312690734863, 8.780444145202637, 9.065574645996094, 9.350706100463867]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 10.0, 6.0, 15.0, 16.0, 13.0, 16.0, 27.0, 31.0, 28.0, 20.0, 27.0, 32.0, 42.0, 34.0, 35.0, 49.0, 49.0, 34.0, 32.0, 26.0, 37.0, 19.0, 42.0, 33.0, 42.0, 22.0, 33.0, 29.0, 26.0, 22.0, 22.0, 22.0, 18.0, 15.0, 17.0, 10.0, 10.0, 6.0, 2.0, 7.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.116678237915039, -7.845007419586182, -7.573336601257324, -7.301665306091309, -7.029994487762451, -6.758323669433594, -6.486652851104736, -6.214982032775879, -5.943310737609863, -5.671639919281006, -5.399969100952148, -5.128297805786133, -4.856626987457275, -4.584956169128418, -4.3132853507995605, -4.041614532470703, -3.7699437141418457, -3.4982728958129883, -3.2266018390655518, -2.9549310207366943, -2.683259963989258, -2.4115891456604004, -2.139918327331543, -1.868247389793396, -1.596576452255249, -1.324905514717102, -1.053234577178955, -0.7815637588500977, -0.5098928213119507, -0.2382218837738037, 0.03344893455505371, 0.3051198720932007, 0.5767908096313477, 0.8484617471694946, 1.1201326847076416, 1.391803503036499, 1.663474440574646, 1.935145378112793, 2.2068161964416504, 2.478487014770508, 2.7501580715179443, 3.0218288898468018, 3.2934999465942383, 3.5651707649230957, 3.836841583251953, 4.108512878417969, 4.380183219909668, 4.651854515075684, 4.923525333404541, 5.195196151733398, 5.466866970062256, 5.738537788391113, 6.010209083557129, 6.281879901885986, 6.553550720214844, 6.825221538543701, 7.096892356872559, 7.368563175201416, 7.640233993530273, 7.911905288696289, 8.183575630187988, 8.455246925354004, 8.726917266845703, 8.998588562011719, 9.270259857177734]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 21.0, 35.0, 35.0, 58.0, 70.0, 133.0, 219.0, 271.0, 373.0, 614.0, 864.0, 1206.0, 1856.0, 2710.0, 3739.0, 5673.0, 8111.0, 11939.0, 17232.0, 25423.0, 37945.0, 58145.0, 88503.0, 127278.0, 155479.0, 150715.0, 115211.0, 77906.0, 50793.0, 33701.0, 22868.0, 15374.0, 10510.0, 7309.0, 5111.0, 3488.0, 2386.0, 1633.0, 1114.0, 825.0, 541.0, 349.0, 241.0, 160.0, 113.0, 79.0, 61.0, 53.0, 18.0, 12.0, 16.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.90625, -10.552734375, -10.19921875, -9.845703125, -9.4921875, -9.138671875, -8.78515625, -8.431640625, -8.078125, -7.724609375, -7.37109375, -7.017578125, -6.6640625, -6.310546875, -5.95703125, -5.603515625, -5.25, -4.896484375, -4.54296875, -4.189453125, -3.8359375, -3.482421875, -3.12890625, -2.775390625, -2.421875, -2.068359375, -1.71484375, -1.361328125, -1.0078125, -0.654296875, -0.30078125, 0.052734375, 0.40625, 0.759765625, 1.11328125, 1.466796875, 1.8203125, 2.173828125, 2.52734375, 2.880859375, 3.234375, 3.587890625, 3.94140625, 4.294921875, 4.6484375, 5.001953125, 5.35546875, 5.708984375, 6.0625, 6.416015625, 6.76953125, 7.123046875, 7.4765625, 7.830078125, 8.18359375, 8.537109375, 8.890625, 9.244140625, 9.59765625, 9.951171875, 10.3046875, 10.658203125, 11.01171875, 11.365234375, 11.71875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 13.0, 8.0, 12.0, 14.0, 11.0, 17.0, 27.0, 21.0, 21.0, 28.0, 29.0, 27.0, 39.0, 42.0, 38.0, 37.0, 50.0, 48.0, 28.0, 31.0, 31.0, 28.0, 32.0, 33.0, 40.0, 36.0, 18.0, 28.0, 24.0, 32.0, 32.0, 24.0, 13.0, 12.0, 16.0, 13.0, 6.0, 11.0, 3.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.6591796875, -7.404296875, -7.1494140625, -6.89453125, -6.6396484375, -6.384765625, -6.1298828125, -5.875, -5.6201171875, -5.365234375, -5.1103515625, -4.85546875, -4.6005859375, -4.345703125, -4.0908203125, -3.8359375, -3.5810546875, -3.326171875, -3.0712890625, -2.81640625, -2.5615234375, -2.306640625, -2.0517578125, -1.796875, -1.5419921875, -1.287109375, -1.0322265625, -0.77734375, -0.5224609375, -0.267578125, -0.0126953125, 0.2421875, 0.4970703125, 0.751953125, 1.0068359375, 1.26171875, 1.5166015625, 1.771484375, 2.0263671875, 2.28125, 2.5361328125, 2.791015625, 3.0458984375, 3.30078125, 3.5556640625, 3.810546875, 4.0654296875, 4.3203125, 4.5751953125, 4.830078125, 5.0849609375, 5.33984375, 5.5947265625, 5.849609375, 6.1044921875, 6.359375, 6.6142578125, 6.869140625, 7.1240234375, 7.37890625, 7.6337890625, 7.888671875, 8.1435546875, 8.3984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 6.0, 5.0, 12.0, 12.0, 20.0, 23.0, 43.0, 46.0, 72.0, 87.0, 153.0, 255.0, 334.0, 538.0, 802.0, 1099.0, 1775.0, 2685.0, 3862.0, 5865.0, 9034.0, 13502.0, 20289.0, 30600.0, 47573.0, 74950.0, 118392.0, 164879.0, 174243.0, 133542.0, 86315.0, 54362.0, 34939.0, 22717.0, 15311.0, 10225.0, 6651.0, 4455.0, 2961.0, 1904.0, 1336.0, 844.0, 568.0, 400.0, 261.0, 203.0, 131.0, 102.0, 68.0, 36.0, 22.0, 19.0, 18.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.015625, -11.6298828125, -11.244140625, -10.8583984375, -10.47265625, -10.0869140625, -9.701171875, -9.3154296875, -8.9296875, -8.5439453125, -8.158203125, -7.7724609375, -7.38671875, -7.0009765625, -6.615234375, -6.2294921875, -5.84375, -5.4580078125, -5.072265625, -4.6865234375, -4.30078125, -3.9150390625, -3.529296875, -3.1435546875, -2.7578125, -2.3720703125, -1.986328125, -1.6005859375, -1.21484375, -0.8291015625, -0.443359375, -0.0576171875, 0.328125, 0.7138671875, 1.099609375, 1.4853515625, 1.87109375, 2.2568359375, 2.642578125, 3.0283203125, 3.4140625, 3.7998046875, 4.185546875, 4.5712890625, 4.95703125, 5.3427734375, 5.728515625, 6.1142578125, 6.5, 6.8857421875, 7.271484375, 7.6572265625, 8.04296875, 8.4287109375, 8.814453125, 9.2001953125, 9.5859375, 9.9716796875, 10.357421875, 10.7431640625, 11.12890625, 11.5146484375, 11.900390625, 12.2861328125, 12.671875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 7.0, 7.0, 3.0, 17.0, 10.0, 10.0, 18.0, 18.0, 28.0, 18.0, 34.0, 32.0, 32.0, 24.0, 33.0, 34.0, 32.0, 50.0, 41.0, 31.0, 40.0, 41.0, 40.0, 30.0, 41.0, 31.0, 31.0, 23.0, 28.0, 37.0, 22.0, 28.0, 26.0, 13.0, 14.0, 21.0, 12.0, 13.0, 11.0, 3.0, 6.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0274658203125, -4.859619140625, -4.6917724609375, -4.52392578125, -4.3560791015625, -4.188232421875, -4.0203857421875, -3.8525390625, -3.6846923828125, -3.516845703125, -3.3489990234375, -3.18115234375, -3.0133056640625, -2.845458984375, -2.6776123046875, -2.509765625, -2.3419189453125, -2.174072265625, -2.0062255859375, -1.83837890625, -1.6705322265625, -1.502685546875, -1.3348388671875, -1.1669921875, -0.9991455078125, -0.831298828125, -0.6634521484375, -0.49560546875, -0.3277587890625, -0.159912109375, 0.0079345703125, 0.17578125, 0.3436279296875, 0.511474609375, 0.6793212890625, 0.84716796875, 1.0150146484375, 1.182861328125, 1.3507080078125, 1.5185546875, 1.6864013671875, 1.854248046875, 2.0220947265625, 2.18994140625, 2.3577880859375, 2.525634765625, 2.6934814453125, 2.861328125, 3.0291748046875, 3.197021484375, 3.3648681640625, 3.53271484375, 3.7005615234375, 3.868408203125, 4.0362548828125, 4.2041015625, 4.3719482421875, 4.539794921875, 4.7076416015625, 4.87548828125, 5.0433349609375, 5.211181640625, 5.3790283203125, 5.546875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 18.0, 20.0, 35.0, 50.0, 66.0, 75.0, 136.0, 187.0, 276.0, 326.0, 507.0, 755.0, 1038.0, 1432.0, 2154.0, 3134.0, 4473.0, 6919.0, 10722.0, 16922.0, 28034.0, 48633.0, 91067.0, 204755.0, 303011.0, 147875.0, 70943.0, 39771.0, 23277.0, 14363.0, 9022.0, 5908.0, 3879.0, 2670.0, 1843.0, 1240.0, 864.0, 638.0, 443.0, 283.0, 251.0, 154.0, 94.0, 92.0, 63.0, 35.0, 29.0, 22.0, 12.0, 9.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.84375, -1.782928466796875, -1.72210693359375, -1.661285400390625, -1.6004638671875, -1.539642333984375, -1.47882080078125, -1.417999267578125, -1.357177734375, -1.296356201171875, -1.23553466796875, -1.174713134765625, -1.1138916015625, -1.053070068359375, -0.99224853515625, -0.931427001953125, -0.87060546875, -0.809783935546875, -0.74896240234375, -0.688140869140625, -0.6273193359375, -0.566497802734375, -0.50567626953125, -0.444854736328125, -0.384033203125, -0.323211669921875, -0.26239013671875, -0.201568603515625, -0.1407470703125, -0.079925537109375, -0.01910400390625, 0.041717529296875, 0.1025390625, 0.163360595703125, 0.22418212890625, 0.285003662109375, 0.3458251953125, 0.406646728515625, 0.46746826171875, 0.528289794921875, 0.589111328125, 0.649932861328125, 0.71075439453125, 0.771575927734375, 0.8323974609375, 0.893218994140625, 0.95404052734375, 1.014862060546875, 1.07568359375, 1.136505126953125, 1.19732666015625, 1.258148193359375, 1.3189697265625, 1.379791259765625, 1.44061279296875, 1.501434326171875, 1.562255859375, 1.623077392578125, 1.68389892578125, 1.744720458984375, 1.8055419921875, 1.866363525390625, 1.92718505859375, 1.988006591796875, 2.048828125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 12.0, 20.0, 22.0, 39.0, 43.0, 52.0, 60.0, 80.0, 108.0, 98.0, 98.0, 74.0, 71.0, 44.0, 43.0, 30.0, 19.0, 22.0, 11.0, 11.0, 10.0, 7.0, 6.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012731552124023438, -0.00012301653623580933, -0.00011871755123138428, -0.00011441856622695923, -0.00011011958122253418, -0.00010582059621810913, -0.00010152161121368408, -9.722262620925903e-05, -9.292364120483398e-05, -8.862465620040894e-05, -8.432567119598389e-05, -8.002668619155884e-05, -7.572770118713379e-05, -7.142871618270874e-05, -6.712973117828369e-05, -6.283074617385864e-05, -5.8531761169433594e-05, -5.4232776165008545e-05, -4.9933791160583496e-05, -4.563480615615845e-05, -4.13358211517334e-05, -3.703683614730835e-05, -3.27378511428833e-05, -2.8438866138458252e-05, -2.4139881134033203e-05, -1.9840896129608154e-05, -1.5541911125183105e-05, -1.1242926120758057e-05, -6.943941116333008e-06, -2.644956111907959e-06, 1.6540288925170898e-06, 5.953013896942139e-06, 1.0251998901367188e-05, 1.4550983905792236e-05, 1.8849968910217285e-05, 2.3148953914642334e-05, 2.7447938919067383e-05, 3.174692392349243e-05, 3.604590892791748e-05, 4.034489393234253e-05, 4.464387893676758e-05, 4.894286394119263e-05, 5.3241848945617676e-05, 5.7540833950042725e-05, 6.183981895446777e-05, 6.613880395889282e-05, 7.043778896331787e-05, 7.473677396774292e-05, 7.903575897216797e-05, 8.333474397659302e-05, 8.763372898101807e-05, 9.193271398544312e-05, 9.623169898986816e-05, 0.00010053068399429321, 0.00010482966899871826, 0.00010912865400314331, 0.00011342763900756836, 0.00011772662401199341, 0.00012202560901641846, 0.0001263245940208435, 0.00013062357902526855, 0.0001349225640296936, 0.00013922154903411865, 0.0001435205340385437, 0.00014781951904296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 9.0, 17.0, 30.0, 40.0, 61.0, 87.0, 111.0, 175.0, 282.0, 367.0, 636.0, 895.0, 1386.0, 2235.0, 3522.0, 5617.0, 9290.0, 15209.0, 26140.0, 47440.0, 94356.0, 249160.0, 328098.0, 125988.0, 58126.0, 32086.0, 18291.0, 10778.0, 6790.0, 3962.0, 2649.0, 1550.0, 1078.0, 667.0, 442.0, 305.0, 215.0, 128.0, 99.0, 66.0, 41.0, 37.0, 24.0, 13.0, 11.0, 12.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.26953125, -2.198974609375, -2.12841796875, -2.057861328125, -1.9873046875, -1.916748046875, -1.84619140625, -1.775634765625, -1.705078125, -1.634521484375, -1.56396484375, -1.493408203125, -1.4228515625, -1.352294921875, -1.28173828125, -1.211181640625, -1.140625, -1.070068359375, -0.99951171875, -0.928955078125, -0.8583984375, -0.787841796875, -0.71728515625, -0.646728515625, -0.576171875, -0.505615234375, -0.43505859375, -0.364501953125, -0.2939453125, -0.223388671875, -0.15283203125, -0.082275390625, -0.01171875, 0.058837890625, 0.12939453125, 0.199951171875, 0.2705078125, 0.341064453125, 0.41162109375, 0.482177734375, 0.552734375, 0.623291015625, 0.69384765625, 0.764404296875, 0.8349609375, 0.905517578125, 0.97607421875, 1.046630859375, 1.1171875, 1.187744140625, 1.25830078125, 1.328857421875, 1.3994140625, 1.469970703125, 1.54052734375, 1.611083984375, 1.681640625, 1.752197265625, 1.82275390625, 1.893310546875, 1.9638671875, 2.034423828125, 2.10498046875, 2.175537109375, 2.24609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 5.0, 12.0, 11.0, 12.0, 11.0, 16.0, 21.0, 33.0, 30.0, 28.0, 31.0, 45.0, 49.0, 45.0, 60.0, 65.0, 66.0, 64.0, 56.0, 40.0, 49.0, 37.0, 39.0, 30.0, 26.0, 17.0, 20.0, 17.0, 17.0, 6.0, 11.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8056640625, -0.7787628173828125, -0.751861572265625, -0.7249603271484375, -0.69805908203125, -0.6711578369140625, -0.644256591796875, -0.6173553466796875, -0.5904541015625, -0.5635528564453125, -0.536651611328125, -0.5097503662109375, -0.48284912109375, -0.4559478759765625, -0.429046630859375, -0.4021453857421875, -0.375244140625, -0.3483428955078125, -0.321441650390625, -0.2945404052734375, -0.26763916015625, -0.2407379150390625, -0.213836669921875, -0.1869354248046875, -0.1600341796875, -0.1331329345703125, -0.106231689453125, -0.0793304443359375, -0.05242919921875, -0.0255279541015625, 0.001373291015625, 0.0282745361328125, 0.05517578125, 0.0820770263671875, 0.108978271484375, 0.1358795166015625, 0.16278076171875, 0.1896820068359375, 0.216583251953125, 0.2434844970703125, 0.2703857421875, 0.2972869873046875, 0.324188232421875, 0.3510894775390625, 0.37799072265625, 0.4048919677734375, 0.431793212890625, 0.4586944580078125, 0.485595703125, 0.5124969482421875, 0.539398193359375, 0.5662994384765625, 0.59320068359375, 0.6201019287109375, 0.647003173828125, 0.6739044189453125, 0.7008056640625, 0.7277069091796875, 0.754608154296875, 0.7815093994140625, 0.80841064453125, 0.8353118896484375, 0.862213134765625, 0.8891143798828125, 0.916015625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 6.0, 12.0, 23.0, 27.0, 34.0, 38.0, 36.0, 37.0, 66.0, 93.0, 78.0, 80.0, 88.0, 66.0, 65.0, 58.0, 37.0, 38.0, 19.0, 20.0, 12.0, 11.0, 8.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.037823677062988, -10.694245338439941, -10.350666999816895, -10.007089614868164, -9.663511276245117, -9.31993293762207, -8.976354598999023, -8.632776260375977, -8.28919792175293, -7.945619583129883, -7.602041721343994, -7.258463382720947, -6.914885520935059, -6.571307182312012, -6.227728843688965, -5.884150505065918, -5.5405731201171875, -5.196994781494141, -4.853416919708252, -4.509838581085205, -4.166260719299316, -3.8226823806762695, -3.4791040420532227, -3.135525941848755, -2.791947841644287, -2.4483697414398193, -2.1047916412353516, -1.7612133026123047, -1.417635202407837, -1.0740571022033691, -0.7304787635803223, -0.3869006633758545, -0.04332256317138672, 0.30025559663772583, 0.6438337564468384, 0.9874119758605957, 1.3309900760650635, 1.6745681762695312, 2.018146514892578, 2.361724615097046, 2.7053027153015137, 3.0488808155059814, 3.392458915710449, 3.736037254333496, 4.079615592956543, 4.423193454742432, 4.7667717933654785, 5.110349655151367, 5.453927993774414, 5.797506332397461, 6.14108419418335, 6.4846625328063965, 6.828240394592285, 7.171818733215332, 7.515397071838379, 7.858975410461426, 8.202552795410156, 8.546131134033203, 8.88970947265625, 9.233287811279297, 9.576865196228027, 9.920443534851074, 10.264021873474121, 10.607600212097168, 10.951178550720215]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 11.0, 12.0, 13.0, 9.0, 18.0, 19.0, 18.0, 17.0, 27.0, 29.0, 25.0, 17.0, 31.0, 36.0, 27.0, 37.0, 30.0, 37.0, 38.0, 30.0, 33.0, 37.0, 38.0, 36.0, 25.0, 36.0, 32.0, 29.0, 27.0, 22.0, 20.0, 20.0, 22.0, 14.0, 24.0, 19.0, 10.0, 10.0, 14.0, 8.0, 9.0, 8.0, 6.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-7.880161762237549, -7.623427391052246, -7.366693019866943, -7.109958648681641, -6.853224277496338, -6.596489906311035, -6.339755058288574, -6.08302116394043, -5.826286315917969, -5.569551944732666, -5.312817573547363, -5.0560832023620605, -4.799348831176758, -4.542614459991455, -4.285880088806152, -4.029145240783691, -3.772411346435547, -3.515676975250244, -3.2589426040649414, -3.0022082328796387, -2.745473861694336, -2.488739490509033, -2.2320048809051514, -1.9752705097198486, -1.718536138534546, -1.4618017673492432, -1.2050673961639404, -0.9483329057693481, -0.6915985345840454, -0.4348641633987427, -0.1781296730041504, 0.07860469818115234, 0.3353385925292969, 0.5920729637145996, 0.8488073945045471, 1.1055418252944946, 1.3622761964797974, 1.6190105676651, 1.8757450580596924, 2.132479429244995, 2.389213800430298, 2.6459481716156006, 2.9026825428009033, 3.159417152404785, 3.416151523590088, 3.6728858947753906, 3.9296202659606934, 4.186354637145996, 4.443089008331299, 4.699823379516602, 4.956557750701904, 5.213292121887207, 5.47002649307251, 5.7267608642578125, 5.983495712280273, 6.240229606628418, 6.496964454650879, 6.753698825836182, 7.010433197021484, 7.267167568206787, 7.52390193939209, 7.780636310577393, 8.037370681762695, 8.294105529785156, 8.5508394241333]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 15.0, 14.0, 20.0, 46.0, 54.0, 82.0, 136.0, 201.0, 334.0, 462.0, 685.0, 1035.0, 1462.0, 2267.0, 3478.0, 5092.0, 7864.0, 11930.0, 18396.0, 28907.0, 46221.0, 76003.0, 133904.0, 287601.0, 778617.0, 1377659.0, 796773.0, 277299.0, 128248.0, 74585.0, 46342.0, 29444.0, 19085.0, 12646.0, 8607.0, 5702.0, 4047.0, 2724.0, 1852.0, 1351.0, 941.0, 659.0, 460.0, 345.0, 217.0, 144.0, 106.0, 82.0, 44.0, 33.0, 18.0, 20.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0], "bins": [-10.6328125, -10.29541015625, -9.9580078125, -9.62060546875, -9.283203125, -8.94580078125, -8.6083984375, -8.27099609375, -7.93359375, -7.59619140625, -7.2587890625, -6.92138671875, -6.583984375, -6.24658203125, -5.9091796875, -5.57177734375, -5.234375, -4.89697265625, -4.5595703125, -4.22216796875, -3.884765625, -3.54736328125, -3.2099609375, -2.87255859375, -2.53515625, -2.19775390625, -1.8603515625, -1.52294921875, -1.185546875, -0.84814453125, -0.5107421875, -0.17333984375, 0.1640625, 0.50146484375, 0.8388671875, 1.17626953125, 1.513671875, 1.85107421875, 2.1884765625, 2.52587890625, 2.86328125, 3.20068359375, 3.5380859375, 3.87548828125, 4.212890625, 4.55029296875, 4.8876953125, 5.22509765625, 5.5625, 5.89990234375, 6.2373046875, 6.57470703125, 6.912109375, 7.24951171875, 7.5869140625, 7.92431640625, 8.26171875, 8.59912109375, 8.9365234375, 9.27392578125, 9.611328125, 9.94873046875, 10.2861328125, 10.62353515625, 10.9609375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 8.0, 17.0, 12.0, 20.0, 13.0, 20.0, 16.0, 32.0, 28.0, 29.0, 32.0, 23.0, 35.0, 36.0, 37.0, 36.0, 37.0, 35.0, 28.0, 39.0, 41.0, 39.0, 32.0, 35.0, 28.0, 29.0, 21.0, 29.0, 24.0, 21.0, 13.0, 24.0, 20.0, 20.0, 13.0, 6.0, 15.0, 6.0, 7.0, 7.0, 4.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.21484375, -6.9808349609375, -6.746826171875, -6.5128173828125, -6.27880859375, -6.0447998046875, -5.810791015625, -5.5767822265625, -5.3427734375, -5.1087646484375, -4.874755859375, -4.6407470703125, -4.40673828125, -4.1727294921875, -3.938720703125, -3.7047119140625, -3.470703125, -3.2366943359375, -3.002685546875, -2.7686767578125, -2.53466796875, -2.3006591796875, -2.066650390625, -1.8326416015625, -1.5986328125, -1.3646240234375, -1.130615234375, -0.8966064453125, -0.66259765625, -0.4285888671875, -0.194580078125, 0.0394287109375, 0.2734375, 0.5074462890625, 0.741455078125, 0.9754638671875, 1.20947265625, 1.4434814453125, 1.677490234375, 1.9114990234375, 2.1455078125, 2.3795166015625, 2.613525390625, 2.8475341796875, 3.08154296875, 3.3155517578125, 3.549560546875, 3.7835693359375, 4.017578125, 4.2515869140625, 4.485595703125, 4.7196044921875, 4.95361328125, 5.1876220703125, 5.421630859375, 5.6556396484375, 5.8896484375, 6.1236572265625, 6.357666015625, 6.5916748046875, 6.82568359375, 7.0596923828125, 7.293701171875, 7.5277099609375, 7.76171875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 19.0, 17.0, 34.0, 51.0, 71.0, 117.0, 150.0, 265.0, 366.0, 597.0, 900.0, 1423.0, 2205.0, 3352.0, 5231.0, 8298.0, 13712.0, 22429.0, 38628.0, 68459.0, 128657.0, 262145.0, 591969.0, 1376142.0, 901450.0, 376524.0, 175920.0, 91130.0, 49838.0, 28635.0, 17096.0, 10306.0, 6439.0, 4222.0, 2638.0, 1635.0, 1105.0, 719.0, 478.0, 316.0, 184.0, 157.0, 94.0, 54.0, 37.0, 24.0, 16.0, 9.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.5059814453125, -10.152587890625, -9.7991943359375, -9.44580078125, -9.0924072265625, -8.739013671875, -8.3856201171875, -8.0322265625, -7.6788330078125, -7.325439453125, -6.9720458984375, -6.61865234375, -6.2652587890625, -5.911865234375, -5.5584716796875, -5.205078125, -4.8516845703125, -4.498291015625, -4.1448974609375, -3.79150390625, -3.4381103515625, -3.084716796875, -2.7313232421875, -2.3779296875, -2.0245361328125, -1.671142578125, -1.3177490234375, -0.96435546875, -0.6109619140625, -0.257568359375, 0.0958251953125, 0.44921875, 0.8026123046875, 1.156005859375, 1.5093994140625, 1.86279296875, 2.2161865234375, 2.569580078125, 2.9229736328125, 3.2763671875, 3.6297607421875, 3.983154296875, 4.3365478515625, 4.68994140625, 5.0433349609375, 5.396728515625, 5.7501220703125, 6.103515625, 6.4569091796875, 6.810302734375, 7.1636962890625, 7.51708984375, 7.8704833984375, 8.223876953125, 8.5772705078125, 8.9306640625, 9.2840576171875, 9.637451171875, 9.9908447265625, 10.34423828125, 10.6976318359375, 11.051025390625, 11.4044189453125, 11.7578125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 5.0, 10.0, 7.0, 7.0, 13.0, 32.0, 16.0, 15.0, 24.0, 22.0, 50.0, 34.0, 63.0, 59.0, 87.0, 102.0, 114.0, 144.0, 182.0, 208.0, 227.0, 281.0, 338.0, 369.0, 271.0, 248.0, 190.0, 155.0, 132.0, 118.0, 81.0, 81.0, 68.0, 72.0, 46.0, 31.0, 23.0, 31.0, 20.0, 17.0, 14.0, 18.0, 14.0, 8.0, 8.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.65234375, -3.52593994140625, -3.3995361328125, -3.27313232421875, -3.146728515625, -3.02032470703125, -2.8939208984375, -2.76751708984375, -2.64111328125, -2.51470947265625, -2.3883056640625, -2.26190185546875, -2.135498046875, -2.00909423828125, -1.8826904296875, -1.75628662109375, -1.6298828125, -1.50347900390625, -1.3770751953125, -1.25067138671875, -1.124267578125, -0.99786376953125, -0.8714599609375, -0.74505615234375, -0.61865234375, -0.49224853515625, -0.3658447265625, -0.23944091796875, -0.113037109375, 0.01336669921875, 0.1397705078125, 0.26617431640625, 0.392578125, 0.51898193359375, 0.6453857421875, 0.77178955078125, 0.898193359375, 1.02459716796875, 1.1510009765625, 1.27740478515625, 1.40380859375, 1.53021240234375, 1.6566162109375, 1.78302001953125, 1.909423828125, 2.03582763671875, 2.1622314453125, 2.28863525390625, 2.4150390625, 2.54144287109375, 2.6678466796875, 2.79425048828125, 2.920654296875, 3.04705810546875, 3.1734619140625, 3.29986572265625, 3.42626953125, 3.55267333984375, 3.6790771484375, 3.80548095703125, 3.931884765625, 4.05828857421875, 4.1846923828125, 4.31109619140625, 4.4375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 8.0, 8.0, 11.0, 12.0, 24.0, 19.0, 37.0, 45.0, 62.0, 59.0, 91.0, 99.0, 126.0, 107.0, 68.0, 59.0, 36.0, 29.0, 18.0, 16.0, 18.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.789109230041504, -10.389486312866211, -9.989863395690918, -9.590241432189941, -9.190618515014648, -8.790995597839355, -8.391372680664062, -7.991750240325928, -7.592127799987793, -7.1925048828125, -6.792882442474365, -6.393259525299072, -5.9936370849609375, -5.5940141677856445, -5.194391250610352, -4.794768810272217, -4.395145893096924, -3.99552321434021, -3.595900535583496, -3.196277618408203, -2.7966551780700684, -2.3970322608947754, -1.9974095821380615, -1.5977869033813477, -1.1981642246246338, -0.7985415458679199, -0.3989188075065613, 0.0007039308547973633, 0.40032660961151123, 0.7999492883682251, 1.1995720863342285, 1.5991947650909424, 1.9988174438476562, 2.39844012260437, 2.798062801361084, 3.197685718536377, 3.5973081588745117, 3.9969310760498047, 4.396553993225098, 4.796176433563232, 5.195798873901367, 5.59542179107666, 5.995044231414795, 6.394667148590088, 6.794289588928223, 7.193912506103516, 7.593535423278809, 7.993157863616943, 8.392780303955078, 8.792403221130371, 9.192026138305664, 9.59164810180664, 9.991271018981934, 10.390893936157227, 10.79051685333252, 11.190139770507812, 11.589762687683105, 11.989385604858398, 12.389008522033691, 12.788630485534668, 13.188253402709961, 13.587876319885254, 13.987499237060547, 14.387121200561523, 14.786744117736816]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 15.0, 6.0, 11.0, 17.0, 13.0, 19.0, 19.0, 23.0, 18.0, 24.0, 30.0, 29.0, 25.0, 25.0, 34.0, 25.0, 35.0, 46.0, 38.0, 29.0, 40.0, 40.0, 40.0, 27.0, 38.0, 35.0, 31.0, 29.0, 19.0, 21.0, 29.0, 25.0, 19.0, 16.0, 16.0, 10.0, 14.0, 15.0, 10.0, 8.0, 11.0, 7.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.488620281219482, -7.223860740661621, -6.959100723266602, -6.69434118270874, -6.429581642150879, -6.164821624755859, -5.900062084197998, -5.635302543640137, -5.370542526245117, -5.105782985687256, -4.841022968292236, -4.576263427734375, -4.311503887176514, -4.046744346618652, -3.781984329223633, -3.5172247886657715, -3.25246524810791, -2.9877054691314697, -2.7229459285736084, -2.458186149597168, -2.1934266090393066, -1.9286668300628662, -1.6639070510864258, -1.399147391319275, -1.134387731552124, -0.8696280717849731, -0.6048683524131775, -0.34010863304138184, -0.07534897327423096, 0.18941068649291992, 0.45417046546936035, 0.7189301252365112, 0.9836893081665039, 1.2484489679336548, 1.5132086277008057, 1.777968406677246, 2.0427279472351074, 2.307487726211548, 2.5722475051879883, 2.8370070457458496, 3.10176682472229, 3.3665266036987305, 3.631286144256592, 3.8960459232330322, 4.160805702209473, 4.425565242767334, 4.690324783325195, 4.955084800720215, 5.219844341278076, 5.4846038818359375, 5.749363899230957, 6.014123439788818, 6.27888298034668, 6.543642997741699, 6.8084025382995605, 7.073162078857422, 7.337922096252441, 7.602681636810303, 7.867441654205322, 8.132201194763184, 8.396961212158203, 8.661720275878906, 8.926480293273926, 9.191240310668945, 9.455999374389648]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 12.0, 8.0, 22.0, 35.0, 56.0, 64.0, 107.0, 161.0, 232.0, 349.0, 534.0, 731.0, 1080.0, 1733.0, 2518.0, 3713.0, 5516.0, 8337.0, 13038.0, 20298.0, 32388.0, 53526.0, 92589.0, 191057.0, 315970.0, 123955.0, 68525.0, 40603.0, 24708.0, 15865.0, 10404.0, 6984.0, 4414.0, 2999.0, 1974.0, 1339.0, 927.0, 590.0, 393.0, 260.0, 190.0, 115.0, 86.0, 56.0, 27.0, 22.0, 16.0, 11.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.532196044921875, -2.45111083984375, -2.370025634765625, -2.2889404296875, -2.207855224609375, -2.12677001953125, -2.045684814453125, -1.964599609375, -1.883514404296875, -1.80242919921875, -1.721343994140625, -1.6402587890625, -1.559173583984375, -1.47808837890625, -1.397003173828125, -1.31591796875, -1.234832763671875, -1.15374755859375, -1.072662353515625, -0.9915771484375, -0.910491943359375, -0.82940673828125, -0.748321533203125, -0.667236328125, -0.586151123046875, -0.50506591796875, -0.423980712890625, -0.3428955078125, -0.261810302734375, -0.18072509765625, -0.099639892578125, -0.0185546875, 0.062530517578125, 0.14361572265625, 0.224700927734375, 0.3057861328125, 0.386871337890625, 0.46795654296875, 0.549041748046875, 0.630126953125, 0.711212158203125, 0.79229736328125, 0.873382568359375, 0.9544677734375, 1.035552978515625, 1.11663818359375, 1.197723388671875, 1.27880859375, 1.359893798828125, 1.44097900390625, 1.522064208984375, 1.6031494140625, 1.684234619140625, 1.76531982421875, 1.846405029296875, 1.927490234375, 2.008575439453125, 2.08966064453125, 2.170745849609375, 2.2518310546875, 2.332916259765625, 2.41400146484375, 2.495086669921875, 2.576171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 6.0, 16.0, 13.0, 19.0, 22.0, 25.0, 24.0, 20.0, 16.0, 31.0, 31.0, 31.0, 39.0, 25.0, 47.0, 41.0, 30.0, 30.0, 46.0, 50.0, 44.0, 36.0, 23.0, 44.0, 32.0, 27.0, 27.0, 23.0, 34.0, 17.0, 18.0, 12.0, 14.0, 11.0, 12.0, 11.0, 13.0, 13.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.01953125, -7.734375, -7.44921875, -7.1640625, -6.87890625, -6.59375, -6.30859375, -6.0234375, -5.73828125, -5.453125, -5.16796875, -4.8828125, -4.59765625, -4.3125, -4.02734375, -3.7421875, -3.45703125, -3.171875, -2.88671875, -2.6015625, -2.31640625, -2.03125, -1.74609375, -1.4609375, -1.17578125, -0.890625, -0.60546875, -0.3203125, -0.03515625, 0.25, 0.53515625, 0.8203125, 1.10546875, 1.390625, 1.67578125, 1.9609375, 2.24609375, 2.53125, 2.81640625, 3.1015625, 3.38671875, 3.671875, 3.95703125, 4.2421875, 4.52734375, 4.8125, 5.09765625, 5.3828125, 5.66796875, 5.953125, 6.23828125, 6.5234375, 6.80859375, 7.09375, 7.37890625, 7.6640625, 7.94921875, 8.234375, 8.51953125, 8.8046875, 9.08984375, 9.375, 9.66015625, 9.9453125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 16.0, 11.0, 36.0, 30.0, 28.0, 73.0, 102.0, 129.0, 178.0, 231.0, 342.0, 485.0, 651.0, 906.0, 1340.0, 1920.0, 2808.0, 4201.0, 6185.0, 9152.0, 14341.0, 22254.0, 35491.0, 58158.0, 103664.0, 247104.0, 268825.0, 106950.0, 59438.0, 36371.0, 22854.0, 14649.0, 9533.0, 6290.0, 4222.0, 2898.0, 1941.0, 1386.0, 1042.0, 585.0, 498.0, 348.0, 240.0, 175.0, 134.0, 92.0, 72.0, 51.0, 38.0, 29.0, 18.0, 14.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0], "bins": [-2.521484375, -2.4427490234375, -2.364013671875, -2.2852783203125, -2.20654296875, -2.1278076171875, -2.049072265625, -1.9703369140625, -1.8916015625, -1.8128662109375, -1.734130859375, -1.6553955078125, -1.57666015625, -1.4979248046875, -1.419189453125, -1.3404541015625, -1.26171875, -1.1829833984375, -1.104248046875, -1.0255126953125, -0.94677734375, -0.8680419921875, -0.789306640625, -0.7105712890625, -0.6318359375, -0.5531005859375, -0.474365234375, -0.3956298828125, -0.31689453125, -0.2381591796875, -0.159423828125, -0.0806884765625, -0.001953125, 0.0767822265625, 0.155517578125, 0.2342529296875, 0.31298828125, 0.3917236328125, 0.470458984375, 0.5491943359375, 0.6279296875, 0.7066650390625, 0.785400390625, 0.8641357421875, 0.94287109375, 1.0216064453125, 1.100341796875, 1.1790771484375, 1.2578125, 1.3365478515625, 1.415283203125, 1.4940185546875, 1.57275390625, 1.6514892578125, 1.730224609375, 1.8089599609375, 1.8876953125, 1.9664306640625, 2.045166015625, 2.1239013671875, 2.20263671875, 2.2813720703125, 2.360107421875, 2.4388427734375, 2.517578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 9.0, 6.0, 14.0, 12.0, 16.0, 13.0, 24.0, 20.0, 27.0, 24.0, 21.0, 29.0, 39.0, 32.0, 43.0, 49.0, 48.0, 44.0, 45.0, 37.0, 31.0, 38.0, 30.0, 31.0, 42.0, 32.0, 32.0, 19.0, 24.0, 25.0, 21.0, 24.0, 14.0, 16.0, 10.0, 9.0, 5.0, 4.0, 7.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0], "bins": [-6.28125, -6.0989990234375, -5.916748046875, -5.7344970703125, -5.55224609375, -5.3699951171875, -5.187744140625, -5.0054931640625, -4.8232421875, -4.6409912109375, -4.458740234375, -4.2764892578125, -4.09423828125, -3.9119873046875, -3.729736328125, -3.5474853515625, -3.365234375, -3.1829833984375, -3.000732421875, -2.8184814453125, -2.63623046875, -2.4539794921875, -2.271728515625, -2.0894775390625, -1.9072265625, -1.7249755859375, -1.542724609375, -1.3604736328125, -1.17822265625, -0.9959716796875, -0.813720703125, -0.6314697265625, -0.44921875, -0.2669677734375, -0.084716796875, 0.0975341796875, 0.27978515625, 0.4620361328125, 0.644287109375, 0.8265380859375, 1.0087890625, 1.1910400390625, 1.373291015625, 1.5555419921875, 1.73779296875, 1.9200439453125, 2.102294921875, 2.2845458984375, 2.466796875, 2.6490478515625, 2.831298828125, 3.0135498046875, 3.19580078125, 3.3780517578125, 3.560302734375, 3.7425537109375, 3.9248046875, 4.1070556640625, 4.289306640625, 4.4715576171875, 4.65380859375, 4.8360595703125, 5.018310546875, 5.2005615234375, 5.3828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 9.0, 13.0, 11.0, 21.0, 41.0, 53.0, 69.0, 90.0, 117.0, 181.0, 256.0, 319.0, 457.0, 707.0, 992.0, 1421.0, 2135.0, 3091.0, 4792.0, 7228.0, 11527.0, 18701.0, 33034.0, 62198.0, 131032.0, 288588.0, 244647.0, 108276.0, 53268.0, 28800.0, 16402.0, 10337.0, 6431.0, 4148.0, 2859.0, 1882.0, 1280.0, 933.0, 663.0, 438.0, 309.0, 246.0, 179.0, 99.0, 75.0, 53.0, 43.0, 27.0, 19.0, 17.0, 18.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0035572052001953125, -0.0034456253051757812, -0.00333404541015625, -0.0032224655151367188, -0.0031108856201171875, -0.0029993057250976562, -0.002887725830078125, -0.0027761459350585938, -0.0026645660400390625, -0.0025529861450195312, -0.00244140625, -0.0023298263549804688, -0.0022182464599609375, -0.0021066665649414062, -0.001995086669921875, -0.0018835067749023438, -0.0017719268798828125, -0.0016603469848632812, -0.00154876708984375, -0.0014371871948242188, -0.0013256072998046875, -0.0012140274047851562, -0.001102447509765625, -0.0009908676147460938, -0.0008792877197265625, -0.0007677078247070312, -0.0006561279296875, -0.0005445480346679688, -0.0004329681396484375, -0.00032138824462890625, -0.000209808349609375, -9.822845458984375e-05, 1.33514404296875e-05, 0.00012493133544921875, 0.00023651123046875, 0.00034809112548828125, 0.0004596710205078125, 0.0005712509155273438, 0.000682830810546875, 0.0007944107055664062, 0.0009059906005859375, 0.0010175704956054688, 0.001129150390625, 0.0012407302856445312, 0.0013523101806640625, 0.0014638900756835938, 0.001575469970703125, 0.0016870498657226562, 0.0017986297607421875, 0.0019102096557617188, 0.00202178955078125, 0.0021333694458007812, 0.0022449493408203125, 0.0023565292358398438, 0.002468109130859375, 0.0025796890258789062, 0.0026912689208984375, 0.0028028488159179688, 0.0029144287109375, 0.0030260086059570312, 0.0031375885009765625, 0.0032491683959960938, 0.003360748291015625, 0.0034723281860351562, 0.0035839080810546875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 14.0, 26.0, 29.0, 32.0, 27.0, 43.0, 46.0, 48.0, 67.0, 67.0, 76.0, 50.0, 87.0, 47.0, 67.0, 43.0, 57.0, 19.0, 45.0, 18.0, 28.0, 9.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.125999450683594e-06, -4.978850483894348e-06, -4.8317015171051025e-06, -4.684552550315857e-06, -4.537403583526611e-06, -4.390254616737366e-06, -4.24310564994812e-06, -4.0959566831588745e-06, -3.948807716369629e-06, -3.8016587495803833e-06, -3.6545097827911377e-06, -3.507360816001892e-06, -3.3602118492126465e-06, -3.213062882423401e-06, -3.0659139156341553e-06, -2.9187649488449097e-06, -2.771615982055664e-06, -2.6244670152664185e-06, -2.477318048477173e-06, -2.3301690816879272e-06, -2.1830201148986816e-06, -2.035871148109436e-06, -1.8887221813201904e-06, -1.7415732145309448e-06, -1.5944242477416992e-06, -1.4472752809524536e-06, -1.300126314163208e-06, -1.1529773473739624e-06, -1.0058283805847168e-06, -8.586794137954712e-07, -7.115304470062256e-07, -5.6438148021698e-07, -4.172325134277344e-07, -2.7008354663848877e-07, -1.2293457984924316e-07, 2.421438694000244e-08, 1.7136335372924805e-07, 3.1851232051849365e-07, 4.6566128730773926e-07, 6.128102540969849e-07, 7.599592208862305e-07, 9.071081876754761e-07, 1.0542571544647217e-06, 1.2014061212539673e-06, 1.3485550880432129e-06, 1.4957040548324585e-06, 1.642853021621704e-06, 1.7900019884109497e-06, 1.9371509552001953e-06, 2.084299921989441e-06, 2.2314488887786865e-06, 2.378597855567932e-06, 2.5257468223571777e-06, 2.6728957891464233e-06, 2.820044755935669e-06, 2.9671937227249146e-06, 3.11434268951416e-06, 3.2614916563034058e-06, 3.4086406230926514e-06, 3.555789589881897e-06, 3.7029385566711426e-06, 3.850087523460388e-06, 3.997236490249634e-06, 4.144385457038879e-06, 4.291534423828125e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 9.0, 8.0, 12.0, 20.0, 25.0, 31.0, 46.0, 49.0, 73.0, 116.0, 170.0, 237.0, 334.0, 499.0, 687.0, 1064.0, 1615.0, 2482.0, 4019.0, 6534.0, 11497.0, 21017.0, 40844.0, 86978.0, 204771.0, 350165.0, 164434.0, 72102.0, 34901.0, 17834.0, 9878.0, 5797.0, 3595.0, 2214.0, 1460.0, 889.0, 659.0, 418.0, 341.0, 207.0, 146.0, 113.0, 79.0, 54.0, 43.0, 22.0, 29.0, 22.0, 7.0, 9.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037841796875, -0.003655374050140381, -0.0035265684127807617, -0.0033977627754211426, -0.0032689571380615234, -0.0031401515007019043, -0.003011345863342285, -0.002882540225982666, -0.002753734588623047, -0.0026249289512634277, -0.0024961233139038086, -0.0023673176765441895, -0.0022385120391845703, -0.002109706401824951, -0.001980900764465332, -0.0018520951271057129, -0.0017232894897460938, -0.0015944838523864746, -0.0014656782150268555, -0.0013368725776672363, -0.0012080669403076172, -0.001079261302947998, -0.0009504556655883789, -0.0008216500282287598, -0.0006928443908691406, -0.0005640387535095215, -0.00043523311614990234, -0.0003064274787902832, -0.00017762184143066406, -4.881620407104492e-05, 7.998943328857422e-05, 0.00020879507064819336, 0.0003376007080078125, 0.00046640634536743164, 0.0005952119827270508, 0.0007240176200866699, 0.0008528232574462891, 0.0009816288948059082, 0.0011104345321655273, 0.0012392401695251465, 0.0013680458068847656, 0.0014968514442443848, 0.001625657081604004, 0.001754462718963623, 0.0018832683563232422, 0.0020120739936828613, 0.0021408796310424805, 0.0022696852684020996, 0.0023984909057617188, 0.002527296543121338, 0.002656102180480957, 0.002784907817840576, 0.0029137134552001953, 0.0030425190925598145, 0.0031713247299194336, 0.0033001303672790527, 0.003428936004638672, 0.003557741641998291, 0.00368654727935791, 0.0038153529167175293, 0.0039441585540771484, 0.004072964191436768, 0.004201769828796387, 0.004330575466156006, 0.004459381103515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 5.0, 10.0, 12.0, 17.0, 17.0, 29.0, 33.0, 48.0, 63.0, 66.0, 71.0, 107.0, 95.0, 87.0, 70.0, 46.0, 55.0, 37.0, 24.0, 26.0, 18.0, 14.0, 8.0, 7.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018281936645507812, -0.0017758309841156006, -0.00172346830368042, -0.0016711056232452393, -0.0016187429428100586, -0.001566380262374878, -0.0015140175819396973, -0.0014616549015045166, -0.001409292221069336, -0.0013569295406341553, -0.0013045668601989746, -0.001252204179763794, -0.0011998414993286133, -0.0011474788188934326, -0.001095116138458252, -0.0010427534580230713, -0.0009903907775878906, -0.00093802809715271, -0.0008856654167175293, -0.0008333027362823486, -0.000780940055847168, -0.0007285773754119873, -0.0006762146949768066, -0.000623852014541626, -0.0005714893341064453, -0.0005191266536712646, -0.000466763973236084, -0.0004144012928009033, -0.00036203861236572266, -0.000309675931930542, -0.00025731325149536133, -0.00020495057106018066, -0.000152587890625, -0.00010022521018981934, -4.786252975463867e-05, 4.500150680541992e-06, 5.6862831115722656e-05, 0.00010922551155090332, 0.00016158819198608398, 0.00021395087242126465, 0.0002663135528564453, 0.000318676233291626, 0.00037103891372680664, 0.0004234015941619873, 0.00047576427459716797, 0.0005281269550323486, 0.0005804896354675293, 0.00063285231590271, 0.0006852149963378906, 0.0007375776767730713, 0.000789940357208252, 0.0008423030376434326, 0.0008946657180786133, 0.0009470283985137939, 0.0009993910789489746, 0.0010517537593841553, 0.001104116439819336, 0.0011564791202545166, 0.0012088418006896973, 0.001261204481124878, 0.0013135671615600586, 0.0013659298419952393, 0.00141829252243042, 0.0014706552028656006, 0.0015230178833007812]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 10.0, 8.0, 13.0, 19.0, 23.0, 27.0, 44.0, 62.0, 56.0, 85.0, 108.0, 109.0, 126.0, 70.0, 68.0, 38.0, 33.0, 26.0, 9.0, 19.0, 11.0, 3.0, 5.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.31043529510498, -10.895340919494629, -10.480246543884277, -10.065152168273926, -9.650057792663574, -9.234963417053223, -8.819868087768555, -8.404773712158203, -7.98967981338501, -7.574585437774658, -7.159491062164307, -6.744396209716797, -6.329301834106445, -5.914207458496094, -5.499113082885742, -5.084018707275391, -4.668924331665039, -4.2538299560546875, -3.838735580444336, -3.4236409664154053, -3.0085465908050537, -2.593452215194702, -2.1783576011657715, -1.76326322555542, -1.3481688499450684, -0.933074414730072, -0.5179799795150757, -0.10288548469543457, 0.312208890914917, 0.7273032665252686, 1.1423978805541992, 1.5574922561645508, 1.9725866317749023, 2.387681007385254, 2.8027753829956055, 3.217869997024536, 3.6329643726348877, 4.04805850982666, 4.46315336227417, 4.8782477378845215, 5.293342113494873, 5.708436489105225, 6.123530864715576, 6.538625717163086, 6.9537200927734375, 7.368814468383789, 7.783908843994141, 8.199003219604492, 8.614097595214844, 9.029191970825195, 9.444286346435547, 9.859380722045898, 10.27447509765625, 10.689569473266602, 11.104663848876953, 11.519758224487305, 11.934852600097656, 12.349946975708008, 12.76504135131836, 13.180135726928711, 13.595230102539062, 14.010324478149414, 14.425418853759766, 14.840513229370117, 15.255608558654785]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 15.0, 5.0, 12.0, 17.0, 13.0, 20.0, 18.0, 23.0, 17.0, 24.0, 30.0, 30.0, 26.0, 24.0, 32.0, 27.0, 35.0, 44.0, 40.0, 27.0, 41.0, 42.0, 39.0, 27.0, 38.0, 36.0, 30.0, 29.0, 19.0, 22.0, 28.0, 26.0, 18.0, 18.0, 14.0, 11.0, 13.0, 16.0, 9.0, 7.0, 12.0, 7.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.478738784790039, -7.213583469390869, -6.948428630828857, -6.6832733154296875, -6.418118476867676, -6.152963161468506, -5.887807846069336, -5.622653007507324, -5.3574981689453125, -5.092342853546143, -4.827188014984131, -4.562032699584961, -4.296877861022949, -4.031722545623779, -3.7665674686431885, -3.5014123916625977, -3.2362570762634277, -2.971101999282837, -2.705946922302246, -2.440791606903076, -2.1756367683410645, -1.910481572151184, -1.6453263759613037, -1.380171298980713, -1.115016222000122, -0.8498611450195312, -0.5847060084342957, -0.31955087184906006, -0.05439579486846924, 0.21075928211212158, 0.47591447830200195, 0.7410695552825928, 1.0062246322631836, 1.2713797092437744, 1.5365347862243652, 1.8016899824142456, 2.066844940185547, 2.332000255584717, 2.5971553325653076, 2.8623104095458984, 3.1274654865264893, 3.39262056350708, 3.657775640487671, 3.9229307174682617, 4.188086032867432, 4.453240871429443, 4.718396186828613, 4.983551025390625, 5.248706340789795, 5.513861656188965, 5.779016494750977, 6.0441718101501465, 6.309326648712158, 6.574481964111328, 6.83963680267334, 7.10479211807251, 7.36994743347168, 7.63510274887085, 7.900257587432861, 8.165412902832031, 8.430567741394043, 8.695722579956055, 8.960878372192383, 9.226033210754395, 9.491188049316406]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 7.0, 13.0, 18.0, 31.0, 31.0, 73.0, 111.0, 121.0, 215.0, 309.0, 389.0, 604.0, 973.0, 1550.0, 2142.0, 3317.0, 4933.0, 7616.0, 11553.0, 17724.0, 27773.0, 43682.0, 72277.0, 120059.0, 181560.0, 192688.0, 137262.0, 82464.0, 49832.0, 30850.0, 20185.0, 13061.0, 8597.0, 5551.0, 3643.0, 2405.0, 1584.0, 1139.0, 733.0, 469.0, 345.0, 219.0, 150.0, 105.0, 70.0, 41.0, 25.0, 26.0, 13.0, 7.0, 9.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.8203125, -13.4031982421875, -12.986083984375, -12.5689697265625, -12.15185546875, -11.7347412109375, -11.317626953125, -10.9005126953125, -10.4833984375, -10.0662841796875, -9.649169921875, -9.2320556640625, -8.81494140625, -8.3978271484375, -7.980712890625, -7.5635986328125, -7.146484375, -6.7293701171875, -6.312255859375, -5.8951416015625, -5.47802734375, -5.0609130859375, -4.643798828125, -4.2266845703125, -3.8095703125, -3.3924560546875, -2.975341796875, -2.5582275390625, -2.14111328125, -1.7239990234375, -1.306884765625, -0.8897705078125, -0.47265625, -0.0555419921875, 0.361572265625, 0.7786865234375, 1.19580078125, 1.6129150390625, 2.030029296875, 2.4471435546875, 2.8642578125, 3.2813720703125, 3.698486328125, 4.1156005859375, 4.53271484375, 4.9498291015625, 5.366943359375, 5.7840576171875, 6.201171875, 6.6182861328125, 7.035400390625, 7.4525146484375, 7.86962890625, 8.2867431640625, 8.703857421875, 9.1209716796875, 9.5380859375, 9.9552001953125, 10.372314453125, 10.7894287109375, 11.20654296875, 11.6236572265625, 12.040771484375, 12.4578857421875, 12.875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 8.0, 9.0, 15.0, 11.0, 18.0, 15.0, 22.0, 23.0, 20.0, 28.0, 32.0, 23.0, 25.0, 30.0, 30.0, 33.0, 37.0, 44.0, 36.0, 33.0, 39.0, 57.0, 26.0, 33.0, 27.0, 32.0, 29.0, 26.0, 29.0, 17.0, 23.0, 22.0, 21.0, 13.0, 11.0, 12.0, 9.0, 14.0, 15.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.003662109375, -6.75732421875, -6.510986328125, -6.2646484375, -6.018310546875, -5.77197265625, -5.525634765625, -5.279296875, -5.032958984375, -4.78662109375, -4.540283203125, -4.2939453125, -4.047607421875, -3.80126953125, -3.554931640625, -3.30859375, -3.062255859375, -2.81591796875, -2.569580078125, -2.3232421875, -2.076904296875, -1.83056640625, -1.584228515625, -1.337890625, -1.091552734375, -0.84521484375, -0.598876953125, -0.3525390625, -0.106201171875, 0.14013671875, 0.386474609375, 0.6328125, 0.879150390625, 1.12548828125, 1.371826171875, 1.6181640625, 1.864501953125, 2.11083984375, 2.357177734375, 2.603515625, 2.849853515625, 3.09619140625, 3.342529296875, 3.5888671875, 3.835205078125, 4.08154296875, 4.327880859375, 4.57421875, 4.820556640625, 5.06689453125, 5.313232421875, 5.5595703125, 5.805908203125, 6.05224609375, 6.298583984375, 6.544921875, 6.791259765625, 7.03759765625, 7.283935546875, 7.5302734375, 7.776611328125, 8.02294921875, 8.269287109375, 8.515625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 8.0, 10.0, 13.0, 14.0, 31.0, 41.0, 62.0, 72.0, 150.0, 186.0, 276.0, 393.0, 564.0, 792.0, 1113.0, 1612.0, 2266.0, 3427.0, 4934.0, 7396.0, 10911.0, 16176.0, 24905.0, 39033.0, 62930.0, 102154.0, 154426.0, 183749.0, 153553.0, 100754.0, 62413.0, 39006.0, 25041.0, 16355.0, 10778.0, 7120.0, 4893.0, 3447.0, 2306.0, 1601.0, 1111.0, 758.0, 541.0, 409.0, 246.0, 184.0, 132.0, 78.0, 56.0, 61.0, 30.0, 14.0, 12.0, 12.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-12.1640625, -11.76513671875, -11.3662109375, -10.96728515625, -10.568359375, -10.16943359375, -9.7705078125, -9.37158203125, -8.97265625, -8.57373046875, -8.1748046875, -7.77587890625, -7.376953125, -6.97802734375, -6.5791015625, -6.18017578125, -5.78125, -5.38232421875, -4.9833984375, -4.58447265625, -4.185546875, -3.78662109375, -3.3876953125, -2.98876953125, -2.58984375, -2.19091796875, -1.7919921875, -1.39306640625, -0.994140625, -0.59521484375, -0.1962890625, 0.20263671875, 0.6015625, 1.00048828125, 1.3994140625, 1.79833984375, 2.197265625, 2.59619140625, 2.9951171875, 3.39404296875, 3.79296875, 4.19189453125, 4.5908203125, 4.98974609375, 5.388671875, 5.78759765625, 6.1865234375, 6.58544921875, 6.984375, 7.38330078125, 7.7822265625, 8.18115234375, 8.580078125, 8.97900390625, 9.3779296875, 9.77685546875, 10.17578125, 10.57470703125, 10.9736328125, 11.37255859375, 11.771484375, 12.17041015625, 12.5693359375, 12.96826171875, 13.3671875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 3.0, 3.0, 12.0, 10.0, 15.0, 11.0, 18.0, 21.0, 22.0, 28.0, 23.0, 40.0, 33.0, 33.0, 35.0, 32.0, 31.0, 31.0, 35.0, 46.0, 42.0, 32.0, 30.0, 29.0, 37.0, 31.0, 35.0, 41.0, 25.0, 33.0, 24.0, 22.0, 23.0, 14.0, 22.0, 15.0, 13.0, 9.0, 6.0, 7.0, 5.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0546875, -4.88336181640625, -4.7120361328125, -4.54071044921875, -4.369384765625, -4.19805908203125, -4.0267333984375, -3.85540771484375, -3.68408203125, -3.51275634765625, -3.3414306640625, -3.17010498046875, -2.998779296875, -2.82745361328125, -2.6561279296875, -2.48480224609375, -2.3134765625, -2.14215087890625, -1.9708251953125, -1.79949951171875, -1.628173828125, -1.45684814453125, -1.2855224609375, -1.11419677734375, -0.94287109375, -0.77154541015625, -0.6002197265625, -0.42889404296875, -0.257568359375, -0.08624267578125, 0.0850830078125, 0.25640869140625, 0.427734375, 0.59906005859375, 0.7703857421875, 0.94171142578125, 1.113037109375, 1.28436279296875, 1.4556884765625, 1.62701416015625, 1.79833984375, 1.96966552734375, 2.1409912109375, 2.31231689453125, 2.483642578125, 2.65496826171875, 2.8262939453125, 2.99761962890625, 3.1689453125, 3.34027099609375, 3.5115966796875, 3.68292236328125, 3.854248046875, 4.02557373046875, 4.1968994140625, 4.36822509765625, 4.53955078125, 4.71087646484375, 4.8822021484375, 5.05352783203125, 5.224853515625, 5.39617919921875, 5.5675048828125, 5.73883056640625, 5.91015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 11.0, 8.0, 24.0, 34.0, 37.0, 62.0, 79.0, 118.0, 178.0, 241.0, 393.0, 560.0, 777.0, 1093.0, 1655.0, 2376.0, 3627.0, 5454.0, 8436.0, 13504.0, 22221.0, 38520.0, 75023.0, 179769.0, 345037.0, 176758.0, 73988.0, 38067.0, 22092.0, 13415.0, 8411.0, 5334.0, 3630.0, 2405.0, 1587.0, 1114.0, 743.0, 576.0, 336.0, 254.0, 167.0, 123.0, 91.0, 73.0, 38.0, 33.0, 31.0, 8.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0], "bins": [-2.390625, -2.317047119140625, -2.24346923828125, -2.169891357421875, -2.0963134765625, -2.022735595703125, -1.94915771484375, -1.875579833984375, -1.802001953125, -1.728424072265625, -1.65484619140625, -1.581268310546875, -1.5076904296875, -1.434112548828125, -1.36053466796875, -1.286956787109375, -1.21337890625, -1.139801025390625, -1.06622314453125, -0.992645263671875, -0.9190673828125, -0.845489501953125, -0.77191162109375, -0.698333740234375, -0.624755859375, -0.551177978515625, -0.47760009765625, -0.404022216796875, -0.3304443359375, -0.256866455078125, -0.18328857421875, -0.109710693359375, -0.0361328125, 0.037445068359375, 0.11102294921875, 0.184600830078125, 0.2581787109375, 0.331756591796875, 0.40533447265625, 0.478912353515625, 0.552490234375, 0.626068115234375, 0.69964599609375, 0.773223876953125, 0.8468017578125, 0.920379638671875, 0.99395751953125, 1.067535400390625, 1.14111328125, 1.214691162109375, 1.28826904296875, 1.361846923828125, 1.4354248046875, 1.509002685546875, 1.58258056640625, 1.656158447265625, 1.729736328125, 1.803314208984375, 1.87689208984375, 1.950469970703125, 2.0240478515625, 2.097625732421875, 2.17120361328125, 2.244781494140625, 2.318359375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 6.0, 4.0, 13.0, 13.0, 25.0, 32.0, 39.0, 49.0, 56.0, 68.0, 89.0, 89.0, 99.0, 86.0, 82.0, 69.0, 47.0, 36.0, 24.0, 14.0, 11.0, 13.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001462697982788086, -0.0001416672021150589, -0.0001370646059513092, -0.0001324620097875595, -0.00012785941362380981, -0.00012325681746006012, -0.00011865422129631042, -0.00011405162513256073, -0.00010944902896881104, -0.00010484643280506134, -0.00010024383664131165, -9.564124047756195e-05, -9.103864431381226e-05, -8.643604815006256e-05, -8.183345198631287e-05, -7.723085582256317e-05, -7.262825965881348e-05, -6.802566349506378e-05, -6.342306733131409e-05, -5.882047116756439e-05, -5.42178750038147e-05, -4.9615278840065e-05, -4.501268267631531e-05, -4.041008651256561e-05, -3.580749034881592e-05, -3.120489418506622e-05, -2.660229802131653e-05, -2.1999701857566833e-05, -1.739710569381714e-05, -1.2794509530067444e-05, -8.191913366317749e-06, -3.589317202568054e-06, 1.0132789611816406e-06, 5.6158751249313354e-06, 1.021847128868103e-05, 1.4821067452430725e-05, 1.942366361618042e-05, 2.4026259779930115e-05, 2.862885594367981e-05, 3.3231452107429504e-05, 3.78340482711792e-05, 4.2436644434928894e-05, 4.703924059867859e-05, 5.1641836762428284e-05, 5.624443292617798e-05, 6.084702908992767e-05, 6.544962525367737e-05, 7.005222141742706e-05, 7.465481758117676e-05, 7.925741374492645e-05, 8.386000990867615e-05, 8.846260607242584e-05, 9.306520223617554e-05, 9.766779839992523e-05, 0.00010227039456367493, 0.00010687299072742462, 0.00011147558689117432, 0.00011607818305492401, 0.0001206807792186737, 0.0001252833753824234, 0.0001298859715461731, 0.0001344885677099228, 0.00013909116387367249, 0.00014369376003742218, 0.00014829635620117188]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 6.0, 10.0, 8.0, 21.0, 18.0, 30.0, 63.0, 90.0, 148.0, 210.0, 337.0, 471.0, 725.0, 1164.0, 1843.0, 2889.0, 4680.0, 7487.0, 12278.0, 20806.0, 37254.0, 72422.0, 180496.0, 373789.0, 172736.0, 70237.0, 36189.0, 20327.0, 12123.0, 7253.0, 4504.0, 2851.0, 1843.0, 1151.0, 721.0, 475.0, 311.0, 200.0, 148.0, 81.0, 57.0, 37.0, 33.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.283111572265625, -2.20294189453125, -2.122772216796875, -2.0426025390625, -1.962432861328125, -1.88226318359375, -1.802093505859375, -1.721923828125, -1.641754150390625, -1.56158447265625, -1.481414794921875, -1.4012451171875, -1.321075439453125, -1.24090576171875, -1.160736083984375, -1.08056640625, -1.000396728515625, -0.92022705078125, -0.840057373046875, -0.7598876953125, -0.679718017578125, -0.59954833984375, -0.519378662109375, -0.439208984375, -0.359039306640625, -0.27886962890625, -0.198699951171875, -0.1185302734375, -0.038360595703125, 0.04180908203125, 0.121978759765625, 0.2021484375, 0.282318115234375, 0.36248779296875, 0.442657470703125, 0.5228271484375, 0.602996826171875, 0.68316650390625, 0.763336181640625, 0.843505859375, 0.923675537109375, 1.00384521484375, 1.084014892578125, 1.1641845703125, 1.244354248046875, 1.32452392578125, 1.404693603515625, 1.48486328125, 1.565032958984375, 1.64520263671875, 1.725372314453125, 1.8055419921875, 1.885711669921875, 1.96588134765625, 2.046051025390625, 2.126220703125, 2.206390380859375, 2.28656005859375, 2.366729736328125, 2.4468994140625, 2.527069091796875, 2.60723876953125, 2.687408447265625, 2.767578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 6.0, 12.0, 9.0, 15.0, 22.0, 18.0, 18.0, 18.0, 26.0, 29.0, 29.0, 36.0, 35.0, 49.0, 47.0, 68.0, 57.0, 66.0, 40.0, 52.0, 40.0, 32.0, 33.0, 23.0, 24.0, 21.0, 26.0, 12.0, 19.0, 19.0, 11.0, 10.0, 7.0, 10.0, 5.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7470703125, -0.7220687866210938, -0.6970672607421875, -0.6720657348632812, -0.647064208984375, -0.6220626831054688, -0.5970611572265625, -0.5720596313476562, -0.54705810546875, -0.5220565795898438, -0.4970550537109375, -0.47205352783203125, -0.447052001953125, -0.42205047607421875, -0.3970489501953125, -0.37204742431640625, -0.3470458984375, -0.32204437255859375, -0.2970428466796875, -0.27204132080078125, -0.247039794921875, -0.22203826904296875, -0.1970367431640625, -0.17203521728515625, -0.14703369140625, -0.12203216552734375, -0.0970306396484375, -0.07202911376953125, -0.047027587890625, -0.02202606201171875, 0.0029754638671875, 0.02797698974609375, 0.052978515625, 0.07798004150390625, 0.1029815673828125, 0.12798309326171875, 0.152984619140625, 0.17798614501953125, 0.2029876708984375, 0.22798919677734375, 0.25299072265625, 0.27799224853515625, 0.3029937744140625, 0.32799530029296875, 0.352996826171875, 0.37799835205078125, 0.4029998779296875, 0.42800140380859375, 0.4530029296875, 0.47800445556640625, 0.5030059814453125, 0.5280075073242188, 0.553009033203125, 0.5780105590820312, 0.6030120849609375, 0.6280136108398438, 0.65301513671875, 0.6780166625976562, 0.7030181884765625, 0.7280197143554688, 0.753021240234375, 0.7780227661132812, 0.8030242919921875, 0.8280258178710938, 0.85302734375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 13.0, 15.0, 15.0, 22.0, 24.0, 52.0, 55.0, 57.0, 71.0, 102.0, 95.0, 94.0, 76.0, 64.0, 67.0, 33.0, 26.0, 13.0, 14.0, 19.0, 15.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.596051216125488, -11.226978302001953, -10.857905387878418, -10.488832473754883, -10.119759559631348, -9.750686645507812, -9.381612777709961, -9.012540817260742, -8.64346694946289, -8.274394035339355, -7.90532112121582, -7.536248207092285, -7.16717529296875, -6.798102378845215, -6.4290289878845215, -6.059956073760986, -5.690883636474609, -5.321810722351074, -4.952737808227539, -4.583664894104004, -4.214591979980469, -3.8455188274383545, -3.4764456748962402, -3.107372760772705, -2.73829984664917, -2.3692269325256348, -2.0001540184020996, -1.6310808658599854, -1.2620079517364502, -0.892935037612915, -0.5238618850708008, -0.15478897094726562, 0.21428394317626953, 0.5833569169044495, 0.9524298906326294, 1.321502923965454, 1.6905758380889893, 2.0596487522125244, 2.4287219047546387, 2.797794818878174, 3.166867733001709, 3.535940647125244, 3.9050135612487793, 4.274086952209473, 4.643159866333008, 5.012232780456543, 5.381305694580078, 5.750378608703613, 6.119451522827148, 6.488524436950684, 6.857597351074219, 7.226670265197754, 7.595743179321289, 7.964816093444824, 8.33388900756836, 8.702962875366211, 9.07203483581543, 9.441107749938965, 9.8101806640625, 10.179253578186035, 10.54832649230957, 10.917399406433105, 11.28647232055664, 11.655546188354492, 12.024619102478027]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 10.0, 15.0, 9.0, 14.0, 13.0, 21.0, 28.0, 12.0, 24.0, 23.0, 39.0, 30.0, 19.0, 35.0, 23.0, 43.0, 34.0, 37.0, 27.0, 36.0, 39.0, 36.0, 34.0, 44.0, 27.0, 30.0, 35.0, 30.0, 28.0, 19.0, 24.0, 21.0, 16.0, 15.0, 15.0, 14.0, 13.0, 13.0, 7.0, 10.0, 10.0, 7.0, 7.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-8.964853286743164, -8.684450149536133, -8.404046058654785, -8.123642921447754, -7.8432393074035645, -7.562835693359375, -7.282432556152344, -7.002028942108154, -6.721625328063965, -6.441221714019775, -6.160818099975586, -5.880414962768555, -5.600011348724365, -5.319607734680176, -5.0392045974731445, -4.758800983428955, -4.478397369384766, -4.197993755340576, -3.917590379714966, -3.6371870040893555, -3.356783390045166, -3.0763797760009766, -2.795976400375366, -2.515573024749756, -2.2351694107055664, -1.9547659158706665, -1.6743624210357666, -1.3939589262008667, -1.1135554313659668, -0.8331519365310669, -0.552748441696167, -0.2723449468612671, 0.008059501647949219, 0.2884629964828491, 0.568866491317749, 0.8492699861526489, 1.1296734809875488, 1.4100769758224487, 1.6904804706573486, 1.9708839654922485, 2.2512874603271484, 2.531691074371338, 2.8120944499969482, 3.0924978256225586, 3.372901439666748, 3.6533050537109375, 3.933708429336548, 4.214111804962158, 4.494515419006348, 4.774919033050537, 5.055322647094727, 5.335725784301758, 5.616129398345947, 5.896533012390137, 6.176936149597168, 6.457339763641357, 6.737743377685547, 7.018146991729736, 7.298550605773926, 7.578953742980957, 7.8593573570251465, 8.139760971069336, 8.420164108276367, 8.700568199157715, 8.980971336364746]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 8.0, 3.0, 6.0, 12.0, 15.0, 22.0, 33.0, 58.0, 84.0, 131.0, 198.0, 302.0, 481.0, 754.0, 1206.0, 1840.0, 3016.0, 4772.0, 8045.0, 13670.0, 23166.0, 40807.0, 74264.0, 144261.0, 370187.0, 1294138.0, 1444623.0, 424597.0, 157189.0, 78948.0, 43541.0, 24661.0, 14919.0, 9138.0, 5591.0, 3463.0, 2204.0, 1421.0, 871.0, 602.0, 365.0, 224.0, 164.0, 109.0, 73.0, 35.0, 23.0, 21.0, 9.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.3671875, -13.9190673828125, -13.470947265625, -13.0228271484375, -12.57470703125, -12.1265869140625, -11.678466796875, -11.2303466796875, -10.7822265625, -10.3341064453125, -9.885986328125, -9.4378662109375, -8.98974609375, -8.5416259765625, -8.093505859375, -7.6453857421875, -7.197265625, -6.7491455078125, -6.301025390625, -5.8529052734375, -5.40478515625, -4.9566650390625, -4.508544921875, -4.0604248046875, -3.6123046875, -3.1641845703125, -2.716064453125, -2.2679443359375, -1.81982421875, -1.3717041015625, -0.923583984375, -0.4754638671875, -0.02734375, 0.4207763671875, 0.868896484375, 1.3170166015625, 1.76513671875, 2.2132568359375, 2.661376953125, 3.1094970703125, 3.5576171875, 4.0057373046875, 4.453857421875, 4.9019775390625, 5.35009765625, 5.7982177734375, 6.246337890625, 6.6944580078125, 7.142578125, 7.5906982421875, 8.038818359375, 8.4869384765625, 8.93505859375, 9.3831787109375, 9.831298828125, 10.2794189453125, 10.7275390625, 11.1756591796875, 11.623779296875, 12.0718994140625, 12.52001953125, 12.9681396484375, 13.416259765625, 13.8643798828125, 14.3125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 12.0, 6.0, 9.0, 20.0, 11.0, 21.0, 21.0, 18.0, 13.0, 37.0, 31.0, 25.0, 29.0, 26.0, 38.0, 23.0, 39.0, 29.0, 36.0, 29.0, 34.0, 44.0, 42.0, 26.0, 51.0, 23.0, 31.0, 31.0, 33.0, 17.0, 19.0, 27.0, 15.0, 19.0, 18.0, 12.0, 17.0, 11.0, 8.0, 7.0, 7.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0], "bins": [-7.71875, -7.4786376953125, -7.238525390625, -6.9984130859375, -6.75830078125, -6.5181884765625, -6.278076171875, -6.0379638671875, -5.7978515625, -5.5577392578125, -5.317626953125, -5.0775146484375, -4.83740234375, -4.5972900390625, -4.357177734375, -4.1170654296875, -3.876953125, -3.6368408203125, -3.396728515625, -3.1566162109375, -2.91650390625, -2.6763916015625, -2.436279296875, -2.1961669921875, -1.9560546875, -1.7159423828125, -1.475830078125, -1.2357177734375, -0.99560546875, -0.7554931640625, -0.515380859375, -0.2752685546875, -0.03515625, 0.2049560546875, 0.445068359375, 0.6851806640625, 0.92529296875, 1.1654052734375, 1.405517578125, 1.6456298828125, 1.8857421875, 2.1258544921875, 2.365966796875, 2.6060791015625, 2.84619140625, 3.0863037109375, 3.326416015625, 3.5665283203125, 3.806640625, 4.0467529296875, 4.286865234375, 4.5269775390625, 4.76708984375, 5.0072021484375, 5.247314453125, 5.4874267578125, 5.7275390625, 5.9676513671875, 6.207763671875, 6.4478759765625, 6.68798828125, 6.9281005859375, 7.168212890625, 7.4083251953125, 7.6484375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 7.0, 4.0, 7.0, 6.0, 17.0, 21.0, 36.0, 58.0, 101.0, 137.0, 182.0, 267.0, 367.0, 589.0, 879.0, 1368.0, 2100.0, 3083.0, 4909.0, 7687.0, 12683.0, 21119.0, 36629.0, 65403.0, 123452.0, 251746.0, 580747.0, 1390691.0, 930027.0, 375822.0, 174720.0, 89252.0, 48559.0, 27952.0, 16354.0, 9798.0, 6113.0, 3903.0, 2497.0, 1667.0, 1139.0, 691.0, 459.0, 359.0, 230.0, 153.0, 93.0, 69.0, 51.0, 35.0, 17.0, 12.0, 9.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.53125, -11.15625, -10.78125, -10.40625, -10.03125, -9.65625, -9.28125, -8.90625, -8.53125, -8.15625, -7.78125, -7.40625, -7.03125, -6.65625, -6.28125, -5.90625, -5.53125, -5.15625, -4.78125, -4.40625, -4.03125, -3.65625, -3.28125, -2.90625, -2.53125, -2.15625, -1.78125, -1.40625, -1.03125, -0.65625, -0.28125, 0.09375, 0.46875, 0.84375, 1.21875, 1.59375, 1.96875, 2.34375, 2.71875, 3.09375, 3.46875, 3.84375, 4.21875, 4.59375, 4.96875, 5.34375, 5.71875, 6.09375, 6.46875, 6.84375, 7.21875, 7.59375, 7.96875, 8.34375, 8.71875, 9.09375, 9.46875, 9.84375, 10.21875, 10.59375, 10.96875, 11.34375, 11.71875, 12.09375, 12.46875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 10.0, 11.0, 11.0, 19.0, 21.0, 33.0, 35.0, 50.0, 50.0, 92.0, 92.0, 121.0, 139.0, 170.0, 205.0, 280.0, 308.0, 421.0, 379.0, 322.0, 259.0, 207.0, 156.0, 132.0, 122.0, 80.0, 70.0, 56.0, 49.0, 40.0, 24.0, 17.0, 15.0, 14.0, 10.0, 13.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.953125, -4.7923583984375, -4.631591796875, -4.4708251953125, -4.31005859375, -4.1492919921875, -3.988525390625, -3.8277587890625, -3.6669921875, -3.5062255859375, -3.345458984375, -3.1846923828125, -3.02392578125, -2.8631591796875, -2.702392578125, -2.5416259765625, -2.380859375, -2.2200927734375, -2.059326171875, -1.8985595703125, -1.73779296875, -1.5770263671875, -1.416259765625, -1.2554931640625, -1.0947265625, -0.9339599609375, -0.773193359375, -0.6124267578125, -0.45166015625, -0.2908935546875, -0.130126953125, 0.0306396484375, 0.19140625, 0.3521728515625, 0.512939453125, 0.6737060546875, 0.83447265625, 0.9952392578125, 1.156005859375, 1.3167724609375, 1.4775390625, 1.6383056640625, 1.799072265625, 1.9598388671875, 2.12060546875, 2.2813720703125, 2.442138671875, 2.6029052734375, 2.763671875, 2.9244384765625, 3.085205078125, 3.2459716796875, 3.40673828125, 3.5675048828125, 3.728271484375, 3.8890380859375, 4.0498046875, 4.2105712890625, 4.371337890625, 4.5321044921875, 4.69287109375, 4.8536376953125, 5.014404296875, 5.1751708984375, 5.3359375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 4.0, 11.0, 7.0, 10.0, 11.0, 16.0, 17.0, 31.0, 42.0, 44.0, 54.0, 92.0, 91.0, 102.0, 98.0, 82.0, 74.0, 46.0, 43.0, 32.0, 20.0, 16.0, 17.0, 5.0, 12.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-14.486303329467773, -14.111387252807617, -13.736471176147461, -13.361555099487305, -12.986639022827148, -12.611722946166992, -12.236806869506836, -11.86189079284668, -11.486974716186523, -11.112058639526367, -10.737142562866211, -10.362226486206055, -9.987310409545898, -9.612394332885742, -9.237478256225586, -8.86256217956543, -8.487646102905273, -8.112730026245117, -7.737813949584961, -7.362897872924805, -6.987981796264648, -6.613065719604492, -6.238149642944336, -5.86323356628418, -5.488317489624023, -5.113401412963867, -4.738485336303711, -4.363569259643555, -3.9886531829833984, -3.613737106323242, -3.238821029663086, -2.8639049530029297, -2.4889888763427734, -2.114072799682617, -1.739156723022461, -1.3642406463623047, -0.9893245697021484, -0.6144084930419922, -0.23949241638183594, 0.1354236602783203, 0.5103397369384766, 0.8852558135986328, 1.260171890258789, 1.6350879669189453, 2.0100040435791016, 2.384920120239258, 2.759836196899414, 3.1347522735595703, 3.5096683502197266, 3.884584426879883, 4.259500503540039, 4.634416580200195, 5.009332656860352, 5.384248733520508, 5.759164810180664, 6.13408088684082, 6.508996963500977, 6.883913040161133, 7.258829116821289, 7.633745193481445, 8.008661270141602, 8.383577346801758, 8.758493423461914, 9.13340950012207, 9.508325576782227]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 11.0, 6.0, 13.0, 13.0, 13.0, 25.0, 17.0, 22.0, 28.0, 25.0, 28.0, 39.0, 41.0, 32.0, 41.0, 29.0, 37.0, 33.0, 34.0, 52.0, 49.0, 36.0, 43.0, 39.0, 31.0, 36.0, 24.0, 29.0, 22.0, 21.0, 18.0, 15.0, 15.0, 11.0, 14.0, 12.0, 11.0, 5.0, 9.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.81031322479248, -9.497172355651855, -9.18403148651123, -8.870890617370605, -8.55774974822998, -8.244608879089355, -7.931467533111572, -7.618326663970947, -7.305185794830322, -6.992044925689697, -6.678904056549072, -6.365763187408447, -6.052621841430664, -5.739480972290039, -5.426340103149414, -5.113199234008789, -4.800058364868164, -4.486917495727539, -4.173776626586914, -3.86063551902771, -3.547494649887085, -3.23435378074646, -2.921212673187256, -2.608071804046631, -2.294930934906006, -1.9817900657653809, -1.6686490774154663, -1.3555080890655518, -1.0423672199249268, -0.7292263507843018, -0.4160853624343872, -0.10294437408447266, 0.21019554138183594, 0.5233364701271057, 0.8364773988723755, 1.14961838722229, 1.462759256362915, 1.77590012550354, 2.089041233062744, 2.402182102203369, 2.715322971343994, 3.028463840484619, 3.341604709625244, 3.6547458171844482, 3.9678866863250732, 4.281027793884277, 4.594168663024902, 4.907309532165527, 5.220450401306152, 5.533591270446777, 5.846732139587402, 6.159873008728027, 6.473013877868652, 6.786154747009277, 7.0992960929870605, 7.4124369621276855, 7.7255778312683105, 8.038719177246094, 8.351860046386719, 8.665000915527344, 8.978141784667969, 9.291282653808594, 9.604423522949219, 9.917564392089844, 10.230705261230469]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 7.0, 24.0, 29.0, 41.0, 59.0, 87.0, 128.0, 187.0, 266.0, 430.0, 532.0, 899.0, 1302.0, 1886.0, 2762.0, 3984.0, 5561.0, 8194.0, 11694.0, 18079.0, 27407.0, 42041.0, 66646.0, 110736.0, 278772.0, 198116.0, 96664.0, 59366.0, 37648.0, 24425.0, 16018.0, 10545.0, 7385.0, 5080.0, 3501.0, 2585.0, 1738.0, 1186.0, 812.0, 541.0, 377.0, 267.0, 175.0, 132.0, 69.0, 63.0, 33.0, 25.0, 11.0, 15.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.412109375, -2.33642578125, -2.2607421875, -2.18505859375, -2.109375, -2.03369140625, -1.9580078125, -1.88232421875, -1.806640625, -1.73095703125, -1.6552734375, -1.57958984375, -1.50390625, -1.42822265625, -1.3525390625, -1.27685546875, -1.201171875, -1.12548828125, -1.0498046875, -0.97412109375, -0.8984375, -0.82275390625, -0.7470703125, -0.67138671875, -0.595703125, -0.52001953125, -0.4443359375, -0.36865234375, -0.29296875, -0.21728515625, -0.1416015625, -0.06591796875, 0.009765625, 0.08544921875, 0.1611328125, 0.23681640625, 0.3125, 0.38818359375, 0.4638671875, 0.53955078125, 0.615234375, 0.69091796875, 0.7666015625, 0.84228515625, 0.91796875, 0.99365234375, 1.0693359375, 1.14501953125, 1.220703125, 1.29638671875, 1.3720703125, 1.44775390625, 1.5234375, 1.59912109375, 1.6748046875, 1.75048828125, 1.826171875, 1.90185546875, 1.9775390625, 2.05322265625, 2.12890625, 2.20458984375, 2.2802734375, 2.35595703125, 2.431640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 8.0, 17.0, 11.0, 10.0, 20.0, 22.0, 20.0, 21.0, 26.0, 30.0, 33.0, 46.0, 31.0, 37.0, 29.0, 30.0, 32.0, 51.0, 32.0, 49.0, 50.0, 29.0, 45.0, 30.0, 35.0, 34.0, 26.0, 23.0, 16.0, 17.0, 23.0, 16.0, 13.0, 13.0, 11.0, 9.0, 13.0, 11.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.9375, -9.628662109375, -9.31982421875, -9.010986328125, -8.7021484375, -8.393310546875, -8.08447265625, -7.775634765625, -7.466796875, -7.157958984375, -6.84912109375, -6.540283203125, -6.2314453125, -5.922607421875, -5.61376953125, -5.304931640625, -4.99609375, -4.687255859375, -4.37841796875, -4.069580078125, -3.7607421875, -3.451904296875, -3.14306640625, -2.834228515625, -2.525390625, -2.216552734375, -1.90771484375, -1.598876953125, -1.2900390625, -0.981201171875, -0.67236328125, -0.363525390625, -0.0546875, 0.254150390625, 0.56298828125, 0.871826171875, 1.1806640625, 1.489501953125, 1.79833984375, 2.107177734375, 2.416015625, 2.724853515625, 3.03369140625, 3.342529296875, 3.6513671875, 3.960205078125, 4.26904296875, 4.577880859375, 4.88671875, 5.195556640625, 5.50439453125, 5.813232421875, 6.1220703125, 6.430908203125, 6.73974609375, 7.048583984375, 7.357421875, 7.666259765625, 7.97509765625, 8.283935546875, 8.5927734375, 8.901611328125, 9.21044921875, 9.519287109375, 9.828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 16.0, 30.0, 40.0, 71.0, 105.0, 131.0, 225.0, 312.0, 479.0, 708.0, 1043.0, 1566.0, 2374.0, 3560.0, 5603.0, 8618.0, 14011.0, 21978.0, 35968.0, 59466.0, 106027.0, 255347.0, 265174.0, 107578.0, 60336.0, 36277.0, 22559.0, 13867.0, 8791.0, 5498.0, 3699.0, 2324.0, 1579.0, 1033.0, 727.0, 451.0, 338.0, 212.0, 153.0, 93.0, 58.0, 43.0, 27.0, 16.0, 9.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.984375, -2.891143798828125, -2.79791259765625, -2.704681396484375, -2.6114501953125, -2.518218994140625, -2.42498779296875, -2.331756591796875, -2.238525390625, -2.145294189453125, -2.05206298828125, -1.958831787109375, -1.8656005859375, -1.772369384765625, -1.67913818359375, -1.585906982421875, -1.49267578125, -1.399444580078125, -1.30621337890625, -1.212982177734375, -1.1197509765625, -1.026519775390625, -0.93328857421875, -0.840057373046875, -0.746826171875, -0.653594970703125, -0.56036376953125, -0.467132568359375, -0.3739013671875, -0.280670166015625, -0.18743896484375, -0.094207763671875, -0.0009765625, 0.092254638671875, 0.18548583984375, 0.278717041015625, 0.3719482421875, 0.465179443359375, 0.55841064453125, 0.651641845703125, 0.744873046875, 0.838104248046875, 0.93133544921875, 1.024566650390625, 1.1177978515625, 1.211029052734375, 1.30426025390625, 1.397491455078125, 1.49072265625, 1.583953857421875, 1.67718505859375, 1.770416259765625, 1.8636474609375, 1.956878662109375, 2.05010986328125, 2.143341064453125, 2.236572265625, 2.329803466796875, 2.42303466796875, 2.516265869140625, 2.6094970703125, 2.702728271484375, 2.79595947265625, 2.889190673828125, 2.982421875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 13.0, 15.0, 21.0, 24.0, 16.0, 29.0, 28.0, 23.0, 31.0, 44.0, 25.0, 38.0, 28.0, 35.0, 43.0, 37.0, 52.0, 44.0, 31.0, 41.0, 41.0, 46.0, 40.0, 26.0, 29.0, 25.0, 22.0, 22.0, 18.0, 10.0, 17.0, 17.0, 9.0, 5.0, 10.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.46484375, -7.2518310546875, -7.038818359375, -6.8258056640625, -6.61279296875, -6.3997802734375, -6.186767578125, -5.9737548828125, -5.7607421875, -5.5477294921875, -5.334716796875, -5.1217041015625, -4.90869140625, -4.6956787109375, -4.482666015625, -4.2696533203125, -4.056640625, -3.8436279296875, -3.630615234375, -3.4176025390625, -3.20458984375, -2.9915771484375, -2.778564453125, -2.5655517578125, -2.3525390625, -2.1395263671875, -1.926513671875, -1.7135009765625, -1.50048828125, -1.2874755859375, -1.074462890625, -0.8614501953125, -0.6484375, -0.4354248046875, -0.222412109375, -0.0093994140625, 0.20361328125, 0.4166259765625, 0.629638671875, 0.8426513671875, 1.0556640625, 1.2686767578125, 1.481689453125, 1.6947021484375, 1.90771484375, 2.1207275390625, 2.333740234375, 2.5467529296875, 2.759765625, 2.9727783203125, 3.185791015625, 3.3988037109375, 3.61181640625, 3.8248291015625, 4.037841796875, 4.2508544921875, 4.4638671875, 4.6768798828125, 4.889892578125, 5.1029052734375, 5.31591796875, 5.5289306640625, 5.741943359375, 5.9549560546875, 6.16796875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 8.0, 10.0, 16.0, 22.0, 25.0, 47.0, 77.0, 114.0, 154.0, 183.0, 279.0, 371.0, 580.0, 874.0, 1222.0, 1747.0, 2620.0, 3845.0, 5706.0, 8961.0, 14233.0, 23727.0, 42801.0, 84806.0, 197491.0, 330685.0, 161182.0, 71506.0, 36823.0, 21117.0, 12604.0, 8168.0, 5350.0, 3590.0, 2343.0, 1608.0, 1129.0, 757.0, 521.0, 378.0, 262.0, 180.0, 135.0, 96.0, 80.0, 41.0, 26.0, 24.0, 22.0, 11.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031414031982421875, -0.0030345022678375244, -0.0029276013374328613, -0.0028207004070281982, -0.002713799476623535, -0.002606898546218872, -0.002499997615814209, -0.002393096685409546, -0.002286195755004883, -0.0021792948246002197, -0.0020723938941955566, -0.0019654929637908936, -0.0018585920333862305, -0.0017516911029815674, -0.0016447901725769043, -0.0015378892421722412, -0.0014309883117675781, -0.001324087381362915, -0.001217186450958252, -0.0011102855205535889, -0.0010033845901489258, -0.0008964836597442627, -0.0007895827293395996, -0.0006826817989349365, -0.0005757808685302734, -0.00046887993812561035, -0.00036197900772094727, -0.0002550780773162842, -0.0001481771469116211, -4.127621650695801e-05, 6.562471389770508e-05, 0.00017252564430236816, 0.00027942657470703125, 0.00038632750511169434, 0.0004932284355163574, 0.0006001293659210205, 0.0007070302963256836, 0.0008139312267303467, 0.0009208321571350098, 0.0010277330875396729, 0.001134634017944336, 0.001241534948348999, 0.0013484358787536621, 0.0014553368091583252, 0.0015622377395629883, 0.0016691386699676514, 0.0017760396003723145, 0.0018829405307769775, 0.0019898414611816406, 0.0020967423915863037, 0.002203643321990967, 0.00231054425239563, 0.002417445182800293, 0.002524346113204956, 0.002631247043609619, 0.0027381479740142822, 0.0028450489044189453, 0.0029519498348236084, 0.0030588507652282715, 0.0031657516956329346, 0.0032726526260375977, 0.0033795535564422607, 0.003486454486846924, 0.003593355417251587, 0.00370025634765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 3.0, 7.0, 12.0, 15.0, 21.0, 24.0, 31.0, 35.0, 54.0, 46.0, 65.0, 63.0, 61.0, 35.0, 61.0, 67.0, 62.0, 58.0, 39.0, 33.0, 43.0, 29.0, 21.0, 20.0, 12.0, 12.0, 5.0, 10.0, 6.0, 1.0, 4.0, 11.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9802322387695312e-06, -2.8656795620918274e-06, -2.7511268854141235e-06, -2.6365742087364197e-06, -2.522021532058716e-06, -2.407468855381012e-06, -2.292916178703308e-06, -2.1783635020256042e-06, -2.0638108253479004e-06, -1.9492581486701965e-06, -1.8347054719924927e-06, -1.7201527953147888e-06, -1.605600118637085e-06, -1.491047441959381e-06, -1.3764947652816772e-06, -1.2619420886039734e-06, -1.1473894119262695e-06, -1.0328367352485657e-06, -9.182840585708618e-07, -8.03731381893158e-07, -6.891787052154541e-07, -5.746260285377502e-07, -4.600733518600464e-07, -3.4552067518234253e-07, -2.3096799850463867e-07, -1.1641532182693481e-07, -1.862645149230957e-09, 1.126900315284729e-07, 2.2724270820617676e-07, 3.417953848838806e-07, 4.5634806156158447e-07, 5.709007382392883e-07, 6.854534149169922e-07, 8.00006091594696e-07, 9.145587682723999e-07, 1.0291114449501038e-06, 1.1436641216278076e-06, 1.2582167983055115e-06, 1.3727694749832153e-06, 1.4873221516609192e-06, 1.601874828338623e-06, 1.716427505016327e-06, 1.8309801816940308e-06, 1.9455328583717346e-06, 2.0600855350494385e-06, 2.1746382117271423e-06, 2.289190888404846e-06, 2.40374356508255e-06, 2.518296241760254e-06, 2.6328489184379578e-06, 2.7474015951156616e-06, 2.8619542717933655e-06, 2.9765069484710693e-06, 3.091059625148773e-06, 3.205612301826477e-06, 3.320164978504181e-06, 3.4347176551818848e-06, 3.5492703318595886e-06, 3.6638230085372925e-06, 3.7783756852149963e-06, 3.8929283618927e-06, 4.007481038570404e-06, 4.122033715248108e-06, 4.236586391925812e-06, 4.351139068603516e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 8.0, 9.0, 5.0, 16.0, 18.0, 25.0, 41.0, 50.0, 61.0, 90.0, 151.0, 221.0, 268.0, 420.0, 593.0, 964.0, 1418.0, 2088.0, 3218.0, 5034.0, 8026.0, 13271.0, 23200.0, 42571.0, 90141.0, 231554.0, 343068.0, 143662.0, 60946.0, 30917.0, 17472.0, 10444.0, 6592.0, 4019.0, 2644.0, 1792.0, 1139.0, 744.0, 541.0, 322.0, 237.0, 174.0, 124.0, 75.0, 46.0, 43.0, 31.0, 23.0, 17.0, 12.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.003772735595703125, -0.003648042678833008, -0.0035233497619628906, -0.0033986568450927734, -0.0032739639282226562, -0.003149271011352539, -0.003024578094482422, -0.0028998851776123047, -0.0027751922607421875, -0.0026504993438720703, -0.002525806427001953, -0.002401113510131836, -0.0022764205932617188, -0.0021517276763916016, -0.0020270347595214844, -0.0019023418426513672, -0.00177764892578125, -0.0016529560089111328, -0.0015282630920410156, -0.0014035701751708984, -0.0012788772583007812, -0.001154184341430664, -0.0010294914245605469, -0.0009047985076904297, -0.0007801055908203125, -0.0006554126739501953, -0.0005307197570800781, -0.00040602684020996094, -0.00028133392333984375, -0.00015664100646972656, -3.1948089599609375e-05, 9.274482727050781e-05, 0.000217437744140625, 0.0003421306610107422, 0.0004668235778808594, 0.0005915164947509766, 0.0007162094116210938, 0.0008409023284912109, 0.0009655952453613281, 0.0010902881622314453, 0.0012149810791015625, 0.0013396739959716797, 0.0014643669128417969, 0.001589059829711914, 0.0017137527465820312, 0.0018384456634521484, 0.0019631385803222656, 0.002087831497192383, 0.0022125244140625, 0.002337217330932617, 0.0024619102478027344, 0.0025866031646728516, 0.0027112960815429688, 0.002835988998413086, 0.002960681915283203, 0.0030853748321533203, 0.0032100677490234375, 0.0033347606658935547, 0.003459453582763672, 0.003584146499633789, 0.0037088394165039062, 0.0038335323333740234, 0.003958225250244141, 0.004082918167114258, 0.004207611083984375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 8.0, 6.0, 8.0, 10.0, 10.0, 13.0, 16.0, 23.0, 17.0, 17.0, 39.0, 41.0, 39.0, 60.0, 61.0, 101.0, 100.0, 71.0, 62.0, 48.0, 36.0, 29.0, 27.0, 28.0, 28.0, 20.0, 16.0, 15.0, 8.0, 10.0, 6.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017986297607421875, -0.0017487704753875732, -0.001698911190032959, -0.0016490519046783447, -0.0015991926193237305, -0.0015493333339691162, -0.001499474048614502, -0.0014496147632598877, -0.0013997554779052734, -0.0013498961925506592, -0.001300036907196045, -0.0012501776218414307, -0.0012003183364868164, -0.0011504590511322021, -0.0011005997657775879, -0.0010507404804229736, -0.0010008811950683594, -0.0009510219097137451, -0.0009011626243591309, -0.0008513033390045166, -0.0008014440536499023, -0.0007515847682952881, -0.0007017254829406738, -0.0006518661975860596, -0.0006020069122314453, -0.0005521476268768311, -0.0005022883415222168, -0.00045242905616760254, -0.0004025697708129883, -0.000352710485458374, -0.00030285120010375977, -0.0002529919147491455, -0.00020313262939453125, -0.000153273344039917, -0.00010341405868530273, -5.3554773330688477e-05, -3.6954879760742188e-06, 4.616379737854004e-05, 9.60230827331543e-05, 0.00014588236808776855, 0.0001957416534423828, 0.00024560093879699707, 0.00029546022415161133, 0.0003453195095062256, 0.00039517879486083984, 0.0004450380802154541, 0.0004948973655700684, 0.0005447566509246826, 0.0005946159362792969, 0.0006444752216339111, 0.0006943345069885254, 0.0007441937923431396, 0.0007940530776977539, 0.0008439123630523682, 0.0008937716484069824, 0.0009436309337615967, 0.000993490219116211, 0.0010433495044708252, 0.0010932087898254395, 0.0011430680751800537, 0.001192927360534668, 0.0012427866458892822, 0.0012926459312438965, 0.0013425052165985107, 0.001392364501953125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 12.0, 8.0, 7.0, 11.0, 16.0, 22.0, 31.0, 45.0, 44.0, 60.0, 86.0, 91.0, 96.0, 97.0, 84.0, 74.0, 46.0, 39.0, 28.0, 25.0, 17.0, 15.0, 10.0, 8.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-14.163093566894531, -13.796456336975098, -13.429818153381348, -13.063180923461914, -12.69654369354248, -12.329906463623047, -11.963268280029297, -11.596631050109863, -11.22999382019043, -10.863356590270996, -10.496718406677246, -10.130081176757812, -9.763443946838379, -9.396806716918945, -9.030168533325195, -8.663531303405762, -8.296894073486328, -7.930256366729736, -7.563619136810303, -7.196981430053711, -6.830344200134277, -6.4637064933776855, -6.097068786621094, -5.73043155670166, -5.36379337310791, -4.997155666351318, -4.630518436431885, -4.263880729675293, -3.8972434997558594, -3.5306057929992676, -3.163968324661255, -2.797330856323242, -2.4306936264038086, -2.064056158065796, -1.6974186897277832, -1.330781102180481, -0.9641436338424683, -0.5975061655044556, -0.23086857795715332, 0.13576889038085938, 0.5024063587188721, 0.8690438270568848, 1.2356812953948975, 1.6023188829421997, 1.9689563512802124, 2.3355937004089355, 2.7022314071655273, 3.06886887550354, 3.4355063438415527, 3.8021438121795654, 4.168781280517578, 4.53541898727417, 4.9020562171936035, 5.268693923950195, 5.635331153869629, 6.001968860626221, 6.3686065673828125, 6.735244274139404, 7.101881504058838, 7.46851921081543, 7.835156440734863, 8.201793670654297, 8.568431854248047, 8.93506908416748, 9.301706314086914]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 5.0, 12.0, 14.0, 11.0, 27.0, 17.0, 22.0, 27.0, 26.0, 26.0, 41.0, 38.0, 35.0, 40.0, 30.0, 35.0, 34.0, 34.0, 54.0, 48.0, 35.0, 39.0, 42.0, 32.0, 35.0, 26.0, 28.0, 23.0, 20.0, 18.0, 16.0, 14.0, 11.0, 13.0, 13.0, 10.0, 7.0, 9.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.817947387695312, -9.506502151489258, -9.195056915283203, -8.883612632751465, -8.57216739654541, -8.260722160339355, -7.949277400970459, -7.6378326416015625, -7.326387405395508, -7.014942169189453, -6.703497409820557, -6.39205265045166, -6.0806074142456055, -5.769162178039551, -5.457717418670654, -5.146272659301758, -4.834827423095703, -4.523382186889648, -4.211937427520752, -3.9004924297332764, -3.589047431945801, -3.277602434158325, -2.9661574363708496, -2.654712438583374, -2.3432674407958984, -2.031822443008423, -1.7203774452209473, -1.4089324474334717, -1.097487449645996, -0.7860424518585205, -0.4745974540710449, -0.16315245628356934, 0.14829254150390625, 0.45973753929138184, 0.7711825370788574, 1.082627534866333, 1.3940725326538086, 1.7055175304412842, 2.0169625282287598, 2.3284075260162354, 2.639852523803711, 2.9512975215911865, 3.262742519378662, 3.5741875171661377, 3.8856325149536133, 4.197077751159668, 4.5085225105285645, 4.819967269897461, 5.131412506103516, 5.44285774230957, 5.754302501678467, 6.065747261047363, 6.377192497253418, 6.688637733459473, 7.000082492828369, 7.311527252197266, 7.62297248840332, 7.934417724609375, 8.24586296081543, 8.557307243347168, 8.868752479553223, 9.180197715759277, 9.491641998291016, 9.80308723449707, 10.114532470703125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 9.0, 13.0, 19.0, 21.0, 34.0, 55.0, 90.0, 119.0, 199.0, 280.0, 367.0, 559.0, 803.0, 1184.0, 1712.0, 2518.0, 3809.0, 5318.0, 8166.0, 12258.0, 19012.0, 30123.0, 49658.0, 84226.0, 143312.0, 203704.0, 184338.0, 116547.0, 67647.0, 40255.0, 24336.0, 15927.0, 10332.0, 6913.0, 4630.0, 3155.0, 2198.0, 1501.0, 992.0, 666.0, 457.0, 377.0, 250.0, 149.0, 97.0, 73.0, 44.0, 40.0, 27.0, 12.0, 4.0, 12.0, 6.0, 3.0, 3.0, 2.0], "bins": [-15.2265625, -14.7760009765625, -14.325439453125, -13.8748779296875, -13.42431640625, -12.9737548828125, -12.523193359375, -12.0726318359375, -11.6220703125, -11.1715087890625, -10.720947265625, -10.2703857421875, -9.81982421875, -9.3692626953125, -8.918701171875, -8.4681396484375, -8.017578125, -7.5670166015625, -7.116455078125, -6.6658935546875, -6.21533203125, -5.7647705078125, -5.314208984375, -4.8636474609375, -4.4130859375, -3.9625244140625, -3.511962890625, -3.0614013671875, -2.61083984375, -2.1602783203125, -1.709716796875, -1.2591552734375, -0.80859375, -0.3580322265625, 0.092529296875, 0.5430908203125, 0.99365234375, 1.4442138671875, 1.894775390625, 2.3453369140625, 2.7958984375, 3.2464599609375, 3.697021484375, 4.1475830078125, 4.59814453125, 5.0487060546875, 5.499267578125, 5.9498291015625, 6.400390625, 6.8509521484375, 7.301513671875, 7.7520751953125, 8.20263671875, 8.6531982421875, 9.103759765625, 9.5543212890625, 10.0048828125, 10.4554443359375, 10.906005859375, 11.3565673828125, 11.80712890625, 12.2576904296875, 12.708251953125, 13.1588134765625, 13.609375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 11.0, 11.0, 8.0, 10.0, 17.0, 18.0, 17.0, 27.0, 32.0, 18.0, 30.0, 33.0, 35.0, 42.0, 37.0, 33.0, 37.0, 28.0, 41.0, 51.0, 46.0, 40.0, 44.0, 36.0, 36.0, 32.0, 32.0, 27.0, 17.0, 19.0, 18.0, 19.0, 16.0, 8.0, 13.0, 8.0, 16.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.8828125, -9.5882568359375, -9.293701171875, -8.9991455078125, -8.70458984375, -8.4100341796875, -8.115478515625, -7.8209228515625, -7.5263671875, -7.2318115234375, -6.937255859375, -6.6427001953125, -6.34814453125, -6.0535888671875, -5.759033203125, -5.4644775390625, -5.169921875, -4.8753662109375, -4.580810546875, -4.2862548828125, -3.99169921875, -3.6971435546875, -3.402587890625, -3.1080322265625, -2.8134765625, -2.5189208984375, -2.224365234375, -1.9298095703125, -1.63525390625, -1.3406982421875, -1.046142578125, -0.7515869140625, -0.45703125, -0.1624755859375, 0.132080078125, 0.4266357421875, 0.72119140625, 1.0157470703125, 1.310302734375, 1.6048583984375, 1.8994140625, 2.1939697265625, 2.488525390625, 2.7830810546875, 3.07763671875, 3.3721923828125, 3.666748046875, 3.9613037109375, 4.255859375, 4.5504150390625, 4.844970703125, 5.1395263671875, 5.43408203125, 5.7286376953125, 6.023193359375, 6.3177490234375, 6.6123046875, 6.9068603515625, 7.201416015625, 7.4959716796875, 7.79052734375, 8.0850830078125, 8.379638671875, 8.6741943359375, 8.96875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 10.0, 15.0, 15.0, 31.0, 45.0, 62.0, 84.0, 143.0, 211.0, 334.0, 483.0, 726.0, 1127.0, 1695.0, 2453.0, 3904.0, 5954.0, 9329.0, 14490.0, 23301.0, 38337.0, 65439.0, 118635.0, 199825.0, 219724.0, 143356.0, 78745.0, 45231.0, 27645.0, 16870.0, 10653.0, 6941.0, 4402.0, 2781.0, 1874.0, 1225.0, 837.0, 527.0, 359.0, 229.0, 162.0, 107.0, 86.0, 49.0, 29.0, 24.0, 20.0, 13.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.75, -15.26025390625, -14.7705078125, -14.28076171875, -13.791015625, -13.30126953125, -12.8115234375, -12.32177734375, -11.83203125, -11.34228515625, -10.8525390625, -10.36279296875, -9.873046875, -9.38330078125, -8.8935546875, -8.40380859375, -7.9140625, -7.42431640625, -6.9345703125, -6.44482421875, -5.955078125, -5.46533203125, -4.9755859375, -4.48583984375, -3.99609375, -3.50634765625, -3.0166015625, -2.52685546875, -2.037109375, -1.54736328125, -1.0576171875, -0.56787109375, -0.078125, 0.41162109375, 0.9013671875, 1.39111328125, 1.880859375, 2.37060546875, 2.8603515625, 3.35009765625, 3.83984375, 4.32958984375, 4.8193359375, 5.30908203125, 5.798828125, 6.28857421875, 6.7783203125, 7.26806640625, 7.7578125, 8.24755859375, 8.7373046875, 9.22705078125, 9.716796875, 10.20654296875, 10.6962890625, 11.18603515625, 11.67578125, 12.16552734375, 12.6552734375, 13.14501953125, 13.634765625, 14.12451171875, 14.6142578125, 15.10400390625, 15.59375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 7.0, 7.0, 9.0, 9.0, 11.0, 21.0, 16.0, 27.0, 16.0, 26.0, 27.0, 28.0, 37.0, 31.0, 25.0, 28.0, 37.0, 34.0, 37.0, 36.0, 45.0, 41.0, 37.0, 42.0, 43.0, 37.0, 41.0, 32.0, 26.0, 30.0, 23.0, 14.0, 18.0, 19.0, 21.0, 7.0, 9.0, 10.0, 6.0, 7.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.4765625, -5.290283203125, -5.10400390625, -4.917724609375, -4.7314453125, -4.545166015625, -4.35888671875, -4.172607421875, -3.986328125, -3.800048828125, -3.61376953125, -3.427490234375, -3.2412109375, -3.054931640625, -2.86865234375, -2.682373046875, -2.49609375, -2.309814453125, -2.12353515625, -1.937255859375, -1.7509765625, -1.564697265625, -1.37841796875, -1.192138671875, -1.005859375, -0.819580078125, -0.63330078125, -0.447021484375, -0.2607421875, -0.074462890625, 0.11181640625, 0.298095703125, 0.484375, 0.670654296875, 0.85693359375, 1.043212890625, 1.2294921875, 1.415771484375, 1.60205078125, 1.788330078125, 1.974609375, 2.160888671875, 2.34716796875, 2.533447265625, 2.7197265625, 2.906005859375, 3.09228515625, 3.278564453125, 3.46484375, 3.651123046875, 3.83740234375, 4.023681640625, 4.2099609375, 4.396240234375, 4.58251953125, 4.768798828125, 4.955078125, 5.141357421875, 5.32763671875, 5.513916015625, 5.7001953125, 5.886474609375, 6.07275390625, 6.259033203125, 6.4453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 12.0, 11.0, 12.0, 26.0, 30.0, 43.0, 55.0, 85.0, 113.0, 203.0, 293.0, 439.0, 691.0, 1049.0, 1843.0, 2972.0, 5111.0, 9049.0, 17136.0, 33511.0, 70545.0, 186899.0, 393656.0, 182786.0, 69564.0, 32936.0, 17104.0, 9334.0, 5202.0, 3028.0, 1819.0, 1052.0, 651.0, 457.0, 288.0, 187.0, 128.0, 77.0, 50.0, 30.0, 21.0, 21.0, 12.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.97265625, -2.886474609375, -2.80029296875, -2.714111328125, -2.6279296875, -2.541748046875, -2.45556640625, -2.369384765625, -2.283203125, -2.197021484375, -2.11083984375, -2.024658203125, -1.9384765625, -1.852294921875, -1.76611328125, -1.679931640625, -1.59375, -1.507568359375, -1.42138671875, -1.335205078125, -1.2490234375, -1.162841796875, -1.07666015625, -0.990478515625, -0.904296875, -0.818115234375, -0.73193359375, -0.645751953125, -0.5595703125, -0.473388671875, -0.38720703125, -0.301025390625, -0.21484375, -0.128662109375, -0.04248046875, 0.043701171875, 0.1298828125, 0.216064453125, 0.30224609375, 0.388427734375, 0.474609375, 0.560791015625, 0.64697265625, 0.733154296875, 0.8193359375, 0.905517578125, 0.99169921875, 1.077880859375, 1.1640625, 1.250244140625, 1.33642578125, 1.422607421875, 1.5087890625, 1.594970703125, 1.68115234375, 1.767333984375, 1.853515625, 1.939697265625, 2.02587890625, 2.112060546875, 2.1982421875, 2.284423828125, 2.37060546875, 2.456787109375, 2.54296875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 7.0, 5.0, 6.0, 16.0, 8.0, 14.0, 18.0, 21.0, 31.0, 35.0, 51.0, 45.0, 69.0, 67.0, 77.0, 87.0, 62.0, 62.0, 66.0, 44.0, 35.0, 30.0, 42.0, 27.0, 14.0, 10.0, 11.0, 14.0, 6.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010389089584350586, -0.00010055769234895706, -9.722448885440826e-05, -9.389128535985947e-05, -9.055808186531067e-05, -8.722487837076187e-05, -8.389167487621307e-05, -8.055847138166428e-05, -7.722526788711548e-05, -7.389206439256668e-05, -7.055886089801788e-05, -6.722565740346909e-05, -6.389245390892029e-05, -6.055925041437149e-05, -5.722604691982269e-05, -5.3892843425273895e-05, -5.05596399307251e-05, -4.72264364361763e-05, -4.38932329416275e-05, -4.0560029447078705e-05, -3.722682595252991e-05, -3.389362245798111e-05, -3.056041896343231e-05, -2.7227215468883514e-05, -2.3894011974334717e-05, -2.056080847978592e-05, -1.722760498523712e-05, -1.3894401490688324e-05, -1.0561197996139526e-05, -7.227994501590729e-06, -3.894791007041931e-06, -5.615875124931335e-07, 2.771615982055664e-06, 6.104819476604462e-06, 9.43802297115326e-06, 1.2771226465702057e-05, 1.6104429960250854e-05, 1.9437633454799652e-05, 2.277083694934845e-05, 2.6104040443897247e-05, 2.9437243938446045e-05, 3.277044743299484e-05, 3.610365092754364e-05, 3.943685442209244e-05, 4.2770057916641235e-05, 4.610326141119003e-05, 4.943646490573883e-05, 5.276966840028763e-05, 5.6102871894836426e-05, 5.9436075389385223e-05, 6.276927888393402e-05, 6.610248237848282e-05, 6.943568587303162e-05, 7.276888936758041e-05, 7.610209286212921e-05, 7.943529635667801e-05, 8.27684998512268e-05, 8.61017033457756e-05, 8.94349068403244e-05, 9.27681103348732e-05, 9.6101313829422e-05, 9.94345173239708e-05, 0.00010276772081851959, 0.00010610092431306839, 0.00010943412780761719]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 3.0, 11.0, 16.0, 26.0, 46.0, 61.0, 75.0, 119.0, 170.0, 243.0, 361.0, 589.0, 908.0, 1421.0, 2164.0, 3364.0, 5267.0, 8137.0, 12689.0, 19898.0, 32825.0, 57888.0, 114932.0, 263149.0, 262781.0, 114801.0, 57927.0, 32952.0, 20056.0, 12740.0, 8155.0, 5211.0, 3346.0, 2102.0, 1397.0, 933.0, 602.0, 386.0, 271.0, 162.0, 107.0, 98.0, 47.0, 33.0, 23.0, 12.0, 16.0, 15.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.09375, -2.0283203125, -1.962890625, -1.8974609375, -1.83203125, -1.7666015625, -1.701171875, -1.6357421875, -1.5703125, -1.5048828125, -1.439453125, -1.3740234375, -1.30859375, -1.2431640625, -1.177734375, -1.1123046875, -1.046875, -0.9814453125, -0.916015625, -0.8505859375, -0.78515625, -0.7197265625, -0.654296875, -0.5888671875, -0.5234375, -0.4580078125, -0.392578125, -0.3271484375, -0.26171875, -0.1962890625, -0.130859375, -0.0654296875, 0.0, 0.0654296875, 0.130859375, 0.1962890625, 0.26171875, 0.3271484375, 0.392578125, 0.4580078125, 0.5234375, 0.5888671875, 0.654296875, 0.7197265625, 0.78515625, 0.8505859375, 0.916015625, 0.9814453125, 1.046875, 1.1123046875, 1.177734375, 1.2431640625, 1.30859375, 1.3740234375, 1.439453125, 1.5048828125, 1.5703125, 1.6357421875, 1.701171875, 1.7666015625, 1.83203125, 1.8974609375, 1.962890625, 2.0283203125, 2.09375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 1.0, 4.0, 8.0, 11.0, 15.0, 20.0, 17.0, 19.0, 23.0, 18.0, 25.0, 36.0, 50.0, 31.0, 51.0, 57.0, 70.0, 65.0, 52.0, 65.0, 43.0, 49.0, 45.0, 48.0, 30.0, 23.0, 25.0, 21.0, 21.0, 12.0, 10.0, 10.0, 9.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0146484375, -0.9853134155273438, -0.9559783935546875, -0.9266433715820312, -0.897308349609375, -0.8679733276367188, -0.8386383056640625, -0.8093032836914062, -0.77996826171875, -0.7506332397460938, -0.7212982177734375, -0.6919631958007812, -0.662628173828125, -0.6332931518554688, -0.6039581298828125, -0.5746231079101562, -0.5452880859375, -0.5159530639648438, -0.4866180419921875, -0.45728302001953125, -0.427947998046875, -0.39861297607421875, -0.3692779541015625, -0.33994293212890625, -0.31060791015625, -0.28127288818359375, -0.2519378662109375, -0.22260284423828125, -0.193267822265625, -0.16393280029296875, -0.1345977783203125, -0.10526275634765625, -0.075927734375, -0.04659271240234375, -0.0172576904296875, 0.01207733154296875, 0.041412353515625, 0.07074737548828125, 0.1000823974609375, 0.12941741943359375, 0.15875244140625, 0.18808746337890625, 0.2174224853515625, 0.24675750732421875, 0.276092529296875, 0.30542755126953125, 0.3347625732421875, 0.36409759521484375, 0.3934326171875, 0.42276763916015625, 0.4521026611328125, 0.48143768310546875, 0.510772705078125, 0.5401077270507812, 0.5694427490234375, 0.5987777709960938, 0.62811279296875, 0.6574478149414062, 0.6867828369140625, 0.7161178588867188, 0.745452880859375, 0.7747879028320312, 0.8041229248046875, 0.8334579467773438, 0.86279296875]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 5.0, 1.0, 8.0, 8.0, 16.0, 9.0, 15.0, 7.0, 25.0, 24.0, 37.0, 43.0, 61.0, 77.0, 97.0, 100.0, 110.0, 83.0, 66.0, 59.0, 31.0, 25.0, 22.0, 18.0, 15.0, 12.0, 9.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.79197883605957, -12.388477325439453, -11.984975814819336, -11.581474304199219, -11.177972793579102, -10.774471282958984, -10.370969772338867, -9.96746826171875, -9.563966751098633, -9.160465240478516, -8.756963729858398, -8.353462219238281, -7.949960708618164, -7.546459197998047, -7.1429572105407715, -6.739455699920654, -6.335953712463379, -5.932452201843262, -5.5289506912231445, -5.125449180603027, -4.72194766998291, -4.318446159362793, -3.9149441719055176, -3.5114426612854004, -3.107941150665283, -2.704439640045166, -2.300938129425049, -1.8974363803863525, -1.4939348697662354, -1.0904333591461182, -0.6869316101074219, -0.2834300994873047, 0.1200714111328125, 0.5235729813575745, 0.9270745515823364, 1.3305761814117432, 1.7340776920318604, 2.1375792026519775, 2.541080951690674, 2.944582462310791, 3.348083972930908, 3.7515854835510254, 4.155086994171143, 4.558588981628418, 4.962090492248535, 5.365592002868652, 5.7690935134887695, 6.172595024108887, 6.576096534729004, 6.979598045349121, 7.383099555969238, 7.7866010665893555, 8.190102577209473, 8.59360408782959, 8.997106552124023, 9.40060806274414, 9.804109573364258, 10.207611083984375, 10.611112594604492, 11.01461410522461, 11.418115615844727, 11.821617126464844, 12.225118637084961, 12.628620147705078, 13.032121658325195]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 2.0, 7.0, 12.0, 7.0, 11.0, 21.0, 24.0, 19.0, 18.0, 23.0, 24.0, 26.0, 27.0, 37.0, 46.0, 43.0, 46.0, 46.0, 28.0, 40.0, 38.0, 43.0, 24.0, 41.0, 37.0, 24.0, 35.0, 30.0, 27.0, 28.0, 26.0, 23.0, 15.0, 13.0, 22.0, 9.0, 9.0, 12.0, 6.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.447684288024902, -10.119959831237793, -9.792236328125, -9.46451187133789, -9.136788368225098, -8.809063911437988, -8.481340408325195, -8.153615951538086, -7.825891494750977, -7.498167514801025, -7.170443534851074, -6.842719078063965, -6.514995098114014, -6.1872711181640625, -5.859547138214111, -5.53182315826416, -5.204099178314209, -4.876375198364258, -4.548651218414307, -4.2209272384643555, -3.893202781677246, -3.565478801727295, -3.2377548217773438, -2.9100306034088135, -2.5823066234588623, -2.254582643508911, -1.9268584251403809, -1.5991344451904297, -1.271410346031189, -0.9436862468719482, -0.6159622669219971, -0.2882380485534668, 0.039485931396484375, 0.3672100007534027, 0.694934070110321, 1.022658109664917, 1.3503822088241577, 1.6781063079833984, 2.0058302879333496, 2.33355450630188, 2.661278486251831, 2.9890024662017822, 3.3167266845703125, 3.6444506645202637, 3.972174644470215, 4.299899101257324, 4.627622604370117, 4.955347061157227, 5.283071041107178, 5.610795021057129, 5.93851900100708, 6.266242980957031, 6.593967437744141, 6.921691417694092, 7.249415397644043, 7.577139854431152, 7.904863357543945, 8.232587814331055, 8.560311317443848, 8.888035774230957, 9.21575927734375, 9.54348373413086, 9.871208190917969, 10.198931694030762, 10.526656150817871]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 9.0, 12.0, 16.0, 27.0, 33.0, 60.0, 100.0, 135.0, 217.0, 354.0, 504.0, 841.0, 1289.0, 1982.0, 3154.0, 4769.0, 7614.0, 12379.0, 20180.0, 34268.0, 60565.0, 113287.0, 250525.0, 787967.0, 1649186.0, 751189.0, 232204.0, 108253.0, 60284.0, 35002.0, 20915.0, 13064.0, 8293.0, 5463.0, 3376.0, 2317.0, 1547.0, 1036.0, 660.0, 433.0, 260.0, 184.0, 130.0, 72.0, 49.0, 32.0, 19.0, 13.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.015625, -13.584228515625, -13.15283203125, -12.721435546875, -12.2900390625, -11.858642578125, -11.42724609375, -10.995849609375, -10.564453125, -10.133056640625, -9.70166015625, -9.270263671875, -8.8388671875, -8.407470703125, -7.97607421875, -7.544677734375, -7.11328125, -6.681884765625, -6.25048828125, -5.819091796875, -5.3876953125, -4.956298828125, -4.52490234375, -4.093505859375, -3.662109375, -3.230712890625, -2.79931640625, -2.367919921875, -1.9365234375, -1.505126953125, -1.07373046875, -0.642333984375, -0.2109375, 0.220458984375, 0.65185546875, 1.083251953125, 1.5146484375, 1.946044921875, 2.37744140625, 2.808837890625, 3.240234375, 3.671630859375, 4.10302734375, 4.534423828125, 4.9658203125, 5.397216796875, 5.82861328125, 6.260009765625, 6.69140625, 7.122802734375, 7.55419921875, 7.985595703125, 8.4169921875, 8.848388671875, 9.27978515625, 9.711181640625, 10.142578125, 10.573974609375, 11.00537109375, 11.436767578125, 11.8681640625, 12.299560546875, 12.73095703125, 13.162353515625, 13.59375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 5.0, 14.0, 11.0, 13.0, 18.0, 17.0, 22.0, 19.0, 29.0, 26.0, 24.0, 42.0, 33.0, 56.0, 40.0, 45.0, 36.0, 45.0, 36.0, 40.0, 37.0, 35.0, 23.0, 40.0, 38.0, 31.0, 28.0, 24.0, 21.0, 23.0, 25.0, 17.0, 12.0, 12.0, 10.0, 11.0, 8.0, 2.0, 12.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.046630859375, -8.75732421875, -8.468017578125, -8.1787109375, -7.889404296875, -7.60009765625, -7.310791015625, -7.021484375, -6.732177734375, -6.44287109375, -6.153564453125, -5.8642578125, -5.574951171875, -5.28564453125, -4.996337890625, -4.70703125, -4.417724609375, -4.12841796875, -3.839111328125, -3.5498046875, -3.260498046875, -2.97119140625, -2.681884765625, -2.392578125, -2.103271484375, -1.81396484375, -1.524658203125, -1.2353515625, -0.946044921875, -0.65673828125, -0.367431640625, -0.078125, 0.211181640625, 0.50048828125, 0.789794921875, 1.0791015625, 1.368408203125, 1.65771484375, 1.947021484375, 2.236328125, 2.525634765625, 2.81494140625, 3.104248046875, 3.3935546875, 3.682861328125, 3.97216796875, 4.261474609375, 4.55078125, 4.840087890625, 5.12939453125, 5.418701171875, 5.7080078125, 5.997314453125, 6.28662109375, 6.575927734375, 6.865234375, 7.154541015625, 7.44384765625, 7.733154296875, 8.0224609375, 8.311767578125, 8.60107421875, 8.890380859375, 9.1796875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 9.0, 11.0, 25.0, 24.0, 28.0, 42.0, 73.0, 118.0, 201.0, 275.0, 467.0, 668.0, 1156.0, 1893.0, 3327.0, 5522.0, 9479.0, 17138.0, 31396.0, 60896.0, 126334.0, 299783.0, 868038.0, 1715323.0, 615611.0, 226383.0, 100504.0, 49225.0, 26040.0, 14327.0, 8163.0, 4744.0, 2820.0, 1597.0, 939.0, 633.0, 363.0, 239.0, 159.0, 100.0, 64.0, 64.0, 34.0, 19.0, 16.0, 8.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.25, -14.7635498046875, -14.277099609375, -13.7906494140625, -13.30419921875, -12.8177490234375, -12.331298828125, -11.8448486328125, -11.3583984375, -10.8719482421875, -10.385498046875, -9.8990478515625, -9.41259765625, -8.9261474609375, -8.439697265625, -7.9532470703125, -7.466796875, -6.9803466796875, -6.493896484375, -6.0074462890625, -5.52099609375, -5.0345458984375, -4.548095703125, -4.0616455078125, -3.5751953125, -3.0887451171875, -2.602294921875, -2.1158447265625, -1.62939453125, -1.1429443359375, -0.656494140625, -0.1700439453125, 0.31640625, 0.8028564453125, 1.289306640625, 1.7757568359375, 2.26220703125, 2.7486572265625, 3.235107421875, 3.7215576171875, 4.2080078125, 4.6944580078125, 5.180908203125, 5.6673583984375, 6.15380859375, 6.6402587890625, 7.126708984375, 7.6131591796875, 8.099609375, 8.5860595703125, 9.072509765625, 9.5589599609375, 10.04541015625, 10.5318603515625, 11.018310546875, 11.5047607421875, 11.9912109375, 12.4776611328125, 12.964111328125, 13.4505615234375, 13.93701171875, 14.4234619140625, 14.909912109375, 15.3963623046875, 15.8828125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 27.0, 20.0, 23.0, 34.0, 25.0, 47.0, 61.0, 86.0, 87.0, 120.0, 149.0, 197.0, 242.0, 305.0, 375.0, 481.0, 391.0, 298.0, 240.0, 165.0, 136.0, 132.0, 91.0, 65.0, 60.0, 41.0, 34.0, 38.0, 17.0, 18.0, 14.0, 12.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.375, -6.184326171875, -5.99365234375, -5.802978515625, -5.6123046875, -5.421630859375, -5.23095703125, -5.040283203125, -4.849609375, -4.658935546875, -4.46826171875, -4.277587890625, -4.0869140625, -3.896240234375, -3.70556640625, -3.514892578125, -3.32421875, -3.133544921875, -2.94287109375, -2.752197265625, -2.5615234375, -2.370849609375, -2.18017578125, -1.989501953125, -1.798828125, -1.608154296875, -1.41748046875, -1.226806640625, -1.0361328125, -0.845458984375, -0.65478515625, -0.464111328125, -0.2734375, -0.082763671875, 0.10791015625, 0.298583984375, 0.4892578125, 0.679931640625, 0.87060546875, 1.061279296875, 1.251953125, 1.442626953125, 1.63330078125, 1.823974609375, 2.0146484375, 2.205322265625, 2.39599609375, 2.586669921875, 2.77734375, 2.968017578125, 3.15869140625, 3.349365234375, 3.5400390625, 3.730712890625, 3.92138671875, 4.112060546875, 4.302734375, 4.493408203125, 4.68408203125, 4.874755859375, 5.0654296875, 5.256103515625, 5.44677734375, 5.637451171875, 5.828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 3.0, 3.0, 7.0, 8.0, 7.0, 9.0, 21.0, 14.0, 13.0, 17.0, 22.0, 30.0, 37.0, 34.0, 63.0, 72.0, 74.0, 79.0, 82.0, 66.0, 80.0, 51.0, 42.0, 25.0, 27.0, 18.0, 16.0, 11.0, 13.0, 10.0, 2.0, 9.0, 8.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.412540435791016, -9.096385955810547, -8.780231475830078, -8.46407699584961, -8.14792251586914, -7.831768035888672, -7.515613079071045, -7.199458599090576, -6.883304119110107, -6.567149639129639, -6.25099515914917, -5.934840679168701, -5.618685722351074, -5.3025312423706055, -4.986376762390137, -4.670222282409668, -4.354067802429199, -4.0379133224487305, -3.7217588424682617, -3.405604124069214, -3.089449644088745, -2.7732951641082764, -2.4571404457092285, -2.1409859657287598, -1.824831485748291, -1.5086770057678223, -1.192522406578064, -0.8763678669929504, -0.5602133274078369, -0.24405884742736816, 0.07209575176239014, 0.38825035095214844, 0.7044057846069336, 1.0205602645874023, 1.3367148637771606, 1.652869462966919, 1.9690239429473877, 2.2851784229278564, 2.6013331413269043, 2.917487621307373, 3.233642101287842, 3.5497965812683105, 3.8659510612487793, 4.182105541229248, 4.498260498046875, 4.814414978027344, 5.1305694580078125, 5.446723937988281, 5.76287841796875, 6.079032897949219, 6.3951873779296875, 6.711341857910156, 7.027496337890625, 7.343650817871094, 7.659805774688721, 7.9759602546691895, 8.2921142578125, 8.608268737792969, 8.924423217773438, 9.240577697753906, 9.556732177734375, 9.872886657714844, 10.189041137695312, 10.505195617675781, 10.821351051330566]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 6.0, 4.0, 6.0, 8.0, 15.0, 17.0, 20.0, 9.0, 15.0, 20.0, 14.0, 29.0, 21.0, 27.0, 29.0, 25.0, 32.0, 22.0, 33.0, 28.0, 41.0, 24.0, 33.0, 35.0, 31.0, 35.0, 39.0, 29.0, 27.0, 23.0, 34.0, 23.0, 30.0, 23.0, 25.0, 19.0, 17.0, 16.0, 16.0, 13.0, 10.0, 10.0, 13.0, 12.0, 12.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-8.471705436706543, -8.188186645507812, -7.90466833114624, -7.621150016784668, -7.3376312255859375, -7.054112434387207, -6.770594120025635, -6.4870758056640625, -6.203557014465332, -5.920038223266602, -5.636519908905029, -5.353001594543457, -5.069482803344727, -4.785964012145996, -4.502445697784424, -4.218927383422852, -3.935408592224121, -3.6518900394439697, -3.3683714866638184, -3.084852933883667, -2.8013343811035156, -2.5178158283233643, -2.234297275543213, -1.9507787227630615, -1.6672601699829102, -1.3837416172027588, -1.1002230644226074, -0.816704511642456, -0.5331859588623047, -0.24966740608215332, 0.03385114669799805, 0.3173696994781494, 0.6008892059326172, 0.8844077587127686, 1.16792631149292, 1.4514448642730713, 1.7349634170532227, 2.018481969833374, 2.3020005226135254, 2.5855190753936768, 2.869037628173828, 3.1525561809539795, 3.436074733734131, 3.7195932865142822, 4.003111839294434, 4.286630630493164, 4.570148944854736, 4.853667259216309, 5.137186050415039, 5.4207048416137695, 5.704223155975342, 5.987741470336914, 6.2712602615356445, 6.554779052734375, 6.838297367095947, 7.1218156814575195, 7.40533447265625, 7.6888532638549805, 7.972371578216553, 8.255889892578125, 8.539408683776855, 8.822927474975586, 9.1064453125, 9.38996410369873, 9.673482894897461]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 15.0, 15.0, 22.0, 26.0, 33.0, 63.0, 75.0, 131.0, 194.0, 235.0, 324.0, 408.0, 518.0, 683.0, 932.0, 1304.0, 1795.0, 2396.0, 3145.0, 4173.0, 5786.0, 7899.0, 10875.0, 15217.0, 21438.0, 30560.0, 45781.0, 68785.0, 111702.0, 247788.0, 175093.0, 94170.0, 60047.0, 39575.0, 27463.0, 19056.0, 13628.0, 9889.0, 7142.0, 5270.0, 3959.0, 2922.0, 2005.0, 1534.0, 1136.0, 877.0, 677.0, 534.0, 347.0, 234.0, 179.0, 133.0, 112.0, 84.0, 71.0, 41.0, 38.0, 14.0, 9.0, 4.0], "bins": [-2.431640625, -2.359771728515625, -2.28790283203125, -2.216033935546875, -2.1441650390625, -2.072296142578125, -2.00042724609375, -1.928558349609375, -1.856689453125, -1.784820556640625, -1.71295166015625, -1.641082763671875, -1.5692138671875, -1.497344970703125, -1.42547607421875, -1.353607177734375, -1.28173828125, -1.209869384765625, -1.13800048828125, -1.066131591796875, -0.9942626953125, -0.922393798828125, -0.85052490234375, -0.778656005859375, -0.706787109375, -0.634918212890625, -0.56304931640625, -0.491180419921875, -0.4193115234375, -0.347442626953125, -0.27557373046875, -0.203704833984375, -0.1318359375, -0.059967041015625, 0.01190185546875, 0.083770751953125, 0.1556396484375, 0.227508544921875, 0.29937744140625, 0.371246337890625, 0.443115234375, 0.514984130859375, 0.58685302734375, 0.658721923828125, 0.7305908203125, 0.802459716796875, 0.87432861328125, 0.946197509765625, 1.01806640625, 1.089935302734375, 1.16180419921875, 1.233673095703125, 1.3055419921875, 1.377410888671875, 1.44927978515625, 1.521148681640625, 1.593017578125, 1.664886474609375, 1.73675537109375, 1.808624267578125, 1.8804931640625, 1.952362060546875, 2.02423095703125, 2.096099853515625, 2.16796875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 7.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 17.0, 19.0, 12.0, 19.0, 17.0, 20.0, 29.0, 22.0, 24.0, 24.0, 36.0, 28.0, 20.0, 30.0, 31.0, 38.0, 30.0, 35.0, 31.0, 37.0, 25.0, 32.0, 32.0, 37.0, 34.0, 26.0, 27.0, 30.0, 18.0, 19.0, 19.0, 25.0, 21.0, 10.0, 12.0, 13.0, 6.0, 6.0, 12.0, 10.0, 6.0, 8.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.484375, -8.1964111328125, -7.908447265625, -7.6204833984375, -7.33251953125, -7.0445556640625, -6.756591796875, -6.4686279296875, -6.1806640625, -5.8927001953125, -5.604736328125, -5.3167724609375, -5.02880859375, -4.7408447265625, -4.452880859375, -4.1649169921875, -3.876953125, -3.5889892578125, -3.301025390625, -3.0130615234375, -2.72509765625, -2.4371337890625, -2.149169921875, -1.8612060546875, -1.5732421875, -1.2852783203125, -0.997314453125, -0.7093505859375, -0.42138671875, -0.1334228515625, 0.154541015625, 0.4425048828125, 0.73046875, 1.0184326171875, 1.306396484375, 1.5943603515625, 1.88232421875, 2.1702880859375, 2.458251953125, 2.7462158203125, 3.0341796875, 3.3221435546875, 3.610107421875, 3.8980712890625, 4.18603515625, 4.4739990234375, 4.761962890625, 5.0499267578125, 5.337890625, 5.6258544921875, 5.913818359375, 6.2017822265625, 6.48974609375, 6.7777099609375, 7.065673828125, 7.3536376953125, 7.6416015625, 7.9295654296875, 8.217529296875, 8.5054931640625, 8.79345703125, 9.0814208984375, 9.369384765625, 9.6573486328125, 9.9453125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 11.0, 7.0, 10.0, 15.0, 19.0, 31.0, 63.0, 95.0, 123.0, 159.0, 230.0, 321.0, 467.0, 671.0, 956.0, 1399.0, 2042.0, 2947.0, 4289.0, 6506.0, 9836.0, 15192.0, 23393.0, 36391.0, 58668.0, 103919.0, 256223.0, 256965.0, 103499.0, 58988.0, 36374.0, 23306.0, 15133.0, 9799.0, 6605.0, 4394.0, 2959.0, 1934.0, 1441.0, 929.0, 682.0, 465.0, 344.0, 256.0, 143.0, 108.0, 66.0, 51.0, 50.0, 31.0, 21.0, 20.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.919921875, -2.82867431640625, -2.7374267578125, -2.64617919921875, -2.554931640625, -2.46368408203125, -2.3724365234375, -2.28118896484375, -2.18994140625, -2.09869384765625, -2.0074462890625, -1.91619873046875, -1.824951171875, -1.73370361328125, -1.6424560546875, -1.55120849609375, -1.4599609375, -1.36871337890625, -1.2774658203125, -1.18621826171875, -1.094970703125, -1.00372314453125, -0.9124755859375, -0.82122802734375, -0.72998046875, -0.63873291015625, -0.5474853515625, -0.45623779296875, -0.364990234375, -0.27374267578125, -0.1824951171875, -0.09124755859375, 0.0, 0.09124755859375, 0.1824951171875, 0.27374267578125, 0.364990234375, 0.45623779296875, 0.5474853515625, 0.63873291015625, 0.72998046875, 0.82122802734375, 0.9124755859375, 1.00372314453125, 1.094970703125, 1.18621826171875, 1.2774658203125, 1.36871337890625, 1.4599609375, 1.55120849609375, 1.6424560546875, 1.73370361328125, 1.824951171875, 1.91619873046875, 2.0074462890625, 2.09869384765625, 2.18994140625, 2.28118896484375, 2.3724365234375, 2.46368408203125, 2.554931640625, 2.64617919921875, 2.7374267578125, 2.82867431640625, 2.919921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 3.0, 9.0, 14.0, 14.0, 16.0, 20.0, 11.0, 20.0, 30.0, 19.0, 25.0, 32.0, 28.0, 39.0, 40.0, 33.0, 43.0, 53.0, 40.0, 46.0, 44.0, 31.0, 25.0, 43.0, 39.0, 30.0, 21.0, 25.0, 31.0, 19.0, 25.0, 20.0, 16.0, 16.0, 18.0, 8.0, 8.0, 9.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0], "bins": [-7.2734375, -7.059326171875, -6.84521484375, -6.631103515625, -6.4169921875, -6.202880859375, -5.98876953125, -5.774658203125, -5.560546875, -5.346435546875, -5.13232421875, -4.918212890625, -4.7041015625, -4.489990234375, -4.27587890625, -4.061767578125, -3.84765625, -3.633544921875, -3.41943359375, -3.205322265625, -2.9912109375, -2.777099609375, -2.56298828125, -2.348876953125, -2.134765625, -1.920654296875, -1.70654296875, -1.492431640625, -1.2783203125, -1.064208984375, -0.85009765625, -0.635986328125, -0.421875, -0.207763671875, 0.00634765625, 0.220458984375, 0.4345703125, 0.648681640625, 0.86279296875, 1.076904296875, 1.291015625, 1.505126953125, 1.71923828125, 1.933349609375, 2.1474609375, 2.361572265625, 2.57568359375, 2.789794921875, 3.00390625, 3.218017578125, 3.43212890625, 3.646240234375, 3.8603515625, 4.074462890625, 4.28857421875, 4.502685546875, 4.716796875, 4.930908203125, 5.14501953125, 5.359130859375, 5.5732421875, 5.787353515625, 6.00146484375, 6.215576171875, 6.4296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 6.0, 7.0, 10.0, 18.0, 19.0, 17.0, 25.0, 33.0, 50.0, 67.0, 82.0, 110.0, 135.0, 167.0, 218.0, 318.0, 400.0, 494.0, 669.0, 1080.0, 1507.0, 2314.0, 3841.0, 6563.0, 11778.0, 23274.0, 50256.0, 126449.0, 367277.0, 274011.0, 94040.0, 39392.0, 18381.0, 9760.0, 5510.0, 3349.0, 2098.0, 1345.0, 929.0, 653.0, 452.0, 319.0, 260.0, 194.0, 136.0, 126.0, 98.0, 63.0, 58.0, 43.0, 36.0, 38.0, 27.0, 21.0, 12.0, 10.0, 8.0, 7.0, 2.0, 1.0, 4.0], "bins": [-0.0052642822265625, -0.005098998546600342, -0.004933714866638184, -0.004768431186676025, -0.004603147506713867, -0.004437863826751709, -0.004272580146789551, -0.004107296466827393, -0.003942012786865234, -0.003776729106903076, -0.003611445426940918, -0.0034461617469787598, -0.0032808780670166016, -0.0031155943870544434, -0.002950310707092285, -0.002785027027130127, -0.0026197433471679688, -0.0024544596672058105, -0.0022891759872436523, -0.002123892307281494, -0.001958608627319336, -0.0017933249473571777, -0.0016280412673950195, -0.0014627575874328613, -0.0012974739074707031, -0.001132190227508545, -0.0009669065475463867, -0.0008016228675842285, -0.0006363391876220703, -0.0004710555076599121, -0.0003057718276977539, -0.0001404881477355957, 2.47955322265625e-05, 0.0001900792121887207, 0.0003553628921508789, 0.0005206465721130371, 0.0006859302520751953, 0.0008512139320373535, 0.0010164976119995117, 0.00118178129196167, 0.0013470649719238281, 0.0015123486518859863, 0.0016776323318481445, 0.0018429160118103027, 0.002008199691772461, 0.002173483371734619, 0.0023387670516967773, 0.0025040507316589355, 0.0026693344116210938, 0.002834618091583252, 0.00299990177154541, 0.0031651854515075684, 0.0033304691314697266, 0.0034957528114318848, 0.003661036491394043, 0.003826320171356201, 0.003991603851318359, 0.004156887531280518, 0.004322171211242676, 0.004487454891204834, 0.004652738571166992, 0.00481802225112915, 0.004983305931091309, 0.005148589611053467, 0.005313873291015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 7.0, 15.0, 11.0, 21.0, 29.0, 21.0, 33.0, 41.0, 45.0, 57.0, 53.0, 68.0, 70.0, 48.0, 31.0, 54.0, 64.0, 41.0, 49.0, 35.0, 34.0, 30.0, 27.0, 15.0, 14.0, 16.0, 9.0, 13.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5762786865234375e-06, -3.458932042121887e-06, -3.341585397720337e-06, -3.2242387533187866e-06, -3.1068921089172363e-06, -2.989545464515686e-06, -2.8721988201141357e-06, -2.7548521757125854e-06, -2.637505531311035e-06, -2.520158886909485e-06, -2.4028122425079346e-06, -2.2854655981063843e-06, -2.168118953704834e-06, -2.0507723093032837e-06, -1.9334256649017334e-06, -1.816079020500183e-06, -1.6987323760986328e-06, -1.5813857316970825e-06, -1.4640390872955322e-06, -1.346692442893982e-06, -1.2293457984924316e-06, -1.1119991540908813e-06, -9.94652509689331e-07, -8.773058652877808e-07, -7.599592208862305e-07, -6.426125764846802e-07, -5.252659320831299e-07, -4.079192876815796e-07, -2.905726432800293e-07, -1.73225998878479e-07, -5.587935447692871e-08, 6.146728992462158e-08, 1.7881393432617188e-07, 2.9616057872772217e-07, 4.1350722312927246e-07, 5.308538675308228e-07, 6.48200511932373e-07, 7.655471563339233e-07, 8.828938007354736e-07, 1.000240445137024e-06, 1.1175870895385742e-06, 1.2349337339401245e-06, 1.3522803783416748e-06, 1.469627022743225e-06, 1.5869736671447754e-06, 1.7043203115463257e-06, 1.821666955947876e-06, 1.9390136003494263e-06, 2.0563602447509766e-06, 2.173706889152527e-06, 2.291053533554077e-06, 2.4084001779556274e-06, 2.5257468223571777e-06, 2.643093466758728e-06, 2.7604401111602783e-06, 2.8777867555618286e-06, 2.995133399963379e-06, 3.112480044364929e-06, 3.2298266887664795e-06, 3.3471733331680298e-06, 3.46451997756958e-06, 3.5818666219711304e-06, 3.6992132663726807e-06, 3.816559910774231e-06, 3.933906555175781e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 12.0, 8.0, 15.0, 23.0, 33.0, 50.0, 75.0, 121.0, 177.0, 227.0, 396.0, 636.0, 1015.0, 1694.0, 2765.0, 4691.0, 8707.0, 17010.0, 37216.0, 93128.0, 284276.0, 378273.0, 125159.0, 47368.0, 21023.0, 10514.0, 5633.0, 3156.0, 1942.0, 1193.0, 710.0, 428.0, 303.0, 181.0, 102.0, 94.0, 57.0, 34.0, 24.0, 27.0, 17.0, 13.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005588531494140625, -0.0054146647453308105, -0.005240797996520996, -0.005066931247711182, -0.004893064498901367, -0.004719197750091553, -0.004545331001281738, -0.004371464252471924, -0.004197597503662109, -0.004023730754852295, -0.0038498640060424805, -0.003675997257232666, -0.0035021305084228516, -0.003328263759613037, -0.0031543970108032227, -0.002980530261993408, -0.0028066635131835938, -0.0026327967643737793, -0.002458930015563965, -0.0022850632667541504, -0.002111196517944336, -0.0019373297691345215, -0.001763463020324707, -0.0015895962715148926, -0.0014157295227050781, -0.0012418627738952637, -0.0010679960250854492, -0.0008941292762756348, -0.0007202625274658203, -0.0005463957786560059, -0.0003725290298461914, -0.00019866228103637695, -2.47955322265625e-05, 0.00014907121658325195, 0.0003229379653930664, 0.0004968047142028809, 0.0006706714630126953, 0.0008445382118225098, 0.0010184049606323242, 0.0011922717094421387, 0.0013661384582519531, 0.0015400052070617676, 0.001713871955871582, 0.0018877387046813965, 0.002061605453491211, 0.0022354722023010254, 0.00240933895111084, 0.0025832056999206543, 0.0027570724487304688, 0.002930939197540283, 0.0031048059463500977, 0.003278672695159912, 0.0034525394439697266, 0.003626406192779541, 0.0038002729415893555, 0.00397413969039917, 0.004148006439208984, 0.004321873188018799, 0.004495739936828613, 0.004669606685638428, 0.004843473434448242, 0.005017340183258057, 0.005191206932067871, 0.0053650736808776855, 0.0055389404296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 5.0, 4.0, 13.0, 11.0, 12.0, 26.0, 31.0, 26.0, 38.0, 59.0, 77.0, 80.0, 92.0, 96.0, 80.0, 86.0, 56.0, 42.0, 34.0, 28.0, 19.0, 22.0, 12.0, 5.0, 11.0, 4.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018815994262695312, -0.0018148571252822876, -0.001748114824295044, -0.0016813725233078003, -0.0016146302223205566, -0.001547887921333313, -0.0014811456203460693, -0.0014144033193588257, -0.001347661018371582, -0.0012809187173843384, -0.0012141764163970947, -0.001147434115409851, -0.0010806918144226074, -0.0010139495134353638, -0.0009472072124481201, -0.0008804649114608765, -0.0008137226104736328, -0.0007469803094863892, -0.0006802380084991455, -0.0006134957075119019, -0.0005467534065246582, -0.00048001110553741455, -0.0004132688045501709, -0.00034652650356292725, -0.0002797842025756836, -0.00021304190158843994, -0.0001462996006011963, -7.955729961395264e-05, -1.2814998626708984e-05, 5.392730236053467e-05, 0.00012066960334777832, 0.00018741190433502197, 0.0002541542053222656, 0.0003208965063095093, 0.00038763880729675293, 0.0004543811082839966, 0.0005211234092712402, 0.0005878657102584839, 0.0006546080112457275, 0.0007213503122329712, 0.0007880926132202148, 0.0008548349142074585, 0.0009215772151947021, 0.0009883195161819458, 0.0010550618171691895, 0.001121804118156433, 0.0011885464191436768, 0.0012552887201309204, 0.001322031021118164, 0.0013887733221054077, 0.0014555156230926514, 0.001522257924079895, 0.0015890002250671387, 0.0016557425260543823, 0.001722484827041626, 0.0017892271280288696, 0.0018559694290161133, 0.001922711730003357, 0.0019894540309906006, 0.0020561963319778442, 0.002122938632965088, 0.0021896809339523315, 0.002256423234939575, 0.002323165535926819, 0.0023899078369140625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 9.0, 7.0, 12.0, 13.0, 17.0, 15.0, 11.0, 24.0, 27.0, 29.0, 40.0, 40.0, 66.0, 77.0, 75.0, 85.0, 67.0, 81.0, 55.0, 58.0, 27.0, 27.0, 23.0, 12.0, 16.0, 16.0, 8.0, 7.0, 6.0, 11.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.736104011535645, -9.42552375793457, -9.114943504333496, -8.804362297058105, -8.493782043457031, -8.183201789855957, -7.872621536254883, -7.562041282653809, -7.251460552215576, -6.940880298614502, -6.6302995681762695, -6.319719314575195, -6.009139060974121, -5.698558330535889, -5.3879780769348145, -5.077397346496582, -4.766817092895508, -4.456236839294434, -4.145656108856201, -3.835075855255127, -3.5244953632354736, -3.2139148712158203, -2.903334617614746, -2.5927541255950928, -2.2821736335754395, -1.9715931415557861, -1.6610127687454224, -1.3504323959350586, -1.0398519039154053, -0.729271411895752, -0.4186910390853882, -0.10811066627502441, 0.2024688720703125, 0.513049304485321, 0.8236297369003296, 1.1342101097106934, 1.4447906017303467, 1.75537109375, 2.065951347351074, 2.3765318393707275, 2.687112331390381, 2.997692823410034, 3.3082733154296875, 3.6188535690307617, 3.929434061050415, 4.240014553070068, 4.550594806671143, 4.861175537109375, 5.171755790710449, 5.482336044311523, 5.792916774749756, 6.10349702835083, 6.4140777587890625, 6.724658012390137, 7.035238265991211, 7.345818519592285, 7.656399250030518, 7.966979503631592, 8.277560234069824, 8.588140487670898, 8.898720741271973, 9.209300994873047, 9.519882202148438, 9.830462455749512, 10.141042709350586]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 5.0, 6.0, 8.0, 15.0, 16.0, 20.0, 10.0, 16.0, 19.0, 15.0, 28.0, 21.0, 28.0, 29.0, 24.0, 32.0, 22.0, 32.0, 28.0, 40.0, 27.0, 32.0, 34.0, 28.0, 38.0, 40.0, 28.0, 28.0, 23.0, 33.0, 24.0, 29.0, 23.0, 25.0, 19.0, 18.0, 16.0, 16.0, 13.0, 10.0, 10.0, 13.0, 12.0, 11.0, 6.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-8.353033065795898, -8.0700101852417, -7.7869873046875, -7.503964900970459, -7.22094202041626, -6.9379191398620605, -6.6548967361450195, -6.37187385559082, -6.088850975036621, -5.805828094482422, -5.522805213928223, -5.239782810211182, -4.956759929656982, -4.673737049102783, -4.390714645385742, -4.107691764831543, -3.8246688842773438, -3.5416460037231445, -3.2586233615875244, -2.9756007194519043, -2.692577838897705, -2.409554958343506, -2.1265323162078857, -1.843509554862976, -1.5604867935180664, -1.2774640321731567, -0.9944412708282471, -0.7114185094833374, -0.42839574813842773, -0.14537298679351807, 0.1376497745513916, 0.42067253589630127, 0.7036952972412109, 0.9867180585861206, 1.2697408199310303, 1.55276358127594, 1.8357863426208496, 2.118809223175049, 2.401831865310669, 2.684854507446289, 2.9678773880004883, 3.2509002685546875, 3.5339229106903076, 3.8169455528259277, 4.099968433380127, 4.382991313934326, 4.666013717651367, 4.949036598205566, 5.232059478759766, 5.515082359313965, 5.798105239868164, 6.081127643585205, 6.364150524139404, 6.6471734046936035, 6.9301958084106445, 7.213218688964844, 7.496241569519043, 7.779264450073242, 8.062287330627441, 8.34531021118164, 8.628332138061523, 8.911355018615723, 9.194377899169922, 9.477400779724121, 9.76042366027832]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 17.0, 23.0, 43.0, 66.0, 77.0, 124.0, 192.0, 233.0, 392.0, 538.0, 720.0, 1088.0, 1473.0, 2104.0, 2882.0, 3899.0, 5409.0, 7645.0, 10538.0, 14936.0, 20824.0, 29973.0, 43978.0, 67833.0, 108208.0, 158628.0, 173121.0, 132479.0, 84792.0, 54150.0, 35788.0, 24629.0, 17523.0, 12468.0, 8951.0, 6417.0, 4663.0, 3359.0, 2345.0, 1703.0, 1267.0, 890.0, 644.0, 441.0, 331.0, 231.0, 166.0, 115.0, 75.0, 62.0, 30.0, 28.0, 14.0, 10.0, 7.0, 3.0, 1.0], "bins": [-12.859375, -12.4725341796875, -12.085693359375, -11.6988525390625, -11.31201171875, -10.9251708984375, -10.538330078125, -10.1514892578125, -9.7646484375, -9.3778076171875, -8.990966796875, -8.6041259765625, -8.21728515625, -7.8304443359375, -7.443603515625, -7.0567626953125, -6.669921875, -6.2830810546875, -5.896240234375, -5.5093994140625, -5.12255859375, -4.7357177734375, -4.348876953125, -3.9620361328125, -3.5751953125, -3.1883544921875, -2.801513671875, -2.4146728515625, -2.02783203125, -1.6409912109375, -1.254150390625, -0.8673095703125, -0.48046875, -0.0936279296875, 0.293212890625, 0.6800537109375, 1.06689453125, 1.4537353515625, 1.840576171875, 2.2274169921875, 2.6142578125, 3.0010986328125, 3.387939453125, 3.7747802734375, 4.16162109375, 4.5484619140625, 4.935302734375, 5.3221435546875, 5.708984375, 6.0958251953125, 6.482666015625, 6.8695068359375, 7.25634765625, 7.6431884765625, 8.030029296875, 8.4168701171875, 8.8037109375, 9.1905517578125, 9.577392578125, 9.9642333984375, 10.35107421875, 10.7379150390625, 11.124755859375, 11.5115966796875, 11.8984375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 3.0, 3.0, 10.0, 15.0, 13.0, 19.0, 12.0, 17.0, 16.0, 10.0, 23.0, 22.0, 23.0, 32.0, 33.0, 28.0, 23.0, 27.0, 34.0, 33.0, 40.0, 37.0, 28.0, 31.0, 37.0, 32.0, 37.0, 28.0, 21.0, 30.0, 24.0, 32.0, 23.0, 30.0, 21.0, 16.0, 13.0, 18.0, 18.0, 19.0, 10.0, 9.0, 11.0, 8.0, 4.0, 5.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.5546875, -8.2783203125, -8.001953125, -7.7255859375, -7.44921875, -7.1728515625, -6.896484375, -6.6201171875, -6.34375, -6.0673828125, -5.791015625, -5.5146484375, -5.23828125, -4.9619140625, -4.685546875, -4.4091796875, -4.1328125, -3.8564453125, -3.580078125, -3.3037109375, -3.02734375, -2.7509765625, -2.474609375, -2.1982421875, -1.921875, -1.6455078125, -1.369140625, -1.0927734375, -0.81640625, -0.5400390625, -0.263671875, 0.0126953125, 0.2890625, 0.5654296875, 0.841796875, 1.1181640625, 1.39453125, 1.6708984375, 1.947265625, 2.2236328125, 2.5, 2.7763671875, 3.052734375, 3.3291015625, 3.60546875, 3.8818359375, 4.158203125, 4.4345703125, 4.7109375, 4.9873046875, 5.263671875, 5.5400390625, 5.81640625, 6.0927734375, 6.369140625, 6.6455078125, 6.921875, 7.1982421875, 7.474609375, 7.7509765625, 8.02734375, 8.3037109375, 8.580078125, 8.8564453125, 9.1328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 4.0, 6.0, 11.0, 15.0, 17.0, 22.0, 47.0, 65.0, 102.0, 169.0, 300.0, 465.0, 877.0, 1545.0, 2731.0, 4977.0, 8981.0, 17041.0, 32091.0, 64009.0, 139802.0, 280793.0, 256511.0, 119869.0, 56350.0, 28277.0, 15054.0, 8260.0, 4374.0, 2483.0, 1364.0, 786.0, 465.0, 258.0, 147.0, 85.0, 70.0, 40.0, 27.0, 22.0, 10.0, 9.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.859375, -24.126220703125, -23.39306640625, -22.659912109375, -21.9267578125, -21.193603515625, -20.46044921875, -19.727294921875, -18.994140625, -18.260986328125, -17.52783203125, -16.794677734375, -16.0615234375, -15.328369140625, -14.59521484375, -13.862060546875, -13.12890625, -12.395751953125, -11.66259765625, -10.929443359375, -10.1962890625, -9.463134765625, -8.72998046875, -7.996826171875, -7.263671875, -6.530517578125, -5.79736328125, -5.064208984375, -4.3310546875, -3.597900390625, -2.86474609375, -2.131591796875, -1.3984375, -0.665283203125, 0.06787109375, 0.801025390625, 1.5341796875, 2.267333984375, 3.00048828125, 3.733642578125, 4.466796875, 5.199951171875, 5.93310546875, 6.666259765625, 7.3994140625, 8.132568359375, 8.86572265625, 9.598876953125, 10.33203125, 11.065185546875, 11.79833984375, 12.531494140625, 13.2646484375, 13.997802734375, 14.73095703125, 15.464111328125, 16.197265625, 16.930419921875, 17.66357421875, 18.396728515625, 19.1298828125, 19.863037109375, 20.59619140625, 21.329345703125, 22.0625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 3.0, 8.0, 8.0, 19.0, 21.0, 23.0, 26.0, 32.0, 30.0, 46.0, 40.0, 50.0, 39.0, 61.0, 53.0, 53.0, 41.0, 49.0, 45.0, 43.0, 45.0, 32.0, 42.0, 44.0, 27.0, 22.0, 28.0, 11.0, 18.0, 14.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.46014404296875, -6.1898193359375, -5.91949462890625, -5.649169921875, -5.37884521484375, -5.1085205078125, -4.83819580078125, -4.56787109375, -4.29754638671875, -4.0272216796875, -3.75689697265625, -3.486572265625, -3.21624755859375, -2.9459228515625, -2.67559814453125, -2.4052734375, -2.13494873046875, -1.8646240234375, -1.59429931640625, -1.323974609375, -1.05364990234375, -0.7833251953125, -0.51300048828125, -0.24267578125, 0.02764892578125, 0.2979736328125, 0.56829833984375, 0.838623046875, 1.10894775390625, 1.3792724609375, 1.64959716796875, 1.919921875, 2.19024658203125, 2.4605712890625, 2.73089599609375, 3.001220703125, 3.27154541015625, 3.5418701171875, 3.81219482421875, 4.08251953125, 4.35284423828125, 4.6231689453125, 4.89349365234375, 5.163818359375, 5.43414306640625, 5.7044677734375, 5.97479248046875, 6.2451171875, 6.51544189453125, 6.7857666015625, 7.05609130859375, 7.326416015625, 7.59674072265625, 7.8670654296875, 8.13739013671875, 8.40771484375, 8.67803955078125, 8.9483642578125, 9.21868896484375, 9.489013671875, 9.75933837890625, 10.0296630859375, 10.29998779296875, 10.5703125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 7.0, 15.0, 11.0, 25.0, 33.0, 43.0, 50.0, 80.0, 119.0, 180.0, 291.0, 484.0, 708.0, 1194.0, 2005.0, 3563.0, 6629.0, 12840.0, 26786.0, 61366.0, 213269.0, 498625.0, 130169.0, 45822.0, 20926.0, 10323.0, 5511.0, 2949.0, 1764.0, 1040.0, 588.0, 388.0, 251.0, 153.0, 106.0, 66.0, 53.0, 41.0, 24.0, 19.0, 12.0, 6.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.787109375, -3.666259765625, -3.54541015625, -3.424560546875, -3.3037109375, -3.182861328125, -3.06201171875, -2.941162109375, -2.8203125, -2.699462890625, -2.57861328125, -2.457763671875, -2.3369140625, -2.216064453125, -2.09521484375, -1.974365234375, -1.853515625, -1.732666015625, -1.61181640625, -1.490966796875, -1.3701171875, -1.249267578125, -1.12841796875, -1.007568359375, -0.88671875, -0.765869140625, -0.64501953125, -0.524169921875, -0.4033203125, -0.282470703125, -0.16162109375, -0.040771484375, 0.080078125, 0.200927734375, 0.32177734375, 0.442626953125, 0.5634765625, 0.684326171875, 0.80517578125, 0.926025390625, 1.046875, 1.167724609375, 1.28857421875, 1.409423828125, 1.5302734375, 1.651123046875, 1.77197265625, 1.892822265625, 2.013671875, 2.134521484375, 2.25537109375, 2.376220703125, 2.4970703125, 2.617919921875, 2.73876953125, 2.859619140625, 2.98046875, 3.101318359375, 3.22216796875, 3.343017578125, 3.4638671875, 3.584716796875, 3.70556640625, 3.826416015625, 3.947265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 13.0, 23.0, 26.0, 27.0, 49.0, 67.0, 74.0, 87.0, 85.0, 111.0, 106.0, 71.0, 57.0, 42.0, 43.0, 29.0, 15.0, 14.0, 18.0, 8.0, 12.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00018644332885742188, -0.0001815594732761383, -0.00017667561769485474, -0.00017179176211357117, -0.0001669079065322876, -0.00016202405095100403, -0.00015714019536972046, -0.0001522563397884369, -0.00014737248420715332, -0.00014248862862586975, -0.00013760477304458618, -0.0001327209174633026, -0.00012783706188201904, -0.00012295320630073547, -0.0001180693507194519, -0.00011318549513816833, -0.00010830163955688477, -0.0001034177839756012, -9.853392839431763e-05, -9.365007281303406e-05, -8.876621723175049e-05, -8.388236165046692e-05, -7.899850606918335e-05, -7.411465048789978e-05, -6.923079490661621e-05, -6.434693932533264e-05, -5.946308374404907e-05, -5.45792281627655e-05, -4.9695372581481934e-05, -4.4811517000198364e-05, -3.9927661418914795e-05, -3.5043805837631226e-05, -3.0159950256347656e-05, -2.5276094675064087e-05, -2.0392239093780518e-05, -1.5508383512496948e-05, -1.0624527931213379e-05, -5.7406723499298096e-06, -8.568167686462402e-07, 4.027038812637329e-06, 8.910894393920898e-06, 1.3794749975204468e-05, 1.8678605556488037e-05, 2.3562461137771606e-05, 2.8446316719055176e-05, 3.3330172300338745e-05, 3.8214027881622314e-05, 4.3097883462905884e-05, 4.798173904418945e-05, 5.286559462547302e-05, 5.774945020675659e-05, 6.263330578804016e-05, 6.751716136932373e-05, 7.24010169506073e-05, 7.728487253189087e-05, 8.216872811317444e-05, 8.705258369445801e-05, 9.193643927574158e-05, 9.682029485702515e-05, 0.00010170415043830872, 0.00010658800601959229, 0.00011147186160087585, 0.00011635571718215942, 0.00012123957276344299, 0.00012612342834472656]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 13.0, 14.0, 20.0, 30.0, 45.0, 54.0, 69.0, 127.0, 167.0, 280.0, 362.0, 519.0, 784.0, 1277.0, 1948.0, 3176.0, 5124.0, 8462.0, 14361.0, 25148.0, 47884.0, 115851.0, 396342.0, 260849.0, 77987.0, 37027.0, 20140.0, 11526.0, 7062.0, 4429.0, 2618.0, 1668.0, 1044.0, 675.0, 452.0, 296.0, 219.0, 167.0, 118.0, 79.0, 42.0, 24.0, 22.0, 15.0, 8.0, 10.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.359375, -3.260009765625, -3.16064453125, -3.061279296875, -2.9619140625, -2.862548828125, -2.76318359375, -2.663818359375, -2.564453125, -2.465087890625, -2.36572265625, -2.266357421875, -2.1669921875, -2.067626953125, -1.96826171875, -1.868896484375, -1.76953125, -1.670166015625, -1.57080078125, -1.471435546875, -1.3720703125, -1.272705078125, -1.17333984375, -1.073974609375, -0.974609375, -0.875244140625, -0.77587890625, -0.676513671875, -0.5771484375, -0.477783203125, -0.37841796875, -0.279052734375, -0.1796875, -0.080322265625, 0.01904296875, 0.118408203125, 0.2177734375, 0.317138671875, 0.41650390625, 0.515869140625, 0.615234375, 0.714599609375, 0.81396484375, 0.913330078125, 1.0126953125, 1.112060546875, 1.21142578125, 1.310791015625, 1.41015625, 1.509521484375, 1.60888671875, 1.708251953125, 1.8076171875, 1.906982421875, 2.00634765625, 2.105712890625, 2.205078125, 2.304443359375, 2.40380859375, 2.503173828125, 2.6025390625, 2.701904296875, 2.80126953125, 2.900634765625, 3.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 11.0, 6.0, 10.0, 11.0, 21.0, 20.0, 21.0, 22.0, 25.0, 33.0, 36.0, 65.0, 77.0, 87.0, 109.0, 104.0, 59.0, 47.0, 40.0, 35.0, 31.0, 21.0, 23.0, 16.0, 11.0, 11.0, 9.0, 6.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.39453125, -1.3538360595703125, -1.313140869140625, -1.2724456787109375, -1.23175048828125, -1.1910552978515625, -1.150360107421875, -1.1096649169921875, -1.0689697265625, -1.0282745361328125, -0.987579345703125, -0.9468841552734375, -0.90618896484375, -0.8654937744140625, -0.824798583984375, -0.7841033935546875, -0.743408203125, -0.7027130126953125, -0.662017822265625, -0.6213226318359375, -0.58062744140625, -0.5399322509765625, -0.499237060546875, -0.4585418701171875, -0.4178466796875, -0.3771514892578125, -0.336456298828125, -0.2957611083984375, -0.25506591796875, -0.2143707275390625, -0.173675537109375, -0.1329803466796875, -0.09228515625, -0.0515899658203125, -0.010894775390625, 0.0298004150390625, 0.07049560546875, 0.1111907958984375, 0.151885986328125, 0.1925811767578125, 0.2332763671875, 0.2739715576171875, 0.314666748046875, 0.3553619384765625, 0.39605712890625, 0.4367523193359375, 0.477447509765625, 0.5181427001953125, 0.558837890625, 0.5995330810546875, 0.640228271484375, 0.6809234619140625, 0.72161865234375, 0.7623138427734375, 0.803009033203125, 0.8437042236328125, 0.8843994140625, 0.9250946044921875, 0.965789794921875, 1.0064849853515625, 1.04718017578125, 1.0878753662109375, 1.128570556640625, 1.1692657470703125, 1.2099609375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 8.0, 7.0, 4.0, 6.0, 10.0, 11.0, 10.0, 17.0, 23.0, 18.0, 36.0, 43.0, 49.0, 71.0, 56.0, 73.0, 93.0, 78.0, 85.0, 60.0, 43.0, 42.0, 29.0, 15.0, 25.0, 14.0, 18.0, 16.0, 7.0, 9.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.684285163879395, -12.328146934509277, -11.972007751464844, -11.615869522094727, -11.25973129272461, -10.903592109680176, -10.547453880310059, -10.191314697265625, -9.835176467895508, -9.47903823852539, -9.122899055480957, -8.76676082611084, -8.410621643066406, -8.054483413696289, -7.698345184326172, -7.3422064781188965, -6.986067771911621, -6.629929065704346, -6.27379035949707, -5.917652130126953, -5.561513423919678, -5.205374717712402, -4.849236488342285, -4.49309778213501, -4.136959075927734, -3.780820369720459, -3.4246819019317627, -3.0685434341430664, -2.712404727935791, -2.3562660217285156, -2.0001275539398193, -1.643989086151123, -1.2878494262695312, -0.9317108392715454, -0.5755722522735596, -0.21943366527557373, 0.1367049217224121, 0.49284350872039795, 0.8489820957183838, 1.20512056350708, 1.5612592697143555, 1.9173978567123413, 2.273536443710327, 2.6296749114990234, 2.985813617706299, 3.341952323913574, 3.6980907917022705, 4.054229259490967, 4.410367965698242, 4.766506671905518, 5.122645378112793, 5.47878360748291, 5.8349223136901855, 6.191061019897461, 6.547199249267578, 6.9033379554748535, 7.259476661682129, 7.615615367889404, 7.97175407409668, 8.327892303466797, 8.684030532836914, 9.040169715881348, 9.396307945251465, 9.752447128295898, 10.108585357666016]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 10.0, 7.0, 8.0, 7.0, 12.0, 20.0, 13.0, 19.0, 19.0, 23.0, 30.0, 30.0, 32.0, 28.0, 28.0, 30.0, 38.0, 31.0, 44.0, 34.0, 40.0, 39.0, 28.0, 31.0, 33.0, 31.0, 37.0, 25.0, 34.0, 25.0, 23.0, 30.0, 23.0, 16.0, 23.0, 21.0, 10.0, 17.0, 15.0, 11.0, 2.0, 3.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.142831802368164, -9.806644439697266, -9.470458030700684, -9.134270668029785, -8.798084259033203, -8.461896896362305, -8.125709533691406, -7.789523124694824, -7.453335762023926, -7.1171488761901855, -6.780961990356445, -6.444774627685547, -6.108587741851807, -5.772400856018066, -5.436213970184326, -5.100027084350586, -4.763840198516846, -4.4276533126831055, -4.091466426849365, -3.755279302597046, -3.4190921783447266, -3.0829052925109863, -2.746718406677246, -2.4105312824249268, -2.0743443965911865, -1.7381573915481567, -1.401970386505127, -1.0657835006713867, -0.7295964956283569, -0.39340949058532715, -0.057222604751586914, 0.2789645195007324, 0.6151514053344727, 0.9513384103775024, 1.2875254154205322, 1.6237123012542725, 1.9598993062973022, 2.296086311340332, 2.6322731971740723, 2.9684603214263916, 3.304647207260132, 3.640834093093872, 3.9770212173461914, 4.313208103179932, 4.649394989013672, 4.98558235168457, 5.321768760681152, 5.657956123352051, 5.994143009185791, 6.330329895019531, 6.6665167808532715, 7.002703666687012, 7.33889102935791, 7.67507791519165, 8.01126480102539, 8.347452163696289, 8.683638572692871, 9.01982593536377, 9.356012344360352, 9.69219970703125, 10.028386116027832, 10.36457347869873, 10.700759887695312, 11.036947250366211, 11.37313461303711]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 9.0, 12.0, 28.0, 54.0, 60.0, 95.0, 165.0, 243.0, 433.0, 647.0, 939.0, 1471.0, 2309.0, 3451.0, 5359.0, 8234.0, 13172.0, 20276.0, 32327.0, 52749.0, 88521.0, 161861.0, 386374.0, 1150597.0, 1340355.0, 486758.0, 181125.0, 97084.0, 57901.0, 35902.0, 22770.0, 14497.0, 9385.0, 6369.0, 4126.0, 2774.0, 1795.0, 1278.0, 822.0, 602.0, 406.0, 280.0, 212.0, 158.0, 76.0, 73.0, 54.0, 39.0, 26.0, 13.0, 7.0, 10.0, 3.0, 1.0, 1.0], "bins": [-13.3203125, -12.91796875, -12.515625, -12.11328125, -11.7109375, -11.30859375, -10.90625, -10.50390625, -10.1015625, -9.69921875, -9.296875, -8.89453125, -8.4921875, -8.08984375, -7.6875, -7.28515625, -6.8828125, -6.48046875, -6.078125, -5.67578125, -5.2734375, -4.87109375, -4.46875, -4.06640625, -3.6640625, -3.26171875, -2.859375, -2.45703125, -2.0546875, -1.65234375, -1.25, -0.84765625, -0.4453125, -0.04296875, 0.359375, 0.76171875, 1.1640625, 1.56640625, 1.96875, 2.37109375, 2.7734375, 3.17578125, 3.578125, 3.98046875, 4.3828125, 4.78515625, 5.1875, 5.58984375, 5.9921875, 6.39453125, 6.796875, 7.19921875, 7.6015625, 8.00390625, 8.40625, 8.80859375, 9.2109375, 9.61328125, 10.015625, 10.41796875, 10.8203125, 11.22265625, 11.625, 12.02734375, 12.4296875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 7.0, 6.0, 7.0, 15.0, 14.0, 15.0, 20.0, 18.0, 28.0, 39.0, 22.0, 31.0, 35.0, 28.0, 30.0, 40.0, 26.0, 38.0, 40.0, 39.0, 43.0, 39.0, 35.0, 38.0, 28.0, 36.0, 29.0, 22.0, 30.0, 41.0, 22.0, 17.0, 14.0, 20.0, 19.0, 15.0, 14.0, 8.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.3677978515625, -9.063720703125, -8.7596435546875, -8.45556640625, -8.1514892578125, -7.847412109375, -7.5433349609375, -7.2392578125, -6.9351806640625, -6.631103515625, -6.3270263671875, -6.02294921875, -5.7188720703125, -5.414794921875, -5.1107177734375, -4.806640625, -4.5025634765625, -4.198486328125, -3.8944091796875, -3.59033203125, -3.2862548828125, -2.982177734375, -2.6781005859375, -2.3740234375, -2.0699462890625, -1.765869140625, -1.4617919921875, -1.15771484375, -0.8536376953125, -0.549560546875, -0.2454833984375, 0.05859375, 0.3626708984375, 0.666748046875, 0.9708251953125, 1.27490234375, 1.5789794921875, 1.883056640625, 2.1871337890625, 2.4912109375, 2.7952880859375, 3.099365234375, 3.4034423828125, 3.70751953125, 4.0115966796875, 4.315673828125, 4.6197509765625, 4.923828125, 5.2279052734375, 5.531982421875, 5.8360595703125, 6.14013671875, 6.4442138671875, 6.748291015625, 7.0523681640625, 7.3564453125, 7.6605224609375, 7.964599609375, 8.2686767578125, 8.57275390625, 8.8768310546875, 9.180908203125, 9.4849853515625, 9.7890625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 12.0, 9.0, 24.0, 27.0, 42.0, 75.0, 102.0, 165.0, 265.0, 425.0, 603.0, 1023.0, 1578.0, 2841.0, 4717.0, 8088.0, 13990.0, 24659.0, 45591.0, 87522.0, 179909.0, 415700.0, 1207487.0, 1342571.0, 457869.0, 194582.0, 93484.0, 48741.0, 26215.0, 14845.0, 8572.0, 4967.0, 2982.0, 1749.0, 1005.0, 690.0, 431.0, 280.0, 170.0, 101.0, 63.0, 37.0, 32.0, 10.0, 10.0, 9.0, 7.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8515625, -14.38818359375, -13.9248046875, -13.46142578125, -12.998046875, -12.53466796875, -12.0712890625, -11.60791015625, -11.14453125, -10.68115234375, -10.2177734375, -9.75439453125, -9.291015625, -8.82763671875, -8.3642578125, -7.90087890625, -7.4375, -6.97412109375, -6.5107421875, -6.04736328125, -5.583984375, -5.12060546875, -4.6572265625, -4.19384765625, -3.73046875, -3.26708984375, -2.8037109375, -2.34033203125, -1.876953125, -1.41357421875, -0.9501953125, -0.48681640625, -0.0234375, 0.43994140625, 0.9033203125, 1.36669921875, 1.830078125, 2.29345703125, 2.7568359375, 3.22021484375, 3.68359375, 4.14697265625, 4.6103515625, 5.07373046875, 5.537109375, 6.00048828125, 6.4638671875, 6.92724609375, 7.390625, 7.85400390625, 8.3173828125, 8.78076171875, 9.244140625, 9.70751953125, 10.1708984375, 10.63427734375, 11.09765625, 11.56103515625, 12.0244140625, 12.48779296875, 12.951171875, 13.41455078125, 13.8779296875, 14.34130859375, 14.8046875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 12.0, 13.0, 22.0, 23.0, 30.0, 19.0, 40.0, 48.0, 64.0, 86.0, 98.0, 116.0, 111.0, 194.0, 189.0, 253.0, 322.0, 401.0, 407.0, 314.0, 243.0, 200.0, 154.0, 140.0, 118.0, 101.0, 73.0, 53.0, 48.0, 28.0, 24.0, 35.0, 18.0, 14.0, 15.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.41790771484375, -5.2381591796875, -5.05841064453125, -4.878662109375, -4.69891357421875, -4.5191650390625, -4.33941650390625, -4.15966796875, -3.97991943359375, -3.8001708984375, -3.62042236328125, -3.440673828125, -3.26092529296875, -3.0811767578125, -2.90142822265625, -2.7216796875, -2.54193115234375, -2.3621826171875, -2.18243408203125, -2.002685546875, -1.82293701171875, -1.6431884765625, -1.46343994140625, -1.28369140625, -1.10394287109375, -0.9241943359375, -0.74444580078125, -0.564697265625, -0.38494873046875, -0.2052001953125, -0.02545166015625, 0.154296875, 0.33404541015625, 0.5137939453125, 0.69354248046875, 0.873291015625, 1.05303955078125, 1.2327880859375, 1.41253662109375, 1.59228515625, 1.77203369140625, 1.9517822265625, 2.13153076171875, 2.311279296875, 2.49102783203125, 2.6707763671875, 2.85052490234375, 3.0302734375, 3.21002197265625, 3.3897705078125, 3.56951904296875, 3.749267578125, 3.92901611328125, 4.1087646484375, 4.28851318359375, 4.46826171875, 4.64801025390625, 4.8277587890625, 5.00750732421875, 5.187255859375, 5.36700439453125, 5.5467529296875, 5.72650146484375, 5.90625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 1.0, 7.0, 13.0, 18.0, 19.0, 9.0, 28.0, 19.0, 20.0, 32.0, 37.0, 44.0, 56.0, 87.0, 86.0, 74.0, 60.0, 75.0, 60.0, 37.0, 30.0, 35.0, 24.0, 25.0, 16.0, 10.0, 10.0, 9.0, 7.0, 5.0, 9.0, 8.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.706703186035156, -8.39739990234375, -8.08809757232666, -7.778794288635254, -7.469491004943848, -7.1601881980896, -6.850885391235352, -6.541582107543945, -6.232279300689697, -5.922976493835449, -5.613673210144043, -5.304370403289795, -4.995067596435547, -4.685764312744141, -4.376461505889893, -4.0671586990356445, -3.7578554153442383, -3.448552370071411, -3.139249324798584, -2.829946517944336, -2.520643472671509, -2.2113404273986816, -1.902037501335144, -1.5927345752716064, -1.2834315299987793, -0.9741285443305969, -0.6648255586624146, -0.3555225729942322, -0.046219587326049805, 0.26308345794677734, 0.5723863840103149, 0.8816893100738525, 1.1909914016723633, 1.5002944469451904, 1.809597373008728, 2.1189002990722656, 2.4282033443450928, 2.73750638961792, 3.046809196472168, 3.356112241744995, 3.6654152870178223, 3.9747183322906494, 4.284021377563477, 4.593324184417725, 4.902626991271973, 5.211930274963379, 5.521233081817627, 5.830535888671875, 6.139839172363281, 6.449141979217529, 6.7584452629089355, 7.067748069763184, 7.37705135345459, 7.686354160308838, 7.995656967163086, 8.304960250854492, 8.614263534545898, 8.923566818237305, 9.232869148254395, 9.5421724319458, 9.851475715637207, 10.160778045654297, 10.470081329345703, 10.77938461303711, 11.0886869430542]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 9.0, 5.0, 10.0, 12.0, 11.0, 17.0, 11.0, 21.0, 23.0, 17.0, 31.0, 34.0, 34.0, 38.0, 34.0, 38.0, 31.0, 37.0, 32.0, 29.0, 43.0, 37.0, 40.0, 39.0, 33.0, 38.0, 43.0, 28.0, 31.0, 26.0, 27.0, 24.0, 25.0, 10.0, 16.0, 10.0, 7.0, 10.0, 13.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-12.014616966247559, -11.654500961303711, -11.294384956359863, -10.934268951416016, -10.574152946472168, -10.21403694152832, -9.853920936584473, -9.493804931640625, -9.133688926696777, -8.77357292175293, -8.413456916809082, -8.053340911865234, -7.693224906921387, -7.333108901977539, -6.972992897033691, -6.612876892089844, -6.252760410308838, -5.89264440536499, -5.532528400421143, -5.172412395477295, -4.812296390533447, -4.4521803855896, -4.092063903808594, -3.731948137283325, -3.3718321323394775, -3.01171612739563, -2.6516001224517822, -2.2914838790893555, -1.9313679933547974, -1.5712519884109497, -1.2111358642578125, -0.8510198593139648, -0.4909038543701172, -0.13078781962394714, 0.2293282151222229, 0.5894442796707153, 0.949560284614563, 1.3096762895584106, 1.6697924137115479, 2.0299084186553955, 2.390024423599243, 2.750140428543091, 3.1102564334869385, 3.4703726768493652, 3.830488681793213, 4.1906046867370605, 4.550720691680908, 4.910836696624756, 5.2709527015686035, 5.631068706512451, 5.991184711456299, 6.3513007164001465, 6.711416721343994, 7.071532726287842, 7.431649208068848, 7.791765213012695, 8.151881217956543, 8.51199722290039, 8.872113227844238, 9.232229232788086, 9.592345237731934, 9.952461242675781, 10.312577247619629, 10.672693252563477, 11.032809257507324]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 5.0, 11.0, 17.0, 18.0, 27.0, 39.0, 66.0, 84.0, 126.0, 178.0, 228.0, 306.0, 503.0, 670.0, 922.0, 1378.0, 1976.0, 2856.0, 4297.0, 6413.0, 9531.0, 14579.0, 22987.0, 36744.0, 59963.0, 101873.0, 211836.0, 276160.0, 114693.0, 66181.0, 40081.0, 25287.0, 16244.0, 10457.0, 6924.0, 4810.0, 3145.0, 2164.0, 1472.0, 1019.0, 663.0, 490.0, 326.0, 226.0, 165.0, 125.0, 90.0, 64.0, 39.0, 30.0, 25.0, 19.0, 18.0, 4.0, 6.0, 0.0, 1.0, 2.0, 3.0], "bins": [-3.142578125, -3.044677734375, -2.94677734375, -2.848876953125, -2.7509765625, -2.653076171875, -2.55517578125, -2.457275390625, -2.359375, -2.261474609375, -2.16357421875, -2.065673828125, -1.9677734375, -1.869873046875, -1.77197265625, -1.674072265625, -1.576171875, -1.478271484375, -1.38037109375, -1.282470703125, -1.1845703125, -1.086669921875, -0.98876953125, -0.890869140625, -0.79296875, -0.695068359375, -0.59716796875, -0.499267578125, -0.4013671875, -0.303466796875, -0.20556640625, -0.107666015625, -0.009765625, 0.088134765625, 0.18603515625, 0.283935546875, 0.3818359375, 0.479736328125, 0.57763671875, 0.675537109375, 0.7734375, 0.871337890625, 0.96923828125, 1.067138671875, 1.1650390625, 1.262939453125, 1.36083984375, 1.458740234375, 1.556640625, 1.654541015625, 1.75244140625, 1.850341796875, 1.9482421875, 2.046142578125, 2.14404296875, 2.241943359375, 2.33984375, 2.437744140625, 2.53564453125, 2.633544921875, 2.7314453125, 2.829345703125, 2.92724609375, 3.025146484375, 3.123046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 8.0, 15.0, 21.0, 11.0, 15.0, 26.0, 22.0, 32.0, 30.0, 28.0, 43.0, 37.0, 35.0, 28.0, 48.0, 23.0, 40.0, 42.0, 44.0, 34.0, 40.0, 31.0, 41.0, 33.0, 32.0, 26.0, 38.0, 28.0, 23.0, 14.0, 15.0, 17.0, 10.0, 5.0, 10.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.84375, -11.474853515625, -11.10595703125, -10.737060546875, -10.3681640625, -9.999267578125, -9.63037109375, -9.261474609375, -8.892578125, -8.523681640625, -8.15478515625, -7.785888671875, -7.4169921875, -7.048095703125, -6.67919921875, -6.310302734375, -5.94140625, -5.572509765625, -5.20361328125, -4.834716796875, -4.4658203125, -4.096923828125, -3.72802734375, -3.359130859375, -2.990234375, -2.621337890625, -2.25244140625, -1.883544921875, -1.5146484375, -1.145751953125, -0.77685546875, -0.407958984375, -0.0390625, 0.329833984375, 0.69873046875, 1.067626953125, 1.4365234375, 1.805419921875, 2.17431640625, 2.543212890625, 2.912109375, 3.281005859375, 3.64990234375, 4.018798828125, 4.3876953125, 4.756591796875, 5.12548828125, 5.494384765625, 5.86328125, 6.232177734375, 6.60107421875, 6.969970703125, 7.3388671875, 7.707763671875, 8.07666015625, 8.445556640625, 8.814453125, 9.183349609375, 9.55224609375, 9.921142578125, 10.2900390625, 10.658935546875, 11.02783203125, 11.396728515625, 11.765625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 13.0, 12.0, 21.0, 29.0, 39.0, 52.0, 80.0, 91.0, 112.0, 182.0, 226.0, 345.0, 446.0, 604.0, 851.0, 1219.0, 1685.0, 2283.0, 3443.0, 4930.0, 7153.0, 10652.0, 15933.0, 24023.0, 37382.0, 60196.0, 106463.0, 250921.0, 243488.0, 105156.0, 59504.0, 37385.0, 23872.0, 15727.0, 10340.0, 7213.0, 4852.0, 3370.0, 2407.0, 1639.0, 1144.0, 859.0, 624.0, 448.0, 307.0, 244.0, 172.0, 112.0, 106.0, 64.0, 40.0, 39.0, 17.0, 17.0, 14.0, 11.0, 3.0, 6.0, 1.0, 1.0], "bins": [-3.123046875, -3.025421142578125, -2.92779541015625, -2.830169677734375, -2.7325439453125, -2.634918212890625, -2.53729248046875, -2.439666748046875, -2.342041015625, -2.244415283203125, -2.14678955078125, -2.049163818359375, -1.9515380859375, -1.853912353515625, -1.75628662109375, -1.658660888671875, -1.56103515625, -1.463409423828125, -1.36578369140625, -1.268157958984375, -1.1705322265625, -1.072906494140625, -0.97528076171875, -0.877655029296875, -0.780029296875, -0.682403564453125, -0.58477783203125, -0.487152099609375, -0.3895263671875, -0.291900634765625, -0.19427490234375, -0.096649169921875, 0.0009765625, 0.098602294921875, 0.19622802734375, 0.293853759765625, 0.3914794921875, 0.489105224609375, 0.58673095703125, 0.684356689453125, 0.781982421875, 0.879608154296875, 0.97723388671875, 1.074859619140625, 1.1724853515625, 1.270111083984375, 1.36773681640625, 1.465362548828125, 1.56298828125, 1.660614013671875, 1.75823974609375, 1.855865478515625, 1.9534912109375, 2.051116943359375, 2.14874267578125, 2.246368408203125, 2.343994140625, 2.441619873046875, 2.53924560546875, 2.636871337890625, 2.7344970703125, 2.832122802734375, 2.92974853515625, 3.027374267578125, 3.125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 3.0, 5.0, 7.0, 10.0, 8.0, 16.0, 14.0, 9.0, 21.0, 24.0, 24.0, 35.0, 22.0, 25.0, 36.0, 37.0, 26.0, 42.0, 42.0, 43.0, 36.0, 42.0, 34.0, 40.0, 44.0, 45.0, 32.0, 29.0, 29.0, 29.0, 29.0, 20.0, 16.0, 17.0, 22.0, 7.0, 10.0, 16.0, 10.0, 10.0, 4.0, 2.0, 6.0, 7.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.32421875, -7.0875244140625, -6.850830078125, -6.6141357421875, -6.37744140625, -6.1407470703125, -5.904052734375, -5.6673583984375, -5.4306640625, -5.1939697265625, -4.957275390625, -4.7205810546875, -4.48388671875, -4.2471923828125, -4.010498046875, -3.7738037109375, -3.537109375, -3.3004150390625, -3.063720703125, -2.8270263671875, -2.59033203125, -2.3536376953125, -2.116943359375, -1.8802490234375, -1.6435546875, -1.4068603515625, -1.170166015625, -0.9334716796875, -0.69677734375, -0.4600830078125, -0.223388671875, 0.0133056640625, 0.25, 0.4866943359375, 0.723388671875, 0.9600830078125, 1.19677734375, 1.4334716796875, 1.670166015625, 1.9068603515625, 2.1435546875, 2.3802490234375, 2.616943359375, 2.8536376953125, 3.09033203125, 3.3270263671875, 3.563720703125, 3.8004150390625, 4.037109375, 4.2738037109375, 4.510498046875, 4.7471923828125, 4.98388671875, 5.2205810546875, 5.457275390625, 5.6939697265625, 5.9306640625, 6.1673583984375, 6.404052734375, 6.6407470703125, 6.87744140625, 7.1141357421875, 7.350830078125, 7.5875244140625, 7.82421875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 12.0, 9.0, 26.0, 24.0, 52.0, 67.0, 84.0, 120.0, 205.0, 255.0, 407.0, 624.0, 844.0, 1224.0, 1766.0, 2813.0, 4352.0, 7269.0, 12823.0, 23944.0, 49637.0, 119288.0, 353125.0, 281242.0, 96898.0, 41338.0, 20834.0, 11161.0, 6612.0, 3791.0, 2530.0, 1601.0, 1091.0, 767.0, 471.0, 364.0, 252.0, 169.0, 118.0, 90.0, 65.0, 54.0, 35.0, 35.0, 13.0, 14.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.005924224853515625, -0.0057440996170043945, -0.005563974380493164, -0.005383849143981934, -0.005203723907470703, -0.005023598670959473, -0.004843473434448242, -0.004663348197937012, -0.004483222961425781, -0.004303097724914551, -0.00412297248840332, -0.00394284725189209, -0.0037627220153808594, -0.003582596778869629, -0.0034024715423583984, -0.003222346305847168, -0.0030422210693359375, -0.002862095832824707, -0.0026819705963134766, -0.002501845359802246, -0.0023217201232910156, -0.002141594886779785, -0.0019614696502685547, -0.0017813444137573242, -0.0016012191772460938, -0.0014210939407348633, -0.0012409687042236328, -0.0010608434677124023, -0.0008807182312011719, -0.0007005929946899414, -0.0005204677581787109, -0.00034034252166748047, -0.00016021728515625, 1.990795135498047e-05, 0.00020003318786621094, 0.0003801584243774414, 0.0005602836608886719, 0.0007404088973999023, 0.0009205341339111328, 0.0011006593704223633, 0.0012807846069335938, 0.0014609098434448242, 0.0016410350799560547, 0.0018211603164672852, 0.0020012855529785156, 0.002181410789489746, 0.0023615360260009766, 0.002541661262512207, 0.0027217864990234375, 0.002901911735534668, 0.0030820369720458984, 0.003262162208557129, 0.0034422874450683594, 0.00362241268157959, 0.0038025379180908203, 0.003982663154602051, 0.004162788391113281, 0.004342913627624512, 0.004523038864135742, 0.004703164100646973, 0.004883289337158203, 0.005063414573669434, 0.005243539810180664, 0.0054236650466918945, 0.005603790283203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 9.0, 9.0, 9.0, 9.0, 27.0, 25.0, 39.0, 45.0, 31.0, 50.0, 51.0, 20.0, 56.0, 58.0, 66.0, 60.0, 74.0, 34.0, 59.0, 18.0, 38.0, 34.0, 21.0, 26.0, 21.0, 15.0, 16.0, 8.0, 9.0, 9.0, 7.0, 5.0, 8.0, 6.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.874301910400391e-06, -3.762543201446533e-06, -3.6507844924926758e-06, -3.5390257835388184e-06, -3.427267074584961e-06, -3.3155083656311035e-06, -3.203749656677246e-06, -3.0919909477233887e-06, -2.9802322387695312e-06, -2.868473529815674e-06, -2.7567148208618164e-06, -2.644956111907959e-06, -2.5331974029541016e-06, -2.421438694000244e-06, -2.3096799850463867e-06, -2.1979212760925293e-06, -2.086162567138672e-06, -1.9744038581848145e-06, -1.862645149230957e-06, -1.7508864402770996e-06, -1.6391277313232422e-06, -1.5273690223693848e-06, -1.4156103134155273e-06, -1.30385160446167e-06, -1.1920928955078125e-06, -1.080334186553955e-06, -9.685754776000977e-07, -8.568167686462402e-07, -7.450580596923828e-07, -6.332993507385254e-07, -5.21540641784668e-07, -4.0978193283081055e-07, -2.980232238769531e-07, -1.862645149230957e-07, -7.450580596923828e-08, 3.725290298461914e-08, 1.4901161193847656e-07, 2.60770320892334e-07, 3.725290298461914e-07, 4.842877388000488e-07, 5.960464477539062e-07, 7.078051567077637e-07, 8.195638656616211e-07, 9.313225746154785e-07, 1.043081283569336e-06, 1.1548399925231934e-06, 1.2665987014770508e-06, 1.3783574104309082e-06, 1.4901161193847656e-06, 1.601874828338623e-06, 1.7136335372924805e-06, 1.8253922462463379e-06, 1.9371509552001953e-06, 2.0489096641540527e-06, 2.16066837310791e-06, 2.2724270820617676e-06, 2.384185791015625e-06, 2.4959444999694824e-06, 2.60770320892334e-06, 2.7194619178771973e-06, 2.8312206268310547e-06, 2.942979335784912e-06, 3.0547380447387695e-06, 3.166496753692627e-06, 3.2782554626464844e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 15.0, 20.0, 32.0, 34.0, 72.0, 121.0, 160.0, 259.0, 428.0, 687.0, 1096.0, 1782.0, 2946.0, 4779.0, 8294.0, 15378.0, 30572.0, 69096.0, 194202.0, 427867.0, 167082.0, 61973.0, 28036.0, 14038.0, 7833.0, 4681.0, 2723.0, 1654.0, 1000.0, 653.0, 374.0, 202.0, 178.0, 79.0, 67.0, 40.0, 21.0, 25.0, 18.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006099700927734375, -0.005911648273468018, -0.00572359561920166, -0.005535542964935303, -0.005347490310668945, -0.005159437656402588, -0.0049713850021362305, -0.004783332347869873, -0.004595279693603516, -0.004407227039337158, -0.004219174385070801, -0.004031121730804443, -0.003843069076538086, -0.0036550164222717285, -0.003466963768005371, -0.0032789111137390137, -0.0030908584594726562, -0.002902805805206299, -0.0027147531509399414, -0.002526700496673584, -0.0023386478424072266, -0.002150595188140869, -0.0019625425338745117, -0.0017744898796081543, -0.0015864372253417969, -0.0013983845710754395, -0.001210331916809082, -0.0010222792625427246, -0.0008342266082763672, -0.0006461739540100098, -0.00045812129974365234, -0.0002700686454772949, -8.20159912109375e-05, 0.00010603666305541992, 0.00029408931732177734, 0.00048214197158813477, 0.0006701946258544922, 0.0008582472801208496, 0.001046299934387207, 0.0012343525886535645, 0.0014224052429199219, 0.0016104578971862793, 0.0017985105514526367, 0.001986563205718994, 0.0021746158599853516, 0.002362668514251709, 0.0025507211685180664, 0.002738773822784424, 0.0029268264770507812, 0.0031148791313171387, 0.003302931785583496, 0.0034909844398498535, 0.003679037094116211, 0.0038670897483825684, 0.004055142402648926, 0.004243195056915283, 0.004431247711181641, 0.004619300365447998, 0.0048073530197143555, 0.004995405673980713, 0.00518345832824707, 0.005371510982513428, 0.005559563636779785, 0.005747616291046143, 0.0059356689453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 7.0, 9.0, 12.0, 13.0, 19.0, 17.0, 31.0, 38.0, 35.0, 49.0, 50.0, 66.0, 93.0, 96.0, 86.0, 84.0, 65.0, 43.0, 34.0, 36.0, 13.0, 14.0, 11.0, 14.0, 11.0, 11.0, 4.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025310516357421875, -0.002461269497871399, -0.0023914873600006104, -0.0023217052221298218, -0.002251923084259033, -0.0021821409463882446, -0.002112358808517456, -0.0020425766706466675, -0.001972794532775879, -0.0019030123949050903, -0.0018332302570343018, -0.0017634481191635132, -0.0016936659812927246, -0.001623883843421936, -0.0015541017055511475, -0.0014843195676803589, -0.0014145374298095703, -0.0013447552919387817, -0.0012749731540679932, -0.0012051910161972046, -0.001135408878326416, -0.0010656267404556274, -0.0009958446025848389, -0.0009260624647140503, -0.0008562803268432617, -0.0007864981889724731, -0.0007167160511016846, -0.000646933913230896, -0.0005771517753601074, -0.0005073696374893188, -0.0004375874996185303, -0.0003678053617477417, -0.0002980232238769531, -0.00022824108600616455, -0.00015845894813537598, -8.86768102645874e-05, -1.8894672393798828e-05, 5.0887465476989746e-05, 0.00012066960334777832, 0.0001904517412185669, 0.00026023387908935547, 0.00033001601696014404, 0.0003997981548309326, 0.0004695802927017212, 0.0005393624305725098, 0.0006091445684432983, 0.0006789267063140869, 0.0007487088441848755, 0.0008184909820556641, 0.0008882731199264526, 0.0009580552577972412, 0.0010278373956680298, 0.0010976195335388184, 0.001167401671409607, 0.0012371838092803955, 0.001306965947151184, 0.0013767480850219727, 0.0014465302228927612, 0.0015163123607635498, 0.0015860944986343384, 0.001655876636505127, 0.0017256587743759155, 0.001795440912246704, 0.0018652230501174927, 0.0019350051879882812]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 4.0, 7.0, 8.0, 18.0, 13.0, 11.0, 24.0, 18.0, 22.0, 23.0, 33.0, 45.0, 49.0, 61.0, 92.0, 75.0, 70.0, 71.0, 67.0, 54.0, 31.0, 37.0, 27.0, 23.0, 18.0, 18.0, 11.0, 6.0, 14.0, 4.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.882548332214355, -8.573310852050781, -8.264073371887207, -7.954835414886475, -7.6455979347229, -7.336359977722168, -7.027122497558594, -6.7178850173950195, -6.408647537231445, -6.099410057067871, -5.790172100067139, -5.4809346199035645, -5.17169713973999, -4.862459182739258, -4.553221702575684, -4.243984222412109, -3.934746265411377, -3.6255085468292236, -3.3162710666656494, -3.007033348083496, -2.697795867919922, -2.3885581493377686, -2.0793204307556152, -1.770082950592041, -1.4608452320098877, -1.151607632637024, -0.8423699736595154, -0.5331323146820068, -0.22389471530914307, 0.0853428840637207, 0.394580602645874, 0.7038180828094482, 1.0130558013916016, 1.3222934007644653, 1.631531000137329, 1.9407687187194824, 2.2500061988830566, 2.55924391746521, 2.8684816360473633, 3.1777191162109375, 3.486956834793091, 3.796194553375244, 4.105432033538818, 4.414669990539551, 4.723907470703125, 5.033144950866699, 5.342382431030273, 5.651619911193848, 5.96085786819458, 6.270095348358154, 6.579333305358887, 6.888570785522461, 7.197808265686035, 7.507045745849609, 7.816283702850342, 8.125520706176758, 8.434759140014648, 8.743996620178223, 9.053234100341797, 9.362472534179688, 9.671710014343262, 9.980947494506836, 10.29018497467041, 10.599422454833984, 10.908659934997559]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 9.0, 5.0, 10.0, 12.0, 11.0, 17.0, 11.0, 20.0, 24.0, 16.0, 34.0, 34.0, 32.0, 38.0, 35.0, 37.0, 33.0, 34.0, 34.0, 29.0, 42.0, 39.0, 39.0, 38.0, 33.0, 38.0, 43.0, 28.0, 31.0, 26.0, 28.0, 23.0, 25.0, 10.0, 16.0, 10.0, 7.0, 10.0, 13.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.95711612701416, -11.597426414489746, -11.237736701965332, -10.878046989440918, -10.518357276916504, -10.15866756439209, -9.798977851867676, -9.439288139343262, -9.079598426818848, -8.719908714294434, -8.36021900177002, -8.000529289245605, -7.640839576721191, -7.281149864196777, -6.921460151672363, -6.561770439147949, -6.202080726623535, -5.842391014099121, -5.482701301574707, -5.123011589050293, -4.763321876525879, -4.403632164001465, -4.043942451477051, -3.6842527389526367, -3.3245630264282227, -2.9648733139038086, -2.6051836013793945, -2.2454938888549805, -1.8858041763305664, -1.5261144638061523, -1.1664247512817383, -0.8067350387573242, -0.44704437255859375, -0.08735466003417969, 0.2723350524902344, 0.6320247650146484, 0.9917144775390625, 1.3514041900634766, 1.7110939025878906, 2.0707836151123047, 2.4304733276367188, 2.790163040161133, 3.149852752685547, 3.509542465209961, 3.869232177734375, 4.228921890258789, 4.588611602783203, 4.948301315307617, 5.307991027832031, 5.667680740356445, 6.027370452880859, 6.387060165405273, 6.7467498779296875, 7.106439590454102, 7.466129302978516, 7.82581901550293, 8.185508728027344, 8.545198440551758, 8.904888153076172, 9.264577865600586, 9.624267578125, 9.983957290649414, 10.343647003173828, 10.703336715698242, 11.063026428222656]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 23.0, 33.0, 46.0, 54.0, 103.0, 144.0, 232.0, 366.0, 527.0, 943.0, 1467.0, 2236.0, 3530.0, 5902.0, 9769.0, 16879.0, 29404.0, 53832.0, 104188.0, 205334.0, 264713.0, 163958.0, 81928.0, 43177.0, 24258.0, 14078.0, 8264.0, 4902.0, 3077.0, 1919.0, 1187.0, 769.0, 471.0, 278.0, 180.0, 113.0, 86.0, 58.0, 46.0, 26.0, 20.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-22.578125, -21.93896484375, -21.2998046875, -20.66064453125, -20.021484375, -19.38232421875, -18.7431640625, -18.10400390625, -17.46484375, -16.82568359375, -16.1865234375, -15.54736328125, -14.908203125, -14.26904296875, -13.6298828125, -12.99072265625, -12.3515625, -11.71240234375, -11.0732421875, -10.43408203125, -9.794921875, -9.15576171875, -8.5166015625, -7.87744140625, -7.23828125, -6.59912109375, -5.9599609375, -5.32080078125, -4.681640625, -4.04248046875, -3.4033203125, -2.76416015625, -2.125, -1.48583984375, -0.8466796875, -0.20751953125, 0.431640625, 1.07080078125, 1.7099609375, 2.34912109375, 2.98828125, 3.62744140625, 4.2666015625, 4.90576171875, 5.544921875, 6.18408203125, 6.8232421875, 7.46240234375, 8.1015625, 8.74072265625, 9.3798828125, 10.01904296875, 10.658203125, 11.29736328125, 11.9365234375, 12.57568359375, 13.21484375, 13.85400390625, 14.4931640625, 15.13232421875, 15.771484375, 16.41064453125, 17.0498046875, 17.68896484375, 18.328125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 9.0, 9.0, 13.0, 6.0, 14.0, 14.0, 20.0, 22.0, 29.0, 24.0, 41.0, 37.0, 32.0, 37.0, 37.0, 32.0, 47.0, 39.0, 30.0, 41.0, 43.0, 50.0, 33.0, 47.0, 40.0, 32.0, 25.0, 35.0, 40.0, 25.0, 19.0, 9.0, 14.0, 11.0, 8.0, 9.0, 6.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.078125, -11.711669921875, -11.34521484375, -10.978759765625, -10.6123046875, -10.245849609375, -9.87939453125, -9.512939453125, -9.146484375, -8.780029296875, -8.41357421875, -8.047119140625, -7.6806640625, -7.314208984375, -6.94775390625, -6.581298828125, -6.21484375, -5.848388671875, -5.48193359375, -5.115478515625, -4.7490234375, -4.382568359375, -4.01611328125, -3.649658203125, -3.283203125, -2.916748046875, -2.55029296875, -2.183837890625, -1.8173828125, -1.450927734375, -1.08447265625, -0.718017578125, -0.3515625, 0.014892578125, 0.38134765625, 0.747802734375, 1.1142578125, 1.480712890625, 1.84716796875, 2.213623046875, 2.580078125, 2.946533203125, 3.31298828125, 3.679443359375, 4.0458984375, 4.412353515625, 4.77880859375, 5.145263671875, 5.51171875, 5.878173828125, 6.24462890625, 6.611083984375, 6.9775390625, 7.343994140625, 7.71044921875, 8.076904296875, 8.443359375, 8.809814453125, 9.17626953125, 9.542724609375, 9.9091796875, 10.275634765625, 10.64208984375, 11.008544921875, 11.375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 17.0, 24.0, 33.0, 38.0, 63.0, 95.0, 124.0, 158.0, 231.0, 351.0, 508.0, 753.0, 1121.0, 1475.0, 2161.0, 3231.0, 4634.0, 6923.0, 10233.0, 15301.0, 23515.0, 36707.0, 58771.0, 99848.0, 172542.0, 217477.0, 153402.0, 88410.0, 52578.0, 33170.0, 21258.0, 13947.0, 9449.0, 6284.0, 4198.0, 2889.0, 2025.0, 1439.0, 952.0, 642.0, 444.0, 328.0, 247.0, 139.0, 133.0, 101.0, 58.0, 34.0, 25.0, 28.0, 13.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0], "bins": [-16.390625, -15.884521484375, -15.37841796875, -14.872314453125, -14.3662109375, -13.860107421875, -13.35400390625, -12.847900390625, -12.341796875, -11.835693359375, -11.32958984375, -10.823486328125, -10.3173828125, -9.811279296875, -9.30517578125, -8.799072265625, -8.29296875, -7.786865234375, -7.28076171875, -6.774658203125, -6.2685546875, -5.762451171875, -5.25634765625, -4.750244140625, -4.244140625, -3.738037109375, -3.23193359375, -2.725830078125, -2.2197265625, -1.713623046875, -1.20751953125, -0.701416015625, -0.1953125, 0.310791015625, 0.81689453125, 1.322998046875, 1.8291015625, 2.335205078125, 2.84130859375, 3.347412109375, 3.853515625, 4.359619140625, 4.86572265625, 5.371826171875, 5.8779296875, 6.384033203125, 6.89013671875, 7.396240234375, 7.90234375, 8.408447265625, 8.91455078125, 9.420654296875, 9.9267578125, 10.432861328125, 10.93896484375, 11.445068359375, 11.951171875, 12.457275390625, 12.96337890625, 13.469482421875, 13.9755859375, 14.481689453125, 14.98779296875, 15.493896484375, 16.0]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 8.0, 4.0, 12.0, 9.0, 16.0, 18.0, 18.0, 23.0, 29.0, 31.0, 21.0, 35.0, 32.0, 37.0, 44.0, 39.0, 32.0, 42.0, 41.0, 38.0, 48.0, 36.0, 42.0, 34.0, 33.0, 35.0, 31.0, 29.0, 30.0, 19.0, 14.0, 12.0, 21.0, 15.0, 10.0, 13.0, 8.0, 5.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.54510498046875, -6.3206787109375, -6.09625244140625, -5.871826171875, -5.64739990234375, -5.4229736328125, -5.19854736328125, -4.97412109375, -4.74969482421875, -4.5252685546875, -4.30084228515625, -4.076416015625, -3.85198974609375, -3.6275634765625, -3.40313720703125, -3.1787109375, -2.95428466796875, -2.7298583984375, -2.50543212890625, -2.281005859375, -2.05657958984375, -1.8321533203125, -1.60772705078125, -1.38330078125, -1.15887451171875, -0.9344482421875, -0.71002197265625, -0.485595703125, -0.26116943359375, -0.0367431640625, 0.18768310546875, 0.412109375, 0.63653564453125, 0.8609619140625, 1.08538818359375, 1.309814453125, 1.53424072265625, 1.7586669921875, 1.98309326171875, 2.20751953125, 2.43194580078125, 2.6563720703125, 2.88079833984375, 3.105224609375, 3.32965087890625, 3.5540771484375, 3.77850341796875, 4.0029296875, 4.22735595703125, 4.4517822265625, 4.67620849609375, 4.900634765625, 5.12506103515625, 5.3494873046875, 5.57391357421875, 5.79833984375, 6.02276611328125, 6.2471923828125, 6.47161865234375, 6.696044921875, 6.92047119140625, 7.1448974609375, 7.36932373046875, 7.59375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 9.0, 3.0, 11.0, 13.0, 19.0, 28.0, 43.0, 85.0, 98.0, 137.0, 209.0, 294.0, 476.0, 765.0, 1207.0, 2015.0, 3472.0, 6118.0, 11253.0, 21229.0, 43128.0, 102704.0, 341068.0, 326845.0, 98516.0, 42413.0, 20700.0, 10886.0, 6070.0, 3326.0, 2000.0, 1249.0, 765.0, 465.0, 308.0, 218.0, 112.0, 89.0, 64.0, 44.0, 39.0, 23.0, 9.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.20703125, -3.103515625, -3.0, -2.896484375, -2.79296875, -2.689453125, -2.5859375, -2.482421875, -2.37890625, -2.275390625, -2.171875, -2.068359375, -1.96484375, -1.861328125, -1.7578125, -1.654296875, -1.55078125, -1.447265625, -1.34375, -1.240234375, -1.13671875, -1.033203125, -0.9296875, -0.826171875, -0.72265625, -0.619140625, -0.515625, -0.412109375, -0.30859375, -0.205078125, -0.1015625, 0.001953125, 0.10546875, 0.208984375, 0.3125, 0.416015625, 0.51953125, 0.623046875, 0.7265625, 0.830078125, 0.93359375, 1.037109375, 1.140625, 1.244140625, 1.34765625, 1.451171875, 1.5546875, 1.658203125, 1.76171875, 1.865234375, 1.96875, 2.072265625, 2.17578125, 2.279296875, 2.3828125, 2.486328125, 2.58984375, 2.693359375, 2.796875, 2.900390625, 3.00390625, 3.107421875, 3.2109375, 3.314453125, 3.41796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 4.0, 17.0, 7.0, 18.0, 13.0, 35.0, 32.0, 54.0, 56.0, 61.0, 83.0, 105.0, 105.0, 85.0, 74.0, 61.0, 47.0, 39.0, 22.0, 18.0, 18.0, 8.0, 9.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00018775463104248047, -0.00018339324742555618, -0.0001790318638086319, -0.0001746704801917076, -0.00017030909657478333, -0.00016594771295785904, -0.00016158632934093475, -0.00015722494572401047, -0.00015286356210708618, -0.0001485021784901619, -0.0001441407948732376, -0.00013977941125631332, -0.00013541802763938904, -0.00013105664402246475, -0.00012669526040554047, -0.00012233387678861618, -0.0001179724931716919, -0.00011361110955476761, -0.00010924972593784332, -0.00010488834232091904, -0.00010052695870399475, -9.616557508707047e-05, -9.180419147014618e-05, -8.74428078532219e-05, -8.308142423629761e-05, -7.872004061937332e-05, -7.435865700244904e-05, -6.999727338552475e-05, -6.563588976860046e-05, -6.127450615167618e-05, -5.691312253475189e-05, -5.2551738917827606e-05, -4.819035530090332e-05, -4.3828971683979034e-05, -3.946758806705475e-05, -3.510620445013046e-05, -3.074482083320618e-05, -2.638343721628189e-05, -2.2022053599357605e-05, -1.766066998243332e-05, -1.3299286365509033e-05, -8.937902748584747e-06, -4.5765191316604614e-06, -2.1513551473617554e-07, 4.14624810218811e-06, 8.507631719112396e-06, 1.2869015336036682e-05, 1.7230398952960968e-05, 2.1591782569885254e-05, 2.595316618680954e-05, 3.0314549803733826e-05, 3.467593342065811e-05, 3.90373170375824e-05, 4.339870065450668e-05, 4.776008427143097e-05, 5.2121467888355255e-05, 5.648285150527954e-05, 6.084423512220383e-05, 6.520561873912811e-05, 6.95670023560524e-05, 7.392838597297668e-05, 7.828976958990097e-05, 8.265115320682526e-05, 8.701253682374954e-05, 9.137392044067383e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 6.0, 0.0, 2.0, 4.0, 8.0, 22.0, 27.0, 34.0, 50.0, 74.0, 106.0, 159.0, 245.0, 349.0, 530.0, 806.0, 1203.0, 1825.0, 2730.0, 3975.0, 6118.0, 9088.0, 14199.0, 22359.0, 36601.0, 66756.0, 150676.0, 330049.0, 202409.0, 81968.0, 43152.0, 25987.0, 16203.0, 10472.0, 6758.0, 4434.0, 2999.0, 2022.0, 1382.0, 911.0, 640.0, 434.0, 267.0, 148.0, 107.0, 80.0, 63.0, 43.0, 36.0, 14.0, 9.0, 7.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.37109375, -2.296173095703125, -2.22125244140625, -2.146331787109375, -2.0714111328125, -1.996490478515625, -1.92156982421875, -1.846649169921875, -1.771728515625, -1.696807861328125, -1.62188720703125, -1.546966552734375, -1.4720458984375, -1.397125244140625, -1.32220458984375, -1.247283935546875, -1.17236328125, -1.097442626953125, -1.02252197265625, -0.947601318359375, -0.8726806640625, -0.797760009765625, -0.72283935546875, -0.647918701171875, -0.572998046875, -0.498077392578125, -0.42315673828125, -0.348236083984375, -0.2733154296875, -0.198394775390625, -0.12347412109375, -0.048553466796875, 0.0263671875, 0.101287841796875, 0.17620849609375, 0.251129150390625, 0.3260498046875, 0.400970458984375, 0.47589111328125, 0.550811767578125, 0.625732421875, 0.700653076171875, 0.77557373046875, 0.850494384765625, 0.9254150390625, 1.000335693359375, 1.07525634765625, 1.150177001953125, 1.22509765625, 1.300018310546875, 1.37493896484375, 1.449859619140625, 1.5247802734375, 1.599700927734375, 1.67462158203125, 1.749542236328125, 1.824462890625, 1.899383544921875, 1.97430419921875, 2.049224853515625, 2.1241455078125, 2.199066162109375, 2.27398681640625, 2.348907470703125, 2.423828125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 9.0, 5.0, 4.0, 8.0, 15.0, 21.0, 11.0, 21.0, 16.0, 18.0, 26.0, 29.0, 32.0, 37.0, 46.0, 59.0, 55.0, 61.0, 52.0, 57.0, 60.0, 51.0, 35.0, 33.0, 26.0, 27.0, 23.0, 25.0, 21.0, 21.0, 12.0, 10.0, 8.0, 9.0, 9.0, 4.0, 6.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8769912719726562, -0.8472442626953125, -0.8174972534179688, -0.787750244140625, -0.7580032348632812, -0.7282562255859375, -0.6985092163085938, -0.66876220703125, -0.6390151977539062, -0.6092681884765625, -0.5795211791992188, -0.549774169921875, -0.5200271606445312, -0.4902801513671875, -0.46053314208984375, -0.4307861328125, -0.40103912353515625, -0.3712921142578125, -0.34154510498046875, -0.311798095703125, -0.28205108642578125, -0.2523040771484375, -0.22255706787109375, -0.19281005859375, -0.16306304931640625, -0.1333160400390625, -0.10356903076171875, -0.073822021484375, -0.04407501220703125, -0.0143280029296875, 0.01541900634765625, 0.045166015625, 0.07491302490234375, 0.1046600341796875, 0.13440704345703125, 0.164154052734375, 0.19390106201171875, 0.2236480712890625, 0.25339508056640625, 0.28314208984375, 0.31288909912109375, 0.3426361083984375, 0.37238311767578125, 0.402130126953125, 0.43187713623046875, 0.4616241455078125, 0.49137115478515625, 0.5211181640625, 0.5508651733398438, 0.5806121826171875, 0.6103591918945312, 0.640106201171875, 0.6698532104492188, 0.6996002197265625, 0.7293472290039062, 0.75909423828125, 0.7888412475585938, 0.8185882568359375, 0.8483352661132812, 0.878082275390625, 0.9078292846679688, 0.9375762939453125, 0.9673233032226562, 0.9970703125]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 5.0, 6.0, 6.0, 7.0, 8.0, 14.0, 20.0, 18.0, 20.0, 21.0, 37.0, 32.0, 56.0, 65.0, 70.0, 93.0, 111.0, 67.0, 64.0, 54.0, 45.0, 32.0, 32.0, 19.0, 17.0, 14.0, 13.0, 10.0, 8.0, 9.0, 8.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.747939109802246, -9.399699211120605, -9.051458358764648, -8.703218460083008, -8.354978561401367, -8.006738662719727, -7.658498287200928, -7.310257911682129, -6.962018013000488, -6.613778114318848, -6.265537738800049, -5.91729736328125, -5.569057464599609, -5.220817565917969, -4.87257719039917, -4.524336814880371, -4.1760969161987305, -3.8278567790985107, -3.479616641998291, -3.1313765048980713, -2.7831363677978516, -2.434896230697632, -2.086656093597412, -1.7384159564971924, -1.3901758193969727, -1.041935682296753, -0.6936955451965332, -0.3454554080963135, 0.00278472900390625, 0.351024866104126, 0.6992650032043457, 1.0475051403045654, 1.3957452774047852, 1.7439854145050049, 2.0922255516052246, 2.4404656887054443, 2.788705825805664, 3.136945962905884, 3.4851861000061035, 3.8334262371063232, 4.181666374206543, 4.529906272888184, 4.878146648406982, 5.226387023925781, 5.574626922607422, 5.9228668212890625, 6.271107196807861, 6.61934757232666, 6.967587471008301, 7.315827369689941, 7.66406774520874, 8.012308120727539, 8.36054801940918, 8.70878791809082, 9.057027816772461, 9.405268669128418, 9.753508567810059, 10.1017484664917, 10.449989318847656, 10.798229217529297, 11.146469116210938, 11.494709014892578, 11.842948913574219, 12.191189765930176, 12.539429664611816]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 5.0, 5.0, 7.0, 12.0, 11.0, 6.0, 8.0, 19.0, 14.0, 28.0, 25.0, 18.0, 19.0, 27.0, 34.0, 36.0, 29.0, 32.0, 38.0, 27.0, 38.0, 28.0, 35.0, 32.0, 41.0, 34.0, 35.0, 43.0, 31.0, 38.0, 31.0, 27.0, 24.0, 25.0, 19.0, 15.0, 17.0, 9.0, 7.0, 17.0, 17.0, 5.0, 9.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.452103614807129, -10.100647926330566, -9.749191284179688, -9.397735595703125, -9.046279907226562, -8.69482421875, -8.343368530273438, -7.991911888122559, -7.640456199645996, -7.289000511169434, -6.937544345855713, -6.586088180541992, -6.23463249206543, -5.883176803588867, -5.5317206382751465, -5.180264472961426, -4.828808784484863, -4.477353096008301, -4.12589693069458, -3.7744410037994385, -3.422985076904297, -3.0715291500091553, -2.7200732231140137, -2.368617296218872, -2.0171613693237305, -1.6657054424285889, -1.3142495155334473, -0.9627935886383057, -0.6113376617431641, -0.25988173484802246, 0.09157419204711914, 0.44303011894226074, 0.7944869995117188, 1.1459429264068604, 1.497398853302002, 1.8488547801971436, 2.200310707092285, 2.5517666339874268, 2.9032225608825684, 3.25467848777771, 3.6061344146728516, 3.957590341567993, 4.309046268463135, 4.6605024337768555, 5.011958122253418, 5.3634138107299805, 5.714869976043701, 6.066326141357422, 6.417781829833984, 6.769237518310547, 7.120693683624268, 7.472149848937988, 7.823605537414551, 8.175061225891113, 8.526517868041992, 8.877973556518555, 9.229429244995117, 9.58088493347168, 9.932340621948242, 10.283797264099121, 10.635252952575684, 10.986708641052246, 11.338165283203125, 11.689620971679688, 12.04107666015625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 7.0, 6.0, 11.0, 32.0, 49.0, 58.0, 77.0, 148.0, 213.0, 313.0, 433.0, 678.0, 1121.0, 1599.0, 2385.0, 3383.0, 5202.0, 7915.0, 12189.0, 18691.0, 29550.0, 47603.0, 79613.0, 144112.0, 318800.0, 985871.0, 1496076.0, 562391.0, 205651.0, 104031.0, 60703.0, 36779.0, 23233.0, 14855.0, 9826.0, 6560.0, 4365.0, 3012.0, 2044.0, 1388.0, 1026.0, 675.0, 461.0, 365.0, 216.0, 167.0, 120.0, 100.0, 61.0, 41.0, 25.0, 23.0, 14.0, 10.0, 4.0, 7.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-12.3046875, -11.869384765625, -11.43408203125, -10.998779296875, -10.5634765625, -10.128173828125, -9.69287109375, -9.257568359375, -8.822265625, -8.386962890625, -7.95166015625, -7.516357421875, -7.0810546875, -6.645751953125, -6.21044921875, -5.775146484375, -5.33984375, -4.904541015625, -4.46923828125, -4.033935546875, -3.5986328125, -3.163330078125, -2.72802734375, -2.292724609375, -1.857421875, -1.422119140625, -0.98681640625, -0.551513671875, -0.1162109375, 0.319091796875, 0.75439453125, 1.189697265625, 1.625, 2.060302734375, 2.49560546875, 2.930908203125, 3.3662109375, 3.801513671875, 4.23681640625, 4.672119140625, 5.107421875, 5.542724609375, 5.97802734375, 6.413330078125, 6.8486328125, 7.283935546875, 7.71923828125, 8.154541015625, 8.58984375, 9.025146484375, 9.46044921875, 9.895751953125, 10.3310546875, 10.766357421875, 11.20166015625, 11.636962890625, 12.072265625, 12.507568359375, 12.94287109375, 13.378173828125, 13.8134765625, 14.248779296875, 14.68408203125, 15.119384765625, 15.5546875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 6.0, 4.0, 7.0, 6.0, 4.0, 11.0, 12.0, 4.0, 17.0, 16.0, 22.0, 18.0, 20.0, 18.0, 23.0, 15.0, 51.0, 27.0, 33.0, 34.0, 45.0, 32.0, 20.0, 31.0, 28.0, 41.0, 40.0, 37.0, 34.0, 39.0, 37.0, 33.0, 30.0, 32.0, 26.0, 24.0, 15.0, 8.0, 17.0, 13.0, 13.0, 11.0, 10.0, 13.0, 7.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.7265625, -8.4222412109375, -8.117919921875, -7.8135986328125, -7.50927734375, -7.2049560546875, -6.900634765625, -6.5963134765625, -6.2919921875, -5.9876708984375, -5.683349609375, -5.3790283203125, -5.07470703125, -4.7703857421875, -4.466064453125, -4.1617431640625, -3.857421875, -3.5531005859375, -3.248779296875, -2.9444580078125, -2.64013671875, -2.3358154296875, -2.031494140625, -1.7271728515625, -1.4228515625, -1.1185302734375, -0.814208984375, -0.5098876953125, -0.20556640625, 0.0987548828125, 0.403076171875, 0.7073974609375, 1.01171875, 1.3160400390625, 1.620361328125, 1.9246826171875, 2.22900390625, 2.5333251953125, 2.837646484375, 3.1419677734375, 3.4462890625, 3.7506103515625, 4.054931640625, 4.3592529296875, 4.66357421875, 4.9678955078125, 5.272216796875, 5.5765380859375, 5.880859375, 6.1851806640625, 6.489501953125, 6.7938232421875, 7.09814453125, 7.4024658203125, 7.706787109375, 8.0111083984375, 8.3154296875, 8.6197509765625, 8.924072265625, 9.2283935546875, 9.53271484375, 9.8370361328125, 10.141357421875, 10.4456787109375, 10.75]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 0.0, 7.0, 8.0, 9.0, 13.0, 28.0, 36.0, 46.0, 67.0, 79.0, 132.0, 225.0, 346.0, 504.0, 827.0, 1332.0, 2294.0, 3906.0, 6874.0, 12467.0, 23224.0, 45260.0, 92535.0, 208501.0, 547070.0, 1661923.0, 983151.0, 329946.0, 138054.0, 64690.0, 32043.0, 16891.0, 9079.0, 5180.0, 3011.0, 1670.0, 1031.0, 647.0, 404.0, 237.0, 185.0, 109.0, 68.0, 55.0, 37.0, 30.0, 15.0, 16.0, 8.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-17.375, -16.844482421875, -16.31396484375, -15.783447265625, -15.2529296875, -14.722412109375, -14.19189453125, -13.661376953125, -13.130859375, -12.600341796875, -12.06982421875, -11.539306640625, -11.0087890625, -10.478271484375, -9.94775390625, -9.417236328125, -8.88671875, -8.356201171875, -7.82568359375, -7.295166015625, -6.7646484375, -6.234130859375, -5.70361328125, -5.173095703125, -4.642578125, -4.112060546875, -3.58154296875, -3.051025390625, -2.5205078125, -1.989990234375, -1.45947265625, -0.928955078125, -0.3984375, 0.132080078125, 0.66259765625, 1.193115234375, 1.7236328125, 2.254150390625, 2.78466796875, 3.315185546875, 3.845703125, 4.376220703125, 4.90673828125, 5.437255859375, 5.9677734375, 6.498291015625, 7.02880859375, 7.559326171875, 8.08984375, 8.620361328125, 9.15087890625, 9.681396484375, 10.2119140625, 10.742431640625, 11.27294921875, 11.803466796875, 12.333984375, 12.864501953125, 13.39501953125, 13.925537109375, 14.4560546875, 14.986572265625, 15.51708984375, 16.047607421875, 16.578125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 22.0, 27.0, 30.0, 37.0, 46.0, 63.0, 91.0, 110.0, 150.0, 198.0, 229.0, 279.0, 379.0, 490.0, 428.0, 357.0, 266.0, 219.0, 144.0, 129.0, 100.0, 65.0, 55.0, 42.0, 33.0, 22.0, 16.0, 3.0, 7.0, 6.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.6275634765625, -7.387939453125, -7.1483154296875, -6.90869140625, -6.6690673828125, -6.429443359375, -6.1898193359375, -5.9501953125, -5.7105712890625, -5.470947265625, -5.2313232421875, -4.99169921875, -4.7520751953125, -4.512451171875, -4.2728271484375, -4.033203125, -3.7935791015625, -3.553955078125, -3.3143310546875, -3.07470703125, -2.8350830078125, -2.595458984375, -2.3558349609375, -2.1162109375, -1.8765869140625, -1.636962890625, -1.3973388671875, -1.15771484375, -0.9180908203125, -0.678466796875, -0.4388427734375, -0.19921875, 0.0404052734375, 0.280029296875, 0.5196533203125, 0.75927734375, 0.9989013671875, 1.238525390625, 1.4781494140625, 1.7177734375, 1.9573974609375, 2.197021484375, 2.4366455078125, 2.67626953125, 2.9158935546875, 3.155517578125, 3.3951416015625, 3.634765625, 3.8743896484375, 4.114013671875, 4.3536376953125, 4.59326171875, 4.8328857421875, 5.072509765625, 5.3121337890625, 5.5517578125, 5.7913818359375, 6.031005859375, 6.2706298828125, 6.51025390625, 6.7498779296875, 6.989501953125, 7.2291259765625, 7.46875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 9.0, 14.0, 14.0, 14.0, 11.0, 25.0, 22.0, 32.0, 38.0, 53.0, 49.0, 75.0, 77.0, 95.0, 92.0, 79.0, 70.0, 38.0, 29.0, 30.0, 21.0, 15.0, 14.0, 15.0, 11.0, 5.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.804123878479004, -11.439645767211914, -11.075167655944824, -10.710689544677734, -10.346210479736328, -9.981732368469238, -9.617254257202148, -9.252776145935059, -8.888298034667969, -8.523819923400879, -8.159341812133789, -7.794863224029541, -7.430385112762451, -7.065907001495361, -6.701428413391113, -6.336950302124023, -5.972472190856934, -5.607994079589844, -5.243515968322754, -4.879037380218506, -4.514559268951416, -4.150081157684326, -3.7856028079986572, -3.4211244583129883, -3.0566463470458984, -2.6921682357788086, -2.3276898860931396, -1.9632116556167603, -1.5987334251403809, -1.2342551946640015, -0.8697769641876221, -0.5052986145019531, -0.14082050323486328, 0.2236577272415161, 0.5881359577178955, 0.9526141881942749, 1.3170924186706543, 1.6815706491470337, 2.046048879623413, 2.410527229309082, 2.775005340576172, 3.1394834518432617, 3.5039618015289307, 3.8684401512145996, 4.2329182624816895, 4.597396373748779, 4.961874961853027, 5.326353073120117, 5.690831184387207, 6.055309295654297, 6.419787406921387, 6.784265995025635, 7.148744106292725, 7.5132222175598145, 7.8777008056640625, 8.242178916931152, 8.606657028198242, 8.971135139465332, 9.335613250732422, 9.700091361999512, 10.064569473266602, 10.429048538208008, 10.793526649475098, 11.158004760742188, 11.522482872009277]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 5.0, 9.0, 11.0, 8.0, 8.0, 12.0, 13.0, 21.0, 17.0, 28.0, 25.0, 32.0, 33.0, 35.0, 35.0, 36.0, 41.0, 46.0, 40.0, 41.0, 37.0, 37.0, 42.0, 45.0, 33.0, 40.0, 45.0, 34.0, 25.0, 34.0, 23.0, 11.0, 19.0, 13.0, 8.0, 15.0, 10.0, 6.0, 7.0, 12.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.57560920715332, -11.164199829101562, -10.752791404724121, -10.341382026672363, -9.929973602294922, -9.518564224243164, -9.107154846191406, -8.695745468139648, -8.284337043762207, -7.872928142547607, -7.461519241333008, -7.05010986328125, -6.63870096206665, -6.227292060852051, -5.815882682800293, -5.404473781585693, -4.993064880371094, -4.581655979156494, -4.1702470779418945, -3.7588376998901367, -3.347428798675537, -2.9360198974609375, -2.524610757827759, -2.11320161819458, -1.7017927169799805, -1.2903836965560913, -0.8789746761322021, -0.467565655708313, -0.05615663528442383, 0.3552522659301758, 0.7666614055633545, 1.1780705451965332, 1.5894794464111328, 2.0008883476257324, 2.412297487258911, 2.82370662689209, 3.2351155281066895, 3.646524429321289, 4.057933807373047, 4.4693427085876465, 4.880751609802246, 5.292160511016846, 5.703569412231445, 6.114978790283203, 6.526387691497803, 6.937796592712402, 7.34920597076416, 7.76061487197876, 8.17202377319336, 8.583433151245117, 8.994841575622559, 9.406250953674316, 9.817659378051758, 10.229068756103516, 10.640478134155273, 11.051887512207031, 11.463295936584473, 11.87470531463623, 12.286113739013672, 12.69752311706543, 13.108932495117188, 13.520340919494629, 13.931750297546387, 14.343158721923828, 14.754568099975586]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 8.0, 6.0, 15.0, 18.0, 31.0, 39.0, 45.0, 83.0, 112.0, 203.0, 337.0, 476.0, 734.0, 1062.0, 1485.0, 2171.0, 3131.0, 4652.0, 7057.0, 10432.0, 16125.0, 25030.0, 39863.0, 64959.0, 113726.0, 294153.0, 206435.0, 97487.0, 57495.0, 35374.0, 22585.0, 14379.0, 9434.0, 6277.0, 4245.0, 2812.0, 1920.0, 1326.0, 945.0, 643.0, 444.0, 273.0, 164.0, 111.0, 77.0, 52.0, 47.0, 21.0, 29.0, 15.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.263671875, -3.1544189453125, -3.045166015625, -2.9359130859375, -2.82666015625, -2.7174072265625, -2.608154296875, -2.4989013671875, -2.3896484375, -2.2803955078125, -2.171142578125, -2.0618896484375, -1.95263671875, -1.8433837890625, -1.734130859375, -1.6248779296875, -1.515625, -1.4063720703125, -1.297119140625, -1.1878662109375, -1.07861328125, -0.9693603515625, -0.860107421875, -0.7508544921875, -0.6416015625, -0.5323486328125, -0.423095703125, -0.3138427734375, -0.20458984375, -0.0953369140625, 0.013916015625, 0.1231689453125, 0.232421875, 0.3416748046875, 0.450927734375, 0.5601806640625, 0.66943359375, 0.7786865234375, 0.887939453125, 0.9971923828125, 1.1064453125, 1.2156982421875, 1.324951171875, 1.4342041015625, 1.54345703125, 1.6527099609375, 1.761962890625, 1.8712158203125, 1.98046875, 2.0897216796875, 2.198974609375, 2.3082275390625, 2.41748046875, 2.5267333984375, 2.635986328125, 2.7452392578125, 2.8544921875, 2.9637451171875, 3.072998046875, 3.1822509765625, 3.29150390625, 3.4007568359375, 3.510009765625, 3.6192626953125, 3.728515625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 7.0, 12.0, 10.0, 6.0, 13.0, 28.0, 14.0, 29.0, 24.0, 24.0, 39.0, 37.0, 38.0, 29.0, 41.0, 38.0, 44.0, 48.0, 34.0, 42.0, 38.0, 39.0, 39.0, 37.0, 42.0, 41.0, 26.0, 24.0, 21.0, 19.0, 13.0, 14.0, 21.0, 6.0, 7.0, 7.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.015625, -11.61279296875, -11.2099609375, -10.80712890625, -10.404296875, -10.00146484375, -9.5986328125, -9.19580078125, -8.79296875, -8.39013671875, -7.9873046875, -7.58447265625, -7.181640625, -6.77880859375, -6.3759765625, -5.97314453125, -5.5703125, -5.16748046875, -4.7646484375, -4.36181640625, -3.958984375, -3.55615234375, -3.1533203125, -2.75048828125, -2.34765625, -1.94482421875, -1.5419921875, -1.13916015625, -0.736328125, -0.33349609375, 0.0693359375, 0.47216796875, 0.875, 1.27783203125, 1.6806640625, 2.08349609375, 2.486328125, 2.88916015625, 3.2919921875, 3.69482421875, 4.09765625, 4.50048828125, 4.9033203125, 5.30615234375, 5.708984375, 6.11181640625, 6.5146484375, 6.91748046875, 7.3203125, 7.72314453125, 8.1259765625, 8.52880859375, 8.931640625, 9.33447265625, 9.7373046875, 10.14013671875, 10.54296875, 10.94580078125, 11.3486328125, 11.75146484375, 12.154296875, 12.55712890625, 12.9599609375, 13.36279296875, 13.765625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 9.0, 10.0, 21.0, 33.0, 37.0, 53.0, 75.0, 101.0, 115.0, 193.0, 248.0, 322.0, 430.0, 580.0, 778.0, 1081.0, 1524.0, 2038.0, 2910.0, 4223.0, 5811.0, 8522.0, 12355.0, 17936.0, 26678.0, 40278.0, 61672.0, 100813.0, 225888.0, 239133.0, 103225.0, 62871.0, 40998.0, 27228.0, 18277.0, 12440.0, 8626.0, 6048.0, 4175.0, 3008.0, 2150.0, 1518.0, 1074.0, 823.0, 618.0, 426.0, 309.0, 238.0, 170.0, 137.0, 107.0, 72.0, 55.0, 48.0, 19.0, 13.0, 12.0, 9.0, 2.0, 0.0, 4.0], "bins": [-2.96875, -2.87603759765625, -2.7833251953125, -2.69061279296875, -2.597900390625, -2.50518798828125, -2.4124755859375, -2.31976318359375, -2.22705078125, -2.13433837890625, -2.0416259765625, -1.94891357421875, -1.856201171875, -1.76348876953125, -1.6707763671875, -1.57806396484375, -1.4853515625, -1.39263916015625, -1.2999267578125, -1.20721435546875, -1.114501953125, -1.02178955078125, -0.9290771484375, -0.83636474609375, -0.74365234375, -0.65093994140625, -0.5582275390625, -0.46551513671875, -0.372802734375, -0.28009033203125, -0.1873779296875, -0.09466552734375, -0.001953125, 0.09075927734375, 0.1834716796875, 0.27618408203125, 0.368896484375, 0.46160888671875, 0.5543212890625, 0.64703369140625, 0.73974609375, 0.83245849609375, 0.9251708984375, 1.01788330078125, 1.110595703125, 1.20330810546875, 1.2960205078125, 1.38873291015625, 1.4814453125, 1.57415771484375, 1.6668701171875, 1.75958251953125, 1.852294921875, 1.94500732421875, 2.0377197265625, 2.13043212890625, 2.22314453125, 2.31585693359375, 2.4085693359375, 2.50128173828125, 2.593994140625, 2.68670654296875, 2.7794189453125, 2.87213134765625, 2.96484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 9.0, 7.0, 6.0, 9.0, 7.0, 10.0, 13.0, 15.0, 15.0, 20.0, 14.0, 32.0, 26.0, 35.0, 29.0, 29.0, 25.0, 29.0, 28.0, 36.0, 39.0, 24.0, 33.0, 50.0, 48.0, 27.0, 30.0, 30.0, 23.0, 28.0, 30.0, 22.0, 39.0, 20.0, 22.0, 18.0, 20.0, 18.0, 9.0, 9.0, 11.0, 12.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 7.0, 3.0, 3.0, 0.0, 2.0], "bins": [-7.41015625, -7.188232421875, -6.96630859375, -6.744384765625, -6.5224609375, -6.300537109375, -6.07861328125, -5.856689453125, -5.634765625, -5.412841796875, -5.19091796875, -4.968994140625, -4.7470703125, -4.525146484375, -4.30322265625, -4.081298828125, -3.859375, -3.637451171875, -3.41552734375, -3.193603515625, -2.9716796875, -2.749755859375, -2.52783203125, -2.305908203125, -2.083984375, -1.862060546875, -1.64013671875, -1.418212890625, -1.1962890625, -0.974365234375, -0.75244140625, -0.530517578125, -0.30859375, -0.086669921875, 0.13525390625, 0.357177734375, 0.5791015625, 0.801025390625, 1.02294921875, 1.244873046875, 1.466796875, 1.688720703125, 1.91064453125, 2.132568359375, 2.3544921875, 2.576416015625, 2.79833984375, 3.020263671875, 3.2421875, 3.464111328125, 3.68603515625, 3.907958984375, 4.1298828125, 4.351806640625, 4.57373046875, 4.795654296875, 5.017578125, 5.239501953125, 5.46142578125, 5.683349609375, 5.9052734375, 6.127197265625, 6.34912109375, 6.571044921875, 6.79296875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 11.0, 12.0, 13.0, 20.0, 19.0, 39.0, 40.0, 69.0, 69.0, 107.0, 149.0, 202.0, 233.0, 363.0, 507.0, 748.0, 1050.0, 1620.0, 2559.0, 3766.0, 6387.0, 11251.0, 21194.0, 45972.0, 122457.0, 422451.0, 255874.0, 78984.0, 32816.0, 15911.0, 8793.0, 5033.0, 3124.0, 2021.0, 1336.0, 997.0, 593.0, 442.0, 348.0, 257.0, 221.0, 129.0, 96.0, 68.0, 46.0, 42.0, 27.0, 21.0, 14.0, 17.0, 8.0, 10.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.00696563720703125, -0.006746530532836914, -0.006527423858642578, -0.006308317184448242, -0.006089210510253906, -0.00587010383605957, -0.005650997161865234, -0.0054318904876708984, -0.0052127838134765625, -0.0049936771392822266, -0.004774570465087891, -0.004555463790893555, -0.004336357116699219, -0.004117250442504883, -0.003898143768310547, -0.003679037094116211, -0.003459930419921875, -0.003240823745727539, -0.003021717071533203, -0.002802610397338867, -0.0025835037231445312, -0.0023643970489501953, -0.0021452903747558594, -0.0019261837005615234, -0.0017070770263671875, -0.0014879703521728516, -0.0012688636779785156, -0.0010497570037841797, -0.0008306503295898438, -0.0006115436553955078, -0.0003924369812011719, -0.00017333030700683594, 4.57763671875e-05, 0.00026488304138183594, 0.0004839897155761719, 0.0007030963897705078, 0.0009222030639648438, 0.0011413097381591797, 0.0013604164123535156, 0.0015795230865478516, 0.0017986297607421875, 0.0020177364349365234, 0.0022368431091308594, 0.0024559497833251953, 0.0026750564575195312, 0.002894163131713867, 0.003113269805908203, 0.003332376480102539, 0.003551483154296875, 0.003770589828491211, 0.003989696502685547, 0.004208803176879883, 0.004427909851074219, 0.004647016525268555, 0.004866123199462891, 0.0050852298736572266, 0.0053043365478515625, 0.0055234432220458984, 0.005742549896240234, 0.00596165657043457, 0.006180763244628906, 0.006399869918823242, 0.006618976593017578, 0.006838083267211914, 0.00705718994140625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 9.0, 18.0, 20.0, 31.0, 49.0, 43.0, 53.0, 53.0, 73.0, 94.0, 87.0, 78.0, 72.0, 76.0, 62.0, 41.0, 34.0, 26.0, 9.0, 13.0, 12.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9604644775390625e-06, -5.7872384786605835e-06, -5.6140124797821045e-06, -5.4407864809036255e-06, -5.2675604820251465e-06, -5.0943344831466675e-06, -4.9211084842681885e-06, -4.7478824853897095e-06, -4.5746564865112305e-06, -4.4014304876327515e-06, -4.2282044887542725e-06, -4.0549784898757935e-06, -3.8817524909973145e-06, -3.7085264921188354e-06, -3.5353004932403564e-06, -3.3620744943618774e-06, -3.1888484954833984e-06, -3.0156224966049194e-06, -2.8423964977264404e-06, -2.6691704988479614e-06, -2.4959444999694824e-06, -2.3227185010910034e-06, -2.1494925022125244e-06, -1.9762665033340454e-06, -1.8030405044555664e-06, -1.6298145055770874e-06, -1.4565885066986084e-06, -1.2833625078201294e-06, -1.1101365089416504e-06, -9.369105100631714e-07, -7.636845111846924e-07, -5.904585123062134e-07, -4.172325134277344e-07, -2.4400651454925537e-07, -7.078051567077637e-08, 1.0244548320770264e-07, 2.7567148208618164e-07, 4.4889748096466064e-07, 6.221234798431396e-07, 7.953494787216187e-07, 9.685754776000977e-07, 1.1418014764785767e-06, 1.3150274753570557e-06, 1.4882534742355347e-06, 1.6614794731140137e-06, 1.8347054719924927e-06, 2.0079314708709717e-06, 2.1811574697494507e-06, 2.3543834686279297e-06, 2.5276094675064087e-06, 2.7008354663848877e-06, 2.8740614652633667e-06, 3.0472874641418457e-06, 3.2205134630203247e-06, 3.3937394618988037e-06, 3.5669654607772827e-06, 3.7401914596557617e-06, 3.913417458534241e-06, 4.08664345741272e-06, 4.259869456291199e-06, 4.433095455169678e-06, 4.606321454048157e-06, 4.779547452926636e-06, 4.952773451805115e-06, 5.125999450683594e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 10.0, 9.0, 14.0, 24.0, 23.0, 42.0, 57.0, 75.0, 95.0, 167.0, 227.0, 319.0, 572.0, 951.0, 1659.0, 2956.0, 5699.0, 11341.0, 25893.0, 73545.0, 360564.0, 426239.0, 83682.0, 28498.0, 12425.0, 5964.0, 3118.0, 1766.0, 922.0, 533.0, 380.0, 233.0, 170.0, 113.0, 67.0, 59.0, 44.0, 29.0, 19.0, 15.0, 14.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00933074951171875, -0.00903022289276123, -0.008729696273803711, -0.008429169654846191, -0.008128643035888672, -0.007828116416931152, -0.007527589797973633, -0.007227063179016113, -0.006926536560058594, -0.006626009941101074, -0.006325483322143555, -0.006024956703186035, -0.005724430084228516, -0.005423903465270996, -0.0051233768463134766, -0.004822850227355957, -0.0045223236083984375, -0.004221796989440918, -0.0039212703704833984, -0.003620743751525879, -0.0033202171325683594, -0.00301969051361084, -0.0027191638946533203, -0.0024186372756958008, -0.0021181106567382812, -0.0018175840377807617, -0.0015170574188232422, -0.0012165307998657227, -0.0009160041809082031, -0.0006154775619506836, -0.00031495094299316406, -1.4424324035644531e-05, 0.000286102294921875, 0.0005866289138793945, 0.0008871555328369141, 0.0011876821517944336, 0.0014882087707519531, 0.0017887353897094727, 0.002089262008666992, 0.0023897886276245117, 0.0026903152465820312, 0.0029908418655395508, 0.0032913684844970703, 0.00359189510345459, 0.0038924217224121094, 0.004192948341369629, 0.0044934749603271484, 0.004794001579284668, 0.0050945281982421875, 0.005395054817199707, 0.0056955814361572266, 0.005996108055114746, 0.006296634674072266, 0.006597161293029785, 0.006897687911987305, 0.007198214530944824, 0.007498741149902344, 0.007799267768859863, 0.008099794387817383, 0.008400321006774902, 0.008700847625732422, 0.009001374244689941, 0.009301900863647461, 0.00960242748260498, 0.0099029541015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 4.0, 7.0, 9.0, 11.0, 14.0, 15.0, 14.0, 27.0, 34.0, 54.0, 82.0, 126.0, 163.0, 129.0, 96.0, 54.0, 45.0, 35.0, 27.0, 21.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003936767578125, -0.003811955451965332, -0.003687143325805664, -0.003562331199645996, -0.003437519073486328, -0.00331270694732666, -0.003187894821166992, -0.0030630826950073242, -0.0029382705688476562, -0.0028134584426879883, -0.0026886463165283203, -0.0025638341903686523, -0.0024390220642089844, -0.0023142099380493164, -0.0021893978118896484, -0.0020645856857299805, -0.0019397735595703125, -0.0018149614334106445, -0.0016901493072509766, -0.0015653371810913086, -0.0014405250549316406, -0.0013157129287719727, -0.0011909008026123047, -0.0010660886764526367, -0.0009412765502929688, -0.0008164644241333008, -0.0006916522979736328, -0.0005668401718139648, -0.0004420280456542969, -0.0003172159194946289, -0.00019240379333496094, -6.759166717529297e-05, 5.7220458984375e-05, 0.00018203258514404297, 0.00030684471130371094, 0.0004316568374633789, 0.0005564689636230469, 0.0006812810897827148, 0.0008060932159423828, 0.0009309053421020508, 0.0010557174682617188, 0.0011805295944213867, 0.0013053417205810547, 0.0014301538467407227, 0.0015549659729003906, 0.0016797780990600586, 0.0018045902252197266, 0.0019294023513793945, 0.0020542144775390625, 0.0021790266036987305, 0.0023038387298583984, 0.0024286508560180664, 0.0025534629821777344, 0.0026782751083374023, 0.0028030872344970703, 0.0029278993606567383, 0.0030527114868164062, 0.0031775236129760742, 0.003302335739135742, 0.00342714786529541, 0.003551959991455078, 0.003676772117614746, 0.003801584243774414, 0.003926396369934082, 0.00405120849609375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 6.0, 9.0, 9.0, 20.0, 13.0, 14.0, 20.0, 24.0, 35.0, 29.0, 55.0, 45.0, 70.0, 84.0, 99.0, 88.0, 71.0, 65.0, 49.0, 35.0, 21.0, 24.0, 15.0, 15.0, 14.0, 15.0, 11.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.573942184448242, -11.216841697692871, -10.8597412109375, -10.502640724182129, -10.145540237426758, -9.788439750671387, -9.431339263916016, -9.074239730834961, -8.717138290405273, -8.360037803649902, -8.002937316894531, -7.64583683013916, -7.288736343383789, -6.931635856628418, -6.574535846710205, -6.217435359954834, -5.860335350036621, -5.50323486328125, -5.146134376525879, -4.789033889770508, -4.431933403015137, -4.074832916259766, -3.7177329063415527, -3.3606324195861816, -3.0035319328308105, -2.6464314460754395, -2.2893309593200684, -1.9322307109832764, -1.5751302242279053, -1.2180297374725342, -0.8609294891357422, -0.5038290023803711, -0.1467294692993164, 0.2103709578514099, 0.5674713850021362, 0.9245717525482178, 1.2816722393035889, 1.63877272605896, 1.995872974395752, 2.352973461151123, 2.710073947906494, 3.0671744346618652, 3.4242749214172363, 3.7813751697540283, 4.13847541809082, 4.495575904846191, 4.8526763916015625, 5.209776878356934, 5.566877365112305, 5.923977851867676, 6.281078338623047, 6.638178825378418, 6.995279312133789, 7.35237979888916, 7.709479808807373, 8.066579818725586, 8.423681259155273, 8.780781745910645, 9.137882232666016, 9.494982719421387, 9.852083206176758, 10.209183692932129, 10.5662841796875, 10.923383712768555, 11.280484199523926]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 9.0, 5.0, 9.0, 11.0, 8.0, 8.0, 12.0, 13.0, 21.0, 18.0, 26.0, 26.0, 33.0, 33.0, 34.0, 34.0, 35.0, 44.0, 46.0, 42.0, 39.0, 37.0, 38.0, 40.0, 43.0, 36.0, 38.0, 47.0, 33.0, 26.0, 33.0, 22.0, 12.0, 19.0, 13.0, 8.0, 15.0, 10.0, 6.0, 7.0, 12.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.473306655883789, -11.062585830688477, -10.651865005493164, -10.241144180297852, -9.830422401428223, -9.41970157623291, -9.008980751037598, -8.598259925842285, -8.187538146972656, -7.776817321777344, -7.366096019744873, -6.9553751945495605, -6.54465389251709, -6.133933067321777, -5.723212242126465, -5.312491416931152, -4.90177059173584, -4.491049766540527, -4.080328464508057, -3.669607639312744, -3.2588865756988525, -2.848165512084961, -2.4374446868896484, -2.026723623275757, -1.6160025596618652, -1.2052814960479736, -0.7945605516433716, -0.38383960723876953, 0.02688145637512207, 0.43760251998901367, 0.8483233451843262, 1.2590444087982178, 1.6697654724121094, 2.080486536026001, 2.4912075996398926, 2.901928424835205, 3.3126494884490967, 3.7233705520629883, 4.134091377258301, 4.544812202453613, 4.955533504486084, 5.3662543296813965, 5.776975631713867, 6.18769645690918, 6.598417282104492, 7.009138584136963, 7.419859409332275, 7.830580711364746, 8.241301536560059, 8.652022361755371, 9.062743186950684, 9.473464965820312, 9.884185791015625, 10.294906616210938, 10.70562744140625, 11.116348266601562, 11.527069091796875, 11.937789916992188, 12.3485107421875, 12.759231567382812, 13.169953346252441, 13.580674171447754, 13.991394996643066, 14.402115821838379, 14.812837600708008]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 6.0, 6.0, 7.0, 16.0, 27.0, 35.0, 45.0, 71.0, 123.0, 145.0, 229.0, 355.0, 519.0, 703.0, 1063.0, 1548.0, 2158.0, 3076.0, 4573.0, 6803.0, 10323.0, 15452.0, 24126.0, 38598.0, 63316.0, 110640.0, 189527.0, 217833.0, 143321.0, 80076.0, 47589.0, 29501.0, 18762.0, 12306.0, 8296.0, 5433.0, 3715.0, 2517.0, 1768.0, 1231.0, 869.0, 605.0, 420.0, 278.0, 202.0, 120.0, 75.0, 68.0, 26.0, 17.0, 17.0, 9.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.3125, -15.772705078125, -15.23291015625, -14.693115234375, -14.1533203125, -13.613525390625, -13.07373046875, -12.533935546875, -11.994140625, -11.454345703125, -10.91455078125, -10.374755859375, -9.8349609375, -9.295166015625, -8.75537109375, -8.215576171875, -7.67578125, -7.135986328125, -6.59619140625, -6.056396484375, -5.5166015625, -4.976806640625, -4.43701171875, -3.897216796875, -3.357421875, -2.817626953125, -2.27783203125, -1.738037109375, -1.1982421875, -0.658447265625, -0.11865234375, 0.421142578125, 0.9609375, 1.500732421875, 2.04052734375, 2.580322265625, 3.1201171875, 3.659912109375, 4.19970703125, 4.739501953125, 5.279296875, 5.819091796875, 6.35888671875, 6.898681640625, 7.4384765625, 7.978271484375, 8.51806640625, 9.057861328125, 9.59765625, 10.137451171875, 10.67724609375, 11.217041015625, 11.7568359375, 12.296630859375, 12.83642578125, 13.376220703125, 13.916015625, 14.455810546875, 14.99560546875, 15.535400390625, 16.0751953125, 16.614990234375, 17.15478515625, 17.694580078125, 18.234375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 9.0, 9.0, 10.0, 8.0, 9.0, 12.0, 11.0, 19.0, 21.0, 29.0, 29.0, 27.0, 28.0, 42.0, 34.0, 31.0, 46.0, 36.0, 42.0, 39.0, 37.0, 31.0, 37.0, 36.0, 37.0, 40.0, 38.0, 46.0, 27.0, 19.0, 29.0, 20.0, 16.0, 16.0, 7.0, 12.0, 5.0, 12.0, 6.0, 9.0, 11.0, 7.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.640625, -10.27392578125, -9.9072265625, -9.54052734375, -9.173828125, -8.80712890625, -8.4404296875, -8.07373046875, -7.70703125, -7.34033203125, -6.9736328125, -6.60693359375, -6.240234375, -5.87353515625, -5.5068359375, -5.14013671875, -4.7734375, -4.40673828125, -4.0400390625, -3.67333984375, -3.306640625, -2.93994140625, -2.5732421875, -2.20654296875, -1.83984375, -1.47314453125, -1.1064453125, -0.73974609375, -0.373046875, -0.00634765625, 0.3603515625, 0.72705078125, 1.09375, 1.46044921875, 1.8271484375, 2.19384765625, 2.560546875, 2.92724609375, 3.2939453125, 3.66064453125, 4.02734375, 4.39404296875, 4.7607421875, 5.12744140625, 5.494140625, 5.86083984375, 6.2275390625, 6.59423828125, 6.9609375, 7.32763671875, 7.6943359375, 8.06103515625, 8.427734375, 8.79443359375, 9.1611328125, 9.52783203125, 9.89453125, 10.26123046875, 10.6279296875, 10.99462890625, 11.361328125, 11.72802734375, 12.0947265625, 12.46142578125, 12.828125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 5.0, 14.0, 14.0, 13.0, 23.0, 41.0, 56.0, 86.0, 128.0, 174.0, 262.0, 390.0, 564.0, 861.0, 1279.0, 1775.0, 2667.0, 3976.0, 5955.0, 8822.0, 13291.0, 19812.0, 30296.0, 46945.0, 76294.0, 133818.0, 212613.0, 191525.0, 111514.0, 65211.0, 40729.0, 26257.0, 17544.0, 11615.0, 7807.0, 5102.0, 3577.0, 2426.0, 1575.0, 1087.0, 786.0, 550.0, 323.0, 265.0, 149.0, 101.0, 83.0, 56.0, 34.0, 28.0, 17.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.234375, -15.7080078125, -15.181640625, -14.6552734375, -14.12890625, -13.6025390625, -13.076171875, -12.5498046875, -12.0234375, -11.4970703125, -10.970703125, -10.4443359375, -9.91796875, -9.3916015625, -8.865234375, -8.3388671875, -7.8125, -7.2861328125, -6.759765625, -6.2333984375, -5.70703125, -5.1806640625, -4.654296875, -4.1279296875, -3.6015625, -3.0751953125, -2.548828125, -2.0224609375, -1.49609375, -0.9697265625, -0.443359375, 0.0830078125, 0.609375, 1.1357421875, 1.662109375, 2.1884765625, 2.71484375, 3.2412109375, 3.767578125, 4.2939453125, 4.8203125, 5.3466796875, 5.873046875, 6.3994140625, 6.92578125, 7.4521484375, 7.978515625, 8.5048828125, 9.03125, 9.5576171875, 10.083984375, 10.6103515625, 11.13671875, 11.6630859375, 12.189453125, 12.7158203125, 13.2421875, 13.7685546875, 14.294921875, 14.8212890625, 15.34765625, 15.8740234375, 16.400390625, 16.9267578125, 17.453125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 11.0, 4.0, 17.0, 6.0, 15.0, 16.0, 21.0, 24.0, 35.0, 21.0, 22.0, 38.0, 28.0, 36.0, 29.0, 34.0, 42.0, 43.0, 44.0, 38.0, 40.0, 37.0, 43.0, 38.0, 35.0, 24.0, 25.0, 26.0, 27.0, 28.0, 23.0, 22.0, 19.0, 21.0, 12.0, 9.0, 14.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0, -6.76885986328125, -6.5377197265625, -6.30657958984375, -6.075439453125, -5.84429931640625, -5.6131591796875, -5.38201904296875, -5.15087890625, -4.91973876953125, -4.6885986328125, -4.45745849609375, -4.226318359375, -3.99517822265625, -3.7640380859375, -3.53289794921875, -3.3017578125, -3.07061767578125, -2.8394775390625, -2.60833740234375, -2.377197265625, -2.14605712890625, -1.9149169921875, -1.68377685546875, -1.45263671875, -1.22149658203125, -0.9903564453125, -0.75921630859375, -0.528076171875, -0.29693603515625, -0.0657958984375, 0.16534423828125, 0.396484375, 0.62762451171875, 0.8587646484375, 1.08990478515625, 1.321044921875, 1.55218505859375, 1.7833251953125, 2.01446533203125, 2.24560546875, 2.47674560546875, 2.7078857421875, 2.93902587890625, 3.170166015625, 3.40130615234375, 3.6324462890625, 3.86358642578125, 4.0947265625, 4.32586669921875, 4.5570068359375, 4.78814697265625, 5.019287109375, 5.25042724609375, 5.4815673828125, 5.71270751953125, 5.94384765625, 6.17498779296875, 6.4061279296875, 6.63726806640625, 6.868408203125, 7.09954833984375, 7.3306884765625, 7.56182861328125, 7.79296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 13.0, 8.0, 22.0, 29.0, 38.0, 57.0, 89.0, 128.0, 165.0, 258.0, 356.0, 522.0, 759.0, 1037.0, 1576.0, 2366.0, 3705.0, 5693.0, 8966.0, 14994.0, 25884.0, 48344.0, 110035.0, 299728.0, 299021.0, 109708.0, 48646.0, 25823.0, 14834.0, 8885.0, 5776.0, 3579.0, 2376.0, 1636.0, 1098.0, 739.0, 516.0, 365.0, 230.0, 171.0, 120.0, 77.0, 46.0, 46.0, 30.0, 12.0, 19.0, 11.0, 3.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.25390625, -2.17877197265625, -2.1036376953125, -2.02850341796875, -1.953369140625, -1.87823486328125, -1.8031005859375, -1.72796630859375, -1.65283203125, -1.57769775390625, -1.5025634765625, -1.42742919921875, -1.352294921875, -1.27716064453125, -1.2020263671875, -1.12689208984375, -1.0517578125, -0.97662353515625, -0.9014892578125, -0.82635498046875, -0.751220703125, -0.67608642578125, -0.6009521484375, -0.52581787109375, -0.45068359375, -0.37554931640625, -0.3004150390625, -0.22528076171875, -0.150146484375, -0.07501220703125, 0.0001220703125, 0.07525634765625, 0.150390625, 0.22552490234375, 0.3006591796875, 0.37579345703125, 0.450927734375, 0.52606201171875, 0.6011962890625, 0.67633056640625, 0.75146484375, 0.82659912109375, 0.9017333984375, 0.97686767578125, 1.052001953125, 1.12713623046875, 1.2022705078125, 1.27740478515625, 1.3525390625, 1.42767333984375, 1.5028076171875, 1.57794189453125, 1.653076171875, 1.72821044921875, 1.8033447265625, 1.87847900390625, 1.95361328125, 2.02874755859375, 2.1038818359375, 2.17901611328125, 2.254150390625, 2.32928466796875, 2.4044189453125, 2.47955322265625, 2.5546875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 10.0, 14.0, 24.0, 21.0, 19.0, 29.0, 27.0, 36.0, 35.0, 51.0, 58.0, 54.0, 59.0, 74.0, 74.0, 47.0, 65.0, 50.0, 40.0, 29.0, 23.0, 23.0, 20.0, 22.0, 16.0, 11.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.5367431640625e-05, -9.222421795129776e-05, -8.908100426197052e-05, -8.593779057264328e-05, -8.279457688331604e-05, -7.96513631939888e-05, -7.650814950466156e-05, -7.336493581533432e-05, -7.022172212600708e-05, -6.707850843667984e-05, -6.39352947473526e-05, -6.079208105802536e-05, -5.764886736869812e-05, -5.450565367937088e-05, -5.136243999004364e-05, -4.82192263007164e-05, -4.507601261138916e-05, -4.193279892206192e-05, -3.878958523273468e-05, -3.564637154340744e-05, -3.25031578540802e-05, -2.935994416475296e-05, -2.621673047542572e-05, -2.307351678609848e-05, -1.993030309677124e-05, -1.6787089407444e-05, -1.364387571811676e-05, -1.050066202878952e-05, -7.35744833946228e-06, -4.21423465013504e-06, -1.0710209608078003e-06, 2.0721927285194397e-06, 5.21540641784668e-06, 8.35862010717392e-06, 1.150183379650116e-05, 1.46450474858284e-05, 1.778826117515564e-05, 2.093147486448288e-05, 2.407468855381012e-05, 2.721790224313736e-05, 3.03611159324646e-05, 3.350432962179184e-05, 3.664754331111908e-05, 3.979075700044632e-05, 4.293397068977356e-05, 4.60771843791008e-05, 4.922039806842804e-05, 5.236361175775528e-05, 5.550682544708252e-05, 5.865003913640976e-05, 6.1793252825737e-05, 6.493646651506424e-05, 6.807968020439148e-05, 7.122289389371872e-05, 7.436610758304596e-05, 7.75093212723732e-05, 8.065253496170044e-05, 8.379574865102768e-05, 8.693896234035492e-05, 9.008217602968216e-05, 9.32253897190094e-05, 9.636860340833664e-05, 9.951181709766388e-05, 0.00010265503078699112, 0.00010579824447631836]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 13.0, 16.0, 23.0, 35.0, 29.0, 75.0, 87.0, 123.0, 174.0, 284.0, 397.0, 638.0, 984.0, 1632.0, 2663.0, 4685.0, 8389.0, 15573.0, 31299.0, 70367.0, 215864.0, 430599.0, 152794.0, 55540.0, 25801.0, 12892.0, 7086.0, 4057.0, 2343.0, 1433.0, 878.0, 560.0, 378.0, 248.0, 152.0, 138.0, 83.0, 52.0, 45.0, 27.0, 22.0, 19.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.8203125, -2.724273681640625, -2.62823486328125, -2.532196044921875, -2.4361572265625, -2.340118408203125, -2.24407958984375, -2.148040771484375, -2.052001953125, -1.955963134765625, -1.85992431640625, -1.763885498046875, -1.6678466796875, -1.571807861328125, -1.47576904296875, -1.379730224609375, -1.28369140625, -1.187652587890625, -1.09161376953125, -0.995574951171875, -0.8995361328125, -0.803497314453125, -0.70745849609375, -0.611419677734375, -0.515380859375, -0.419342041015625, -0.32330322265625, -0.227264404296875, -0.1312255859375, -0.035186767578125, 0.06085205078125, 0.156890869140625, 0.2529296875, 0.348968505859375, 0.44500732421875, 0.541046142578125, 0.6370849609375, 0.733123779296875, 0.82916259765625, 0.925201416015625, 1.021240234375, 1.117279052734375, 1.21331787109375, 1.309356689453125, 1.4053955078125, 1.501434326171875, 1.59747314453125, 1.693511962890625, 1.78955078125, 1.885589599609375, 1.98162841796875, 2.077667236328125, 2.1737060546875, 2.269744873046875, 2.36578369140625, 2.461822509765625, 2.557861328125, 2.653900146484375, 2.74993896484375, 2.845977783203125, 2.9420166015625, 3.038055419921875, 3.13409423828125, 3.230133056640625, 3.326171875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 6.0, 12.0, 17.0, 16.0, 23.0, 22.0, 27.0, 47.0, 49.0, 45.0, 64.0, 91.0, 99.0, 91.0, 70.0, 55.0, 39.0, 46.0, 27.0, 30.0, 19.0, 20.0, 14.0, 15.0, 13.0, 6.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0166015625, -0.9797515869140625, -0.942901611328125, -0.9060516357421875, -0.86920166015625, -0.8323516845703125, -0.795501708984375, -0.7586517333984375, -0.7218017578125, -0.6849517822265625, -0.648101806640625, -0.6112518310546875, -0.57440185546875, -0.5375518798828125, -0.500701904296875, -0.4638519287109375, -0.427001953125, -0.3901519775390625, -0.353302001953125, -0.3164520263671875, -0.27960205078125, -0.2427520751953125, -0.205902099609375, -0.1690521240234375, -0.1322021484375, -0.0953521728515625, -0.058502197265625, -0.0216522216796875, 0.01519775390625, 0.0520477294921875, 0.088897705078125, 0.1257476806640625, 0.16259765625, 0.1994476318359375, 0.236297607421875, 0.2731475830078125, 0.30999755859375, 0.3468475341796875, 0.383697509765625, 0.4205474853515625, 0.4573974609375, 0.4942474365234375, 0.531097412109375, 0.5679473876953125, 0.60479736328125, 0.6416473388671875, 0.678497314453125, 0.7153472900390625, 0.752197265625, 0.7890472412109375, 0.825897216796875, 0.8627471923828125, 0.89959716796875, 0.9364471435546875, 0.973297119140625, 1.0101470947265625, 1.0469970703125, 1.0838470458984375, 1.120697021484375, 1.1575469970703125, 1.19439697265625, 1.2312469482421875, 1.268096923828125, 1.3049468994140625, 1.341796875]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 13.0, 12.0, 19.0, 26.0, 37.0, 28.0, 39.0, 65.0, 63.0, 81.0, 94.0, 104.0, 74.0, 73.0, 58.0, 28.0, 35.0, 28.0, 25.0, 20.0, 10.0, 10.0, 7.0, 9.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.253314018249512, -12.837448120117188, -12.421581268310547, -12.005714416503906, -11.589848518371582, -11.173982620239258, -10.758115768432617, -10.342248916625977, -9.926383018493652, -9.510517120361328, -9.094650268554688, -8.678783416748047, -8.262917518615723, -7.84705114364624, -7.431184768676758, -7.015318393707275, -6.599452018737793, -6.1835856437683105, -5.767719268798828, -5.351852893829346, -4.935986518859863, -4.520120143890381, -4.104253768920898, -3.688387393951416, -3.2725210189819336, -2.856654644012451, -2.4407882690429688, -2.0249218940734863, -1.609055519104004, -1.1931891441345215, -0.7773227691650391, -0.36145639419555664, 0.054409027099609375, 0.4702754020690918, 0.8861417770385742, 1.3020081520080566, 1.717874526977539, 2.1337409019470215, 2.549607276916504, 2.9654736518859863, 3.3813400268554688, 3.797206401824951, 4.213072776794434, 4.628939151763916, 5.044805526733398, 5.460671901702881, 5.876538276672363, 6.292404651641846, 6.708271026611328, 7.1241374015808105, 7.540003776550293, 7.955870151519775, 8.371736526489258, 8.787603378295898, 9.203469276428223, 9.619335174560547, 10.035202026367188, 10.451068878173828, 10.866934776306152, 11.282800674438477, 11.698667526245117, 12.114534378051758, 12.530400276184082, 12.946266174316406, 13.362133026123047]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 10.0, 6.0, 9.0, 19.0, 24.0, 14.0, 23.0, 25.0, 28.0, 27.0, 39.0, 40.0, 43.0, 33.0, 39.0, 52.0, 43.0, 29.0, 39.0, 46.0, 37.0, 43.0, 34.0, 45.0, 40.0, 26.0, 27.0, 22.0, 22.0, 17.0, 27.0, 12.0, 10.0, 4.0, 9.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.966153144836426, -10.52086067199707, -10.075567245483398, -9.630274772644043, -9.184981346130371, -8.739688873291016, -8.294395446777344, -7.849102973937988, -7.403810024261475, -6.958517074584961, -6.513224124908447, -6.067931175231934, -5.622638702392578, -5.177345275878906, -4.732052803039551, -4.286759853363037, -3.8414669036865234, -3.3961739540100098, -2.950881004333496, -2.5055882930755615, -2.060295343399048, -1.6150023937225342, -1.1697096824645996, -0.7244167327880859, -0.27912378311157227, 0.16616910696029663, 0.6114619970321655, 1.0567548274993896, 1.5020477771759033, 1.947340726852417, 2.3926334381103516, 2.8379263877868652, 3.2832202911376953, 3.728513240814209, 4.173806190490723, 4.619098663330078, 5.06439208984375, 5.5096845626831055, 5.954977512359619, 6.400270462036133, 6.8455634117126465, 7.29085636138916, 7.736149311065674, 8.181442260742188, 8.626734733581543, 9.072028160095215, 9.51732063293457, 9.962614059448242, 10.407906532287598, 10.853199005126953, 11.298492431640625, 11.74378490447998, 12.189078330993652, 12.634370803833008, 13.07966423034668, 13.524956703186035, 13.97024917602539, 14.415541648864746, 14.860835075378418, 15.306127548217773, 15.751420974731445, 16.196714401245117, 16.642005920410156, 17.087299346923828, 17.5325927734375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 7.0, 16.0, 19.0, 20.0, 42.0, 64.0, 101.0, 151.0, 227.0, 382.0, 639.0, 947.0, 1607.0, 2514.0, 4093.0, 6910.0, 11288.0, 19425.0, 34494.0, 63133.0, 123488.0, 284237.0, 1020607.0, 1728992.0, 508375.0, 177956.0, 87977.0, 47984.0, 26884.0, 15809.0, 9449.0, 5805.0, 3693.0, 2370.0, 1523.0, 991.0, 669.0, 428.0, 285.0, 206.0, 140.0, 93.0, 63.0, 62.0, 34.0, 23.0, 23.0, 13.0, 7.0, 6.0, 7.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.8125, -14.24853515625, -13.6845703125, -13.12060546875, -12.556640625, -11.99267578125, -11.4287109375, -10.86474609375, -10.30078125, -9.73681640625, -9.1728515625, -8.60888671875, -8.044921875, -7.48095703125, -6.9169921875, -6.35302734375, -5.7890625, -5.22509765625, -4.6611328125, -4.09716796875, -3.533203125, -2.96923828125, -2.4052734375, -1.84130859375, -1.27734375, -0.71337890625, -0.1494140625, 0.41455078125, 0.978515625, 1.54248046875, 2.1064453125, 2.67041015625, 3.234375, 3.79833984375, 4.3623046875, 4.92626953125, 5.490234375, 6.05419921875, 6.6181640625, 7.18212890625, 7.74609375, 8.31005859375, 8.8740234375, 9.43798828125, 10.001953125, 10.56591796875, 11.1298828125, 11.69384765625, 12.2578125, 12.82177734375, 13.3857421875, 13.94970703125, 14.513671875, 15.07763671875, 15.6416015625, 16.20556640625, 16.76953125, 17.33349609375, 17.8974609375, 18.46142578125, 19.025390625, 19.58935546875, 20.1533203125, 20.71728515625, 21.28125]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 10.0, 15.0, 7.0, 10.0, 18.0, 13.0, 24.0, 24.0, 23.0, 26.0, 36.0, 38.0, 39.0, 45.0, 44.0, 43.0, 43.0, 37.0, 43.0, 37.0, 41.0, 41.0, 35.0, 45.0, 39.0, 28.0, 28.0, 27.0, 23.0, 20.0, 22.0, 23.0, 9.0, 6.0, 5.0, 7.0, 7.0, 9.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.9188232421875, -9.525146484375, -9.1314697265625, -8.73779296875, -8.3441162109375, -7.950439453125, -7.5567626953125, -7.1630859375, -6.7694091796875, -6.375732421875, -5.9820556640625, -5.58837890625, -5.1947021484375, -4.801025390625, -4.4073486328125, -4.013671875, -3.6199951171875, -3.226318359375, -2.8326416015625, -2.43896484375, -2.0452880859375, -1.651611328125, -1.2579345703125, -0.8642578125, -0.4705810546875, -0.076904296875, 0.3167724609375, 0.71044921875, 1.1041259765625, 1.497802734375, 1.8914794921875, 2.28515625, 2.6788330078125, 3.072509765625, 3.4661865234375, 3.85986328125, 4.2535400390625, 4.647216796875, 5.0408935546875, 5.4345703125, 5.8282470703125, 6.221923828125, 6.6156005859375, 7.00927734375, 7.4029541015625, 7.796630859375, 8.1903076171875, 8.583984375, 8.9776611328125, 9.371337890625, 9.7650146484375, 10.15869140625, 10.5523681640625, 10.946044921875, 11.3397216796875, 11.7333984375, 12.1270751953125, 12.520751953125, 12.9144287109375, 13.30810546875, 13.7017822265625, 14.095458984375, 14.4891357421875, 14.8828125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 4.0, 19.0, 13.0, 31.0, 33.0, 69.0, 96.0, 133.0, 213.0, 326.0, 522.0, 782.0, 1284.0, 2094.0, 3529.0, 6130.0, 10385.0, 18528.0, 34160.0, 65074.0, 136233.0, 321896.0, 958500.0, 1668353.0, 552611.0, 210616.0, 95156.0, 48042.0, 25277.0, 14297.0, 8035.0, 4584.0, 2756.0, 1697.0, 1032.0, 614.0, 411.0, 286.0, 161.0, 98.0, 66.0, 47.0, 33.0, 17.0, 17.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.07568359375, -15.5263671875, -14.97705078125, -14.427734375, -13.87841796875, -13.3291015625, -12.77978515625, -12.23046875, -11.68115234375, -11.1318359375, -10.58251953125, -10.033203125, -9.48388671875, -8.9345703125, -8.38525390625, -7.8359375, -7.28662109375, -6.7373046875, -6.18798828125, -5.638671875, -5.08935546875, -4.5400390625, -3.99072265625, -3.44140625, -2.89208984375, -2.3427734375, -1.79345703125, -1.244140625, -0.69482421875, -0.1455078125, 0.40380859375, 0.953125, 1.50244140625, 2.0517578125, 2.60107421875, 3.150390625, 3.69970703125, 4.2490234375, 4.79833984375, 5.34765625, 5.89697265625, 6.4462890625, 6.99560546875, 7.544921875, 8.09423828125, 8.6435546875, 9.19287109375, 9.7421875, 10.29150390625, 10.8408203125, 11.39013671875, 11.939453125, 12.48876953125, 13.0380859375, 13.58740234375, 14.13671875, 14.68603515625, 15.2353515625, 15.78466796875, 16.333984375, 16.88330078125, 17.4326171875, 17.98193359375, 18.53125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 4.0, 11.0, 11.0, 14.0, 12.0, 27.0, 32.0, 44.0, 53.0, 65.0, 105.0, 107.0, 123.0, 185.0, 214.0, 274.0, 325.0, 381.0, 472.0, 360.0, 251.0, 206.0, 165.0, 134.0, 122.0, 79.0, 57.0, 68.0, 40.0, 29.0, 20.0, 18.0, 22.0, 14.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.49969482421875, -6.2689208984375, -6.03814697265625, -5.807373046875, -5.57659912109375, -5.3458251953125, -5.11505126953125, -4.88427734375, -4.65350341796875, -4.4227294921875, -4.19195556640625, -3.961181640625, -3.73040771484375, -3.4996337890625, -3.26885986328125, -3.0380859375, -2.80731201171875, -2.5765380859375, -2.34576416015625, -2.114990234375, -1.88421630859375, -1.6534423828125, -1.42266845703125, -1.19189453125, -0.96112060546875, -0.7303466796875, -0.49957275390625, -0.268798828125, -0.03802490234375, 0.1927490234375, 0.42352294921875, 0.654296875, 0.88507080078125, 1.1158447265625, 1.34661865234375, 1.577392578125, 1.80816650390625, 2.0389404296875, 2.26971435546875, 2.50048828125, 2.73126220703125, 2.9620361328125, 3.19281005859375, 3.423583984375, 3.65435791015625, 3.8851318359375, 4.11590576171875, 4.3466796875, 4.57745361328125, 4.8082275390625, 5.03900146484375, 5.269775390625, 5.50054931640625, 5.7313232421875, 5.96209716796875, 6.19287109375, 6.42364501953125, 6.6544189453125, 6.88519287109375, 7.115966796875, 7.34674072265625, 7.5775146484375, 7.80828857421875, 8.0390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 15.0, 14.0, 10.0, 16.0, 29.0, 34.0, 56.0, 54.0, 72.0, 117.0, 140.0, 105.0, 98.0, 59.0, 46.0, 30.0, 24.0, 18.0, 13.0, 15.0, 9.0, 1.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.616439819335938, -19.062349319458008, -18.508258819580078, -17.95417022705078, -17.40007972717285, -16.845989227294922, -16.291898727416992, -15.737809181213379, -15.183719635009766, -14.629629135131836, -14.075539588928223, -13.521449089050293, -12.96735954284668, -12.41326904296875, -11.85917854309082, -11.305088996887207, -10.750998497009277, -10.196907997131348, -9.642818450927734, -9.088727951049805, -8.534638404846191, -7.980547904968262, -7.42645788192749, -6.872367858886719, -6.318277835845947, -5.764187812805176, -5.210097789764404, -4.656007766723633, -4.101917266845703, -3.5478274822235107, -2.99373722076416, -2.4396471977233887, -1.8855571746826172, -1.3314671516418457, -0.7773770093917847, -0.22328686714172363, 0.33080315589904785, 0.8848931789398193, 1.43898344039917, 1.9930734634399414, 2.547163486480713, 3.1012535095214844, 3.655343532562256, 4.209433555603027, 4.763524055480957, 5.31761360168457, 5.8717041015625, 6.4257941246032715, 6.979884147644043, 7.5339741706848145, 8.088064193725586, 8.642154693603516, 9.196244239807129, 9.750334739685059, 10.304424285888672, 10.858514785766602, 11.412605285644531, 11.966695785522461, 12.520785331726074, 13.074875831604004, 13.628965377807617, 14.183055877685547, 14.737146377563477, 15.29123592376709, 15.845325469970703]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 13.0, 15.0, 16.0, 20.0, 18.0, 26.0, 27.0, 26.0, 38.0, 36.0, 53.0, 35.0, 52.0, 39.0, 47.0, 34.0, 56.0, 38.0, 32.0, 42.0, 48.0, 37.0, 35.0, 27.0, 37.0, 28.0, 19.0, 16.0, 13.0, 10.0, 13.0, 9.0, 5.0, 8.0, 5.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.353267669677734, -11.873824119567871, -11.394379615783691, -10.914936065673828, -10.435491561889648, -9.956048011779785, -9.476604461669922, -8.997159957885742, -8.517715454101562, -8.0382719039917, -7.5588274002075195, -7.079383850097656, -6.599939346313477, -6.120495796203613, -5.641051769256592, -5.16160774230957, -4.682164192199707, -4.2027201652526855, -3.723276138305664, -3.2438323497772217, -2.7643883228302, -2.2849442958831787, -1.8055005073547363, -1.3260564804077148, -0.8466124534606934, -0.36716848611831665, 0.11227548122406006, 0.591719388961792, 1.0711634159088135, 1.550607442855835, 2.0300512313842773, 2.509495258331299, 2.9889392852783203, 3.468383312225342, 3.9478273391723633, 4.427270889282227, 4.906715393066406, 5.3861589431762695, 5.865602970123291, 6.3450469970703125, 6.824491024017334, 7.3039350509643555, 7.783379077911377, 8.262823104858398, 8.742266654968262, 9.221711158752441, 9.701154708862305, 10.180599212646484, 10.660042762756348, 11.139486312866211, 11.61893081665039, 12.098374366760254, 12.577818870544434, 13.057262420654297, 13.536706924438477, 14.01615047454834, 14.495594024658203, 14.975037574768066, 15.454482078552246, 15.93392562866211, 16.41337013244629, 16.89281463623047, 17.372257232666016, 17.851701736450195, 18.331146240234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 13.0, 17.0, 14.0, 27.0, 36.0, 58.0, 116.0, 181.0, 294.0, 426.0, 765.0, 1363.0, 2216.0, 3736.0, 6217.0, 10240.0, 17874.0, 31266.0, 58600.0, 118956.0, 337781.0, 240068.0, 100925.0, 51012.0, 27634.0, 15842.0, 9162.0, 5509.0, 3250.0, 1908.0, 1179.0, 745.0, 418.0, 247.0, 163.0, 97.0, 57.0, 45.0, 23.0, 24.0, 16.0, 7.0, 8.0, 8.0, 4.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.41741943359375, -4.2645263671875, -4.11163330078125, -3.958740234375, -3.80584716796875, -3.6529541015625, -3.50006103515625, -3.34716796875, -3.19427490234375, -3.0413818359375, -2.88848876953125, -2.735595703125, -2.58270263671875, -2.4298095703125, -2.27691650390625, -2.1240234375, -1.97113037109375, -1.8182373046875, -1.66534423828125, -1.512451171875, -1.35955810546875, -1.2066650390625, -1.05377197265625, -0.90087890625, -0.74798583984375, -0.5950927734375, -0.44219970703125, -0.289306640625, -0.13641357421875, 0.0164794921875, 0.16937255859375, 0.322265625, 0.47515869140625, 0.6280517578125, 0.78094482421875, 0.933837890625, 1.08673095703125, 1.2396240234375, 1.39251708984375, 1.54541015625, 1.69830322265625, 1.8511962890625, 2.00408935546875, 2.156982421875, 2.30987548828125, 2.4627685546875, 2.61566162109375, 2.7685546875, 2.92144775390625, 3.0743408203125, 3.22723388671875, 3.380126953125, 3.53302001953125, 3.6859130859375, 3.83880615234375, 3.99169921875, 4.14459228515625, 4.2974853515625, 4.45037841796875, 4.603271484375, 4.75616455078125, 4.9090576171875, 5.06195068359375, 5.21484375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 13.0, 14.0, 14.0, 18.0, 18.0, 17.0, 25.0, 31.0, 33.0, 38.0, 39.0, 47.0, 55.0, 49.0, 45.0, 38.0, 65.0, 33.0, 37.0, 48.0, 48.0, 32.0, 38.0, 34.0, 35.0, 26.0, 19.0, 12.0, 17.0, 12.0, 13.0, 7.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1270751953125, -11.621337890625, -11.1156005859375, -10.60986328125, -10.1041259765625, -9.598388671875, -9.0926513671875, -8.5869140625, -8.0811767578125, -7.575439453125, -7.0697021484375, -6.56396484375, -6.0582275390625, -5.552490234375, -5.0467529296875, -4.541015625, -4.0352783203125, -3.529541015625, -3.0238037109375, -2.51806640625, -2.0123291015625, -1.506591796875, -1.0008544921875, -0.4951171875, 0.0106201171875, 0.516357421875, 1.0220947265625, 1.52783203125, 2.0335693359375, 2.539306640625, 3.0450439453125, 3.55078125, 4.0565185546875, 4.562255859375, 5.0679931640625, 5.57373046875, 6.0794677734375, 6.585205078125, 7.0909423828125, 7.5966796875, 8.1024169921875, 8.608154296875, 9.1138916015625, 9.61962890625, 10.1253662109375, 10.631103515625, 11.1368408203125, 11.642578125, 12.1483154296875, 12.654052734375, 13.1597900390625, 13.66552734375, 14.1712646484375, 14.677001953125, 15.1827392578125, 15.6884765625, 16.1942138671875, 16.699951171875, 17.2056884765625, 17.71142578125, 18.2171630859375, 18.722900390625, 19.2286376953125, 19.734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 5.0, 2.0, 9.0, 11.0, 18.0, 25.0, 44.0, 47.0, 67.0, 88.0, 124.0, 180.0, 265.0, 344.0, 467.0, 618.0, 789.0, 1146.0, 1586.0, 2140.0, 3132.0, 4367.0, 6095.0, 8779.0, 12596.0, 18487.0, 27127.0, 40452.0, 62560.0, 105645.0, 237238.0, 222504.0, 102850.0, 61579.0, 39834.0, 26548.0, 18055.0, 12628.0, 8666.0, 6074.0, 4238.0, 3058.0, 2201.0, 1540.0, 1151.0, 848.0, 615.0, 451.0, 315.0, 244.0, 205.0, 142.0, 107.0, 85.0, 60.0, 45.0, 24.0, 16.0, 17.0, 8.0, 3.0, 5.0, 3.0], "bins": [-3.228515625, -3.1275634765625, -3.026611328125, -2.9256591796875, -2.82470703125, -2.7237548828125, -2.622802734375, -2.5218505859375, -2.4208984375, -2.3199462890625, -2.218994140625, -2.1180419921875, -2.01708984375, -1.9161376953125, -1.815185546875, -1.7142333984375, -1.61328125, -1.5123291015625, -1.411376953125, -1.3104248046875, -1.20947265625, -1.1085205078125, -1.007568359375, -0.9066162109375, -0.8056640625, -0.7047119140625, -0.603759765625, -0.5028076171875, -0.40185546875, -0.3009033203125, -0.199951171875, -0.0989990234375, 0.001953125, 0.1029052734375, 0.203857421875, 0.3048095703125, 0.40576171875, 0.5067138671875, 0.607666015625, 0.7086181640625, 0.8095703125, 0.9105224609375, 1.011474609375, 1.1124267578125, 1.21337890625, 1.3143310546875, 1.415283203125, 1.5162353515625, 1.6171875, 1.7181396484375, 1.819091796875, 1.9200439453125, 2.02099609375, 2.1219482421875, 2.222900390625, 2.3238525390625, 2.4248046875, 2.5257568359375, 2.626708984375, 2.7276611328125, 2.82861328125, 2.9295654296875, 3.030517578125, 3.1314697265625, 3.232421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 12.0, 8.0, 10.0, 15.0, 9.0, 16.0, 17.0, 19.0, 19.0, 23.0, 27.0, 32.0, 27.0, 39.0, 34.0, 32.0, 37.0, 29.0, 35.0, 47.0, 31.0, 31.0, 40.0, 41.0, 30.0, 26.0, 29.0, 27.0, 20.0, 21.0, 31.0, 29.0, 20.0, 23.0, 12.0, 11.0, 13.0, 11.0, 8.0, 7.0, 7.0, 3.0, 6.0, 4.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.92578125, -7.67559814453125, -7.4254150390625, -7.17523193359375, -6.925048828125, -6.67486572265625, -6.4246826171875, -6.17449951171875, -5.92431640625, -5.67413330078125, -5.4239501953125, -5.17376708984375, -4.923583984375, -4.67340087890625, -4.4232177734375, -4.17303466796875, -3.9228515625, -3.67266845703125, -3.4224853515625, -3.17230224609375, -2.922119140625, -2.67193603515625, -2.4217529296875, -2.17156982421875, -1.92138671875, -1.67120361328125, -1.4210205078125, -1.17083740234375, -0.920654296875, -0.67047119140625, -0.4202880859375, -0.17010498046875, 0.080078125, 0.33026123046875, 0.5804443359375, 0.83062744140625, 1.080810546875, 1.33099365234375, 1.5811767578125, 1.83135986328125, 2.08154296875, 2.33172607421875, 2.5819091796875, 2.83209228515625, 3.082275390625, 3.33245849609375, 3.5826416015625, 3.83282470703125, 4.0830078125, 4.33319091796875, 4.5833740234375, 4.83355712890625, 5.083740234375, 5.33392333984375, 5.5841064453125, 5.83428955078125, 6.08447265625, 6.33465576171875, 6.5848388671875, 6.83502197265625, 7.085205078125, 7.33538818359375, 7.5855712890625, 7.83575439453125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 5.0, 5.0, 10.0, 15.0, 14.0, 25.0, 47.0, 56.0, 64.0, 99.0, 154.0, 206.0, 291.0, 432.0, 562.0, 824.0, 1136.0, 1672.0, 2446.0, 3606.0, 5577.0, 8858.0, 14151.0, 24117.0, 40805.0, 74758.0, 154825.0, 315476.0, 189879.0, 88641.0, 47066.0, 27048.0, 16313.0, 10059.0, 6328.0, 4089.0, 2727.0, 1811.0, 1267.0, 886.0, 622.0, 390.0, 329.0, 245.0, 165.0, 116.0, 111.0, 70.0, 50.0, 33.0, 25.0, 24.0, 10.0, 6.0, 5.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.004547119140625, -0.004398643970489502, -0.004250168800354004, -0.004101693630218506, -0.003953218460083008, -0.0038047432899475098, -0.0036562681198120117, -0.0035077929496765137, -0.0033593177795410156, -0.0032108426094055176, -0.0030623674392700195, -0.0029138922691345215, -0.0027654170989990234, -0.0026169419288635254, -0.0024684667587280273, -0.0023199915885925293, -0.0021715164184570312, -0.002023041248321533, -0.0018745660781860352, -0.0017260909080505371, -0.001577615737915039, -0.001429140567779541, -0.001280665397644043, -0.001132190227508545, -0.0009837150573730469, -0.0008352398872375488, -0.0006867647171020508, -0.0005382895469665527, -0.0003898143768310547, -0.00024133920669555664, -9.28640365600586e-05, 5.561113357543945e-05, 0.0002040863037109375, 0.00035256147384643555, 0.0005010366439819336, 0.0006495118141174316, 0.0007979869842529297, 0.0009464621543884277, 0.0010949373245239258, 0.0012434124946594238, 0.0013918876647949219, 0.00154036283493042, 0.001688838005065918, 0.001837313175201416, 0.001985788345336914, 0.002134263515472412, 0.00228273868560791, 0.002431213855743408, 0.0025796890258789062, 0.0027281641960144043, 0.0028766393661499023, 0.0030251145362854004, 0.0031735897064208984, 0.0033220648765563965, 0.0034705400466918945, 0.0036190152168273926, 0.0037674903869628906, 0.003915965557098389, 0.004064440727233887, 0.004212915897369385, 0.004361391067504883, 0.004509866237640381, 0.004658341407775879, 0.004806816577911377, 0.004955291748046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 10.0, 10.0, 6.0, 10.0, 8.0, 11.0, 12.0, 23.0, 15.0, 37.0, 61.0, 52.0, 60.0, 61.0, 55.0, 64.0, 64.0, 55.0, 53.0, 75.0, 53.0, 30.0, 29.0, 28.0, 24.0, 18.0, 10.0, 15.0, 20.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-06, -4.046596586704254e-06, -3.9208680391311646e-06, -3.795139491558075e-06, -3.6694109439849854e-06, -3.5436823964118958e-06, -3.417953848838806e-06, -3.2922253012657166e-06, -3.166496753692627e-06, -3.0407682061195374e-06, -2.9150396585464478e-06, -2.789311110973358e-06, -2.6635825634002686e-06, -2.537854015827179e-06, -2.4121254682540894e-06, -2.2863969206809998e-06, -2.16066837310791e-06, -2.0349398255348206e-06, -1.909211277961731e-06, -1.7834827303886414e-06, -1.6577541828155518e-06, -1.5320256352424622e-06, -1.4062970876693726e-06, -1.280568540096283e-06, -1.1548399925231934e-06, -1.0291114449501038e-06, -9.033828973770142e-07, -7.776543498039246e-07, -6.51925802230835e-07, -5.261972546577454e-07, -4.0046870708465576e-07, -2.7474015951156616e-07, -1.4901161193847656e-07, -2.3283064365386963e-08, 1.0244548320770264e-07, 2.2817403078079224e-07, 3.5390257835388184e-07, 4.796311259269714e-07, 6.05359673500061e-07, 7.310882210731506e-07, 8.568167686462402e-07, 9.825453162193298e-07, 1.1082738637924194e-06, 1.234002411365509e-06, 1.3597309589385986e-06, 1.4854595065116882e-06, 1.6111880540847778e-06, 1.7369166016578674e-06, 1.862645149230957e-06, 1.9883736968040466e-06, 2.1141022443771362e-06, 2.239830791950226e-06, 2.3655593395233154e-06, 2.491287887096405e-06, 2.6170164346694946e-06, 2.7427449822425842e-06, 2.868473529815674e-06, 2.9942020773887634e-06, 3.119930624961853e-06, 3.2456591725349426e-06, 3.3713877201080322e-06, 3.497116267681122e-06, 3.6228448152542114e-06, 3.748573362827301e-06, 3.874301910400391e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 9.0, 17.0, 24.0, 33.0, 46.0, 69.0, 85.0, 130.0, 162.0, 215.0, 316.0, 444.0, 653.0, 1008.0, 1507.0, 2394.0, 3874.0, 6190.0, 10774.0, 19340.0, 37028.0, 76023.0, 177376.0, 366704.0, 181563.0, 77542.0, 37494.0, 19071.0, 11073.0, 6289.0, 3873.0, 2386.0, 1615.0, 950.0, 680.0, 433.0, 339.0, 224.0, 163.0, 114.0, 93.0, 56.0, 49.0, 36.0, 25.0, 22.0, 13.0, 6.0, 1.0, 6.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.00609588623046875, -0.005913972854614258, -0.005732059478759766, -0.0055501461029052734, -0.005368232727050781, -0.005186319351196289, -0.005004405975341797, -0.004822492599487305, -0.0046405792236328125, -0.00445866584777832, -0.004276752471923828, -0.004094839096069336, -0.003912925720214844, -0.0037310123443603516, -0.0035490989685058594, -0.003367185592651367, -0.003185272216796875, -0.003003358840942383, -0.0028214454650878906, -0.0026395320892333984, -0.0024576187133789062, -0.002275705337524414, -0.002093791961669922, -0.0019118785858154297, -0.0017299652099609375, -0.0015480518341064453, -0.0013661384582519531, -0.001184225082397461, -0.0010023117065429688, -0.0008203983306884766, -0.0006384849548339844, -0.0004565715789794922, -0.000274658203125, -9.274482727050781e-05, 8.916854858398438e-05, 0.00027108192443847656, 0.00045299530029296875, 0.0006349086761474609, 0.0008168220520019531, 0.0009987354278564453, 0.0011806488037109375, 0.0013625621795654297, 0.0015444755554199219, 0.001726388931274414, 0.0019083023071289062, 0.0020902156829833984, 0.0022721290588378906, 0.002454042434692383, 0.002635955810546875, 0.002817869186401367, 0.0029997825622558594, 0.0031816959381103516, 0.0033636093139648438, 0.003545522689819336, 0.003727436065673828, 0.00390934944152832, 0.0040912628173828125, 0.004273176193237305, 0.004455089569091797, 0.004637002944946289, 0.004818916320800781, 0.0050008296966552734, 0.005182743072509766, 0.005364656448364258, 0.00554656982421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 6.0, 13.0, 16.0, 9.0, 12.0, 23.0, 23.0, 22.0, 39.0, 62.0, 46.0, 64.0, 60.0, 64.0, 51.0, 75.0, 68.0, 55.0, 63.0, 51.0, 36.0, 30.0, 21.0, 13.0, 14.0, 12.0, 8.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002506256103515625, -0.0024318695068359375, -0.00235748291015625, -0.0022830963134765625, -0.002208709716796875, -0.0021343231201171875, -0.0020599365234375, -0.0019855499267578125, -0.001911163330078125, -0.0018367767333984375, -0.00176239013671875, -0.0016880035400390625, -0.001613616943359375, -0.0015392303466796875, -0.00146484375, -0.0013904571533203125, -0.001316070556640625, -0.0012416839599609375, -0.00116729736328125, -0.0010929107666015625, -0.001018524169921875, -0.0009441375732421875, -0.0008697509765625, -0.0007953643798828125, -0.000720977783203125, -0.0006465911865234375, -0.00057220458984375, -0.0004978179931640625, -0.000423431396484375, -0.0003490447998046875, -0.000274658203125, -0.0002002716064453125, -0.000125885009765625, -5.14984130859375e-05, 2.288818359375e-05, 9.72747802734375e-05, 0.000171661376953125, 0.0002460479736328125, 0.0003204345703125, 0.0003948211669921875, 0.000469207763671875, 0.0005435943603515625, 0.00061798095703125, 0.0006923675537109375, 0.000766754150390625, 0.0008411407470703125, 0.00091552734375, 0.0009899139404296875, 0.001064300537109375, 0.0011386871337890625, 0.00121307373046875, 0.0012874603271484375, 0.001361846923828125, 0.0014362335205078125, 0.0015106201171875, 0.0015850067138671875, 0.001659393310546875, 0.0017337799072265625, 0.00180816650390625, 0.0018825531005859375, 0.001956939697265625, 0.0020313262939453125, 0.002105712890625, 0.0021800994873046875, 0.002254486083984375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 13.0, 14.0, 15.0, 24.0, 28.0, 39.0, 55.0, 61.0, 87.0, 131.0, 126.0, 102.0, 76.0, 54.0, 45.0, 28.0, 19.0, 22.0, 10.0, 13.0, 4.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.127361297607422, -18.580533981323242, -18.033706665039062, -17.486879348754883, -16.940052032470703, -16.393226623535156, -15.84639835357666, -15.29957103729248, -14.752744674682617, -14.205917358398438, -13.659090042114258, -13.112262725830078, -12.565436363220215, -12.018609046936035, -11.471781730651855, -10.924954414367676, -10.378127098083496, -9.831299781799316, -9.284472465515137, -8.737646102905273, -8.190818786621094, -7.643991470336914, -7.097164154052734, -6.550336837768555, -6.003509998321533, -5.4566826820373535, -4.909855842590332, -4.363028526306152, -3.8162014484405518, -3.269374370574951, -2.7225470542907715, -2.175719976425171, -1.6288928985595703, -1.0820658206939697, -0.5352386236190796, 0.011588573455810547, 0.5584156513214111, 1.1052427291870117, 1.6520700454711914, 2.198897123336792, 2.7457242012023926, 3.292551279067993, 3.8393783569335938, 4.386205673217773, 4.933032989501953, 5.479859828948975, 6.026687145233154, 6.573513984680176, 7.1203413009643555, 7.667168617248535, 8.213995933532715, 8.760822296142578, 9.307649612426758, 9.854476928710938, 10.401304244995117, 10.948131561279297, 11.494958877563477, 12.041786193847656, 12.588613510131836, 13.135440826416016, 13.682267189025879, 14.229094505310059, 14.775921821594238, 15.322749137878418, 15.869575500488281]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 8.0, 14.0, 14.0, 16.0, 21.0, 18.0, 25.0, 27.0, 26.0, 39.0, 34.0, 53.0, 38.0, 52.0, 38.0, 47.0, 33.0, 56.0, 38.0, 34.0, 42.0, 46.0, 39.0, 34.0, 25.0, 39.0, 27.0, 19.0, 17.0, 13.0, 11.0, 12.0, 8.0, 6.0, 8.0, 5.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.31564712524414, -11.836283683776855, -11.35692024230957, -10.877556800842285, -10.398193359375, -9.918829917907715, -9.43946647644043, -8.960103034973145, -8.48073959350586, -8.001376152038574, -7.522012710571289, -7.042649269104004, -6.563285827636719, -6.083922386169434, -5.604558944702148, -5.125195503234863, -4.645832538604736, -4.166469097137451, -3.687105655670166, -3.207742214202881, -2.7283787727355957, -2.2490155696868896, -1.7696521282196045, -1.2902886867523193, -0.8109252452850342, -0.3315618336200714, 0.14780157804489136, 0.6271649599075317, 1.106528401374817, 1.5858917236328125, 2.0652551651000977, 2.544618606567383, 3.023982048034668, 3.503345489501953, 3.9827089309692383, 4.462072372436523, 4.941435813903809, 5.420799255371094, 5.900162696838379, 6.379526138305664, 6.858889579772949, 7.338253021240234, 7.8176164627075195, 8.296979904174805, 8.77634334564209, 9.255706787109375, 9.73507022857666, 10.214433670043945, 10.693796157836914, 11.1731595993042, 11.652523040771484, 12.13188648223877, 12.611249923706055, 13.09061336517334, 13.569976806640625, 14.04934024810791, 14.528703689575195, 15.00806713104248, 15.487430572509766, 15.96679401397705, 16.446157455444336, 16.925519943237305, 17.404884338378906, 17.884246826171875, 18.363611221313477]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 10.0, 18.0, 30.0, 45.0, 59.0, 97.0, 142.0, 253.0, 421.0, 703.0, 1077.0, 1826.0, 3193.0, 5275.0, 9224.0, 15859.0, 27953.0, 51477.0, 100620.0, 220303.0, 298209.0, 149820.0, 72641.0, 38522.0, 21402.0, 11956.0, 7016.0, 4272.0, 2413.0, 1486.0, 872.0, 493.0, 314.0, 193.0, 125.0, 73.0, 43.0, 30.0, 21.0, 17.0, 12.0, 7.0, 8.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.334716796875, -21.54443359375, -20.754150390625, -19.9638671875, -19.173583984375, -18.38330078125, -17.593017578125, -16.802734375, -16.012451171875, -15.22216796875, -14.431884765625, -13.6416015625, -12.851318359375, -12.06103515625, -11.270751953125, -10.48046875, -9.690185546875, -8.89990234375, -8.109619140625, -7.3193359375, -6.529052734375, -5.73876953125, -4.948486328125, -4.158203125, -3.367919921875, -2.57763671875, -1.787353515625, -0.9970703125, -0.206787109375, 0.58349609375, 1.373779296875, 2.1640625, 2.954345703125, 3.74462890625, 4.534912109375, 5.3251953125, 6.115478515625, 6.90576171875, 7.696044921875, 8.486328125, 9.276611328125, 10.06689453125, 10.857177734375, 11.6474609375, 12.437744140625, 13.22802734375, 14.018310546875, 14.80859375, 15.598876953125, 16.38916015625, 17.179443359375, 17.9697265625, 18.760009765625, 19.55029296875, 20.340576171875, 21.130859375, 21.921142578125, 22.71142578125, 23.501708984375, 24.2919921875, 25.082275390625, 25.87255859375, 26.662841796875, 27.453125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 10.0, 8.0, 15.0, 15.0, 11.0, 16.0, 18.0, 20.0, 36.0, 27.0, 37.0, 27.0, 45.0, 50.0, 49.0, 38.0, 43.0, 49.0, 40.0, 38.0, 31.0, 42.0, 38.0, 52.0, 38.0, 26.0, 32.0, 23.0, 32.0, 13.0, 12.0, 15.0, 14.0, 8.0, 3.0, 9.0, 3.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9609375, -10.5220947265625, -10.083251953125, -9.6444091796875, -9.20556640625, -8.7667236328125, -8.327880859375, -7.8890380859375, -7.4501953125, -7.0113525390625, -6.572509765625, -6.1336669921875, -5.69482421875, -5.2559814453125, -4.817138671875, -4.3782958984375, -3.939453125, -3.5006103515625, -3.061767578125, -2.6229248046875, -2.18408203125, -1.7452392578125, -1.306396484375, -0.8675537109375, -0.4287109375, 0.0101318359375, 0.448974609375, 0.8878173828125, 1.32666015625, 1.7655029296875, 2.204345703125, 2.6431884765625, 3.08203125, 3.5208740234375, 3.959716796875, 4.3985595703125, 4.83740234375, 5.2762451171875, 5.715087890625, 6.1539306640625, 6.5927734375, 7.0316162109375, 7.470458984375, 7.9093017578125, 8.34814453125, 8.7869873046875, 9.225830078125, 9.6646728515625, 10.103515625, 10.5423583984375, 10.981201171875, 11.4200439453125, 11.85888671875, 12.2977294921875, 12.736572265625, 13.1754150390625, 13.6142578125, 14.0531005859375, 14.491943359375, 14.9307861328125, 15.36962890625, 15.8084716796875, 16.247314453125, 16.6861572265625, 17.125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 2.0, 9.0, 6.0, 10.0, 18.0, 26.0, 37.0, 61.0, 73.0, 124.0, 189.0, 292.0, 469.0, 715.0, 1098.0, 1604.0, 2581.0, 4017.0, 6186.0, 10005.0, 16140.0, 26677.0, 45884.0, 84026.0, 173919.0, 282330.0, 183119.0, 88181.0, 47909.0, 27974.0, 16535.0, 10322.0, 6445.0, 4117.0, 2651.0, 1666.0, 1080.0, 728.0, 462.0, 315.0, 186.0, 130.0, 84.0, 52.0, 37.0, 27.0, 9.0, 17.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.61572265625, -18.9033203125, -18.19091796875, -17.478515625, -16.76611328125, -16.0537109375, -15.34130859375, -14.62890625, -13.91650390625, -13.2041015625, -12.49169921875, -11.779296875, -11.06689453125, -10.3544921875, -9.64208984375, -8.9296875, -8.21728515625, -7.5048828125, -6.79248046875, -6.080078125, -5.36767578125, -4.6552734375, -3.94287109375, -3.23046875, -2.51806640625, -1.8056640625, -1.09326171875, -0.380859375, 0.33154296875, 1.0439453125, 1.75634765625, 2.46875, 3.18115234375, 3.8935546875, 4.60595703125, 5.318359375, 6.03076171875, 6.7431640625, 7.45556640625, 8.16796875, 8.88037109375, 9.5927734375, 10.30517578125, 11.017578125, 11.72998046875, 12.4423828125, 13.15478515625, 13.8671875, 14.57958984375, 15.2919921875, 16.00439453125, 16.716796875, 17.42919921875, 18.1416015625, 18.85400390625, 19.56640625, 20.27880859375, 20.9912109375, 21.70361328125, 22.416015625, 23.12841796875, 23.8408203125, 24.55322265625, 25.265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 10.0, 9.0, 11.0, 17.0, 16.0, 20.0, 16.0, 26.0, 32.0, 31.0, 40.0, 35.0, 47.0, 43.0, 48.0, 42.0, 54.0, 39.0, 47.0, 40.0, 44.0, 38.0, 35.0, 27.0, 30.0, 39.0, 23.0, 27.0, 20.0, 20.0, 15.0, 9.0, 8.0, 6.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2109375, -9.921875, -9.6328125, -9.34375, -9.0546875, -8.765625, -8.4765625, -8.1875, -7.8984375, -7.609375, -7.3203125, -7.03125, -6.7421875, -6.453125, -6.1640625, -5.875, -5.5859375, -5.296875, -5.0078125, -4.71875, -4.4296875, -4.140625, -3.8515625, -3.5625, -3.2734375, -2.984375, -2.6953125, -2.40625, -2.1171875, -1.828125, -1.5390625, -1.25, -0.9609375, -0.671875, -0.3828125, -0.09375, 0.1953125, 0.484375, 0.7734375, 1.0625, 1.3515625, 1.640625, 1.9296875, 2.21875, 2.5078125, 2.796875, 3.0859375, 3.375, 3.6640625, 3.953125, 4.2421875, 4.53125, 4.8203125, 5.109375, 5.3984375, 5.6875, 5.9765625, 6.265625, 6.5546875, 6.84375, 7.1328125, 7.421875, 7.7109375, 8.0, 8.2890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 13.0, 14.0, 29.0, 35.0, 60.0, 70.0, 107.0, 163.0, 248.0, 412.0, 578.0, 906.0, 1490.0, 2349.0, 4014.0, 6847.0, 12378.0, 23621.0, 48487.0, 119372.0, 373552.0, 280127.0, 89462.0, 39282.0, 19243.0, 10551.0, 5901.0, 3460.0, 2119.0, 1248.0, 794.0, 546.0, 361.0, 231.0, 136.0, 103.0, 75.0, 41.0, 35.0, 28.0, 15.0, 7.0, 10.0, 7.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.32421875, -4.196502685546875, -4.06878662109375, -3.941070556640625, -3.8133544921875, -3.685638427734375, -3.55792236328125, -3.430206298828125, -3.302490234375, -3.174774169921875, -3.04705810546875, -2.919342041015625, -2.7916259765625, -2.663909912109375, -2.53619384765625, -2.408477783203125, -2.28076171875, -2.153045654296875, -2.02532958984375, -1.897613525390625, -1.7698974609375, -1.642181396484375, -1.51446533203125, -1.386749267578125, -1.259033203125, -1.131317138671875, -1.00360107421875, -0.875885009765625, -0.7481689453125, -0.620452880859375, -0.49273681640625, -0.365020751953125, -0.2373046875, -0.109588623046875, 0.01812744140625, 0.145843505859375, 0.2735595703125, 0.401275634765625, 0.52899169921875, 0.656707763671875, 0.784423828125, 0.912139892578125, 1.03985595703125, 1.167572021484375, 1.2952880859375, 1.423004150390625, 1.55072021484375, 1.678436279296875, 1.80615234375, 1.933868408203125, 2.06158447265625, 2.189300537109375, 2.3170166015625, 2.444732666015625, 2.57244873046875, 2.700164794921875, 2.827880859375, 2.955596923828125, 3.08331298828125, 3.211029052734375, 3.3387451171875, 3.466461181640625, 3.59417724609375, 3.721893310546875, 3.849609375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 3.0, 4.0, 10.0, 18.0, 18.0, 26.0, 26.0, 40.0, 58.0, 69.0, 107.0, 104.0, 98.0, 105.0, 98.0, 59.0, 44.0, 26.0, 30.0, 13.0, 15.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014328956604003906, -0.00013677403330802917, -0.0001302585005760193, -0.0001237429678440094, -0.00011722743511199951, -0.00011071190237998962, -0.00010419636964797974, -9.768083691596985e-05, -9.116530418395996e-05, -8.464977145195007e-05, -7.813423871994019e-05, -7.16187059879303e-05, -6.510317325592041e-05, -5.858764052391052e-05, -5.2072107791900635e-05, -4.555657505989075e-05, -3.904104232788086e-05, -3.252550959587097e-05, -2.6009976863861084e-05, -1.9494444131851196e-05, -1.2978911399841309e-05, -6.463378667831421e-06, 5.21540641784668e-08, 6.5676867961883545e-06, 1.3083219528198242e-05, 1.959875226020813e-05, 2.6114284992218018e-05, 3.2629817724227905e-05, 3.914535045623779e-05, 4.566088318824768e-05, 5.217641592025757e-05, 5.8691948652267456e-05, 6.520748138427734e-05, 7.172301411628723e-05, 7.823854684829712e-05, 8.475407958030701e-05, 9.12696123123169e-05, 9.778514504432678e-05, 0.00010430067777633667, 0.00011081621050834656, 0.00011733174324035645, 0.00012384727597236633, 0.00013036280870437622, 0.0001368783414363861, 0.000143393874168396, 0.00014990940690040588, 0.00015642493963241577, 0.00016294047236442566, 0.00016945600509643555, 0.00017597153782844543, 0.00018248707056045532, 0.0001890026032924652, 0.0001955181360244751, 0.00020203366875648499, 0.00020854920148849487, 0.00021506473422050476, 0.00022158026695251465, 0.00022809579968452454, 0.00023461133241653442, 0.0002411268651485443, 0.0002476423978805542, 0.0002541579306125641, 0.000260673463344574, 0.00026718899607658386, 0.00027370452880859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 13.0, 21.0, 26.0, 22.0, 58.0, 63.0, 90.0, 123.0, 175.0, 246.0, 348.0, 525.0, 732.0, 1113.0, 1665.0, 2555.0, 4082.0, 6296.0, 10404.0, 17423.0, 30570.0, 57599.0, 126328.0, 312481.0, 258278.0, 101249.0, 48883.0, 26544.0, 15125.0, 9141.0, 5794.0, 3440.0, 2334.0, 1476.0, 1097.0, 675.0, 474.0, 323.0, 196.0, 166.0, 127.0, 73.0, 54.0, 37.0, 29.0, 16.0, 19.0, 18.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.208984375, -3.108306884765625, -3.00762939453125, -2.906951904296875, -2.8062744140625, -2.705596923828125, -2.60491943359375, -2.504241943359375, -2.403564453125, -2.302886962890625, -2.20220947265625, -2.101531982421875, -2.0008544921875, -1.900177001953125, -1.79949951171875, -1.698822021484375, -1.59814453125, -1.497467041015625, -1.39678955078125, -1.296112060546875, -1.1954345703125, -1.094757080078125, -0.99407958984375, -0.893402099609375, -0.792724609375, -0.692047119140625, -0.59136962890625, -0.490692138671875, -0.3900146484375, -0.289337158203125, -0.18865966796875, -0.087982177734375, 0.0126953125, 0.113372802734375, 0.21405029296875, 0.314727783203125, 0.4154052734375, 0.516082763671875, 0.61676025390625, 0.717437744140625, 0.818115234375, 0.918792724609375, 1.01947021484375, 1.120147705078125, 1.2208251953125, 1.321502685546875, 1.42218017578125, 1.522857666015625, 1.62353515625, 1.724212646484375, 1.82489013671875, 1.925567626953125, 2.0262451171875, 2.126922607421875, 2.22760009765625, 2.328277587890625, 2.428955078125, 2.529632568359375, 2.63031005859375, 2.730987548828125, 2.8316650390625, 2.932342529296875, 3.03302001953125, 3.133697509765625, 3.234375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 9.0, 7.0, 14.0, 17.0, 16.0, 22.0, 34.0, 37.0, 32.0, 40.0, 50.0, 64.0, 71.0, 71.0, 64.0, 53.0, 55.0, 56.0, 48.0, 39.0, 29.0, 32.0, 23.0, 24.0, 14.0, 10.0, 14.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.396484375, -1.3511962890625, -1.305908203125, -1.2606201171875, -1.21533203125, -1.1700439453125, -1.124755859375, -1.0794677734375, -1.0341796875, -0.9888916015625, -0.943603515625, -0.8983154296875, -0.85302734375, -0.8077392578125, -0.762451171875, -0.7171630859375, -0.671875, -0.6265869140625, -0.581298828125, -0.5360107421875, -0.49072265625, -0.4454345703125, -0.400146484375, -0.3548583984375, -0.3095703125, -0.2642822265625, -0.218994140625, -0.1737060546875, -0.12841796875, -0.0831298828125, -0.037841796875, 0.0074462890625, 0.052734375, 0.0980224609375, 0.143310546875, 0.1885986328125, 0.23388671875, 0.2791748046875, 0.324462890625, 0.3697509765625, 0.4150390625, 0.4603271484375, 0.505615234375, 0.5509033203125, 0.59619140625, 0.6414794921875, 0.686767578125, 0.7320556640625, 0.77734375, 0.8226318359375, 0.867919921875, 0.9132080078125, 0.95849609375, 1.0037841796875, 1.049072265625, 1.0943603515625, 1.1396484375, 1.1849365234375, 1.230224609375, 1.2755126953125, 1.32080078125, 1.3660888671875, 1.411376953125, 1.4566650390625, 1.501953125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 11.0, 12.0, 19.0, 17.0, 25.0, 37.0, 49.0, 55.0, 85.0, 93.0, 121.0, 101.0, 85.0, 78.0, 51.0, 41.0, 25.0, 10.0, 16.0, 13.0, 9.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.600847244262695, -17.090660095214844, -16.58047103881836, -16.070283889770508, -15.560094833374023, -15.049907684326172, -14.539719581604004, -14.029531478881836, -13.519343376159668, -13.0091552734375, -12.498967170715332, -11.988779067993164, -11.478591918945312, -10.968402862548828, -10.458215713500977, -9.948027610778809, -9.43783950805664, -8.927651405334473, -8.417463302612305, -7.907275676727295, -7.397087574005127, -6.886899471282959, -6.376711845397949, -5.866523742675781, -5.356335639953613, -4.846147537231445, -4.335959434509277, -3.8257718086242676, -3.3155837059020996, -2.8053956031799316, -2.2952077388763428, -1.785019874572754, -1.2748327255249023, -0.7646447420120239, -0.2544567584991455, 0.2557312250137329, 0.7659192085266113, 1.2761073112487793, 1.7862951755523682, 2.296483039855957, 2.806671142578125, 3.316859245300293, 3.827047109603882, 4.337234973907471, 4.847423076629639, 5.357611179351807, 5.867798805236816, 6.377986907958984, 6.888175010681152, 7.39836311340332, 7.908551216125488, 8.418739318847656, 8.928926467895508, 9.439115524291992, 9.949302673339844, 10.459490776062012, 10.96967887878418, 11.479866981506348, 11.990055084228516, 12.500243186950684, 13.010431289672852, 13.520618438720703, 14.030806541442871, 14.540994644165039, 15.051182746887207]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 12.0, 12.0, 20.0, 14.0, 20.0, 21.0, 34.0, 28.0, 35.0, 42.0, 39.0, 38.0, 40.0, 36.0, 45.0, 50.0, 53.0, 38.0, 38.0, 38.0, 46.0, 36.0, 37.0, 28.0, 26.0, 18.0, 30.0, 18.0, 18.0, 12.0, 18.0, 17.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.407158851623535, -11.9179048538208, -11.428651809692383, -10.939397811889648, -10.450143814086914, -9.96088981628418, -9.471635818481445, -8.982382774353027, -8.493128776550293, -8.003874778747559, -7.514621257781982, -7.025367736816406, -6.536113739013672, -6.0468597412109375, -5.557606220245361, -5.068352699279785, -4.579098701477051, -4.089844703674316, -3.6005911827087402, -3.111337423324585, -2.6220836639404297, -2.1328299045562744, -1.6435761451721191, -1.1543223857879639, -0.6650686264038086, -0.17581486701965332, 0.31343889236450195, 0.8026926517486572, 1.2919464111328125, 1.7812001705169678, 2.270453929901123, 2.7597076892852783, 3.24896240234375, 3.7382161617279053, 4.2274699211120605, 4.716723442077637, 5.205977439880371, 5.6952314376831055, 6.184484958648682, 6.673738479614258, 7.162992477416992, 7.652246475219727, 8.141500473022461, 8.630753517150879, 9.120007514953613, 9.609261512756348, 10.098514556884766, 10.5877685546875, 11.077022552490234, 11.566276550292969, 12.055530548095703, 12.544783592224121, 13.034037590026855, 13.52329158782959, 14.012544631958008, 14.501798629760742, 14.991052627563477, 15.480306625366211, 15.969560623168945, 16.45881462097168, 16.94806671142578, 17.437320709228516, 17.92657470703125, 18.415828704833984, 18.90508270263672]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 9.0, 10.0, 27.0, 33.0, 68.0, 118.0, 183.0, 370.0, 565.0, 927.0, 1566.0, 2684.0, 4470.0, 7489.0, 13079.0, 23148.0, 41911.0, 79114.0, 161111.0, 433758.0, 1634786.0, 1220979.0, 297050.0, 122126.0, 63046.0, 34657.0, 19760.0, 11642.0, 7136.0, 4432.0, 2851.0, 1725.0, 1120.0, 697.0, 467.0, 325.0, 254.0, 160.0, 119.0, 94.0, 53.0, 42.0, 37.0, 15.0, 22.0, 18.0, 13.0, 6.0, 4.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2265625, -13.6043701171875, -12.982177734375, -12.3599853515625, -11.73779296875, -11.1156005859375, -10.493408203125, -9.8712158203125, -9.2490234375, -8.6268310546875, -8.004638671875, -7.3824462890625, -6.76025390625, -6.1380615234375, -5.515869140625, -4.8936767578125, -4.271484375, -3.6492919921875, -3.027099609375, -2.4049072265625, -1.78271484375, -1.1605224609375, -0.538330078125, 0.0838623046875, 0.7060546875, 1.3282470703125, 1.950439453125, 2.5726318359375, 3.19482421875, 3.8170166015625, 4.439208984375, 5.0614013671875, 5.68359375, 6.3057861328125, 6.927978515625, 7.5501708984375, 8.17236328125, 8.7945556640625, 9.416748046875, 10.0389404296875, 10.6611328125, 11.2833251953125, 11.905517578125, 12.5277099609375, 13.14990234375, 13.7720947265625, 14.394287109375, 15.0164794921875, 15.638671875, 16.2608642578125, 16.883056640625, 17.5052490234375, 18.12744140625, 18.7496337890625, 19.371826171875, 19.9940185546875, 20.6162109375, 21.2384033203125, 21.860595703125, 22.4827880859375, 23.10498046875, 23.7271728515625, 24.349365234375, 24.9715576171875, 25.59375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 10.0, 5.0, 11.0, 8.0, 16.0, 22.0, 14.0, 23.0, 35.0, 26.0, 39.0, 41.0, 36.0, 40.0, 42.0, 42.0, 45.0, 47.0, 49.0, 46.0, 38.0, 48.0, 41.0, 44.0, 29.0, 29.0, 25.0, 25.0, 25.0, 21.0, 18.0, 11.0, 14.0, 17.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.84375, -10.395263671875, -9.94677734375, -9.498291015625, -9.0498046875, -8.601318359375, -8.15283203125, -7.704345703125, -7.255859375, -6.807373046875, -6.35888671875, -5.910400390625, -5.4619140625, -5.013427734375, -4.56494140625, -4.116455078125, -3.66796875, -3.219482421875, -2.77099609375, -2.322509765625, -1.8740234375, -1.425537109375, -0.97705078125, -0.528564453125, -0.080078125, 0.368408203125, 0.81689453125, 1.265380859375, 1.7138671875, 2.162353515625, 2.61083984375, 3.059326171875, 3.5078125, 3.956298828125, 4.40478515625, 4.853271484375, 5.3017578125, 5.750244140625, 6.19873046875, 6.647216796875, 7.095703125, 7.544189453125, 7.99267578125, 8.441162109375, 8.8896484375, 9.338134765625, 9.78662109375, 10.235107421875, 10.68359375, 11.132080078125, 11.58056640625, 12.029052734375, 12.4775390625, 12.926025390625, 13.37451171875, 13.822998046875, 14.271484375, 14.719970703125, 15.16845703125, 15.616943359375, 16.0654296875, 16.513916015625, 16.96240234375, 17.410888671875, 17.859375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 13.0, 16.0, 18.0, 25.0, 40.0, 57.0, 89.0, 141.0, 216.0, 309.0, 473.0, 713.0, 1034.0, 1558.0, 2495.0, 3910.0, 6203.0, 9880.0, 16345.0, 27410.0, 47217.0, 85001.0, 160192.0, 335735.0, 854715.0, 1514844.0, 583273.0, 251872.0, 125545.0, 67862.0, 38407.0, 22393.0, 13428.0, 8235.0, 5360.0, 3168.0, 2090.0, 1387.0, 941.0, 535.0, 369.0, 263.0, 181.0, 103.0, 79.0, 46.0, 36.0, 17.0, 21.0, 7.0, 2.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0], "bins": [-15.6796875, -15.1944580078125, -14.709228515625, -14.2239990234375, -13.73876953125, -13.2535400390625, -12.768310546875, -12.2830810546875, -11.7978515625, -11.3126220703125, -10.827392578125, -10.3421630859375, -9.85693359375, -9.3717041015625, -8.886474609375, -8.4012451171875, -7.916015625, -7.4307861328125, -6.945556640625, -6.4603271484375, -5.97509765625, -5.4898681640625, -5.004638671875, -4.5194091796875, -4.0341796875, -3.5489501953125, -3.063720703125, -2.5784912109375, -2.09326171875, -1.6080322265625, -1.122802734375, -0.6375732421875, -0.15234375, 0.3328857421875, 0.818115234375, 1.3033447265625, 1.78857421875, 2.2738037109375, 2.759033203125, 3.2442626953125, 3.7294921875, 4.2147216796875, 4.699951171875, 5.1851806640625, 5.67041015625, 6.1556396484375, 6.640869140625, 7.1260986328125, 7.611328125, 8.0965576171875, 8.581787109375, 9.0670166015625, 9.55224609375, 10.0374755859375, 10.522705078125, 11.0079345703125, 11.4931640625, 11.9783935546875, 12.463623046875, 12.9488525390625, 13.43408203125, 13.9193115234375, 14.404541015625, 14.8897705078125, 15.375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 14.0, 6.0, 9.0, 13.0, 24.0, 30.0, 24.0, 60.0, 39.0, 59.0, 77.0, 98.0, 138.0, 138.0, 144.0, 236.0, 232.0, 302.0, 382.0, 423.0, 307.0, 226.0, 199.0, 182.0, 114.0, 118.0, 101.0, 81.0, 62.0, 48.0, 41.0, 26.0, 25.0, 22.0, 15.0, 11.0, 5.0, 12.0, 3.0, 4.0, 6.0, 4.0, 2.0, 4.0], "bins": [-8.6875, -8.46563720703125, -8.2437744140625, -8.02191162109375, -7.800048828125, -7.57818603515625, -7.3563232421875, -7.13446044921875, -6.91259765625, -6.69073486328125, -6.4688720703125, -6.24700927734375, -6.025146484375, -5.80328369140625, -5.5814208984375, -5.35955810546875, -5.1376953125, -4.91583251953125, -4.6939697265625, -4.47210693359375, -4.250244140625, -4.02838134765625, -3.8065185546875, -3.58465576171875, -3.36279296875, -3.14093017578125, -2.9190673828125, -2.69720458984375, -2.475341796875, -2.25347900390625, -2.0316162109375, -1.80975341796875, -1.587890625, -1.36602783203125, -1.1441650390625, -0.92230224609375, -0.700439453125, -0.47857666015625, -0.2567138671875, -0.03485107421875, 0.18701171875, 0.40887451171875, 0.6307373046875, 0.85260009765625, 1.074462890625, 1.29632568359375, 1.5181884765625, 1.74005126953125, 1.9619140625, 2.18377685546875, 2.4056396484375, 2.62750244140625, 2.849365234375, 3.07122802734375, 3.2930908203125, 3.51495361328125, 3.73681640625, 3.95867919921875, 4.1805419921875, 4.40240478515625, 4.624267578125, 4.84613037109375, 5.0679931640625, 5.28985595703125, 5.51171875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 7.0, 14.0, 16.0, 6.0, 14.0, 15.0, 21.0, 32.0, 50.0, 48.0, 69.0, 72.0, 101.0, 97.0, 100.0, 63.0, 56.0, 39.0, 32.0, 34.0, 30.0, 16.0, 13.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.691887855529785, -14.232332229614258, -13.77277660369873, -13.313220977783203, -12.853665351867676, -12.394109725952148, -11.934553146362305, -11.474998474121094, -11.01544189453125, -10.555886268615723, -10.096330642700195, -9.636775016784668, -9.17721939086914, -8.717663764953613, -8.258108139038086, -7.7985520362854, -7.338996887207031, -6.879441261291504, -6.419885635375977, -5.960330009460449, -5.500774383544922, -5.0412187576293945, -4.581662654876709, -4.122107028961182, -3.6625514030456543, -3.202995777130127, -2.7434401512145996, -2.283884286880493, -1.8243286609649658, -1.3647730350494385, -0.905217170715332, -0.4456615447998047, 0.013894081115722656, 0.4734497666358948, 0.9330054521560669, 1.3925611972808838, 1.8521168231964111, 2.3116724491119385, 2.771228313446045, 3.2307839393615723, 3.6903395652770996, 4.149895191192627, 4.609450817108154, 5.06900691986084, 5.528562545776367, 5.9881181716918945, 6.447673797607422, 6.907229423522949, 7.366785049438477, 7.826340675354004, 8.285896301269531, 8.745451927185059, 9.205007553100586, 9.664563179016113, 10.12411880493164, 10.583675384521484, 11.043230056762695, 11.502785682678223, 11.96234130859375, 12.421896934509277, 12.881452560424805, 13.341008186340332, 13.80056381225586, 14.260120391845703, 14.71967601776123]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 12.0, 10.0, 9.0, 19.0, 13.0, 22.0, 22.0, 24.0, 36.0, 35.0, 36.0, 42.0, 36.0, 47.0, 36.0, 56.0, 39.0, 58.0, 51.0, 36.0, 26.0, 37.0, 34.0, 36.0, 31.0, 28.0, 20.0, 36.0, 23.0, 14.0, 14.0, 17.0, 12.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.84069538116455, -13.330482482910156, -12.820268630981445, -12.31005573272705, -11.79984188079834, -11.289628982543945, -10.779415130615234, -10.26920223236084, -9.758989334106445, -9.24877643585205, -8.73856258392334, -8.228349685668945, -7.718135833740234, -7.20792293548584, -6.697709560394287, -6.187496185302734, -5.677282333374023, -5.167068958282471, -4.656855583190918, -4.146642684936523, -3.6364290714263916, -3.126215696334839, -2.6160025596618652, -2.1057891845703125, -1.5955758094787598, -1.085362434387207, -0.5751491785049438, -0.06493592262268066, 0.44527745246887207, 0.9554908275604248, 1.4657039642333984, 1.9759173393249512, 2.4861297607421875, 2.9963431358337402, 3.506556510925293, 4.0167694091796875, 4.526983261108398, 5.037196159362793, 5.547409534454346, 6.057622909545898, 6.567836284637451, 7.078049659729004, 7.588263034820557, 8.09847640991211, 8.608689308166504, 9.118903160095215, 9.62911605834961, 10.13932991027832, 10.649542808532715, 11.15975570678711, 11.66996955871582, 12.180182456970215, 12.690396308898926, 13.20060920715332, 13.710823059082031, 14.221035957336426, 14.73124885559082, 15.241461753845215, 15.751675605773926, 16.26188850402832, 16.77210235595703, 17.282316207885742, 17.79252815246582, 18.30274200439453, 18.812955856323242]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 17.0, 12.0, 22.0, 22.0, 46.0, 67.0, 129.0, 199.0, 323.0, 457.0, 750.0, 1187.0, 2031.0, 3153.0, 5348.0, 9166.0, 16225.0, 29485.0, 55258.0, 112413.0, 328676.0, 265049.0, 102741.0, 51420.0, 27330.0, 15268.0, 8559.0, 5118.0, 3011.0, 1849.0, 1152.0, 706.0, 471.0, 313.0, 169.0, 137.0, 82.0, 53.0, 40.0, 29.0, 13.0, 15.0, 12.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0], "bins": [-5.75, -5.58544921875, -5.4208984375, -5.25634765625, -5.091796875, -4.92724609375, -4.7626953125, -4.59814453125, -4.43359375, -4.26904296875, -4.1044921875, -3.93994140625, -3.775390625, -3.61083984375, -3.4462890625, -3.28173828125, -3.1171875, -2.95263671875, -2.7880859375, -2.62353515625, -2.458984375, -2.29443359375, -2.1298828125, -1.96533203125, -1.80078125, -1.63623046875, -1.4716796875, -1.30712890625, -1.142578125, -0.97802734375, -0.8134765625, -0.64892578125, -0.484375, -0.31982421875, -0.1552734375, 0.00927734375, 0.173828125, 0.33837890625, 0.5029296875, 0.66748046875, 0.83203125, 0.99658203125, 1.1611328125, 1.32568359375, 1.490234375, 1.65478515625, 1.8193359375, 1.98388671875, 2.1484375, 2.31298828125, 2.4775390625, 2.64208984375, 2.806640625, 2.97119140625, 3.1357421875, 3.30029296875, 3.46484375, 3.62939453125, 3.7939453125, 3.95849609375, 4.123046875, 4.28759765625, 4.4521484375, 4.61669921875, 4.78125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 8.0, 4.0, 6.0, 6.0, 11.0, 10.0, 15.0, 12.0, 27.0, 20.0, 20.0, 31.0, 25.0, 40.0, 39.0, 35.0, 31.0, 43.0, 47.0, 52.0, 60.0, 43.0, 43.0, 39.0, 30.0, 42.0, 29.0, 27.0, 27.0, 37.0, 23.0, 28.0, 20.0, 16.0, 18.0, 9.0, 9.0, 12.0, 4.0, 5.0, 0.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.0169677734375, -11.510498046875, -11.0040283203125, -10.49755859375, -9.9910888671875, -9.484619140625, -8.9781494140625, -8.4716796875, -7.9652099609375, -7.458740234375, -6.9522705078125, -6.44580078125, -5.9393310546875, -5.432861328125, -4.9263916015625, -4.419921875, -3.9134521484375, -3.406982421875, -2.9005126953125, -2.39404296875, -1.8875732421875, -1.381103515625, -0.8746337890625, -0.3681640625, 0.1383056640625, 0.644775390625, 1.1512451171875, 1.65771484375, 2.1641845703125, 2.670654296875, 3.1771240234375, 3.68359375, 4.1900634765625, 4.696533203125, 5.2030029296875, 5.70947265625, 6.2159423828125, 6.722412109375, 7.2288818359375, 7.7353515625, 8.2418212890625, 8.748291015625, 9.2547607421875, 9.76123046875, 10.2677001953125, 10.774169921875, 11.2806396484375, 11.787109375, 12.2935791015625, 12.800048828125, 13.3065185546875, 13.81298828125, 14.3194580078125, 14.825927734375, 15.3323974609375, 15.8388671875, 16.3453369140625, 16.851806640625, 17.3582763671875, 17.86474609375, 18.3712158203125, 18.877685546875, 19.3841552734375, 19.890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 14.0, 17.0, 22.0, 28.0, 43.0, 61.0, 92.0, 111.0, 139.0, 235.0, 305.0, 418.0, 542.0, 746.0, 1011.0, 1450.0, 2088.0, 2822.0, 4053.0, 5772.0, 8360.0, 11936.0, 17624.0, 25926.0, 38834.0, 61126.0, 106109.0, 230822.0, 235590.0, 106887.0, 61881.0, 39088.0, 26179.0, 17681.0, 11920.0, 8569.0, 5717.0, 4125.0, 2895.0, 2028.0, 1456.0, 1055.0, 777.0, 534.0, 433.0, 288.0, 215.0, 141.0, 136.0, 96.0, 47.0, 51.0, 34.0, 10.0, 10.0, 15.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.62109375, -3.507965087890625, -3.39483642578125, -3.281707763671875, -3.1685791015625, -3.055450439453125, -2.94232177734375, -2.829193115234375, -2.716064453125, -2.602935791015625, -2.48980712890625, -2.376678466796875, -2.2635498046875, -2.150421142578125, -2.03729248046875, -1.924163818359375, -1.81103515625, -1.697906494140625, -1.58477783203125, -1.471649169921875, -1.3585205078125, -1.245391845703125, -1.13226318359375, -1.019134521484375, -0.906005859375, -0.792877197265625, -0.67974853515625, -0.566619873046875, -0.4534912109375, -0.340362548828125, -0.22723388671875, -0.114105224609375, -0.0009765625, 0.112152099609375, 0.22528076171875, 0.338409423828125, 0.4515380859375, 0.564666748046875, 0.67779541015625, 0.790924072265625, 0.904052734375, 1.017181396484375, 1.13031005859375, 1.243438720703125, 1.3565673828125, 1.469696044921875, 1.58282470703125, 1.695953369140625, 1.80908203125, 1.922210693359375, 2.03533935546875, 2.148468017578125, 2.2615966796875, 2.374725341796875, 2.48785400390625, 2.600982666015625, 2.714111328125, 2.827239990234375, 2.94036865234375, 3.053497314453125, 3.1666259765625, 3.279754638671875, 3.39288330078125, 3.506011962890625, 3.619140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 5.0, 3.0, 6.0, 4.0, 8.0, 10.0, 11.0, 4.0, 6.0, 11.0, 15.0, 15.0, 19.0, 28.0, 13.0, 17.0, 25.0, 20.0, 31.0, 29.0, 33.0, 29.0, 36.0, 35.0, 36.0, 32.0, 26.0, 38.0, 31.0, 48.0, 38.0, 34.0, 34.0, 26.0, 22.0, 23.0, 29.0, 22.0, 21.0, 19.0, 17.0, 14.0, 11.0, 15.0, 14.0, 8.0, 6.0, 4.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0], "bins": [-9.046875, -8.7833251953125, -8.519775390625, -8.2562255859375, -7.99267578125, -7.7291259765625, -7.465576171875, -7.2020263671875, -6.9384765625, -6.6749267578125, -6.411376953125, -6.1478271484375, -5.88427734375, -5.6207275390625, -5.357177734375, -5.0936279296875, -4.830078125, -4.5665283203125, -4.302978515625, -4.0394287109375, -3.77587890625, -3.5123291015625, -3.248779296875, -2.9852294921875, -2.7216796875, -2.4581298828125, -2.194580078125, -1.9310302734375, -1.66748046875, -1.4039306640625, -1.140380859375, -0.8768310546875, -0.61328125, -0.3497314453125, -0.086181640625, 0.1773681640625, 0.44091796875, 0.7044677734375, 0.968017578125, 1.2315673828125, 1.4951171875, 1.7586669921875, 2.022216796875, 2.2857666015625, 2.54931640625, 2.8128662109375, 3.076416015625, 3.3399658203125, 3.603515625, 3.8670654296875, 4.130615234375, 4.3941650390625, 4.65771484375, 4.9212646484375, 5.184814453125, 5.4483642578125, 5.7119140625, 5.9754638671875, 6.239013671875, 6.5025634765625, 6.76611328125, 7.0296630859375, 7.293212890625, 7.5567626953125, 7.8203125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 0.0, 9.0, 9.0, 13.0, 11.0, 26.0, 27.0, 29.0, 38.0, 67.0, 96.0, 135.0, 171.0, 225.0, 335.0, 464.0, 689.0, 1030.0, 1339.0, 2033.0, 2870.0, 4259.0, 6690.0, 10581.0, 17890.0, 33080.0, 67458.0, 166123.0, 378138.0, 190722.0, 75684.0, 36045.0, 19313.0, 11221.0, 6974.0, 4546.0, 3040.0, 2191.0, 1457.0, 999.0, 712.0, 518.0, 359.0, 265.0, 189.0, 142.0, 89.0, 71.0, 51.0, 40.0, 28.0, 23.0, 13.0, 13.0, 4.0, 10.0, 5.0, 4.0, 1.0, 3.0], "bins": [-0.00568389892578125, -0.005509376525878906, -0.0053348541259765625, -0.005160331726074219, -0.004985809326171875, -0.004811286926269531, -0.0046367645263671875, -0.004462242126464844, -0.0042877197265625, -0.004113197326660156, -0.0039386749267578125, -0.0037641525268554688, -0.003589630126953125, -0.0034151077270507812, -0.0032405853271484375, -0.0030660629272460938, -0.00289154052734375, -0.0027170181274414062, -0.0025424957275390625, -0.0023679733276367188, -0.002193450927734375, -0.0020189285278320312, -0.0018444061279296875, -0.0016698837280273438, -0.001495361328125, -0.0013208389282226562, -0.0011463165283203125, -0.0009717941284179688, -0.000797271728515625, -0.0006227493286132812, -0.0004482269287109375, -0.00027370452880859375, -9.918212890625e-05, 7.534027099609375e-05, 0.0002498626708984375, 0.00042438507080078125, 0.000598907470703125, 0.0007734298706054688, 0.0009479522705078125, 0.0011224746704101562, 0.0012969970703125, 0.0014715194702148438, 0.0016460418701171875, 0.0018205642700195312, 0.001995086669921875, 0.0021696090698242188, 0.0023441314697265625, 0.0025186538696289062, 0.00269317626953125, 0.0028676986694335938, 0.0030422210693359375, 0.0032167434692382812, 0.003391265869140625, 0.0035657882690429688, 0.0037403106689453125, 0.003914833068847656, 0.00408935546875, 0.004263877868652344, 0.0044384002685546875, 0.004612922668457031, 0.004787445068359375, 0.004961967468261719, 0.0051364898681640625, 0.005311012268066406, 0.00548553466796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 7.0, 9.0, 10.0, 16.0, 14.0, 22.0, 18.0, 17.0, 23.0, 53.0, 54.0, 47.0, 53.0, 63.0, 49.0, 58.0, 98.0, 55.0, 48.0, 49.0, 35.0, 43.0, 46.0, 16.0, 21.0, 16.0, 14.0, 7.0, 11.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.9245933294296265e-06, -3.7960708141326904e-06, -3.6675482988357544e-06, -3.5390257835388184e-06, -3.4105032682418823e-06, -3.2819807529449463e-06, -3.1534582376480103e-06, -3.0249357223510742e-06, -2.896413207054138e-06, -2.767890691757202e-06, -2.639368176460266e-06, -2.51084566116333e-06, -2.382323145866394e-06, -2.253800630569458e-06, -2.125278115272522e-06, -1.996755599975586e-06, -1.86823308467865e-06, -1.7397105693817139e-06, -1.6111880540847778e-06, -1.4826655387878418e-06, -1.3541430234909058e-06, -1.2256205081939697e-06, -1.0970979928970337e-06, -9.685754776000977e-07, -8.400529623031616e-07, -7.115304470062256e-07, -5.830079317092896e-07, -4.544854164123535e-07, -3.259629011154175e-07, -1.9744038581848145e-07, -6.891787052154541e-08, 5.960464477539063e-08, 1.8812716007232666e-07, 3.166496753692627e-07, 4.4517219066619873e-07, 5.736947059631348e-07, 7.022172212600708e-07, 8.307397365570068e-07, 9.592622518539429e-07, 1.087784767150879e-06, 1.216307282447815e-06, 1.344829797744751e-06, 1.473352313041687e-06, 1.601874828338623e-06, 1.730397343635559e-06, 1.8589198589324951e-06, 1.987442374229431e-06, 2.115964889526367e-06, 2.2444874048233032e-06, 2.3730099201202393e-06, 2.5015324354171753e-06, 2.6300549507141113e-06, 2.7585774660110474e-06, 2.8870999813079834e-06, 3.0156224966049194e-06, 3.1441450119018555e-06, 3.2726675271987915e-06, 3.4011900424957275e-06, 3.5297125577926636e-06, 3.6582350730895996e-06, 3.7867575883865356e-06, 3.915280103683472e-06, 4.043802618980408e-06, 4.172325134277344e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 3.0, 14.0, 11.0, 14.0, 27.0, 22.0, 48.0, 60.0, 86.0, 134.0, 150.0, 224.0, 277.0, 383.0, 492.0, 687.0, 922.0, 1257.0, 1720.0, 2421.0, 3412.0, 5160.0, 7518.0, 11795.0, 19543.0, 34319.0, 67917.0, 160989.0, 376450.0, 181619.0, 74214.0, 37012.0, 20904.0, 12573.0, 8172.0, 5292.0, 3596.0, 2531.0, 1757.0, 1281.0, 931.0, 691.0, 497.0, 361.0, 302.0, 192.0, 156.0, 123.0, 87.0, 80.0, 49.0, 20.0, 25.0, 19.0, 13.0, 8.0, 5.0, 4.0, 1.0, 2.0], "bins": [-0.005443572998046875, -0.005276381969451904, -0.005109190940856934, -0.004941999912261963, -0.004774808883666992, -0.0046076178550720215, -0.004440426826477051, -0.00427323579788208, -0.004106044769287109, -0.003938853740692139, -0.003771662712097168, -0.0036044716835021973, -0.0034372806549072266, -0.003270089626312256, -0.003102898597717285, -0.0029357075691223145, -0.0027685165405273438, -0.002601325511932373, -0.0024341344833374023, -0.0022669434547424316, -0.002099752426147461, -0.0019325613975524902, -0.0017653703689575195, -0.0015981793403625488, -0.0014309883117675781, -0.0012637972831726074, -0.0010966062545776367, -0.000929415225982666, -0.0007622241973876953, -0.0005950331687927246, -0.0004278421401977539, -0.0002606511116027832, -9.34600830078125e-05, 7.37309455871582e-05, 0.0002409219741821289, 0.0004081130027770996, 0.0005753040313720703, 0.000742495059967041, 0.0009096860885620117, 0.0010768771171569824, 0.0012440681457519531, 0.0014112591743469238, 0.0015784502029418945, 0.0017456412315368652, 0.001912832260131836, 0.0020800232887268066, 0.0022472143173217773, 0.002414405345916748, 0.0025815963745117188, 0.0027487874031066895, 0.00291597843170166, 0.003083169460296631, 0.0032503604888916016, 0.0034175515174865723, 0.003584742546081543, 0.0037519335746765137, 0.003919124603271484, 0.004086315631866455, 0.004253506660461426, 0.0044206976890563965, 0.004587888717651367, 0.004755079746246338, 0.004922270774841309, 0.005089461803436279, 0.00525665283203125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 8.0, 5.0, 6.0, 7.0, 4.0, 9.0, 14.0, 11.0, 18.0, 11.0, 26.0, 29.0, 21.0, 38.0, 40.0, 58.0, 98.0, 121.0, 88.0, 80.0, 68.0, 46.0, 36.0, 33.0, 17.0, 22.0, 16.0, 19.0, 10.0, 4.0, 4.0, 7.0, 3.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.00295257568359375, -0.00286787748336792, -0.00278317928314209, -0.0026984810829162598, -0.0026137828826904297, -0.0025290846824645996, -0.0024443864822387695, -0.0023596882820129395, -0.0022749900817871094, -0.0021902918815612793, -0.0021055936813354492, -0.002020895481109619, -0.001936197280883789, -0.001851499080657959, -0.001766800880432129, -0.0016821026802062988, -0.0015974044799804688, -0.0015127062797546387, -0.0014280080795288086, -0.0013433098793029785, -0.0012586116790771484, -0.0011739134788513184, -0.0010892152786254883, -0.0010045170783996582, -0.0009198188781738281, -0.000835120677947998, -0.000750422477722168, -0.0006657242774963379, -0.0005810260772705078, -0.0004963278770446777, -0.00041162967681884766, -0.0003269314765930176, -0.0002422332763671875, -0.00015753507614135742, -7.283687591552734e-05, 1.1861324310302734e-05, 9.655952453613281e-05, 0.0001812577247619629, 0.00026595592498779297, 0.00035065412521362305, 0.0004353523254394531, 0.0005200505256652832, 0.0006047487258911133, 0.0006894469261169434, 0.0007741451263427734, 0.0008588433265686035, 0.0009435415267944336, 0.0010282397270202637, 0.0011129379272460938, 0.0011976361274719238, 0.001282334327697754, 0.001367032527923584, 0.001451730728149414, 0.0015364289283752441, 0.0016211271286010742, 0.0017058253288269043, 0.0017905235290527344, 0.0018752217292785645, 0.0019599199295043945, 0.0020446181297302246, 0.0021293163299560547, 0.0022140145301818848, 0.002298712730407715, 0.002383410930633545, 0.002468109130859375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 8.0, 15.0, 7.0, 11.0, 20.0, 12.0, 26.0, 28.0, 51.0, 43.0, 65.0, 69.0, 112.0, 90.0, 94.0, 71.0, 55.0, 33.0, 40.0, 33.0, 27.0, 11.0, 17.0, 11.0, 7.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.018342971801758, -13.56515884399414, -13.111974716186523, -12.658790588378906, -12.205607414245605, -11.752423286437988, -11.299239158630371, -10.846055030822754, -10.392871856689453, -9.939687728881836, -9.486503601074219, -9.033319473266602, -8.5801362991333, -8.126952171325684, -7.673768043518066, -7.220583915710449, -6.767399787902832, -6.314215660095215, -5.861032009124756, -5.407847881317139, -4.95466423034668, -4.5014801025390625, -4.048295974731445, -3.5951120853424072, -3.141928195953369, -2.688744306564331, -2.235560417175293, -1.7823762893676758, -1.3291923999786377, -0.8760085105895996, -0.4228243827819824, 0.030359506607055664, 0.48354434967041016, 0.936728298664093, 1.3899122476577759, 1.8430962562561035, 2.2962801456451416, 2.7494640350341797, 3.202648162841797, 3.655832052230835, 4.109015941619873, 4.56220006942749, 5.015383720397949, 5.468567848205566, 5.921751976013184, 6.374935626983643, 6.82811975479126, 7.281303405761719, 7.734487533569336, 8.187671661376953, 8.64085578918457, 9.094039916992188, 9.547223091125488, 10.000407218933105, 10.453591346740723, 10.90677547454834, 11.35995864868164, 11.813142776489258, 12.266326904296875, 12.719511032104492, 13.172694206237793, 13.62587833404541, 14.079062461853027, 14.532246589660645, 14.985430717468262]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 11.0, 12.0, 8.0, 19.0, 12.0, 23.0, 22.0, 24.0, 36.0, 35.0, 36.0, 42.0, 36.0, 47.0, 36.0, 55.0, 41.0, 56.0, 52.0, 36.0, 25.0, 37.0, 35.0, 37.0, 30.0, 27.0, 22.0, 35.0, 23.0, 14.0, 13.0, 18.0, 11.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.781859397888184, -13.271169662475586, -12.760478973388672, -12.249789237976074, -11.739099502563477, -11.228409767150879, -10.717720031738281, -10.207029342651367, -9.69633960723877, -9.185649871826172, -8.674959182739258, -8.16426944732666, -7.6535797119140625, -7.142889976501465, -6.632199764251709, -6.121509552001953, -5.6108198165893555, -5.100130081176758, -4.589439868927002, -4.078749656677246, -3.5680599212646484, -3.0573699474334717, -2.546679973602295, -2.035989999771118, -1.5253000259399414, -1.0146100521087646, -0.5039200782775879, 0.006769895553588867, 0.5174598693847656, 1.0281498432159424, 1.5388398170471191, 2.049529790878296, 2.5602188110351562, 3.070908784866333, 3.5815987586975098, 4.092288970947266, 4.602978706359863, 5.113668441772461, 5.624358654022217, 6.135048866271973, 6.64573860168457, 7.156428337097168, 7.667118549346924, 8.17780876159668, 8.688498497009277, 9.199188232421875, 9.709878921508789, 10.220568656921387, 10.731258392333984, 11.241948127746582, 11.75263786315918, 12.263328552246094, 12.774018287658691, 13.284708023071289, 13.795398712158203, 14.3060884475708, 14.816778182983398, 15.327467918395996, 15.838157653808594, 16.348848342895508, 16.859539031982422, 17.370227813720703, 17.880918502807617, 18.3916072845459, 18.902297973632812]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 5.0, 12.0, 11.0, 28.0, 26.0, 59.0, 52.0, 80.0, 136.0, 201.0, 375.0, 515.0, 837.0, 1312.0, 2242.0, 3470.0, 5522.0, 8891.0, 14298.0, 23479.0, 39399.0, 69240.0, 132203.0, 267355.0, 225846.0, 107655.0, 58047.0, 33788.0, 20366.0, 12428.0, 7668.0, 4759.0, 3077.0, 1899.0, 1202.0, 751.0, 473.0, 287.0, 186.0, 112.0, 78.0, 58.0, 38.0, 22.0, 18.0, 9.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-26.1875, -25.390380859375, -24.59326171875, -23.796142578125, -22.9990234375, -22.201904296875, -21.40478515625, -20.607666015625, -19.810546875, -19.013427734375, -18.21630859375, -17.419189453125, -16.6220703125, -15.824951171875, -15.02783203125, -14.230712890625, -13.43359375, -12.636474609375, -11.83935546875, -11.042236328125, -10.2451171875, -9.447998046875, -8.65087890625, -7.853759765625, -7.056640625, -6.259521484375, -5.46240234375, -4.665283203125, -3.8681640625, -3.071044921875, -2.27392578125, -1.476806640625, -0.6796875, 0.117431640625, 0.91455078125, 1.711669921875, 2.5087890625, 3.305908203125, 4.10302734375, 4.900146484375, 5.697265625, 6.494384765625, 7.29150390625, 8.088623046875, 8.8857421875, 9.682861328125, 10.47998046875, 11.277099609375, 12.07421875, 12.871337890625, 13.66845703125, 14.465576171875, 15.2626953125, 16.059814453125, 16.85693359375, 17.654052734375, 18.451171875, 19.248291015625, 20.04541015625, 20.842529296875, 21.6396484375, 22.436767578125, 23.23388671875, 24.031005859375, 24.828125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 8.0, 13.0, 15.0, 12.0, 19.0, 19.0, 24.0, 23.0, 29.0, 34.0, 45.0, 38.0, 39.0, 35.0, 45.0, 51.0, 53.0, 49.0, 42.0, 37.0, 32.0, 34.0, 35.0, 34.0, 32.0, 30.0, 26.0, 31.0, 20.0, 19.0, 12.0, 14.0, 14.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.984375, -11.505126953125, -11.02587890625, -10.546630859375, -10.0673828125, -9.588134765625, -9.10888671875, -8.629638671875, -8.150390625, -7.671142578125, -7.19189453125, -6.712646484375, -6.2333984375, -5.754150390625, -5.27490234375, -4.795654296875, -4.31640625, -3.837158203125, -3.35791015625, -2.878662109375, -2.3994140625, -1.920166015625, -1.44091796875, -0.961669921875, -0.482421875, -0.003173828125, 0.47607421875, 0.955322265625, 1.4345703125, 1.913818359375, 2.39306640625, 2.872314453125, 3.3515625, 3.830810546875, 4.31005859375, 4.789306640625, 5.2685546875, 5.747802734375, 6.22705078125, 6.706298828125, 7.185546875, 7.664794921875, 8.14404296875, 8.623291015625, 9.1025390625, 9.581787109375, 10.06103515625, 10.540283203125, 11.01953125, 11.498779296875, 11.97802734375, 12.457275390625, 12.9365234375, 13.415771484375, 13.89501953125, 14.374267578125, 14.853515625, 15.332763671875, 15.81201171875, 16.291259765625, 16.7705078125, 17.249755859375, 17.72900390625, 18.208251953125, 18.6875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 10.0, 10.0, 12.0, 26.0, 39.0, 58.0, 80.0, 113.0, 163.0, 249.0, 383.0, 562.0, 845.0, 1261.0, 1938.0, 2900.0, 4499.0, 6742.0, 10919.0, 16897.0, 26808.0, 43523.0, 75759.0, 144084.0, 248219.0, 203013.0, 105554.0, 58547.0, 34991.0, 21623.0, 13646.0, 8840.0, 5489.0, 3592.0, 2386.0, 1568.0, 1079.0, 692.0, 457.0, 325.0, 204.0, 145.0, 89.0, 73.0, 44.0, 40.0, 22.0, 12.0, 9.0, 10.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.640625, -21.927978515625, -21.21533203125, -20.502685546875, -19.7900390625, -19.077392578125, -18.36474609375, -17.652099609375, -16.939453125, -16.226806640625, -15.51416015625, -14.801513671875, -14.0888671875, -13.376220703125, -12.66357421875, -11.950927734375, -11.23828125, -10.525634765625, -9.81298828125, -9.100341796875, -8.3876953125, -7.675048828125, -6.96240234375, -6.249755859375, -5.537109375, -4.824462890625, -4.11181640625, -3.399169921875, -2.6865234375, -1.973876953125, -1.26123046875, -0.548583984375, 0.1640625, 0.876708984375, 1.58935546875, 2.302001953125, 3.0146484375, 3.727294921875, 4.43994140625, 5.152587890625, 5.865234375, 6.577880859375, 7.29052734375, 8.003173828125, 8.7158203125, 9.428466796875, 10.14111328125, 10.853759765625, 11.56640625, 12.279052734375, 12.99169921875, 13.704345703125, 14.4169921875, 15.129638671875, 15.84228515625, 16.554931640625, 17.267578125, 17.980224609375, 18.69287109375, 19.405517578125, 20.1181640625, 20.830810546875, 21.54345703125, 22.256103515625, 22.96875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 7.0, 11.0, 15.0, 11.0, 19.0, 17.0, 13.0, 20.0, 28.0, 19.0, 27.0, 20.0, 34.0, 32.0, 38.0, 40.0, 31.0, 38.0, 31.0, 45.0, 39.0, 41.0, 38.0, 43.0, 32.0, 36.0, 31.0, 34.0, 20.0, 31.0, 30.0, 23.0, 14.0, 19.0, 13.0, 13.0, 7.0, 9.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8211669921875, -8.540771484375, -8.2603759765625, -7.97998046875, -7.6995849609375, -7.419189453125, -7.1387939453125, -6.8583984375, -6.5780029296875, -6.297607421875, -6.0172119140625, -5.73681640625, -5.4564208984375, -5.176025390625, -4.8956298828125, -4.615234375, -4.3348388671875, -4.054443359375, -3.7740478515625, -3.49365234375, -3.2132568359375, -2.932861328125, -2.6524658203125, -2.3720703125, -2.0916748046875, -1.811279296875, -1.5308837890625, -1.25048828125, -0.9700927734375, -0.689697265625, -0.4093017578125, -0.12890625, 0.1514892578125, 0.431884765625, 0.7122802734375, 0.99267578125, 1.2730712890625, 1.553466796875, 1.8338623046875, 2.1142578125, 2.3946533203125, 2.675048828125, 2.9554443359375, 3.23583984375, 3.5162353515625, 3.796630859375, 4.0770263671875, 4.357421875, 4.6378173828125, 4.918212890625, 5.1986083984375, 5.47900390625, 5.7593994140625, 6.039794921875, 6.3201904296875, 6.6005859375, 6.8809814453125, 7.161376953125, 7.4417724609375, 7.72216796875, 8.0025634765625, 8.282958984375, 8.5633544921875, 8.84375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 13.0, 21.0, 26.0, 45.0, 44.0, 66.0, 91.0, 119.0, 197.0, 249.0, 319.0, 495.0, 710.0, 1013.0, 1359.0, 1939.0, 2973.0, 4358.0, 6606.0, 10081.0, 16357.0, 28908.0, 57610.0, 151603.0, 391392.0, 211325.0, 72546.0, 34355.0, 19320.0, 11524.0, 7389.0, 4805.0, 3195.0, 2262.0, 1534.0, 1067.0, 753.0, 515.0, 371.0, 268.0, 212.0, 160.0, 109.0, 71.0, 58.0, 38.0, 25.0, 17.0, 12.0, 9.0, 8.0, 1.0, 2.0, 5.0, 0.0, 2.0], "bins": [-3.294921875, -3.1939697265625, -3.093017578125, -2.9920654296875, -2.89111328125, -2.7901611328125, -2.689208984375, -2.5882568359375, -2.4873046875, -2.3863525390625, -2.285400390625, -2.1844482421875, -2.08349609375, -1.9825439453125, -1.881591796875, -1.7806396484375, -1.6796875, -1.5787353515625, -1.477783203125, -1.3768310546875, -1.27587890625, -1.1749267578125, -1.073974609375, -0.9730224609375, -0.8720703125, -0.7711181640625, -0.670166015625, -0.5692138671875, -0.46826171875, -0.3673095703125, -0.266357421875, -0.1654052734375, -0.064453125, 0.0364990234375, 0.137451171875, 0.2384033203125, 0.33935546875, 0.4403076171875, 0.541259765625, 0.6422119140625, 0.7431640625, 0.8441162109375, 0.945068359375, 1.0460205078125, 1.14697265625, 1.2479248046875, 1.348876953125, 1.4498291015625, 1.55078125, 1.6517333984375, 1.752685546875, 1.8536376953125, 1.95458984375, 2.0555419921875, 2.156494140625, 2.2574462890625, 2.3583984375, 2.4593505859375, 2.560302734375, 2.6612548828125, 2.76220703125, 2.8631591796875, 2.964111328125, 3.0650634765625, 3.166015625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 8.0, 12.0, 12.0, 15.0, 20.0, 32.0, 36.0, 45.0, 60.0, 90.0, 98.0, 93.0, 89.0, 76.0, 73.0, 54.0, 43.0, 34.0, 19.0, 21.0, 13.0, 8.0, 8.0, 7.0, 10.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00018203258514404297, -0.00017696060240268707, -0.00017188861966133118, -0.00016681663691997528, -0.00016174465417861938, -0.0001566726714372635, -0.0001516006886959076, -0.0001465287059545517, -0.0001414567232131958, -0.0001363847404718399, -0.000131312757730484, -0.0001262407749891281, -0.00012116879224777222, -0.00011609680950641632, -0.00011102482676506042, -0.00010595284402370453, -0.00010088086128234863, -9.580887854099274e-05, -9.073689579963684e-05, -8.566491305828094e-05, -8.059293031692505e-05, -7.552094757556915e-05, -7.044896483421326e-05, -6.537698209285736e-05, -6.0304999351501465e-05, -5.523301661014557e-05, -5.016103386878967e-05, -4.508905112743378e-05, -4.001706838607788e-05, -3.4945085644721985e-05, -2.987310290336609e-05, -2.4801120162010193e-05, -1.9729137420654297e-05, -1.4657154679298401e-05, -9.585171937942505e-06, -4.513189196586609e-06, 5.587935447692871e-07, 5.630776286125183e-06, 1.0702759027481079e-05, 1.5774741768836975e-05, 2.084672451019287e-05, 2.5918707251548767e-05, 3.099068999290466e-05, 3.606267273426056e-05, 4.1134655475616455e-05, 4.620663821697235e-05, 5.127862095832825e-05, 5.635060369968414e-05, 6.142258644104004e-05, 6.649456918239594e-05, 7.156655192375183e-05, 7.663853466510773e-05, 8.171051740646362e-05, 8.678250014781952e-05, 9.185448288917542e-05, 9.692646563053131e-05, 0.00010199844837188721, 0.0001070704311132431, 0.000112142413854599, 0.0001172143965959549, 0.0001222863793373108, 0.0001273583620786667, 0.00013243034482002258, 0.00013750232756137848, 0.00014257431030273438]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 11.0, 8.0, 19.0, 26.0, 29.0, 47.0, 86.0, 137.0, 184.0, 209.0, 282.0, 449.0, 707.0, 1007.0, 1491.0, 2169.0, 3248.0, 5034.0, 8233.0, 13487.0, 23629.0, 46430.0, 110042.0, 321865.0, 303729.0, 103020.0, 44461.0, 22871.0, 13051.0, 7735.0, 4999.0, 3236.0, 2115.0, 1356.0, 985.0, 644.0, 432.0, 341.0, 226.0, 150.0, 115.0, 72.0, 54.0, 37.0, 30.0, 18.0, 20.0, 8.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.52734375, -3.42034912109375, -3.3133544921875, -3.20635986328125, -3.099365234375, -2.99237060546875, -2.8853759765625, -2.77838134765625, -2.67138671875, -2.56439208984375, -2.4573974609375, -2.35040283203125, -2.243408203125, -2.13641357421875, -2.0294189453125, -1.92242431640625, -1.8154296875, -1.70843505859375, -1.6014404296875, -1.49444580078125, -1.387451171875, -1.28045654296875, -1.1734619140625, -1.06646728515625, -0.95947265625, -0.85247802734375, -0.7454833984375, -0.63848876953125, -0.531494140625, -0.42449951171875, -0.3175048828125, -0.21051025390625, -0.103515625, 0.00347900390625, 0.1104736328125, 0.21746826171875, 0.324462890625, 0.43145751953125, 0.5384521484375, 0.64544677734375, 0.75244140625, 0.85943603515625, 0.9664306640625, 1.07342529296875, 1.180419921875, 1.28741455078125, 1.3944091796875, 1.50140380859375, 1.6083984375, 1.71539306640625, 1.8223876953125, 1.92938232421875, 2.036376953125, 2.14337158203125, 2.2503662109375, 2.35736083984375, 2.46435546875, 2.57135009765625, 2.6783447265625, 2.78533935546875, 2.892333984375, 2.99932861328125, 3.1063232421875, 3.21331787109375, 3.3203125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 5.0, 8.0, 11.0, 9.0, 11.0, 15.0, 15.0, 23.0, 32.0, 35.0, 35.0, 56.0, 63.0, 82.0, 97.0, 74.0, 74.0, 65.0, 59.0, 44.0, 39.0, 25.0, 29.0, 10.0, 11.0, 10.0, 8.0, 14.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5791015625, -1.5312042236328125, -1.483306884765625, -1.4354095458984375, -1.38751220703125, -1.3396148681640625, -1.291717529296875, -1.2438201904296875, -1.1959228515625, -1.1480255126953125, -1.100128173828125, -1.0522308349609375, -1.00433349609375, -0.9564361572265625, -0.908538818359375, -0.8606414794921875, -0.812744140625, -0.7648468017578125, -0.716949462890625, -0.6690521240234375, -0.62115478515625, -0.5732574462890625, -0.525360107421875, -0.4774627685546875, -0.4295654296875, -0.3816680908203125, -0.333770751953125, -0.2858734130859375, -0.23797607421875, -0.1900787353515625, -0.142181396484375, -0.0942840576171875, -0.04638671875, 0.0015106201171875, 0.049407958984375, 0.0973052978515625, 0.14520263671875, 0.1930999755859375, 0.240997314453125, 0.2888946533203125, 0.3367919921875, 0.3846893310546875, 0.432586669921875, 0.4804840087890625, 0.52838134765625, 0.5762786865234375, 0.624176025390625, 0.6720733642578125, 0.719970703125, 0.7678680419921875, 0.815765380859375, 0.8636627197265625, 0.91156005859375, 0.9594573974609375, 1.007354736328125, 1.0552520751953125, 1.1031494140625, 1.1510467529296875, 1.198944091796875, 1.2468414306640625, 1.29473876953125, 1.3426361083984375, 1.390533447265625, 1.4384307861328125, 1.486328125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 7.0, 8.0, 12.0, 12.0, 14.0, 19.0, 20.0, 21.0, 33.0, 48.0, 45.0, 65.0, 82.0, 99.0, 100.0, 70.0, 73.0, 45.0, 43.0, 29.0, 29.0, 20.0, 23.0, 18.0, 12.0, 6.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.69520378112793, -12.238527297973633, -11.781851768493652, -11.325175285339355, -10.868498802185059, -10.411823272705078, -9.955146789550781, -9.498470306396484, -9.041793823242188, -8.58511734008789, -8.12844181060791, -7.671765327453613, -7.215088844299316, -6.758412837982178, -6.301736831665039, -5.845060348510742, -5.388384819030762, -4.931708812713623, -4.475032329559326, -4.0183563232421875, -3.5616800785064697, -3.105003833770752, -2.6483278274536133, -2.1916515827178955, -1.7349753379821777, -1.27829909324646, -0.8216229677200317, -0.3649468421936035, 0.09172940254211426, 0.548405647277832, 1.0050816535949707, 1.4617578983306885, 1.9184341430664062, 2.375110387802124, 2.831786632537842, 3.2884626388549805, 3.7451388835906982, 4.201815128326416, 4.658491134643555, 5.115167617797852, 5.57184362411499, 6.028519630432129, 6.485196113586426, 6.9418721199035645, 7.398548126220703, 7.855224609375, 8.311901092529297, 8.768576622009277, 9.225253105163574, 9.681929588317871, 10.138605117797852, 10.595281600952148, 11.051958084106445, 11.508634567260742, 11.965310096740723, 12.42198657989502, 12.878662109375, 13.335338592529297, 13.792014122009277, 14.248690605163574, 14.705367088317871, 15.162042617797852, 15.618719100952148, 16.075395584106445, 16.532072067260742]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 8.0, 14.0, 14.0, 13.0, 18.0, 20.0, 25.0, 27.0, 37.0, 42.0, 28.0, 49.0, 41.0, 38.0, 39.0, 49.0, 47.0, 41.0, 46.0, 39.0, 42.0, 34.0, 26.0, 32.0, 23.0, 25.0, 36.0, 26.0, 27.0, 24.0, 16.0, 10.0, 4.0, 9.0, 7.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.974176406860352, -15.421013832092285, -14.867851257324219, -14.314687728881836, -13.76152515411377, -13.208362579345703, -12.65519905090332, -12.102036476135254, -11.548873901367188, -10.995711326599121, -10.442548751831055, -9.889385223388672, -9.336222648620605, -8.783060073852539, -8.229896545410156, -7.67673397064209, -7.123571395874023, -6.570408821105957, -6.017245769500732, -5.464082717895508, -4.910920143127441, -4.357757568359375, -3.8045945167541504, -3.251431703567505, -2.6982688903808594, -2.145106077194214, -1.5919432640075684, -1.0387804508209229, -0.48561763763427734, 0.06754517555236816, 0.6207079887390137, 1.1738708019256592, 1.7270336151123047, 2.28019642829895, 2.8333592414855957, 3.386522054672241, 3.9396848678588867, 4.492847442626953, 5.046010494232178, 5.599173545837402, 6.152336120605469, 6.705498695373535, 7.25866174697876, 7.811824798583984, 8.36498737335205, 8.918149948120117, 9.4713134765625, 10.024476051330566, 10.577638626098633, 11.1308012008667, 11.683963775634766, 12.237127304077148, 12.790289878845215, 13.343452453613281, 13.896615982055664, 14.44977855682373, 15.002941131591797, 15.556103706359863, 16.10926628112793, 16.662429809570312, 17.215591430664062, 17.768754959106445, 18.321918487548828, 18.875080108642578, 19.42824363708496]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 8.0, 15.0, 25.0, 30.0, 51.0, 95.0, 134.0, 263.0, 441.0, 669.0, 1009.0, 1537.0, 2449.0, 3809.0, 6016.0, 9154.0, 14857.0, 24551.0, 41584.0, 73885.0, 137989.0, 311874.0, 1094187.0, 1602266.0, 471424.0, 171563.0, 89334.0, 51224.0, 30484.0, 18584.0, 12044.0, 7685.0, 5000.0, 3201.0, 2194.0, 1439.0, 979.0, 657.0, 429.0, 301.0, 272.0, 191.0, 99.0, 80.0, 52.0, 59.0, 31.0, 20.0, 15.0, 5.0, 8.0, 8.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.296875, -17.670166015625, -17.04345703125, -16.416748046875, -15.7900390625, -15.163330078125, -14.53662109375, -13.909912109375, -13.283203125, -12.656494140625, -12.02978515625, -11.403076171875, -10.7763671875, -10.149658203125, -9.52294921875, -8.896240234375, -8.26953125, -7.642822265625, -7.01611328125, -6.389404296875, -5.7626953125, -5.135986328125, -4.50927734375, -3.882568359375, -3.255859375, -2.629150390625, -2.00244140625, -1.375732421875, -0.7490234375, -0.122314453125, 0.50439453125, 1.131103515625, 1.7578125, 2.384521484375, 3.01123046875, 3.637939453125, 4.2646484375, 4.891357421875, 5.51806640625, 6.144775390625, 6.771484375, 7.398193359375, 8.02490234375, 8.651611328125, 9.2783203125, 9.905029296875, 10.53173828125, 11.158447265625, 11.78515625, 12.411865234375, 13.03857421875, 13.665283203125, 14.2919921875, 14.918701171875, 15.54541015625, 16.172119140625, 16.798828125, 17.425537109375, 18.05224609375, 18.678955078125, 19.3056640625, 19.932373046875, 20.55908203125, 21.185791015625, 21.8125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 9.0, 7.0, 7.0, 7.0, 11.0, 12.0, 23.0, 18.0, 15.0, 21.0, 24.0, 41.0, 37.0, 38.0, 45.0, 26.0, 35.0, 42.0, 40.0, 50.0, 45.0, 36.0, 39.0, 46.0, 32.0, 37.0, 24.0, 26.0, 30.0, 33.0, 28.0, 20.0, 19.0, 22.0, 17.0, 12.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.3492431640625, -11.878173828125, -11.4071044921875, -10.93603515625, -10.4649658203125, -9.993896484375, -9.5228271484375, -9.0517578125, -8.5806884765625, -8.109619140625, -7.6385498046875, -7.16748046875, -6.6964111328125, -6.225341796875, -5.7542724609375, -5.283203125, -4.8121337890625, -4.341064453125, -3.8699951171875, -3.39892578125, -2.9278564453125, -2.456787109375, -1.9857177734375, -1.5146484375, -1.0435791015625, -0.572509765625, -0.1014404296875, 0.36962890625, 0.8406982421875, 1.311767578125, 1.7828369140625, 2.25390625, 2.7249755859375, 3.196044921875, 3.6671142578125, 4.13818359375, 4.6092529296875, 5.080322265625, 5.5513916015625, 6.0224609375, 6.4935302734375, 6.964599609375, 7.4356689453125, 7.90673828125, 8.3778076171875, 8.848876953125, 9.3199462890625, 9.791015625, 10.2620849609375, 10.733154296875, 11.2042236328125, 11.67529296875, 12.1463623046875, 12.617431640625, 13.0885009765625, 13.5595703125, 14.0306396484375, 14.501708984375, 14.9727783203125, 15.44384765625, 15.9149169921875, 16.385986328125, 16.8570556640625, 17.328125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 9.0, 19.0, 22.0, 38.0, 46.0, 69.0, 106.0, 178.0, 229.0, 418.0, 658.0, 955.0, 1525.0, 2484.0, 4016.0, 6346.0, 10570.0, 17749.0, 29409.0, 52362.0, 95703.0, 189901.0, 423023.0, 1223931.0, 1272997.0, 438193.0, 195338.0, 98334.0, 53309.0, 30279.0, 17682.0, 10734.0, 6628.0, 3982.0, 2496.0, 1665.0, 1016.0, 606.0, 462.0, 264.0, 195.0, 105.0, 67.0, 52.0, 38.0, 24.0, 16.0, 10.0, 11.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-18.484375, -17.924560546875, -17.36474609375, -16.804931640625, -16.2451171875, -15.685302734375, -15.12548828125, -14.565673828125, -14.005859375, -13.446044921875, -12.88623046875, -12.326416015625, -11.7666015625, -11.206787109375, -10.64697265625, -10.087158203125, -9.52734375, -8.967529296875, -8.40771484375, -7.847900390625, -7.2880859375, -6.728271484375, -6.16845703125, -5.608642578125, -5.048828125, -4.489013671875, -3.92919921875, -3.369384765625, -2.8095703125, -2.249755859375, -1.68994140625, -1.130126953125, -0.5703125, -0.010498046875, 0.54931640625, 1.109130859375, 1.6689453125, 2.228759765625, 2.78857421875, 3.348388671875, 3.908203125, 4.468017578125, 5.02783203125, 5.587646484375, 6.1474609375, 6.707275390625, 7.26708984375, 7.826904296875, 8.38671875, 8.946533203125, 9.50634765625, 10.066162109375, 10.6259765625, 11.185791015625, 11.74560546875, 12.305419921875, 12.865234375, 13.425048828125, 13.98486328125, 14.544677734375, 15.1044921875, 15.664306640625, 16.22412109375, 16.783935546875, 17.34375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 1.0, 7.0, 8.0, 14.0, 22.0, 18.0, 25.0, 29.0, 40.0, 40.0, 50.0, 63.0, 76.0, 94.0, 107.0, 145.0, 152.0, 184.0, 202.0, 220.0, 297.0, 359.0, 314.0, 305.0, 228.0, 173.0, 191.0, 126.0, 112.0, 93.0, 57.0, 60.0, 65.0, 41.0, 29.0, 22.0, 21.0, 22.0, 18.0, 9.0, 10.0, 5.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94921875, -6.72296142578125, -6.4967041015625, -6.27044677734375, -6.044189453125, -5.81793212890625, -5.5916748046875, -5.36541748046875, -5.13916015625, -4.91290283203125, -4.6866455078125, -4.46038818359375, -4.234130859375, -4.00787353515625, -3.7816162109375, -3.55535888671875, -3.3291015625, -3.10284423828125, -2.8765869140625, -2.65032958984375, -2.424072265625, -2.19781494140625, -1.9715576171875, -1.74530029296875, -1.51904296875, -1.29278564453125, -1.0665283203125, -0.84027099609375, -0.614013671875, -0.38775634765625, -0.1614990234375, 0.06475830078125, 0.291015625, 0.51727294921875, 0.7435302734375, 0.96978759765625, 1.196044921875, 1.42230224609375, 1.6485595703125, 1.87481689453125, 2.10107421875, 2.32733154296875, 2.5535888671875, 2.77984619140625, 3.006103515625, 3.23236083984375, 3.4586181640625, 3.68487548828125, 3.9111328125, 4.13739013671875, 4.3636474609375, 4.58990478515625, 4.816162109375, 5.04241943359375, 5.2686767578125, 5.49493408203125, 5.72119140625, 5.94744873046875, 6.1737060546875, 6.39996337890625, 6.626220703125, 6.85247802734375, 7.0787353515625, 7.30499267578125, 7.53125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 3.0, 11.0, 7.0, 12.0, 14.0, 19.0, 24.0, 25.0, 38.0, 52.0, 51.0, 68.0, 84.0, 116.0, 114.0, 82.0, 67.0, 37.0, 27.0, 34.0, 18.0, 20.0, 18.0, 13.0, 12.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.938812255859375, -19.391992568969727, -18.845172882080078, -18.298351287841797, -17.75153160095215, -17.2047119140625, -16.65789222717285, -16.111072540283203, -15.564251899719238, -15.01743221282959, -14.470611572265625, -13.923791885375977, -13.376972198486328, -12.830151557922363, -12.283331871032715, -11.73651123046875, -11.189691543579102, -10.642871856689453, -10.096051216125488, -9.54923152923584, -9.002410888671875, -8.455591201782227, -7.908771514892578, -7.3619513511657715, -6.815131187438965, -6.268311023712158, -5.721490859985352, -5.174671173095703, -4.6278510093688965, -4.08103084564209, -3.5342109203338623, -2.9873909950256348, -2.4405717849731445, -1.8937517404556274, -1.3469316959381104, -0.8001116514205933, -0.25329160690307617, 0.29352855682373047, 0.840348482131958, 1.3871684074401855, 1.9339885711669922, 2.480808734893799, 3.0276286602020264, 3.574448585510254, 4.1212687492370605, 4.668088912963867, 5.214908599853516, 5.761728763580322, 6.308548927307129, 6.8553690910339355, 7.402189254760742, 7.949008941650391, 8.495828628540039, 9.042649269104004, 9.589468955993652, 10.136289596557617, 10.683109283447266, 11.229928970336914, 11.776749610900879, 12.323569297790527, 12.870389938354492, 13.41720962524414, 13.964029312133789, 14.510848999023438, 15.057669639587402]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 15.0, 12.0, 14.0, 14.0, 23.0, 15.0, 28.0, 37.0, 42.0, 24.0, 36.0, 38.0, 46.0, 38.0, 46.0, 46.0, 34.0, 43.0, 46.0, 43.0, 49.0, 37.0, 28.0, 33.0, 35.0, 18.0, 32.0, 26.0, 14.0, 12.0, 12.0, 12.0, 4.0, 13.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.78964614868164, -17.219343185424805, -16.64904022216797, -16.0787353515625, -15.508432388305664, -14.938129425048828, -14.367826461791992, -13.797523498535156, -13.227219581604004, -12.656916618347168, -12.086612701416016, -11.51630973815918, -10.946006774902344, -10.375702857971191, -9.805399894714355, -9.235095977783203, -8.664793014526367, -8.094490051269531, -7.524186134338379, -6.953883171081543, -6.383579730987549, -5.813276290893555, -5.242973327636719, -4.672669887542725, -4.1023664474487305, -3.5320630073547363, -2.9617598056793213, -2.3914566040039062, -1.821153163909912, -1.250849723815918, -0.6805465221405029, -0.11024332046508789, 0.46006202697753906, 1.0303653478622437, 1.6006686687469482, 2.1709718704223633, 2.7412753105163574, 3.3115787506103516, 3.8818819522857666, 4.452185153961182, 5.022488594055176, 5.59279203414917, 6.163095474243164, 6.7333984375, 7.303701877593994, 7.874005317687988, 8.444308280944824, 9.014612197875977, 9.584915161132812, 10.155218124389648, 10.7255220413208, 11.295825004577637, 11.866128921508789, 12.436431884765625, 13.006734848022461, 13.577037811279297, 14.14734172821045, 14.717644691467285, 15.287948608398438, 15.858251571655273, 16.42855453491211, 16.998859405517578, 17.569162368774414, 18.13946533203125, 18.709768295288086]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 14.0, 20.0, 20.0, 43.0, 65.0, 102.0, 139.0, 229.0, 347.0, 548.0, 842.0, 1384.0, 2284.0, 3764.0, 6011.0, 10153.0, 17397.0, 30404.0, 54614.0, 103415.0, 263598.0, 308084.0, 109897.0, 57396.0, 31932.0, 18478.0, 10722.0, 6432.0, 3892.0, 2378.0, 1446.0, 917.0, 534.0, 367.0, 217.0, 153.0, 101.0, 69.0, 51.0, 29.0, 20.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.3472900390625, -5.175048828125, -5.0028076171875, -4.83056640625, -4.6583251953125, -4.486083984375, -4.3138427734375, -4.1416015625, -3.9693603515625, -3.797119140625, -3.6248779296875, -3.45263671875, -3.2803955078125, -3.108154296875, -2.9359130859375, -2.763671875, -2.5914306640625, -2.419189453125, -2.2469482421875, -2.07470703125, -1.9024658203125, -1.730224609375, -1.5579833984375, -1.3857421875, -1.2135009765625, -1.041259765625, -0.8690185546875, -0.69677734375, -0.5245361328125, -0.352294921875, -0.1800537109375, -0.0078125, 0.1644287109375, 0.336669921875, 0.5089111328125, 0.68115234375, 0.8533935546875, 1.025634765625, 1.1978759765625, 1.3701171875, 1.5423583984375, 1.714599609375, 1.8868408203125, 2.05908203125, 2.2313232421875, 2.403564453125, 2.5758056640625, 2.748046875, 2.9202880859375, 3.092529296875, 3.2647705078125, 3.43701171875, 3.6092529296875, 3.781494140625, 3.9537353515625, 4.1259765625, 4.2982177734375, 4.470458984375, 4.6427001953125, 4.81494140625, 4.9871826171875, 5.159423828125, 5.3316650390625, 5.50390625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 5.0, 14.0, 14.0, 8.0, 14.0, 19.0, 21.0, 21.0, 26.0, 41.0, 35.0, 25.0, 38.0, 54.0, 34.0, 39.0, 45.0, 52.0, 30.0, 48.0, 47.0, 48.0, 32.0, 32.0, 39.0, 25.0, 36.0, 26.0, 21.0, 21.0, 15.0, 17.0, 6.0, 8.0, 15.0, 9.0, 3.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.0625, -17.49755859375, -16.9326171875, -16.36767578125, -15.802734375, -15.23779296875, -14.6728515625, -14.10791015625, -13.54296875, -12.97802734375, -12.4130859375, -11.84814453125, -11.283203125, -10.71826171875, -10.1533203125, -9.58837890625, -9.0234375, -8.45849609375, -7.8935546875, -7.32861328125, -6.763671875, -6.19873046875, -5.6337890625, -5.06884765625, -4.50390625, -3.93896484375, -3.3740234375, -2.80908203125, -2.244140625, -1.67919921875, -1.1142578125, -0.54931640625, 0.015625, 0.58056640625, 1.1455078125, 1.71044921875, 2.275390625, 2.84033203125, 3.4052734375, 3.97021484375, 4.53515625, 5.10009765625, 5.6650390625, 6.22998046875, 6.794921875, 7.35986328125, 7.9248046875, 8.48974609375, 9.0546875, 9.61962890625, 10.1845703125, 10.74951171875, 11.314453125, 11.87939453125, 12.4443359375, 13.00927734375, 13.57421875, 14.13916015625, 14.7041015625, 15.26904296875, 15.833984375, 16.39892578125, 16.9638671875, 17.52880859375, 18.09375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 8.0, 15.0, 19.0, 26.0, 39.0, 53.0, 60.0, 103.0, 136.0, 219.0, 308.0, 418.0, 640.0, 889.0, 1264.0, 1908.0, 2823.0, 4206.0, 6424.0, 10004.0, 15591.0, 24539.0, 39270.0, 64445.0, 110971.0, 262281.0, 228925.0, 105872.0, 61707.0, 38104.0, 23877.0, 14864.0, 9674.0, 6168.0, 4057.0, 2734.0, 1862.0, 1267.0, 851.0, 598.0, 400.0, 284.0, 205.0, 148.0, 104.0, 65.0, 42.0, 28.0, 13.0, 14.0, 12.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.44140625, -4.30242919921875, -4.1634521484375, -4.02447509765625, -3.885498046875, -3.74652099609375, -3.6075439453125, -3.46856689453125, -3.32958984375, -3.19061279296875, -3.0516357421875, -2.91265869140625, -2.773681640625, -2.63470458984375, -2.4957275390625, -2.35675048828125, -2.2177734375, -2.07879638671875, -1.9398193359375, -1.80084228515625, -1.661865234375, -1.52288818359375, -1.3839111328125, -1.24493408203125, -1.10595703125, -0.96697998046875, -0.8280029296875, -0.68902587890625, -0.550048828125, -0.41107177734375, -0.2720947265625, -0.13311767578125, 0.005859375, 0.14483642578125, 0.2838134765625, 0.42279052734375, 0.561767578125, 0.70074462890625, 0.8397216796875, 0.97869873046875, 1.11767578125, 1.25665283203125, 1.3956298828125, 1.53460693359375, 1.673583984375, 1.81256103515625, 1.9515380859375, 2.09051513671875, 2.2294921875, 2.36846923828125, 2.5074462890625, 2.64642333984375, 2.785400390625, 2.92437744140625, 3.0633544921875, 3.20233154296875, 3.34130859375, 3.48028564453125, 3.6192626953125, 3.75823974609375, 3.897216796875, 4.03619384765625, 4.1751708984375, 4.31414794921875, 4.453125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 8.0, 9.0, 11.0, 10.0, 6.0, 20.0, 12.0, 22.0, 25.0, 29.0, 34.0, 28.0, 36.0, 26.0, 19.0, 37.0, 26.0, 35.0, 43.0, 31.0, 36.0, 37.0, 43.0, 31.0, 45.0, 50.0, 41.0, 36.0, 33.0, 23.0, 30.0, 17.0, 11.0, 28.0, 17.0, 10.0, 12.0, 5.0, 9.0, 7.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.439453125, -9.11328125, -8.787109375, -8.4609375, -8.134765625, -7.80859375, -7.482421875, -7.15625, -6.830078125, -6.50390625, -6.177734375, -5.8515625, -5.525390625, -5.19921875, -4.873046875, -4.546875, -4.220703125, -3.89453125, -3.568359375, -3.2421875, -2.916015625, -2.58984375, -2.263671875, -1.9375, -1.611328125, -1.28515625, -0.958984375, -0.6328125, -0.306640625, 0.01953125, 0.345703125, 0.671875, 0.998046875, 1.32421875, 1.650390625, 1.9765625, 2.302734375, 2.62890625, 2.955078125, 3.28125, 3.607421875, 3.93359375, 4.259765625, 4.5859375, 4.912109375, 5.23828125, 5.564453125, 5.890625, 6.216796875, 6.54296875, 6.869140625, 7.1953125, 7.521484375, 7.84765625, 8.173828125, 8.5, 8.826171875, 9.15234375, 9.478515625, 9.8046875, 10.130859375, 10.45703125, 10.783203125, 11.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 12.0, 9.0, 8.0, 19.0, 32.0, 50.0, 67.0, 116.0, 171.0, 277.0, 406.0, 581.0, 966.0, 1502.0, 2531.0, 4170.0, 7261.0, 12601.0, 23898.0, 48967.0, 118091.0, 373831.0, 274422.0, 91830.0, 40168.0, 19876.0, 11010.0, 6101.0, 3642.0, 2184.0, 1397.0, 839.0, 586.0, 338.0, 207.0, 143.0, 87.0, 69.0, 29.0, 21.0, 21.0, 8.0, 4.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00798797607421875, -0.007752120494842529, -0.007516264915466309, -0.007280409336090088, -0.007044553756713867, -0.0068086981773376465, -0.006572842597961426, -0.006336987018585205, -0.006101131439208984, -0.005865275859832764, -0.005629420280456543, -0.005393564701080322, -0.0051577091217041016, -0.004921853542327881, -0.00468599796295166, -0.0044501423835754395, -0.004214286804199219, -0.003978431224822998, -0.0037425756454467773, -0.0035067200660705566, -0.003270864486694336, -0.0030350089073181152, -0.0027991533279418945, -0.002563297748565674, -0.002327442169189453, -0.0020915865898132324, -0.0018557310104370117, -0.001619875431060791, -0.0013840198516845703, -0.0011481642723083496, -0.0009123086929321289, -0.0006764531135559082, -0.0004405975341796875, -0.0002047419548034668, 3.1113624572753906e-05, 0.0002669692039489746, 0.0005028247833251953, 0.000738680362701416, 0.0009745359420776367, 0.0012103915214538574, 0.0014462471008300781, 0.0016821026802062988, 0.0019179582595825195, 0.0021538138389587402, 0.002389669418334961, 0.0026255249977111816, 0.0028613805770874023, 0.003097236156463623, 0.0033330917358398438, 0.0035689473152160645, 0.003804802894592285, 0.004040658473968506, 0.0042765140533447266, 0.004512369632720947, 0.004748225212097168, 0.004984080791473389, 0.005219936370849609, 0.00545579195022583, 0.005691647529602051, 0.0059275031089782715, 0.006163358688354492, 0.006399214267730713, 0.006635069847106934, 0.006870925426483154, 0.007106781005859375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 7.0, 12.0, 12.0, 15.0, 20.0, 17.0, 31.0, 28.0, 33.0, 33.0, 40.0, 55.0, 51.0, 57.0, 54.0, 64.0, 87.0, 40.0, 48.0, 39.0, 46.0, 46.0, 31.0, 24.0, 12.0, 17.0, 19.0, 12.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.5045668482780457e-06, -3.373250365257263e-06, -3.2419338822364807e-06, -3.1106173992156982e-06, -2.9793009161949158e-06, -2.8479844331741333e-06, -2.716667950153351e-06, -2.5853514671325684e-06, -2.454034984111786e-06, -2.3227185010910034e-06, -2.191402018070221e-06, -2.0600855350494385e-06, -1.928769052028656e-06, -1.7974525690078735e-06, -1.666136085987091e-06, -1.5348196029663086e-06, -1.4035031199455261e-06, -1.2721866369247437e-06, -1.1408701539039612e-06, -1.0095536708831787e-06, -8.782371878623962e-07, -7.469207048416138e-07, -6.156042218208313e-07, -4.842877388000488e-07, -3.5297125577926636e-07, -2.2165477275848389e-07, -9.033828973770142e-08, 4.0978193283081055e-08, 1.7229467630386353e-07, 3.03611159324646e-07, 4.3492764234542847e-07, 5.662441253662109e-07, 6.975606083869934e-07, 8.288770914077759e-07, 9.601935744285583e-07, 1.0915100574493408e-06, 1.2228265404701233e-06, 1.3541430234909058e-06, 1.4854595065116882e-06, 1.6167759895324707e-06, 1.7480924725532532e-06, 1.8794089555740356e-06, 2.010725438594818e-06, 2.1420419216156006e-06, 2.273358404636383e-06, 2.4046748876571655e-06, 2.535991370677948e-06, 2.6673078536987305e-06, 2.798624336719513e-06, 2.9299408197402954e-06, 3.061257302761078e-06, 3.1925737857818604e-06, 3.323890268802643e-06, 3.4552067518234253e-06, 3.5865232348442078e-06, 3.7178397178649902e-06, 3.849156200885773e-06, 3.980472683906555e-06, 4.111789166927338e-06, 4.24310564994812e-06, 4.374422132968903e-06, 4.505738615989685e-06, 4.6370550990104675e-06, 4.76837158203125e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 11.0, 20.0, 25.0, 48.0, 55.0, 81.0, 130.0, 170.0, 299.0, 431.0, 677.0, 1132.0, 1791.0, 3038.0, 5014.0, 9197.0, 18450.0, 39981.0, 96205.0, 331484.0, 355397.0, 101678.0, 41271.0, 19017.0, 9674.0, 5224.0, 2973.0, 1911.0, 1091.0, 758.0, 421.0, 318.0, 185.0, 122.0, 90.0, 54.0, 37.0, 29.0, 15.0, 13.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0075531005859375, -0.0072928667068481445, -0.007032632827758789, -0.006772398948669434, -0.006512165069580078, -0.006251931190490723, -0.005991697311401367, -0.005731463432312012, -0.005471229553222656, -0.005210995674133301, -0.004950761795043945, -0.00469052791595459, -0.004430294036865234, -0.004170060157775879, -0.0039098262786865234, -0.003649592399597168, -0.0033893585205078125, -0.003129124641418457, -0.0028688907623291016, -0.002608656883239746, -0.0023484230041503906, -0.002088189125061035, -0.0018279552459716797, -0.0015677213668823242, -0.0013074874877929688, -0.0010472536087036133, -0.0007870197296142578, -0.0005267858505249023, -0.0002665519714355469, -6.318092346191406e-06, 0.00025391578674316406, 0.0005141496658325195, 0.000774383544921875, 0.0010346174240112305, 0.001294851303100586, 0.0015550851821899414, 0.0018153190612792969, 0.0020755529403686523, 0.002335786819458008, 0.0025960206985473633, 0.0028562545776367188, 0.0031164884567260742, 0.0033767223358154297, 0.003636956214904785, 0.0038971900939941406, 0.004157423973083496, 0.0044176578521728516, 0.004677891731262207, 0.0049381256103515625, 0.005198359489440918, 0.0054585933685302734, 0.005718827247619629, 0.005979061126708984, 0.00623929500579834, 0.006499528884887695, 0.006759762763977051, 0.007019996643066406, 0.007280230522155762, 0.007540464401245117, 0.007800698280334473, 0.008060932159423828, 0.008321166038513184, 0.008581399917602539, 0.008841633796691895, 0.00910186767578125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 11.0, 18.0, 19.0, 15.0, 30.0, 39.0, 44.0, 55.0, 54.0, 86.0, 99.0, 106.0, 79.0, 59.0, 52.0, 47.0, 43.0, 27.0, 26.0, 20.0, 8.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00390625, -0.0038010776042938232, -0.0036959052085876465, -0.0035907328128814697, -0.003485560417175293, -0.003380388021469116, -0.0032752156257629395, -0.0031700432300567627, -0.003064870834350586, -0.002959698438644409, -0.0028545260429382324, -0.0027493536472320557, -0.002644181251525879, -0.002539008855819702, -0.0024338364601135254, -0.0023286640644073486, -0.002223491668701172, -0.002118319272994995, -0.0020131468772888184, -0.0019079744815826416, -0.0018028020858764648, -0.001697629690170288, -0.0015924572944641113, -0.0014872848987579346, -0.0013821125030517578, -0.001276940107345581, -0.0011717677116394043, -0.0010665953159332275, -0.0009614229202270508, -0.000856250524520874, -0.0007510781288146973, -0.0006459057331085205, -0.0005407333374023438, -0.000435560941696167, -0.00033038854598999023, -0.00022521615028381348, -0.00012004375457763672, -1.4871358871459961e-05, 9.03010368347168e-05, 0.00019547343254089355, 0.0003006458282470703, 0.00040581822395324707, 0.0005109906196594238, 0.0006161630153656006, 0.0007213354110717773, 0.0008265078067779541, 0.0009316802024841309, 0.0010368525981903076, 0.0011420249938964844, 0.0012471973896026611, 0.0013523697853088379, 0.0014575421810150146, 0.0015627145767211914, 0.0016678869724273682, 0.001773059368133545, 0.0018782317638397217, 0.0019834041595458984, 0.002088576555252075, 0.002193748950958252, 0.0022989213466644287, 0.0024040937423706055, 0.0025092661380767822, 0.002614438533782959, 0.0027196109294891357, 0.0028247833251953125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 7.0, 10.0, 17.0, 15.0, 21.0, 25.0, 34.0, 49.0, 47.0, 60.0, 82.0, 113.0, 107.0, 88.0, 78.0, 38.0, 36.0, 26.0, 23.0, 20.0, 22.0, 11.0, 15.0, 12.0, 4.0, 2.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.503889083862305, -18.973661422729492, -18.443431854248047, -17.913204193115234, -17.382976531982422, -16.85274887084961, -16.322519302368164, -15.792291641235352, -15.262063980102539, -14.73183536529541, -14.201607704162598, -13.671379089355469, -13.141151428222656, -12.610922813415527, -12.080694198608398, -11.550466537475586, -11.020237922668457, -10.490009307861328, -9.959781646728516, -9.429553031921387, -8.899325370788574, -8.369096755981445, -7.838868618011475, -7.308640480041504, -6.778412342071533, -6.2481842041015625, -5.717956066131592, -5.187727928161621, -4.657499313354492, -4.12727165222168, -3.597043037414551, -3.06681489944458, -2.536585807800293, -2.0063576698303223, -1.476129412651062, -0.9459011554718018, -0.41567301750183105, 0.11455512046813965, 0.6447834968566895, 1.1750116348266602, 1.7052397727966309, 2.2354679107666016, 2.7656960487365723, 3.295924425125122, 3.8261525630950928, 4.356380462646484, 4.886609077453613, 5.416837215423584, 5.947065353393555, 6.477293491363525, 7.007521629333496, 7.537750244140625, 8.067977905273438, 8.598206520080566, 9.128435134887695, 9.658662796020508, 10.18889045715332, 10.71911907196045, 11.249346733093262, 11.77957534790039, 12.309803009033203, 12.840031623840332, 13.370260238647461, 13.900487899780273, 14.430716514587402]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 15.0, 12.0, 14.0, 14.0, 23.0, 16.0, 27.0, 37.0, 43.0, 23.0, 36.0, 39.0, 45.0, 38.0, 46.0, 46.0, 35.0, 42.0, 46.0, 43.0, 49.0, 37.0, 28.0, 33.0, 35.0, 19.0, 31.0, 27.0, 13.0, 12.0, 12.0, 12.0, 4.0, 13.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.889938354492188, -17.320709228515625, -16.751480102539062, -16.1822509765625, -15.613021850585938, -15.043792724609375, -14.474563598632812, -13.90533447265625, -13.336105346679688, -12.766876220703125, -12.197647094726562, -11.62841796875, -11.059188842773438, -10.489959716796875, -9.920730590820312, -9.35150146484375, -8.782272338867188, -8.213043212890625, -7.6438140869140625, -7.0745849609375, -6.5053558349609375, -5.936126708984375, -5.3668975830078125, -4.79766845703125, -4.2284393310546875, -3.659210205078125, -3.0899810791015625, -2.520751953125, -1.9515228271484375, -1.382293701171875, -0.8130645751953125, -0.24383544921875, 0.3253936767578125, 0.894622802734375, 1.4638519287109375, 2.0330810546875, 2.6023101806640625, 3.171539306640625, 3.7407684326171875, 4.30999755859375, 4.8792266845703125, 5.448455810546875, 6.0176849365234375, 6.5869140625, 7.1561431884765625, 7.725372314453125, 8.294601440429688, 8.86383056640625, 9.433059692382812, 10.002288818359375, 10.571517944335938, 11.1407470703125, 11.709976196289062, 12.279205322265625, 12.848434448242188, 13.41766357421875, 13.986892700195312, 14.556121826171875, 15.125350952148438, 15.694580078125, 16.263809204101562, 16.833038330078125, 17.402267456054688, 17.97149658203125, 18.540725708007812]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 20.0, 19.0, 31.0, 34.0, 62.0, 101.0, 150.0, 193.0, 269.0, 463.0, 725.0, 1138.0, 1817.0, 3012.0, 4620.0, 7291.0, 11974.0, 19587.0, 32104.0, 55669.0, 105241.0, 229629.0, 277010.0, 132610.0, 67074.0, 37969.0, 22841.0, 13901.0, 8545.0, 5263.0, 3406.0, 1973.0, 1330.0, 865.0, 536.0, 357.0, 217.0, 158.0, 139.0, 64.0, 44.0, 29.0, 18.0, 19.0, 7.0, 11.0, 6.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.28125, -26.432861328125, -25.58447265625, -24.736083984375, -23.8876953125, -23.039306640625, -22.19091796875, -21.342529296875, -20.494140625, -19.645751953125, -18.79736328125, -17.948974609375, -17.1005859375, -16.252197265625, -15.40380859375, -14.555419921875, -13.70703125, -12.858642578125, -12.01025390625, -11.161865234375, -10.3134765625, -9.465087890625, -8.61669921875, -7.768310546875, -6.919921875, -6.071533203125, -5.22314453125, -4.374755859375, -3.5263671875, -2.677978515625, -1.82958984375, -0.981201171875, -0.1328125, 0.715576171875, 1.56396484375, 2.412353515625, 3.2607421875, 4.109130859375, 4.95751953125, 5.805908203125, 6.654296875, 7.502685546875, 8.35107421875, 9.199462890625, 10.0478515625, 10.896240234375, 11.74462890625, 12.593017578125, 13.44140625, 14.289794921875, 15.13818359375, 15.986572265625, 16.8349609375, 17.683349609375, 18.53173828125, 19.380126953125, 20.228515625, 21.076904296875, 21.92529296875, 22.773681640625, 23.6220703125, 24.470458984375, 25.31884765625, 26.167236328125, 27.015625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 12.0, 8.0, 16.0, 14.0, 14.0, 19.0, 19.0, 35.0, 31.0, 45.0, 30.0, 30.0, 38.0, 40.0, 47.0, 47.0, 44.0, 36.0, 46.0, 46.0, 50.0, 41.0, 40.0, 36.0, 35.0, 20.0, 29.0, 29.0, 19.0, 16.0, 15.0, 7.0, 10.0, 4.0, 11.0, 11.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.865234375, -15.33984375, -14.814453125, -14.2890625, -13.763671875, -13.23828125, -12.712890625, -12.1875, -11.662109375, -11.13671875, -10.611328125, -10.0859375, -9.560546875, -9.03515625, -8.509765625, -7.984375, -7.458984375, -6.93359375, -6.408203125, -5.8828125, -5.357421875, -4.83203125, -4.306640625, -3.78125, -3.255859375, -2.73046875, -2.205078125, -1.6796875, -1.154296875, -0.62890625, -0.103515625, 0.421875, 0.947265625, 1.47265625, 1.998046875, 2.5234375, 3.048828125, 3.57421875, 4.099609375, 4.625, 5.150390625, 5.67578125, 6.201171875, 6.7265625, 7.251953125, 7.77734375, 8.302734375, 8.828125, 9.353515625, 9.87890625, 10.404296875, 10.9296875, 11.455078125, 11.98046875, 12.505859375, 13.03125, 13.556640625, 14.08203125, 14.607421875, 15.1328125, 15.658203125, 16.18359375, 16.708984375, 17.234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 2.0, 6.0, 5.0, 12.0, 19.0, 28.0, 50.0, 48.0, 87.0, 165.0, 194.0, 360.0, 474.0, 725.0, 1083.0, 1674.0, 2473.0, 3718.0, 5779.0, 8984.0, 14259.0, 23211.0, 38184.0, 65473.0, 124641.0, 261136.0, 231601.0, 110425.0, 59942.0, 35502.0, 21239.0, 13094.0, 8320.0, 5391.0, 3443.0, 2269.0, 1489.0, 1009.0, 672.0, 470.0, 297.0, 218.0, 123.0, 98.0, 65.0, 36.0, 27.0, 14.0, 14.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.828125, -23.969482421875, -23.11083984375, -22.252197265625, -21.3935546875, -20.534912109375, -19.67626953125, -18.817626953125, -17.958984375, -17.100341796875, -16.24169921875, -15.383056640625, -14.5244140625, -13.665771484375, -12.80712890625, -11.948486328125, -11.08984375, -10.231201171875, -9.37255859375, -8.513916015625, -7.6552734375, -6.796630859375, -5.93798828125, -5.079345703125, -4.220703125, -3.362060546875, -2.50341796875, -1.644775390625, -0.7861328125, 0.072509765625, 0.93115234375, 1.789794921875, 2.6484375, 3.507080078125, 4.36572265625, 5.224365234375, 6.0830078125, 6.941650390625, 7.80029296875, 8.658935546875, 9.517578125, 10.376220703125, 11.23486328125, 12.093505859375, 12.9521484375, 13.810791015625, 14.66943359375, 15.528076171875, 16.38671875, 17.245361328125, 18.10400390625, 18.962646484375, 19.8212890625, 20.679931640625, 21.53857421875, 22.397216796875, 23.255859375, 24.114501953125, 24.97314453125, 25.831787109375, 26.6904296875, 27.549072265625, 28.40771484375, 29.266357421875, 30.125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 6.0, 7.0, 7.0, 8.0, 6.0, 10.0, 16.0, 9.0, 14.0, 27.0, 28.0, 25.0, 34.0, 32.0, 28.0, 32.0, 40.0, 40.0, 37.0, 49.0, 43.0, 38.0, 52.0, 39.0, 41.0, 42.0, 29.0, 34.0, 40.0, 35.0, 26.0, 25.0, 17.0, 14.0, 16.0, 13.0, 5.0, 8.0, 9.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.328125, -9.0067138671875, -8.685302734375, -8.3638916015625, -8.04248046875, -7.7210693359375, -7.399658203125, -7.0782470703125, -6.7568359375, -6.4354248046875, -6.114013671875, -5.7926025390625, -5.47119140625, -5.1497802734375, -4.828369140625, -4.5069580078125, -4.185546875, -3.8641357421875, -3.542724609375, -3.2213134765625, -2.89990234375, -2.5784912109375, -2.257080078125, -1.9356689453125, -1.6142578125, -1.2928466796875, -0.971435546875, -0.6500244140625, -0.32861328125, -0.0072021484375, 0.314208984375, 0.6356201171875, 0.95703125, 1.2784423828125, 1.599853515625, 1.9212646484375, 2.24267578125, 2.5640869140625, 2.885498046875, 3.2069091796875, 3.5283203125, 3.8497314453125, 4.171142578125, 4.4925537109375, 4.81396484375, 5.1353759765625, 5.456787109375, 5.7781982421875, 6.099609375, 6.4210205078125, 6.742431640625, 7.0638427734375, 7.38525390625, 7.7066650390625, 8.028076171875, 8.3494873046875, 8.6708984375, 8.9923095703125, 9.313720703125, 9.6351318359375, 9.95654296875, 10.2779541015625, 10.599365234375, 10.9207763671875, 11.2421875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 10.0, 12.0, 6.0, 12.0, 17.0, 26.0, 40.0, 61.0, 62.0, 98.0, 126.0, 190.0, 243.0, 347.0, 509.0, 761.0, 1179.0, 1801.0, 3060.0, 5091.0, 9876.0, 21020.0, 51570.0, 175140.0, 540006.0, 149061.0, 46763.0, 19287.0, 9090.0, 4939.0, 2826.0, 1755.0, 1106.0, 755.0, 494.0, 361.0, 241.0, 160.0, 122.0, 97.0, 61.0, 45.0, 41.0, 24.0, 21.0, 18.0, 7.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.24609375, -6.04095458984375, -5.8358154296875, -5.63067626953125, -5.425537109375, -5.22039794921875, -5.0152587890625, -4.81011962890625, -4.60498046875, -4.39984130859375, -4.1947021484375, -3.98956298828125, -3.784423828125, -3.57928466796875, -3.3741455078125, -3.16900634765625, -2.9638671875, -2.75872802734375, -2.5535888671875, -2.34844970703125, -2.143310546875, -1.93817138671875, -1.7330322265625, -1.52789306640625, -1.32275390625, -1.11761474609375, -0.9124755859375, -0.70733642578125, -0.502197265625, -0.29705810546875, -0.0919189453125, 0.11322021484375, 0.318359375, 0.52349853515625, 0.7286376953125, 0.93377685546875, 1.138916015625, 1.34405517578125, 1.5491943359375, 1.75433349609375, 1.95947265625, 2.16461181640625, 2.3697509765625, 2.57489013671875, 2.780029296875, 2.98516845703125, 3.1903076171875, 3.39544677734375, 3.6005859375, 3.80572509765625, 4.0108642578125, 4.21600341796875, 4.421142578125, 4.62628173828125, 4.8314208984375, 5.03656005859375, 5.24169921875, 5.44683837890625, 5.6519775390625, 5.85711669921875, 6.062255859375, 6.26739501953125, 6.4725341796875, 6.67767333984375, 6.8828125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 7.0, 6.0, 8.0, 17.0, 34.0, 32.0, 38.0, 46.0, 53.0, 105.0, 100.0, 97.0, 101.0, 74.0, 64.0, 46.0, 40.0, 39.0, 18.0, 12.0, 8.0, 8.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017631053924560547, -0.00016983412206172943, -0.0001633577048778534, -0.00015688128769397736, -0.00015040487051010132, -0.00014392845332622528, -0.00013745203614234924, -0.0001309756189584732, -0.00012449920177459717, -0.00011802278459072113, -0.00011154636740684509, -0.00010506995022296906, -9.859353303909302e-05, -9.211711585521698e-05, -8.564069867134094e-05, -7.91642814874649e-05, -7.268786430358887e-05, -6.621144711971283e-05, -5.973502993583679e-05, -5.3258612751960754e-05, -4.678219556808472e-05, -4.030577838420868e-05, -3.382936120033264e-05, -2.7352944016456604e-05, -2.0876526832580566e-05, -1.4400109648704529e-05, -7.923692464828491e-06, -1.4472752809524536e-06, 5.029141902923584e-06, 1.1505559086799622e-05, 1.798197627067566e-05, 2.4458393454551697e-05, 3.0934810638427734e-05, 3.741122782230377e-05, 4.388764500617981e-05, 5.036406219005585e-05, 5.6840479373931885e-05, 6.331689655780792e-05, 6.979331374168396e-05, 7.626973092556e-05, 8.274614810943604e-05, 8.922256529331207e-05, 9.569898247718811e-05, 0.00010217539966106415, 0.00010865181684494019, 0.00011512823402881622, 0.00012160465121269226, 0.0001280810683965683, 0.00013455748558044434, 0.00014103390276432037, 0.0001475103199481964, 0.00015398673713207245, 0.00016046315431594849, 0.00016693957149982452, 0.00017341598868370056, 0.0001798924058675766, 0.00018636882305145264, 0.00019284524023532867, 0.0001993216574192047, 0.00020579807460308075, 0.0002122744917869568, 0.00021875090897083282, 0.00022522732615470886, 0.0002317037433385849, 0.00023818016052246094]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 14.0, 18.0, 24.0, 23.0, 32.0, 41.0, 51.0, 75.0, 98.0, 125.0, 182.0, 250.0, 391.0, 605.0, 905.0, 1448.0, 2351.0, 4123.0, 7429.0, 13890.0, 29452.0, 74275.0, 273029.0, 441188.0, 116291.0, 41129.0, 18452.0, 9440.0, 5146.0, 2939.0, 1781.0, 1068.0, 732.0, 440.0, 280.0, 241.0, 131.0, 97.0, 92.0, 67.0, 63.0, 23.0, 28.0, 19.0, 11.0, 19.0, 14.0, 6.0, 3.0, 1.0, 6.0, 3.0, 0.0, 1.0, 4.0], "bins": [-5.71875, -5.5411376953125, -5.363525390625, -5.1859130859375, -5.00830078125, -4.8306884765625, -4.653076171875, -4.4754638671875, -4.2978515625, -4.1202392578125, -3.942626953125, -3.7650146484375, -3.58740234375, -3.4097900390625, -3.232177734375, -3.0545654296875, -2.876953125, -2.6993408203125, -2.521728515625, -2.3441162109375, -2.16650390625, -1.9888916015625, -1.811279296875, -1.6336669921875, -1.4560546875, -1.2784423828125, -1.100830078125, -0.9232177734375, -0.74560546875, -0.5679931640625, -0.390380859375, -0.2127685546875, -0.03515625, 0.1424560546875, 0.320068359375, 0.4976806640625, 0.67529296875, 0.8529052734375, 1.030517578125, 1.2081298828125, 1.3857421875, 1.5633544921875, 1.740966796875, 1.9185791015625, 2.09619140625, 2.2738037109375, 2.451416015625, 2.6290283203125, 2.806640625, 2.9842529296875, 3.161865234375, 3.3394775390625, 3.51708984375, 3.6947021484375, 3.872314453125, 4.0499267578125, 4.2275390625, 4.4051513671875, 4.582763671875, 4.7603759765625, 4.93798828125, 5.1156005859375, 5.293212890625, 5.4708251953125, 5.6484375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 6.0, 14.0, 16.0, 18.0, 32.0, 55.0, 48.0, 69.0, 93.0, 115.0, 114.0, 97.0, 85.0, 56.0, 39.0, 27.0, 26.0, 20.0, 14.0, 13.0, 8.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5546875, -2.474884033203125, -2.39508056640625, -2.315277099609375, -2.2354736328125, -2.155670166015625, -2.07586669921875, -1.996063232421875, -1.916259765625, -1.836456298828125, -1.75665283203125, -1.676849365234375, -1.5970458984375, -1.517242431640625, -1.43743896484375, -1.357635498046875, -1.27783203125, -1.198028564453125, -1.11822509765625, -1.038421630859375, -0.9586181640625, -0.878814697265625, -0.79901123046875, -0.719207763671875, -0.639404296875, -0.559600830078125, -0.47979736328125, -0.399993896484375, -0.3201904296875, -0.240386962890625, -0.16058349609375, -0.080780029296875, -0.0009765625, 0.078826904296875, 0.15863037109375, 0.238433837890625, 0.3182373046875, 0.398040771484375, 0.47784423828125, 0.557647705078125, 0.637451171875, 0.717254638671875, 0.79705810546875, 0.876861572265625, 0.9566650390625, 1.036468505859375, 1.11627197265625, 1.196075439453125, 1.27587890625, 1.355682373046875, 1.43548583984375, 1.515289306640625, 1.5950927734375, 1.674896240234375, 1.75469970703125, 1.834503173828125, 1.914306640625, 1.994110107421875, 2.07391357421875, 2.153717041015625, 2.2335205078125, 2.313323974609375, 2.39312744140625, 2.472930908203125, 2.552734375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 10.0, 12.0, 10.0, 19.0, 25.0, 26.0, 33.0, 46.0, 50.0, 52.0, 76.0, 86.0, 103.0, 80.0, 70.0, 50.0, 44.0, 35.0, 29.0, 14.0, 25.0, 13.0, 9.0, 11.0, 4.0, 8.0, 3.0, 5.0, 3.0, 7.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-19.53854751586914, -19.036327362060547, -18.53410530090332, -18.031885147094727, -17.529664993286133, -17.027442932128906, -16.525222778320312, -16.02300262451172, -15.520780563354492, -15.018559455871582, -14.516339302062988, -14.014118194580078, -13.511897087097168, -13.009675979614258, -12.507455825805664, -12.005234718322754, -11.50301456451416, -11.00079345703125, -10.498573303222656, -9.996352195739746, -9.494131088256836, -8.991910934448242, -8.489689826965332, -7.987468719482422, -7.48524808883667, -6.983027458190918, -6.480806350708008, -5.978585720062256, -5.476365089416504, -4.974143981933594, -4.471923351287842, -3.9697024822235107, -3.4674816131591797, -2.9652607440948486, -2.4630398750305176, -1.9608192443847656, -1.4585983753204346, -0.9563775062561035, -0.45415687561035156, 0.04806399345397949, 0.5502848625183105, 1.0525057315826416, 1.554726481437683, 2.0569472312927246, 2.5591681003570557, 3.0613889694213867, 3.5636096000671387, 4.065830230712891, 4.568051338195801, 5.070271968841553, 5.572493076324463, 6.074713706970215, 6.576934814453125, 7.079155445098877, 7.581376075744629, 8.083597183227539, 8.585817337036133, 9.088038444519043, 9.590258598327637, 10.092479705810547, 10.594700813293457, 11.096921920776367, 11.599142074584961, 12.101363182067871, 12.603584289550781]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 14.0, 16.0, 18.0, 14.0, 17.0, 22.0, 19.0, 37.0, 24.0, 41.0, 36.0, 38.0, 44.0, 61.0, 35.0, 52.0, 43.0, 44.0, 39.0, 33.0, 44.0, 47.0, 31.0, 34.0, 19.0, 29.0, 24.0, 17.0, 23.0, 17.0, 14.0, 11.0, 13.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.746007919311523, -18.150054931640625, -17.55410385131836, -16.958152770996094, -16.362199783325195, -15.766247749328613, -15.170295715332031, -14.57434368133545, -13.978391647338867, -13.382439613342285, -12.786487579345703, -12.190535545349121, -11.594583511352539, -10.998631477355957, -10.402679443359375, -9.806727409362793, -9.210775375366211, -8.614823341369629, -8.018871307373047, -7.422919273376465, -6.826967239379883, -6.231015205383301, -5.635063171386719, -5.039111137390137, -4.443159103393555, -3.8472070693969727, -3.2512550354003906, -2.6553030014038086, -2.0593509674072266, -1.4633989334106445, -0.8674468994140625, -0.27149486541748047, 0.3244590759277344, 0.9204111099243164, 1.5163631439208984, 2.1123151779174805, 2.7082672119140625, 3.3042192459106445, 3.9001712799072266, 4.496123313903809, 5.092075347900391, 5.688027381896973, 6.283979415893555, 6.879931449890137, 7.475883483886719, 8.0718355178833, 8.667787551879883, 9.263739585876465, 9.859691619873047, 10.455643653869629, 11.051595687866211, 11.647547721862793, 12.243499755859375, 12.839451789855957, 13.435403823852539, 14.031355857849121, 14.627307891845703, 15.223259925842285, 15.819211959838867, 16.415164947509766, 17.01111602783203, 17.607067108154297, 18.203020095825195, 18.798973083496094, 19.39492416381836]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 5.0, 2.0, 6.0, 8.0, 11.0, 21.0, 16.0, 20.0, 27.0, 33.0, 45.0, 44.0, 44.0, 63.0, 82.0, 103.0, 115.0, 143.0, 184.0, 290.0, 487.0, 1023.0, 518430.0, 1271.0, 546.0, 251.0, 188.0, 142.0, 103.0, 87.0, 74.0, 65.0, 47.0, 51.0, 51.0, 30.0, 48.0, 22.0, 13.0, 15.0, 19.0, 12.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-201.6122589111328, -195.02061462402344, -188.428955078125, -181.83731079101562, -175.2456512451172, -168.6540069580078, -162.06234741210938, -155.470703125, -148.87905883789062, -142.28741455078125, -135.6957550048828, -129.10411071777344, -122.512451171875, -115.92080688476562, -109.32915496826172, -102.73750305175781, -96.14584350585938, -89.55419158935547, -82.96253967285156, -76.37089538574219, -69.77923583984375, -63.18758773803711, -56.59593963623047, -50.00428771972656, -43.412635803222656, -36.82098388671875, -30.229333877563477, -23.637683868408203, -17.046031951904297, -10.45438003540039, -3.86273193359375, 2.7289199829101562, 9.320556640625, 15.91220760345459, 22.50385856628418, 29.095508575439453, 35.68716049194336, 42.278812408447266, 48.870460510253906, 55.46211242675781, 62.05376434326172, 68.64541625976562, 75.23706817626953, 81.82872009277344, 88.42036437988281, 95.01202392578125, 101.60366821289062, 108.19532012939453, 114.78697204589844, 121.37862396240234, 127.97027587890625, 134.56192016601562, 141.15357971191406, 147.74522399902344, 154.33688354492188, 160.92852783203125, 167.52017211914062, 174.11181640625, 180.70347595214844, 187.2951202392578, 193.88677978515625, 200.47842407226562, 207.070068359375, 213.66172790527344, 220.25338745117188]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 11.0, 13.0, 19.0, 17.0, 14.0, 16.0, 23.0, 21.0, 28.0, 31.0, 42.0, 34.0, 35.0, 45.0, 59.0, 38.0, 51.0, 1063.0, 46.0, 38.0, 36.0, 44.0, 43.0, 36.0, 34.0, 24.0, 26.0, 22.0, 18.0, 22.0, 19.0, 13.0, 11.0, 12.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-541.4263916015625, -524.1692504882812, -506.9120788574219, -489.6549377441406, -472.39776611328125, -455.140625, -437.88348388671875, -420.6263427734375, -403.3691711425781, -386.1120300292969, -368.8548583984375, -351.59771728515625, -334.340576171875, -317.0834045410156, -299.8262634277344, -282.569091796875, -265.31195068359375, -248.05479431152344, -230.79763793945312, -213.54049682617188, -196.28334045410156, -179.02618408203125, -161.76904296875, -144.5118865966797, -127.25473022460938, -109.99757385253906, -92.74042510986328, -75.4832763671875, -58.22611999511719, -40.968963623046875, -23.711814880371094, -6.4546661376953125, 10.802490234375, 28.059642791748047, 45.316795349121094, 62.57394790649414, 79.83110046386719, 97.0882568359375, 114.34540557861328, 131.60255432128906, 148.85971069335938, 166.1168670654297, 183.3740234375, 200.63116455078125, 217.88832092285156, 235.14547729492188, 252.40261840820312, 269.6597900390625, 286.91693115234375, 304.174072265625, 321.4312438964844, 338.6883850097656, 355.945556640625, 373.20269775390625, 390.4598388671875, 407.71697998046875, 424.9741516113281, 442.2312927246094, 459.48846435546875, 476.74560546875, 494.00274658203125, 511.2599182128906, 528.51708984375, 545.7742309570312, 563.0313720703125]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 9.0, 11.0, 15.0, 13.0, 17.0, 9.0, 7.0, 17.0, 17.0, 11.0, 21.0, 14.0, 14.0, 15.0, 13.0, 14.0, 16.0, 23.0, 32.0, 53.0, 77.0, 179.0, 274.0, 670.0, 2068.0, 5384.0, 8492.0, 9970.0, 31197424.0, 25400.0, 1933.0, 1414.0, 208.0, 142.0, 15.0, 10.0, 16.0, 16.0, 19.0, 22.0, 45.0, 35.0, 28.0, 41.0, 49.0, 194.0], "bins": [-2616.0, -2559.375, -2502.75, -2446.125, -2389.5, -2332.875, -2276.25, -2219.625, -2163.0, -2106.375, -2049.75, -1993.125, -1936.5, -1879.875, -1823.25, -1766.625, -1710.0, -1653.375, -1596.75, -1540.125, -1483.5, -1426.875, -1370.25, -1313.625, -1257.0, -1200.375, -1143.75, -1087.125, -1030.5, -973.875, -917.25, -860.625, -804.0, -747.375, -690.75, -634.125, -577.5, -520.875, -464.25, -407.625, -351.0, -294.375, -237.75, -181.125, -124.5, -67.875, -11.25, 45.375, 102.0, 158.625, 215.25, 271.875, 328.5, 385.125, 441.75, 498.375, 555.0, 611.625, 668.25, 724.875, 781.5, 838.125, 894.75, 951.375, 1008.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 14.0, 16.0, 22.0, 29.0, 54.0, 65.0, 88.0, 105.0, 174.0, 280.0, 377.0, 508.0, 726.0, 1014.0, 1514.0, 2013.0, 2877.0, 4130.0, 5923.0, 8351.0, 12231.0, 18070.0, 27509.0, 41464.0, 65785.0, 107865.0, 186654.0, 377034.0, 3352509.0, 1308493.0, 322861.0, 167314.0, 97355.0, 60030.0, 38411.0, 25099.0, 16611.0, 11363.0, 7997.0, 5383.0, 3776.0, 2813.0, 1941.0, 1299.0, 905.0, 722.0, 530.0, 358.0, 230.0, 165.0, 119.0, 106.0, 63.0, 36.0, 18.0, 21.0, 13.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0], "bins": [-10.09375, -9.7562255859375, -9.418701171875, -9.0811767578125, -8.74365234375, -8.4061279296875, -8.068603515625, -7.7310791015625, -7.3935546875, -7.0560302734375, -6.718505859375, -6.3809814453125, -6.04345703125, -5.7059326171875, -5.368408203125, -5.0308837890625, -4.693359375, -4.3558349609375, -4.018310546875, -3.6807861328125, -3.34326171875, -3.0057373046875, -2.668212890625, -2.3306884765625, -1.9931640625, -1.6556396484375, -1.318115234375, -0.9805908203125, -0.64306640625, -0.3055419921875, 0.031982421875, 0.3695068359375, 0.70703125, 1.0445556640625, 1.382080078125, 1.7196044921875, 2.05712890625, 2.3946533203125, 2.732177734375, 3.0697021484375, 3.4072265625, 3.7447509765625, 4.082275390625, 4.4197998046875, 4.75732421875, 5.0948486328125, 5.432373046875, 5.7698974609375, 6.107421875, 6.4449462890625, 6.782470703125, 7.1199951171875, 7.45751953125, 7.7950439453125, 8.132568359375, 8.4700927734375, 8.8076171875, 9.1451416015625, 9.482666015625, 9.8201904296875, 10.15771484375, 10.4952392578125, 10.832763671875, 11.1702880859375, 11.5078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 7.0, 8.0, 7.0, 12.0, 12.0, 12.0, 17.0, 24.0, 15.0, 24.0, 34.0, 34.0, 44.0, 37.0, 57.0, 65.0, 93.0, 247.0, 596.0, 170.0, 86.0, 55.0, 50.0, 41.0, 28.0, 28.0, 34.0, 24.0, 27.0, 19.0, 15.0, 18.0, 17.0, 9.0, 7.0, 10.0, 9.0, 5.0, 4.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.953125, -19.2724609375, -18.591796875, -17.9111328125, -17.23046875, -16.5498046875, -15.869140625, -15.1884765625, -14.5078125, -13.8271484375, -13.146484375, -12.4658203125, -11.78515625, -11.1044921875, -10.423828125, -9.7431640625, -9.0625, -8.3818359375, -7.701171875, -7.0205078125, -6.33984375, -5.6591796875, -4.978515625, -4.2978515625, -3.6171875, -2.9365234375, -2.255859375, -1.5751953125, -0.89453125, -0.2138671875, 0.466796875, 1.1474609375, 1.828125, 2.5087890625, 3.189453125, 3.8701171875, 4.55078125, 5.2314453125, 5.912109375, 6.5927734375, 7.2734375, 7.9541015625, 8.634765625, 9.3154296875, 9.99609375, 10.6767578125, 11.357421875, 12.0380859375, 12.71875, 13.3994140625, 14.080078125, 14.7607421875, 15.44140625, 16.1220703125, 16.802734375, 17.4833984375, 18.1640625, 18.8447265625, 19.525390625, 20.2060546875, 20.88671875, 21.5673828125, 22.248046875, 22.9287109375, 23.609375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 6.0, 12.0, 9.0, 25.0, 32.0, 23.0, 50.0, 63.0, 72.0, 162.0, 198.0, 309.0, 375.0, 598.0, 819.0, 1254.0, 1889.0, 2782.0, 4267.0, 6379.0, 10185.0, 15496.0, 24829.0, 40357.0, 66779.0, 114835.0, 209964.0, 471471.0, 3704196.0, 935702.0, 300108.0, 153094.0, 86548.0, 50976.0, 31430.0, 19614.0, 12535.0, 8018.0, 5157.0, 3396.0, 2321.0, 1533.0, 1060.0, 775.0, 538.0, 328.0, 243.0, 192.0, 151.0, 91.0, 52.0, 35.0, 22.0, 32.0, 15.0, 11.0, 9.0, 12.0, 5.0, 3.0, 5.0], "bins": [-10.7890625, -10.44921875, -10.109375, -9.76953125, -9.4296875, -9.08984375, -8.75, -8.41015625, -8.0703125, -7.73046875, -7.390625, -7.05078125, -6.7109375, -6.37109375, -6.03125, -5.69140625, -5.3515625, -5.01171875, -4.671875, -4.33203125, -3.9921875, -3.65234375, -3.3125, -2.97265625, -2.6328125, -2.29296875, -1.953125, -1.61328125, -1.2734375, -0.93359375, -0.59375, -0.25390625, 0.0859375, 0.42578125, 0.765625, 1.10546875, 1.4453125, 1.78515625, 2.125, 2.46484375, 2.8046875, 3.14453125, 3.484375, 3.82421875, 4.1640625, 4.50390625, 4.84375, 5.18359375, 5.5234375, 5.86328125, 6.203125, 6.54296875, 6.8828125, 7.22265625, 7.5625, 7.90234375, 8.2421875, 8.58203125, 8.921875, 9.26171875, 9.6015625, 9.94140625, 10.28125, 10.62109375, 10.9609375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 6.0, 10.0, 12.0, 12.0, 8.0, 23.0, 23.0, 20.0, 35.0, 27.0, 42.0, 46.0, 45.0, 61.0, 67.0, 96.0, 215.0, 565.0, 186.0, 96.0, 71.0, 42.0, 31.0, 45.0, 30.0, 33.0, 25.0, 24.0, 17.0, 14.0, 15.0, 18.0, 11.0, 12.0, 5.0, 10.0, 4.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4921875, -14.0169677734375, -13.541748046875, -13.0665283203125, -12.59130859375, -12.1160888671875, -11.640869140625, -11.1656494140625, -10.6904296875, -10.2152099609375, -9.739990234375, -9.2647705078125, -8.78955078125, -8.3143310546875, -7.839111328125, -7.3638916015625, -6.888671875, -6.4134521484375, -5.938232421875, -5.4630126953125, -4.98779296875, -4.5125732421875, -4.037353515625, -3.5621337890625, -3.0869140625, -2.6116943359375, -2.136474609375, -1.6612548828125, -1.18603515625, -0.7108154296875, -0.235595703125, 0.2396240234375, 0.71484375, 1.1900634765625, 1.665283203125, 2.1405029296875, 2.61572265625, 3.0909423828125, 3.566162109375, 4.0413818359375, 4.5166015625, 4.9918212890625, 5.467041015625, 5.9422607421875, 6.41748046875, 6.8927001953125, 7.367919921875, 7.8431396484375, 8.318359375, 8.7935791015625, 9.268798828125, 9.7440185546875, 10.21923828125, 10.6944580078125, 11.169677734375, 11.6448974609375, 12.1201171875, 12.5953369140625, 13.070556640625, 13.5457763671875, 14.02099609375, 14.4962158203125, 14.971435546875, 15.4466552734375, 15.921875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [8.0, 9.0, 6.0, 1.0, 7.0, 8.0, 25.0, 20.0, 20.0, 38.0, 30.0, 19.0, 40.0, 72.0, 90.0, 132.0, 160.0, 214.0, 229.0, 382.0, 551.0, 623.0, 1103.0, 1643.0, 2366.0, 4281.0, 7866.0, 17331.0, 46057.0, 259817.0, 5834611.0, 66763.0, 22937.0, 9870.0, 5096.0, 2832.0, 1791.0, 1258.0, 821.0, 570.0, 427.0, 342.0, 254.0, 173.0, 155.0, 107.0, 83.0, 52.0, 32.0, 37.0, 12.0, 11.0, 10.0, 12.0, 14.0, 11.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 5.0, 4.0], "bins": [-30.15625, -29.15625, -28.15625, -27.15625, -26.15625, -25.15625, -24.15625, -23.15625, -22.15625, -21.15625, -20.15625, -19.15625, -18.15625, -17.15625, -16.15625, -15.15625, -14.15625, -13.15625, -12.15625, -11.15625, -10.15625, -9.15625, -8.15625, -7.15625, -6.15625, -5.15625, -4.15625, -3.15625, -2.15625, -1.15625, -0.15625, 0.84375, 1.84375, 2.84375, 3.84375, 4.84375, 5.84375, 6.84375, 7.84375, 8.84375, 9.84375, 10.84375, 11.84375, 12.84375, 13.84375, 14.84375, 15.84375, 16.84375, 17.84375, 18.84375, 19.84375, 20.84375, 21.84375, 22.84375, 23.84375, 24.84375, 25.84375, 26.84375, 27.84375, 28.84375, 29.84375, 30.84375, 31.84375, 32.84375, 33.84375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 7.0, 12.0, 15.0, 21.0, 21.0, 19.0, 25.0, 23.0, 46.0, 40.0, 44.0, 38.0, 55.0, 77.0, 100.0, 158.0, 460.0, 278.0, 125.0, 73.0, 57.0, 42.0, 40.0, 25.0, 35.0, 20.0, 21.0, 20.0, 19.0, 21.0, 11.0, 10.0, 10.0, 11.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.5625, -9.2296142578125, -8.896728515625, -8.5638427734375, -8.23095703125, -7.8980712890625, -7.565185546875, -7.2322998046875, -6.8994140625, -6.5665283203125, -6.233642578125, -5.9007568359375, -5.56787109375, -5.2349853515625, -4.902099609375, -4.5692138671875, -4.236328125, -3.9034423828125, -3.570556640625, -3.2376708984375, -2.90478515625, -2.5718994140625, -2.239013671875, -1.9061279296875, -1.5732421875, -1.2403564453125, -0.907470703125, -0.5745849609375, -0.24169921875, 0.0911865234375, 0.424072265625, 0.7569580078125, 1.08984375, 1.4227294921875, 1.755615234375, 2.0885009765625, 2.42138671875, 2.7542724609375, 3.087158203125, 3.4200439453125, 3.7529296875, 4.0858154296875, 4.418701171875, 4.7515869140625, 5.08447265625, 5.4173583984375, 5.750244140625, 6.0831298828125, 6.416015625, 6.7489013671875, 7.081787109375, 7.4146728515625, 7.74755859375, 8.0804443359375, 8.413330078125, 8.7462158203125, 9.0791015625, 9.4119873046875, 9.744873046875, 10.0777587890625, 10.41064453125, 10.7435302734375, 11.076416015625, 11.4093017578125, 11.7421875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 8.0, 14.0, 22.0, 51.0, 91.0, 330.0, 287.0, 87.0, 45.0, 30.0, 16.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.31144714355469, -66.82640838623047, -65.34136962890625, -63.85633087158203, -62.37129592895508, -60.88625717163086, -59.40121841430664, -57.91617965698242, -56.43114471435547, -54.94610595703125, -53.46106719970703, -51.97602844238281, -50.49099349975586, -49.00595474243164, -47.52091598510742, -46.0358772277832, -44.550838470458984, -43.065799713134766, -41.58076095581055, -40.095726013183594, -38.610687255859375, -37.125648498535156, -35.64060974121094, -34.15557098388672, -32.6705322265625, -31.18549346923828, -29.700456619262695, -28.215417861938477, -26.73038101196289, -25.245342254638672, -23.760303497314453, -22.275264739990234, -20.790233612060547, -19.305194854736328, -17.820158004760742, -16.335119247436523, -14.850081443786621, -13.365043640136719, -11.8800048828125, -10.394967079162598, -8.909929275512695, -7.424891471862793, -5.939853191375732, -4.454814910888672, -2.9697771072387695, -1.4847393035888672, 0.0002994537353515625, 1.485337257385254, 2.9703750610351562, 4.455412864685059, 5.940451145172119, 7.42548942565918, 8.910527229309082, 10.395565032958984, 11.880603790283203, 13.365641593933105, 14.850679397583008, 16.335718154907227, 17.820755004882812, 19.30579376220703, 20.79083251953125, 22.275869369506836, 23.760908126831055, 25.24594497680664, 26.73098373413086]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 5.0, 17.0, 9.0, 10.0, 11.0, 15.0, 17.0, 30.0, 21.0, 22.0, 29.0, 22.0, 29.0, 33.0, 29.0, 44.0, 43.0, 44.0, 45.0, 48.0, 34.0, 37.0, 40.0, 33.0, 41.0, 27.0, 31.0, 22.0, 25.0, 16.0, 22.0, 23.0, 18.0, 19.0, 12.0, 12.0, 9.0, 11.0, 7.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.023988723754883, -13.59156322479248, -13.159136772155762, -12.72671127319336, -12.29428482055664, -11.861859321594238, -11.429433822631836, -10.997007369995117, -10.564580917358398, -10.132155418395996, -9.699728965759277, -9.267303466796875, -8.834877014160156, -8.402451515197754, -7.970025539398193, -7.537599563598633, -7.1051740646362305, -6.67274808883667, -6.240322113037109, -5.807896614074707, -5.375470161437988, -4.943044662475586, -4.510618686676025, -4.078192710876465, -3.6457667350769043, -3.2133407592773438, -2.780914783477783, -2.3484890460968018, -1.9160630702972412, -1.4836370944976807, -1.0512113571166992, -0.6187853813171387, -0.18635940551757812, 0.24606651067733765, 0.6784924268722534, 1.1109182834625244, 1.543344259262085, 1.9757702350616455, 2.408195972442627, 2.8406219482421875, 3.273047924041748, 3.7054738998413086, 4.137899875640869, 4.57032585144043, 5.002751350402832, 5.435177803039551, 5.867603302001953, 6.300029277801514, 6.732455253601074, 7.164881229400635, 7.597307205200195, 8.029732704162598, 8.462159156799316, 8.894584655761719, 9.327011108398438, 9.75943660736084, 10.191862106323242, 10.624287605285645, 11.056714057922363, 11.489139556884766, 11.921566009521484, 12.353991508483887, 12.786417007446289, 13.218843460083008, 13.651269912719727]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 13.0, 13.0, 15.0, 23.0, 35.0, 49.0, 69.0, 86.0, 166.0, 226.0, 372.0, 575.0, 1007.0, 1759.0, 3428.0, 8099.0, 27628.0, 4087837.0, 42629.0, 11136.0, 4404.0, 2067.0, 1117.0, 579.0, 328.0, 196.0, 127.0, 93.0, 50.0, 43.0, 30.0, 18.0, 11.0, 9.0, 13.0, 7.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.04144287109375, -0.04009056091308594, -0.038738250732421875, -0.03738594055175781, -0.03603363037109375, -0.03468132019042969, -0.033329010009765625, -0.03197669982910156, -0.0306243896484375, -0.029272079467773438, -0.027919769287109375, -0.026567459106445312, -0.02521514892578125, -0.023862838745117188, -0.022510528564453125, -0.021158218383789062, -0.019805908203125, -0.018453598022460938, -0.017101287841796875, -0.015748977661132812, -0.01439666748046875, -0.013044357299804688, -0.011692047119140625, -0.010339736938476562, -0.0089874267578125, -0.0076351165771484375, -0.006282806396484375, -0.0049304962158203125, -0.00357818603515625, -0.0022258758544921875, -0.000873565673828125, 0.0004787445068359375, 0.0018310546875, 0.0031833648681640625, 0.004535675048828125, 0.0058879852294921875, 0.00724029541015625, 0.008592605590820312, 0.009944915771484375, 0.011297225952148438, 0.0126495361328125, 0.014001846313476562, 0.015354156494140625, 0.016706466674804688, 0.01805877685546875, 0.019411087036132812, 0.020763397216796875, 0.022115707397460938, 0.023468017578125, 0.024820327758789062, 0.026172637939453125, 0.027524948120117188, 0.02887725830078125, 0.030229568481445312, 0.031581878662109375, 0.03293418884277344, 0.0342864990234375, 0.03563880920410156, 0.036991119384765625, 0.03834342956542969, 0.03969573974609375, 0.04104804992675781, 0.042400360107421875, 0.04375267028808594, 0.04510498046875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 6.0, 6.0, 15.0, 7.0, 20.0, 14.0, 15.0, 38.0, 764.0, 21.0, 11.0, 13.0, 9.0, 8.0, 7.0, 6.0, 8.0, 4.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002384185791015625, -0.00230562686920166, -0.0022270679473876953, -0.0021485090255737305, -0.0020699501037597656, -0.0019913911819458008, -0.001912832260131836, -0.001834273338317871, -0.0017557144165039062, -0.0016771554946899414, -0.0015985965728759766, -0.0015200376510620117, -0.0014414787292480469, -0.001362919807434082, -0.0012843608856201172, -0.0012058019638061523, -0.0011272430419921875, -0.0010486841201782227, -0.0009701251983642578, -0.000891566276550293, -0.0008130073547363281, -0.0007344484329223633, -0.0006558895111083984, -0.0005773305892944336, -0.0004987716674804688, -0.0004202127456665039, -0.00034165382385253906, -0.0002630949020385742, -0.00018453598022460938, -0.00010597705841064453, -2.7418136596679688e-05, 5.1140785217285156e-05, 0.00012969970703125, 0.00020825862884521484, 0.0002868175506591797, 0.00036537647247314453, 0.0004439353942871094, 0.0005224943161010742, 0.0006010532379150391, 0.0006796121597290039, 0.0007581710815429688, 0.0008367300033569336, 0.0009152889251708984, 0.0009938478469848633, 0.0010724067687988281, 0.001150965690612793, 0.0012295246124267578, 0.0013080835342407227, 0.0013866424560546875, 0.0014652013778686523, 0.0015437602996826172, 0.001622319221496582, 0.0017008781433105469, 0.0017794370651245117, 0.0018579959869384766, 0.0019365549087524414, 0.0020151138305664062, 0.002093672752380371, 0.002172231674194336, 0.0022507905960083008, 0.0023293495178222656, 0.0024079084396362305, 0.0024864673614501953, 0.00256502628326416, 0.002643585205078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 18.0, 11.0, 21.0, 23.0, 35.0, 43.0, 68.0, 98.0, 133.0, 184.0, 282.0, 476.0, 785.0, 1354.0, 2771.0, 7020.0, 30257.0, 3646311.0, 470796.0, 22288.0, 5790.0, 2373.0, 1176.0, 675.0, 425.0, 274.0, 140.0, 153.0, 76.0, 70.0, 38.0, 30.0, 17.0, 18.0, 8.0, 9.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.05401611328125, -0.052423954010009766, -0.05083179473876953, -0.0492396354675293, -0.04764747619628906, -0.04605531692504883, -0.044463157653808594, -0.04287099838256836, -0.041278839111328125, -0.03968667984008789, -0.038094520568847656, -0.03650236129760742, -0.03491020202636719, -0.03331804275512695, -0.03172588348388672, -0.030133724212646484, -0.02854156494140625, -0.026949405670166016, -0.02535724639892578, -0.023765087127685547, -0.022172927856445312, -0.020580768585205078, -0.018988609313964844, -0.01739645004272461, -0.015804290771484375, -0.01421213150024414, -0.012619972229003906, -0.011027812957763672, -0.009435653686523438, -0.007843494415283203, -0.006251335144042969, -0.004659175872802734, -0.0030670166015625, -0.0014748573303222656, 0.00011730194091796875, 0.0017094612121582031, 0.0033016204833984375, 0.004893779754638672, 0.006485939025878906, 0.00807809829711914, 0.009670257568359375, 0.01126241683959961, 0.012854576110839844, 0.014446735382080078, 0.016038894653320312, 0.017631053924560547, 0.01922321319580078, 0.020815372467041016, 0.02240753173828125, 0.023999691009521484, 0.02559185028076172, 0.027184009552001953, 0.028776168823242188, 0.030368328094482422, 0.031960487365722656, 0.03355264663696289, 0.035144805908203125, 0.03673696517944336, 0.038329124450683594, 0.03992128372192383, 0.04151344299316406, 0.0431056022644043, 0.04469776153564453, 0.046289920806884766, 0.047882080078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 10.0, 4.0, 10.0, 10.0, 13.0, 5.0, 16.0, 26.0, 16.0, 30.0, 27.0, 40.0, 51.0, 60.0, 82.0, 103.0, 209.0, 2182.0, 583.0, 167.0, 98.0, 59.0, 44.0, 42.0, 37.0, 38.0, 20.0, 26.0, 16.0, 11.0, 11.0, 12.0, 3.0, 2.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005908966064453125, -0.00574415922164917, -0.005579352378845215, -0.00541454553604126, -0.005249738693237305, -0.00508493185043335, -0.0049201250076293945, -0.0047553181648254395, -0.004590511322021484, -0.004425704479217529, -0.004260897636413574, -0.004096090793609619, -0.003931283950805664, -0.003766477108001709, -0.003601670265197754, -0.003436863422393799, -0.0032720565795898438, -0.0031072497367858887, -0.0029424428939819336, -0.0027776360511779785, -0.0026128292083740234, -0.0024480223655700684, -0.0022832155227661133, -0.002118408679962158, -0.001953601837158203, -0.001788794994354248, -0.001623988151550293, -0.0014591813087463379, -0.0012943744659423828, -0.0011295676231384277, -0.0009647607803344727, -0.0007999539375305176, -0.0006351470947265625, -0.0004703402519226074, -0.00030553340911865234, -0.00014072656631469727, 2.4080276489257812e-05, 0.0001888871192932129, 0.00035369396209716797, 0.000518500804901123, 0.0006833076477050781, 0.0008481144905090332, 0.0010129213333129883, 0.0011777281761169434, 0.0013425350189208984, 0.0015073418617248535, 0.0016721487045288086, 0.0018369555473327637, 0.0020017623901367188, 0.002166569232940674, 0.002331376075744629, 0.002496182918548584, 0.002660989761352539, 0.002825796604156494, 0.0029906034469604492, 0.0031554102897644043, 0.0033202171325683594, 0.0034850239753723145, 0.0036498308181762695, 0.0038146376609802246, 0.00397944450378418, 0.004144251346588135, 0.00430905818939209, 0.004473865032196045, 0.004638671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 10.0, 17.0, 46.0, 102.0, 453.0, 246.0, 72.0, 20.0, 12.0, 10.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09733083844184875, -0.09505892544984818, -0.0927870124578476, -0.09051509201526642, -0.08824317902326584, -0.08597126603126526, -0.08369935303926468, -0.0814274400472641, -0.07915551960468292, -0.07688360661268234, -0.07461169362068176, -0.07233977317810059, -0.0700678601861, -0.06779594719409943, -0.06552403420209885, -0.06325212121009827, -0.06098020449280739, -0.05870829150080681, -0.05643637478351593, -0.05416446179151535, -0.05189254507422447, -0.04962063208222389, -0.047348715364933014, -0.045076802372932434, -0.042804889380931854, -0.040532976388931274, -0.038261059671640396, -0.035989146679639816, -0.03371722996234894, -0.03144531697034836, -0.02917340211570263, -0.0269014872610569, -0.02462957426905632, -0.02235765941441059, -0.020085744559764862, -0.017813831567764282, -0.015541915781795979, -0.01327000092715025, -0.010998087003827095, -0.008726172149181366, -0.006454257294535637, -0.004182342439889908, -0.001910428050905466, 0.0003614863380789757, 0.0026334011927247047, 0.004905316047370434, 0.007177229970693588, 0.009449144825339317, 0.011721059679985046, 0.013992974534630775, 0.016264889389276505, 0.018536802381277084, 0.020808719098567963, 0.023080632090568542, 0.02535254694521427, 0.02762446179986, 0.02989637665450573, 0.03216829150915146, 0.03444020450115204, 0.03671212121844292, 0.0389840342104435, 0.041255950927734375, 0.043527863919734955, 0.045799776911735535, 0.04807169362902641]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 4.0, 10.0, 14.0, 13.0, 16.0, 34.0, 17.0, 24.0, 39.0, 30.0, 44.0, 37.0, 55.0, 68.0, 68.0, 60.0, 64.0, 55.0, 52.0, 53.0, 39.0, 39.0, 44.0, 23.0, 23.0, 8.0, 11.0, 17.0, 11.0, 9.0, 7.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.026553034782409668, -0.025897014886140823, -0.025240996852517128, -0.024584978818893433, -0.023928958922624588, -0.023272939026355743, -0.022616920992732048, -0.021960902959108353, -0.021304883062839508, -0.020648863166570663, -0.019992845132946968, -0.019336827099323273, -0.018680807203054428, -0.018024787306785583, -0.017368769273161888, -0.016712751239538193, -0.016056731343269348, -0.015400712378323078, -0.014744693413376808, -0.014088674448430538, -0.013432655483484268, -0.012776636518537998, -0.012120617553591728, -0.011464598588645458, -0.010808579623699188, -0.010152560658752918, -0.009496541693806648, -0.008840522728860378, -0.008184503763914108, -0.007528484798967838, -0.006872465834021568, -0.006216446869075298, -0.005560427904129028, -0.004904408939182758, -0.004248389974236488, -0.0035923710092902184, -0.0029363520443439484, -0.0022803330793976784, -0.0016243141144514084, -0.0009682951495051384, -0.0003122761845588684, 0.0003437427803874016, 0.0009997617453336716, 0.0016557807102799416, 0.0023117996752262115, 0.0029678186401724815, 0.0036238376051187515, 0.0042798565700650215, 0.0049358755350112915, 0.0055918944999575615, 0.0062479134649038315, 0.0069039324298501015, 0.0075599513947963715, 0.008215970359742641, 0.008871989324688911, 0.009528008289635181, 0.010184027254581451, 0.010840046219527721, 0.011496065184473991, 0.012152084149420261, 0.012808103114366531, 0.013464122079312801, 0.014120141044259071, 0.014776160009205341, 0.015432178974151611]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 11.0, 11.0, 28.0, 27.0, 42.0, 46.0, 71.0, 95.0, 126.0, 188.0, 275.0, 399.0, 561.0, 885.0, 1327.0, 2113.0, 3670.0, 6625.0, 14066.0, 38992.0, 913547.0, 35851.0, 13395.0, 6543.0, 3607.0, 2088.0, 1284.0, 833.0, 546.0, 375.0, 216.0, 203.0, 128.0, 97.0, 77.0, 40.0, 35.0, 30.0, 20.0, 15.0, 14.0, 14.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0318603515625, -0.030848026275634766, -0.02983570098876953, -0.028823375701904297, -0.027811050415039062, -0.026798725128173828, -0.025786399841308594, -0.02477407455444336, -0.023761749267578125, -0.02274942398071289, -0.021737098693847656, -0.020724773406982422, -0.019712448120117188, -0.018700122833251953, -0.01768779754638672, -0.016675472259521484, -0.01566314697265625, -0.014650821685791016, -0.013638496398925781, -0.012626171112060547, -0.011613845825195312, -0.010601520538330078, -0.009589195251464844, -0.00857686996459961, -0.007564544677734375, -0.006552219390869141, -0.005539894104003906, -0.004527568817138672, -0.0035152435302734375, -0.002502918243408203, -0.0014905929565429688, -0.0004782676696777344, 0.0005340576171875, 0.0015463829040527344, 0.0025587081909179688, 0.003571033477783203, 0.0045833587646484375, 0.005595684051513672, 0.006608009338378906, 0.007620334625244141, 0.008632659912109375, 0.00964498519897461, 0.010657310485839844, 0.011669635772705078, 0.012681961059570312, 0.013694286346435547, 0.014706611633300781, 0.015718936920166016, 0.01673126220703125, 0.017743587493896484, 0.01875591278076172, 0.019768238067626953, 0.020780563354492188, 0.021792888641357422, 0.022805213928222656, 0.02381753921508789, 0.024829864501953125, 0.02584218978881836, 0.026854515075683594, 0.027866840362548828, 0.028879165649414062, 0.029891490936279297, 0.03090381622314453, 0.031916141510009766, 0.032928466796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 10.0, 9.0, 14.0, 16.0, 15.0, 23.0, 672.0, 126.0, 13.0, 13.0, 12.0, 8.0, 6.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002410888671875, -0.002332240343093872, -0.002253592014312744, -0.002174943685531616, -0.0020962953567504883, -0.0020176470279693604, -0.0019389986991882324, -0.0018603503704071045, -0.0017817020416259766, -0.0017030537128448486, -0.0016244053840637207, -0.0015457570552825928, -0.0014671087265014648, -0.001388460397720337, -0.001309812068939209, -0.001231163740158081, -0.0011525154113769531, -0.0010738670825958252, -0.0009952187538146973, -0.0009165704250335693, -0.0008379220962524414, -0.0007592737674713135, -0.0006806254386901855, -0.0006019771099090576, -0.0005233287811279297, -0.00044468045234680176, -0.00036603212356567383, -0.0002873837947845459, -0.00020873546600341797, -0.00013008713722229004, -5.143880844116211e-05, 2.720952033996582e-05, 0.00010585784912109375, 0.00018450617790222168, 0.0002631545066833496, 0.00034180283546447754, 0.00042045116424560547, 0.0004990994930267334, 0.0005777478218078613, 0.0006563961505889893, 0.0007350444793701172, 0.0008136928081512451, 0.000892341136932373, 0.000970989465713501, 0.001049637794494629, 0.0011282861232757568, 0.0012069344520568848, 0.0012855827808380127, 0.0013642311096191406, 0.0014428794384002686, 0.0015215277671813965, 0.0016001760959625244, 0.0016788244247436523, 0.0017574727535247803, 0.0018361210823059082, 0.0019147694110870361, 0.001993417739868164, 0.002072066068649292, 0.00215071439743042, 0.002229362726211548, 0.0023080110549926758, 0.0023866593837738037, 0.0024653077125549316, 0.0025439560413360596, 0.0026226043701171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 2.0, 9.0, 8.0, 9.0, 14.0, 24.0, 55.0, 46.0, 83.0, 120.0, 162.0, 254.0, 372.0, 612.0, 999.0, 1878.0, 3984.0, 9826.0, 48308.0, 896074.0, 65202.0, 11115.0, 4335.0, 2000.0, 1129.0, 725.0, 403.0, 243.0, 168.0, 117.0, 75.0, 53.0, 46.0, 33.0, 15.0, 16.0, 8.0, 6.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.051666259765625, -0.050079345703125, -0.048492431640625, -0.046905517578125, -0.045318603515625, -0.043731689453125, -0.042144775390625, -0.040557861328125, -0.038970947265625, -0.037384033203125, -0.035797119140625, -0.034210205078125, -0.032623291015625, -0.031036376953125, -0.029449462890625, -0.027862548828125, -0.026275634765625, -0.024688720703125, -0.023101806640625, -0.021514892578125, -0.019927978515625, -0.018341064453125, -0.016754150390625, -0.015167236328125, -0.013580322265625, -0.011993408203125, -0.010406494140625, -0.008819580078125, -0.007232666015625, -0.005645751953125, -0.004058837890625, -0.002471923828125, -0.000885009765625, 0.000701904296875, 0.002288818359375, 0.003875732421875, 0.005462646484375, 0.007049560546875, 0.008636474609375, 0.010223388671875, 0.011810302734375, 0.013397216796875, 0.014984130859375, 0.016571044921875, 0.018157958984375, 0.019744873046875, 0.021331787109375, 0.022918701171875, 0.024505615234375, 0.026092529296875, 0.027679443359375, 0.029266357421875, 0.030853271484375, 0.032440185546875, 0.034027099609375, 0.035614013671875, 0.037200927734375, 0.038787841796875, 0.040374755859375, 0.041961669921875, 0.043548583984375, 0.045135498046875, 0.046722412109375, 0.048309326171875, 0.049896240234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 1.0, 6.0, 5.0, 5.0, 4.0, 10.0, 15.0, 11.0, 19.0, 27.0, 40.0, 40.0, 36.0, 34.0, 34.0, 50.0, 40.0, 56.0, 37.0, 56.0, 56.0, 52.0, 34.0, 40.0, 34.0, 47.0, 35.0, 32.0, 24.0, 26.0, 17.0, 15.0, 9.0, 15.0, 4.0, 14.0, 3.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01047515869140625, -0.010152935981750488, -0.009830713272094727, -0.009508490562438965, -0.009186267852783203, -0.008864045143127441, -0.00854182243347168, -0.008219599723815918, -0.007897377014160156, -0.0075751543045043945, -0.007252931594848633, -0.006930708885192871, -0.006608486175537109, -0.006286263465881348, -0.005964040756225586, -0.005641818046569824, -0.0053195953369140625, -0.004997372627258301, -0.004675149917602539, -0.004352927207946777, -0.004030704498291016, -0.003708481788635254, -0.003386259078979492, -0.0030640363693237305, -0.0027418136596679688, -0.002419590950012207, -0.0020973682403564453, -0.0017751455307006836, -0.0014529228210449219, -0.0011307001113891602, -0.0008084774017333984, -0.0004862546920776367, -0.000164031982421875, 0.00015819072723388672, 0.00048041343688964844, 0.0008026361465454102, 0.0011248588562011719, 0.0014470815658569336, 0.0017693042755126953, 0.002091526985168457, 0.0024137496948242188, 0.0027359724044799805, 0.003058195114135742, 0.003380417823791504, 0.0037026405334472656, 0.004024863243103027, 0.004347085952758789, 0.004669308662414551, 0.0049915313720703125, 0.005313754081726074, 0.005635976791381836, 0.005958199501037598, 0.006280422210693359, 0.006602644920349121, 0.006924867630004883, 0.0072470903396606445, 0.007569313049316406, 0.007891535758972168, 0.00821375846862793, 0.008535981178283691, 0.008858203887939453, 0.009180426597595215, 0.009502649307250977, 0.009824872016906738, 0.0101470947265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 6.0, 13.0, 8.0, 20.0, 26.0, 57.0, 83.0, 265.0, 1656.0, 1004614.0, 40516.0, 915.0, 182.0, 46.0, 30.0, 28.0, 16.0, 13.0, 8.0, 11.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056365966796875, -0.05459785461425781, -0.052829742431640625, -0.05106163024902344, -0.04929351806640625, -0.04752540588378906, -0.045757293701171875, -0.04398918151855469, -0.0422210693359375, -0.04045295715332031, -0.038684844970703125, -0.03691673278808594, -0.03514862060546875, -0.03338050842285156, -0.031612396240234375, -0.029844284057617188, -0.028076171875, -0.026308059692382812, -0.024539947509765625, -0.022771835327148438, -0.02100372314453125, -0.019235610961914062, -0.017467498779296875, -0.015699386596679688, -0.0139312744140625, -0.012163162231445312, -0.010395050048828125, -0.008626937866210938, -0.00685882568359375, -0.0050907135009765625, -0.003322601318359375, -0.0015544891357421875, 0.000213623046875, 0.0019817352294921875, 0.003749847412109375, 0.0055179595947265625, 0.00728607177734375, 0.009054183959960938, 0.010822296142578125, 0.012590408325195312, 0.0143585205078125, 0.016126632690429688, 0.017894744873046875, 0.019662857055664062, 0.02143096923828125, 0.023199081420898438, 0.024967193603515625, 0.026735305786132812, 0.02850341796875, 0.030271530151367188, 0.032039642333984375, 0.03380775451660156, 0.03557586669921875, 0.03734397888183594, 0.039112091064453125, 0.04088020324707031, 0.0426483154296875, 0.04441642761230469, 0.046184539794921875, 0.04795265197753906, 0.04972076416015625, 0.05148887634277344, 0.053256988525390625, 0.05502510070800781, 0.056793212890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 13.0, 11.0, 11.0, 13.0, 17.0, 23.0, 26.0, 40.0, 69.0, 97.0, 124.0, 126.0, 119.0, 81.0, 56.0, 36.0, 31.0, 23.0, 17.0, 10.0, 10.0, 4.0, 9.0, 2.0, 6.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.722574234008789e-05, -1.674983650445938e-05, -1.627393066883087e-05, -1.5798024833202362e-05, -1.5322118997573853e-05, -1.4846213161945343e-05, -1.4370307326316833e-05, -1.3894401490688324e-05, -1.3418495655059814e-05, -1.2942589819431305e-05, -1.2466683983802795e-05, -1.1990778148174286e-05, -1.1514872312545776e-05, -1.1038966476917267e-05, -1.0563060641288757e-05, -1.0087154805660248e-05, -9.611248970031738e-06, -9.135343134403229e-06, -8.65943729877472e-06, -8.18353146314621e-06, -7.7076256275177e-06, -7.231719791889191e-06, -6.755813956260681e-06, -6.279908120632172e-06, -5.804002285003662e-06, -5.328096449375153e-06, -4.852190613746643e-06, -4.3762847781181335e-06, -3.900378942489624e-06, -3.4244731068611145e-06, -2.948567271232605e-06, -2.4726614356040955e-06, -1.996755599975586e-06, -1.5208497643470764e-06, -1.044943928718567e-06, -5.690380930900574e-07, -9.313225746154785e-08, 3.8277357816696167e-07, 8.586794137954712e-07, 1.3345852494239807e-06, 1.8104910850524902e-06, 2.2863969206809998e-06, 2.7623027563095093e-06, 3.238208591938019e-06, 3.7141144275665283e-06, 4.190020263195038e-06, 4.665926098823547e-06, 5.141831934452057e-06, 5.617737770080566e-06, 6.093643605709076e-06, 6.5695494413375854e-06, 7.045455276966095e-06, 7.5213611125946045e-06, 7.997266948223114e-06, 8.473172783851624e-06, 8.949078619480133e-06, 9.424984455108643e-06, 9.900890290737152e-06, 1.0376796126365662e-05, 1.0852701961994171e-05, 1.132860779762268e-05, 1.180451363325119e-05, 1.22804194688797e-05, 1.275632530450821e-05, 1.3232231140136719e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 8.0, 18.0, 12.0, 27.0, 18.0, 34.0, 45.0, 69.0, 133.0, 225.0, 436.0, 1001.0, 3045.0, 21939.0, 1003988.0, 13366.0, 2307.0, 868.0, 395.0, 215.0, 136.0, 91.0, 62.0, 32.0, 23.0, 13.0, 6.0, 10.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045196533203125, -0.043485164642333984, -0.04177379608154297, -0.04006242752075195, -0.03835105895996094, -0.03663969039916992, -0.034928321838378906, -0.03321695327758789, -0.031505584716796875, -0.02979421615600586, -0.028082847595214844, -0.026371479034423828, -0.024660110473632812, -0.022948741912841797, -0.02123737335205078, -0.019526004791259766, -0.01781463623046875, -0.016103267669677734, -0.014391899108886719, -0.012680530548095703, -0.010969161987304688, -0.009257793426513672, -0.007546424865722656, -0.005835056304931641, -0.004123687744140625, -0.0024123191833496094, -0.0007009506225585938, 0.0010104179382324219, 0.0027217864990234375, 0.004433155059814453, 0.006144523620605469, 0.007855892181396484, 0.0095672607421875, 0.011278629302978516, 0.012989997863769531, 0.014701366424560547, 0.016412734985351562, 0.018124103546142578, 0.019835472106933594, 0.02154684066772461, 0.023258209228515625, 0.02496957778930664, 0.026680946350097656, 0.028392314910888672, 0.030103683471679688, 0.0318150520324707, 0.03352642059326172, 0.035237789154052734, 0.03694915771484375, 0.038660526275634766, 0.04037189483642578, 0.0420832633972168, 0.04379463195800781, 0.04550600051879883, 0.047217369079589844, 0.04892873764038086, 0.050640106201171875, 0.05235147476196289, 0.054062843322753906, 0.05577421188354492, 0.05748558044433594, 0.05919694900512695, 0.06090831756591797, 0.06261968612670898, 0.0643310546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 6.0, 4.0, 13.0, 17.0, 12.0, 21.0, 49.0, 72.0, 355.0, 214.0, 73.0, 51.0, 34.0, 21.0, 14.0, 13.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01126861572265625, -0.010834336280822754, -0.010400056838989258, -0.009965777397155762, -0.009531497955322266, -0.00909721851348877, -0.008662939071655273, -0.008228659629821777, -0.007794380187988281, -0.007360100746154785, -0.006925821304321289, -0.006491541862487793, -0.006057262420654297, -0.005622982978820801, -0.005188703536987305, -0.004754424095153809, -0.0043201446533203125, -0.0038858652114868164, -0.0034515857696533203, -0.0030173063278198242, -0.002583026885986328, -0.002148747444152832, -0.001714468002319336, -0.0012801885604858398, -0.0008459091186523438, -0.00041162967681884766, 2.2649765014648438e-05, 0.00045692920684814453, 0.0008912086486816406, 0.0013254880905151367, 0.0017597675323486328, 0.002194046974182129, 0.002628326416015625, 0.003062605857849121, 0.003496885299682617, 0.003931164741516113, 0.004365444183349609, 0.0047997236251831055, 0.0052340030670166016, 0.005668282508850098, 0.006102561950683594, 0.00653684139251709, 0.006971120834350586, 0.007405400276184082, 0.007839679718017578, 0.008273959159851074, 0.00870823860168457, 0.009142518043518066, 0.009576797485351562, 0.010011076927185059, 0.010445356369018555, 0.01087963581085205, 0.011313915252685547, 0.011748194694519043, 0.012182474136352539, 0.012616753578186035, 0.013051033020019531, 0.013485312461853027, 0.013919591903686523, 0.01435387134552002, 0.014788150787353516, 0.015222430229187012, 0.015656709671020508, 0.016090989112854004, 0.0165252685546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 9.0, 12.0, 38.0, 236.0, 593.0, 51.0, 16.0, 8.0, 3.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.47643935680389404, -0.46117842197418213, -0.4459174871444702, -0.4306565523147583, -0.4153956472873688, -0.40013471245765686, -0.38487377762794495, -0.36961284279823303, -0.3543519377708435, -0.3390910029411316, -0.3238300681114197, -0.30856913328170776, -0.29330822825431824, -0.2780472934246063, -0.2627863585948944, -0.2475254237651825, -0.23226448893547058, -0.21700355410575867, -0.20174263417720795, -0.18648169934749603, -0.1712207794189453, -0.1559598445892334, -0.14069890975952148, -0.12543797492980957, -0.11017705500125885, -0.09491612762212753, -0.07965520024299622, -0.0643942654132843, -0.049133338034152985, -0.03387241065502167, -0.018611475825309753, -0.0033505484461784363, 0.01191037893295288, 0.027171308174729347, 0.042432237416505814, 0.05769316852092743, 0.07295409590005875, 0.08821502327919006, 0.10347595810890198, 0.1187368854880333, 0.1339978128671646, 0.14925874769687653, 0.16451966762542725, 0.17978060245513916, 0.19504153728485107, 0.2103024572134018, 0.2255633920431137, 0.24082431197166443, 0.25608524680137634, 0.27134618163108826, 0.28660711646080017, 0.3018680214881897, 0.3171289563179016, 0.3323898911476135, 0.34765082597732544, 0.36291176080703735, 0.37817269563674927, 0.3934336304664612, 0.4086945652961731, 0.423955500125885, 0.43921640515327454, 0.45447733998298645, 0.46973827481269836, 0.4849992096424103, 0.5002601146697998]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 16.0, 19.0, 41.0, 80.0, 124.0, 180.0, 169.0, 139.0, 67.0, 49.0, 25.0, 12.0, 12.0, 9.0, 8.0, 1.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20411217212677002, -0.19754594564437866, -0.1909797042608261, -0.18441346287727356, -0.1778472363948822, -0.17128100991249084, -0.1647147685289383, -0.15814852714538574, -0.15158230066299438, -0.14501607418060303, -0.13844983279705048, -0.13188359141349792, -0.12531736493110657, -0.11875113099813461, -0.11218489706516266, -0.1056186631321907, -0.09905242919921875, -0.0924861952662468, -0.08591996133327484, -0.07935372740030289, -0.07278749346733093, -0.06622125953435898, -0.059655025601387024, -0.05308879166841507, -0.046522557735443115, -0.03995632380247116, -0.03339008986949921, -0.026823855936527252, -0.020257622003555298, -0.013691388070583344, -0.007125154137611389, -0.0005589202046394348, 0.0060073137283325195, 0.012573547661304474, 0.019139781594276428, 0.025706015527248383, 0.03227224946022034, 0.03883848339319229, 0.045404717326164246, 0.0519709512591362, 0.058537185192108154, 0.06510341912508011, 0.07166965305805206, 0.07823588699102402, 0.08480212092399597, 0.09136835485696793, 0.09793458878993988, 0.10450082272291183, 0.11106705665588379, 0.11763329058885574, 0.1241995245218277, 0.13076576590538025, 0.1373319923877716, 0.14389821887016296, 0.15046446025371552, 0.15703070163726807, 0.16359692811965942, 0.17016315460205078, 0.17672939598560333, 0.18329563736915588, 0.18986186385154724, 0.1964280903339386, 0.20299433171749115, 0.2095605731010437, 0.21612679958343506]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 12.0, 13.0, 21.0, 19.0, 41.0, 77.0, 438.0, 21135.0, 4170379.0, 1818.0, 141.0, 45.0, 38.0, 24.0, 16.0, 11.0, 5.0, 3.0, 11.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.50616455078125, -4.3521728515625, -4.19818115234375, -4.044189453125, -3.89019775390625, -3.7362060546875, -3.58221435546875, -3.42822265625, -3.27423095703125, -3.1202392578125, -2.96624755859375, -2.812255859375, -2.65826416015625, -2.5042724609375, -2.35028076171875, -2.1962890625, -2.04229736328125, -1.8883056640625, -1.73431396484375, -1.580322265625, -1.42633056640625, -1.2723388671875, -1.11834716796875, -0.96435546875, -0.81036376953125, -0.6563720703125, -0.50238037109375, -0.348388671875, -0.19439697265625, -0.0404052734375, 0.11358642578125, 0.267578125, 0.42156982421875, 0.5755615234375, 0.72955322265625, 0.883544921875, 1.03753662109375, 1.1915283203125, 1.34552001953125, 1.49951171875, 1.65350341796875, 1.8074951171875, 1.96148681640625, 2.115478515625, 2.26947021484375, 2.4234619140625, 2.57745361328125, 2.7314453125, 2.88543701171875, 3.0394287109375, 3.19342041015625, 3.347412109375, 3.50140380859375, 3.6553955078125, 3.80938720703125, 3.96337890625, 4.11737060546875, 4.2713623046875, 4.42535400390625, 4.579345703125, 4.73333740234375, 4.8873291015625, 5.04132080078125, 5.1953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 8.0, 13.0, 8.0, 16.0, 18.0, 14.0, 44.0, 742.0, 34.0, 9.0, 13.0, 12.0, 10.0, 2.0, 10.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002300262451171875, -0.0022245049476623535, -0.002148747444152832, -0.0020729899406433105, -0.001997232437133789, -0.0019214749336242676, -0.001845717430114746, -0.0017699599266052246, -0.0016942024230957031, -0.0016184449195861816, -0.0015426874160766602, -0.0014669299125671387, -0.0013911724090576172, -0.0013154149055480957, -0.0012396574020385742, -0.0011638998985290527, -0.0010881423950195312, -0.0010123848915100098, -0.0009366273880004883, -0.0008608698844909668, -0.0007851123809814453, -0.0007093548774719238, -0.0006335973739624023, -0.0005578398704528809, -0.0004820823669433594, -0.0004063248634338379, -0.0003305673599243164, -0.0002548098564147949, -0.00017905235290527344, -0.00010329484939575195, -2.753734588623047e-05, 4.8220157623291016e-05, 0.0001239776611328125, 0.00019973516464233398, 0.00027549266815185547, 0.00035125017166137695, 0.00042700767517089844, 0.0005027651786804199, 0.0005785226821899414, 0.0006542801856994629, 0.0007300376892089844, 0.0008057951927185059, 0.0008815526962280273, 0.0009573101997375488, 0.0010330677032470703, 0.0011088252067565918, 0.0011845827102661133, 0.0012603402137756348, 0.0013360977172851562, 0.0014118552207946777, 0.0014876127243041992, 0.0015633702278137207, 0.0016391277313232422, 0.0017148852348327637, 0.0017906427383422852, 0.0018664002418518066, 0.0019421577453613281, 0.0020179152488708496, 0.002093672752380371, 0.0021694302558898926, 0.002245187759399414, 0.0023209452629089355, 0.002396702766418457, 0.0024724602699279785, 0.0025482177734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 7.0, 16.0, 19.0, 30.0, 36.0, 61.0, 75.0, 109.0, 183.0, 371.0, 17521.0, 4173043.0, 1796.0, 293.0, 162.0, 131.0, 87.0, 89.0, 66.0, 42.0, 29.0, 19.0, 23.0, 6.0, 17.0, 10.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6484375, -0.6179351806640625, -0.587432861328125, -0.5569305419921875, -0.52642822265625, -0.4959259033203125, -0.465423583984375, -0.4349212646484375, -0.4044189453125, -0.3739166259765625, -0.343414306640625, -0.3129119873046875, -0.28240966796875, -0.2519073486328125, -0.221405029296875, -0.1909027099609375, -0.160400390625, -0.1298980712890625, -0.099395751953125, -0.0688934326171875, -0.03839111328125, -0.0078887939453125, 0.022613525390625, 0.0531158447265625, 0.0836181640625, 0.1141204833984375, 0.144622802734375, 0.1751251220703125, 0.20562744140625, 0.2361297607421875, 0.266632080078125, 0.2971343994140625, 0.32763671875, 0.3581390380859375, 0.388641357421875, 0.4191436767578125, 0.44964599609375, 0.4801483154296875, 0.510650634765625, 0.5411529541015625, 0.5716552734375, 0.6021575927734375, 0.632659912109375, 0.6631622314453125, 0.69366455078125, 0.7241668701171875, 0.754669189453125, 0.7851715087890625, 0.815673828125, 0.8461761474609375, 0.876678466796875, 0.9071807861328125, 0.93768310546875, 0.9681854248046875, 0.998687744140625, 1.0291900634765625, 1.0596923828125, 1.0901947021484375, 1.120697021484375, 1.1511993408203125, 1.18170166015625, 1.2122039794921875, 1.242706298828125, 1.2732086181640625, 1.3037109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 9.0, 13.0, 19.0, 30.0, 30.0, 53.0, 79.0, 110.0, 165.0, 232.0, 453.0, 1578.0, 359.0, 216.0, 158.0, 129.0, 89.0, 94.0, 67.0, 42.0, 35.0, 17.0, 20.0, 9.0, 17.0, 9.0, 9.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005084991455078125, -0.004847347736358643, -0.00460970401763916, -0.004372060298919678, -0.004134416580200195, -0.003896772861480713, -0.0036591291427612305, -0.003421485424041748, -0.0031838417053222656, -0.002946197986602783, -0.0027085542678833008, -0.0024709105491638184, -0.002233266830444336, -0.0019956231117248535, -0.001757979393005371, -0.0015203356742858887, -0.0012826919555664062, -0.0010450482368469238, -0.0008074045181274414, -0.000569760799407959, -0.00033211708068847656, -9.447336196899414e-05, 0.00014317035675048828, 0.0003808140754699707, 0.0006184577941894531, 0.0008561015129089355, 0.001093745231628418, 0.0013313889503479004, 0.0015690326690673828, 0.0018066763877868652, 0.0020443201065063477, 0.00228196382522583, 0.0025196075439453125, 0.002757251262664795, 0.0029948949813842773, 0.0032325387001037598, 0.003470182418823242, 0.0037078261375427246, 0.003945469856262207, 0.0041831135749816895, 0.004420757293701172, 0.004658401012420654, 0.004896044731140137, 0.005133688449859619, 0.0053713321685791016, 0.005608975887298584, 0.005846619606018066, 0.006084263324737549, 0.006321907043457031, 0.006559550762176514, 0.006797194480895996, 0.0070348381996154785, 0.007272481918334961, 0.007510125637054443, 0.007747769355773926, 0.007985413074493408, 0.00822305679321289, 0.008460700511932373, 0.008698344230651855, 0.008935987949371338, 0.00917363166809082, 0.009411275386810303, 0.009648919105529785, 0.009886562824249268, 0.01012420654296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 364.0, 622.0, 26.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13693085312843323, -0.06829474866390228, 0.0003413558006286621, 0.0689774602651596, 0.13761356472969055, 0.2062496840953827, 0.27488577365875244, 0.3435218632221222, 0.41215798258781433, 0.4807940721511841, 0.5494301915168762, 0.6180663108825684, 0.6867023706436157, 0.7553385496139526, 0.823974609375, 0.8926106691360474, 0.9612468481063843, 1.0298829078674316, 1.0985190868377686, 1.167155146598816, 1.2357912063598633, 1.3044273853302002, 1.3730634450912476, 1.441699504852295, 1.5103356838226318, 1.5789717435836792, 1.6476079225540161, 1.7162439823150635, 1.7848801612854004, 1.8535162210464478, 1.9221522808074951, 1.990788459777832, 2.05942440032959, 2.1280605792999268, 2.1966965198516846, 2.2653326988220215, 2.3339688777923584, 2.4026050567626953, 2.471240997314453, 2.53987717628479, 2.608513355255127, 2.677149534225464, 2.7457854747772217, 2.8144216537475586, 2.8830578327178955, 2.9516940116882324, 3.0203299522399902, 3.088966131210327, 3.157602071762085, 3.226238250732422, 3.2948741912841797, 3.3635103702545166, 3.4321465492248535, 3.5007824897766113, 3.5694186687469482, 3.638054847717285, 3.706690788269043, 3.77532696723938, 3.8439629077911377, 3.9125990867614746, 3.9812352657318115, 4.049871444702148, 4.118507385253906, 4.187143325805664, 4.25577974319458]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 14.0, 19.0, 29.0, 47.0, 60.0, 77.0, 116.0, 121.0, 115.0, 116.0, 89.0, 85.0, 40.0, 25.0, 24.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11207002401351929, -0.10605020821094513, -0.10003039985895157, -0.09401059150695801, -0.08799077570438385, -0.08197095990180969, -0.07595115154981613, -0.06993134319782257, -0.06391152739524841, -0.057891715317964554, -0.051871903240680695, -0.045852091163396835, -0.039832279086112976, -0.03381246700882912, -0.027792654931545258, -0.0217728428542614, -0.01575303077697754, -0.00973321869969368, -0.0037134066224098206, 0.0023064054548740387, 0.008326217532157898, 0.014346029609441757, 0.020365841686725616, 0.026385653764009476, 0.032405465841293335, 0.038425277918577194, 0.04444508999586105, 0.05046490207314491, 0.05648471415042877, 0.06250452995300293, 0.06852433830499649, 0.07454414665699005, 0.08056396245956421, 0.08658377826213837, 0.09260358661413193, 0.09862339496612549, 0.10464321076869965, 0.1106630265712738, 0.11668283492326736, 0.12270264327526093, 0.12872245907783508, 0.13474227488040924, 0.1407620906829834, 0.14678189158439636, 0.15280170738697052, 0.15882152318954468, 0.16484132409095764, 0.1708611398935318, 0.17688095569610596, 0.18290077149868011, 0.18892058730125427, 0.19494038820266724, 0.2009602040052414, 0.20698001980781555, 0.21299982070922852, 0.21901963651180267, 0.22503945231437683, 0.231059268116951, 0.23707908391952515, 0.2430988848209381, 0.24911870062351227, 0.2551385164260864, 0.2611583173274994, 0.26717814803123474, 0.2731979489326477]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 5.0, 9.0, 13.0, 14.0, 24.0, 30.0, 40.0, 44.0, 83.0, 95.0, 121.0, 142.0, 232.0, 304.0, 497.0, 701.0, 992.0, 1426.0, 2311.0, 3660.0, 5844.0, 10324.0, 20366.0, 113765.0, 827037.0, 28092.0, 12903.0, 7018.0, 4277.0, 2663.0, 1701.0, 1137.0, 775.0, 552.0, 368.0, 252.0, 191.0, 132.0, 89.0, 93.0, 61.0, 41.0, 30.0, 28.0, 18.0, 14.0, 10.0, 2.0, 5.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0], "bins": [-0.043548583984375, -0.0422358512878418, -0.040923118591308594, -0.03961038589477539, -0.03829765319824219, -0.036984920501708984, -0.03567218780517578, -0.03435945510864258, -0.033046722412109375, -0.03173398971557617, -0.03042125701904297, -0.029108524322509766, -0.027795791625976562, -0.02648305892944336, -0.025170326232910156, -0.023857593536376953, -0.02254486083984375, -0.021232128143310547, -0.019919395446777344, -0.01860666275024414, -0.017293930053710938, -0.015981197357177734, -0.014668464660644531, -0.013355731964111328, -0.012042999267578125, -0.010730266571044922, -0.009417533874511719, -0.008104801177978516, -0.0067920684814453125, -0.005479335784912109, -0.004166603088378906, -0.002853870391845703, -0.0015411376953125, -0.00022840499877929688, 0.0010843276977539062, 0.0023970603942871094, 0.0037097930908203125, 0.005022525787353516, 0.006335258483886719, 0.007647991180419922, 0.008960723876953125, 0.010273456573486328, 0.011586189270019531, 0.012898921966552734, 0.014211654663085938, 0.01552438735961914, 0.016837120056152344, 0.018149852752685547, 0.01946258544921875, 0.020775318145751953, 0.022088050842285156, 0.02340078353881836, 0.024713516235351562, 0.026026248931884766, 0.02733898162841797, 0.028651714324951172, 0.029964447021484375, 0.03127717971801758, 0.03258991241455078, 0.033902645111083984, 0.03521537780761719, 0.03652811050415039, 0.037840843200683594, 0.0391535758972168, 0.04046630859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 7.0, 13.0, 13.0, 11.0, 28.0, 108.0, 580.0, 123.0, 12.0, 13.0, 12.0, 7.0, 5.0, 7.0, 7.0, 9.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002239227294921875, -0.0021656155586242676, -0.00209200382232666, -0.0020183920860290527, -0.0019447803497314453, -0.0018711686134338379, -0.0017975568771362305, -0.001723945140838623, -0.0016503334045410156, -0.0015767216682434082, -0.0015031099319458008, -0.0014294981956481934, -0.001355886459350586, -0.0012822747230529785, -0.001208662986755371, -0.0011350512504577637, -0.0010614395141601562, -0.0009878277778625488, -0.0009142160415649414, -0.000840604305267334, -0.0007669925689697266, -0.0006933808326721191, -0.0006197690963745117, -0.0005461573600769043, -0.0004725456237792969, -0.00039893388748168945, -0.00032532215118408203, -0.0002517104148864746, -0.0001780986785888672, -0.00010448694229125977, -3.0875205993652344e-05, 4.273653030395508e-05, 0.0001163482666015625, 0.00018996000289916992, 0.00026357173919677734, 0.00033718347549438477, 0.0004107952117919922, 0.0004844069480895996, 0.000558018684387207, 0.0006316304206848145, 0.0007052421569824219, 0.0007788538932800293, 0.0008524656295776367, 0.0009260773658752441, 0.0009996891021728516, 0.001073300838470459, 0.0011469125747680664, 0.0012205243110656738, 0.0012941360473632812, 0.0013677477836608887, 0.001441359519958496, 0.0015149712562561035, 0.001588582992553711, 0.0016621947288513184, 0.0017358064651489258, 0.0018094182014465332, 0.0018830299377441406, 0.001956641674041748, 0.0020302534103393555, 0.002103865146636963, 0.0021774768829345703, 0.0022510886192321777, 0.002324700355529785, 0.0023983120918273926, 0.002471923828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 8.0, 8.0, 10.0, 17.0, 13.0, 24.0, 19.0, 25.0, 34.0, 37.0, 41.0, 42.0, 74.0, 189.0, 1433.0, 43040.0, 996861.0, 5809.0, 470.0, 91.0, 60.0, 45.0, 22.0, 31.0, 28.0, 28.0, 15.0, 15.0, 18.0, 13.0, 6.0, 5.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.14920997619628906, -0.14497756958007812, -0.1407451629638672, -0.13651275634765625, -0.1322803497314453, -0.12804794311523438, -0.12381553649902344, -0.1195831298828125, -0.11535072326660156, -0.11111831665039062, -0.10688591003417969, -0.10265350341796875, -0.09842109680175781, -0.09418869018554688, -0.08995628356933594, -0.085723876953125, -0.08149147033691406, -0.07725906372070312, -0.07302665710449219, -0.06879425048828125, -0.06456184387207031, -0.060329437255859375, -0.05609703063964844, -0.0518646240234375, -0.04763221740722656, -0.043399810791015625, -0.03916740417480469, -0.03493499755859375, -0.030702590942382812, -0.026470184326171875, -0.022237777709960938, -0.01800537109375, -0.013772964477539062, -0.009540557861328125, -0.0053081512451171875, -0.00107574462890625, 0.0031566619873046875, 0.007389068603515625, 0.011621475219726562, 0.0158538818359375, 0.020086288452148438, 0.024318695068359375, 0.028551101684570312, 0.03278350830078125, 0.03701591491699219, 0.041248321533203125, 0.04548072814941406, 0.049713134765625, 0.05394554138183594, 0.058177947998046875, 0.06241035461425781, 0.06664276123046875, 0.07087516784667969, 0.07510757446289062, 0.07933998107910156, 0.0835723876953125, 0.08780479431152344, 0.09203720092773438, 0.09626960754394531, 0.10050201416015625, 0.10473442077636719, 0.10896682739257812, 0.11319923400878906, 0.117431640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 9.0, 10.0, 9.0, 20.0, 17.0, 23.0, 24.0, 20.0, 35.0, 37.0, 43.0, 37.0, 41.0, 42.0, 58.0, 43.0, 49.0, 49.0, 71.0, 49.0, 49.0, 40.0, 33.0, 23.0, 30.0, 24.0, 17.0, 22.0, 20.0, 13.0, 9.0, 5.0, 1.0, 5.0, 7.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00750732421875, -0.0073004961013793945, -0.007093667984008789, -0.006886839866638184, -0.006680011749267578, -0.006473183631896973, -0.006266355514526367, -0.006059527397155762, -0.005852699279785156, -0.005645871162414551, -0.005439043045043945, -0.00523221492767334, -0.005025386810302734, -0.004818558692932129, -0.0046117305755615234, -0.004404902458190918, -0.0041980743408203125, -0.003991246223449707, -0.0037844181060791016, -0.003577589988708496, -0.0033707618713378906, -0.003163933753967285, -0.0029571056365966797, -0.0027502775192260742, -0.0025434494018554688, -0.0023366212844848633, -0.002129793167114258, -0.0019229650497436523, -0.0017161369323730469, -0.0015093088150024414, -0.001302480697631836, -0.0010956525802612305, -0.000888824462890625, -0.0006819963455200195, -0.00047516822814941406, -0.0002683401107788086, -6.151199340820312e-05, 0.00014531612396240234, 0.0003521442413330078, 0.0005589723587036133, 0.0007658004760742188, 0.0009726285934448242, 0.0011794567108154297, 0.0013862848281860352, 0.0015931129455566406, 0.001799941062927246, 0.0020067691802978516, 0.002213597297668457, 0.0024204254150390625, 0.002627253532409668, 0.0028340816497802734, 0.003040909767150879, 0.0032477378845214844, 0.00345456600189209, 0.0036613941192626953, 0.0038682222366333008, 0.004075050354003906, 0.004281878471374512, 0.004488706588745117, 0.004695534706115723, 0.004902362823486328, 0.005109190940856934, 0.005316019058227539, 0.0055228471755981445, 0.00572967529296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 20.0, 41.0, 260.0, 17318.0, 1030298.0, 506.0, 51.0, 21.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06362056732177734, -0.06028556823730469, -0.05695056915283203, -0.053615570068359375, -0.05028057098388672, -0.04694557189941406, -0.043610572814941406, -0.04027557373046875, -0.036940574645996094, -0.03360557556152344, -0.03027057647705078, -0.026935577392578125, -0.02360057830810547, -0.020265579223632812, -0.016930580139160156, -0.0135955810546875, -0.010260581970214844, -0.0069255828857421875, -0.0035905838012695312, -0.000255584716796875, 0.0030794143676757812, 0.0064144134521484375, 0.009749412536621094, 0.01308441162109375, 0.016419410705566406, 0.019754409790039062, 0.02308940887451172, 0.026424407958984375, 0.02975940704345703, 0.03309440612792969, 0.036429405212402344, 0.039764404296875, 0.043099403381347656, 0.04643440246582031, 0.04976940155029297, 0.053104400634765625, 0.05643939971923828, 0.05977439880371094, 0.0631093978881836, 0.06644439697265625, 0.0697793960571289, 0.07311439514160156, 0.07644939422607422, 0.07978439331054688, 0.08311939239501953, 0.08645439147949219, 0.08978939056396484, 0.0931243896484375, 0.09645938873291016, 0.09979438781738281, 0.10312938690185547, 0.10646438598632812, 0.10979938507080078, 0.11313438415527344, 0.1164693832397461, 0.11980438232421875, 0.1231393814086914, 0.12647438049316406, 0.12980937957763672, 0.13314437866210938, 0.13647937774658203, 0.1398143768310547, 0.14314937591552734, 0.146484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 10.0, 14.0, 12.0, 24.0, 50.0, 114.0, 273.0, 245.0, 104.0, 51.0, 28.0, 27.0, 17.0, 8.0, 7.0, 8.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012123584747314453, -0.00011719204485416412, -0.00011314824223518372, -0.00010910443961620331, -0.0001050606369972229, -0.00010101683437824249, -9.697303175926208e-05, -9.292922914028168e-05, -8.888542652130127e-05, -8.484162390232086e-05, -8.079782128334045e-05, -7.675401866436005e-05, -7.271021604537964e-05, -6.866641342639923e-05, -6.462261080741882e-05, -6.0578808188438416e-05, -5.653500556945801e-05, -5.24912029504776e-05, -4.844740033149719e-05, -4.4403597712516785e-05, -4.035979509353638e-05, -3.631599247455597e-05, -3.227218985557556e-05, -2.8228387236595154e-05, -2.4184584617614746e-05, -2.014078199863434e-05, -1.609697937965393e-05, -1.2053176760673523e-05, -8.009374141693115e-06, -3.9655715227127075e-06, 7.82310962677002e-08, 4.122033715248108e-06, 8.165836334228516e-06, 1.2209638953208923e-05, 1.625344157218933e-05, 2.029724419116974e-05, 2.4341046810150146e-05, 2.8384849429130554e-05, 3.242865204811096e-05, 3.647245466709137e-05, 4.051625728607178e-05, 4.4560059905052185e-05, 4.860386252403259e-05, 5.2647665143013e-05, 5.669146776199341e-05, 6.0735270380973816e-05, 6.477907299995422e-05, 6.882287561893463e-05, 7.286667823791504e-05, 7.691048085689545e-05, 8.095428347587585e-05, 8.499808609485626e-05, 8.904188871383667e-05, 9.308569133281708e-05, 9.712949395179749e-05, 0.00010117329657077789, 0.0001052170991897583, 0.00010926090180873871, 0.00011330470442771912, 0.00011734850704669952, 0.00012139230966567993, 0.00012543611228466034, 0.00012947991490364075, 0.00013352371752262115, 0.00013756752014160156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 33.0, 101.0, 1253.0, 1045409.0, 1582.0, 112.0, 27.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1097412109375, -0.10614681243896484, -0.10255241394042969, -0.09895801544189453, -0.09536361694335938, -0.09176921844482422, -0.08817481994628906, -0.0845804214477539, -0.08098602294921875, -0.0773916244506836, -0.07379722595214844, -0.07020282745361328, -0.06660842895507812, -0.06301403045654297, -0.05941963195800781, -0.055825233459472656, -0.0522308349609375, -0.048636436462402344, -0.04504203796386719, -0.04144763946533203, -0.037853240966796875, -0.03425884246826172, -0.030664443969726562, -0.027070045471191406, -0.02347564697265625, -0.019881248474121094, -0.016286849975585938, -0.012692451477050781, -0.009098052978515625, -0.005503654479980469, -0.0019092559814453125, 0.0016851425170898438, 0.005279541015625, 0.008873939514160156, 0.012468338012695312, 0.01606273651123047, 0.019657135009765625, 0.02325153350830078, 0.026845932006835938, 0.030440330505371094, 0.03403472900390625, 0.037629127502441406, 0.04122352600097656, 0.04481792449951172, 0.048412322998046875, 0.05200672149658203, 0.05560111999511719, 0.059195518493652344, 0.0627899169921875, 0.06638431549072266, 0.06997871398925781, 0.07357311248779297, 0.07716751098632812, 0.08076190948486328, 0.08435630798339844, 0.0879507064819336, 0.09154510498046875, 0.0951395034790039, 0.09873390197753906, 0.10232830047607422, 0.10592269897460938, 0.10951709747314453, 0.11311149597167969, 0.11670589447021484, 0.12030029296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 27.0, 43.0, 103.0, 622.0, 98.0, 43.0, 14.0, 10.0, 1.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004795074462890625, -0.004637956619262695, -0.004480838775634766, -0.004323720932006836, -0.004166603088378906, -0.0040094852447509766, -0.003852367401123047, -0.003695249557495117, -0.0035381317138671875, -0.003381013870239258, -0.003223896026611328, -0.0030667781829833984, -0.0029096603393554688, -0.002752542495727539, -0.0025954246520996094, -0.0024383068084716797, -0.00228118896484375, -0.0021240711212158203, -0.0019669532775878906, -0.001809835433959961, -0.0016527175903320312, -0.0014955997467041016, -0.0013384819030761719, -0.0011813640594482422, -0.0010242462158203125, -0.0008671283721923828, -0.0007100105285644531, -0.0005528926849365234, -0.00039577484130859375, -0.00023865699768066406, -8.153915405273438e-05, 7.557868957519531e-05, 0.000232696533203125, 0.0003898143768310547, 0.0005469322204589844, 0.0007040500640869141, 0.0008611679077148438, 0.0010182857513427734, 0.0011754035949707031, 0.0013325214385986328, 0.0014896392822265625, 0.0016467571258544922, 0.0018038749694824219, 0.0019609928131103516, 0.0021181106567382812, 0.002275228500366211, 0.0024323463439941406, 0.0025894641876220703, 0.00274658203125, 0.0029036998748779297, 0.0030608177185058594, 0.003217935562133789, 0.0033750534057617188, 0.0035321712493896484, 0.003689289093017578, 0.003846406936645508, 0.0040035247802734375, 0.004160642623901367, 0.004317760467529297, 0.0044748783111572266, 0.004631996154785156, 0.004789113998413086, 0.004946231842041016, 0.005103349685668945, 0.005260467529296875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 20.0, 43.0, 153.0, 566.0, 124.0, 34.0, 24.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.21310336887836456, -0.2075526863336563, -0.20200201869010925, -0.196451336145401, -0.19090065360069275, -0.1853499859571457, -0.17979930341243744, -0.17424863576889038, -0.16869795322418213, -0.16314727067947388, -0.15759660303592682, -0.15204592049121857, -0.1464952528476715, -0.14094457030296326, -0.135393887758255, -0.12984320521354675, -0.1242925375699997, -0.11874186247587204, -0.11319118738174438, -0.10764050483703613, -0.10208982974290848, -0.09653915464878082, -0.09098847210407257, -0.08543779700994492, -0.07988712191581726, -0.0743364468216896, -0.06878577172756195, -0.0632350891828537, -0.057684414088726044, -0.05213373899459839, -0.046583060175180435, -0.04103238135576248, -0.03548169136047363, -0.02993101440370083, -0.024380337446928024, -0.01882966049015522, -0.013278983533382416, -0.0077283065766096115, -0.0021776296198368073, 0.0033730491995811462, 0.008923724293708801, 0.014474401250481606, 0.02002507820725441, 0.025575755164027214, 0.03112643212080002, 0.03667710721492767, 0.04222778603434563, 0.04777846485376358, 0.053329139947891235, 0.05887981504201889, 0.06443049013614655, 0.0699811726808548, 0.07553184777498245, 0.08108252286911011, 0.08663320541381836, 0.09218388050794601, 0.09773455560207367, 0.10328523069620132, 0.10883590579032898, 0.11438658833503723, 0.11993726342916489, 0.12548793852329254, 0.1310386210680008, 0.13658928871154785, 0.1421399712562561]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 4.0, 6.0, 9.0, 9.0, 14.0, 17.0, 25.0, 28.0, 30.0, 40.0, 57.0, 62.0, 65.0, 67.0, 70.0, 79.0, 63.0, 87.0, 48.0, 52.0, 34.0, 24.0, 19.0, 11.0, 16.0, 8.0, 7.0, 7.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.05427020788192749, -0.05274710804224014, -0.051224008202552795, -0.04970090463757515, -0.0481778047978878, -0.046654704958200455, -0.04513160139322281, -0.04360850155353546, -0.042085401713848114, -0.04056230187416077, -0.03903920203447342, -0.03751609846949577, -0.035992998629808426, -0.03446989879012108, -0.03294679522514343, -0.031423695385456085, -0.029900595545768738, -0.02837749570608139, -0.026854394003748894, -0.025331292301416397, -0.02380819246172905, -0.022285092622041702, -0.020761990919709206, -0.01923888921737671, -0.01771578937768936, -0.016192689538002014, -0.014669587835669518, -0.013146487064659595, -0.011623386293649673, -0.010100285522639751, -0.00857718475162983, -0.007054083980619907, -0.005530983209609985, -0.004007882438600063, -0.0024847816675901413, -0.0009616808965802193, 0.0005614198744297028, 0.002084520645439625, 0.003607621416449547, 0.005130722187459469, 0.006653822958469391, 0.008176923729479313, 0.009700024500489235, 0.011223125271499157, 0.012746226042509079, 0.014269326813519001, 0.015792427584528923, 0.01731552928686142, 0.018838629126548767, 0.020361728966236115, 0.02188483066856861, 0.023407932370901108, 0.024931032210588455, 0.026454132050275803, 0.0279772337526083, 0.029500335454940796, 0.031023435294628143, 0.03254653513431549, 0.03406963497400284, 0.035592738538980484, 0.03711583837866783, 0.03863893821835518, 0.040162041783332825, 0.04168514162302017, 0.04320824146270752]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 4.0, 10.0, 4.0, 4.0, 4.0, 8.0, 22.0, 20.0, 22.0, 22.0, 36.0, 54.0, 542.0, 4193294.0, 52.0, 22.0, 28.0, 26.0, 16.0, 14.0, 12.0, 10.0, 6.0, 17.0, 9.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.71875, -3.59967041015625, -3.4805908203125, -3.36151123046875, -3.242431640625, -3.12335205078125, -3.0042724609375, -2.88519287109375, -2.76611328125, -2.64703369140625, -2.5279541015625, -2.40887451171875, -2.289794921875, -2.17071533203125, -2.0516357421875, -1.93255615234375, -1.8134765625, -1.69439697265625, -1.5753173828125, -1.45623779296875, -1.337158203125, -1.21807861328125, -1.0989990234375, -0.97991943359375, -0.86083984375, -0.74176025390625, -0.6226806640625, -0.50360107421875, -0.384521484375, -0.26544189453125, -0.1463623046875, -0.02728271484375, 0.091796875, 0.21087646484375, 0.3299560546875, 0.44903564453125, 0.568115234375, 0.68719482421875, 0.8062744140625, 0.92535400390625, 1.04443359375, 1.16351318359375, 1.2825927734375, 1.40167236328125, 1.520751953125, 1.63983154296875, 1.7589111328125, 1.87799072265625, 1.9970703125, 2.11614990234375, 2.2352294921875, 2.35430908203125, 2.473388671875, 2.59246826171875, 2.7115478515625, 2.83062744140625, 2.94970703125, 3.06878662109375, 3.1878662109375, 3.30694580078125, 3.426025390625, 3.54510498046875, 3.6641845703125, 3.78326416015625, 3.90234375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 10.0, 13.0, 10.0, 13.0, 25.0, 105.0, 513.0, 177.0, 24.0, 13.0, 12.0, 8.0, 2.0, 8.0, 8.0, 4.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020999908447265625, -0.002031177282333374, -0.0019623637199401855, -0.001893550157546997, -0.0018247365951538086, -0.0017559230327606201, -0.0016871094703674316, -0.0016182959079742432, -0.0015494823455810547, -0.0014806687831878662, -0.0014118552207946777, -0.0013430416584014893, -0.0012742280960083008, -0.0012054145336151123, -0.0011366009712219238, -0.0010677874088287354, -0.0009989738464355469, -0.0009301602840423584, -0.0008613467216491699, -0.0007925331592559814, -0.000723719596862793, -0.0006549060344696045, -0.000586092472076416, -0.0005172789096832275, -0.00044846534729003906, -0.0003796517848968506, -0.0003108382225036621, -0.00024202466011047363, -0.00017321109771728516, -0.00010439753532409668, -3.55839729309082e-05, 3.3229589462280273e-05, 0.00010204315185546875, 0.00017085671424865723, 0.0002396702766418457, 0.0003084838390350342, 0.00037729740142822266, 0.00044611096382141113, 0.0005149245262145996, 0.0005837380886077881, 0.0006525516510009766, 0.000721365213394165, 0.0007901787757873535, 0.000858992338180542, 0.0009278059005737305, 0.000996619462966919, 0.0010654330253601074, 0.001134246587753296, 0.0012030601501464844, 0.0012718737125396729, 0.0013406872749328613, 0.0014095008373260498, 0.0014783143997192383, 0.0015471279621124268, 0.0016159415245056152, 0.0016847550868988037, 0.0017535686492919922, 0.0018223822116851807, 0.0018911957740783691, 0.0019600093364715576, 0.002028822898864746, 0.0020976364612579346, 0.002166450023651123, 0.0022352635860443115, 0.0023040771484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 9.0, 11.0, 34.0, 45.0, 102.0, 239.0, 4187514.0, 5989.0, 188.0, 80.0, 38.0, 9.0, 12.0, 6.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0], "bins": [-2.564453125, -2.5131149291992188, -2.4617767333984375, -2.4104385375976562, -2.359100341796875, -2.3077621459960938, -2.2564239501953125, -2.2050857543945312, -2.15374755859375, -2.1024093627929688, -2.0510711669921875, -1.9997329711914062, -1.948394775390625, -1.8970565795898438, -1.8457183837890625, -1.7943801879882812, -1.7430419921875, -1.6917037963867188, -1.6403656005859375, -1.5890274047851562, -1.537689208984375, -1.4863510131835938, -1.4350128173828125, -1.3836746215820312, -1.33233642578125, -1.2809982299804688, -1.2296600341796875, -1.1783218383789062, -1.126983642578125, -1.0756454467773438, -1.0243072509765625, -0.9729690551757812, -0.921630859375, -0.8702926635742188, -0.8189544677734375, -0.7676162719726562, -0.716278076171875, -0.6649398803710938, -0.6136016845703125, -0.5622634887695312, -0.51092529296875, -0.45958709716796875, -0.4082489013671875, -0.35691070556640625, -0.305572509765625, -0.25423431396484375, -0.2028961181640625, -0.15155792236328125, -0.1002197265625, -0.04888153076171875, 0.0024566650390625, 0.05379486083984375, 0.105133056640625, 0.15647125244140625, 0.2078094482421875, 0.25914764404296875, 0.31048583984375, 0.36182403564453125, 0.4131622314453125, 0.46450042724609375, 0.515838623046875, 0.5671768188476562, 0.6185150146484375, 0.6698532104492188, 0.72119140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 13.0, 15.0, 35.0, 74.0, 169.0, 674.0, 2567.0, 350.0, 102.0, 37.0, 18.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.017822265625, -0.017467916011810303, -0.017113566398620605, -0.016759216785430908, -0.01640486717224121, -0.016050517559051514, -0.015696167945861816, -0.01534181833267212, -0.014987468719482422, -0.014633119106292725, -0.014278769493103027, -0.01392441987991333, -0.013570070266723633, -0.013215720653533936, -0.012861371040344238, -0.012507021427154541, -0.012152671813964844, -0.011798322200775146, -0.01144397258758545, -0.011089622974395752, -0.010735273361206055, -0.010380923748016357, -0.01002657413482666, -0.009672224521636963, -0.009317874908447266, -0.008963525295257568, -0.008609175682067871, -0.008254826068878174, -0.007900476455688477, -0.007546126842498779, -0.007191777229309082, -0.006837427616119385, -0.0064830780029296875, -0.00612872838973999, -0.005774378776550293, -0.005420029163360596, -0.0050656795501708984, -0.004711329936981201, -0.004356980323791504, -0.004002630710601807, -0.0036482810974121094, -0.003293931484222412, -0.002939581871032715, -0.0025852322578430176, -0.0022308826446533203, -0.001876533031463623, -0.0015221834182739258, -0.0011678338050842285, -0.0008134841918945312, -0.000459134578704834, -0.00010478496551513672, 0.00024956464767456055, 0.0006039142608642578, 0.0009582638740539551, 0.0013126134872436523, 0.0016669631004333496, 0.002021312713623047, 0.002375662326812744, 0.0027300119400024414, 0.0030843615531921387, 0.003438711166381836, 0.003793060779571533, 0.0041474103927612305, 0.004501760005950928, 0.004856109619140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1020.0, 1.0], "bins": [-6.220249652862549, -6.120551586151123, -6.020853042602539, -5.921154975891113, -5.8214569091796875, -5.7217583656311035, -5.622060298919678, -5.522362232208252, -5.422663688659668, -5.322965621948242, -5.223267078399658, -5.123569011688232, -5.023870944976807, -4.924172401428223, -4.824474334716797, -4.724776268005371, -4.625078201293945, -4.5253801345825195, -4.4256815910339355, -4.32598352432251, -4.226285457611084, -4.1265869140625, -4.026888847351074, -3.9271905422210693, -3.8274922370910645, -3.7277939319610596, -3.628095865249634, -3.528397560119629, -3.428699254989624, -3.329000949859619, -3.2293028831481934, -3.1296045780181885, -3.0299062728881836, -2.9302079677581787, -2.830509901046753, -2.730811595916748, -2.631113290786743, -2.5314149856567383, -2.4317169189453125, -2.3320186138153076, -2.2323203086853027, -2.132622003555298, -2.032923936843872, -1.9332256317138672, -1.8335273265838623, -1.733829140663147, -1.6341309547424316, -1.5344326496124268, -1.434734582901001, -1.3350363969802856, -1.2353380918502808, -1.1356399059295654, -1.0359416007995605, -0.9362434148788452, -0.8365452289581299, -0.7368469834327698, -0.6371487379074097, -0.5374504923820496, -0.43775227665901184, -0.3380540609359741, -0.238355815410614, -0.1386575698852539, -0.038959383964538574, 0.06073886156082153, 0.16043713688850403]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 15.0, 38.0, 75.0, 173.0, 262.0, 213.0, 130.0, 64.0, 24.0, 13.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3733484745025635, -0.3661007881164551, -0.3588531017303467, -0.3516054153442383, -0.34435775876045227, -0.33711007237434387, -0.3298623859882355, -0.3226146996021271, -0.3153670132160187, -0.3081193268299103, -0.3008716404438019, -0.29362398386001587, -0.28637629747390747, -0.2791286110877991, -0.2718809247016907, -0.2646332383155823, -0.2573855519294739, -0.2501378655433655, -0.24289019405841827, -0.23564250767230988, -0.22839482128620148, -0.22114714980125427, -0.21389946341514587, -0.20665177702903748, -0.19940412044525146, -0.19215643405914307, -0.18490876257419586, -0.17766107618808746, -0.17041338980197906, -0.16316571831703186, -0.15591803193092346, -0.14867034554481506, -0.14142265915870667, -0.13417497277259827, -0.12692730128765106, -0.11967961490154266, -0.11243192851543427, -0.10518424957990646, -0.09793657064437866, -0.09068888425827026, -0.08344120532274246, -0.07619352638721466, -0.06894584000110626, -0.06169816106557846, -0.05445047840476036, -0.04720279574394226, -0.03995511680841446, -0.03270743414759636, -0.02545975148677826, -0.01821206882596016, -0.010964388027787209, -0.003716707229614258, 0.003530975431203842, 0.010778658092021942, 0.018026337027549744, 0.025274019688367844, 0.032521702349185944, 0.039769385010004044, 0.047017067670822144, 0.054264746606349945, 0.061512429267168045, 0.06876011192798615, 0.07600779086351395, 0.08325546979904175, 0.09050315618515015]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 8.0, 12.0, 12.0, 9.0, 21.0, 27.0, 35.0, 33.0, 44.0, 55.0, 74.0, 96.0, 230.0, 18076.0, 1028179.0, 1088.0, 158.0, 92.0, 77.0, 60.0, 32.0, 26.0, 15.0, 17.0, 15.0, 12.0, 8.0, 5.0, 5.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.23560333251953125, -0.2275543212890625, -0.21950531005859375, -0.211456298828125, -0.20340728759765625, -0.1953582763671875, -0.18730926513671875, -0.17926025390625, -0.17121124267578125, -0.1631622314453125, -0.15511322021484375, -0.147064208984375, -0.13901519775390625, -0.1309661865234375, -0.12291717529296875, -0.1148681640625, -0.10681915283203125, -0.0987701416015625, -0.09072113037109375, -0.082672119140625, -0.07462310791015625, -0.0665740966796875, -0.05852508544921875, -0.05047607421875, -0.04242706298828125, -0.0343780517578125, -0.02632904052734375, -0.018280029296875, -0.01023101806640625, -0.0021820068359375, 0.00586700439453125, 0.013916015625, 0.02196502685546875, 0.0300140380859375, 0.03806304931640625, 0.046112060546875, 0.05416107177734375, 0.0622100830078125, 0.07025909423828125, 0.07830810546875, 0.08635711669921875, 0.0944061279296875, 0.10245513916015625, 0.110504150390625, 0.11855316162109375, 0.1266021728515625, 0.13465118408203125, 0.1427001953125, 0.15074920654296875, 0.1587982177734375, 0.16684722900390625, 0.174896240234375, 0.18294525146484375, 0.1909942626953125, 0.19904327392578125, 0.20709228515625, 0.21514129638671875, 0.2231903076171875, 0.23123931884765625, 0.239288330078125, 0.24733734130859375, 0.2553863525390625, 0.26343536376953125, 0.271484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 58.0, 367.0, 472.0, 107.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06219828128814697, -0.060981035232543945, -0.05976378917694092, -0.05854654312133789, -0.05732929706573486, -0.056112051010131836, -0.05489480495452881, -0.05367755889892578, -0.052460312843322754, -0.05124306678771973, -0.0500258207321167, -0.04880857467651367, -0.047591328620910645, -0.04637408256530762, -0.04515683650970459, -0.04393959045410156, -0.042722344398498535, -0.04150509834289551, -0.04028785228729248, -0.03907060623168945, -0.037853360176086426, -0.0366361141204834, -0.03541886806488037, -0.034201622009277344, -0.032984375953674316, -0.03176712989807129, -0.03054988384246826, -0.029332637786865234, -0.028115391731262207, -0.02689814567565918, -0.025680899620056152, -0.024463653564453125, -0.023246407508850098, -0.02202916145324707, -0.020811915397644043, -0.019594669342041016, -0.01837742328643799, -0.01716017723083496, -0.015942931175231934, -0.014725685119628906, -0.013508439064025879, -0.012291193008422852, -0.011073946952819824, -0.009856700897216797, -0.00863945484161377, -0.007422208786010742, -0.006204962730407715, -0.0049877166748046875, -0.00377047061920166, -0.002553224563598633, -0.0013359785079956055, -0.00011873245239257812, 0.0010985136032104492, 0.0023157596588134766, 0.003533005714416504, 0.004750251770019531, 0.005967497825622559, 0.007184743881225586, 0.008401989936828613, 0.00961923599243164, 0.010836482048034668, 0.012053728103637695, 0.013270974159240723, 0.01448822021484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 13.0, 6.0, 7.0, 10.0, 11.0, 26.0, 26.0, 26.0, 69.0, 82.0, 109.0, 192.0, 333.0, 1198.0, 13181.0, 949075.0, 80226.0, 2689.0, 531.0, 262.0, 144.0, 98.0, 80.0, 32.0, 27.0, 23.0, 18.0, 13.0, 11.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1383056640625, -0.1333160400390625, -0.128326416015625, -0.1233367919921875, -0.11834716796875, -0.1133575439453125, -0.108367919921875, -0.1033782958984375, -0.098388671875, -0.0933990478515625, -0.088409423828125, -0.0834197998046875, -0.07843017578125, -0.0734405517578125, -0.068450927734375, -0.0634613037109375, -0.0584716796875, -0.0534820556640625, -0.048492431640625, -0.0435028076171875, -0.03851318359375, -0.0335235595703125, -0.028533935546875, -0.0235443115234375, -0.0185546875, -0.0135650634765625, -0.008575439453125, -0.0035858154296875, 0.00140380859375, 0.0063934326171875, 0.011383056640625, 0.0163726806640625, 0.0213623046875, 0.0263519287109375, 0.031341552734375, 0.0363311767578125, 0.04132080078125, 0.0463104248046875, 0.051300048828125, 0.0562896728515625, 0.061279296875, 0.0662689208984375, 0.071258544921875, 0.0762481689453125, 0.08123779296875, 0.0862274169921875, 0.091217041015625, 0.0962066650390625, 0.1011962890625, 0.1061859130859375, 0.111175537109375, 0.1161651611328125, 0.12115478515625, 0.1261444091796875, 0.131134033203125, 0.1361236572265625, 0.14111328125, 0.1461029052734375, 0.151092529296875, 0.1560821533203125, 0.16107177734375, 0.1660614013671875, 0.171051025390625, 0.1760406494140625, 0.1810302734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 3.0, 8.0, 6.0, 9.0, 15.0, 13.0, 17.0, 20.0, 28.0, 23.0, 46.0, 31.0, 37.0, 56.0, 66.0, 59.0, 64.0, 57.0, 53.0, 60.0, 58.0, 52.0, 41.0, 46.0, 20.0, 33.0, 20.0, 13.0, 11.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049285888671875, -0.0476832389831543, -0.046080589294433594, -0.04447793960571289, -0.04287528991699219, -0.041272640228271484, -0.03966999053955078, -0.03806734085083008, -0.036464691162109375, -0.03486204147338867, -0.03325939178466797, -0.031656742095947266, -0.030054092407226562, -0.02845144271850586, -0.026848793029785156, -0.025246143341064453, -0.02364349365234375, -0.022040843963623047, -0.020438194274902344, -0.01883554458618164, -0.017232894897460938, -0.015630245208740234, -0.014027595520019531, -0.012424945831298828, -0.010822296142578125, -0.009219646453857422, -0.007616996765136719, -0.006014347076416016, -0.0044116973876953125, -0.0028090476989746094, -0.0012063980102539062, 0.0003962516784667969, 0.0019989013671875, 0.003601551055908203, 0.005204200744628906, 0.006806850433349609, 0.008409500122070312, 0.010012149810791016, 0.011614799499511719, 0.013217449188232422, 0.014820098876953125, 0.016422748565673828, 0.01802539825439453, 0.019628047943115234, 0.021230697631835938, 0.02283334732055664, 0.024435997009277344, 0.026038646697998047, 0.02764129638671875, 0.029243946075439453, 0.030846595764160156, 0.03244924545288086, 0.03405189514160156, 0.035654544830322266, 0.03725719451904297, 0.03885984420776367, 0.040462493896484375, 0.04206514358520508, 0.04366779327392578, 0.045270442962646484, 0.04687309265136719, 0.04847574234008789, 0.050078392028808594, 0.0516810417175293, 0.05328369140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 12.0, 9.0, 16.0, 29.0, 35.0, 58.0, 109.0, 180.0, 523.0, 2652.0, 104361.0, 934159.0, 5024.0, 781.0, 268.0, 123.0, 68.0, 36.0, 21.0, 17.0, 24.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12298583984375, -0.11903667449951172, -0.11508750915527344, -0.11113834381103516, -0.10718917846679688, -0.1032400131225586, -0.09929084777832031, -0.09534168243408203, -0.09139251708984375, -0.08744335174560547, -0.08349418640136719, -0.0795450210571289, -0.07559585571289062, -0.07164669036865234, -0.06769752502441406, -0.06374835968017578, -0.0597991943359375, -0.05585002899169922, -0.05190086364746094, -0.047951698303222656, -0.044002532958984375, -0.040053367614746094, -0.03610420227050781, -0.03215503692626953, -0.02820587158203125, -0.02425670623779297, -0.020307540893554688, -0.016358375549316406, -0.012409210205078125, -0.008460044860839844, -0.0045108795166015625, -0.0005617141723632812, 0.003387451171875, 0.007336616516113281, 0.011285781860351562, 0.015234947204589844, 0.019184112548828125, 0.023133277893066406, 0.027082443237304688, 0.03103160858154297, 0.03498077392578125, 0.03892993927001953, 0.04287910461425781, 0.046828269958496094, 0.050777435302734375, 0.054726600646972656, 0.05867576599121094, 0.06262493133544922, 0.0665740966796875, 0.07052326202392578, 0.07447242736816406, 0.07842159271240234, 0.08237075805664062, 0.0863199234008789, 0.09026908874511719, 0.09421825408935547, 0.09816741943359375, 0.10211658477783203, 0.10606575012207031, 0.1100149154663086, 0.11396408081054688, 0.11791324615478516, 0.12186241149902344, 0.12581157684326172, 0.1297607421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 6.0, 7.0, 5.0, 6.0, 10.0, 11.0, 15.0, 15.0, 20.0, 35.0, 80.0, 162.0, 228.0, 141.0, 100.0, 42.0, 26.0, 22.0, 15.0, 11.0, 11.0, 4.0, 7.0, 6.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181529998779297e-05, -2.1103769540786743e-05, -2.0392239093780518e-05, -1.9680708646774292e-05, -1.8969178199768066e-05, -1.825764775276184e-05, -1.7546117305755615e-05, -1.683458685874939e-05, -1.6123056411743164e-05, -1.541152596473694e-05, -1.4699995517730713e-05, -1.3988465070724487e-05, -1.3276934623718262e-05, -1.2565404176712036e-05, -1.185387372970581e-05, -1.1142343282699585e-05, -1.043081283569336e-05, -9.719282388687134e-06, -9.007751941680908e-06, -8.296221494674683e-06, -7.584691047668457e-06, -6.8731606006622314e-06, -6.161630153656006e-06, -5.45009970664978e-06, -4.738569259643555e-06, -4.027038812637329e-06, -3.3155083656311035e-06, -2.603977918624878e-06, -1.8924474716186523e-06, -1.1809170246124268e-06, -4.6938657760620117e-07, 2.421438694000244e-07, 9.5367431640625e-07, 1.6652047634124756e-06, 2.376735210418701e-06, 3.0882656574249268e-06, 3.7997961044311523e-06, 4.511326551437378e-06, 5.2228569984436035e-06, 5.934387445449829e-06, 6.645917892456055e-06, 7.35744833946228e-06, 8.068978786468506e-06, 8.780509233474731e-06, 9.492039680480957e-06, 1.0203570127487183e-05, 1.0915100574493408e-05, 1.1626631021499634e-05, 1.233816146850586e-05, 1.3049691915512085e-05, 1.376122236251831e-05, 1.4472752809524536e-05, 1.5184283256530762e-05, 1.5895813703536987e-05, 1.6607344150543213e-05, 1.731887459754944e-05, 1.8030405044555664e-05, 1.874193549156189e-05, 1.9453465938568115e-05, 2.016499638557434e-05, 2.0876526832580566e-05, 2.1588057279586792e-05, 2.2299587726593018e-05, 2.3011118173599243e-05, 2.372264862060547e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 3.0, 8.0, 20.0, 17.0, 13.0, 42.0, 48.0, 105.0, 242.0, 992.0, 20227.0, 1018983.0, 6686.0, 714.0, 203.0, 84.0, 45.0, 33.0, 21.0, 10.0, 15.0, 14.0, 9.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.14988327026367188, -0.14510345458984375, -0.14032363891601562, -0.1355438232421875, -0.13076400756835938, -0.12598419189453125, -0.12120437622070312, -0.116424560546875, -0.11164474487304688, -0.10686492919921875, -0.10208511352539062, -0.0973052978515625, -0.09252548217773438, -0.08774566650390625, -0.08296585083007812, -0.07818603515625, -0.07340621948242188, -0.06862640380859375, -0.06384658813476562, -0.0590667724609375, -0.054286956787109375, -0.04950714111328125, -0.044727325439453125, -0.039947509765625, -0.035167694091796875, -0.03038787841796875, -0.025608062744140625, -0.0208282470703125, -0.016048431396484375, -0.01126861572265625, -0.006488800048828125, -0.001708984375, 0.003070831298828125, 0.00785064697265625, 0.012630462646484375, 0.0174102783203125, 0.022190093994140625, 0.02696990966796875, 0.031749725341796875, 0.036529541015625, 0.041309356689453125, 0.04608917236328125, 0.050868988037109375, 0.0556488037109375, 0.060428619384765625, 0.06520843505859375, 0.06998825073242188, 0.07476806640625, 0.07954788208007812, 0.08432769775390625, 0.08910751342773438, 0.0938873291015625, 0.09866714477539062, 0.10344696044921875, 0.10822677612304688, 0.113006591796875, 0.11778640747070312, 0.12256622314453125, 0.12734603881835938, 0.1321258544921875, 0.13690567016601562, 0.14168548583984375, 0.14646530151367188, 0.1512451171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 11.0, 12.0, 8.0, 12.0, 29.0, 49.0, 69.0, 142.0, 264.0, 164.0, 86.0, 39.0, 29.0, 13.0, 17.0, 7.0, 6.0, 7.0, 8.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029449462890625, -0.028087139129638672, -0.026724815368652344, -0.025362491607666016, -0.024000167846679688, -0.02263784408569336, -0.02127552032470703, -0.019913196563720703, -0.018550872802734375, -0.017188549041748047, -0.01582622528076172, -0.01446390151977539, -0.013101577758789062, -0.011739253997802734, -0.010376930236816406, -0.009014606475830078, -0.00765228271484375, -0.006289958953857422, -0.004927635192871094, -0.0035653114318847656, -0.0022029876708984375, -0.0008406639099121094, 0.0005216598510742188, 0.0018839836120605469, 0.003246307373046875, 0.004608631134033203, 0.005970954895019531, 0.007333278656005859, 0.008695602416992188, 0.010057926177978516, 0.011420249938964844, 0.012782573699951172, 0.0141448974609375, 0.015507221221923828, 0.016869544982910156, 0.018231868743896484, 0.019594192504882812, 0.02095651626586914, 0.02231884002685547, 0.023681163787841797, 0.025043487548828125, 0.026405811309814453, 0.02776813507080078, 0.02913045883178711, 0.030492782592773438, 0.031855106353759766, 0.033217430114746094, 0.03457975387573242, 0.03594207763671875, 0.03730440139770508, 0.038666725158691406, 0.040029048919677734, 0.04139137268066406, 0.04275369644165039, 0.04411602020263672, 0.04547834396362305, 0.046840667724609375, 0.0482029914855957, 0.04956531524658203, 0.05092763900756836, 0.05228996276855469, 0.053652286529541016, 0.055014610290527344, 0.05637693405151367, 0.0577392578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 25.0, 981.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.728143692016602, -10.500435829162598, -10.272727966308594, -10.045019149780273, -9.81731128692627, -9.589603424072266, -9.361895561218262, -9.134187698364258, -8.906479835510254, -8.67877197265625, -8.451064109802246, -8.223356246948242, -7.99564790725708, -7.767939567565918, -7.540231704711914, -7.31252384185791, -7.084815502166748, -6.857107639312744, -6.629399299621582, -6.401691436767578, -6.173983573913574, -5.94627571105957, -5.718567371368408, -5.490859508514404, -5.263151168823242, -5.035443305969238, -4.807734966278076, -4.580027103424072, -4.352319240570068, -4.124610900878906, -3.8969030380249023, -3.6691951751708984, -3.4414868354797363, -3.2137787342071533, -2.9860708713531494, -2.7583627700805664, -2.5306549072265625, -2.3029468059539795, -2.0752387046813965, -1.847530722618103, -1.6198227405548096, -1.3921147584915161, -1.1644067764282227, -0.9366986751556396, -0.7089906930923462, -0.48128271102905273, -0.2535746097564697, -0.02586662769317627, 0.2018413543701172, 0.42954936623573303, 0.6572573781013489, 0.8849654197692871, 1.1126734018325806, 1.340381383895874, 1.568089485168457, 1.7957974672317505, 2.023505449295044, 2.251213550567627, 2.478921413421631, 2.706629514694214, 2.934337615966797, 3.162045478820801, 3.389753580093384, 3.617461681365967, 3.8451695442199707]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 8.0, 24.0, 23.0, 38.0, 50.0, 63.0, 107.0, 85.0, 98.0, 104.0, 103.0, 77.0, 69.0, 52.0, 31.0, 23.0, 20.0, 14.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8455477952957153, -0.8251144886016846, -0.8046812415122986, -0.7842479348182678, -0.7638146877288818, -0.7433813810348511, -0.7229481339454651, -0.7025148272514343, -0.6820815801620483, -0.6616482734680176, -0.6412150263786316, -0.6207817196846008, -0.6003484725952148, -0.5799151659011841, -0.5594819188117981, -0.5390486121177673, -0.5186153054237366, -0.4981820285320282, -0.4777487516403198, -0.45731547474861145, -0.4368821978569031, -0.4164488911628723, -0.39601561427116394, -0.37558233737945557, -0.3551490604877472, -0.3347157835960388, -0.31428250670433044, -0.29384922981262207, -0.2734159231185913, -0.2529826760292053, -0.23254936933517456, -0.2121160924434662, -0.1916828155517578, -0.17124953866004944, -0.15081626176834106, -0.1303829699754715, -0.10994969308376312, -0.08951641619205475, -0.06908313184976578, -0.04864984750747681, -0.028216570615768433, -0.00778328999876976, 0.012649990618228912, 0.033083271235227585, 0.05351655185222626, 0.07394982874393463, 0.0943831130862236, 0.11481639742851257, 0.13524967432022095, 0.15568295121192932, 0.1761162281036377, 0.19654951989650726, 0.21698279678821564, 0.237416073679924, 0.2578493654727936, 0.27828264236450195, 0.2987159192562103, 0.3191491961479187, 0.3395824730396271, 0.36001574993133545, 0.3804490566253662, 0.4008823037147522, 0.42131561040878296, 0.44174888730049133, 0.4621821641921997]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 20.0, 93.0, 500.0, 4674.0, 4188437.0, 480.0, 66.0, 11.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.2265625, -2.1846771240234375, -2.142791748046875, -2.1009063720703125, -2.05902099609375, -2.0171356201171875, -1.975250244140625, -1.9333648681640625, -1.8914794921875, -1.8495941162109375, -1.807708740234375, -1.7658233642578125, -1.72393798828125, -1.6820526123046875, -1.640167236328125, -1.5982818603515625, -1.556396484375, -1.5145111083984375, -1.472625732421875, -1.4307403564453125, -1.38885498046875, -1.3469696044921875, -1.305084228515625, -1.2631988525390625, -1.2213134765625, -1.1794281005859375, -1.137542724609375, -1.0956573486328125, -1.05377197265625, -1.0118865966796875, -0.970001220703125, -0.9281158447265625, -0.88623046875, -0.8443450927734375, -0.802459716796875, -0.7605743408203125, -0.71868896484375, -0.6768035888671875, -0.634918212890625, -0.5930328369140625, -0.5511474609375, -0.5092620849609375, -0.467376708984375, -0.4254913330078125, -0.38360595703125, -0.3417205810546875, -0.299835205078125, -0.2579498291015625, -0.216064453125, -0.1741790771484375, -0.132293701171875, -0.0904083251953125, -0.04852294921875, -0.0066375732421875, 0.035247802734375, 0.0771331787109375, 0.1190185546875, 0.1609039306640625, 0.202789306640625, 0.2446746826171875, 0.28656005859375, 0.3284454345703125, 0.370330810546875, 0.4122161865234375, 0.4541015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 17.0, 77.0, 242.0, 369.0, 221.0, 75.0, 13.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07171630859375, -0.0703742504119873, -0.06903219223022461, -0.06769013404846191, -0.06634807586669922, -0.06500601768493652, -0.06366395950317383, -0.06232190132141113, -0.06097984313964844, -0.05963778495788574, -0.05829572677612305, -0.05695366859436035, -0.055611610412597656, -0.05426955223083496, -0.052927494049072266, -0.05158543586730957, -0.050243377685546875, -0.04890131950378418, -0.047559261322021484, -0.04621720314025879, -0.044875144958496094, -0.0435330867767334, -0.0421910285949707, -0.04084897041320801, -0.03950691223144531, -0.03816485404968262, -0.03682279586791992, -0.03548073768615723, -0.03413867950439453, -0.032796621322631836, -0.03145456314086914, -0.030112504959106445, -0.02877044677734375, -0.027428388595581055, -0.02608633041381836, -0.024744272232055664, -0.02340221405029297, -0.022060155868530273, -0.020718097686767578, -0.019376039505004883, -0.018033981323242188, -0.016691923141479492, -0.015349864959716797, -0.014007806777954102, -0.012665748596191406, -0.011323690414428711, -0.009981632232666016, -0.00863957405090332, -0.007297515869140625, -0.00595545768737793, -0.004613399505615234, -0.003271341323852539, -0.0019292831420898438, -0.0005872249603271484, 0.0007548332214355469, 0.002096891403198242, 0.0034389495849609375, 0.004781007766723633, 0.006123065948486328, 0.0074651241302490234, 0.008807182312011719, 0.010149240493774414, 0.01149129867553711, 0.012833356857299805, 0.0141754150390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 12.0, 37.0, 99.0, 252.0, 574.0, 4191838.0, 1127.0, 265.0, 65.0, 16.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.80078125, -4.70416259765625, -4.6075439453125, -4.51092529296875, -4.414306640625, -4.31768798828125, -4.2210693359375, -4.12445068359375, -4.02783203125, -3.93121337890625, -3.8345947265625, -3.73797607421875, -3.641357421875, -3.54473876953125, -3.4481201171875, -3.35150146484375, -3.2548828125, -3.15826416015625, -3.0616455078125, -2.96502685546875, -2.868408203125, -2.77178955078125, -2.6751708984375, -2.57855224609375, -2.48193359375, -2.38531494140625, -2.2886962890625, -2.19207763671875, -2.095458984375, -1.99884033203125, -1.9022216796875, -1.80560302734375, -1.708984375, -1.61236572265625, -1.5157470703125, -1.41912841796875, -1.322509765625, -1.22589111328125, -1.1292724609375, -1.03265380859375, -0.93603515625, -0.83941650390625, -0.7427978515625, -0.64617919921875, -0.549560546875, -0.45294189453125, -0.3563232421875, -0.25970458984375, -0.1630859375, -0.06646728515625, 0.0301513671875, 0.12677001953125, 0.223388671875, 0.32000732421875, 0.4166259765625, 0.51324462890625, 0.60986328125, 0.70648193359375, 0.8031005859375, 0.89971923828125, 0.996337890625, 1.09295654296875, 1.1895751953125, 1.28619384765625, 1.3828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 98.0, 3929.0, 51.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.38123321533203125, -0.3728179931640625, -0.36440277099609375, -0.355987548828125, -0.34757232666015625, -0.3391571044921875, -0.33074188232421875, -0.32232666015625, -0.31391143798828125, -0.3054962158203125, -0.29708099365234375, -0.288665771484375, -0.28025054931640625, -0.2718353271484375, -0.26342010498046875, -0.2550048828125, -0.24658966064453125, -0.2381744384765625, -0.22975921630859375, -0.221343994140625, -0.21292877197265625, -0.2045135498046875, -0.19609832763671875, -0.18768310546875, -0.17926788330078125, -0.1708526611328125, -0.16243743896484375, -0.154022216796875, -0.14560699462890625, -0.1371917724609375, -0.12877655029296875, -0.120361328125, -0.11194610595703125, -0.1035308837890625, -0.09511566162109375, -0.086700439453125, -0.07828521728515625, -0.0698699951171875, -0.06145477294921875, -0.05303955078125, -0.04462432861328125, -0.0362091064453125, -0.02779388427734375, -0.019378662109375, -0.01096343994140625, -0.0025482177734375, 0.00586700439453125, 0.0142822265625, 0.02269744873046875, 0.0311126708984375, 0.03952789306640625, 0.047943115234375, 0.05635833740234375, 0.0647735595703125, 0.07318878173828125, 0.08160400390625, 0.09001922607421875, 0.0984344482421875, 0.10684967041015625, 0.115264892578125, 0.12368011474609375, 0.1320953369140625, 0.14051055908203125, 0.14892578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 474.0, 519.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.111863613128662, -5.973001003265381, -5.834138870239258, -5.695276260375977, -5.5564141273498535, -5.417551517486572, -5.278689384460449, -5.139826774597168, -5.000964164733887, -4.8621015548706055, -4.723239421844482, -4.584376811981201, -4.445514678955078, -4.306652069091797, -4.167789936065674, -4.028927326202393, -3.8900651931762695, -3.7512028217315674, -3.6123404502868652, -3.473478078842163, -3.334615707397461, -3.1957530975341797, -3.0568907260894775, -2.9180283546447754, -2.7791659832000732, -2.640303611755371, -2.501441240310669, -2.362578868865967, -2.2237162590026855, -2.0848541259765625, -1.9459915161132812, -1.807129144668579, -1.6682665348052979, -1.5294041633605957, -1.3905417919158936, -1.2516793012619019, -1.1128169298171997, -0.9739545583724976, -0.8350921273231506, -0.6962296962738037, -0.5573673248291016, -0.418504923582077, -0.2796425223350525, -0.14078012108802795, -0.001917719841003418, 0.13694465160369873, 0.27580708265304565, 0.4146695137023926, 0.5535318851470947, 0.6923942565917969, 0.8312566876411438, 0.9701191186904907, 1.1089814901351929, 1.247843861579895, 1.3867063522338867, 1.5255687236785889, 1.664431095123291, 1.8032934665679932, 1.9421558380126953, 2.0810182094573975, 2.2198805809020996, 2.358743190765381, 2.497605562210083, 2.636467933654785, 2.7753303050994873]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 8.0, 14.0, 35.0, 43.0, 94.0, 137.0, 176.0, 154.0, 136.0, 82.0, 62.0, 35.0, 15.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3110356330871582, -1.2696609497070312, -1.2282861471176147, -1.1869114637374878, -1.1455366611480713, -1.1041619777679443, -1.0627872943878174, -1.0214126110076904, -0.9800378084182739, -0.9386630654335022, -0.8972883224487305, -0.8559136390686035, -0.8145388960838318, -0.7731641530990601, -0.7317894697189331, -0.6904147267341614, -0.6490399837493896, -0.6076652407646179, -0.5662904977798462, -0.5249158143997192, -0.4835410714149475, -0.4421663284301758, -0.40079161524772644, -0.3594169020652771, -0.31804215908050537, -0.27666741609573364, -0.2352927029132843, -0.19391797482967377, -0.15254324674606323, -0.1111685186624527, -0.06979379057884216, -0.028419077396392822, 0.012955784797668457, 0.05433051288127899, 0.09570524096488953, 0.13707996904850006, 0.1784546971321106, 0.21982942521572113, 0.26120415329933167, 0.302578866481781, 0.34395360946655273, 0.38532835245132446, 0.4267030656337738, 0.46807777881622314, 0.5094525218009949, 0.5508272647857666, 0.5922019481658936, 0.6335766911506653, 0.674951434135437, 0.7163261771202087, 0.7577009201049805, 0.7990756034851074, 0.8404503464698792, 0.8818250894546509, 0.9231997728347778, 0.9645745158195496, 1.0059492588043213, 1.0473239421844482, 1.0886987447738647, 1.1300734281539917, 1.1714482307434082, 1.2128229141235352, 1.254197597503662, 1.295572280883789, 1.3369470834732056]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 7.0, 14.0, 30.0, 43.0, 53.0, 127.0, 218.0, 679.0, 2481.0, 25411.0, 981566.0, 33772.0, 2841.0, 752.0, 233.0, 120.0, 68.0, 40.0, 32.0, 17.0, 8.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51513671875, -0.5002212524414062, -0.4853057861328125, -0.47039031982421875, -0.455474853515625, -0.44055938720703125, -0.4256439208984375, -0.41072845458984375, -0.39581298828125, -0.38089752197265625, -0.3659820556640625, -0.35106658935546875, -0.336151123046875, -0.32123565673828125, -0.3063201904296875, -0.29140472412109375, -0.2764892578125, -0.26157379150390625, -0.2466583251953125, -0.23174285888671875, -0.216827392578125, -0.20191192626953125, -0.1869964599609375, -0.17208099365234375, -0.15716552734375, -0.14225006103515625, -0.1273345947265625, -0.11241912841796875, -0.097503662109375, -0.08258819580078125, -0.0676727294921875, -0.05275726318359375, -0.037841796875, -0.02292633056640625, -0.0080108642578125, 0.00690460205078125, 0.021820068359375, 0.03673553466796875, 0.0516510009765625, 0.06656646728515625, 0.08148193359375, 0.09639739990234375, 0.1113128662109375, 0.12622833251953125, 0.141143798828125, 0.15605926513671875, 0.1709747314453125, 0.18589019775390625, 0.2008056640625, 0.21572113037109375, 0.2306365966796875, 0.24555206298828125, 0.260467529296875, 0.27538299560546875, 0.2902984619140625, 0.30521392822265625, 0.32012939453125, 0.33504486083984375, 0.3499603271484375, 0.36487579345703125, 0.379791259765625, 0.39470672607421875, 0.4096221923828125, 0.42453765869140625, 0.439453125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 15.0, 32.0, 47.0, 120.0, 143.0, 207.0, 165.0, 130.0, 72.0, 45.0, 16.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10443115234375, -0.10209083557128906, -0.09975051879882812, -0.09741020202636719, -0.09506988525390625, -0.09272956848144531, -0.09038925170898438, -0.08804893493652344, -0.0857086181640625, -0.08336830139160156, -0.08102798461914062, -0.07868766784667969, -0.07634735107421875, -0.07400703430175781, -0.07166671752929688, -0.06932640075683594, -0.066986083984375, -0.06464576721191406, -0.062305450439453125, -0.05996513366699219, -0.05762481689453125, -0.05528450012207031, -0.052944183349609375, -0.05060386657714844, -0.0482635498046875, -0.04592323303222656, -0.043582916259765625, -0.04124259948730469, -0.03890228271484375, -0.03656196594238281, -0.034221649169921875, -0.03188133239746094, -0.029541015625, -0.027200698852539062, -0.024860382080078125, -0.022520065307617188, -0.02017974853515625, -0.017839431762695312, -0.015499114990234375, -0.013158798217773438, -0.0108184814453125, -0.008478164672851562, -0.006137847900390625, -0.0037975311279296875, -0.00145721435546875, 0.0008831024169921875, 0.003223419189453125, 0.0055637359619140625, 0.007904052734375, 0.010244369506835938, 0.012584686279296875, 0.014925003051757812, 0.01726531982421875, 0.019605636596679688, 0.021945953369140625, 0.024286270141601562, 0.0266265869140625, 0.028966903686523438, 0.031307220458984375, 0.03364753723144531, 0.03598785400390625, 0.03832817077636719, 0.040668487548828125, 0.04300880432128906, 0.04534912109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 6.0, 8.0, 12.0, 14.0, 19.0, 23.0, 35.0, 48.0, 80.0, 146.0, 286.0, 1053.0, 17919.0, 1006591.0, 20495.0, 1080.0, 304.0, 141.0, 88.0, 51.0, 33.0, 33.0, 20.0, 8.0, 8.0, 14.0, 5.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42431640625, -0.4116554260253906, -0.39899444580078125, -0.3863334655761719, -0.3736724853515625, -0.3610115051269531, -0.34835052490234375, -0.3356895446777344, -0.323028564453125, -0.3103675842285156, -0.29770660400390625, -0.2850456237792969, -0.2723846435546875, -0.2597236633300781, -0.24706268310546875, -0.23440170288085938, -0.22174072265625, -0.20907974243164062, -0.19641876220703125, -0.18375778198242188, -0.1710968017578125, -0.15843582153320312, -0.14577484130859375, -0.13311386108398438, -0.120452880859375, -0.10779190063476562, -0.09513092041015625, -0.08246994018554688, -0.0698089599609375, -0.057147979736328125, -0.04448699951171875, -0.031826019287109375, -0.0191650390625, -0.006504058837890625, 0.00615692138671875, 0.018817901611328125, 0.0314788818359375, 0.044139862060546875, 0.05680084228515625, 0.06946182250976562, 0.082122802734375, 0.09478378295898438, 0.10744476318359375, 0.12010574340820312, 0.1327667236328125, 0.14542770385742188, 0.15808868408203125, 0.17074966430664062, 0.18341064453125, 0.19607162475585938, 0.20873260498046875, 0.22139358520507812, 0.2340545654296875, 0.24671554565429688, 0.25937652587890625, 0.2720375061035156, 0.284698486328125, 0.2973594665527344, 0.31002044677734375, 0.3226814270019531, 0.3353424072265625, 0.3480033874511719, 0.36066436767578125, 0.3733253479003906, 0.385986328125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 10.0, 6.0, 7.0, 16.0, 17.0, 20.0, 31.0, 35.0, 38.0, 45.0, 54.0, 52.0, 48.0, 54.0, 56.0, 67.0, 55.0, 50.0, 49.0, 47.0, 50.0, 45.0, 34.0, 27.0, 20.0, 15.0, 11.0, 10.0, 9.0, 5.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13801193237304688, -0.13381195068359375, -0.12961196899414062, -0.1254119873046875, -0.12121200561523438, -0.11701202392578125, -0.11281204223632812, -0.108612060546875, -0.10441207885742188, -0.10021209716796875, -0.09601211547851562, -0.0918121337890625, -0.08761215209960938, -0.08341217041015625, -0.07921218872070312, -0.07501220703125, -0.07081222534179688, -0.06661224365234375, -0.062412261962890625, -0.0582122802734375, -0.054012298583984375, -0.04981231689453125, -0.045612335205078125, -0.041412353515625, -0.037212371826171875, -0.03301239013671875, -0.028812408447265625, -0.0246124267578125, -0.020412445068359375, -0.01621246337890625, -0.012012481689453125, -0.0078125, -0.003612518310546875, 0.00058746337890625, 0.004787445068359375, 0.0089874267578125, 0.013187408447265625, 0.01738739013671875, 0.021587371826171875, 0.025787353515625, 0.029987335205078125, 0.03418731689453125, 0.038387298583984375, 0.0425872802734375, 0.046787261962890625, 0.05098724365234375, 0.055187225341796875, 0.05938720703125, 0.06358718872070312, 0.06778717041015625, 0.07198715209960938, 0.0761871337890625, 0.08038711547851562, 0.08458709716796875, 0.08878707885742188, 0.092987060546875, 0.09718704223632812, 0.10138702392578125, 0.10558700561523438, 0.1097869873046875, 0.11398696899414062, 0.11818695068359375, 0.12238693237304688, 0.1265869140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 5.0, 5.0, 10.0, 19.0, 26.0, 55.0, 92.0, 224.0, 508.0, 1859.0, 14387.0, 974706.0, 52177.0, 3148.0, 749.0, 272.0, 114.0, 68.0, 47.0, 19.0, 15.0, 13.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08709716796875, -0.0838308334350586, -0.08056449890136719, -0.07729816436767578, -0.07403182983398438, -0.07076549530029297, -0.06749916076660156, -0.06423282623291016, -0.06096649169921875, -0.057700157165527344, -0.05443382263183594, -0.05116748809814453, -0.047901153564453125, -0.04463481903076172, -0.04136848449707031, -0.038102149963378906, -0.0348358154296875, -0.031569480895996094, -0.028303146362304688, -0.02503681182861328, -0.021770477294921875, -0.01850414276123047, -0.015237808227539062, -0.011971473693847656, -0.00870513916015625, -0.005438804626464844, -0.0021724700927734375, 0.0010938644409179688, 0.004360198974609375, 0.007626533508300781, 0.010892868041992188, 0.014159202575683594, 0.017425537109375, 0.020691871643066406, 0.023958206176757812, 0.02722454071044922, 0.030490875244140625, 0.03375720977783203, 0.03702354431152344, 0.040289878845214844, 0.04355621337890625, 0.046822547912597656, 0.05008888244628906, 0.05335521697998047, 0.056621551513671875, 0.05988788604736328, 0.06315422058105469, 0.0664205551147461, 0.0696868896484375, 0.0729532241821289, 0.07621955871582031, 0.07948589324951172, 0.08275222778320312, 0.08601856231689453, 0.08928489685058594, 0.09255123138427734, 0.09581756591796875, 0.09908390045166016, 0.10235023498535156, 0.10561656951904297, 0.10888290405273438, 0.11214923858642578, 0.11541557312011719, 0.1186819076538086, 0.1219482421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 6.0, 3.0, 2.0, 9.0, 6.0, 16.0, 17.0, 27.0, 39.0, 69.0, 103.0, 129.0, 137.0, 141.0, 95.0, 71.0, 32.0, 20.0, 9.0, 14.0, 11.0, 5.0, 13.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-1.8894672393798828e-05, -1.838989555835724e-05, -1.788511872291565e-05, -1.738034188747406e-05, -1.687556505203247e-05, -1.637078821659088e-05, -1.5866011381149292e-05, -1.5361234545707703e-05, -1.4856457710266113e-05, -1.4351680874824524e-05, -1.3846904039382935e-05, -1.3342127203941345e-05, -1.2837350368499756e-05, -1.2332573533058167e-05, -1.1827796697616577e-05, -1.1323019862174988e-05, -1.0818243026733398e-05, -1.0313466191291809e-05, -9.80868935585022e-06, -9.30391252040863e-06, -8.799135684967041e-06, -8.294358849525452e-06, -7.789582014083862e-06, -7.284805178642273e-06, -6.780028343200684e-06, -6.275251507759094e-06, -5.770474672317505e-06, -5.2656978368759155e-06, -4.760921001434326e-06, -4.256144165992737e-06, -3.7513673305511475e-06, -3.246590495109558e-06, -2.7418136596679688e-06, -2.2370368242263794e-06, -1.73225998878479e-06, -1.2274831533432007e-06, -7.227063179016113e-07, -2.1792948246002197e-07, 2.868473529815674e-07, 7.916241884231567e-07, 1.296401023864746e-06, 1.8011778593063354e-06, 2.305954694747925e-06, 2.810731530189514e-06, 3.3155083656311035e-06, 3.820285201072693e-06, 4.325062036514282e-06, 4.829838871955872e-06, 5.334615707397461e-06, 5.83939254283905e-06, 6.34416937828064e-06, 6.848946213722229e-06, 7.353723049163818e-06, 7.858499884605408e-06, 8.363276720046997e-06, 8.868053555488586e-06, 9.372830390930176e-06, 9.877607226371765e-06, 1.0382384061813354e-05, 1.0887160897254944e-05, 1.1391937732696533e-05, 1.1896714568138123e-05, 1.2401491403579712e-05, 1.2906268239021301e-05, 1.341104507446289e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 10.0, 36.0, 55.0, 185.0, 1053.0, 69277.0, 975832.0, 1713.0, 228.0, 81.0, 32.0, 15.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30419921875, -0.2971477508544922, -0.2900962829589844, -0.28304481506347656, -0.27599334716796875, -0.26894187927246094, -0.2618904113769531, -0.2548389434814453, -0.2477874755859375, -0.2407360076904297, -0.23368453979492188, -0.22663307189941406, -0.21958160400390625, -0.21253013610839844, -0.20547866821289062, -0.1984272003173828, -0.191375732421875, -0.1843242645263672, -0.17727279663085938, -0.17022132873535156, -0.16316986083984375, -0.15611839294433594, -0.14906692504882812, -0.1420154571533203, -0.1349639892578125, -0.1279125213623047, -0.12086105346679688, -0.11380958557128906, -0.10675811767578125, -0.09970664978027344, -0.09265518188476562, -0.08560371398925781, -0.07855224609375, -0.07150077819824219, -0.06444931030273438, -0.05739784240722656, -0.05034637451171875, -0.04329490661621094, -0.036243438720703125, -0.029191970825195312, -0.0221405029296875, -0.015089035034179688, -0.008037567138671875, -0.0009860992431640625, 0.00606536865234375, 0.013116836547851562, 0.020168304443359375, 0.027219772338867188, 0.034271240234375, 0.04132270812988281, 0.048374176025390625, 0.05542564392089844, 0.06247711181640625, 0.06952857971191406, 0.07658004760742188, 0.08363151550292969, 0.0906829833984375, 0.09773445129394531, 0.10478591918945312, 0.11183738708496094, 0.11888885498046875, 0.12594032287597656, 0.13299179077148438, 0.1400432586669922, 0.1470947265625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 11.0, 7.0, 21.0, 20.0, 51.0, 100.0, 209.0, 228.0, 188.0, 76.0, 45.0, 24.0, 10.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.107421875, -0.10494613647460938, -0.10247039794921875, -0.09999465942382812, -0.0975189208984375, -0.09504318237304688, -0.09256744384765625, -0.09009170532226562, -0.087615966796875, -0.08514022827148438, -0.08266448974609375, -0.08018875122070312, -0.0777130126953125, -0.07523727416992188, -0.07276153564453125, -0.07028579711914062, -0.06781005859375, -0.06533432006835938, -0.06285858154296875, -0.060382843017578125, -0.0579071044921875, -0.055431365966796875, -0.05295562744140625, -0.050479888916015625, -0.048004150390625, -0.045528411865234375, -0.04305267333984375, -0.040576934814453125, -0.0381011962890625, -0.035625457763671875, -0.03314971923828125, -0.030673980712890625, -0.0281982421875, -0.025722503662109375, -0.02324676513671875, -0.020771026611328125, -0.0182952880859375, -0.015819549560546875, -0.01334381103515625, -0.010868072509765625, -0.008392333984375, -0.005916595458984375, -0.00344085693359375, -0.000965118408203125, 0.0015106201171875, 0.003986358642578125, 0.00646209716796875, 0.008937835693359375, 0.01141357421875, 0.013889312744140625, 0.01636505126953125, 0.018840789794921875, 0.0213165283203125, 0.023792266845703125, 0.02626800537109375, 0.028743743896484375, 0.031219482421875, 0.033695220947265625, 0.03617095947265625, 0.038646697998046875, 0.0411224365234375, 0.043598175048828125, 0.04607391357421875, 0.048549652099609375, 0.051025390625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 9.0, 289.0, 656.0, 41.0, 9.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3387821614742279, -0.22615563869476318, -0.11352911591529846, -0.0009025931358337402, 0.11172392964363098, 0.2243504822254181, 0.3369769752025604, 0.44960346817970276, 0.5622299909591675, 0.6748565435409546, 0.7874830365180969, 0.9001095294952393, 1.0127360820770264, 1.1253626346588135, 1.2379891872406006, 1.3506156206130981, 1.4632421731948853, 1.5758687257766724, 1.68849515914917, 1.801121711730957, 1.9137482643127441, 2.0263748168945312, 2.1390013694763184, 2.2516279220581055, 2.3642544746398926, 2.4768810272216797, 2.589507579803467, 2.702134132385254, 2.814760684967041, 2.927387237548828, 3.040013551712036, 3.1526401042938232, 3.2652664184570312, 3.3778929710388184, 3.4905195236206055, 3.6031460762023926, 3.7157726287841797, 3.828399181365967, 3.941025495529175, 4.053651809692383, 4.166278839111328, 4.278905391693115, 4.391531944274902, 4.5041584968566895, 4.616785049438477, 4.729411602020264, 4.842038154602051, 4.95466423034668, 5.067290782928467, 5.179917335510254, 5.292543888092041, 5.405170440673828, 5.517796993255615, 5.630423545837402, 5.7430500984191895, 5.855676651000977, 5.9683027267456055, 6.080929279327393, 6.19355583190918, 6.306182384490967, 6.418808937072754, 6.531435489654541, 6.644062042236328, 6.756688117980957, 6.869315147399902]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 8.0, 7.0, 9.0, 15.0, 19.0, 19.0, 36.0, 41.0, 35.0, 48.0, 68.0, 72.0, 71.0, 64.0, 54.0, 64.0, 69.0, 64.0, 45.0, 39.0, 37.0, 22.0, 25.0, 9.0, 18.0, 14.0, 10.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0854626893997192, -1.054032325744629, -1.0226019620895386, -0.9911715984344482, -0.9597412347793579, -0.9283108711242676, -0.8968804478645325, -0.8654500842094421, -0.8340197205543518, -0.8025893568992615, -0.7711589932441711, -0.7397286295890808, -0.7082982063293457, -0.6768678426742554, -0.645437479019165, -0.6140071153640747, -0.5825767517089844, -0.551146388053894, -0.5197160243988037, -0.488285630941391, -0.45685526728630066, -0.4254249036312103, -0.3939945101737976, -0.3625641465187073, -0.33113378286361694, -0.2997034192085266, -0.2682730555534363, -0.23684266209602356, -0.20541229844093323, -0.1739819347858429, -0.14255155622959137, -0.11112117767333984, -0.07969075441360474, -0.04826038330793381, -0.01683001220226288, 0.01460035890340805, 0.04603073000907898, 0.07746109366416931, 0.10889147222042084, 0.14032185077667236, 0.1717522144317627, 0.20318257808685303, 0.23461295664310455, 0.2660433351993561, 0.2974736988544464, 0.32890406250953674, 0.36033445596694946, 0.3917648196220398, 0.4231951832771301, 0.45462554693222046, 0.4860559105873108, 0.5174862742424011, 0.5489166975021362, 0.5803470611572266, 0.6117774248123169, 0.6432077884674072, 0.6746381521224976, 0.7060685157775879, 0.7374988794326782, 0.7689292430877686, 0.8003596067428589, 0.8317899703979492, 0.8632203936576843, 0.8946507573127747, 0.926081120967865]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 11.0, 20.0, 25.0, 52.0, 112.0, 162.0, 374.0, 1238.0, 10997.0, 4134398.0, 45083.0, 1385.0, 262.0, 82.0, 37.0, 16.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.19921875, -1.1755485534667969, -1.1518783569335938, -1.1282081604003906, -1.1045379638671875, -1.0808677673339844, -1.0571975708007812, -1.0335273742675781, -1.009857177734375, -0.9861869812011719, -0.9625167846679688, -0.9388465881347656, -0.9151763916015625, -0.8915061950683594, -0.8678359985351562, -0.8441658020019531, -0.82049560546875, -0.7968254089355469, -0.7731552124023438, -0.7494850158691406, -0.7258148193359375, -0.7021446228027344, -0.6784744262695312, -0.6548042297363281, -0.631134033203125, -0.6074638366699219, -0.5837936401367188, -0.5601234436035156, -0.5364532470703125, -0.5127830505371094, -0.48911285400390625, -0.4654426574707031, -0.4417724609375, -0.4181022644042969, -0.39443206787109375, -0.3707618713378906, -0.3470916748046875, -0.3234214782714844, -0.29975128173828125, -0.2760810852050781, -0.252410888671875, -0.22874069213867188, -0.20507049560546875, -0.18140029907226562, -0.1577301025390625, -0.13405990600585938, -0.11038970947265625, -0.08671951293945312, -0.06304931640625, -0.039379119873046875, -0.01570892333984375, 0.007961273193359375, 0.0316314697265625, 0.055301666259765625, 0.07897186279296875, 0.10264205932617188, 0.126312255859375, 0.14998245239257812, 0.17365264892578125, 0.19732284545898438, 0.2209930419921875, 0.24466323852539062, 0.26833343505859375, 0.2920036315917969, 0.315673828125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 9.0, 13.0, 44.0, 64.0, 109.0, 155.0, 177.0, 123.0, 123.0, 92.0, 46.0, 22.0, 14.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.10809326171875, -0.1059563159942627, -0.10381937026977539, -0.10168242454528809, -0.09954547882080078, -0.09740853309631348, -0.09527158737182617, -0.09313464164733887, -0.09099769592285156, -0.08886075019836426, -0.08672380447387695, -0.08458685874938965, -0.08244991302490234, -0.08031296730041504, -0.07817602157592773, -0.07603907585144043, -0.07390213012695312, -0.07176518440246582, -0.06962823867797852, -0.06749129295349121, -0.0653543472290039, -0.0632174015045166, -0.0610804557800293, -0.05894351005554199, -0.05680656433105469, -0.05466961860656738, -0.05253267288208008, -0.05039572715759277, -0.04825878143310547, -0.046121835708618164, -0.04398488998413086, -0.041847944259643555, -0.03971099853515625, -0.037574052810668945, -0.03543710708618164, -0.033300161361694336, -0.03116321563720703, -0.029026269912719727, -0.026889324188232422, -0.024752378463745117, -0.022615432739257812, -0.020478487014770508, -0.018341541290283203, -0.0162045955657959, -0.014067649841308594, -0.011930704116821289, -0.009793758392333984, -0.00765681266784668, -0.005519866943359375, -0.0033829212188720703, -0.0012459754943847656, 0.0008909702301025391, 0.0030279159545898438, 0.0051648616790771484, 0.007301807403564453, 0.009438753128051758, 0.011575698852539062, 0.013712644577026367, 0.015849590301513672, 0.017986536026000977, 0.02012348175048828, 0.022260427474975586, 0.02439737319946289, 0.026534318923950195, 0.0286712646484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 13.0, 18.0, 133.0, 565.0, 3482216.0, 710922.0, 298.0, 70.0, 27.0, 14.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.2734375, -4.18963623046875, -4.1058349609375, -4.02203369140625, -3.938232421875, -3.85443115234375, -3.7706298828125, -3.68682861328125, -3.60302734375, -3.51922607421875, -3.4354248046875, -3.35162353515625, -3.267822265625, -3.18402099609375, -3.1002197265625, -3.01641845703125, -2.9326171875, -2.84881591796875, -2.7650146484375, -2.68121337890625, -2.597412109375, -2.51361083984375, -2.4298095703125, -2.34600830078125, -2.26220703125, -2.17840576171875, -2.0946044921875, -2.01080322265625, -1.927001953125, -1.84320068359375, -1.7593994140625, -1.67559814453125, -1.591796875, -1.50799560546875, -1.4241943359375, -1.34039306640625, -1.256591796875, -1.17279052734375, -1.0889892578125, -1.00518798828125, -0.92138671875, -0.83758544921875, -0.7537841796875, -0.66998291015625, -0.586181640625, -0.50238037109375, -0.4185791015625, -0.33477783203125, -0.2509765625, -0.16717529296875, -0.0833740234375, 0.00042724609375, 0.084228515625, 0.16802978515625, 0.2518310546875, 0.33563232421875, 0.41943359375, 0.50323486328125, 0.5870361328125, 0.67083740234375, 0.754638671875, 0.83843994140625, 0.9222412109375, 1.00604248046875, 1.08984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 22.0, 76.0, 601.0, 3143.0, 131.0, 45.0, 16.0, 16.0, 10.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.31982421875, -0.3137025833129883, -0.30758094787597656, -0.30145931243896484, -0.2953376770019531, -0.2892160415649414, -0.2830944061279297, -0.27697277069091797, -0.27085113525390625, -0.26472949981689453, -0.2586078643798828, -0.2524862289428711, -0.24636459350585938, -0.24024295806884766, -0.23412132263183594, -0.22799968719482422, -0.2218780517578125, -0.21575641632080078, -0.20963478088378906, -0.20351314544677734, -0.19739151000976562, -0.1912698745727539, -0.1851482391357422, -0.17902660369873047, -0.17290496826171875, -0.16678333282470703, -0.1606616973876953, -0.1545400619506836, -0.14841842651367188, -0.14229679107666016, -0.13617515563964844, -0.13005352020263672, -0.123931884765625, -0.11781024932861328, -0.11168861389160156, -0.10556697845458984, -0.09944534301757812, -0.0933237075805664, -0.08720207214355469, -0.08108043670654297, -0.07495880126953125, -0.06883716583251953, -0.06271553039550781, -0.056593894958496094, -0.050472259521484375, -0.044350624084472656, -0.03822898864746094, -0.03210735321044922, -0.0259857177734375, -0.01986408233642578, -0.013742446899414062, -0.007620811462402344, -0.001499176025390625, 0.004622459411621094, 0.010744094848632812, 0.01686573028564453, 0.02298736572265625, 0.02910900115966797, 0.03523063659667969, 0.041352272033691406, 0.047473907470703125, 0.053595542907714844, 0.05971717834472656, 0.06583881378173828, 0.07196044921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 12.0, 51.0, 864.0, 74.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3138628005981445, -2.2333102226257324, -2.1527578830718994, -2.0722053050994873, -1.9916527271270752, -1.9111002683639526, -1.83054780960083, -1.749995231628418, -1.6694427728652954, -1.5888903141021729, -1.5083377361297607, -1.4277852773666382, -1.3472328186035156, -1.2666802406311035, -1.186127781867981, -1.1055753231048584, -1.0250227451324463, -0.944470226764679, -0.8639177083969116, -0.7833652496337891, -0.7028127312660217, -0.6222602128982544, -0.5417077541351318, -0.4611552357673645, -0.38060271739959717, -0.30005019903182983, -0.2194977104663849, -0.13894520699977875, -0.05839270353317261, 0.022159814834594727, 0.10271230340003967, 0.18326479196548462, 0.26381707191467285, 0.3443695902824402, 0.42492207884788513, 0.5054745674133301, 0.5860270857810974, 0.6665796041488647, 0.7471320629119873, 0.8276845812797546, 0.908237099647522, 0.9887896180152893, 1.0693421363830566, 1.1498945951461792, 1.2304470539093018, 1.3109996318817139, 1.3915520906448364, 1.472104549407959, 1.552657127380371, 1.6332095861434937, 1.7137621641159058, 1.7943146228790283, 1.8748672008514404, 1.955419659614563, 2.0359721183776855, 2.1165246963500977, 2.1970772743225098, 2.277629852294922, 2.358182191848755, 2.438734769821167, 2.519287347793579, 2.599839687347412, 2.680392265319824, 2.7609448432922363, 2.8414971828460693]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 6.0, 18.0, 18.0, 44.0, 54.0, 65.0, 99.0, 105.0, 116.0, 105.0, 110.0, 92.0, 66.0, 39.0, 29.0, 10.0, 15.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.987154483795166, -0.9595654606819153, -0.9319764375686646, -0.9043874740600586, -0.8767984509468079, -0.8492094278335571, -0.8216204047203064, -0.7940313816070557, -0.7664424180984497, -0.738853394985199, -0.7112643718719482, -0.6836754083633423, -0.6560863852500916, -0.6284973621368408, -0.6009083390235901, -0.5733193159103394, -0.5457302927970886, -0.5181412696838379, -0.49055227637290955, -0.4629632532596588, -0.43537425994873047, -0.40778523683547974, -0.380196213722229, -0.35260719060897827, -0.3250181972980499, -0.2974291741847992, -0.26984018087387085, -0.24225115776062012, -0.21466214954853058, -0.18707314133644104, -0.1594841182231903, -0.13189511001110077, -0.104306161403656, -0.07671715319156647, -0.04912813752889633, -0.021539121866226196, 0.006049886345863342, 0.03363889455795288, 0.06122791767120361, 0.08881692588329315, 0.11640593409538269, 0.14399494230747223, 0.17158395051956177, 0.1991729736328125, 0.22676198184490204, 0.2543509900569916, 0.2819400131702423, 0.30952900648117065, 0.3371180295944214, 0.3647070527076721, 0.39229604601860046, 0.4198850691318512, 0.44747406244277954, 0.4750630855560303, 0.502652108669281, 0.5302411317825317, 0.5578300952911377, 0.5854191184043884, 0.6130081415176392, 0.6405971050262451, 0.6681861281394958, 0.6957751512527466, 0.7233641743659973, 0.750953197479248, 0.7785422205924988]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 5.0, 9.0, 8.0, 15.0, 22.0, 18.0, 24.0, 29.0, 46.0, 67.0, 62.0, 89.0, 143.0, 179.0, 252.0, 461.0, 776.0, 1596.0, 4072.0, 11913.0, 46559.0, 281821.0, 591349.0, 79951.0, 18670.0, 5573.0, 2150.0, 957.0, 551.0, 347.0, 217.0, 160.0, 110.0, 88.0, 62.0, 46.0, 38.0, 30.0, 19.0, 18.0, 6.0, 13.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1710205078125, -0.1658649444580078, -0.16070938110351562, -0.15555381774902344, -0.15039825439453125, -0.14524269104003906, -0.14008712768554688, -0.1349315643310547, -0.1297760009765625, -0.12462043762207031, -0.11946487426757812, -0.11430931091308594, -0.10915374755859375, -0.10399818420410156, -0.09884262084960938, -0.09368705749511719, -0.088531494140625, -0.08337593078613281, -0.07822036743164062, -0.07306480407714844, -0.06790924072265625, -0.06275367736816406, -0.057598114013671875, -0.05244255065917969, -0.0472869873046875, -0.04213142395019531, -0.036975860595703125, -0.03182029724121094, -0.02666473388671875, -0.021509170532226562, -0.016353607177734375, -0.011198043823242188, -0.00604248046875, -0.0008869171142578125, 0.004268646240234375, 0.009424209594726562, 0.01457977294921875, 0.019735336303710938, 0.024890899658203125, 0.030046463012695312, 0.0352020263671875, 0.04035758972167969, 0.045513153076171875, 0.05066871643066406, 0.05582427978515625, 0.06097984313964844, 0.06613540649414062, 0.07129096984863281, 0.076446533203125, 0.08160209655761719, 0.08675765991210938, 0.09191322326660156, 0.09706878662109375, 0.10222434997558594, 0.10737991333007812, 0.11253547668457031, 0.1176910400390625, 0.12284660339355469, 0.12800216674804688, 0.13315773010253906, 0.13831329345703125, 0.14346885681152344, 0.14862442016601562, 0.1537799835205078, 0.158935546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 15.0, 30.0, 54.0, 65.0, 85.0, 98.0, 111.0, 122.0, 104.0, 94.0, 61.0, 57.0, 42.0, 15.0, 18.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0986328125, -0.096343994140625, -0.09405517578125, -0.091766357421875, -0.0894775390625, -0.087188720703125, -0.08489990234375, -0.082611083984375, -0.080322265625, -0.078033447265625, -0.07574462890625, -0.073455810546875, -0.0711669921875, -0.068878173828125, -0.06658935546875, -0.064300537109375, -0.06201171875, -0.059722900390625, -0.05743408203125, -0.055145263671875, -0.0528564453125, -0.050567626953125, -0.04827880859375, -0.045989990234375, -0.043701171875, -0.041412353515625, -0.03912353515625, -0.036834716796875, -0.0345458984375, -0.032257080078125, -0.02996826171875, -0.027679443359375, -0.025390625, -0.023101806640625, -0.02081298828125, -0.018524169921875, -0.0162353515625, -0.013946533203125, -0.01165771484375, -0.009368896484375, -0.007080078125, -0.004791259765625, -0.00250244140625, -0.000213623046875, 0.0020751953125, 0.004364013671875, 0.00665283203125, 0.008941650390625, 0.01123046875, 0.013519287109375, 0.01580810546875, 0.018096923828125, 0.0203857421875, 0.022674560546875, 0.02496337890625, 0.027252197265625, 0.029541015625, 0.031829833984375, 0.03411865234375, 0.036407470703125, 0.0386962890625, 0.040985107421875, 0.04327392578125, 0.045562744140625, 0.0478515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 11.0, 8.0, 7.0, 14.0, 27.0, 37.0, 42.0, 66.0, 103.0, 192.0, 430.0, 1352.0, 9728.0, 429059.0, 593820.0, 11307.0, 1389.0, 416.0, 192.0, 108.0, 61.0, 52.0, 34.0, 24.0, 21.0, 12.0, 9.0, 6.0, 4.0, 6.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2242431640625, -0.21491050720214844, -0.20557785034179688, -0.1962451934814453, -0.18691253662109375, -0.1775798797607422, -0.16824722290039062, -0.15891456604003906, -0.1495819091796875, -0.14024925231933594, -0.13091659545898438, -0.12158393859863281, -0.11225128173828125, -0.10291862487792969, -0.09358596801757812, -0.08425331115722656, -0.074920654296875, -0.06558799743652344, -0.056255340576171875, -0.04692268371582031, -0.03759002685546875, -0.028257369995117188, -0.018924713134765625, -0.009592056274414062, -0.0002593994140625, 0.009073257446289062, 0.018405914306640625, 0.027738571166992188, 0.03707122802734375, 0.04640388488769531, 0.055736541748046875, 0.06506919860839844, 0.07440185546875, 0.08373451232910156, 0.09306716918945312, 0.10239982604980469, 0.11173248291015625, 0.12106513977050781, 0.13039779663085938, 0.13973045349121094, 0.1490631103515625, 0.15839576721191406, 0.16772842407226562, 0.1770610809326172, 0.18639373779296875, 0.1957263946533203, 0.20505905151367188, 0.21439170837402344, 0.223724365234375, 0.23305702209472656, 0.24238967895507812, 0.2517223358154297, 0.26105499267578125, 0.2703876495361328, 0.2797203063964844, 0.28905296325683594, 0.2983856201171875, 0.30771827697753906, 0.3170509338378906, 0.3263835906982422, 0.33571624755859375, 0.3450489044189453, 0.3543815612792969, 0.36371421813964844, 0.373046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 9.0, 12.0, 21.0, 28.0, 30.0, 29.0, 42.0, 42.0, 47.0, 61.0, 55.0, 64.0, 66.0, 63.0, 58.0, 56.0, 52.0, 37.0, 39.0, 36.0, 28.0, 24.0, 17.0, 19.0, 7.0, 6.0, 8.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.12678146362304688, -0.12136077880859375, -0.11594009399414062, -0.1105194091796875, -0.10509872436523438, -0.09967803955078125, -0.09425735473632812, -0.088836669921875, -0.08341598510742188, -0.07799530029296875, -0.07257461547851562, -0.0671539306640625, -0.061733245849609375, -0.05631256103515625, -0.050891876220703125, -0.04547119140625, -0.040050506591796875, -0.03462982177734375, -0.029209136962890625, -0.0237884521484375, -0.018367767333984375, -0.01294708251953125, -0.007526397705078125, -0.002105712890625, 0.003314971923828125, 0.00873565673828125, 0.014156341552734375, 0.0195770263671875, 0.024997711181640625, 0.03041839599609375, 0.035839080810546875, 0.041259765625, 0.046680450439453125, 0.05210113525390625, 0.057521820068359375, 0.0629425048828125, 0.06836318969726562, 0.07378387451171875, 0.07920455932617188, 0.084625244140625, 0.09004592895507812, 0.09546661376953125, 0.10088729858398438, 0.1063079833984375, 0.11172866821289062, 0.11714935302734375, 0.12257003784179688, 0.12799072265625, 0.13341140747070312, 0.13883209228515625, 0.14425277709960938, 0.1496734619140625, 0.15509414672851562, 0.16051483154296875, 0.16593551635742188, 0.171356201171875, 0.17677688598632812, 0.18219757080078125, 0.18761825561523438, 0.1930389404296875, 0.19845962524414062, 0.20388031005859375, 0.20930099487304688, 0.2147216796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 4.0, 6.0, 11.0, 7.0, 9.0, 22.0, 20.0, 27.0, 55.0, 71.0, 85.0, 146.0, 261.0, 517.0, 1180.0, 3201.0, 15077.0, 266594.0, 716736.0, 35876.0, 5324.0, 1685.0, 759.0, 319.0, 186.0, 110.0, 75.0, 39.0, 41.0, 23.0, 18.0, 17.0, 10.0, 7.0, 4.0, 9.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.045989990234375, -0.044644832611083984, -0.04329967498779297, -0.04195451736450195, -0.04060935974121094, -0.03926420211791992, -0.037919044494628906, -0.03657388687133789, -0.035228729248046875, -0.03388357162475586, -0.032538414001464844, -0.031193256378173828, -0.029848098754882812, -0.028502941131591797, -0.02715778350830078, -0.025812625885009766, -0.02446746826171875, -0.023122310638427734, -0.02177715301513672, -0.020431995391845703, -0.019086837768554688, -0.017741680145263672, -0.016396522521972656, -0.01505136489868164, -0.013706207275390625, -0.01236104965209961, -0.011015892028808594, -0.009670734405517578, -0.008325576782226562, -0.006980419158935547, -0.005635261535644531, -0.004290103912353516, -0.0029449462890625, -0.0015997886657714844, -0.00025463104248046875, 0.0010905265808105469, 0.0024356842041015625, 0.003780841827392578, 0.005125999450683594, 0.006471157073974609, 0.007816314697265625, 0.00916147232055664, 0.010506629943847656, 0.011851787567138672, 0.013196945190429688, 0.014542102813720703, 0.01588726043701172, 0.017232418060302734, 0.01857757568359375, 0.019922733306884766, 0.02126789093017578, 0.022613048553466797, 0.023958206176757812, 0.025303363800048828, 0.026648521423339844, 0.02799367904663086, 0.029338836669921875, 0.03068399429321289, 0.032029151916503906, 0.03337430953979492, 0.03471946716308594, 0.03606462478637695, 0.03740978240966797, 0.038754940032958984, 0.04010009765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 5.0, 2.0, 4.0, 3.0, 8.0, 5.0, 10.0, 29.0, 27.0, 20.0, 38.0, 55.0, 50.0, 61.0, 101.0, 75.0, 68.0, 85.0, 94.0, 71.0, 43.0, 47.0, 24.0, 16.0, 24.0, 10.0, 11.0, 3.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-06, -8.624978363513947e-06, -8.36886465549469e-06, -8.112750947475433e-06, -7.856637239456177e-06, -7.60052353143692e-06, -7.3444098234176636e-06, -7.088296115398407e-06, -6.83218240737915e-06, -6.576068699359894e-06, -6.319954991340637e-06, -6.063841283321381e-06, -5.807727575302124e-06, -5.5516138672828674e-06, -5.295500159263611e-06, -5.039386451244354e-06, -4.783272743225098e-06, -4.527159035205841e-06, -4.2710453271865845e-06, -4.014931619167328e-06, -3.7588179111480713e-06, -3.5027042031288147e-06, -3.246590495109558e-06, -2.9904767870903015e-06, -2.734363079071045e-06, -2.4782493710517883e-06, -2.2221356630325317e-06, -1.966021955013275e-06, -1.7099082469940186e-06, -1.453794538974762e-06, -1.1976808309555054e-06, -9.415671229362488e-07, -6.854534149169922e-07, -4.293397068977356e-07, -1.73225998878479e-07, 8.288770914077759e-08, 3.390014171600342e-07, 5.951151251792908e-07, 8.512288331985474e-07, 1.107342541217804e-06, 1.3634562492370605e-06, 1.6195699572563171e-06, 1.8756836652755737e-06, 2.1317973732948303e-06, 2.387911081314087e-06, 2.6440247893333435e-06, 2.9001384973526e-06, 3.1562522053718567e-06, 3.4123659133911133e-06, 3.66847962141037e-06, 3.9245933294296265e-06, 4.180707037448883e-06, 4.43682074546814e-06, 4.692934453487396e-06, 4.949048161506653e-06, 5.2051618695259094e-06, 5.461275577545166e-06, 5.717389285564423e-06, 5.973502993583679e-06, 6.229616701602936e-06, 6.485730409622192e-06, 6.741844117641449e-06, 6.9979578256607056e-06, 7.254071533679962e-06, 7.510185241699219e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 22.0, 26.0, 57.0, 90.0, 175.0, 488.0, 1904.0, 21887.0, 942870.0, 76359.0, 3491.0, 667.0, 234.0, 117.0, 52.0, 44.0, 18.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07110595703125, -0.06878662109375, -0.06646728515625, -0.06414794921875, -0.06182861328125, -0.05950927734375, -0.05718994140625, -0.05487060546875, -0.05255126953125, -0.05023193359375, -0.04791259765625, -0.04559326171875, -0.04327392578125, -0.04095458984375, -0.03863525390625, -0.03631591796875, -0.03399658203125, -0.03167724609375, -0.02935791015625, -0.02703857421875, -0.02471923828125, -0.02239990234375, -0.02008056640625, -0.01776123046875, -0.01544189453125, -0.01312255859375, -0.01080322265625, -0.00848388671875, -0.00616455078125, -0.00384521484375, -0.00152587890625, 0.00079345703125, 0.00311279296875, 0.00543212890625, 0.00775146484375, 0.01007080078125, 0.01239013671875, 0.01470947265625, 0.01702880859375, 0.01934814453125, 0.02166748046875, 0.02398681640625, 0.02630615234375, 0.02862548828125, 0.03094482421875, 0.03326416015625, 0.03558349609375, 0.03790283203125, 0.04022216796875, 0.04254150390625, 0.04486083984375, 0.04718017578125, 0.04949951171875, 0.05181884765625, 0.05413818359375, 0.05645751953125, 0.05877685546875, 0.06109619140625, 0.06341552734375, 0.06573486328125, 0.06805419921875, 0.07037353515625, 0.07269287109375, 0.07501220703125, 0.07733154296875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 8.0, 9.0, 18.0, 16.0, 26.0, 43.0, 52.0, 83.0, 91.0, 154.0, 142.0, 98.0, 72.0, 51.0, 47.0, 15.0, 12.0, 18.0, 9.0, 5.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.043548583984375, -0.042305946350097656, -0.04106330871582031, -0.03982067108154297, -0.038578033447265625, -0.03733539581298828, -0.03609275817871094, -0.034850120544433594, -0.03360748291015625, -0.032364845275878906, -0.031122207641601562, -0.02987957000732422, -0.028636932373046875, -0.02739429473876953, -0.026151657104492188, -0.024909019470214844, -0.0236663818359375, -0.022423744201660156, -0.021181106567382812, -0.01993846893310547, -0.018695831298828125, -0.01745319366455078, -0.016210556030273438, -0.014967918395996094, -0.01372528076171875, -0.012482643127441406, -0.011240005493164062, -0.009997367858886719, -0.008754730224609375, -0.007512092590332031, -0.0062694549560546875, -0.005026817321777344, -0.0037841796875, -0.0025415420532226562, -0.0012989044189453125, -5.626678466796875e-05, 0.001186370849609375, 0.0024290084838867188, 0.0036716461181640625, 0.004914283752441406, 0.00615692138671875, 0.007399559020996094, 0.008642196655273438, 0.009884834289550781, 0.011127471923828125, 0.012370109558105469, 0.013612747192382812, 0.014855384826660156, 0.0160980224609375, 0.017340660095214844, 0.018583297729492188, 0.01982593536376953, 0.021068572998046875, 0.02231121063232422, 0.023553848266601562, 0.024796485900878906, 0.02603912353515625, 0.027281761169433594, 0.028524398803710938, 0.02976703643798828, 0.031009674072265625, 0.03225231170654297, 0.03349494934082031, 0.034737586975097656, 0.035980224609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 16.0, 763.0, 220.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.093675136566162, -2.9450550079345703, -2.7964348793029785, -2.6478145122528076, -2.499194383621216, -2.350574254989624, -2.201953887939453, -2.0533337593078613, -1.9047136306762695, -1.7560935020446777, -1.6074732542037964, -1.458853006362915, -1.3102328777313232, -1.1616127490997314, -1.01299250125885, -0.8643722534179688, -0.715752124786377, -0.5671319365501404, -0.4185117483139038, -0.26989156007766724, -0.12127137184143066, 0.027348816394805908, 0.17596900463104248, 0.32458925247192383, 0.4732093811035156, 0.6218295693397522, 0.7704497575759888, 0.9190699458122253, 1.067690134048462, 1.2163102626800537, 1.364930510520935, 1.5135507583618164, 1.66217041015625, 1.8107905387878418, 1.9594107866287231, 2.1080310344696045, 2.2566511631011963, 2.405271291732788, 2.553891658782959, 2.702511787414551, 2.8511319160461426, 2.9997520446777344, 3.148372173309326, 3.296992540359497, 3.445612668991089, 3.5942327976226807, 3.7428531646728516, 3.8914732933044434, 4.040093421936035, 4.188713550567627, 4.337333679199219, 4.4859538078308105, 4.634573936462402, 4.783194541931152, 4.931814670562744, 5.080434799194336, 5.229054927825928, 5.3776750564575195, 5.526295185089111, 5.674915313720703, 5.823535919189453, 5.972156047821045, 6.120776176452637, 6.2693963050842285, 6.41801643371582]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 11.0, 6.0, 11.0, 22.0, 23.0, 30.0, 29.0, 35.0, 49.0, 53.0, 56.0, 68.0, 69.0, 79.0, 75.0, 65.0, 34.0, 59.0, 52.0, 38.0, 35.0, 23.0, 21.0, 16.0, 14.0, 7.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9592798948287964, -0.9282735586166382, -0.8972671627998352, -0.866260826587677, -0.8352544903755188, -0.8042480945587158, -0.7732417583465576, -0.7422354221343994, -0.7112290859222412, -0.680222749710083, -0.64921635389328, -0.6182100176811218, -0.5872036814689636, -0.5561972856521606, -0.5251909494400024, -0.49418461322784424, -0.46317824721336365, -0.43217188119888306, -0.40116554498672485, -0.37015917897224426, -0.33915284276008606, -0.30814647674560547, -0.27714014053344727, -0.24613377451896667, -0.21512742340564728, -0.18412107229232788, -0.15311472117900848, -0.12210836261510849, -0.09110201150178909, -0.0600956529378891, -0.029089301824569702, 0.0019170492887496948, 0.03292340040206909, 0.06392975151538849, 0.09493610262870789, 0.12594246864318848, 0.15694880485534668, 0.18795517086982727, 0.21896152198314667, 0.24996787309646606, 0.28097420930862427, 0.31198057532310486, 0.34298691153526306, 0.37399327754974365, 0.40499961376190186, 0.43600597977638245, 0.46701234579086304, 0.49801868200302124, 0.5290250778198242, 0.5600314140319824, 0.5910378098487854, 0.6220441460609436, 0.6530504822731018, 0.6840568780899048, 0.715063214302063, 0.7460695505142212, 0.7770758867263794, 0.8080822229385376, 0.8390886187553406, 0.8700949549674988, 0.901101291179657, 0.93210768699646, 0.9631140232086182, 0.9941203594207764, 1.0251266956329346]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 15.0, 26.0, 32.0, 50.0, 62.0, 118.0, 226.0, 387.0, 985.0, 3566.0, 31126.0, 4068856.0, 82217.0, 5036.0, 1003.0, 278.0, 137.0, 67.0, 42.0, 15.0, 14.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.522125244140625, -0.50958251953125, -0.497039794921875, -0.4844970703125, -0.471954345703125, -0.45941162109375, -0.446868896484375, -0.434326171875, -0.421783447265625, -0.40924072265625, -0.396697998046875, -0.3841552734375, -0.371612548828125, -0.35906982421875, -0.346527099609375, -0.333984375, -0.321441650390625, -0.30889892578125, -0.296356201171875, -0.2838134765625, -0.271270751953125, -0.25872802734375, -0.246185302734375, -0.233642578125, -0.221099853515625, -0.20855712890625, -0.196014404296875, -0.1834716796875, -0.170928955078125, -0.15838623046875, -0.145843505859375, -0.13330078125, -0.120758056640625, -0.10821533203125, -0.095672607421875, -0.0831298828125, -0.070587158203125, -0.05804443359375, -0.045501708984375, -0.032958984375, -0.020416259765625, -0.00787353515625, 0.004669189453125, 0.0172119140625, 0.029754638671875, 0.04229736328125, 0.054840087890625, 0.0673828125, 0.079925537109375, 0.09246826171875, 0.105010986328125, 0.1175537109375, 0.130096435546875, 0.14263916015625, 0.155181884765625, 0.167724609375, 0.180267333984375, 0.19281005859375, 0.205352783203125, 0.2178955078125, 0.230438232421875, 0.24298095703125, 0.255523681640625, 0.26806640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 11.0, 13.0, 26.0, 47.0, 56.0, 90.0, 111.0, 114.0, 103.0, 108.0, 100.0, 72.0, 47.0, 36.0, 31.0, 11.0, 14.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09659147262573242, -0.09430599212646484, -0.09202051162719727, -0.08973503112792969, -0.08744955062866211, -0.08516407012939453, -0.08287858963012695, -0.08059310913085938, -0.0783076286315918, -0.07602214813232422, -0.07373666763305664, -0.07145118713378906, -0.06916570663452148, -0.0668802261352539, -0.06459474563598633, -0.06230926513671875, -0.06002378463745117, -0.057738304138183594, -0.055452823638916016, -0.05316734313964844, -0.05088186264038086, -0.04859638214111328, -0.0463109016418457, -0.044025421142578125, -0.04173994064331055, -0.03945446014404297, -0.03716897964477539, -0.03488349914550781, -0.032598018646240234, -0.030312538146972656, -0.028027057647705078, -0.0257415771484375, -0.023456096649169922, -0.021170616149902344, -0.018885135650634766, -0.016599655151367188, -0.01431417465209961, -0.012028694152832031, -0.009743213653564453, -0.007457733154296875, -0.005172252655029297, -0.0028867721557617188, -0.0006012916564941406, 0.0016841888427734375, 0.003969669342041016, 0.006255149841308594, 0.008540630340576172, 0.01082611083984375, 0.013111591339111328, 0.015397071838378906, 0.017682552337646484, 0.019968032836914062, 0.02225351333618164, 0.02453899383544922, 0.026824474334716797, 0.029109954833984375, 0.03139543533325195, 0.03368091583251953, 0.03596639633178711, 0.03825187683105469, 0.040537357330322266, 0.042822837829589844, 0.04510831832885742, 0.047393798828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 9.0, 26.0, 59.0, 214.0, 2972.0, 4190312.0, 390.0, 158.0, 79.0, 34.0, 18.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.494140625, -1.395599365234375, -1.29705810546875, -1.198516845703125, -1.0999755859375, -1.001434326171875, -0.90289306640625, -0.804351806640625, -0.705810546875, -0.607269287109375, -0.50872802734375, -0.410186767578125, -0.3116455078125, -0.213104248046875, -0.11456298828125, -0.016021728515625, 0.08251953125, 0.181060791015625, 0.27960205078125, 0.378143310546875, 0.4766845703125, 0.575225830078125, 0.67376708984375, 0.772308349609375, 0.870849609375, 0.969390869140625, 1.06793212890625, 1.166473388671875, 1.2650146484375, 1.363555908203125, 1.46209716796875, 1.560638427734375, 1.6591796875, 1.757720947265625, 1.85626220703125, 1.954803466796875, 2.0533447265625, 2.151885986328125, 2.25042724609375, 2.348968505859375, 2.447509765625, 2.546051025390625, 2.64459228515625, 2.743133544921875, 2.8416748046875, 2.940216064453125, 3.03875732421875, 3.137298583984375, 3.23583984375, 3.334381103515625, 3.43292236328125, 3.531463623046875, 3.6300048828125, 3.728546142578125, 3.82708740234375, 3.925628662109375, 4.024169921875, 4.122711181640625, 4.22125244140625, 4.319793701171875, 4.4183349609375, 4.516876220703125, 4.61541748046875, 4.713958740234375, 4.8125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 21.0, 3291.0, 758.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.22562408447265625, -0.2105255126953125, -0.19542694091796875, -0.180328369140625, -0.16522979736328125, -0.1501312255859375, -0.13503265380859375, -0.11993408203125, -0.10483551025390625, -0.0897369384765625, -0.07463836669921875, -0.059539794921875, -0.04444122314453125, -0.0293426513671875, -0.01424407958984375, 0.0008544921875, 0.01595306396484375, 0.0310516357421875, 0.04615020751953125, 0.061248779296875, 0.07634735107421875, 0.0914459228515625, 0.10654449462890625, 0.12164306640625, 0.13674163818359375, 0.1518402099609375, 0.16693878173828125, 0.182037353515625, 0.19713592529296875, 0.2122344970703125, 0.22733306884765625, 0.242431640625, 0.25753021240234375, 0.2726287841796875, 0.28772735595703125, 0.302825927734375, 0.31792449951171875, 0.3330230712890625, 0.34812164306640625, 0.36322021484375, 0.37831878662109375, 0.3934173583984375, 0.40851593017578125, 0.423614501953125, 0.43871307373046875, 0.4538116455078125, 0.46891021728515625, 0.4840087890625, 0.49910736083984375, 0.5142059326171875, 0.5293045043945312, 0.544403076171875, 0.5595016479492188, 0.5746002197265625, 0.5896987915039062, 0.60479736328125, 0.6198959350585938, 0.6349945068359375, 0.6500930786132812, 0.665191650390625, 0.6802902221679688, 0.6953887939453125, 0.7104873657226562, 0.7255859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1003.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.780282020568848, -15.463200569152832, -15.146119117736816, -14.829036712646484, -14.511955261230469, -14.194873809814453, -13.877792358398438, -13.560710906982422, -13.243629455566406, -12.92654800415039, -12.609466552734375, -12.292384147644043, -11.975302696228027, -11.658221244812012, -11.341139793395996, -11.02405834197998, -10.706975936889648, -10.389894485473633, -10.072813034057617, -9.755730628967285, -9.43864917755127, -9.121567726135254, -8.804486274719238, -8.487404823303223, -8.17032241821289, -7.853240966796875, -7.536159038543701, -7.2190775871276855, -6.901995658874512, -6.584914207458496, -6.2678327560424805, -5.950751304626465, -5.633669853210449, -5.316588401794434, -4.99950647354126, -4.682425022125244, -4.36534309387207, -4.048261642456055, -3.731180191040039, -3.4140985012054443, -3.0970168113708496, -2.779935121536255, -2.46285343170166, -2.1457719802856445, -1.8286902904510498, -1.511608600616455, -1.19452702999115, -0.8774454593658447, -0.56036376953125, -0.24328213930130005, 0.0737994909286499, 0.39088112115859985, 0.7079627513885498, 1.0250444412231445, 1.3421260118484497, 1.6592075824737549, 1.9762892723083496, 2.2933709621429443, 2.610452651977539, 2.9275341033935547, 3.2446157932281494, 3.561697483062744, 3.8787789344787598, 4.195860862731934, 4.512942314147949]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 27.0, 64.0, 104.0, 144.0, 170.0, 163.0, 138.0, 94.0, 52.0, 21.0, 12.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0589741468429565, -1.0310814380645752, -1.0031887292861938, -0.9752960205078125, -0.9474033117294312, -0.9195106029510498, -0.8916178941726685, -0.8637251853942871, -0.8358324766159058, -0.8079397678375244, -0.7800470590591431, -0.7521543502807617, -0.7242616415023804, -0.696368932723999, -0.6684762239456177, -0.6405835151672363, -0.6126908659934998, -0.5847981572151184, -0.5569054484367371, -0.5290127396583557, -0.5011200308799744, -0.473227322101593, -0.44533464312553406, -0.4174419343471527, -0.38954922556877136, -0.36165651679039, -0.33376380801200867, -0.3058711290359497, -0.27797842025756836, -0.250085711479187, -0.22219300270080566, -0.19430029392242432, -0.1664075255393982, -0.13851481676101685, -0.1106221154332161, -0.08272941410541534, -0.054836705327034, -0.02694399654865265, 0.0009486973285675049, 0.028841406106948853, 0.0567341148853302, 0.08462682366371155, 0.1125195249915123, 0.14041222631931305, 0.1683049350976944, 0.19619764387607574, 0.2240903377532959, 0.25198304653167725, 0.2798757553100586, 0.30776846408843994, 0.3356611728668213, 0.36355388164520264, 0.391446590423584, 0.41933929920196533, 0.4472319781780243, 0.47512468695640564, 0.5030174255371094, 0.5309101343154907, 0.5588028430938721, 0.5866955518722534, 0.6145882606506348, 0.6424809694290161, 0.6703736782073975, 0.6982663869857788, 0.7261590361595154]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 3.0, 6.0, 9.0, 7.0, 20.0, 14.0, 19.0, 32.0, 41.0, 48.0, 84.0, 108.0, 162.0, 227.0, 370.0, 626.0, 1102.0, 2324.0, 5727.0, 17380.0, 67467.0, 404406.0, 445723.0, 72529.0, 18538.0, 5982.0, 2556.0, 1209.0, 673.0, 369.0, 249.0, 176.0, 118.0, 69.0, 46.0, 40.0, 23.0, 18.0, 11.0, 10.0, 7.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 4.0], "bins": [-0.1290283203125, -0.12563514709472656, -0.12224197387695312, -0.11884880065917969, -0.11545562744140625, -0.11206245422363281, -0.10866928100585938, -0.10527610778808594, -0.1018829345703125, -0.09848976135253906, -0.09509658813476562, -0.09170341491699219, -0.08831024169921875, -0.08491706848144531, -0.08152389526367188, -0.07813072204589844, -0.074737548828125, -0.07134437561035156, -0.06795120239257812, -0.06455802917480469, -0.06116485595703125, -0.05777168273925781, -0.054378509521484375, -0.05098533630371094, -0.0475921630859375, -0.04419898986816406, -0.040805816650390625, -0.03741264343261719, -0.03401947021484375, -0.030626296997070312, -0.027233123779296875, -0.023839950561523438, -0.02044677734375, -0.017053604125976562, -0.013660430908203125, -0.010267257690429688, -0.00687408447265625, -0.0034809112548828125, -8.7738037109375e-05, 0.0033054351806640625, 0.0066986083984375, 0.010091781616210938, 0.013484954833984375, 0.016878128051757812, 0.02027130126953125, 0.023664474487304688, 0.027057647705078125, 0.030450820922851562, 0.033843994140625, 0.03723716735839844, 0.040630340576171875, 0.04402351379394531, 0.04741668701171875, 0.05080986022949219, 0.054203033447265625, 0.05759620666503906, 0.0609893798828125, 0.06438255310058594, 0.06777572631835938, 0.07116889953613281, 0.07456207275390625, 0.07795524597167969, 0.08134841918945312, 0.08474159240722656, 0.088134765625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 22.0, 26.0, 35.0, 43.0, 56.0, 65.0, 90.0, 97.0, 98.0, 74.0, 91.0, 67.0, 60.0, 52.0, 41.0, 26.0, 15.0, 9.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06707763671875, -0.06546163558959961, -0.06384563446044922, -0.06222963333129883, -0.06061363220214844, -0.05899763107299805, -0.057381629943847656, -0.055765628814697266, -0.054149627685546875, -0.052533626556396484, -0.050917625427246094, -0.0493016242980957, -0.04768562316894531, -0.04606962203979492, -0.04445362091064453, -0.04283761978149414, -0.04122161865234375, -0.03960561752319336, -0.03798961639404297, -0.03637361526489258, -0.03475761413574219, -0.0331416130065918, -0.031525611877441406, -0.029909610748291016, -0.028293609619140625, -0.026677608489990234, -0.025061607360839844, -0.023445606231689453, -0.021829605102539062, -0.020213603973388672, -0.01859760284423828, -0.01698160171508789, -0.0153656005859375, -0.01374959945678711, -0.012133598327636719, -0.010517597198486328, -0.008901596069335938, -0.007285594940185547, -0.005669593811035156, -0.004053592681884766, -0.002437591552734375, -0.0008215904235839844, 0.0007944107055664062, 0.002410411834716797, 0.0040264129638671875, 0.005642414093017578, 0.007258415222167969, 0.00887441635131836, 0.01049041748046875, 0.01210641860961914, 0.013722419738769531, 0.015338420867919922, 0.016954421997070312, 0.018570423126220703, 0.020186424255371094, 0.021802425384521484, 0.023418426513671875, 0.025034427642822266, 0.026650428771972656, 0.028266429901123047, 0.029882431030273438, 0.03149843215942383, 0.03311443328857422, 0.03473043441772461, 0.036346435546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 11.0, 7.0, 14.0, 20.0, 34.0, 57.0, 82.0, 174.0, 388.0, 1094.0, 6342.0, 186578.0, 836624.0, 14236.0, 1888.0, 522.0, 203.0, 97.0, 62.0, 38.0, 25.0, 22.0, 12.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.382568359375, -0.3732738494873047, -0.3639793395996094, -0.35468482971191406, -0.34539031982421875, -0.33609580993652344, -0.3268013000488281, -0.3175067901611328, -0.3082122802734375, -0.2989177703857422, -0.2896232604980469, -0.28032875061035156, -0.27103424072265625, -0.26173973083496094, -0.2524452209472656, -0.2431507110595703, -0.233856201171875, -0.2245616912841797, -0.21526718139648438, -0.20597267150878906, -0.19667816162109375, -0.18738365173339844, -0.17808914184570312, -0.1687946319580078, -0.1595001220703125, -0.1502056121826172, -0.14091110229492188, -0.13161659240722656, -0.12232208251953125, -0.11302757263183594, -0.10373306274414062, -0.09443855285644531, -0.08514404296875, -0.07584953308105469, -0.06655502319335938, -0.05726051330566406, -0.04796600341796875, -0.03867149353027344, -0.029376983642578125, -0.020082473754882812, -0.0107879638671875, -0.0014934539794921875, 0.007801055908203125, 0.017095565795898438, 0.02639007568359375, 0.03568458557128906, 0.044979095458984375, 0.05427360534667969, 0.063568115234375, 0.07286262512207031, 0.08215713500976562, 0.09145164489746094, 0.10074615478515625, 0.11004066467285156, 0.11933517456054688, 0.1286296844482422, 0.1379241943359375, 0.1472187042236328, 0.15651321411132812, 0.16580772399902344, 0.17510223388671875, 0.18439674377441406, 0.19369125366210938, 0.2029857635498047, 0.2122802734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 12.0, 11.0, 18.0, 19.0, 36.0, 32.0, 45.0, 67.0, 67.0, 86.0, 83.0, 94.0, 86.0, 81.0, 66.0, 55.0, 32.0, 21.0, 23.0, 15.0, 15.0, 9.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.276611328125, -0.26987457275390625, -0.2631378173828125, -0.25640106201171875, -0.249664306640625, -0.24292755126953125, -0.2361907958984375, -0.22945404052734375, -0.22271728515625, -0.21598052978515625, -0.2092437744140625, -0.20250701904296875, -0.195770263671875, -0.18903350830078125, -0.1822967529296875, -0.17555999755859375, -0.1688232421875, -0.16208648681640625, -0.1553497314453125, -0.14861297607421875, -0.141876220703125, -0.13513946533203125, -0.1284027099609375, -0.12166595458984375, -0.11492919921875, -0.10819244384765625, -0.1014556884765625, -0.09471893310546875, -0.087982177734375, -0.08124542236328125, -0.0745086669921875, -0.06777191162109375, -0.06103515625, -0.05429840087890625, -0.0475616455078125, -0.04082489013671875, -0.034088134765625, -0.02735137939453125, -0.0206146240234375, -0.01387786865234375, -0.00714111328125, -0.00040435791015625, 0.0063323974609375, 0.01306915283203125, 0.019805908203125, 0.02654266357421875, 0.0332794189453125, 0.04001617431640625, 0.0467529296875, 0.05348968505859375, 0.0602264404296875, 0.06696319580078125, 0.073699951171875, 0.08043670654296875, 0.0871734619140625, 0.09391021728515625, 0.10064697265625, 0.10738372802734375, 0.1141204833984375, 0.12085723876953125, 0.127593994140625, 0.13433074951171875, 0.1410675048828125, 0.14780426025390625, 0.154541015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 18.0, 34.0, 34.0, 67.0, 125.0, 233.0, 703.0, 2328.0, 15547.0, 819672.0, 200264.0, 7176.0, 1486.0, 451.0, 187.0, 83.0, 62.0, 20.0, 14.0, 17.0, 9.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0394287109375, -0.037535667419433594, -0.03564262390136719, -0.03374958038330078, -0.031856536865234375, -0.02996349334716797, -0.028070449829101562, -0.026177406311035156, -0.02428436279296875, -0.022391319274902344, -0.020498275756835938, -0.01860523223876953, -0.016712188720703125, -0.014819145202636719, -0.012926101684570312, -0.011033058166503906, -0.0091400146484375, -0.007246971130371094, -0.0053539276123046875, -0.0034608840942382812, -0.001567840576171875, 0.00032520294189453125, 0.0022182464599609375, 0.004111289978027344, 0.00600433349609375, 0.007897377014160156, 0.009790420532226562, 0.011683464050292969, 0.013576507568359375, 0.015469551086425781, 0.017362594604492188, 0.019255638122558594, 0.021148681640625, 0.023041725158691406, 0.024934768676757812, 0.02682781219482422, 0.028720855712890625, 0.03061389923095703, 0.03250694274902344, 0.034399986267089844, 0.03629302978515625, 0.038186073303222656, 0.04007911682128906, 0.04197216033935547, 0.043865203857421875, 0.04575824737548828, 0.04765129089355469, 0.049544334411621094, 0.0514373779296875, 0.053330421447753906, 0.05522346496582031, 0.05711650848388672, 0.059009552001953125, 0.06090259552001953, 0.06279563903808594, 0.06468868255615234, 0.06658172607421875, 0.06847476959228516, 0.07036781311035156, 0.07226085662841797, 0.07415390014648438, 0.07604694366455078, 0.07793998718261719, 0.0798330307006836, 0.08172607421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 12.0, 10.0, 14.0, 7.0, 18.0, 17.0, 33.0, 36.0, 29.0, 46.0, 57.0, 54.0, 57.0, 68.0, 66.0, 62.0, 60.0, 61.0, 45.0, 48.0, 39.0, 40.0, 38.0, 13.0, 22.0, 5.0, 11.0, 9.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.5923516154289246e-06, -4.416331648826599e-06, -4.240311682224274e-06, -4.064291715621948e-06, -3.888271749019623e-06, -3.7122517824172974e-06, -3.536231815814972e-06, -3.3602118492126465e-06, -3.184191882610321e-06, -3.0081719160079956e-06, -2.83215194940567e-06, -2.6561319828033447e-06, -2.4801120162010193e-06, -2.304092049598694e-06, -2.1280720829963684e-06, -1.952052116394043e-06, -1.7760321497917175e-06, -1.600012183189392e-06, -1.4239922165870667e-06, -1.2479722499847412e-06, -1.0719522833824158e-06, -8.959323167800903e-07, -7.199123501777649e-07, -5.438923835754395e-07, -3.67872416973114e-07, -1.9185245037078857e-07, -1.5832483768463135e-08, 1.601874828338623e-07, 3.3620744943618774e-07, 5.122274160385132e-07, 6.882473826408386e-07, 8.642673492431641e-07, 1.0402873158454895e-06, 1.216307282447815e-06, 1.3923272490501404e-06, 1.5683472156524658e-06, 1.7443671822547913e-06, 1.9203871488571167e-06, 2.096407115459442e-06, 2.2724270820617676e-06, 2.448447048664093e-06, 2.6244670152664185e-06, 2.800486981868744e-06, 2.9765069484710693e-06, 3.1525269150733948e-06, 3.3285468816757202e-06, 3.5045668482780457e-06, 3.680586814880371e-06, 3.8566067814826965e-06, 4.032626748085022e-06, 4.208646714687347e-06, 4.384666681289673e-06, 4.560686647891998e-06, 4.736706614494324e-06, 4.912726581096649e-06, 5.088746547698975e-06, 5.2647665143013e-06, 5.4407864809036255e-06, 5.616806447505951e-06, 5.792826414108276e-06, 5.968846380710602e-06, 6.144866347312927e-06, 6.320886313915253e-06, 6.496906280517578e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 12.0, 24.0, 40.0, 63.0, 219.0, 670.0, 3025.0, 76237.0, 951221.0, 14802.0, 1502.0, 427.0, 159.0, 58.0, 31.0, 18.0, 5.0, 11.0, 10.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07464599609375, -0.07240486145019531, -0.07016372680664062, -0.06792259216308594, -0.06568145751953125, -0.06344032287597656, -0.061199188232421875, -0.05895805358886719, -0.0567169189453125, -0.05447578430175781, -0.052234649658203125, -0.04999351501464844, -0.04775238037109375, -0.04551124572753906, -0.043270111083984375, -0.04102897644042969, -0.038787841796875, -0.03654670715332031, -0.034305572509765625, -0.03206443786621094, -0.02982330322265625, -0.027582168579101562, -0.025341033935546875, -0.023099899291992188, -0.0208587646484375, -0.018617630004882812, -0.016376495361328125, -0.014135360717773438, -0.01189422607421875, -0.009653091430664062, -0.007411956787109375, -0.0051708221435546875, -0.0029296875, -0.0006885528564453125, 0.001552581787109375, 0.0037937164306640625, 0.00603485107421875, 0.008275985717773438, 0.010517120361328125, 0.012758255004882812, 0.0149993896484375, 0.017240524291992188, 0.019481658935546875, 0.021722793579101562, 0.02396392822265625, 0.026205062866210938, 0.028446197509765625, 0.030687332153320312, 0.032928466796875, 0.03516960144042969, 0.037410736083984375, 0.03965187072753906, 0.04189300537109375, 0.04413414001464844, 0.046375274658203125, 0.04861640930175781, 0.0508575439453125, 0.05309867858886719, 0.055339813232421875, 0.05758094787597656, 0.05982208251953125, 0.06206321716308594, 0.06430435180664062, 0.06654548645019531, 0.06878662109375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 4.0, 5.0, 5.0, 10.0, 32.0, 49.0, 95.0, 147.0, 214.0, 180.0, 115.0, 59.0, 29.0, 16.0, 17.0, 10.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05224609375, -0.05059480667114258, -0.048943519592285156, -0.047292232513427734, -0.04564094543457031, -0.04398965835571289, -0.04233837127685547, -0.04068708419799805, -0.039035797119140625, -0.0373845100402832, -0.03573322296142578, -0.03408193588256836, -0.03243064880371094, -0.030779361724853516, -0.029128074645996094, -0.027476787567138672, -0.02582550048828125, -0.024174213409423828, -0.022522926330566406, -0.020871639251708984, -0.019220352172851562, -0.01756906509399414, -0.01591777801513672, -0.014266490936279297, -0.012615203857421875, -0.010963916778564453, -0.009312629699707031, -0.007661342620849609, -0.0060100555419921875, -0.004358768463134766, -0.0027074813842773438, -0.0010561943054199219, 0.0005950927734375, 0.002246379852294922, 0.0038976669311523438, 0.005548954010009766, 0.0072002410888671875, 0.00885152816772461, 0.010502815246582031, 0.012154102325439453, 0.013805389404296875, 0.015456676483154297, 0.01710796356201172, 0.01875925064086914, 0.020410537719726562, 0.022061824798583984, 0.023713111877441406, 0.025364398956298828, 0.02701568603515625, 0.028666973114013672, 0.030318260192871094, 0.031969547271728516, 0.03362083435058594, 0.03527212142944336, 0.03692340850830078, 0.0385746955871582, 0.040225982666015625, 0.04187726974487305, 0.04352855682373047, 0.04517984390258789, 0.04683113098144531, 0.048482418060302734, 0.050133705139160156, 0.05178499221801758, 0.053436279296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 85.0, 775.0, 131.0, 8.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.115250587463379, -6.0091776847839355, -5.903104305267334, -5.797031402587891, -5.690958499908447, -5.584885120391846, -5.478812217712402, -5.372738838195801, -5.266665935516357, -5.160593032836914, -5.0545196533203125, -4.948446750640869, -4.842373847961426, -4.736300468444824, -4.630227565765381, -4.5241546630859375, -4.418081283569336, -4.312008380889893, -4.205935001373291, -4.099862098693848, -3.993788957595825, -3.8877158164978027, -3.7816429138183594, -3.675569772720337, -3.5694968700408936, -3.463423728942871, -3.3573508262634277, -3.2512776851654053, -3.145204544067383, -3.0391316413879395, -2.933058500289917, -2.8269853591918945, -2.720911979675293, -2.6148388385772705, -2.508765935897827, -2.4026927947998047, -2.2966196537017822, -2.1905465126037598, -2.0844736099243164, -1.978400468826294, -1.872327446937561, -1.7662544250488281, -1.6601812839508057, -1.5541082620620728, -1.4480351209640503, -1.3419620990753174, -1.235888957977295, -1.129815936088562, -1.023742914199829, -0.9176698327064514, -0.8115967512130737, -0.7055237293243408, -0.5994505882263184, -0.49337756633758545, -0.38730448484420776, -0.2812314033508301, -0.17515826225280762, -0.06908518821001053, 0.03698788583278656, 0.14306095242500305, 0.24913403391838074, 0.35520708560943604, 0.4612801671028137, 0.5673532485961914, 0.6734263300895691]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 8.0, 8.0, 24.0, 21.0, 26.0, 32.0, 28.0, 38.0, 59.0, 43.0, 49.0, 60.0, 45.0, 67.0, 52.0, 52.0, 51.0, 42.0, 48.0, 34.0, 40.0, 34.0, 23.0, 21.0, 20.0, 11.0, 17.0, 12.0, 3.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.936475396156311, -0.9110198616981506, -0.8855642676353455, -0.8601087331771851, -0.8346531391143799, -0.8091976046562195, -0.7837420701980591, -0.7582864761352539, -0.7328309416770935, -0.7073754072189331, -0.6819198131561279, -0.6564642786979675, -0.6310087442398071, -0.605553150177002, -0.5800976157188416, -0.5546420812606812, -0.529186487197876, -0.5037309527397156, -0.4782753586769104, -0.45281982421875, -0.4273642599582672, -0.4019086956977844, -0.376453161239624, -0.35099759697914124, -0.32554203271865845, -0.30008646845817566, -0.27463090419769287, -0.24917536973953247, -0.22371980547904968, -0.1982642412185669, -0.1728086918592453, -0.1473531424999237, -0.12189751863479614, -0.09644196182489395, -0.07098640501499176, -0.04553084820508957, -0.020075291395187378, 0.00538027286529541, 0.030835822224617004, 0.0562913715839386, 0.08174693584442139, 0.10720249265432358, 0.13265804946422577, 0.15811359882354736, 0.18356916308403015, 0.20902472734451294, 0.23448027670383453, 0.25993582606315613, 0.2853913903236389, 0.3108469545841217, 0.3363025188446045, 0.3617580533027649, 0.3872136175632477, 0.41266918182373047, 0.43812471628189087, 0.46358028054237366, 0.48903584480285645, 0.5144913792610168, 0.539946973323822, 0.5654025077819824, 0.5908581018447876, 0.616313636302948, 0.6417691707611084, 0.6672247648239136, 0.692680299282074]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 4.0, 5.0, 11.0, 4.0, 11.0, 27.0, 31.0, 40.0, 76.0, 95.0, 166.0, 306.0, 571.0, 1169.0, 2773.0, 9122.0, 61552.0, 3965713.0, 134100.0, 12811.0, 3263.0, 1249.0, 573.0, 274.0, 124.0, 72.0, 52.0, 26.0, 21.0, 11.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.317138671875, -0.30951881408691406, -0.3018989562988281, -0.2942790985107422, -0.28665924072265625, -0.2790393829345703, -0.2714195251464844, -0.26379966735839844, -0.2561798095703125, -0.24855995178222656, -0.24094009399414062, -0.2333202362060547, -0.22570037841796875, -0.2180805206298828, -0.21046066284179688, -0.20284080505371094, -0.195220947265625, -0.18760108947753906, -0.17998123168945312, -0.1723613739013672, -0.16474151611328125, -0.1571216583251953, -0.14950180053710938, -0.14188194274902344, -0.1342620849609375, -0.12664222717285156, -0.11902236938476562, -0.11140251159667969, -0.10378265380859375, -0.09616279602050781, -0.08854293823242188, -0.08092308044433594, -0.07330322265625, -0.06568336486816406, -0.058063507080078125, -0.05044364929199219, -0.04282379150390625, -0.03520393371582031, -0.027584075927734375, -0.019964218139648438, -0.0123443603515625, -0.0047245025634765625, 0.002895355224609375, 0.010515213012695312, 0.01813507080078125, 0.025754928588867188, 0.033374786376953125, 0.04099464416503906, 0.048614501953125, 0.05623435974121094, 0.06385421752929688, 0.07147407531738281, 0.07909393310546875, 0.08671379089355469, 0.09433364868164062, 0.10195350646972656, 0.1095733642578125, 0.11719322204589844, 0.12481307983398438, 0.1324329376220703, 0.14005279541015625, 0.1476726531982422, 0.15529251098632812, 0.16291236877441406, 0.1705322265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 13.0, 10.0, 26.0, 30.0, 31.0, 57.0, 60.0, 91.0, 95.0, 93.0, 76.0, 82.0, 79.0, 72.0, 60.0, 36.0, 24.0, 16.0, 21.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.064208984375, -0.06267261505126953, -0.06113624572753906, -0.059599876403808594, -0.058063507080078125, -0.056527137756347656, -0.05499076843261719, -0.05345439910888672, -0.05191802978515625, -0.05038166046142578, -0.04884529113769531, -0.047308921813964844, -0.045772552490234375, -0.044236183166503906, -0.04269981384277344, -0.04116344451904297, -0.0396270751953125, -0.03809070587158203, -0.03655433654785156, -0.035017967224121094, -0.033481597900390625, -0.031945228576660156, -0.030408859252929688, -0.02887248992919922, -0.02733612060546875, -0.02579975128173828, -0.024263381958007812, -0.022727012634277344, -0.021190643310546875, -0.019654273986816406, -0.018117904663085938, -0.01658153533935547, -0.015045166015625, -0.013508796691894531, -0.011972427368164062, -0.010436058044433594, -0.008899688720703125, -0.007363319396972656, -0.0058269500732421875, -0.004290580749511719, -0.00275421142578125, -0.0012178421020507812, 0.0003185272216796875, 0.0018548965454101562, 0.003391265869140625, 0.004927635192871094, 0.0064640045166015625, 0.008000373840332031, 0.0095367431640625, 0.011073112487792969, 0.012609481811523438, 0.014145851135253906, 0.015682220458984375, 0.017218589782714844, 0.018754959106445312, 0.02029132843017578, 0.02182769775390625, 0.02336406707763672, 0.024900436401367188, 0.026436805725097656, 0.027973175048828125, 0.029509544372558594, 0.031045913696289062, 0.03258228302001953, 0.03411865234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 13.0, 26.0, 52.0, 74.0, 123.0, 288.0, 593.0, 2086.0, 13840.0, 4104021.0, 67302.0, 4243.0, 958.0, 345.0, 127.0, 68.0, 39.0, 23.0, 17.0, 7.0, 10.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381103515625, -0.3698005676269531, -0.35849761962890625, -0.3471946716308594, -0.3358917236328125, -0.3245887756347656, -0.31328582763671875, -0.3019828796386719, -0.290679931640625, -0.2793769836425781, -0.26807403564453125, -0.2567710876464844, -0.2454681396484375, -0.23416519165039062, -0.22286224365234375, -0.21155929565429688, -0.20025634765625, -0.18895339965820312, -0.17765045166015625, -0.16634750366210938, -0.1550445556640625, -0.14374160766601562, -0.13243865966796875, -0.12113571166992188, -0.109832763671875, -0.09852981567382812, -0.08722686767578125, -0.07592391967773438, -0.0646209716796875, -0.053318023681640625, -0.04201507568359375, -0.030712127685546875, -0.0194091796875, -0.008106231689453125, 0.00319671630859375, 0.014499664306640625, 0.0258026123046875, 0.037105560302734375, 0.04840850830078125, 0.059711456298828125, 0.071014404296875, 0.08231735229492188, 0.09362030029296875, 0.10492324829101562, 0.1162261962890625, 0.12752914428710938, 0.13883209228515625, 0.15013504028320312, 0.16143798828125, 0.17274093627929688, 0.18404388427734375, 0.19534683227539062, 0.2066497802734375, 0.21795272827148438, 0.22925567626953125, 0.24055862426757812, 0.251861572265625, 0.2631645202636719, 0.27446746826171875, 0.2857704162597656, 0.2970733642578125, 0.3083763122558594, 0.31967926025390625, 0.3309822082519531, 0.34228515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 12.0, 20.0, 43.0, 118.0, 519.0, 2846.0, 331.0, 81.0, 34.0, 14.0, 13.0, 8.0, 2.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.190673828125, -0.18637752532958984, -0.1820812225341797, -0.17778491973876953, -0.17348861694335938, -0.16919231414794922, -0.16489601135253906, -0.1605997085571289, -0.15630340576171875, -0.1520071029663086, -0.14771080017089844, -0.14341449737548828, -0.13911819458007812, -0.13482189178466797, -0.1305255889892578, -0.12622928619384766, -0.1219329833984375, -0.11763668060302734, -0.11334037780761719, -0.10904407501220703, -0.10474777221679688, -0.10045146942138672, -0.09615516662597656, -0.0918588638305664, -0.08756256103515625, -0.0832662582397461, -0.07896995544433594, -0.07467365264892578, -0.07037734985351562, -0.06608104705810547, -0.06178474426269531, -0.057488441467285156, -0.053192138671875, -0.048895835876464844, -0.04459953308105469, -0.04030323028564453, -0.036006927490234375, -0.03171062469482422, -0.027414321899414062, -0.023118019104003906, -0.01882171630859375, -0.014525413513183594, -0.010229110717773438, -0.005932807922363281, -0.001636505126953125, 0.0026597976684570312, 0.0069561004638671875, 0.011252403259277344, 0.0155487060546875, 0.019845008850097656, 0.024141311645507812, 0.02843761444091797, 0.032733917236328125, 0.03703022003173828, 0.04132652282714844, 0.045622825622558594, 0.04991912841796875, 0.054215431213378906, 0.05851173400878906, 0.06280803680419922, 0.06710433959960938, 0.07140064239501953, 0.07569694519042969, 0.07999324798583984, 0.08428955078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 21.0, 193.0, 614.0, 127.0, 25.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2426059246063232, -1.2139782905578613, -1.185350775718689, -1.156723141670227, -1.1280955076217651, -1.0994679927825928, -1.0708403587341309, -1.042212724685669, -1.0135852098464966, -0.9849576354026794, -0.9563300013542175, -0.9277024269104004, -0.8990748524665833, -0.8704472184181213, -0.8418196439743042, -0.8131920099258423, -0.7845643758773804, -0.7559368014335632, -0.7273091673851013, -0.6986815929412842, -0.670054018497467, -0.6414263844490051, -0.612798810005188, -0.5841711759567261, -0.5555436611175537, -0.5269160866737366, -0.49828848242759705, -0.4696608781814575, -0.441033273935318, -0.41240566968917847, -0.38377809524536133, -0.3551504909992218, -0.3265228867530823, -0.29789528250694275, -0.2692677080631256, -0.24064010381698608, -0.21201249957084656, -0.18338491022586823, -0.1547573208808899, -0.12612971663475037, -0.09750212728977203, -0.0688745304942131, -0.04024693742394447, -0.011619344353675842, 0.017008252441883087, 0.04563584923744202, 0.07426343858242035, 0.10289104282855988, 0.1315186321735382, 0.16014622151851654, 0.18877382576465607, 0.2174014151096344, 0.24602901935577393, 0.27465659379959106, 0.3032841980457306, 0.3319118022918701, 0.36053937673568726, 0.3891669809818268, 0.4177945554256439, 0.44642215967178345, 0.475049763917923, 0.5036773681640625, 0.5323049426078796, 0.5609325170516968, 0.5895601511001587]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 6.0, 10.0, 14.0, 12.0, 21.0, 17.0, 32.0, 38.0, 36.0, 53.0, 71.0, 78.0, 78.0, 66.0, 80.0, 72.0, 58.0, 64.0, 40.0, 46.0, 25.0, 19.0, 14.0, 13.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.35304415225982666, -0.3416506350040436, -0.3302570879459381, -0.31886357069015503, -0.30747002363204956, -0.2960765063762665, -0.2846829891204834, -0.27328944206237793, -0.26189592480659485, -0.25050240755081177, -0.2391088604927063, -0.22771534323692322, -0.21632181107997894, -0.20492827892303467, -0.1935347616672516, -0.1821412295103073, -0.17074769735336304, -0.15935416519641876, -0.1479606330394745, -0.1365671157836914, -0.12517358362674713, -0.11378005146980286, -0.10238652676343918, -0.0909930020570755, -0.07959946990013123, -0.06820593774318695, -0.05681241303682327, -0.045418884605169296, -0.03402535617351532, -0.022631827741861343, -0.011238299310207367, 0.00015522539615631104, 0.011548757553100586, 0.022942285984754562, 0.03433581441640854, 0.045729342848062515, 0.05712287127971649, 0.06851640343666077, 0.07990992814302444, 0.09130345284938812, 0.1026969850063324, 0.11409051716327667, 0.12548404932022095, 0.13687756657600403, 0.1482710987329483, 0.15966463088989258, 0.17105814814567566, 0.18245168030261993, 0.1938452124595642, 0.20523874461650848, 0.21663227677345276, 0.22802579402923584, 0.23941932618618011, 0.2508128583431244, 0.26220637559890747, 0.27359992265701294, 0.284993439912796, 0.2963869571685791, 0.30778050422668457, 0.31917402148246765, 0.33056753873825073, 0.3419610857963562, 0.3533546030521393, 0.36474812030792236, 0.37614166736602783]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 7.0, 10.0, 11.0, 7.0, 20.0, 30.0, 38.0, 39.0, 84.0, 131.0, 240.0, 461.0, 955.0, 2754.0, 10633.0, 59436.0, 620715.0, 308601.0, 33996.0, 6821.0, 1937.0, 726.0, 362.0, 215.0, 77.0, 72.0, 46.0, 23.0, 24.0, 20.0, 13.0, 5.0, 9.0, 10.0, 7.0, 7.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1424560546875, -0.1379833221435547, -0.13351058959960938, -0.12903785705566406, -0.12456512451171875, -0.12009239196777344, -0.11561965942382812, -0.11114692687988281, -0.1066741943359375, -0.10220146179199219, -0.09772872924804688, -0.09325599670410156, -0.08878326416015625, -0.08431053161621094, -0.07983779907226562, -0.07536506652832031, -0.070892333984375, -0.06641960144042969, -0.061946868896484375, -0.05747413635253906, -0.05300140380859375, -0.04852867126464844, -0.044055938720703125, -0.03958320617675781, -0.0351104736328125, -0.030637741088867188, -0.026165008544921875, -0.021692276000976562, -0.01721954345703125, -0.012746810913085938, -0.008274078369140625, -0.0038013458251953125, 0.00067138671875, 0.0051441192626953125, 0.009616851806640625, 0.014089584350585938, 0.01856231689453125, 0.023035049438476562, 0.027507781982421875, 0.03198051452636719, 0.0364532470703125, 0.04092597961425781, 0.045398712158203125, 0.04987144470214844, 0.05434417724609375, 0.05881690979003906, 0.06328964233398438, 0.06776237487792969, 0.072235107421875, 0.07670783996582031, 0.08118057250976562, 0.08565330505371094, 0.09012603759765625, 0.09459877014160156, 0.09907150268554688, 0.10354423522949219, 0.1080169677734375, 0.11248970031738281, 0.11696243286132812, 0.12143516540527344, 0.12590789794921875, 0.13038063049316406, 0.13485336303710938, 0.1393260955810547, 0.143798828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 11.0, 19.0, 31.0, 48.0, 51.0, 100.0, 98.0, 122.0, 122.0, 102.0, 100.0, 69.0, 58.0, 25.0, 23.0, 11.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.08148193359375, -0.07967329025268555, -0.0778646469116211, -0.07605600357055664, -0.07424736022949219, -0.07243871688842773, -0.07063007354736328, -0.06882143020629883, -0.06701278686523438, -0.06520414352416992, -0.06339550018310547, -0.061586856842041016, -0.05977821350097656, -0.05796957015991211, -0.056160926818847656, -0.0543522834777832, -0.05254364013671875, -0.0507349967956543, -0.048926353454589844, -0.04711771011352539, -0.04530906677246094, -0.043500423431396484, -0.04169178009033203, -0.03988313674926758, -0.038074493408203125, -0.03626585006713867, -0.03445720672607422, -0.032648563385009766, -0.030839920043945312, -0.02903127670288086, -0.027222633361816406, -0.025413990020751953, -0.0236053466796875, -0.021796703338623047, -0.019988059997558594, -0.01817941665649414, -0.016370773315429688, -0.014562129974365234, -0.012753486633300781, -0.010944843292236328, -0.009136199951171875, -0.007327556610107422, -0.005518913269042969, -0.0037102699279785156, -0.0019016265869140625, -9.298324584960938e-05, 0.0017156600952148438, 0.003524303436279297, 0.00533294677734375, 0.007141590118408203, 0.008950233459472656, 0.01075887680053711, 0.012567520141601562, 0.014376163482666016, 0.01618480682373047, 0.017993450164794922, 0.019802093505859375, 0.021610736846923828, 0.02341938018798828, 0.025228023529052734, 0.027036666870117188, 0.02884531021118164, 0.030653953552246094, 0.03246259689331055, 0.034271240234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 18.0, 13.0, 35.0, 26.0, 54.0, 57.0, 91.0, 110.0, 194.0, 318.0, 477.0, 846.0, 1531.0, 3172.0, 7165.0, 17476.0, 47969.0, 160430.0, 511350.0, 204608.0, 56236.0, 20342.0, 8256.0, 3561.0, 1784.0, 867.0, 539.0, 319.0, 229.0, 141.0, 104.0, 68.0, 57.0, 27.0, 22.0, 13.0, 7.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.057952880859375, -0.05622720718383789, -0.05450153350830078, -0.05277585983276367, -0.05105018615722656, -0.04932451248168945, -0.047598838806152344, -0.045873165130615234, -0.044147491455078125, -0.042421817779541016, -0.040696144104003906, -0.0389704704284668, -0.03724479675292969, -0.03551912307739258, -0.03379344940185547, -0.03206777572631836, -0.03034210205078125, -0.02861642837524414, -0.02689075469970703, -0.025165081024169922, -0.023439407348632812, -0.021713733673095703, -0.019988059997558594, -0.018262386322021484, -0.016536712646484375, -0.014811038970947266, -0.013085365295410156, -0.011359691619873047, -0.009634017944335938, -0.007908344268798828, -0.006182670593261719, -0.004456996917724609, -0.0027313232421875, -0.0010056495666503906, 0.0007200241088867188, 0.002445697784423828, 0.0041713714599609375, 0.005897045135498047, 0.007622718811035156, 0.009348392486572266, 0.011074066162109375, 0.012799739837646484, 0.014525413513183594, 0.016251087188720703, 0.017976760864257812, 0.019702434539794922, 0.02142810821533203, 0.02315378189086914, 0.02487945556640625, 0.02660512924194336, 0.02833080291748047, 0.030056476593017578, 0.03178215026855469, 0.0335078239440918, 0.035233497619628906, 0.036959171295166016, 0.038684844970703125, 0.040410518646240234, 0.042136192321777344, 0.04386186599731445, 0.04558753967285156, 0.04731321334838867, 0.04903888702392578, 0.05076456069946289, 0.052490234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 15.0, 5.0, 14.0, 10.0, 15.0, 25.0, 21.0, 35.0, 37.0, 44.0, 51.0, 58.0, 46.0, 59.0, 59.0, 57.0, 54.0, 43.0, 44.0, 50.0, 42.0, 39.0, 40.0, 27.0, 27.0, 20.0, 21.0, 12.0, 12.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11810302734375, -0.11462688446044922, -0.11115074157714844, -0.10767459869384766, -0.10419845581054688, -0.1007223129272461, -0.09724617004394531, -0.09377002716064453, -0.09029388427734375, -0.08681774139404297, -0.08334159851074219, -0.0798654556274414, -0.07638931274414062, -0.07291316986083984, -0.06943702697753906, -0.06596088409423828, -0.0624847412109375, -0.05900859832763672, -0.05553245544433594, -0.052056312561035156, -0.048580169677734375, -0.045104026794433594, -0.04162788391113281, -0.03815174102783203, -0.03467559814453125, -0.03119945526123047, -0.027723312377929688, -0.024247169494628906, -0.020771026611328125, -0.017294883728027344, -0.013818740844726562, -0.010342597961425781, -0.006866455078125, -0.0033903121948242188, 8.58306884765625e-05, 0.0035619735717773438, 0.007038116455078125, 0.010514259338378906, 0.013990402221679688, 0.01746654510498047, 0.02094268798828125, 0.02441883087158203, 0.027894973754882812, 0.031371116638183594, 0.034847259521484375, 0.038323402404785156, 0.04179954528808594, 0.04527568817138672, 0.0487518310546875, 0.05222797393798828, 0.05570411682128906, 0.059180259704589844, 0.06265640258789062, 0.0661325454711914, 0.06960868835449219, 0.07308483123779297, 0.07656097412109375, 0.08003711700439453, 0.08351325988769531, 0.0869894027709961, 0.09046554565429688, 0.09394168853759766, 0.09741783142089844, 0.10089397430419922, 0.1043701171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 4.0, 10.0, 7.0, 16.0, 16.0, 26.0, 37.0, 66.0, 93.0, 152.0, 298.0, 608.0, 1357.0, 4198.0, 22273.0, 308908.0, 642627.0, 56799.0, 7350.0, 2021.0, 789.0, 404.0, 188.0, 122.0, 49.0, 45.0, 23.0, 22.0, 9.0, 7.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0242919921875, -0.023601770401000977, -0.022911548614501953, -0.02222132682800293, -0.021531105041503906, -0.020840883255004883, -0.02015066146850586, -0.019460439682006836, -0.018770217895507812, -0.01807999610900879, -0.017389774322509766, -0.016699552536010742, -0.01600933074951172, -0.015319108963012695, -0.014628887176513672, -0.013938665390014648, -0.013248443603515625, -0.012558221817016602, -0.011868000030517578, -0.011177778244018555, -0.010487556457519531, -0.009797334671020508, -0.009107112884521484, -0.008416891098022461, -0.0077266693115234375, -0.007036447525024414, -0.006346225738525391, -0.005656003952026367, -0.004965782165527344, -0.00427556037902832, -0.003585338592529297, -0.0028951168060302734, -0.00220489501953125, -0.0015146732330322266, -0.0008244514465332031, -0.0001342296600341797, 0.0005559921264648438, 0.0012462139129638672, 0.0019364356994628906, 0.002626657485961914, 0.0033168792724609375, 0.004007101058959961, 0.004697322845458984, 0.005387544631958008, 0.006077766418457031, 0.006767988204956055, 0.007458209991455078, 0.008148431777954102, 0.008838653564453125, 0.009528875350952148, 0.010219097137451172, 0.010909318923950195, 0.011599540710449219, 0.012289762496948242, 0.012979984283447266, 0.013670206069946289, 0.014360427856445312, 0.015050649642944336, 0.01574087142944336, 0.016431093215942383, 0.017121315002441406, 0.01781153678894043, 0.018501758575439453, 0.019191980361938477, 0.0198822021484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 9.0, 12.0, 13.0, 8.0, 18.0, 22.0, 27.0, 42.0, 19.0, 42.0, 49.0, 64.0, 56.0, 63.0, 48.0, 45.0, 62.0, 56.0, 47.0, 39.0, 36.0, 45.0, 35.0, 37.0, 17.0, 19.0, 19.0, 10.0, 15.0, 8.0, 1.0, 3.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.5874545574188232e-06, -3.419816493988037e-06, -3.252178430557251e-06, -3.084540367126465e-06, -2.9169023036956787e-06, -2.7492642402648926e-06, -2.5816261768341064e-06, -2.4139881134033203e-06, -2.246350049972534e-06, -2.078711986541748e-06, -1.911073923110962e-06, -1.7434358596801758e-06, -1.5757977962493896e-06, -1.4081597328186035e-06, -1.2405216693878174e-06, -1.0728836059570312e-06, -9.052455425262451e-07, -7.37607479095459e-07, -5.699694156646729e-07, -4.023313522338867e-07, -2.3469328880310059e-07, -6.705522537231445e-08, 1.0058283805847168e-07, 2.682209014892578e-07, 4.3585896492004395e-07, 6.034970283508301e-07, 7.711350917816162e-07, 9.387731552124023e-07, 1.1064112186431885e-06, 1.2740492820739746e-06, 1.4416873455047607e-06, 1.6093254089355469e-06, 1.776963472366333e-06, 1.944601535797119e-06, 2.1122395992279053e-06, 2.2798776626586914e-06, 2.4475157260894775e-06, 2.6151537895202637e-06, 2.78279185295105e-06, 2.950429916381836e-06, 3.118067979812622e-06, 3.285706043243408e-06, 3.4533441066741943e-06, 3.6209821701049805e-06, 3.7886202335357666e-06, 3.956258296966553e-06, 4.123896360397339e-06, 4.291534423828125e-06, 4.459172487258911e-06, 4.626810550689697e-06, 4.794448614120483e-06, 4.9620866775512695e-06, 5.129724740982056e-06, 5.297362804412842e-06, 5.465000867843628e-06, 5.632638931274414e-06, 5.8002769947052e-06, 5.967915058135986e-06, 6.1355531215667725e-06, 6.303191184997559e-06, 6.470829248428345e-06, 6.638467311859131e-06, 6.806105375289917e-06, 6.973743438720703e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 2.0, 4.0, 10.0, 19.0, 32.0, 38.0, 69.0, 115.0, 176.0, 370.0, 830.0, 2005.0, 6748.0, 36943.0, 364251.0, 556406.0, 65817.0, 10012.0, 2692.0, 996.0, 441.0, 212.0, 139.0, 76.0, 42.0, 33.0, 13.0, 13.0, 14.0, 8.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0178070068359375, -0.017195701599121094, -0.016584396362304688, -0.01597309112548828, -0.015361785888671875, -0.014750480651855469, -0.014139175415039062, -0.013527870178222656, -0.01291656494140625, -0.012305259704589844, -0.011693954467773438, -0.011082649230957031, -0.010471343994140625, -0.009860038757324219, -0.009248733520507812, -0.008637428283691406, -0.008026123046875, -0.007414817810058594, -0.0068035125732421875, -0.006192207336425781, -0.005580902099609375, -0.004969596862792969, -0.0043582916259765625, -0.0037469863891601562, -0.00313568115234375, -0.0025243759155273438, -0.0019130706787109375, -0.0013017654418945312, -0.000690460205078125, -7.915496826171875e-05, 0.0005321502685546875, 0.0011434555053710938, 0.0017547607421875, 0.0023660659790039062, 0.0029773712158203125, 0.0035886764526367188, 0.004199981689453125, 0.004811286926269531, 0.0054225921630859375, 0.006033897399902344, 0.00664520263671875, 0.007256507873535156, 0.007867813110351562, 0.008479118347167969, 0.009090423583984375, 0.009701728820800781, 0.010313034057617188, 0.010924339294433594, 0.01153564453125, 0.012146949768066406, 0.012758255004882812, 0.013369560241699219, 0.013980865478515625, 0.014592170715332031, 0.015203475952148438, 0.015814781188964844, 0.01642608642578125, 0.017037391662597656, 0.017648696899414062, 0.01826000213623047, 0.018871307373046875, 0.01948261260986328, 0.020093917846679688, 0.020705223083496094, 0.0213165283203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 10.0, 9.0, 7.0, 18.0, 28.0, 37.0, 36.0, 51.0, 84.0, 92.0, 96.0, 115.0, 103.0, 68.0, 63.0, 56.0, 35.0, 28.0, 17.0, 13.0, 5.0, 12.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183868408203125, -0.01773214340209961, -0.01707744598388672, -0.016422748565673828, -0.015768051147460938, -0.015113353729248047, -0.014458656311035156, -0.013803958892822266, -0.013149261474609375, -0.012494564056396484, -0.011839866638183594, -0.011185169219970703, -0.010530471801757812, -0.009875774383544922, -0.009221076965332031, -0.00856637954711914, -0.00791168212890625, -0.007256984710693359, -0.006602287292480469, -0.005947589874267578, -0.0052928924560546875, -0.004638195037841797, -0.003983497619628906, -0.0033288002014160156, -0.002674102783203125, -0.0020194053649902344, -0.0013647079467773438, -0.0007100105285644531, -5.53131103515625e-05, 0.0005993843078613281, 0.0012540817260742188, 0.0019087791442871094, 0.0025634765625, 0.0032181739807128906, 0.0038728713989257812, 0.004527568817138672, 0.0051822662353515625, 0.005836963653564453, 0.006491661071777344, 0.007146358489990234, 0.007801055908203125, 0.008455753326416016, 0.009110450744628906, 0.009765148162841797, 0.010419845581054688, 0.011074542999267578, 0.011729240417480469, 0.01238393783569336, 0.01303863525390625, 0.01369333267211914, 0.014348030090332031, 0.015002727508544922, 0.015657424926757812, 0.016312122344970703, 0.016966819763183594, 0.017621517181396484, 0.018276214599609375, 0.018930912017822266, 0.019585609436035156, 0.020240306854248047, 0.020895004272460938, 0.021549701690673828, 0.02220439910888672, 0.02285909652709961, 0.0235137939453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 6.0, 13.0, 32.0, 133.0, 394.0, 297.0, 76.0, 37.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41205042600631714, -0.382324755191803, -0.3525990843772888, -0.32287341356277466, -0.2931477427482605, -0.26342207193374634, -0.2336963713169098, -0.20397070050239563, -0.17424502968788147, -0.1445193588733673, -0.11479368060827255, -0.0850680023431778, -0.055342331528663635, -0.025616660714149475, 0.004109025001525879, 0.03383469581604004, 0.0635603666305542, 0.09328603744506836, 0.12301171571016312, 0.15273739397525787, 0.18246306478977203, 0.2121887356042862, 0.24191442131996155, 0.2716400921344757, 0.30136576294898987, 0.33109143376350403, 0.3608171045780182, 0.39054280519485474, 0.4202684760093689, 0.44999414682388306, 0.4797198176383972, 0.5094454884529114, 0.5391710996627808, 0.5688967704772949, 0.5986224412918091, 0.6283481121063232, 0.6580737829208374, 0.6877994537353516, 0.7175251245498657, 0.7472507953643799, 0.776976466178894, 0.8067021369934082, 0.8364278078079224, 0.8661534786224365, 0.8958791494369507, 0.9256048202514648, 0.955330491065979, 0.9850561618804932, 1.0147819519042969, 1.044507622718811, 1.0742332935333252, 1.1039589643478394, 1.1336846351623535, 1.1634103059768677, 1.1931359767913818, 1.222861647605896, 1.2525873184204102, 1.2823129892349243, 1.3120386600494385, 1.3417643308639526, 1.3714900016784668, 1.401215672492981, 1.4309413433074951, 1.4606670141220093, 1.4903926849365234]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 4.0, 8.0, 8.0, 18.0, 22.0, 27.0, 27.0, 38.0, 39.0, 42.0, 48.0, 51.0, 55.0, 69.0, 54.0, 68.0, 51.0, 66.0, 60.0, 39.0, 48.0, 23.0, 28.0, 20.0, 15.0, 21.0, 16.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.605270266532898, -0.5847169160842896, -0.5641635656356812, -0.543610155582428, -0.5230568051338196, -0.5025034546852112, -0.4819501042366028, -0.4613967537879944, -0.4408433735370636, -0.4202900230884552, -0.3997366428375244, -0.379183292388916, -0.3586299419403076, -0.33807656168937683, -0.31752321124076843, -0.29696983098983765, -0.27641648054122925, -0.25586313009262085, -0.23530974984169006, -0.21475639939308167, -0.19420303404331207, -0.17364966869354248, -0.15309631824493408, -0.1325429528951645, -0.1119895875453949, -0.0914362221956253, -0.07088286429643631, -0.050329502671957016, -0.029776141047477722, -0.00922277569770813, 0.011330582201480865, 0.03188394010066986, 0.05243724584579468, 0.07299061119556427, 0.09354396909475327, 0.11409732699394226, 0.13465069234371185, 0.15520405769348145, 0.17575740814208984, 0.19631077349185944, 0.21686413884162903, 0.23741750419139862, 0.2579708695411682, 0.2785242199897766, 0.299077570438385, 0.3196309506893158, 0.3401843011379242, 0.360737681388855, 0.3812910318374634, 0.4018443822860718, 0.42239776253700256, 0.44295111298561096, 0.46350449323654175, 0.48405784368515015, 0.5046111941337585, 0.5251645445823669, 0.5457179546356201, 0.5662713050842285, 0.5868246555328369, 0.6073780655860901, 0.6279314160346985, 0.6484847664833069, 0.6690381169319153, 0.6895914673805237, 0.7101448178291321]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 7.0, 3.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 30.0, 16.0, 39.0, 47.0, 76.0, 99.0, 173.0, 254.0, 423.0, 943.0, 1951.0, 4929.0, 16049.0, 104440.0, 3862849.0, 172084.0, 20360.0, 5530.0, 2106.0, 857.0, 424.0, 226.0, 119.0, 81.0, 50.0, 31.0, 16.0, 16.0, 5.0, 6.0, 7.0, 0.0, 0.0, 2.0], "bins": [-0.1151123046875, -0.11253023147583008, -0.10994815826416016, -0.10736608505249023, -0.10478401184082031, -0.10220193862915039, -0.09961986541748047, -0.09703779220581055, -0.09445571899414062, -0.0918736457824707, -0.08929157257080078, -0.08670949935913086, -0.08412742614746094, -0.08154535293579102, -0.0789632797241211, -0.07638120651245117, -0.07379913330078125, -0.07121706008911133, -0.0686349868774414, -0.06605291366577148, -0.06347084045410156, -0.06088876724243164, -0.05830669403076172, -0.0557246208190918, -0.053142547607421875, -0.05056047439575195, -0.04797840118408203, -0.04539632797241211, -0.04281425476074219, -0.040232181549072266, -0.037650108337402344, -0.03506803512573242, -0.0324859619140625, -0.029903888702392578, -0.027321815490722656, -0.024739742279052734, -0.022157669067382812, -0.01957559585571289, -0.01699352264404297, -0.014411449432373047, -0.011829376220703125, -0.009247303009033203, -0.006665229797363281, -0.004083156585693359, -0.0015010833740234375, 0.0010809898376464844, 0.0036630630493164062, 0.006245136260986328, 0.00882720947265625, 0.011409282684326172, 0.013991355895996094, 0.016573429107666016, 0.019155502319335938, 0.02173757553100586, 0.02431964874267578, 0.026901721954345703, 0.029483795166015625, 0.03206586837768555, 0.03464794158935547, 0.03723001480102539, 0.03981208801269531, 0.042394161224365234, 0.044976234436035156, 0.04755830764770508, 0.050140380859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 11.0, 16.0, 28.0, 32.0, 60.0, 88.0, 105.0, 92.0, 112.0, 102.0, 100.0, 92.0, 67.0, 32.0, 28.0, 18.0, 8.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0789794921875, -0.07724237442016602, -0.07550525665283203, -0.07376813888549805, -0.07203102111816406, -0.07029390335083008, -0.0685567855834961, -0.06681966781616211, -0.06508255004882812, -0.06334543228149414, -0.061608314514160156, -0.05987119674682617, -0.05813407897949219, -0.0563969612121582, -0.05465984344482422, -0.052922725677490234, -0.05118560791015625, -0.049448490142822266, -0.04771137237548828, -0.0459742546081543, -0.04423713684082031, -0.04250001907348633, -0.040762901306152344, -0.03902578353881836, -0.037288665771484375, -0.03555154800415039, -0.033814430236816406, -0.03207731246948242, -0.030340194702148438, -0.028603076934814453, -0.02686595916748047, -0.025128841400146484, -0.0233917236328125, -0.021654605865478516, -0.01991748809814453, -0.018180370330810547, -0.016443252563476562, -0.014706134796142578, -0.012969017028808594, -0.01123189926147461, -0.009494781494140625, -0.007757663726806641, -0.006020545959472656, -0.004283428192138672, -0.0025463104248046875, -0.0008091926574707031, 0.0009279251098632812, 0.0026650428771972656, 0.00440216064453125, 0.006139278411865234, 0.007876396179199219, 0.009613513946533203, 0.011350631713867188, 0.013087749481201172, 0.014824867248535156, 0.01656198501586914, 0.018299102783203125, 0.02003622055053711, 0.021773338317871094, 0.023510456085205078, 0.025247573852539062, 0.026984691619873047, 0.02872180938720703, 0.030458927154541016, 0.032196044921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 10.0, 14.0, 25.0, 49.0, 81.0, 164.0, 368.0, 1127.0, 11985.0, 4139389.0, 38190.0, 1762.0, 540.0, 253.0, 146.0, 77.0, 46.0, 19.0, 16.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2396240234375, -0.2328968048095703, -0.22616958618164062, -0.21944236755371094, -0.21271514892578125, -0.20598793029785156, -0.19926071166992188, -0.1925334930419922, -0.1858062744140625, -0.1790790557861328, -0.17235183715820312, -0.16562461853027344, -0.15889739990234375, -0.15217018127441406, -0.14544296264648438, -0.1387157440185547, -0.131988525390625, -0.1252613067626953, -0.11853408813476562, -0.11180686950683594, -0.10507965087890625, -0.09835243225097656, -0.09162521362304688, -0.08489799499511719, -0.0781707763671875, -0.07144355773925781, -0.06471633911132812, -0.05798912048339844, -0.05126190185546875, -0.04453468322753906, -0.037807464599609375, -0.031080245971679688, -0.02435302734375, -0.017625808715820312, -0.010898590087890625, -0.0041713714599609375, 0.00255584716796875, 0.009283065795898438, 0.016010284423828125, 0.022737503051757812, 0.0294647216796875, 0.03619194030761719, 0.042919158935546875, 0.04964637756347656, 0.05637359619140625, 0.06310081481933594, 0.06982803344726562, 0.07655525207519531, 0.083282470703125, 0.09000968933105469, 0.09673690795898438, 0.10346412658691406, 0.11019134521484375, 0.11691856384277344, 0.12364578247070312, 0.1303730010986328, 0.1371002197265625, 0.1438274383544922, 0.15055465698242188, 0.15728187561035156, 0.16400909423828125, 0.17073631286621094, 0.17746353149414062, 0.1841907501220703, 0.19091796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 11.0, 25.0, 67.0, 288.0, 2894.0, 584.0, 127.0, 37.0, 23.0, 12.0, 5.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047271728515625, -0.04486417770385742, -0.042456626892089844, -0.040049076080322266, -0.03764152526855469, -0.03523397445678711, -0.03282642364501953, -0.030418872833251953, -0.028011322021484375, -0.025603771209716797, -0.02319622039794922, -0.02078866958618164, -0.018381118774414062, -0.015973567962646484, -0.013566017150878906, -0.011158466339111328, -0.00875091552734375, -0.006343364715576172, -0.003935813903808594, -0.0015282630920410156, 0.0008792877197265625, 0.0032868385314941406, 0.005694389343261719, 0.008101940155029297, 0.010509490966796875, 0.012917041778564453, 0.015324592590332031, 0.01773214340209961, 0.020139694213867188, 0.022547245025634766, 0.024954795837402344, 0.027362346649169922, 0.0297698974609375, 0.03217744827270508, 0.034584999084472656, 0.036992549896240234, 0.03940010070800781, 0.04180765151977539, 0.04421520233154297, 0.04662275314331055, 0.049030303955078125, 0.0514378547668457, 0.05384540557861328, 0.05625295639038086, 0.05866050720214844, 0.061068058013916016, 0.0634756088256836, 0.06588315963745117, 0.06829071044921875, 0.07069826126098633, 0.0731058120727539, 0.07551336288452148, 0.07792091369628906, 0.08032846450805664, 0.08273601531982422, 0.0851435661315918, 0.08755111694335938, 0.08995866775512695, 0.09236621856689453, 0.09477376937866211, 0.09718132019042969, 0.09958887100219727, 0.10199642181396484, 0.10440397262573242, 0.1068115234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 16.0, 412.0, 520.0, 36.0, 11.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21016788482666016, -0.18899136781692505, -0.16781483590602875, -0.14663830399513245, -0.12546178698539734, -0.10428526252508163, -0.08310873806476593, -0.06193220615386963, -0.04075568914413452, -0.019579164683818817, 0.0015973597764968872, 0.02277388423681259, 0.043950408697128296, 0.065126933157444, 0.0863034576177597, 0.107479989528656, 0.1286565065383911, 0.14983302354812622, 0.17100955545902252, 0.19218608736991882, 0.21336260437965393, 0.23453912138938904, 0.25571566820144653, 0.27689218521118164, 0.29806870222091675, 0.31924521923065186, 0.34042173624038696, 0.36159828305244446, 0.38277480006217957, 0.4039513170719147, 0.42512786388397217, 0.4463043808937073, 0.4674808979034424, 0.4886574149131775, 0.5098339319229126, 0.5310104489326477, 0.5521869659423828, 0.5733635425567627, 0.5945400595664978, 0.6157165765762329, 0.636893093585968, 0.6580696105957031, 0.6792461276054382, 0.7004226446151733, 0.7215992212295532, 0.7427757382392883, 0.7639522552490234, 0.7851287722587585, 0.8063052892684937, 0.8274818062782288, 0.8486583232879639, 0.869834840297699, 0.8910113573074341, 0.912187933921814, 0.9333644509315491, 0.9545409679412842, 0.9757174849510193, 0.9968940019607544, 1.0180705785751343, 1.0392470359802246, 1.0604236125946045, 1.0816000699996948, 1.1027766466140747, 1.123953104019165, 1.145129680633545]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 20.0, 47.0, 72.0, 103.0, 136.0, 170.0, 150.0, 113.0, 85.0, 45.0, 28.0, 17.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3092511296272278, -0.29772329330444336, -0.28619542717933655, -0.2746675908565521, -0.2631397247314453, -0.2516118884086609, -0.24008403718471527, -0.22855618596076965, -0.21702834963798523, -0.2055004984140396, -0.193972647190094, -0.18244481086730957, -0.17091695964336395, -0.15938910841941833, -0.14786125719547272, -0.1363334059715271, -0.12480555474758148, -0.11327770352363586, -0.10174985975027084, -0.09022200852632523, -0.0786941647529602, -0.06716631352901459, -0.05563846230506897, -0.04411061853170395, -0.03258276730775833, -0.021054919809103012, -0.009527070447802544, 0.002000778913497925, 0.013528626412153244, 0.025056473910808563, 0.03658432513475418, 0.0481121689081192, 0.05964002013206482, 0.07116787135601044, 0.08269571512937546, 0.09422356635332108, 0.1057514101266861, 0.11727926135063171, 0.12880711257457733, 0.14033496379852295, 0.15186280012130737, 0.163390651345253, 0.1749185025691986, 0.18644633889198303, 0.19797419011592865, 0.20950204133987427, 0.22102989256381989, 0.2325577437877655, 0.24408559501171112, 0.25561344623565674, 0.26714128255844116, 0.278669148683548, 0.2901969850063324, 0.3017248511314392, 0.31325268745422363, 0.32478052377700806, 0.33630838990211487, 0.3478362262248993, 0.3593640923500061, 0.3708919286727905, 0.38241979479789734, 0.39394763112068176, 0.4054754972457886, 0.417003333568573, 0.4285311698913574]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 7.0, 12.0, 14.0, 22.0, 16.0, 51.0, 67.0, 96.0, 163.0, 271.0, 513.0, 1101.0, 2640.0, 7491.0, 28568.0, 161170.0, 653758.0, 152809.0, 27601.0, 7314.0, 2510.0, 1098.0, 521.0, 274.0, 167.0, 99.0, 60.0, 33.0, 30.0, 20.0, 17.0, 7.0, 10.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09870719909667969, -0.09566879272460938, -0.09263038635253906, -0.08959197998046875, -0.08655357360839844, -0.08351516723632812, -0.08047676086425781, -0.0774383544921875, -0.07439994812011719, -0.07136154174804688, -0.06832313537597656, -0.06528472900390625, -0.06224632263183594, -0.059207916259765625, -0.05616950988769531, -0.053131103515625, -0.05009269714355469, -0.047054290771484375, -0.04401588439941406, -0.04097747802734375, -0.03793907165527344, -0.034900665283203125, -0.03186225891113281, -0.0288238525390625, -0.025785446166992188, -0.022747039794921875, -0.019708633422851562, -0.01667022705078125, -0.013631820678710938, -0.010593414306640625, -0.0075550079345703125, -0.0045166015625, -0.0014781951904296875, 0.001560211181640625, 0.0045986175537109375, 0.00763702392578125, 0.010675430297851562, 0.013713836669921875, 0.016752243041992188, 0.0197906494140625, 0.022829055786132812, 0.025867462158203125, 0.028905868530273438, 0.03194427490234375, 0.03498268127441406, 0.038021087646484375, 0.04105949401855469, 0.044097900390625, 0.04713630676269531, 0.050174713134765625, 0.05321311950683594, 0.05625152587890625, 0.05928993225097656, 0.062328338623046875, 0.06536674499511719, 0.0684051513671875, 0.07144355773925781, 0.07448196411132812, 0.07752037048339844, 0.08055877685546875, 0.08359718322753906, 0.08663558959960938, 0.08967399597167969, 0.09271240234375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 21.0, 20.0, 37.0, 51.0, 64.0, 82.0, 92.0, 104.0, 89.0, 85.0, 93.0, 71.0, 58.0, 49.0, 30.0, 18.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.061767578125, -0.060302734375, -0.058837890625, -0.057373046875, -0.055908203125, -0.054443359375, -0.052978515625, -0.051513671875, -0.050048828125, -0.048583984375, -0.047119140625, -0.045654296875, -0.044189453125, -0.042724609375, -0.041259765625, -0.039794921875, -0.038330078125, -0.036865234375, -0.035400390625, -0.033935546875, -0.032470703125, -0.031005859375, -0.029541015625, -0.028076171875, -0.026611328125, -0.025146484375, -0.023681640625, -0.022216796875, -0.020751953125, -0.019287109375, -0.017822265625, -0.016357421875, -0.014892578125, -0.013427734375, -0.011962890625, -0.010498046875, -0.009033203125, -0.007568359375, -0.006103515625, -0.004638671875, -0.003173828125, -0.001708984375, -0.000244140625, 0.001220703125, 0.002685546875, 0.004150390625, 0.005615234375, 0.007080078125, 0.008544921875, 0.010009765625, 0.011474609375, 0.012939453125, 0.014404296875, 0.015869140625, 0.017333984375, 0.018798828125, 0.020263671875, 0.021728515625, 0.023193359375, 0.024658203125, 0.026123046875, 0.027587890625, 0.029052734375, 0.030517578125, 0.031982421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 10.0, 12.0, 9.0, 22.0, 16.0, 43.0, 39.0, 49.0, 87.0, 94.0, 159.0, 213.0, 314.0, 480.0, 774.0, 1440.0, 2994.0, 6775.0, 17712.0, 51912.0, 198908.0, 518488.0, 172821.0, 46774.0, 15727.0, 6240.0, 2744.0, 1441.0, 743.0, 489.0, 312.0, 205.0, 133.0, 108.0, 85.0, 54.0, 31.0, 32.0, 19.0, 16.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.052978515625, -0.05144071578979492, -0.049902915954589844, -0.048365116119384766, -0.04682731628417969, -0.04528951644897461, -0.04375171661376953, -0.04221391677856445, -0.040676116943359375, -0.0391383171081543, -0.03760051727294922, -0.03606271743774414, -0.03452491760253906, -0.032987117767333984, -0.031449317932128906, -0.029911518096923828, -0.02837371826171875, -0.026835918426513672, -0.025298118591308594, -0.023760318756103516, -0.022222518920898438, -0.02068471908569336, -0.01914691925048828, -0.017609119415283203, -0.016071319580078125, -0.014533519744873047, -0.012995719909667969, -0.01145792007446289, -0.009920120239257812, -0.008382320404052734, -0.006844520568847656, -0.005306720733642578, -0.0037689208984375, -0.002231121063232422, -0.0006933212280273438, 0.0008444786071777344, 0.0023822784423828125, 0.003920078277587891, 0.005457878112792969, 0.006995677947998047, 0.008533477783203125, 0.010071277618408203, 0.011609077453613281, 0.01314687728881836, 0.014684677124023438, 0.016222476959228516, 0.017760276794433594, 0.019298076629638672, 0.02083587646484375, 0.022373676300048828, 0.023911476135253906, 0.025449275970458984, 0.026987075805664062, 0.02852487564086914, 0.03006267547607422, 0.0316004753112793, 0.033138275146484375, 0.03467607498168945, 0.03621387481689453, 0.03775167465209961, 0.03928947448730469, 0.040827274322509766, 0.042365074157714844, 0.04390287399291992, 0.045440673828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 11.0, 9.0, 21.0, 13.0, 26.0, 22.0, 19.0, 18.0, 24.0, 28.0, 30.0, 41.0, 40.0, 34.0, 41.0, 59.0, 41.0, 33.0, 34.0, 43.0, 36.0, 53.0, 41.0, 32.0, 39.0, 31.0, 23.0, 25.0, 20.0, 17.0, 17.0, 15.0, 16.0, 10.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0955810546875, -0.0930023193359375, -0.090423583984375, -0.0878448486328125, -0.08526611328125, -0.0826873779296875, -0.080108642578125, -0.0775299072265625, -0.074951171875, -0.0723724365234375, -0.069793701171875, -0.0672149658203125, -0.06463623046875, -0.0620574951171875, -0.059478759765625, -0.0569000244140625, -0.0543212890625, -0.0517425537109375, -0.049163818359375, -0.0465850830078125, -0.04400634765625, -0.0414276123046875, -0.038848876953125, -0.0362701416015625, -0.03369140625, -0.0311126708984375, -0.028533935546875, -0.0259552001953125, -0.02337646484375, -0.0207977294921875, -0.018218994140625, -0.0156402587890625, -0.0130615234375, -0.0104827880859375, -0.007904052734375, -0.0053253173828125, -0.00274658203125, -0.0001678466796875, 0.002410888671875, 0.0049896240234375, 0.007568359375, 0.0101470947265625, 0.012725830078125, 0.0153045654296875, 0.01788330078125, 0.0204620361328125, 0.023040771484375, 0.0256195068359375, 0.0281982421875, 0.0307769775390625, 0.033355712890625, 0.0359344482421875, 0.03851318359375, 0.0410919189453125, 0.043670654296875, 0.0462493896484375, 0.048828125, 0.0514068603515625, 0.053985595703125, 0.0565643310546875, 0.05914306640625, 0.0617218017578125, 0.064300537109375, 0.0668792724609375, 0.0694580078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 18.0, 22.0, 40.0, 61.0, 113.0, 183.0, 276.0, 612.0, 1693.0, 5083.0, 28706.0, 336979.0, 594103.0, 68065.0, 8437.0, 2277.0, 932.0, 393.0, 226.0, 119.0, 63.0, 45.0, 27.0, 22.0, 14.0, 9.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0191192626953125, -0.018543004989624023, -0.017966747283935547, -0.01739048957824707, -0.016814231872558594, -0.016237974166870117, -0.01566171646118164, -0.015085458755493164, -0.014509201049804688, -0.013932943344116211, -0.013356685638427734, -0.012780427932739258, -0.012204170227050781, -0.011627912521362305, -0.011051654815673828, -0.010475397109985352, -0.009899139404296875, -0.009322881698608398, -0.008746623992919922, -0.008170366287231445, -0.007594108581542969, -0.007017850875854492, -0.006441593170166016, -0.005865335464477539, -0.0052890777587890625, -0.004712820053100586, -0.004136562347412109, -0.003560304641723633, -0.0029840469360351562, -0.0024077892303466797, -0.0018315315246582031, -0.0012552738189697266, -0.00067901611328125, -0.00010275840759277344, 0.0004734992980957031, 0.0010497570037841797, 0.0016260147094726562, 0.002202272415161133, 0.0027785301208496094, 0.003354787826538086, 0.0039310455322265625, 0.004507303237915039, 0.005083560943603516, 0.005659818649291992, 0.006236076354980469, 0.006812334060668945, 0.007388591766357422, 0.007964849472045898, 0.008541107177734375, 0.009117364883422852, 0.009693622589111328, 0.010269880294799805, 0.010846138000488281, 0.011422395706176758, 0.011998653411865234, 0.012574911117553711, 0.013151168823242188, 0.013727426528930664, 0.01430368423461914, 0.014879941940307617, 0.015456199645996094, 0.01603245735168457, 0.016608715057373047, 0.017184972763061523, 0.01776123046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 14.0, 13.0, 15.0, 28.0, 17.0, 26.0, 46.0, 31.0, 50.0, 58.0, 40.0, 79.0, 27.0, 83.0, 45.0, 39.0, 65.0, 52.0, 40.0, 52.0, 21.0, 37.0, 24.0, 10.0, 18.0, 17.0, 10.0, 8.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.066394805908203e-06, -4.909932613372803e-06, -4.753470420837402e-06, -4.597008228302002e-06, -4.4405460357666016e-06, -4.284083843231201e-06, -4.127621650695801e-06, -3.9711594581604e-06, -3.814697265625e-06, -3.6582350730895996e-06, -3.5017728805541992e-06, -3.345310688018799e-06, -3.1888484954833984e-06, -3.032386302947998e-06, -2.8759241104125977e-06, -2.7194619178771973e-06, -2.562999725341797e-06, -2.4065375328063965e-06, -2.250075340270996e-06, -2.0936131477355957e-06, -1.9371509552001953e-06, -1.780688762664795e-06, -1.6242265701293945e-06, -1.4677643775939941e-06, -1.3113021850585938e-06, -1.1548399925231934e-06, -9.98377799987793e-07, -8.419156074523926e-07, -6.854534149169922e-07, -5.289912223815918e-07, -3.725290298461914e-07, -2.1606683731079102e-07, -5.960464477539063e-08, 9.685754776000977e-08, 2.5331974029541016e-07, 4.0978193283081055e-07, 5.662441253662109e-07, 7.227063179016113e-07, 8.791685104370117e-07, 1.0356307029724121e-06, 1.1920928955078125e-06, 1.3485550880432129e-06, 1.5050172805786133e-06, 1.6614794731140137e-06, 1.817941665649414e-06, 1.9744038581848145e-06, 2.130866050720215e-06, 2.2873282432556152e-06, 2.4437904357910156e-06, 2.600252628326416e-06, 2.7567148208618164e-06, 2.913177013397217e-06, 3.069639205932617e-06, 3.2261013984680176e-06, 3.382563591003418e-06, 3.5390257835388184e-06, 3.6954879760742188e-06, 3.851950168609619e-06, 4.0084123611450195e-06, 4.16487455368042e-06, 4.32133674621582e-06, 4.477798938751221e-06, 4.634261131286621e-06, 4.7907233238220215e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 3.0, 4.0, 6.0, 10.0, 14.0, 17.0, 21.0, 38.0, 39.0, 57.0, 105.0, 193.0, 292.0, 506.0, 1082.0, 2429.0, 6796.0, 23735.0, 122563.0, 511087.0, 303942.0, 55510.0, 12431.0, 4098.0, 1699.0, 821.0, 406.0, 225.0, 151.0, 78.0, 57.0, 33.0, 24.0, 24.0, 16.0, 10.0, 7.0, 9.0, 4.0, 3.0, 0.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.01546478271484375, -0.015032410621643066, -0.014600038528442383, -0.0141676664352417, -0.013735294342041016, -0.013302922248840332, -0.012870550155639648, -0.012438178062438965, -0.012005805969238281, -0.011573433876037598, -0.011141061782836914, -0.01070868968963623, -0.010276317596435547, -0.009843945503234863, -0.00941157341003418, -0.008979201316833496, -0.008546829223632812, -0.008114457130432129, -0.007682085037231445, -0.007249712944030762, -0.006817340850830078, -0.0063849687576293945, -0.005952596664428711, -0.005520224571228027, -0.005087852478027344, -0.00465548038482666, -0.0042231082916259766, -0.003790736198425293, -0.0033583641052246094, -0.0029259920120239258, -0.002493619918823242, -0.0020612478256225586, -0.001628875732421875, -0.0011965036392211914, -0.0007641315460205078, -0.0003317594528198242, 0.00010061264038085938, 0.000532984733581543, 0.0009653568267822266, 0.0013977289199829102, 0.0018301010131835938, 0.0022624731063842773, 0.002694845199584961, 0.0031272172927856445, 0.003559589385986328, 0.003991961479187012, 0.004424333572387695, 0.004856705665588379, 0.0052890777587890625, 0.005721449851989746, 0.00615382194519043, 0.006586194038391113, 0.007018566131591797, 0.0074509382247924805, 0.007883310317993164, 0.008315682411193848, 0.008748054504394531, 0.009180426597595215, 0.009612798690795898, 0.010045170783996582, 0.010477542877197266, 0.01090991497039795, 0.011342287063598633, 0.011774659156799316, 0.01220703125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 13.0, 12.0, 18.0, 17.0, 28.0, 33.0, 44.0, 70.0, 79.0, 88.0, 78.0, 92.0, 81.0, 70.0, 68.0, 50.0, 36.0, 34.0, 17.0, 17.0, 14.0, 4.0, 8.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019285917282104492, -0.018704891204833984, -0.018123865127563477, -0.01754283905029297, -0.01696181297302246, -0.016380786895751953, -0.015799760818481445, -0.015218734741210938, -0.01463770866394043, -0.014056682586669922, -0.013475656509399414, -0.012894630432128906, -0.012313604354858398, -0.01173257827758789, -0.011151552200317383, -0.010570526123046875, -0.009989500045776367, -0.00940847396850586, -0.008827447891235352, -0.008246421813964844, -0.007665395736694336, -0.007084369659423828, -0.00650334358215332, -0.0059223175048828125, -0.005341291427612305, -0.004760265350341797, -0.004179239273071289, -0.0035982131958007812, -0.0030171871185302734, -0.0024361610412597656, -0.0018551349639892578, -0.00127410888671875, -0.0006930828094482422, -0.00011205673217773438, 0.00046896934509277344, 0.0010499954223632812, 0.001631021499633789, 0.002212047576904297, 0.0027930736541748047, 0.0033740997314453125, 0.00395512580871582, 0.004536151885986328, 0.005117177963256836, 0.005698204040527344, 0.0062792301177978516, 0.006860256195068359, 0.007441282272338867, 0.008022308349609375, 0.008603334426879883, 0.00918436050415039, 0.009765386581420898, 0.010346412658691406, 0.010927438735961914, 0.011508464813232422, 0.01208949089050293, 0.012670516967773438, 0.013251543045043945, 0.013832569122314453, 0.014413595199584961, 0.014994621276855469, 0.015575647354125977, 0.016156673431396484, 0.016737699508666992, 0.0173187255859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 40.0, 206.0, 570.0, 136.0, 28.0, 15.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6432075500488281, -1.60617196559906, -1.5691365003585815, -1.5321009159088135, -1.495065450668335, -1.458029866218567, -1.4209942817687988, -1.3839588165283203, -1.3469232320785522, -1.3098876476287842, -1.2728521823883057, -1.2358165979385376, -1.1987810134887695, -1.161745548248291, -1.124709963798523, -1.0876743793487549, -1.0506389141082764, -1.0136033296585083, -0.9765678644180298, -0.9395322799682617, -0.9024967551231384, -0.8654612302780151, -0.8284256458282471, -0.7913901209831238, -0.7543545961380005, -0.7173190712928772, -0.6802835464477539, -0.6432479619979858, -0.6062124371528625, -0.5691769123077393, -0.5321413278579712, -0.4951058030128479, -0.4580702781677246, -0.4210347533226013, -0.38399919867515564, -0.34696364402770996, -0.30992811918258667, -0.2728925943374634, -0.2358570396900177, -0.19882148504257202, -0.16178596019744873, -0.12475042045116425, -0.08771488070487976, -0.050679340958595276, -0.013643801212310791, 0.023391738533973694, 0.06042727828025818, 0.09746283292770386, 0.13449835777282715, 0.17153389751911163, 0.20856943726539612, 0.2456049770116806, 0.2826405167579651, 0.3196760416030884, 0.35671159625053406, 0.39374715089797974, 0.430782675743103, 0.4678182005882263, 0.5048537254333496, 0.5418893098831177, 0.578924834728241, 0.6159603595733643, 0.6529959440231323, 0.6900314688682556, 0.7270669937133789]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 13.0, 13.0, 11.0, 20.0, 16.0, 18.0, 25.0, 26.0, 18.0, 22.0, 28.0, 24.0, 41.0, 38.0, 35.0, 43.0, 51.0, 56.0, 53.0, 45.0, 47.0, 35.0, 35.0, 32.0, 26.0, 28.0, 27.0, 21.0, 23.0, 24.0, 20.0, 14.0, 12.0, 8.0, 6.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3812182545661926, -0.3682142198085785, -0.35521018505096436, -0.34220612049102783, -0.3292020857334137, -0.31619805097579956, -0.3031940162181854, -0.2901899814605713, -0.27718594670295715, -0.264181911945343, -0.2511778771877289, -0.23817382752895355, -0.22516979277133942, -0.2121657431125641, -0.19916170835494995, -0.18615767359733582, -0.17315362393856049, -0.16014958918094635, -0.14714553952217102, -0.13414150476455688, -0.12113747000694275, -0.10813342779874802, -0.09512938559055328, -0.08212535083293915, -0.06912130862474442, -0.05611727014183998, -0.04311323165893555, -0.030109189450740814, -0.01710515096783638, -0.004101112484931946, 0.008902929723262787, 0.021906964480876923, 0.034911006689071655, 0.04791504517197609, 0.060919083654880524, 0.07392312586307526, 0.08692716062068939, 0.09993120282888412, 0.11293524503707886, 0.125939279794693, 0.13894331455230713, 0.15194734930992126, 0.1649513989686966, 0.17795543372631073, 0.19095946848392487, 0.2039635181427002, 0.21696755290031433, 0.22997158765792847, 0.2429756373167038, 0.2559796869754791, 0.26898372173309326, 0.2819877564907074, 0.29499179124832153, 0.30799582600593567, 0.3209998607635498, 0.33400392532348633, 0.34700796008110046, 0.3600119948387146, 0.37301602959632874, 0.38602006435394287, 0.3990241289138794, 0.41202816367149353, 0.42503219842910767, 0.4380362331867218, 0.45104026794433594]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 23.0, 23.0, 68.0, 184.0, 528.0, 1877.0, 12517.0, 3685802.0, 483267.0, 8074.0, 1294.0, 378.0, 129.0, 58.0, 23.0, 16.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.264892578125, -0.25936412811279297, -0.25383567810058594, -0.2483072280883789, -0.24277877807617188, -0.23725032806396484, -0.2317218780517578, -0.22619342803955078, -0.22066497802734375, -0.21513652801513672, -0.2096080780029297, -0.20407962799072266, -0.19855117797851562, -0.1930227279663086, -0.18749427795410156, -0.18196582794189453, -0.1764373779296875, -0.17090892791748047, -0.16538047790527344, -0.1598520278930664, -0.15432357788085938, -0.14879512786865234, -0.1432666778564453, -0.13773822784423828, -0.13220977783203125, -0.12668132781982422, -0.12115287780761719, -0.11562442779541016, -0.11009597778320312, -0.1045675277709961, -0.09903907775878906, -0.09351062774658203, -0.087982177734375, -0.08245372772216797, -0.07692527770996094, -0.0713968276977539, -0.06586837768554688, -0.060339927673339844, -0.05481147766113281, -0.04928302764892578, -0.04375457763671875, -0.03822612762451172, -0.03269767761230469, -0.027169227600097656, -0.021640777587890625, -0.016112327575683594, -0.010583877563476562, -0.005055427551269531, 0.0004730224609375, 0.006001472473144531, 0.011529922485351562, 0.017058372497558594, 0.022586822509765625, 0.028115272521972656, 0.03364372253417969, 0.03917217254638672, 0.04470062255859375, 0.05022907257080078, 0.05575752258300781, 0.061285972595214844, 0.06681442260742188, 0.0723428726196289, 0.07787132263183594, 0.08339977264404297, 0.08892822265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 16.0, 14.0, 29.0, 28.0, 37.0, 57.0, 71.0, 65.0, 81.0, 86.0, 89.0, 91.0, 78.0, 58.0, 59.0, 53.0, 28.0, 19.0, 14.0, 9.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0562744140625, -0.054900169372558594, -0.05352592468261719, -0.05215167999267578, -0.050777435302734375, -0.04940319061279297, -0.04802894592285156, -0.046654701232910156, -0.04528045654296875, -0.043906211853027344, -0.04253196716308594, -0.04115772247314453, -0.039783477783203125, -0.03840923309326172, -0.03703498840332031, -0.035660743713378906, -0.0342864990234375, -0.032912254333496094, -0.03153800964355469, -0.03016376495361328, -0.028789520263671875, -0.02741527557373047, -0.026041030883789062, -0.024666786193847656, -0.02329254150390625, -0.021918296813964844, -0.020544052124023438, -0.01916980743408203, -0.017795562744140625, -0.01642131805419922, -0.015047073364257812, -0.013672828674316406, -0.012298583984375, -0.010924339294433594, -0.009550094604492188, -0.008175849914550781, -0.006801605224609375, -0.005427360534667969, -0.0040531158447265625, -0.0026788711547851562, -0.00130462646484375, 6.961822509765625e-05, 0.0014438629150390625, 0.0028181076049804688, 0.004192352294921875, 0.005566596984863281, 0.0069408416748046875, 0.008315086364746094, 0.0096893310546875, 0.011063575744628906, 0.012437820434570312, 0.013812065124511719, 0.015186309814453125, 0.01656055450439453, 0.017934799194335938, 0.019309043884277344, 0.02068328857421875, 0.022057533264160156, 0.023431777954101562, 0.02480602264404297, 0.026180267333984375, 0.02755451202392578, 0.028928756713867188, 0.030303001403808594, 0.03167724609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 22.0, 33.0, 74.0, 135.0, 297.0, 654.0, 2058.0, 10577.0, 263250.0, 3871071.0, 38961.0, 4674.0, 1373.0, 576.0, 243.0, 139.0, 49.0, 27.0, 14.0, 17.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.1187744140625, -0.11582374572753906, -0.11287307739257812, -0.10992240905761719, -0.10697174072265625, -0.10402107238769531, -0.10107040405273438, -0.09811973571777344, -0.0951690673828125, -0.09221839904785156, -0.08926773071289062, -0.08631706237792969, -0.08336639404296875, -0.08041572570800781, -0.07746505737304688, -0.07451438903808594, -0.071563720703125, -0.06861305236816406, -0.06566238403320312, -0.06271171569824219, -0.05976104736328125, -0.05681037902832031, -0.053859710693359375, -0.05090904235839844, -0.0479583740234375, -0.04500770568847656, -0.042057037353515625, -0.03910636901855469, -0.03615570068359375, -0.03320503234863281, -0.030254364013671875, -0.027303695678710938, -0.02435302734375, -0.021402359008789062, -0.018451690673828125, -0.015501022338867188, -0.01255035400390625, -0.009599685668945312, -0.006649017333984375, -0.0036983489990234375, -0.0007476806640625, 0.0022029876708984375, 0.005153656005859375, 0.008104324340820312, 0.01105499267578125, 0.014005661010742188, 0.016956329345703125, 0.019906997680664062, 0.022857666015625, 0.025808334350585938, 0.028759002685546875, 0.03170967102050781, 0.03466033935546875, 0.03761100769042969, 0.040561676025390625, 0.04351234436035156, 0.0464630126953125, 0.04941368103027344, 0.052364349365234375, 0.05531501770019531, 0.05826568603515625, 0.06121635437011719, 0.06416702270507812, 0.06711769104003906, 0.070068359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 7.0, 17.0, 18.0, 29.0, 60.0, 97.0, 254.0, 1285.0, 1629.0, 368.0, 143.0, 57.0, 28.0, 23.0, 9.0, 11.0, 9.0, 7.0, 4.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02850341796875, -0.027266979217529297, -0.026030540466308594, -0.02479410171508789, -0.023557662963867188, -0.022321224212646484, -0.02108478546142578, -0.019848346710205078, -0.018611907958984375, -0.017375469207763672, -0.01613903045654297, -0.014902591705322266, -0.013666152954101562, -0.01242971420288086, -0.011193275451660156, -0.009956836700439453, -0.00872039794921875, -0.007483959197998047, -0.006247520446777344, -0.005011081695556641, -0.0037746429443359375, -0.0025382041931152344, -0.0013017654418945312, -6.532669067382812e-05, 0.001171112060546875, 0.002407550811767578, 0.0036439895629882812, 0.004880428314208984, 0.0061168670654296875, 0.007353305816650391, 0.008589744567871094, 0.009826183319091797, 0.0110626220703125, 0.012299060821533203, 0.013535499572753906, 0.01477193832397461, 0.016008377075195312, 0.017244815826416016, 0.01848125457763672, 0.019717693328857422, 0.020954132080078125, 0.022190570831298828, 0.02342700958251953, 0.024663448333740234, 0.025899887084960938, 0.02713632583618164, 0.028372764587402344, 0.029609203338623047, 0.03084564208984375, 0.03208208084106445, 0.033318519592285156, 0.03455495834350586, 0.03579139709472656, 0.037027835845947266, 0.03826427459716797, 0.03950071334838867, 0.040737152099609375, 0.04197359085083008, 0.04321002960205078, 0.044446468353271484, 0.04568290710449219, 0.04691934585571289, 0.048155784606933594, 0.0493922233581543, 0.050628662109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 54.0, 939.0, 19.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11813865602016449, -0.06638765335083008, -0.014636658132076263, 0.03711433708667755, 0.08886533975601196, 0.14061634242534637, 0.1923673301935196, 0.2441183477640152, 0.2958693504333496, 0.3476203382015228, 0.39937135577201843, 0.45112234354019165, 0.5028733611106873, 0.5546243190765381, 0.6063753366470337, 0.6581263542175293, 0.7098773121833801, 0.7616283297538757, 0.8133792877197266, 0.8651303052902222, 0.9168813228607178, 0.9686323404312134, 1.020383358001709, 1.072134256362915, 1.1238852739334106, 1.1756362915039062, 1.2273873090744019, 1.2791383266448975, 1.3308892250061035, 1.3826402425765991, 1.4343912601470947, 1.4861422777175903, 1.5378934144973755, 1.589644432067871, 1.6413954496383667, 1.6931464672088623, 1.7448973655700684, 1.796648383140564, 1.8483994007110596, 1.9001504182815552, 1.9519014358520508, 2.003652334213257, 2.055403470993042, 2.107154369354248, 2.158905506134033, 2.2106564044952393, 2.2624073028564453, 2.3141584396362305, 2.3659093379974365, 2.4176602363586426, 2.4694113731384277, 2.521162271499634, 2.572913408279419, 2.624664306640625, 2.67641544342041, 2.728166341781616, 2.7799174785614014, 2.8316683769226074, 2.8834195137023926, 2.9351704120635986, 2.986921548843384, 3.03867244720459, 3.090423583984375, 3.142174482345581, 3.193925380706787]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 14.0, 17.0, 32.0, 32.0, 49.0, 55.0, 67.0, 65.0, 70.0, 72.0, 69.0, 85.0, 72.0, 56.0, 53.0, 47.0, 37.0, 32.0, 22.0, 9.0, 11.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117603600025177, -0.11225791275501251, -0.10691223293542862, -0.10156655311584473, -0.09622086584568024, -0.09087517857551575, -0.08552949875593185, -0.08018381893634796, -0.07483813166618347, -0.06949244439601898, -0.06414676457643509, -0.0588010810315609, -0.05345539748668671, -0.048109713941812515, -0.042764030396938324, -0.03741834685206413, -0.03207266330718994, -0.02672697976231575, -0.02138129621744156, -0.016035612672567368, -0.010689929127693176, -0.005344245582818985, 1.4379620552062988e-06, 0.005347121506929398, 0.010692805051803589, 0.01603848859667778, 0.02138417214155197, 0.026729855686426163, 0.032075539231300354, 0.037421222776174545, 0.04276690632104874, 0.04811258986592293, 0.05345827341079712, 0.05880395695567131, 0.0641496405005455, 0.0694953203201294, 0.07484100759029388, 0.08018669486045837, 0.08553237468004227, 0.09087805449962616, 0.09622374176979065, 0.10156942903995514, 0.10691510885953903, 0.11226078867912292, 0.11760647594928741, 0.1229521632194519, 0.1282978355884552, 0.1336435228586197, 0.13898921012878418, 0.14433489739894867, 0.14968058466911316, 0.15502625703811646, 0.16037194430828094, 0.16571763157844543, 0.17106330394744873, 0.17640899121761322, 0.1817546784877777, 0.1871003657579422, 0.1924460530281067, 0.19779172539710999, 0.20313741266727448, 0.20848309993743896, 0.21382877230644226, 0.21917445957660675, 0.22452014684677124]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 7.0, 4.0, 8.0, 10.0, 18.0, 28.0, 58.0, 67.0, 130.0, 222.0, 396.0, 858.0, 1724.0, 4247.0, 13033.0, 51899.0, 338563.0, 533829.0, 76416.0, 17364.0, 5409.0, 2221.0, 945.0, 444.0, 242.0, 135.0, 106.0, 58.0, 28.0, 21.0, 21.0, 8.0, 7.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07513427734375, -0.07246208190917969, -0.06978988647460938, -0.06711769104003906, -0.06444549560546875, -0.06177330017089844, -0.059101104736328125, -0.05642890930175781, -0.0537567138671875, -0.05108451843261719, -0.048412322998046875, -0.04574012756347656, -0.04306793212890625, -0.04039573669433594, -0.037723541259765625, -0.03505134582519531, -0.032379150390625, -0.029706954956054688, -0.027034759521484375, -0.024362564086914062, -0.02169036865234375, -0.019018173217773438, -0.016345977783203125, -0.013673782348632812, -0.0110015869140625, -0.008329391479492188, -0.005657196044921875, -0.0029850006103515625, -0.00031280517578125, 0.0023593902587890625, 0.005031585693359375, 0.0077037811279296875, 0.0103759765625, 0.013048171997070312, 0.015720367431640625, 0.018392562866210938, 0.02106475830078125, 0.023736953735351562, 0.026409149169921875, 0.029081344604492188, 0.0317535400390625, 0.03442573547363281, 0.037097930908203125, 0.03977012634277344, 0.04244232177734375, 0.04511451721191406, 0.047786712646484375, 0.05045890808105469, 0.053131103515625, 0.05580329895019531, 0.058475494384765625, 0.06114768981933594, 0.06381988525390625, 0.06649208068847656, 0.06916427612304688, 0.07183647155761719, 0.0745086669921875, 0.07718086242675781, 0.07985305786132812, 0.08252525329589844, 0.08519744873046875, 0.08786964416503906, 0.09054183959960938, 0.09321403503417969, 0.09588623046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 5.0, 12.0, 14.0, 20.0, 18.0, 32.0, 43.0, 57.0, 67.0, 61.0, 80.0, 79.0, 72.0, 88.0, 76.0, 47.0, 50.0, 56.0, 36.0, 34.0, 16.0, 17.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047943115234375, -0.04671764373779297, -0.04549217224121094, -0.044266700744628906, -0.043041229248046875, -0.041815757751464844, -0.04059028625488281, -0.03936481475830078, -0.03813934326171875, -0.03691387176513672, -0.03568840026855469, -0.034462928771972656, -0.033237457275390625, -0.032011985778808594, -0.030786514282226562, -0.02956104278564453, -0.0283355712890625, -0.02711009979248047, -0.025884628295898438, -0.024659156799316406, -0.023433685302734375, -0.022208213806152344, -0.020982742309570312, -0.01975727081298828, -0.01853179931640625, -0.01730632781982422, -0.016080856323242188, -0.014855384826660156, -0.013629913330078125, -0.012404441833496094, -0.011178970336914062, -0.009953498840332031, -0.00872802734375, -0.007502555847167969, -0.0062770843505859375, -0.005051612854003906, -0.003826141357421875, -0.0026006698608398438, -0.0013751983642578125, -0.00014972686767578125, 0.00107574462890625, 0.0023012161254882812, 0.0035266876220703125, 0.004752159118652344, 0.005977630615234375, 0.007203102111816406, 0.008428573608398438, 0.009654045104980469, 0.0108795166015625, 0.012104988098144531, 0.013330459594726562, 0.014555931091308594, 0.015781402587890625, 0.017006874084472656, 0.018232345581054688, 0.01945781707763672, 0.02068328857421875, 0.02190876007080078, 0.023134231567382812, 0.024359703063964844, 0.025585174560546875, 0.026810646057128906, 0.028036117553710938, 0.02926158905029297, 0.030487060546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 7.0, 6.0, 15.0, 17.0, 26.0, 28.0, 41.0, 79.0, 114.0, 199.0, 299.0, 558.0, 1270.0, 2989.0, 9868.0, 46150.0, 425675.0, 491948.0, 52491.0, 10874.0, 3147.0, 1259.0, 590.0, 310.0, 208.0, 96.0, 84.0, 53.0, 47.0, 27.0, 23.0, 11.0, 13.0, 12.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07037353515625, -0.06803035736083984, -0.06568717956542969, -0.06334400177001953, -0.061000823974609375, -0.05865764617919922, -0.05631446838378906, -0.053971290588378906, -0.05162811279296875, -0.049284934997558594, -0.04694175720214844, -0.04459857940673828, -0.042255401611328125, -0.03991222381591797, -0.03756904602050781, -0.035225868225097656, -0.0328826904296875, -0.030539512634277344, -0.028196334838867188, -0.02585315704345703, -0.023509979248046875, -0.02116680145263672, -0.018823623657226562, -0.016480445861816406, -0.01413726806640625, -0.011794090270996094, -0.009450912475585938, -0.007107734680175781, -0.004764556884765625, -0.0024213790893554688, -7.82012939453125e-05, 0.0022649765014648438, 0.004608154296875, 0.006951332092285156, 0.009294509887695312, 0.011637687683105469, 0.013980865478515625, 0.01632404327392578, 0.018667221069335938, 0.021010398864746094, 0.02335357666015625, 0.025696754455566406, 0.028039932250976562, 0.03038311004638672, 0.032726287841796875, 0.03506946563720703, 0.03741264343261719, 0.039755821228027344, 0.0420989990234375, 0.044442176818847656, 0.04678535461425781, 0.04912853240966797, 0.051471710205078125, 0.05381488800048828, 0.05615806579589844, 0.058501243591308594, 0.06084442138671875, 0.0631875991821289, 0.06553077697753906, 0.06787395477294922, 0.07021713256835938, 0.07256031036376953, 0.07490348815917969, 0.07724666595458984, 0.07958984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 19.0, 14.0, 17.0, 19.0, 41.0, 26.0, 46.0, 43.0, 48.0, 50.0, 55.0, 52.0, 48.0, 58.0, 55.0, 58.0, 46.0, 52.0, 37.0, 32.0, 24.0, 28.0, 25.0, 12.0, 17.0, 10.0, 4.0, 10.0, 6.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0989990234375, -0.09577751159667969, -0.09255599975585938, -0.08933448791503906, -0.08611297607421875, -0.08289146423339844, -0.07966995239257812, -0.07644844055175781, -0.0732269287109375, -0.07000541687011719, -0.06678390502929688, -0.06356239318847656, -0.06034088134765625, -0.05711936950683594, -0.053897857666015625, -0.05067634582519531, -0.047454833984375, -0.04423332214355469, -0.041011810302734375, -0.03779029846191406, -0.03456878662109375, -0.03134727478027344, -0.028125762939453125, -0.024904251098632812, -0.0216827392578125, -0.018461227416992188, -0.015239715576171875, -0.012018203735351562, -0.00879669189453125, -0.0055751800537109375, -0.002353668212890625, 0.0008678436279296875, 0.00408935546875, 0.0073108673095703125, 0.010532379150390625, 0.013753890991210938, 0.01697540283203125, 0.020196914672851562, 0.023418426513671875, 0.026639938354492188, 0.0298614501953125, 0.03308296203613281, 0.036304473876953125, 0.03952598571777344, 0.04274749755859375, 0.04596900939941406, 0.049190521240234375, 0.05241203308105469, 0.055633544921875, 0.05885505676269531, 0.062076568603515625, 0.06529808044433594, 0.06851959228515625, 0.07174110412597656, 0.07496261596679688, 0.07818412780761719, 0.0814056396484375, 0.08462715148925781, 0.08784866333007812, 0.09107017517089844, 0.09429168701171875, 0.09751319885253906, 0.10073471069335938, 0.10395622253417969, 0.107177734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 7.0, 4.0, 4.0, 28.0, 30.0, 70.0, 159.0, 420.0, 1558.0, 11066.0, 653371.0, 372220.0, 7694.0, 1260.0, 371.0, 141.0, 66.0, 30.0, 21.0, 11.0, 8.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037841796875, -0.0367584228515625, -0.035675048828125, -0.0345916748046875, -0.03350830078125, -0.0324249267578125, -0.031341552734375, -0.0302581787109375, -0.0291748046875, -0.0280914306640625, -0.027008056640625, -0.0259246826171875, -0.02484130859375, -0.0237579345703125, -0.022674560546875, -0.0215911865234375, -0.0205078125, -0.0194244384765625, -0.018341064453125, -0.0172576904296875, -0.01617431640625, -0.0150909423828125, -0.014007568359375, -0.0129241943359375, -0.0118408203125, -0.0107574462890625, -0.009674072265625, -0.0085906982421875, -0.00750732421875, -0.0064239501953125, -0.005340576171875, -0.0042572021484375, -0.003173828125, -0.0020904541015625, -0.001007080078125, 7.62939453125e-05, 0.00115966796875, 0.0022430419921875, 0.003326416015625, 0.0044097900390625, 0.0054931640625, 0.0065765380859375, 0.007659912109375, 0.0087432861328125, 0.00982666015625, 0.0109100341796875, 0.011993408203125, 0.0130767822265625, 0.01416015625, 0.0152435302734375, 0.016326904296875, 0.0174102783203125, 0.01849365234375, 0.0195770263671875, 0.020660400390625, 0.0217437744140625, 0.0228271484375, 0.0239105224609375, 0.024993896484375, 0.0260772705078125, 0.02716064453125, 0.0282440185546875, 0.029327392578125, 0.0304107666015625, 0.031494140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 22.0, 65.0, 124.0, 124.0, 196.0, 164.0, 138.0, 79.0, 40.0, 25.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4603137969970703e-05, -1.4112330973148346e-05, -1.3621523976325989e-05, -1.3130716979503632e-05, -1.2639909982681274e-05, -1.2149102985858917e-05, -1.165829598903656e-05, -1.1167488992214203e-05, -1.0676681995391846e-05, -1.0185874998569489e-05, -9.695068001747131e-06, -9.204261004924774e-06, -8.713454008102417e-06, -8.22264701128006e-06, -7.731840014457703e-06, -7.2410330176353455e-06, -6.750226020812988e-06, -6.259419023990631e-06, -5.768612027168274e-06, -5.277805030345917e-06, -4.7869980335235596e-06, -4.296191036701202e-06, -3.8053840398788452e-06, -3.314577043056488e-06, -2.823770046234131e-06, -2.3329630494117737e-06, -1.8421560525894165e-06, -1.3513490557670593e-06, -8.605420589447021e-07, -3.6973506212234497e-07, 1.210719347000122e-07, 6.118789315223694e-07, 1.1026859283447266e-06, 1.5934929251670837e-06, 2.084299921989441e-06, 2.575106918811798e-06, 3.0659139156341553e-06, 3.5567209124565125e-06, 4.04752790927887e-06, 4.538334906101227e-06, 5.029141902923584e-06, 5.519948899745941e-06, 6.010755896568298e-06, 6.5015628933906555e-06, 6.992369890213013e-06, 7.48317688703537e-06, 7.973983883857727e-06, 8.464790880680084e-06, 8.955597877502441e-06, 9.446404874324799e-06, 9.937211871147156e-06, 1.0428018867969513e-05, 1.091882586479187e-05, 1.1409632861614227e-05, 1.1900439858436584e-05, 1.2391246855258942e-05, 1.2882053852081299e-05, 1.3372860848903656e-05, 1.3863667845726013e-05, 1.435447484254837e-05, 1.4845281839370728e-05, 1.5336088836193085e-05, 1.5826895833015442e-05, 1.63177028298378e-05, 1.6808509826660156e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 9.0, 7.0, 27.0, 32.0, 44.0, 106.0, 231.0, 642.0, 2568.0, 18177.0, 505618.0, 499186.0, 18171.0, 2608.0, 658.0, 238.0, 107.0, 47.0, 28.0, 11.0, 8.0, 13.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0200958251953125, -0.019222021102905273, -0.018348217010498047, -0.01747441291809082, -0.016600608825683594, -0.015726804733276367, -0.01485300064086914, -0.013979196548461914, -0.013105392456054688, -0.012231588363647461, -0.011357784271240234, -0.010483980178833008, -0.009610176086425781, -0.008736371994018555, -0.007862567901611328, -0.0069887638092041016, -0.006114959716796875, -0.0052411556243896484, -0.004367351531982422, -0.0034935474395751953, -0.0026197433471679688, -0.0017459392547607422, -0.0008721351623535156, 1.6689300537109375e-06, 0.0008754730224609375, 0.001749277114868164, 0.0026230812072753906, 0.003496885299682617, 0.004370689392089844, 0.00524449348449707, 0.006118297576904297, 0.0069921016693115234, 0.00786590576171875, 0.008739709854125977, 0.009613513946533203, 0.01048731803894043, 0.011361122131347656, 0.012234926223754883, 0.01310873031616211, 0.013982534408569336, 0.014856338500976562, 0.01573014259338379, 0.016603946685791016, 0.017477750778198242, 0.01835155487060547, 0.019225358963012695, 0.020099163055419922, 0.02097296714782715, 0.021846771240234375, 0.0227205753326416, 0.023594379425048828, 0.024468183517456055, 0.02534198760986328, 0.026215791702270508, 0.027089595794677734, 0.02796339988708496, 0.028837203979492188, 0.029711008071899414, 0.03058481216430664, 0.03145861625671387, 0.032332420349121094, 0.03320622444152832, 0.03408002853393555, 0.03495383262634277, 0.03582763671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 4.0, 5.0, 9.0, 13.0, 17.0, 12.0, 23.0, 38.0, 39.0, 46.0, 86.0, 90.0, 111.0, 93.0, 87.0, 79.0, 66.0, 40.0, 37.0, 24.0, 12.0, 12.0, 9.0, 14.0, 4.0, 4.0, 5.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016387939453125, -0.015890002250671387, -0.015392065048217773, -0.01489412784576416, -0.014396190643310547, -0.013898253440856934, -0.01340031623840332, -0.012902379035949707, -0.012404441833496094, -0.01190650463104248, -0.011408567428588867, -0.010910630226135254, -0.01041269302368164, -0.009914755821228027, -0.009416818618774414, -0.0089188814163208, -0.008420944213867188, -0.007923007011413574, -0.007425069808959961, -0.006927132606506348, -0.006429195404052734, -0.005931258201599121, -0.005433320999145508, -0.0049353837966918945, -0.004437446594238281, -0.003939509391784668, -0.0034415721893310547, -0.0029436349868774414, -0.002445697784423828, -0.0019477605819702148, -0.0014498233795166016, -0.0009518861770629883, -0.000453948974609375, 4.398822784423828e-05, 0.0005419254302978516, 0.0010398626327514648, 0.0015377998352050781, 0.0020357370376586914, 0.0025336742401123047, 0.003031611442565918, 0.0035295486450195312, 0.0040274858474731445, 0.004525423049926758, 0.005023360252380371, 0.005521297454833984, 0.006019234657287598, 0.006517171859741211, 0.007015109062194824, 0.0075130462646484375, 0.00801098346710205, 0.008508920669555664, 0.009006857872009277, 0.00950479507446289, 0.010002732276916504, 0.010500669479370117, 0.01099860668182373, 0.011496543884277344, 0.011994481086730957, 0.01249241828918457, 0.012990355491638184, 0.013488292694091797, 0.01398622989654541, 0.014484167098999023, 0.014982104301452637, 0.01548004150390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 47.0, 864.0, 99.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435272216796875, -0.3565550744533539, -0.27783793210983276, -0.19912078976631165, -0.12040364742279053, -0.04168650507926941, 0.03703063726425171, 0.11574780941009521, 0.19446492195129395, 0.27318206429481506, 0.3518992066383362, 0.4306163489818573, 0.5093334913253784, 0.5880506038665771, 0.6667677760124207, 0.7454849481582642, 0.8242020606994629, 0.9029191732406616, 0.9816363453865051, 1.0603535175323486, 1.1390706300735474, 1.217787742614746, 1.2965049743652344, 1.375222086906433, 1.4539391994476318, 1.5326563119888306, 1.6113734245300293, 1.6900906562805176, 1.7688077688217163, 1.847524881362915, 1.9262421131134033, 2.0049591064453125, 2.083676338195801, 2.162393569946289, 2.2411105632781982, 2.3198277950286865, 2.3985447883605957, 2.477262020111084, 2.5559792518615723, 2.6346964836120605, 2.7134134769439697, 2.792130708694458, 2.870847702026367, 2.9495649337768555, 3.0282821655273438, 3.106999158859253, 3.185716390609741, 3.2644333839416504, 3.3431506156921387, 3.421867847442627, 3.500584840774536, 3.5793020725250244, 3.6580190658569336, 3.736736297607422, 3.81545352935791, 3.8941707611083984, 3.9728877544403076, 4.051604747772217, 4.130321979522705, 4.209039211273193, 4.287756443023682, 4.36647367477417, 4.4451904296875, 4.523907661437988, 4.602624893188477]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 8.0, 15.0, 19.0, 17.0, 23.0, 31.0, 27.0, 30.0, 29.0, 39.0, 46.0, 44.0, 36.0, 47.0, 51.0, 41.0, 57.0, 56.0, 42.0, 40.0, 31.0, 37.0, 30.0, 28.0, 19.0, 20.0, 27.0, 22.0, 16.0, 12.0, 13.0, 9.0, 5.0, 9.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43043994903564453, -0.4173564612865448, -0.4042729437351227, -0.39118945598602295, -0.37810593843460083, -0.3650224506855011, -0.35193896293640137, -0.33885544538497925, -0.32577192783355713, -0.3126884400844574, -0.2996049225330353, -0.28652143478393555, -0.2734379172325134, -0.2603544294834137, -0.24727092683315277, -0.23418742418289185, -0.22110393643379211, -0.2080204337835312, -0.19493693113327026, -0.18185344338417053, -0.1687699258327484, -0.15568643808364868, -0.14260293543338776, -0.12951943278312683, -0.1164359301328659, -0.10335242748260498, -0.09026892483234406, -0.07718542963266373, -0.0641019269824028, -0.051018424332141876, -0.03793492913246155, -0.024851426482200623, -0.011767923831939697, 0.0013155769556760788, 0.014399077743291855, 0.02748257666826248, 0.04056607931852341, 0.05364958196878433, 0.06673307716846466, 0.07981657981872559, 0.09290008246898651, 0.10598358511924744, 0.11906708776950836, 0.1321505904197693, 0.14523407816886902, 0.15831759572029114, 0.17140108346939087, 0.1844845861196518, 0.19756808876991272, 0.21065159142017365, 0.22373509407043457, 0.2368185818195343, 0.24990209937095642, 0.26298558712005615, 0.27606910467147827, 0.289152592420578, 0.30223608016967773, 0.31531956791877747, 0.3284030854701996, 0.3414865732192993, 0.35457009077072144, 0.36765357851982117, 0.3807370662689209, 0.393820583820343, 0.40690410137176514]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 5.0, 5.0, 7.0, 24.0, 25.0, 18.0, 33.0, 58.0, 85.0, 166.0, 249.0, 563.0, 909.0, 1936.0, 4843.0, 16961.0, 163086.0, 3896567.0, 88434.0, 12739.0, 3917.0, 1629.0, 872.0, 431.0, 271.0, 155.0, 101.0, 54.0, 37.0, 23.0, 19.0, 11.0, 11.0, 11.0, 5.0, 5.0, 5.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07830810546875, -0.07621431350708008, -0.07412052154541016, -0.07202672958374023, -0.06993293762207031, -0.06783914566040039, -0.06574535369873047, -0.06365156173706055, -0.061557769775390625, -0.0594639778137207, -0.05737018585205078, -0.05527639389038086, -0.05318260192871094, -0.051088809967041016, -0.048995018005371094, -0.04690122604370117, -0.04480743408203125, -0.04271364212036133, -0.040619850158691406, -0.038526058197021484, -0.03643226623535156, -0.03433847427368164, -0.03224468231201172, -0.030150890350341797, -0.028057098388671875, -0.025963306427001953, -0.02386951446533203, -0.02177572250366211, -0.019681930541992188, -0.017588138580322266, -0.015494346618652344, -0.013400554656982422, -0.0113067626953125, -0.009212970733642578, -0.007119178771972656, -0.005025386810302734, -0.0029315948486328125, -0.0008378028869628906, 0.0012559890747070312, 0.003349781036376953, 0.005443572998046875, 0.007537364959716797, 0.009631156921386719, 0.01172494888305664, 0.013818740844726562, 0.015912532806396484, 0.018006324768066406, 0.020100116729736328, 0.02219390869140625, 0.024287700653076172, 0.026381492614746094, 0.028475284576416016, 0.030569076538085938, 0.03266286849975586, 0.03475666046142578, 0.0368504524230957, 0.038944244384765625, 0.04103803634643555, 0.04313182830810547, 0.04522562026977539, 0.04731941223144531, 0.049413204193115234, 0.051506996154785156, 0.05360078811645508, 0.055694580078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 8.0, 18.0, 26.0, 33.0, 52.0, 46.0, 70.0, 71.0, 80.0, 89.0, 100.0, 82.0, 70.0, 59.0, 55.0, 42.0, 36.0, 21.0, 9.0, 13.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.05511474609375, -0.05376744270324707, -0.05242013931274414, -0.05107283592224121, -0.04972553253173828, -0.04837822914123535, -0.04703092575073242, -0.04568362236022949, -0.04433631896972656, -0.04298901557922363, -0.0416417121887207, -0.04029440879821777, -0.038947105407714844, -0.037599802017211914, -0.036252498626708984, -0.034905195236206055, -0.033557891845703125, -0.032210588455200195, -0.030863285064697266, -0.029515981674194336, -0.028168678283691406, -0.026821374893188477, -0.025474071502685547, -0.024126768112182617, -0.022779464721679688, -0.021432161331176758, -0.020084857940673828, -0.0187375545501709, -0.01739025115966797, -0.01604294776916504, -0.01469564437866211, -0.01334834098815918, -0.01200103759765625, -0.01065373420715332, -0.00930643081665039, -0.007959127426147461, -0.006611824035644531, -0.0052645206451416016, -0.003917217254638672, -0.002569913864135742, -0.0012226104736328125, 0.0001246929168701172, 0.0014719963073730469, 0.0028192996978759766, 0.004166603088378906, 0.005513906478881836, 0.006861209869384766, 0.008208513259887695, 0.009555816650390625, 0.010903120040893555, 0.012250423431396484, 0.013597726821899414, 0.014945030212402344, 0.016292333602905273, 0.017639636993408203, 0.018986940383911133, 0.020334243774414062, 0.021681547164916992, 0.023028850555419922, 0.02437615394592285, 0.02572345733642578, 0.02707076072692871, 0.02841806411743164, 0.02976536750793457, 0.0311126708984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 8.0, 9.0, 20.0, 30.0, 56.0, 61.0, 95.0, 112.0, 271.0, 650.0, 4811.0, 4145576.0, 40110.0, 1454.0, 458.0, 235.0, 110.0, 69.0, 47.0, 29.0, 23.0, 15.0, 7.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.299530029296875, -0.29217529296875, -0.284820556640625, -0.2774658203125, -0.270111083984375, -0.26275634765625, -0.255401611328125, -0.248046875, -0.240692138671875, -0.23333740234375, -0.225982666015625, -0.2186279296875, -0.211273193359375, -0.20391845703125, -0.196563720703125, -0.189208984375, -0.181854248046875, -0.17449951171875, -0.167144775390625, -0.1597900390625, -0.152435302734375, -0.14508056640625, -0.137725830078125, -0.13037109375, -0.123016357421875, -0.11566162109375, -0.108306884765625, -0.1009521484375, -0.093597412109375, -0.08624267578125, -0.078887939453125, -0.071533203125, -0.064178466796875, -0.05682373046875, -0.049468994140625, -0.0421142578125, -0.034759521484375, -0.02740478515625, -0.020050048828125, -0.0126953125, -0.005340576171875, 0.00201416015625, 0.009368896484375, 0.0167236328125, 0.024078369140625, 0.03143310546875, 0.038787841796875, 0.046142578125, 0.053497314453125, 0.06085205078125, 0.068206787109375, 0.0755615234375, 0.082916259765625, 0.09027099609375, 0.097625732421875, 0.10498046875, 0.112335205078125, 0.11968994140625, 0.127044677734375, 0.1343994140625, 0.141754150390625, 0.14910888671875, 0.156463623046875, 0.163818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 16.0, 67.0, 872.0, 2920.0, 137.0, 31.0, 14.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.089111328125, -0.08642292022705078, -0.08373451232910156, -0.08104610443115234, -0.07835769653320312, -0.0756692886352539, -0.07298088073730469, -0.07029247283935547, -0.06760406494140625, -0.06491565704345703, -0.06222724914550781, -0.059538841247558594, -0.056850433349609375, -0.054162025451660156, -0.05147361755371094, -0.04878520965576172, -0.0460968017578125, -0.04340839385986328, -0.04071998596191406, -0.038031578063964844, -0.035343170166015625, -0.032654762268066406, -0.029966354370117188, -0.02727794647216797, -0.02458953857421875, -0.02190113067626953, -0.019212722778320312, -0.016524314880371094, -0.013835906982421875, -0.011147499084472656, -0.008459091186523438, -0.005770683288574219, -0.003082275390625, -0.00039386749267578125, 0.0022945404052734375, 0.004982948303222656, 0.007671356201171875, 0.010359764099121094, 0.013048171997070312, 0.01573657989501953, 0.01842498779296875, 0.02111339569091797, 0.023801803588867188, 0.026490211486816406, 0.029178619384765625, 0.031867027282714844, 0.03455543518066406, 0.03724384307861328, 0.0399322509765625, 0.04262065887451172, 0.04530906677246094, 0.047997474670410156, 0.050685882568359375, 0.053374290466308594, 0.05606269836425781, 0.05875110626220703, 0.06143951416015625, 0.06412792205810547, 0.06681632995605469, 0.0695047378540039, 0.07219314575195312, 0.07488155364990234, 0.07756996154785156, 0.08025836944580078, 0.08294677734375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 15.0, 246.0, 647.0, 78.0, 12.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21105194091796875, -0.1904512494802475, -0.16985055804252625, -0.149249866604805, -0.12864917516708374, -0.10804848372936249, -0.08744779229164124, -0.06684710085391998, -0.04624640941619873, -0.025645717978477478, -0.005045026540756226, 0.015555664896965027, 0.03615635633468628, 0.05675704777240753, 0.07735773921012878, 0.09795843064785004, 0.11855912208557129, 0.13915981352329254, 0.1597605049610138, 0.18036119639873505, 0.2009618878364563, 0.22156257927417755, 0.2421632707118988, 0.26276397705078125, 0.2833646535873413, 0.30396533012390137, 0.3245660364627838, 0.34516674280166626, 0.3657674193382263, 0.3863680958747864, 0.4069688022136688, 0.42756950855255127, 0.44817018508911133, 0.4687708616256714, 0.48937156796455383, 0.5099722743034363, 0.5305729508399963, 0.5511736273765564, 0.5717743635177612, 0.5923750400543213, 0.6129757165908813, 0.6335763931274414, 0.6541770696640015, 0.6747778058052063, 0.6953784823417664, 0.7159791588783264, 0.7365798950195312, 0.7571805715560913, 0.7777812480926514, 0.7983819246292114, 0.8189826011657715, 0.8395833373069763, 0.8601840138435364, 0.8807846903800964, 0.9013854265213013, 0.9219861030578613, 0.9425867795944214, 0.9631874561309814, 0.9837881326675415, 1.0043888092041016, 1.0249896049499512, 1.0455902814865112, 1.0661909580230713, 1.0867916345596313, 1.1073923110961914]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 20.0, 23.0, 30.0, 63.0, 111.0, 115.0, 140.0, 142.0, 105.0, 91.0, 56.0, 36.0, 27.0, 17.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20321905612945557, -0.19570286571979523, -0.1881866753101349, -0.18067048490047455, -0.1731542944908142, -0.16563811898231506, -0.15812192857265472, -0.15060573816299438, -0.14308954775333405, -0.1355733573436737, -0.12805716693401337, -0.12054098397493362, -0.11302479356527328, -0.10550860315561295, -0.0979924201965332, -0.09047622978687286, -0.08296003937721252, -0.07544384896755219, -0.06792765855789185, -0.0604114755988121, -0.052895285189151764, -0.045379094779491425, -0.037862908095121384, -0.030346721410751343, -0.022830531001091003, -0.015314342454075813, -0.007798153907060623, -0.00028196536004543304, 0.007234223186969757, 0.014750413596630096, 0.022266600281000137, 0.029782786965370178, 0.03729897737503052, 0.04481516778469086, 0.0523313544690609, 0.05984754115343094, 0.06736373156309128, 0.07487992197275162, 0.08239610493183136, 0.0899122953414917, 0.09742848575115204, 0.10494467616081238, 0.11246086657047272, 0.11997704952955246, 0.1274932324886322, 0.13500943779945374, 0.14252561330795288, 0.15004180371761322, 0.15755799412727356, 0.1650741845369339, 0.17259037494659424, 0.18010656535625458, 0.18762275576591492, 0.19513893127441406, 0.2026551216840744, 0.21017131209373474, 0.21768750250339508, 0.22520369291305542, 0.23271988332271576, 0.2402360737323761, 0.24775224924087524, 0.2552684545516968, 0.2627846300601959, 0.27030080556869507, 0.2778170108795166]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 8.0, 9.0, 26.0, 41.0, 57.0, 88.0, 167.0, 370.0, 727.0, 1989.0, 6588.0, 31305.0, 244588.0, 655354.0, 86992.0, 14412.0, 3596.0, 1151.0, 512.0, 245.0, 123.0, 69.0, 41.0, 22.0, 20.0, 21.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08709716796875, -0.08431148529052734, -0.08152580261230469, -0.07874011993408203, -0.07595443725585938, -0.07316875457763672, -0.07038307189941406, -0.0675973892211914, -0.06481170654296875, -0.062026023864746094, -0.05924034118652344, -0.05645465850830078, -0.053668975830078125, -0.05088329315185547, -0.04809761047363281, -0.045311927795410156, -0.0425262451171875, -0.039740562438964844, -0.03695487976074219, -0.03416919708251953, -0.031383514404296875, -0.02859783172607422, -0.025812149047851562, -0.023026466369628906, -0.02024078369140625, -0.017455101013183594, -0.014669418334960938, -0.011883735656738281, -0.009098052978515625, -0.006312370300292969, -0.0035266876220703125, -0.0007410049438476562, 0.002044677734375, 0.004830360412597656, 0.0076160430908203125, 0.010401725769042969, 0.013187408447265625, 0.01597309112548828, 0.018758773803710938, 0.021544456481933594, 0.02433013916015625, 0.027115821838378906, 0.029901504516601562, 0.03268718719482422, 0.035472869873046875, 0.03825855255126953, 0.04104423522949219, 0.043829917907714844, 0.0466156005859375, 0.049401283264160156, 0.05218696594238281, 0.05497264862060547, 0.057758331298828125, 0.06054401397705078, 0.06332969665527344, 0.0661153793334961, 0.06890106201171875, 0.0716867446899414, 0.07447242736816406, 0.07725811004638672, 0.08004379272460938, 0.08282947540283203, 0.08561515808105469, 0.08840084075927734, 0.0911865234375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 10.0, 9.0, 15.0, 23.0, 33.0, 51.0, 55.0, 47.0, 73.0, 60.0, 71.0, 97.0, 68.0, 77.0, 67.0, 60.0, 42.0, 42.0, 29.0, 23.0, 15.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.045806884765625, -0.04461550712585449, -0.043424129486083984, -0.04223275184631348, -0.04104137420654297, -0.03984999656677246, -0.03865861892700195, -0.037467241287231445, -0.03627586364746094, -0.03508448600769043, -0.03389310836791992, -0.032701730728149414, -0.031510353088378906, -0.0303189754486084, -0.02912759780883789, -0.027936220169067383, -0.026744842529296875, -0.025553464889526367, -0.02436208724975586, -0.02317070960998535, -0.021979331970214844, -0.020787954330444336, -0.019596576690673828, -0.01840519905090332, -0.017213821411132812, -0.016022443771362305, -0.014831066131591797, -0.013639688491821289, -0.012448310852050781, -0.011256933212280273, -0.010065555572509766, -0.008874177932739258, -0.00768280029296875, -0.006491422653198242, -0.005300045013427734, -0.0041086673736572266, -0.0029172897338867188, -0.001725912094116211, -0.0005345344543457031, 0.0006568431854248047, 0.0018482208251953125, 0.0030395984649658203, 0.004230976104736328, 0.005422353744506836, 0.006613731384277344, 0.0078051090240478516, 0.00899648666381836, 0.010187864303588867, 0.011379241943359375, 0.012570619583129883, 0.01376199722290039, 0.014953374862670898, 0.016144752502441406, 0.017336130142211914, 0.018527507781982422, 0.01971888542175293, 0.020910263061523438, 0.022101640701293945, 0.023293018341064453, 0.02448439598083496, 0.02567577362060547, 0.026867151260375977, 0.028058528900146484, 0.029249906539916992, 0.0304412841796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 12.0, 7.0, 10.0, 12.0, 17.0, 25.0, 22.0, 22.0, 48.0, 69.0, 91.0, 117.0, 241.0, 424.0, 806.0, 1801.0, 4672.0, 13903.0, 50042.0, 257662.0, 560420.0, 116458.0, 27395.0, 8436.0, 3006.0, 1243.0, 624.0, 321.0, 204.0, 118.0, 70.0, 59.0, 53.0, 31.0, 28.0, 14.0, 19.0, 8.0, 9.0, 3.0, 8.0, 5.0, 6.0, 3.0, 7.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.052154541015625, -0.05048704147338867, -0.048819541931152344, -0.047152042388916016, -0.04548454284667969, -0.04381704330444336, -0.04214954376220703, -0.0404820442199707, -0.038814544677734375, -0.03714704513549805, -0.03547954559326172, -0.03381204605102539, -0.03214454650878906, -0.030477046966552734, -0.028809547424316406, -0.027142047882080078, -0.02547454833984375, -0.023807048797607422, -0.022139549255371094, -0.020472049713134766, -0.018804550170898438, -0.01713705062866211, -0.015469551086425781, -0.013802051544189453, -0.012134552001953125, -0.010467052459716797, -0.008799552917480469, -0.007132053375244141, -0.0054645538330078125, -0.0037970542907714844, -0.0021295547485351562, -0.0004620552062988281, 0.0012054443359375, 0.002872943878173828, 0.004540443420410156, 0.006207942962646484, 0.007875442504882812, 0.00954294204711914, 0.011210441589355469, 0.012877941131591797, 0.014545440673828125, 0.016212940216064453, 0.01788043975830078, 0.01954793930053711, 0.021215438842773438, 0.022882938385009766, 0.024550437927246094, 0.026217937469482422, 0.02788543701171875, 0.029552936553955078, 0.031220436096191406, 0.032887935638427734, 0.03455543518066406, 0.03622293472290039, 0.03789043426513672, 0.03955793380737305, 0.041225433349609375, 0.0428929328918457, 0.04456043243408203, 0.04622793197631836, 0.04789543151855469, 0.049562931060791016, 0.051230430603027344, 0.05289793014526367, 0.0545654296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 12.0, 6.0, 5.0, 14.0, 12.0, 7.0, 19.0, 12.0, 23.0, 22.0, 31.0, 27.0, 26.0, 30.0, 32.0, 46.0, 42.0, 40.0, 36.0, 47.0, 49.0, 59.0, 45.0, 46.0, 40.0, 34.0, 34.0, 29.0, 24.0, 32.0, 23.0, 10.0, 7.0, 18.0, 15.0, 10.0, 6.0, 6.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.08489990234375, -0.08241462707519531, -0.07992935180664062, -0.07744407653808594, -0.07495880126953125, -0.07247352600097656, -0.06998825073242188, -0.06750297546386719, -0.0650177001953125, -0.06253242492675781, -0.060047149658203125, -0.05756187438964844, -0.05507659912109375, -0.05259132385253906, -0.050106048583984375, -0.04762077331542969, -0.045135498046875, -0.04265022277832031, -0.040164947509765625, -0.03767967224121094, -0.03519439697265625, -0.03270912170410156, -0.030223846435546875, -0.027738571166992188, -0.0252532958984375, -0.022768020629882812, -0.020282745361328125, -0.017797470092773438, -0.01531219482421875, -0.012826919555664062, -0.010341644287109375, -0.007856369018554688, -0.00537109375, -0.0028858184814453125, -0.000400543212890625, 0.0020847320556640625, 0.00457000732421875, 0.0070552825927734375, 0.009540557861328125, 0.012025833129882812, 0.0145111083984375, 0.016996383666992188, 0.019481658935546875, 0.021966934204101562, 0.02445220947265625, 0.026937484741210938, 0.029422760009765625, 0.03190803527832031, 0.034393310546875, 0.03687858581542969, 0.039363861083984375, 0.04184913635253906, 0.04433441162109375, 0.04681968688964844, 0.049304962158203125, 0.05179023742675781, 0.0542755126953125, 0.05676078796386719, 0.059246063232421875, 0.06173133850097656, 0.06421661376953125, 0.06670188903808594, 0.06918716430664062, 0.07167243957519531, 0.07415771484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 10.0, 16.0, 22.0, 53.0, 121.0, 253.0, 664.0, 2500.0, 19096.0, 661956.0, 350850.0, 10200.0, 1794.0, 571.0, 206.0, 96.0, 51.0, 21.0, 19.0, 12.0, 6.0, 5.0, 4.0, 3.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028594970703125, -0.0277254581451416, -0.026855945587158203, -0.025986433029174805, -0.025116920471191406, -0.024247407913208008, -0.02337789535522461, -0.02250838279724121, -0.021638870239257812, -0.020769357681274414, -0.019899845123291016, -0.019030332565307617, -0.01816082000732422, -0.01729130744934082, -0.016421794891357422, -0.015552282333374023, -0.014682769775390625, -0.013813257217407227, -0.012943744659423828, -0.01207423210144043, -0.011204719543457031, -0.010335206985473633, -0.009465694427490234, -0.008596181869506836, -0.0077266693115234375, -0.006857156753540039, -0.005987644195556641, -0.005118131637573242, -0.004248619079589844, -0.0033791065216064453, -0.002509593963623047, -0.0016400814056396484, -0.00077056884765625, 9.894371032714844e-05, 0.0009684562683105469, 0.0018379688262939453, 0.0027074813842773438, 0.003576993942260742, 0.004446506500244141, 0.005316019058227539, 0.0061855316162109375, 0.007055044174194336, 0.007924556732177734, 0.008794069290161133, 0.009663581848144531, 0.01053309440612793, 0.011402606964111328, 0.012272119522094727, 0.013141632080078125, 0.014011144638061523, 0.014880657196044922, 0.01575016975402832, 0.01661968231201172, 0.017489194869995117, 0.018358707427978516, 0.019228219985961914, 0.020097732543945312, 0.02096724510192871, 0.02183675765991211, 0.022706270217895508, 0.023575782775878906, 0.024445295333862305, 0.025314807891845703, 0.0261843204498291, 0.0270538330078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 3.0, 13.0, 19.0, 22.0, 25.0, 30.0, 49.0, 47.0, 68.0, 63.0, 86.0, 71.0, 75.0, 91.0, 46.0, 74.0, 49.0, 52.0, 28.0, 23.0, 16.0, 10.0, 19.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.113201379776001e-06, -5.908310413360596e-06, -5.7034194469451904e-06, -5.498528480529785e-06, -5.29363751411438e-06, -5.088746547698975e-06, -4.883855581283569e-06, -4.678964614868164e-06, -4.474073648452759e-06, -4.2691826820373535e-06, -4.064291715621948e-06, -3.859400749206543e-06, -3.6545097827911377e-06, -3.4496188163757324e-06, -3.244727849960327e-06, -3.039836883544922e-06, -2.8349459171295166e-06, -2.6300549507141113e-06, -2.425163984298706e-06, -2.2202730178833008e-06, -2.0153820514678955e-06, -1.8104910850524902e-06, -1.605600118637085e-06, -1.4007091522216797e-06, -1.1958181858062744e-06, -9.909272193908691e-07, -7.860362529754639e-07, -5.811452865600586e-07, -3.762543201446533e-07, -1.7136335372924805e-07, 3.3527612686157227e-08, 2.384185791015625e-07, 4.4330954551696777e-07, 6.48200511932373e-07, 8.530914783477783e-07, 1.0579824447631836e-06, 1.2628734111785889e-06, 1.4677643775939941e-06, 1.6726553440093994e-06, 1.8775463104248047e-06, 2.08243727684021e-06, 2.2873282432556152e-06, 2.4922192096710205e-06, 2.6971101760864258e-06, 2.902001142501831e-06, 3.1068921089172363e-06, 3.3117830753326416e-06, 3.516674041748047e-06, 3.721565008163452e-06, 3.926455974578857e-06, 4.131346940994263e-06, 4.336237907409668e-06, 4.541128873825073e-06, 4.7460198402404785e-06, 4.950910806655884e-06, 5.155801773071289e-06, 5.360692739486694e-06, 5.5655837059021e-06, 5.770474672317505e-06, 5.97536563873291e-06, 6.1802566051483154e-06, 6.385147571563721e-06, 6.590038537979126e-06, 6.794929504394531e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 9.0, 7.0, 13.0, 23.0, 48.0, 93.0, 225.0, 540.0, 1829.0, 9916.0, 338633.0, 674026.0, 19433.0, 2502.0, 746.0, 257.0, 116.0, 62.0, 28.0, 14.0, 13.0, 4.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025970458984375, -0.02510833740234375, -0.0242462158203125, -0.02338409423828125, -0.02252197265625, -0.02165985107421875, -0.0207977294921875, -0.01993560791015625, -0.019073486328125, -0.01821136474609375, -0.0173492431640625, -0.01648712158203125, -0.015625, -0.01476287841796875, -0.0139007568359375, -0.01303863525390625, -0.012176513671875, -0.01131439208984375, -0.0104522705078125, -0.00959014892578125, -0.00872802734375, -0.00786590576171875, -0.0070037841796875, -0.00614166259765625, -0.005279541015625, -0.00441741943359375, -0.0035552978515625, -0.00269317626953125, -0.0018310546875, -0.00096893310546875, -0.0001068115234375, 0.00075531005859375, 0.001617431640625, 0.00247955322265625, 0.0033416748046875, 0.00420379638671875, 0.00506591796875, 0.00592803955078125, 0.0067901611328125, 0.00765228271484375, 0.008514404296875, 0.00937652587890625, 0.0102386474609375, 0.01110076904296875, 0.011962890625, 0.01282501220703125, 0.0136871337890625, 0.01454925537109375, 0.015411376953125, 0.01627349853515625, 0.0171356201171875, 0.01799774169921875, 0.01885986328125, 0.01972198486328125, 0.0205841064453125, 0.02144622802734375, 0.022308349609375, 0.02317047119140625, 0.0240325927734375, 0.02489471435546875, 0.0257568359375, 0.02661895751953125, 0.0274810791015625, 0.02834320068359375, 0.029205322265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 9.0, 15.0, 25.0, 54.0, 68.0, 114.0, 134.0, 149.0, 116.0, 97.0, 82.0, 53.0, 33.0, 15.0, 15.0, 9.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024017333984375, -0.02323007583618164, -0.02244281768798828, -0.021655559539794922, -0.020868301391601562, -0.020081043243408203, -0.019293785095214844, -0.018506526947021484, -0.017719268798828125, -0.016932010650634766, -0.016144752502441406, -0.015357494354248047, -0.014570236206054688, -0.013782978057861328, -0.012995719909667969, -0.01220846176147461, -0.01142120361328125, -0.01063394546508789, -0.009846687316894531, -0.009059429168701172, -0.008272171020507812, -0.007484912872314453, -0.006697654724121094, -0.005910396575927734, -0.005123138427734375, -0.004335880279541016, -0.0035486221313476562, -0.002761363983154297, -0.0019741058349609375, -0.0011868476867675781, -0.00039958953857421875, 0.0003876686096191406, 0.0011749267578125, 0.0019621849060058594, 0.0027494430541992188, 0.003536701202392578, 0.0043239593505859375, 0.005111217498779297, 0.005898475646972656, 0.006685733795166016, 0.007472991943359375, 0.008260250091552734, 0.009047508239746094, 0.009834766387939453, 0.010622024536132812, 0.011409282684326172, 0.012196540832519531, 0.01298379898071289, 0.01377105712890625, 0.01455831527709961, 0.015345573425292969, 0.016132831573486328, 0.016920089721679688, 0.017707347869873047, 0.018494606018066406, 0.019281864166259766, 0.020069122314453125, 0.020856380462646484, 0.021643638610839844, 0.022430896759033203, 0.023218154907226562, 0.024005413055419922, 0.02479267120361328, 0.02557992935180664, 0.0263671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 23.0, 255.0, 660.0, 58.0, 14.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9308487176895142, -0.8735385537147522, -0.8162283301353455, -0.7589181661605835, -0.7016079425811768, -0.6442977786064148, -0.5869876146316528, -0.5296773910522461, -0.47236722707748413, -0.4150570333003998, -0.35774683952331543, -0.30043667554855347, -0.24312648177146912, -0.18581628799438477, -0.1285061240196228, -0.07119593024253845, -0.013885736465454102, 0.04342444986104965, 0.1007346361875534, 0.15804481506347656, 0.2153550088405609, 0.27266520261764526, 0.3299753665924072, 0.3872855603694916, 0.4445957541465759, 0.5019059181213379, 0.5592161417007446, 0.6165263056755066, 0.6738364696502686, 0.7311466932296753, 0.7884568572044373, 0.8457670211791992, 0.9030773639678955, 0.9603875279426575, 1.0176976919174194, 1.0750079154968262, 1.132318139076233, 1.1896283626556396, 1.2469384670257568, 1.3042486906051636, 1.3615589141845703, 1.418869137763977, 1.4761792421340942, 1.533489465713501, 1.5907996892929077, 1.6481099128723145, 1.7054200172424316, 1.7627302408218384, 1.8200403451919556, 1.8773505687713623, 1.9346606731414795, 1.9919708967208862, 2.049281120300293, 2.10659122467041, 2.1639013290405273, 2.2212116718292236, 2.278521776199341, 2.335831880569458, 2.3931422233581543, 2.4504523277282715, 2.5077624320983887, 2.565072774887085, 2.622382879257202, 2.6796929836273193, 2.7370033264160156]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 8.0, 8.0, 13.0, 9.0, 12.0, 13.0, 11.0, 25.0, 17.0, 19.0, 16.0, 27.0, 27.0, 39.0, 26.0, 36.0, 44.0, 47.0, 39.0, 35.0, 32.0, 43.0, 43.0, 36.0, 35.0, 28.0, 35.0, 32.0, 20.0, 26.0, 14.0, 16.0, 16.0, 21.0, 12.0, 14.0, 19.0, 12.0, 14.0, 5.0, 6.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.31014156341552734, -0.2998157739639282, -0.2894899547100067, -0.2791641652584076, -0.2688383460044861, -0.25851255655288696, -0.24818675220012665, -0.23786094784736633, -0.2275351583957672, -0.2172093540430069, -0.20688354969024658, -0.19655776023864746, -0.18623195588588715, -0.17590615153312683, -0.16558034718036652, -0.1552545428276062, -0.1449287384748459, -0.13460293412208557, -0.12427713721990585, -0.11395133286714554, -0.10362553596496582, -0.0932997316122055, -0.08297392725944519, -0.07264813035726547, -0.06232232600450516, -0.05199652537703514, -0.041670724749565125, -0.03134492039680481, -0.021019119769334793, -0.010693319141864777, -0.00036751478910446167, 0.009958282113075256, 0.02028408646583557, 0.030609887093305588, 0.040935687720775604, 0.05126149207353592, 0.061587292701005936, 0.07191309332847595, 0.08223889768123627, 0.09256469458341599, 0.1028904989361763, 0.11321630328893661, 0.12354210019111633, 0.13386790454387665, 0.14419370889663696, 0.15451949834823608, 0.1648453176021576, 0.1751711070537567, 0.18549691140651703, 0.19582271575927734, 0.20614852011203766, 0.21647432446479797, 0.2268001139163971, 0.2371259182691574, 0.24745172262191772, 0.25777751207351685, 0.26810333132743835, 0.2784291207790375, 0.288754940032959, 0.2990807294845581, 0.3094065487384796, 0.31973233819007874, 0.33005815744400024, 0.34038394689559937, 0.3507097363471985]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 1.0, 6.0, 4.0, 8.0, 4.0, 7.0, 15.0, 26.0, 18.0, 47.0, 67.0, 104.0, 157.0, 223.0, 431.0, 849.0, 1490.0, 3439.0, 8481.0, 28225.0, 303206.0, 3768252.0, 56372.0, 13392.0, 4625.0, 2202.0, 1021.0, 576.0, 309.0, 231.0, 151.0, 81.0, 67.0, 39.0, 42.0, 28.0, 20.0, 15.0, 14.0, 3.0, 10.0, 7.0, 2.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05792236328125, -0.05579376220703125, -0.0536651611328125, -0.05153656005859375, -0.049407958984375, -0.04727935791015625, -0.0451507568359375, -0.04302215576171875, -0.0408935546875, -0.03876495361328125, -0.0366363525390625, -0.03450775146484375, -0.032379150390625, -0.03025054931640625, -0.0281219482421875, -0.02599334716796875, -0.02386474609375, -0.02173614501953125, -0.0196075439453125, -0.01747894287109375, -0.015350341796875, -0.01322174072265625, -0.0110931396484375, -0.00896453857421875, -0.0068359375, -0.00470733642578125, -0.0025787353515625, -0.00045013427734375, 0.001678466796875, 0.00380706787109375, 0.0059356689453125, 0.00806427001953125, 0.01019287109375, 0.01232147216796875, 0.0144500732421875, 0.01657867431640625, 0.018707275390625, 0.02083587646484375, 0.0229644775390625, 0.02509307861328125, 0.0272216796875, 0.02935028076171875, 0.0314788818359375, 0.03360748291015625, 0.035736083984375, 0.03786468505859375, 0.0399932861328125, 0.04212188720703125, 0.04425048828125, 0.04637908935546875, 0.0485076904296875, 0.05063629150390625, 0.052764892578125, 0.05489349365234375, 0.0570220947265625, 0.05915069580078125, 0.061279296875, 0.06340789794921875, 0.0655364990234375, 0.06766510009765625, 0.069793701171875, 0.07192230224609375, 0.0740509033203125, 0.07617950439453125, 0.07830810546875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 12.0, 15.0, 20.0, 24.0, 48.0, 45.0, 41.0, 56.0, 74.0, 69.0, 100.0, 69.0, 59.0, 65.0, 54.0, 59.0, 39.0, 40.0, 24.0, 23.0, 15.0, 11.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.041351318359375, -0.040238142013549805, -0.03912496566772461, -0.038011789321899414, -0.03689861297607422, -0.03578543663024902, -0.03467226028442383, -0.03355908393859863, -0.03244590759277344, -0.03133273124694824, -0.030219554901123047, -0.02910637855529785, -0.027993202209472656, -0.02688002586364746, -0.025766849517822266, -0.02465367317199707, -0.023540496826171875, -0.02242732048034668, -0.021314144134521484, -0.02020096778869629, -0.019087791442871094, -0.0179746150970459, -0.016861438751220703, -0.015748262405395508, -0.014635086059570312, -0.013521909713745117, -0.012408733367919922, -0.011295557022094727, -0.010182380676269531, -0.009069204330444336, -0.00795602798461914, -0.006842851638793945, -0.00572967529296875, -0.004616498947143555, -0.0035033226013183594, -0.002390146255493164, -0.0012769699096679688, -0.00016379356384277344, 0.0009493827819824219, 0.002062559127807617, 0.0031757354736328125, 0.004288911819458008, 0.005402088165283203, 0.0065152645111083984, 0.007628440856933594, 0.008741617202758789, 0.009854793548583984, 0.01096796989440918, 0.012081146240234375, 0.01319432258605957, 0.014307498931884766, 0.015420675277709961, 0.016533851623535156, 0.01764702796936035, 0.018760204315185547, 0.019873380661010742, 0.020986557006835938, 0.022099733352661133, 0.023212909698486328, 0.024326086044311523, 0.02543926239013672, 0.026552438735961914, 0.02766561508178711, 0.028778791427612305, 0.0298919677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 6.0, 12.0, 10.0, 31.0, 34.0, 53.0, 74.0, 108.0, 206.0, 353.0, 643.0, 1640.0, 5776.0, 44237.0, 3990543.0, 136034.0, 9965.0, 2403.0, 940.0, 488.0, 269.0, 164.0, 108.0, 59.0, 39.0, 27.0, 19.0, 16.0, 13.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0694580078125, -0.06652259826660156, -0.06358718872070312, -0.06065177917480469, -0.05771636962890625, -0.05478096008300781, -0.051845550537109375, -0.04891014099121094, -0.0459747314453125, -0.04303932189941406, -0.040103912353515625, -0.03716850280761719, -0.03423309326171875, -0.03129768371582031, -0.028362274169921875, -0.025426864624023438, -0.022491455078125, -0.019556045532226562, -0.016620635986328125, -0.013685226440429688, -0.01074981689453125, -0.007814407348632812, -0.004878997802734375, -0.0019435882568359375, 0.0009918212890625, 0.0039272308349609375, 0.006862640380859375, 0.009798049926757812, 0.01273345947265625, 0.015668869018554688, 0.018604278564453125, 0.021539688110351562, 0.02447509765625, 0.027410507202148438, 0.030345916748046875, 0.03328132629394531, 0.03621673583984375, 0.03915214538574219, 0.042087554931640625, 0.04502296447753906, 0.0479583740234375, 0.05089378356933594, 0.053829193115234375, 0.05676460266113281, 0.05970001220703125, 0.06263542175292969, 0.06557083129882812, 0.06850624084472656, 0.071441650390625, 0.07437705993652344, 0.07731246948242188, 0.08024787902832031, 0.08318328857421875, 0.08611869812011719, 0.08905410766601562, 0.09198951721191406, 0.0949249267578125, 0.09786033630371094, 0.10079574584960938, 0.10373115539550781, 0.10666656494140625, 0.10960197448730469, 0.11253738403320312, 0.11547279357910156, 0.118408203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 24.0, 31.0, 78.0, 254.0, 2837.0, 607.0, 105.0, 48.0, 23.0, 17.0, 9.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02154541015625, -0.020253658294677734, -0.01896190643310547, -0.017670154571533203, -0.016378402709960938, -0.015086650848388672, -0.013794898986816406, -0.01250314712524414, -0.011211395263671875, -0.00991964340209961, -0.008627891540527344, -0.007336139678955078, -0.0060443878173828125, -0.004752635955810547, -0.0034608840942382812, -0.0021691322326660156, -0.00087738037109375, 0.0004143714904785156, 0.0017061233520507812, 0.002997875213623047, 0.0042896270751953125, 0.005581378936767578, 0.006873130798339844, 0.00816488265991211, 0.009456634521484375, 0.01074838638305664, 0.012040138244628906, 0.013331890106201172, 0.014623641967773438, 0.015915393829345703, 0.01720714569091797, 0.018498897552490234, 0.0197906494140625, 0.021082401275634766, 0.02237415313720703, 0.023665904998779297, 0.024957656860351562, 0.026249408721923828, 0.027541160583496094, 0.02883291244506836, 0.030124664306640625, 0.03141641616821289, 0.032708168029785156, 0.03399991989135742, 0.03529167175292969, 0.03658342361450195, 0.03787517547607422, 0.039166927337646484, 0.04045867919921875, 0.041750431060791016, 0.04304218292236328, 0.04433393478393555, 0.04562568664550781, 0.04691743850708008, 0.048209190368652344, 0.04950094223022461, 0.050792694091796875, 0.05208444595336914, 0.053376197814941406, 0.05466794967651367, 0.05595970153808594, 0.0572514533996582, 0.05854320526123047, 0.059834957122802734, 0.061126708984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 13.0, 83.0, 585.0, 277.0, 25.0, 6.0, 5.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.38697558641433716, -0.3743705749511719, -0.3617655634880066, -0.3491605222225189, -0.33655551075935364, -0.32395049929618835, -0.3113454580307007, -0.2987404465675354, -0.2861354351043701, -0.27353042364120483, -0.26092541217803955, -0.24832037091255188, -0.2357153594493866, -0.2231103479862213, -0.21050532162189484, -0.19790029525756836, -0.18529528379440308, -0.1726902723312378, -0.16008524596691132, -0.14748021960258484, -0.13487520813941956, -0.12227018922567368, -0.1096651703119278, -0.09706015139818192, -0.08445513248443604, -0.07185011357069016, -0.059245094656944275, -0.046640075743198395, -0.034035056829452515, -0.021430037915706635, -0.008825019001960754, 0.0037799999117851257, 0.016385018825531006, 0.028990037739276886, 0.041595056653022766, 0.054200075566768646, 0.06680509448051453, 0.0794101133942604, 0.09201513230800629, 0.10462015122175217, 0.11722517013549805, 0.12983018159866333, 0.1424352079629898, 0.15504023432731628, 0.16764524579048157, 0.18025025725364685, 0.19285528361797333, 0.2054603099822998, 0.2180653214454651, 0.23067033290863037, 0.24327535927295685, 0.2558803856372833, 0.2684853971004486, 0.2810904085636139, 0.29369544982910156, 0.30630046129226685, 0.31890547275543213, 0.3315104842185974, 0.3441154956817627, 0.35672053694725037, 0.36932554841041565, 0.38193055987358093, 0.3945356011390686, 0.4071406126022339, 0.41974562406539917]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 9.0, 24.0, 41.0, 46.0, 85.0, 98.0, 112.0, 125.0, 121.0, 106.0, 75.0, 71.0, 29.0, 19.0, 11.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14142745733261108, -0.1362578272819519, -0.13108819723129272, -0.12591858208179474, -0.12074895203113556, -0.11557932198047638, -0.1104096993803978, -0.10524007678031921, -0.10007044672966003, -0.09490081667900085, -0.08973119407892227, -0.08456157147884369, -0.07939194142818451, -0.07422231137752533, -0.06905268877744675, -0.06388306617736816, -0.058713436126708984, -0.0535438098013401, -0.04837418347597122, -0.04320455715060234, -0.03803493082523346, -0.03286530449986458, -0.027695678174495697, -0.022526051849126816, -0.017356425523757935, -0.012186799198389053, -0.007017172873020172, -0.001847546547651291, 0.0033220797777175903, 0.008491706103086472, 0.013661332428455353, 0.018830958753824234, 0.024000585079193115, 0.029170211404561996, 0.03433983772993088, 0.03950946405529976, 0.04467909038066864, 0.04984871670603752, 0.0550183430314064, 0.060187969356775284, 0.06535759568214417, 0.07052722573280334, 0.07569684833288193, 0.08086647093296051, 0.08603610098361969, 0.09120573103427887, 0.09637535363435745, 0.10154497623443604, 0.10671460628509521, 0.1118842363357544, 0.11705385893583298, 0.12222348153591156, 0.12739311158657074, 0.13256274163722992, 0.1377323567867279, 0.14290198683738708, 0.14807161688804626, 0.15324124693870544, 0.15841087698936462, 0.1635804921388626, 0.1687501221895218, 0.17391975224018097, 0.17908936738967896, 0.18425899744033813, 0.18942862749099731]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 11.0, 8.0, 16.0, 17.0, 35.0, 37.0, 48.0, 63.0, 90.0, 131.0, 209.0, 335.0, 533.0, 911.0, 1674.0, 3092.0, 6288.0, 14260.0, 36125.0, 107571.0, 362712.0, 349207.0, 103331.0, 34634.0, 13787.0, 6289.0, 2971.0, 1685.0, 922.0, 549.0, 344.0, 188.0, 130.0, 106.0, 85.0, 46.0, 32.0, 22.0, 19.0, 11.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0478515625, -0.04630708694458008, -0.044762611389160156, -0.043218135833740234, -0.04167366027832031, -0.04012918472290039, -0.03858470916748047, -0.03704023361206055, -0.035495758056640625, -0.0339512825012207, -0.03240680694580078, -0.03086233139038086, -0.029317855834960938, -0.027773380279541016, -0.026228904724121094, -0.024684429168701172, -0.02313995361328125, -0.021595478057861328, -0.020051002502441406, -0.018506526947021484, -0.016962051391601562, -0.01541757583618164, -0.013873100280761719, -0.012328624725341797, -0.010784149169921875, -0.009239673614501953, -0.007695198059082031, -0.006150722503662109, -0.0046062469482421875, -0.0030617713928222656, -0.0015172958374023438, 2.7179718017578125e-05, 0.0015716552734375, 0.003116130828857422, 0.004660606384277344, 0.006205081939697266, 0.0077495574951171875, 0.00929403305053711, 0.010838508605957031, 0.012382984161376953, 0.013927459716796875, 0.015471935272216797, 0.01701641082763672, 0.01856088638305664, 0.020105361938476562, 0.021649837493896484, 0.023194313049316406, 0.024738788604736328, 0.02628326416015625, 0.027827739715576172, 0.029372215270996094, 0.030916690826416016, 0.03246116638183594, 0.03400564193725586, 0.03555011749267578, 0.0370945930480957, 0.038639068603515625, 0.04018354415893555, 0.04172801971435547, 0.04327249526977539, 0.04481697082519531, 0.046361446380615234, 0.047905921936035156, 0.04945039749145508, 0.050994873046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 11.0, 15.0, 29.0, 27.0, 27.0, 40.0, 57.0, 53.0, 66.0, 82.0, 86.0, 76.0, 63.0, 60.0, 54.0, 53.0, 39.0, 36.0, 26.0, 20.0, 15.0, 21.0, 8.0, 2.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036468505859375, -0.035399436950683594, -0.03433036804199219, -0.03326129913330078, -0.032192230224609375, -0.03112316131591797, -0.030054092407226562, -0.028985023498535156, -0.02791595458984375, -0.026846885681152344, -0.025777816772460938, -0.02470874786376953, -0.023639678955078125, -0.02257061004638672, -0.021501541137695312, -0.020432472229003906, -0.0193634033203125, -0.018294334411621094, -0.017225265502929688, -0.01615619659423828, -0.015087127685546875, -0.014018058776855469, -0.012948989868164062, -0.011879920959472656, -0.01081085205078125, -0.009741783142089844, -0.008672714233398438, -0.007603645324707031, -0.006534576416015625, -0.005465507507324219, -0.0043964385986328125, -0.0033273696899414062, -0.00225830078125, -0.0011892318725585938, -0.0001201629638671875, 0.0009489059448242188, 0.002017974853515625, 0.0030870437622070312, 0.0041561126708984375, 0.005225181579589844, 0.00629425048828125, 0.007363319396972656, 0.008432388305664062, 0.009501457214355469, 0.010570526123046875, 0.011639595031738281, 0.012708663940429688, 0.013777732849121094, 0.0148468017578125, 0.015915870666503906, 0.016984939575195312, 0.01805400848388672, 0.019123077392578125, 0.02019214630126953, 0.021261215209960938, 0.022330284118652344, 0.02339935302734375, 0.024468421936035156, 0.025537490844726562, 0.02660655975341797, 0.027675628662109375, 0.02874469757080078, 0.029813766479492188, 0.030882835388183594, 0.031951904296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 8.0, 17.0, 15.0, 29.0, 37.0, 37.0, 48.0, 72.0, 125.0, 165.0, 245.0, 445.0, 721.0, 1314.0, 2911.0, 7216.0, 22811.0, 91332.0, 458727.0, 362311.0, 69706.0, 18633.0, 6096.0, 2529.0, 1181.0, 643.0, 397.0, 265.0, 147.0, 83.0, 76.0, 53.0, 36.0, 30.0, 25.0, 18.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.048095703125, -0.04648780822753906, -0.044879913330078125, -0.04327201843261719, -0.04166412353515625, -0.04005622863769531, -0.038448333740234375, -0.03684043884277344, -0.0352325439453125, -0.03362464904785156, -0.032016754150390625, -0.030408859252929688, -0.02880096435546875, -0.027193069458007812, -0.025585174560546875, -0.023977279663085938, -0.022369384765625, -0.020761489868164062, -0.019153594970703125, -0.017545700073242188, -0.01593780517578125, -0.014329910278320312, -0.012722015380859375, -0.011114120483398438, -0.0095062255859375, -0.007898330688476562, -0.006290435791015625, -0.0046825408935546875, -0.00307464599609375, -0.0014667510986328125, 0.000141143798828125, 0.0017490386962890625, 0.00335693359375, 0.0049648284912109375, 0.006572723388671875, 0.008180618286132812, 0.00978851318359375, 0.011396408081054688, 0.013004302978515625, 0.014612197875976562, 0.0162200927734375, 0.017827987670898438, 0.019435882568359375, 0.021043777465820312, 0.02265167236328125, 0.024259567260742188, 0.025867462158203125, 0.027475357055664062, 0.029083251953125, 0.030691146850585938, 0.032299041748046875, 0.03390693664550781, 0.03551483154296875, 0.03712272644042969, 0.038730621337890625, 0.04033851623535156, 0.0419464111328125, 0.04355430603027344, 0.045162200927734375, 0.04677009582519531, 0.04837799072265625, 0.04998588562011719, 0.051593780517578125, 0.05320167541503906, 0.0548095703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 7.0, 13.0, 13.0, 15.0, 22.0, 20.0, 22.0, 29.0, 29.0, 37.0, 38.0, 35.0, 50.0, 53.0, 55.0, 47.0, 45.0, 52.0, 42.0, 35.0, 37.0, 41.0, 28.0, 28.0, 28.0, 31.0, 22.0, 24.0, 23.0, 19.0, 8.0, 5.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08441162109375, -0.08162498474121094, -0.07883834838867188, -0.07605171203613281, -0.07326507568359375, -0.07047843933105469, -0.06769180297851562, -0.06490516662597656, -0.0621185302734375, -0.05933189392089844, -0.056545257568359375, -0.05375862121582031, -0.05097198486328125, -0.04818534851074219, -0.045398712158203125, -0.04261207580566406, -0.039825439453125, -0.03703880310058594, -0.034252166748046875, -0.03146553039550781, -0.02867889404296875, -0.025892257690429688, -0.023105621337890625, -0.020318984985351562, -0.0175323486328125, -0.014745712280273438, -0.011959075927734375, -0.009172439575195312, -0.00638580322265625, -0.0035991668701171875, -0.000812530517578125, 0.0019741058349609375, 0.0047607421875, 0.0075473785400390625, 0.010334014892578125, 0.013120651245117188, 0.01590728759765625, 0.018693923950195312, 0.021480560302734375, 0.024267196655273438, 0.0270538330078125, 0.029840469360351562, 0.032627105712890625, 0.03541374206542969, 0.03820037841796875, 0.04098701477050781, 0.043773651123046875, 0.04656028747558594, 0.049346923828125, 0.05213356018066406, 0.054920196533203125, 0.05770683288574219, 0.06049346923828125, 0.06328010559082031, 0.06606674194335938, 0.06885337829589844, 0.0716400146484375, 0.07442665100097656, 0.07721328735351562, 0.07999992370605469, 0.08278656005859375, 0.08557319641113281, 0.08835983276367188, 0.09114646911621094, 0.09393310546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 8.0, 3.0, 12.0, 13.0, 37.0, 71.0, 171.0, 503.0, 1997.0, 19916.0, 734403.0, 282548.0, 7105.0, 1163.0, 336.0, 139.0, 58.0, 31.0, 15.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03546142578125, -0.034523963928222656, -0.03358650207519531, -0.03264904022216797, -0.031711578369140625, -0.03077411651611328, -0.029836654663085938, -0.028899192810058594, -0.02796173095703125, -0.027024269104003906, -0.026086807250976562, -0.02514934539794922, -0.024211883544921875, -0.02327442169189453, -0.022336959838867188, -0.021399497985839844, -0.0204620361328125, -0.019524574279785156, -0.018587112426757812, -0.01764965057373047, -0.016712188720703125, -0.01577472686767578, -0.014837265014648438, -0.013899803161621094, -0.01296234130859375, -0.012024879455566406, -0.011087417602539062, -0.010149955749511719, -0.009212493896484375, -0.008275032043457031, -0.0073375701904296875, -0.006400108337402344, -0.005462646484375, -0.004525184631347656, -0.0035877227783203125, -0.0026502609252929688, -0.001712799072265625, -0.0007753372192382812, 0.0001621246337890625, 0.0010995864868164062, 0.00203704833984375, 0.0029745101928710938, 0.0039119720458984375, 0.004849433898925781, 0.005786895751953125, 0.006724357604980469, 0.0076618194580078125, 0.008599281311035156, 0.0095367431640625, 0.010474205017089844, 0.011411666870117188, 0.012349128723144531, 0.013286590576171875, 0.014224052429199219, 0.015161514282226562, 0.016098976135253906, 0.01703643798828125, 0.017973899841308594, 0.018911361694335938, 0.01984882354736328, 0.020786285400390625, 0.02172374725341797, 0.022661209106445312, 0.023598670959472656, 0.0245361328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 5.0, 9.0, 6.0, 12.0, 16.0, 31.0, 32.0, 38.0, 49.0, 65.0, 58.0, 59.0, 67.0, 115.0, 65.0, 62.0, 45.0, 59.0, 54.0, 30.0, 30.0, 19.0, 29.0, 14.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.947185516357422e-06, -4.754401743412018e-06, -4.561617970466614e-06, -4.36883419752121e-06, -4.176050424575806e-06, -3.983266651630402e-06, -3.7904828786849976e-06, -3.5976991057395935e-06, -3.4049153327941895e-06, -3.2121315598487854e-06, -3.0193477869033813e-06, -2.8265640139579773e-06, -2.6337802410125732e-06, -2.440996468067169e-06, -2.248212695121765e-06, -2.055428922176361e-06, -1.862645149230957e-06, -1.669861376285553e-06, -1.477077603340149e-06, -1.2842938303947449e-06, -1.0915100574493408e-06, -8.987262845039368e-07, -7.059425115585327e-07, -5.131587386131287e-07, -3.203749656677246e-07, -1.2759119272232056e-07, 6.51925802230835e-08, 2.5797635316848755e-07, 4.507601261138916e-07, 6.435438990592957e-07, 8.363276720046997e-07, 1.0291114449501038e-06, 1.2218952178955078e-06, 1.4146789908409119e-06, 1.607462763786316e-06, 1.80024653673172e-06, 1.993030309677124e-06, 2.185814082622528e-06, 2.378597855567932e-06, 2.571381628513336e-06, 2.7641654014587402e-06, 2.9569491744041443e-06, 3.1497329473495483e-06, 3.3425167202949524e-06, 3.5353004932403564e-06, 3.7280842661857605e-06, 3.9208680391311646e-06, 4.113651812076569e-06, 4.306435585021973e-06, 4.499219357967377e-06, 4.692003130912781e-06, 4.884786903858185e-06, 5.077570676803589e-06, 5.270354449748993e-06, 5.463138222694397e-06, 5.655921995639801e-06, 5.848705768585205e-06, 6.041489541530609e-06, 6.234273314476013e-06, 6.427057087421417e-06, 6.619840860366821e-06, 6.812624633312225e-06, 7.005408406257629e-06, 7.1981921792030334e-06, 7.3909759521484375e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 9.0, 12.0, 15.0, 36.0, 51.0, 71.0, 130.0, 296.0, 632.0, 1788.0, 7921.0, 61682.0, 506466.0, 415950.0, 44543.0, 6135.0, 1635.0, 609.0, 223.0, 129.0, 70.0, 47.0, 41.0, 23.0, 10.0, 4.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0179901123046875, -0.01738905906677246, -0.016788005828857422, -0.016186952590942383, -0.015585899353027344, -0.014984846115112305, -0.014383792877197266, -0.013782739639282227, -0.013181686401367188, -0.012580633163452148, -0.01197957992553711, -0.01137852668762207, -0.010777473449707031, -0.010176420211791992, -0.009575366973876953, -0.008974313735961914, -0.008373260498046875, -0.007772207260131836, -0.007171154022216797, -0.006570100784301758, -0.005969047546386719, -0.00536799430847168, -0.004766941070556641, -0.0041658878326416016, -0.0035648345947265625, -0.0029637813568115234, -0.0023627281188964844, -0.0017616748809814453, -0.0011606216430664062, -0.0005595684051513672, 4.1484832763671875e-05, 0.0006425380706787109, 0.00124359130859375, 0.001844644546508789, 0.002445697784423828, 0.003046751022338867, 0.0036478042602539062, 0.004248857498168945, 0.004849910736083984, 0.0054509639739990234, 0.0060520172119140625, 0.0066530704498291016, 0.007254123687744141, 0.00785517692565918, 0.008456230163574219, 0.009057283401489258, 0.009658336639404297, 0.010259389877319336, 0.010860443115234375, 0.011461496353149414, 0.012062549591064453, 0.012663602828979492, 0.013264656066894531, 0.01386570930480957, 0.01446676254272461, 0.015067815780639648, 0.015668869018554688, 0.016269922256469727, 0.016870975494384766, 0.017472028732299805, 0.018073081970214844, 0.018674135208129883, 0.019275188446044922, 0.01987624168395996, 0.020477294921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 13.0, 2.0, 12.0, 20.0, 24.0, 32.0, 38.0, 49.0, 76.0, 86.0, 68.0, 93.0, 87.0, 102.0, 72.0, 65.0, 40.0, 37.0, 29.0, 15.0, 13.0, 12.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0189666748046875, -0.01835036277770996, -0.017734050750732422, -0.017117738723754883, -0.016501426696777344, -0.015885114669799805, -0.015268802642822266, -0.014652490615844727, -0.014036178588867188, -0.013419866561889648, -0.01280355453491211, -0.01218724250793457, -0.011570930480957031, -0.010954618453979492, -0.010338306427001953, -0.009721994400024414, -0.009105682373046875, -0.008489370346069336, -0.007873058319091797, -0.007256746292114258, -0.006640434265136719, -0.00602412223815918, -0.005407810211181641, -0.0047914981842041016, -0.0041751861572265625, -0.0035588741302490234, -0.0029425621032714844, -0.0023262500762939453, -0.0017099380493164062, -0.0010936260223388672, -0.0004773139953613281, 0.00013899803161621094, 0.00075531005859375, 0.001371622085571289, 0.001987934112548828, 0.002604246139526367, 0.0032205581665039062, 0.0038368701934814453, 0.004453182220458984, 0.0050694942474365234, 0.0056858062744140625, 0.0063021183013916016, 0.006918430328369141, 0.00753474235534668, 0.008151054382324219, 0.008767366409301758, 0.009383678436279297, 0.009999990463256836, 0.010616302490234375, 0.011232614517211914, 0.011848926544189453, 0.012465238571166992, 0.013081550598144531, 0.01369786262512207, 0.01431417465209961, 0.014930486679077148, 0.015546798706054688, 0.016163110733032227, 0.016779422760009766, 0.017395734786987305, 0.018012046813964844, 0.018628358840942383, 0.019244670867919922, 0.01986098289489746, 0.020477294921875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 21.0, 87.0, 341.0, 415.0, 93.0, 31.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5913399457931519, -0.5587685108184814, -0.5261971354484558, -0.4936257302761078, -0.46105432510375977, -0.42848291993141174, -0.3959115147590637, -0.3633401095867157, -0.3307687044143677, -0.29819729924201965, -0.26562589406967163, -0.2330544888973236, -0.20048308372497559, -0.16791167855262756, -0.13534027338027954, -0.10276886820793152, -0.0701974630355835, -0.037626057863235474, -0.005054652690887451, 0.02751675248146057, 0.060088157653808594, 0.09265956282615662, 0.12523096799850464, 0.15780237317085266, 0.19037377834320068, 0.2229451835155487, 0.25551658868789673, 0.28808799386024475, 0.3206593990325928, 0.3532308042049408, 0.3858022093772888, 0.41837361454963684, 0.4509451389312744, 0.48351654410362244, 0.5160879492759705, 0.5486593246459961, 0.5812307596206665, 0.6138021945953369, 0.6463735699653625, 0.6789449453353882, 0.7115163803100586, 0.744087815284729, 0.7766591906547546, 0.8092305660247803, 0.8418020009994507, 0.8743734359741211, 0.9069448113441467, 0.9395161867141724, 0.9720876216888428, 1.0046590566635132, 1.0372304916381836, 1.0698018074035645, 1.1023732423782349, 1.1349446773529053, 1.1675159931182861, 1.2000874280929565, 1.232658863067627, 1.2652302980422974, 1.2978017330169678, 1.3303730487823486, 1.362944483757019, 1.3955159187316895, 1.4280872344970703, 1.4606586694717407, 1.4932301044464111]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 9.0, 12.0, 8.0, 5.0, 10.0, 8.0, 19.0, 15.0, 20.0, 14.0, 26.0, 20.0, 20.0, 22.0, 29.0, 22.0, 31.0, 41.0, 33.0, 39.0, 32.0, 47.0, 54.0, 44.0, 46.0, 38.0, 40.0, 39.0, 29.0, 28.0, 26.0, 26.0, 24.0, 15.0, 12.0, 15.0, 14.0, 13.0, 7.0, 9.0, 7.0, 3.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.3801348805427551, -0.3685291111469269, -0.35692334175109863, -0.345317542552948, -0.33371177315711975, -0.3221060037612915, -0.31050023436546326, -0.298894464969635, -0.2872886657714844, -0.27568289637565613, -0.2640771269798279, -0.25247132778167725, -0.240865558385849, -0.22925978899002075, -0.2176540195941925, -0.20604825019836426, -0.194442480802536, -0.18283671140670776, -0.17123092710971832, -0.15962515771389008, -0.14801937341690063, -0.1364136040210724, -0.12480783462524414, -0.1132020577788353, -0.10159628093242645, -0.08999050408601761, -0.07838472723960876, -0.06677895784378052, -0.055173180997371674, -0.04356740415096283, -0.03196163475513458, -0.02035585790872574, -0.008750081062316895, 0.0028556939214468002, 0.014461468905210495, 0.02606724202632904, 0.037673018872737885, 0.04927879571914673, 0.060884565114974976, 0.07249034196138382, 0.08409611880779266, 0.09570189565420151, 0.10730767250061035, 0.1189134418964386, 0.13051921129226685, 0.1421249955892563, 0.15373076498508453, 0.16533654928207397, 0.17694231867790222, 0.18854808807373047, 0.2001538723707199, 0.21175964176654816, 0.2233654260635376, 0.23497119545936584, 0.2465769648551941, 0.25818273425102234, 0.2697885036468506, 0.28139427304267883, 0.2930000424385071, 0.3046058416366577, 0.31621161103248596, 0.3278173804283142, 0.33942314982414246, 0.3510289192199707, 0.36263471841812134]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 20.0, 21.0, 38.0, 80.0, 149.0, 230.0, 446.0, 1015.0, 2801.0, 13994.0, 3591430.0, 568767.0, 10777.0, 2451.0, 963.0, 425.0, 273.0, 151.0, 83.0, 51.0, 33.0, 22.0, 15.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15087890625, -0.14690303802490234, -0.1429271697998047, -0.13895130157470703, -0.13497543334960938, -0.13099956512451172, -0.12702369689941406, -0.1230478286743164, -0.11907196044921875, -0.1150960922241211, -0.11112022399902344, -0.10714435577392578, -0.10316848754882812, -0.09919261932373047, -0.09521675109863281, -0.09124088287353516, -0.0872650146484375, -0.08328914642333984, -0.07931327819824219, -0.07533740997314453, -0.07136154174804688, -0.06738567352294922, -0.06340980529785156, -0.059433937072753906, -0.05545806884765625, -0.051482200622558594, -0.04750633239746094, -0.04353046417236328, -0.039554595947265625, -0.03557872772216797, -0.03160285949707031, -0.027626991271972656, -0.023651123046875, -0.019675254821777344, -0.015699386596679688, -0.011723518371582031, -0.007747650146484375, -0.0037717819213867188, 0.0002040863037109375, 0.004179954528808594, 0.00815582275390625, 0.012131690979003906, 0.016107559204101562, 0.02008342742919922, 0.024059295654296875, 0.02803516387939453, 0.03201103210449219, 0.035986900329589844, 0.0399627685546875, 0.043938636779785156, 0.04791450500488281, 0.05189037322998047, 0.055866241455078125, 0.05984210968017578, 0.06381797790527344, 0.0677938461303711, 0.07176971435546875, 0.0757455825805664, 0.07972145080566406, 0.08369731903076172, 0.08767318725585938, 0.09164905548095703, 0.09562492370605469, 0.09960079193115234, 0.10357666015625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 6.0, 13.0, 11.0, 23.0, 31.0, 28.0, 30.0, 41.0, 45.0, 64.0, 78.0, 78.0, 70.0, 73.0, 78.0, 53.0, 48.0, 41.0, 56.0, 27.0, 30.0, 21.0, 12.0, 14.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036163330078125, -0.03509092330932617, -0.034018516540527344, -0.032946109771728516, -0.03187370300292969, -0.03080129623413086, -0.02972888946533203, -0.028656482696533203, -0.027584075927734375, -0.026511669158935547, -0.02543926239013672, -0.02436685562133789, -0.023294448852539062, -0.022222042083740234, -0.021149635314941406, -0.020077228546142578, -0.01900482177734375, -0.017932415008544922, -0.016860008239746094, -0.015787601470947266, -0.014715194702148438, -0.01364278793334961, -0.012570381164550781, -0.011497974395751953, -0.010425567626953125, -0.009353160858154297, -0.008280754089355469, -0.007208347320556641, -0.0061359405517578125, -0.005063533782958984, -0.003991127014160156, -0.002918720245361328, -0.0018463134765625, -0.0007739067077636719, 0.00029850006103515625, 0.0013709068298339844, 0.0024433135986328125, 0.0035157203674316406, 0.004588127136230469, 0.005660533905029297, 0.006732940673828125, 0.007805347442626953, 0.008877754211425781, 0.00995016098022461, 0.011022567749023438, 0.012094974517822266, 0.013167381286621094, 0.014239788055419922, 0.01531219482421875, 0.016384601593017578, 0.017457008361816406, 0.018529415130615234, 0.019601821899414062, 0.02067422866821289, 0.02174663543701172, 0.022819042205810547, 0.023891448974609375, 0.024963855743408203, 0.02603626251220703, 0.02710866928100586, 0.028181076049804688, 0.029253482818603516, 0.030325889587402344, 0.03139829635620117, 0.032470703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 15.0, 25.0, 40.0, 78.0, 96.0, 177.0, 309.0, 460.0, 811.0, 1561.0, 4301.0, 20782.0, 1517769.0, 2618106.0, 21728.0, 4459.0, 1541.0, 786.0, 444.0, 266.0, 209.0, 113.0, 72.0, 49.0, 23.0, 11.0, 20.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0791015625, -0.0762777328491211, -0.07345390319824219, -0.07063007354736328, -0.06780624389648438, -0.06498241424560547, -0.06215858459472656, -0.059334754943847656, -0.05651092529296875, -0.053687095642089844, -0.05086326599121094, -0.04803943634033203, -0.045215606689453125, -0.04239177703857422, -0.03956794738769531, -0.036744117736816406, -0.0339202880859375, -0.031096458435058594, -0.028272628784179688, -0.02544879913330078, -0.022624969482421875, -0.01980113983154297, -0.016977310180664062, -0.014153480529785156, -0.01132965087890625, -0.008505821228027344, -0.0056819915771484375, -0.0028581619262695312, -3.4332275390625e-05, 0.0027894973754882812, 0.0056133270263671875, 0.008437156677246094, 0.011260986328125, 0.014084815979003906, 0.016908645629882812, 0.01973247528076172, 0.022556304931640625, 0.02538013458251953, 0.028203964233398438, 0.031027793884277344, 0.03385162353515625, 0.036675453186035156, 0.03949928283691406, 0.04232311248779297, 0.045146942138671875, 0.04797077178955078, 0.05079460144042969, 0.053618431091308594, 0.0564422607421875, 0.059266090393066406, 0.06208992004394531, 0.06491374969482422, 0.06773757934570312, 0.07056140899658203, 0.07338523864746094, 0.07620906829833984, 0.07903289794921875, 0.08185672760009766, 0.08468055725097656, 0.08750438690185547, 0.09032821655273438, 0.09315204620361328, 0.09597587585449219, 0.0987997055053711, 0.10162353515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 11.0, 12.0, 35.0, 64.0, 197.0, 2696.0, 777.0, 124.0, 60.0, 22.0, 11.0, 14.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0202484130859375, -0.01877903938293457, -0.01730966567993164, -0.01584029197692871, -0.014370918273925781, -0.012901544570922852, -0.011432170867919922, -0.009962797164916992, -0.008493423461914062, -0.007024049758911133, -0.005554676055908203, -0.0040853023529052734, -0.0026159286499023438, -0.001146554946899414, 0.0003228187561035156, 0.0017921924591064453, 0.003261566162109375, 0.004730939865112305, 0.006200313568115234, 0.007669687271118164, 0.009139060974121094, 0.010608434677124023, 0.012077808380126953, 0.013547182083129883, 0.015016555786132812, 0.016485929489135742, 0.017955303192138672, 0.0194246768951416, 0.02089405059814453, 0.02236342430114746, 0.02383279800415039, 0.02530217170715332, 0.02677154541015625, 0.02824091911315918, 0.02971029281616211, 0.03117966651916504, 0.03264904022216797, 0.0341184139251709, 0.03558778762817383, 0.03705716133117676, 0.03852653503417969, 0.03999590873718262, 0.04146528244018555, 0.04293465614318848, 0.044404029846191406, 0.045873403549194336, 0.047342777252197266, 0.048812150955200195, 0.050281524658203125, 0.051750898361206055, 0.053220272064208984, 0.054689645767211914, 0.056159019470214844, 0.05762839317321777, 0.0590977668762207, 0.06056714057922363, 0.06203651428222656, 0.06350588798522949, 0.06497526168823242, 0.06644463539123535, 0.06791400909423828, 0.06938338279724121, 0.07085275650024414, 0.07232213020324707, 0.07379150390625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 4.0, 10.0, 290.0, 595.0, 76.0, 21.0, 8.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08917739987373352, -0.0673225149512291, -0.04546763375401497, -0.023612752556800842, -0.0017578676342964172, 0.020097017288208008, 0.041951894760131836, 0.06380678713321686, 0.08566166460514069, 0.10751654952764511, 0.12937143445014954, 0.15122631192207336, 0.1730811893939972, 0.19493608176708221, 0.21679095923900604, 0.23864585161209106, 0.2605007290840149, 0.2823556065559387, 0.30421048402786255, 0.3260653614997864, 0.3479202687740326, 0.3697751462459564, 0.39163002371788025, 0.41348493099212646, 0.4353398084640503, 0.4571946859359741, 0.47904956340789795, 0.5009044408798218, 0.5227593183517456, 0.5446141958236694, 0.5664690732955933, 0.5883240103721619, 0.6101788878440857, 0.6320337653160095, 0.6538886427879333, 0.6757435202598572, 0.697598397731781, 0.7194533348083496, 0.7413082122802734, 0.7631630897521973, 0.7850179672241211, 0.8068728446960449, 0.8287277221679688, 0.8505825996398926, 0.8724374771118164, 0.8942923545837402, 0.9161472320556641, 0.9380021691322327, 0.9598569869995117, 0.9817118644714355, 1.0035667419433594, 1.0254216194152832, 1.047276496887207, 1.0691313743591309, 1.0909862518310547, 1.1128411293029785, 1.134696125984192, 1.1565510034561157, 1.1784058809280396, 1.2002607583999634, 1.2221156358718872, 1.243970513343811, 1.2658253908157349, 1.2876802682876587, 1.3095351457595825]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 11.0, 11.0, 23.0, 41.0, 52.0, 71.0, 74.0, 94.0, 104.0, 127.0, 95.0, 88.0, 66.0, 51.0, 36.0, 21.0, 11.0, 12.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17617905139923096, -0.16945287585258484, -0.16272671520709991, -0.1560005396604538, -0.14927437901496887, -0.14254820346832275, -0.13582202792167664, -0.12909585237503052, -0.1223696917295456, -0.11564352363348007, -0.10891735553741455, -0.10219117999076843, -0.09546501189470291, -0.08873884379863739, -0.08201266825199127, -0.07528650015592575, -0.06856033205986023, -0.06183416396379471, -0.05510799214243889, -0.04838182032108307, -0.04165565222501755, -0.034929484128952026, -0.028203312307596207, -0.021477140486240387, -0.014750972390174866, -0.008024802431464195, -0.0012986324727535248, 0.005427537485957146, 0.012153707444667816, 0.018879875540733337, 0.025606047362089157, 0.03233221918344498, 0.0390583872795105, 0.04578455537557602, 0.05251072719693184, 0.05923689901828766, 0.06596306711435318, 0.0726892352104187, 0.07941541075706482, 0.08614157885313034, 0.09286774694919586, 0.09959391504526138, 0.1063200831413269, 0.11304625868797302, 0.11977242678403854, 0.12649859488010406, 0.13322477042675018, 0.1399509310722351, 0.14667710661888123, 0.15340328216552734, 0.16012944281101227, 0.1668556183576584, 0.1735817790031433, 0.18030795454978943, 0.18703413009643555, 0.19376030564308167, 0.2004864662885666, 0.2072126418352127, 0.21393880248069763, 0.22066497802734375, 0.22739115357398987, 0.2341173142194748, 0.2408434897661209, 0.24756965041160583, 0.25429582595825195]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 1.0, 5.0, 6.0, 20.0, 30.0, 45.0, 54.0, 82.0, 101.0, 190.0, 353.0, 602.0, 1080.0, 2208.0, 5749.0, 16571.0, 67794.0, 397164.0, 449539.0, 77377.0, 18424.0, 5985.0, 2392.0, 1208.0, 671.0, 362.0, 204.0, 102.0, 73.0, 42.0, 34.0, 30.0, 14.0, 9.0, 13.0, 2.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07147216796875, -0.06924152374267578, -0.06701087951660156, -0.06478023529052734, -0.06254959106445312, -0.060318946838378906, -0.05808830261230469, -0.05585765838623047, -0.05362701416015625, -0.05139636993408203, -0.04916572570800781, -0.046935081481933594, -0.044704437255859375, -0.042473793029785156, -0.04024314880371094, -0.03801250457763672, -0.0357818603515625, -0.03355121612548828, -0.03132057189941406, -0.029089927673339844, -0.026859283447265625, -0.024628639221191406, -0.022397994995117188, -0.02016735076904297, -0.01793670654296875, -0.01570606231689453, -0.013475418090820312, -0.011244773864746094, -0.009014129638671875, -0.006783485412597656, -0.0045528411865234375, -0.0023221969604492188, -9.1552734375e-05, 0.0021390914916992188, 0.0043697357177734375, 0.006600379943847656, 0.008831024169921875, 0.011061668395996094, 0.013292312622070312, 0.015522956848144531, 0.01775360107421875, 0.01998424530029297, 0.022214889526367188, 0.024445533752441406, 0.026676177978515625, 0.028906822204589844, 0.031137466430664062, 0.03336811065673828, 0.0355987548828125, 0.03782939910888672, 0.04006004333496094, 0.042290687561035156, 0.044521331787109375, 0.046751976013183594, 0.04898262023925781, 0.05121326446533203, 0.05344390869140625, 0.05567455291748047, 0.05790519714355469, 0.060135841369628906, 0.062366485595703125, 0.06459712982177734, 0.06682777404785156, 0.06905841827392578, 0.0712890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 10.0, 13.0, 21.0, 27.0, 33.0, 43.0, 35.0, 46.0, 68.0, 78.0, 81.0, 71.0, 67.0, 57.0, 64.0, 59.0, 48.0, 33.0, 32.0, 27.0, 23.0, 15.0, 10.0, 7.0, 1.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033905029296875, -0.03282976150512695, -0.031754493713378906, -0.03067922592163086, -0.029603958129882812, -0.028528690338134766, -0.02745342254638672, -0.026378154754638672, -0.025302886962890625, -0.024227619171142578, -0.02315235137939453, -0.022077083587646484, -0.021001815795898438, -0.01992654800415039, -0.018851280212402344, -0.017776012420654297, -0.01670074462890625, -0.015625476837158203, -0.014550209045410156, -0.01347494125366211, -0.012399673461914062, -0.011324405670166016, -0.010249137878417969, -0.009173870086669922, -0.008098602294921875, -0.007023334503173828, -0.005948066711425781, -0.004872798919677734, -0.0037975311279296875, -0.0027222633361816406, -0.0016469955444335938, -0.0005717277526855469, 0.0005035400390625, 0.0015788078308105469, 0.0026540756225585938, 0.0037293434143066406, 0.0048046112060546875, 0.005879878997802734, 0.006955146789550781, 0.008030414581298828, 0.009105682373046875, 0.010180950164794922, 0.011256217956542969, 0.012331485748291016, 0.013406753540039062, 0.01448202133178711, 0.015557289123535156, 0.016632556915283203, 0.01770782470703125, 0.018783092498779297, 0.019858360290527344, 0.02093362808227539, 0.022008895874023438, 0.023084163665771484, 0.02415943145751953, 0.025234699249267578, 0.026309967041015625, 0.027385234832763672, 0.02846050262451172, 0.029535770416259766, 0.030611038208007812, 0.03168630599975586, 0.032761573791503906, 0.03383684158325195, 0.034912109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 6.0, 12.0, 10.0, 13.0, 20.0, 21.0, 36.0, 43.0, 56.0, 70.0, 115.0, 159.0, 212.0, 390.0, 719.0, 1504.0, 3293.0, 8618.0, 28368.0, 124798.0, 588623.0, 225988.0, 44244.0, 12635.0, 4404.0, 1893.0, 900.0, 485.0, 275.0, 186.0, 132.0, 64.0, 63.0, 47.0, 25.0, 26.0, 17.0, 14.0, 6.0, 16.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.0540771484375, -0.05242156982421875, -0.0507659912109375, -0.04911041259765625, -0.047454833984375, -0.04579925537109375, -0.0441436767578125, -0.04248809814453125, -0.04083251953125, -0.03917694091796875, -0.0375213623046875, -0.03586578369140625, -0.034210205078125, -0.03255462646484375, -0.0308990478515625, -0.02924346923828125, -0.027587890625, -0.02593231201171875, -0.0242767333984375, -0.02262115478515625, -0.020965576171875, -0.01930999755859375, -0.0176544189453125, -0.01599884033203125, -0.01434326171875, -0.01268768310546875, -0.0110321044921875, -0.00937652587890625, -0.007720947265625, -0.00606536865234375, -0.0044097900390625, -0.00275421142578125, -0.0010986328125, 0.00055694580078125, 0.0022125244140625, 0.00386810302734375, 0.005523681640625, 0.00717926025390625, 0.0088348388671875, 0.01049041748046875, 0.01214599609375, 0.01380157470703125, 0.0154571533203125, 0.01711273193359375, 0.018768310546875, 0.02042388916015625, 0.0220794677734375, 0.02373504638671875, 0.025390625, 0.02704620361328125, 0.0287017822265625, 0.03035736083984375, 0.032012939453125, 0.03366851806640625, 0.0353240966796875, 0.03697967529296875, 0.03863525390625, 0.04029083251953125, 0.0419464111328125, 0.04360198974609375, 0.045257568359375, 0.04691314697265625, 0.0485687255859375, 0.05022430419921875, 0.0518798828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 9.0, 7.0, 6.0, 11.0, 20.0, 20.0, 21.0, 30.0, 37.0, 28.0, 23.0, 25.0, 45.0, 46.0, 49.0, 45.0, 54.0, 48.0, 36.0, 47.0, 49.0, 47.0, 40.0, 40.0, 32.0, 34.0, 21.0, 27.0, 24.0, 16.0, 12.0, 13.0, 10.0, 7.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0975341796875, -0.09458255767822266, -0.09163093566894531, -0.08867931365966797, -0.08572769165039062, -0.08277606964111328, -0.07982444763183594, -0.0768728256225586, -0.07392120361328125, -0.0709695816040039, -0.06801795959472656, -0.06506633758544922, -0.062114715576171875, -0.05916309356689453, -0.05621147155761719, -0.053259849548339844, -0.0503082275390625, -0.047356605529785156, -0.04440498352050781, -0.04145336151123047, -0.038501739501953125, -0.03555011749267578, -0.03259849548339844, -0.029646873474121094, -0.02669525146484375, -0.023743629455566406, -0.020792007446289062, -0.01784038543701172, -0.014888763427734375, -0.011937141418457031, -0.008985519409179688, -0.006033897399902344, -0.003082275390625, -0.00013065338134765625, 0.0028209686279296875, 0.005772590637207031, 0.008724212646484375, 0.011675834655761719, 0.014627456665039062, 0.017579078674316406, 0.02053070068359375, 0.023482322692871094, 0.026433944702148438, 0.02938556671142578, 0.032337188720703125, 0.03528881072998047, 0.03824043273925781, 0.041192054748535156, 0.0441436767578125, 0.047095298767089844, 0.05004692077636719, 0.05299854278564453, 0.055950164794921875, 0.05890178680419922, 0.06185340881347656, 0.0648050308227539, 0.06775665283203125, 0.0707082748413086, 0.07365989685058594, 0.07661151885986328, 0.07956314086914062, 0.08251476287841797, 0.08546638488769531, 0.08841800689697266, 0.09136962890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 1.0, 8.0, 16.0, 14.0, 20.0, 38.0, 52.0, 65.0, 144.0, 211.0, 503.0, 1467.0, 5990.0, 104231.0, 901752.0, 28682.0, 3457.0, 1016.0, 400.0, 182.0, 97.0, 79.0, 47.0, 19.0, 20.0, 14.0, 14.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0482177734375, -0.046959877014160156, -0.04570198059082031, -0.04444408416748047, -0.043186187744140625, -0.04192829132080078, -0.04067039489746094, -0.039412498474121094, -0.03815460205078125, -0.036896705627441406, -0.03563880920410156, -0.03438091278076172, -0.033123016357421875, -0.03186511993408203, -0.030607223510742188, -0.029349327087402344, -0.0280914306640625, -0.026833534240722656, -0.025575637817382812, -0.02431774139404297, -0.023059844970703125, -0.02180194854736328, -0.020544052124023438, -0.019286155700683594, -0.01802825927734375, -0.016770362854003906, -0.015512466430664062, -0.014254570007324219, -0.012996673583984375, -0.011738777160644531, -0.010480880737304688, -0.009222984313964844, -0.007965087890625, -0.006707191467285156, -0.0054492950439453125, -0.004191398620605469, -0.002933502197265625, -0.0016756057739257812, -0.0004177093505859375, 0.0008401870727539062, 0.00209808349609375, 0.0033559799194335938, 0.0046138763427734375, 0.005871772766113281, 0.007129669189453125, 0.008387565612792969, 0.009645462036132812, 0.010903358459472656, 0.0121612548828125, 0.013419151306152344, 0.014677047729492188, 0.01593494415283203, 0.017192840576171875, 0.01845073699951172, 0.019708633422851562, 0.020966529846191406, 0.02222442626953125, 0.023482322692871094, 0.024740219116210938, 0.02599811553955078, 0.027256011962890625, 0.02851390838623047, 0.029771804809570312, 0.031029701232910156, 0.03228759765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 5.0, 8.0, 13.0, 11.0, 24.0, 33.0, 37.0, 39.0, 58.0, 73.0, 76.0, 80.0, 73.0, 92.0, 67.0, 65.0, 52.0, 52.0, 41.0, 25.0, 19.0, 17.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.212162017822266e-06, -6.9765374064445496e-06, -6.7409127950668335e-06, -6.5052881836891174e-06, -6.269663572311401e-06, -6.034038960933685e-06, -5.798414349555969e-06, -5.562789738178253e-06, -5.327165126800537e-06, -5.091540515422821e-06, -4.855915904045105e-06, -4.620291292667389e-06, -4.384666681289673e-06, -4.149042069911957e-06, -3.913417458534241e-06, -3.6777928471565247e-06, -3.4421682357788086e-06, -3.2065436244010925e-06, -2.9709190130233765e-06, -2.7352944016456604e-06, -2.4996697902679443e-06, -2.2640451788902283e-06, -2.028420567512512e-06, -1.7927959561347961e-06, -1.55717134475708e-06, -1.321546733379364e-06, -1.085922122001648e-06, -8.502975106239319e-07, -6.146728992462158e-07, -3.7904828786849976e-07, -1.434236764907837e-07, 9.220093488693237e-08, 3.2782554626464844e-07, 5.634501576423645e-07, 7.990747690200806e-07, 1.0346993803977966e-06, 1.2703239917755127e-06, 1.5059486031532288e-06, 1.7415732145309448e-06, 1.977197825908661e-06, 2.212822437286377e-06, 2.448447048664093e-06, 2.684071660041809e-06, 2.919696271419525e-06, 3.155320882797241e-06, 3.3909454941749573e-06, 3.6265701055526733e-06, 3.862194716930389e-06, 4.0978193283081055e-06, 4.3334439396858215e-06, 4.569068551063538e-06, 4.804693162441254e-06, 5.04031777381897e-06, 5.275942385196686e-06, 5.511566996574402e-06, 5.747191607952118e-06, 5.982816219329834e-06, 6.21844083070755e-06, 6.454065442085266e-06, 6.689690053462982e-06, 6.925314664840698e-06, 7.160939276218414e-06, 7.39656388759613e-06, 7.632188498973846e-06, 7.867813110351562e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 5.0, 5.0, 12.0, 26.0, 47.0, 82.0, 135.0, 285.0, 578.0, 1673.0, 8343.0, 343839.0, 676558.0, 13542.0, 2092.0, 677.0, 312.0, 140.0, 68.0, 50.0, 22.0, 23.0, 13.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.052337646484375, -0.051032304763793945, -0.04972696304321289, -0.048421621322631836, -0.04711627960205078, -0.04581093788146973, -0.04450559616088867, -0.04320025444030762, -0.04189491271972656, -0.04058957099914551, -0.03928422927856445, -0.0379788875579834, -0.036673545837402344, -0.03536820411682129, -0.034062862396240234, -0.03275752067565918, -0.031452178955078125, -0.03014683723449707, -0.028841495513916016, -0.02753615379333496, -0.026230812072753906, -0.02492547035217285, -0.023620128631591797, -0.022314786911010742, -0.021009445190429688, -0.019704103469848633, -0.018398761749267578, -0.017093420028686523, -0.01578807830810547, -0.014482736587524414, -0.01317739486694336, -0.011872053146362305, -0.01056671142578125, -0.009261369705200195, -0.00795602798461914, -0.006650686264038086, -0.005345344543457031, -0.0040400028228759766, -0.002734661102294922, -0.0014293193817138672, -0.0001239776611328125, 0.0011813640594482422, 0.002486705780029297, 0.0037920475006103516, 0.005097389221191406, 0.006402730941772461, 0.007708072662353516, 0.00901341438293457, 0.010318756103515625, 0.01162409782409668, 0.012929439544677734, 0.014234781265258789, 0.015540122985839844, 0.0168454647064209, 0.018150806427001953, 0.019456148147583008, 0.020761489868164062, 0.022066831588745117, 0.023372173309326172, 0.024677515029907227, 0.02598285675048828, 0.027288198471069336, 0.02859354019165039, 0.029898881912231445, 0.0312042236328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 14.0, 30.0, 72.0, 158.0, 266.0, 220.0, 111.0, 67.0, 24.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.069580078125, -0.06787633895874023, -0.06617259979248047, -0.0644688606262207, -0.06276512145996094, -0.06106138229370117, -0.059357643127441406, -0.05765390396118164, -0.055950164794921875, -0.05424642562866211, -0.052542686462402344, -0.05083894729614258, -0.04913520812988281, -0.04743146896362305, -0.04572772979736328, -0.044023990631103516, -0.04232025146484375, -0.040616512298583984, -0.03891277313232422, -0.03720903396606445, -0.03550529479980469, -0.03380155563354492, -0.032097816467285156, -0.03039407730102539, -0.028690338134765625, -0.02698659896850586, -0.025282859802246094, -0.023579120635986328, -0.021875381469726562, -0.020171642303466797, -0.01846790313720703, -0.016764163970947266, -0.0150604248046875, -0.013356685638427734, -0.011652946472167969, -0.009949207305908203, -0.008245468139648438, -0.006541728973388672, -0.004837989807128906, -0.0031342506408691406, -0.001430511474609375, 0.0002732276916503906, 0.0019769668579101562, 0.003680706024169922, 0.0053844451904296875, 0.007088184356689453, 0.008791923522949219, 0.010495662689208984, 0.01219940185546875, 0.013903141021728516, 0.015606880187988281, 0.017310619354248047, 0.019014358520507812, 0.020718097686767578, 0.022421836853027344, 0.02412557601928711, 0.025829315185546875, 0.02753305435180664, 0.029236793518066406, 0.030940532684326172, 0.03264427185058594, 0.0343480110168457, 0.03605175018310547, 0.037755489349365234, 0.039459228515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 10.0, 20.0, 67.0, 217.0, 433.0, 182.0, 45.0, 18.0, 7.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32185208797454834, -0.29093965888023376, -0.2600272595882416, -0.229114830493927, -0.19820240139961243, -0.16728998720645905, -0.13637757301330566, -0.10546514391899109, -0.07455272972583771, -0.04364030808210373, -0.01272789016366005, 0.01818452775478363, 0.04909694939851761, 0.08000937104225159, 0.11092178523540497, 0.14183421432971954, 0.17274662852287292, 0.2036590427160263, 0.23457147181034088, 0.26548388600349426, 0.29639631509780884, 0.327308714389801, 0.3582211434841156, 0.3891335725784302, 0.42004597187042236, 0.45095840096473694, 0.4818708002567291, 0.5127832293510437, 0.5436956286430359, 0.5746080875396729, 0.605520486831665, 0.6364328861236572, 0.6673453450202942, 0.6982577443122864, 0.7291702032089233, 0.7600826025009155, 0.7909950017929077, 0.8219074606895447, 0.8528198599815369, 0.8837323188781738, 0.914644718170166, 0.9455571174621582, 0.9764695763587952, 1.0073819160461426, 1.0382944345474243, 1.0692068338394165, 1.1001192331314087, 1.1310316324234009, 1.161944031715393, 1.1928564310073853, 1.2237688302993774, 1.2546813488006592, 1.2855937480926514, 1.3165061473846436, 1.3474185466766357, 1.378330945968628, 1.4092434644699097, 1.4401558637619019, 1.471068263053894, 1.5019807815551758, 1.532893180847168, 1.5638055801391602, 1.5947179794311523, 1.6256303787231445, 1.6565427780151367]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 9.0, 7.0, 8.0, 16.0, 13.0, 15.0, 16.0, 21.0, 24.0, 24.0, 36.0, 35.0, 32.0, 39.0, 39.0, 53.0, 53.0, 53.0, 50.0, 43.0, 48.0, 49.0, 35.0, 37.0, 25.0, 29.0, 27.0, 16.0, 21.0, 21.0, 16.0, 22.0, 8.0, 8.0, 13.0, 9.0, 7.0, 1.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.44994056224823, -0.4364429712295532, -0.42294538021087646, -0.4094477891921997, -0.39595019817352295, -0.3824526071548462, -0.36895501613616943, -0.3554574251174927, -0.3419598340988159, -0.32846224308013916, -0.3149646520614624, -0.30146706104278564, -0.2879694700241089, -0.27447187900543213, -0.26097428798675537, -0.24747668206691742, -0.23397907614707947, -0.2204814851284027, -0.20698389410972595, -0.1934863030910492, -0.17998871207237244, -0.16649112105369568, -0.15299351513385773, -0.13949592411518097, -0.1259983330965042, -0.11250074207782745, -0.0990031510591507, -0.08550555258989334, -0.07200796157121658, -0.058510370552539825, -0.04501277208328247, -0.03151518106460571, -0.018017590045928955, -0.004519997164607048, 0.008977595716714859, 0.022475190460681915, 0.03597278147935867, 0.04947037249803543, 0.06296797096729279, 0.07646556198596954, 0.0899631530046463, 0.10346074402332306, 0.11695833504199982, 0.13045594096183777, 0.14395353198051453, 0.15745112299919128, 0.17094871401786804, 0.1844463050365448, 0.19794389605522156, 0.21144148707389832, 0.22493907809257507, 0.23843666911125183, 0.2519342601299286, 0.26543185114860535, 0.2789294719696045, 0.29242706298828125, 0.305924654006958, 0.31942224502563477, 0.3329198360443115, 0.3464174270629883, 0.35991501808166504, 0.3734126091003418, 0.38691020011901855, 0.4004077911376953, 0.41390538215637207]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 9.0, 16.0, 19.0, 32.0, 36.0, 79.0, 156.0, 320.0, 1497.0, 256891.0, 3933002.0, 1506.0, 347.0, 145.0, 88.0, 45.0, 33.0, 14.0, 16.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.1978912353515625, -0.191070556640625, -0.1842498779296875, -0.17742919921875, -0.1706085205078125, -0.163787841796875, -0.1569671630859375, -0.150146484375, -0.1433258056640625, -0.136505126953125, -0.1296844482421875, -0.12286376953125, -0.1160430908203125, -0.109222412109375, -0.1024017333984375, -0.0955810546875, -0.0887603759765625, -0.081939697265625, -0.0751190185546875, -0.06829833984375, -0.0614776611328125, -0.054656982421875, -0.0478363037109375, -0.041015625, -0.0341949462890625, -0.027374267578125, -0.0205535888671875, -0.01373291015625, -0.0069122314453125, -9.1552734375e-05, 0.0067291259765625, 0.0135498046875, 0.0203704833984375, 0.027191162109375, 0.0340118408203125, 0.04083251953125, 0.0476531982421875, 0.054473876953125, 0.0612945556640625, 0.068115234375, 0.0749359130859375, 0.081756591796875, 0.0885772705078125, 0.09539794921875, 0.1022186279296875, 0.109039306640625, 0.1158599853515625, 0.1226806640625, 0.1295013427734375, 0.136322021484375, 0.1431427001953125, 0.14996337890625, 0.1567840576171875, 0.163604736328125, 0.1704254150390625, 0.17724609375, 0.1840667724609375, 0.190887451171875, 0.1977081298828125, 0.20452880859375, 0.2113494873046875, 0.218170166015625, 0.2249908447265625, 0.2318115234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 9.0, 9.0, 13.0, 16.0, 17.0, 30.0, 30.0, 35.0, 49.0, 54.0, 52.0, 63.0, 70.0, 85.0, 60.0, 71.0, 61.0, 61.0, 45.0, 35.0, 32.0, 24.0, 20.0, 12.0, 13.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03521728515625, -0.0341339111328125, -0.033050537109375, -0.0319671630859375, -0.0308837890625, -0.0298004150390625, -0.028717041015625, -0.0276336669921875, -0.02655029296875, -0.0254669189453125, -0.024383544921875, -0.0233001708984375, -0.022216796875, -0.0211334228515625, -0.020050048828125, -0.0189666748046875, -0.01788330078125, -0.0167999267578125, -0.015716552734375, -0.0146331787109375, -0.0135498046875, -0.0124664306640625, -0.011383056640625, -0.0102996826171875, -0.00921630859375, -0.0081329345703125, -0.007049560546875, -0.0059661865234375, -0.0048828125, -0.0037994384765625, -0.002716064453125, -0.0016326904296875, -0.00054931640625, 0.0005340576171875, 0.001617431640625, 0.0027008056640625, 0.0037841796875, 0.0048675537109375, 0.005950927734375, 0.0070343017578125, 0.00811767578125, 0.0092010498046875, 0.010284423828125, 0.0113677978515625, 0.012451171875, 0.0135345458984375, 0.014617919921875, 0.0157012939453125, 0.01678466796875, 0.0178680419921875, 0.018951416015625, 0.0200347900390625, 0.0211181640625, 0.0222015380859375, 0.023284912109375, 0.0243682861328125, 0.02545166015625, 0.0265350341796875, 0.027618408203125, 0.0287017822265625, 0.02978515625, 0.0308685302734375, 0.031951904296875, 0.0330352783203125, 0.03411865234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 4.0, 9.0, 15.0, 14.0, 18.0, 22.0, 45.0, 63.0, 109.0, 150.0, 239.0, 349.0, 634.0, 998.0, 1755.0, 3410.0, 6910.0, 20600.0, 348323.0, 3769518.0, 24934.0, 7655.0, 3615.0, 1903.0, 1102.0, 656.0, 422.0, 267.0, 160.0, 110.0, 72.0, 46.0, 39.0, 28.0, 21.0, 11.0, 11.0, 8.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040771484375, -0.0394587516784668, -0.038146018981933594, -0.03683328628540039, -0.03552055358886719, -0.034207820892333984, -0.03289508819580078, -0.03158235549926758, -0.030269622802734375, -0.028956890106201172, -0.02764415740966797, -0.026331424713134766, -0.025018692016601562, -0.02370595932006836, -0.022393226623535156, -0.021080493927001953, -0.01976776123046875, -0.018455028533935547, -0.017142295837402344, -0.01582956314086914, -0.014516830444335938, -0.013204097747802734, -0.011891365051269531, -0.010578632354736328, -0.009265899658203125, -0.007953166961669922, -0.006640434265136719, -0.005327701568603516, -0.0040149688720703125, -0.0027022361755371094, -0.0013895034790039062, -7.677078247070312e-05, 0.0012359619140625, 0.002548694610595703, 0.0038614273071289062, 0.005174160003662109, 0.0064868927001953125, 0.007799625396728516, 0.009112358093261719, 0.010425090789794922, 0.011737823486328125, 0.013050556182861328, 0.014363288879394531, 0.015676021575927734, 0.016988754272460938, 0.01830148696899414, 0.019614219665527344, 0.020926952362060547, 0.02223968505859375, 0.023552417755126953, 0.024865150451660156, 0.02617788314819336, 0.027490615844726562, 0.028803348541259766, 0.03011608123779297, 0.03142881393432617, 0.032741546630859375, 0.03405427932739258, 0.03536701202392578, 0.036679744720458984, 0.03799247741699219, 0.03930521011352539, 0.040617942810058594, 0.0419306755065918, 0.043243408203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 12.0, 16.0, 47.0, 181.0, 3551.0, 146.0, 46.0, 26.0, 8.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0081939697265625, -0.007810831069946289, -0.007427692413330078, -0.007044553756713867, -0.006661415100097656, -0.006278276443481445, -0.005895137786865234, -0.0055119991302490234, -0.0051288604736328125, -0.0047457218170166016, -0.004362583160400391, -0.00397944450378418, -0.0035963058471679688, -0.003213167190551758, -0.002830028533935547, -0.002446889877319336, -0.002063751220703125, -0.001680612564086914, -0.0012974739074707031, -0.0009143352508544922, -0.0005311965942382812, -0.0001480579376220703, 0.00023508071899414062, 0.0006182193756103516, 0.0010013580322265625, 0.0013844966888427734, 0.0017676353454589844, 0.0021507740020751953, 0.0025339126586914062, 0.002917051315307617, 0.003300189971923828, 0.003683328628540039, 0.00406646728515625, 0.004449605941772461, 0.004832744598388672, 0.005215883255004883, 0.005599021911621094, 0.005982160568237305, 0.006365299224853516, 0.0067484378814697266, 0.0071315765380859375, 0.0075147151947021484, 0.00789785385131836, 0.00828099250793457, 0.008664131164550781, 0.009047269821166992, 0.009430408477783203, 0.009813547134399414, 0.010196685791015625, 0.010579824447631836, 0.010962963104248047, 0.011346101760864258, 0.011729240417480469, 0.01211237907409668, 0.01249551773071289, 0.012878656387329102, 0.013261795043945312, 0.013644933700561523, 0.014028072357177734, 0.014411211013793945, 0.014794349670410156, 0.015177488327026367, 0.015560626983642578, 0.01594376564025879, 0.016326904296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 25.0, 113.0, 332.0, 318.0, 151.0, 44.0, 12.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021176515147089958, -0.018057173117995262, -0.014937830157577991, -0.01181848719716072, -0.008699145168066025, -0.005579803138971329, -0.0024604592472314835, 0.0006588827818632126, 0.0037782248109579086, 0.006897567305713892, 0.010016909800469875, 0.013136252760887146, 0.016255594789981842, 0.019374936819076538, 0.022494280710816383, 0.02561362273991108, 0.028732964769005775, 0.03185230866074562, 0.03497165068984032, 0.03809099271893501, 0.04121033474802971, 0.044329676777124405, 0.0474490225315094, 0.050568364560604095, 0.05368770658969879, 0.05680704861879349, 0.059926390647888184, 0.06304573267698288, 0.06616507470607758, 0.06928441673517227, 0.07240375876426697, 0.07552310824394226, 0.07864244282245636, 0.08176178485155106, 0.08488112688064575, 0.08800046890974045, 0.09111981093883514, 0.09423915296792984, 0.09735849499702454, 0.10047784447669983, 0.10359717905521393, 0.10671652108430862, 0.10983586311340332, 0.11295520514249802, 0.11607454717159271, 0.11919388920068741, 0.1223132312297821, 0.1254325807094574, 0.1285519301891327, 0.13167127966880798, 0.13479061424732208, 0.13790996372699738, 0.14102929830551147, 0.14414864778518677, 0.14726798236370087, 0.15038733184337616, 0.15350666642189026, 0.15662601590156555, 0.15974535048007965, 0.16286469995975494, 0.16598403453826904, 0.16910338401794434, 0.17222271859645844, 0.17534206807613373, 0.17846140265464783]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 9.0, 13.0, 10.0, 15.0, 15.0, 24.0, 16.0, 32.0, 38.0, 34.0, 30.0, 34.0, 33.0, 52.0, 53.0, 41.0, 53.0, 36.0, 48.0, 25.0, 41.0, 49.0, 35.0, 32.0, 26.0, 38.0, 17.0, 28.0, 18.0, 19.0, 20.0, 14.0, 9.0, 10.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01923394203186035, -0.01858992502093315, -0.01794590801000595, -0.01730189099907875, -0.01665787398815155, -0.01601385697722435, -0.01536983996629715, -0.01472582295536995, -0.014081805944442749, -0.013437788933515549, -0.012793771922588348, -0.012149754911661148, -0.011505737900733948, -0.010861720889806747, -0.010217703878879547, -0.009573686867952347, -0.008929669857025146, -0.008285652846097946, -0.007641635835170746, -0.0069976188242435455, -0.006353601813316345, -0.005709584802389145, -0.005065567791461945, -0.004421550780534744, -0.003777533769607544, -0.0031335167586803436, -0.0024894997477531433, -0.001845482736825943, -0.0012014657258987427, -0.0005574487149715424, 8.656829595565796e-05, 0.0007305853068828583, 0.0013746023178100586, 0.002018619328737259, 0.0026626363396644592, 0.0033066533505916595, 0.00395067036151886, 0.00459468737244606, 0.0052387043833732605, 0.005882721394300461, 0.006526738405227661, 0.0071707554161548615, 0.007814772427082062, 0.008458789438009262, 0.009102806448936462, 0.009746823459863663, 0.010390840470790863, 0.011034857481718063, 0.011678874492645264, 0.012322891503572464, 0.012966908514499664, 0.013610925525426865, 0.014254942536354065, 0.014898959547281265, 0.015542976558208466, 0.016186993569135666, 0.016831010580062866, 0.017475027590990067, 0.018119044601917267, 0.018763061612844467, 0.019407078623771667, 0.020051095634698868, 0.020695112645626068, 0.02133912965655327, 0.02198314666748047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 16.0, 19.0, 26.0, 39.0, 56.0, 96.0, 129.0, 224.0, 441.0, 683.0, 1362.0, 2759.0, 6419.0, 16883.0, 51228.0, 196041.0, 507733.0, 186590.0, 49040.0, 16517.0, 6399.0, 2797.0, 1348.0, 677.0, 378.0, 242.0, 153.0, 94.0, 48.0, 34.0, 21.0, 14.0, 13.0, 9.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050079345703125, -0.0485377311706543, -0.046996116638183594, -0.04545450210571289, -0.04391288757324219, -0.042371273040771484, -0.04082965850830078, -0.03928804397583008, -0.037746429443359375, -0.03620481491088867, -0.03466320037841797, -0.033121585845947266, -0.03157997131347656, -0.03003835678100586, -0.028496742248535156, -0.026955127716064453, -0.02541351318359375, -0.023871898651123047, -0.022330284118652344, -0.02078866958618164, -0.019247055053710938, -0.017705440521240234, -0.01616382598876953, -0.014622211456298828, -0.013080596923828125, -0.011538982391357422, -0.009997367858886719, -0.008455753326416016, -0.0069141387939453125, -0.005372524261474609, -0.0038309097290039062, -0.002289295196533203, -0.0007476806640625, 0.0007939338684082031, 0.0023355484008789062, 0.0038771629333496094, 0.0054187774658203125, 0.006960391998291016, 0.008502006530761719, 0.010043621063232422, 0.011585235595703125, 0.013126850128173828, 0.014668464660644531, 0.016210079193115234, 0.017751693725585938, 0.01929330825805664, 0.020834922790527344, 0.022376537322998047, 0.02391815185546875, 0.025459766387939453, 0.027001380920410156, 0.02854299545288086, 0.030084609985351562, 0.031626224517822266, 0.03316783905029297, 0.03470945358276367, 0.036251068115234375, 0.03779268264770508, 0.03933429718017578, 0.040875911712646484, 0.04241752624511719, 0.04395914077758789, 0.045500755310058594, 0.0470423698425293, 0.048583984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 6.0, 6.0, 16.0, 19.0, 20.0, 24.0, 28.0, 39.0, 48.0, 57.0, 54.0, 57.0, 58.0, 83.0, 78.0, 56.0, 69.0, 56.0, 36.0, 38.0, 30.0, 23.0, 25.0, 16.0, 16.0, 11.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03411865234375, -0.03304338455200195, -0.031968116760253906, -0.03089284896850586, -0.029817581176757812, -0.028742313385009766, -0.02766704559326172, -0.026591777801513672, -0.025516510009765625, -0.024441242218017578, -0.02336597442626953, -0.022290706634521484, -0.021215438842773438, -0.02014017105102539, -0.019064903259277344, -0.017989635467529297, -0.01691436767578125, -0.015839099884033203, -0.014763832092285156, -0.01368856430053711, -0.012613296508789062, -0.011538028717041016, -0.010462760925292969, -0.009387493133544922, -0.008312225341796875, -0.007236957550048828, -0.006161689758300781, -0.005086421966552734, -0.0040111541748046875, -0.0029358863830566406, -0.0018606185913085938, -0.0007853507995605469, 0.0002899169921875, 0.0013651847839355469, 0.0024404525756835938, 0.0035157203674316406, 0.0045909881591796875, 0.005666255950927734, 0.006741523742675781, 0.007816791534423828, 0.008892059326171875, 0.009967327117919922, 0.011042594909667969, 0.012117862701416016, 0.013193130493164062, 0.01426839828491211, 0.015343666076660156, 0.016418933868408203, 0.01749420166015625, 0.018569469451904297, 0.019644737243652344, 0.02072000503540039, 0.021795272827148438, 0.022870540618896484, 0.02394580841064453, 0.025021076202392578, 0.026096343994140625, 0.027171611785888672, 0.02824687957763672, 0.029322147369384766, 0.030397415161132812, 0.03147268295288086, 0.032547950744628906, 0.03362321853637695, 0.034698486328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 5.0, 19.0, 12.0, 26.0, 21.0, 21.0, 41.0, 46.0, 80.0, 96.0, 168.0, 273.0, 481.0, 937.0, 2173.0, 6397.0, 26426.0, 178904.0, 682125.0, 121532.0, 19744.0, 5156.0, 1873.0, 791.0, 451.0, 235.0, 153.0, 100.0, 61.0, 49.0, 40.0, 25.0, 18.0, 15.0, 11.0, 8.0, 10.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0560302734375, -0.05424642562866211, -0.05246257781982422, -0.05067873001098633, -0.04889488220214844, -0.04711103439331055, -0.045327186584472656, -0.043543338775634766, -0.041759490966796875, -0.039975643157958984, -0.038191795349121094, -0.0364079475402832, -0.03462409973144531, -0.03284025192260742, -0.03105640411376953, -0.02927255630493164, -0.02748870849609375, -0.02570486068725586, -0.02392101287841797, -0.022137165069580078, -0.020353317260742188, -0.018569469451904297, -0.016785621643066406, -0.015001773834228516, -0.013217926025390625, -0.011434078216552734, -0.009650230407714844, -0.007866382598876953, -0.0060825347900390625, -0.004298686981201172, -0.0025148391723632812, -0.0007309913635253906, 0.0010528564453125, 0.0028367042541503906, 0.004620552062988281, 0.006404399871826172, 0.008188247680664062, 0.009972095489501953, 0.011755943298339844, 0.013539791107177734, 0.015323638916015625, 0.017107486724853516, 0.018891334533691406, 0.020675182342529297, 0.022459030151367188, 0.024242877960205078, 0.02602672576904297, 0.02781057357788086, 0.02959442138671875, 0.03137826919555664, 0.03316211700439453, 0.03494596481323242, 0.03672981262207031, 0.0385136604309082, 0.040297508239746094, 0.042081356048583984, 0.043865203857421875, 0.045649051666259766, 0.047432899475097656, 0.04921674728393555, 0.05100059509277344, 0.05278444290161133, 0.05456829071044922, 0.05635213851928711, 0.058135986328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 14.0, 12.0, 17.0, 28.0, 30.0, 26.0, 34.0, 31.0, 49.0, 54.0, 49.0, 73.0, 59.0, 58.0, 45.0, 52.0, 55.0, 33.0, 47.0, 46.0, 35.0, 28.0, 25.0, 21.0, 14.0, 14.0, 12.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08837890625, -0.08526039123535156, -0.08214187622070312, -0.07902336120605469, -0.07590484619140625, -0.07278633117675781, -0.06966781616210938, -0.06654930114746094, -0.0634307861328125, -0.06031227111816406, -0.057193756103515625, -0.05407524108886719, -0.05095672607421875, -0.04783821105957031, -0.044719696044921875, -0.04160118103027344, -0.038482666015625, -0.03536415100097656, -0.032245635986328125, -0.029127120971679688, -0.02600860595703125, -0.022890090942382812, -0.019771575927734375, -0.016653060913085938, -0.0135345458984375, -0.010416030883789062, -0.007297515869140625, -0.0041790008544921875, -0.00106048583984375, 0.0020580291748046875, 0.005176544189453125, 0.008295059204101562, 0.01141357421875, 0.014532089233398438, 0.017650604248046875, 0.020769119262695312, 0.02388763427734375, 0.027006149291992188, 0.030124664306640625, 0.03324317932128906, 0.0363616943359375, 0.03948020935058594, 0.042598724365234375, 0.04571723937988281, 0.04883575439453125, 0.05195426940917969, 0.055072784423828125, 0.05819129943847656, 0.061309814453125, 0.06442832946777344, 0.06754684448242188, 0.07066535949707031, 0.07378387451171875, 0.07690238952636719, 0.08002090454101562, 0.08313941955566406, 0.0862579345703125, 0.08937644958496094, 0.09249496459960938, 0.09561347961425781, 0.09873199462890625, 0.10185050964355469, 0.10496902465820312, 0.10808753967285156, 0.1112060546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 4.0, 16.0, 12.0, 14.0, 19.0, 38.0, 40.0, 64.0, 86.0, 131.0, 250.0, 410.0, 724.0, 1923.0, 5710.0, 22073.0, 97872.0, 412248.0, 386191.0, 91136.0, 20533.0, 5429.0, 1842.0, 742.0, 369.0, 213.0, 128.0, 102.0, 54.0, 54.0, 33.0, 25.0, 9.0, 15.0, 16.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0108489990234375, -0.010538816452026367, -0.010228633880615234, -0.009918451309204102, -0.009608268737792969, -0.009298086166381836, -0.008987903594970703, -0.00867772102355957, -0.008367538452148438, -0.008057355880737305, -0.007747173309326172, -0.007436990737915039, -0.007126808166503906, -0.0068166255950927734, -0.006506443023681641, -0.006196260452270508, -0.005886077880859375, -0.005575895309448242, -0.005265712738037109, -0.0049555301666259766, -0.004645347595214844, -0.004335165023803711, -0.004024982452392578, -0.0037147998809814453, -0.0034046173095703125, -0.0030944347381591797, -0.002784252166748047, -0.002474069595336914, -0.0021638870239257812, -0.0018537044525146484, -0.0015435218811035156, -0.0012333393096923828, -0.00092315673828125, -0.0006129741668701172, -0.0003027915954589844, 7.3909759521484375e-06, 0.00031757354736328125, 0.0006277561187744141, 0.0009379386901855469, 0.0012481212615966797, 0.0015583038330078125, 0.0018684864044189453, 0.002178668975830078, 0.002488851547241211, 0.0027990341186523438, 0.0031092166900634766, 0.0034193992614746094, 0.003729581832885742, 0.004039764404296875, 0.004349946975708008, 0.004660129547119141, 0.0049703121185302734, 0.005280494689941406, 0.005590677261352539, 0.005900859832763672, 0.006211042404174805, 0.0065212249755859375, 0.00683140754699707, 0.007141590118408203, 0.007451772689819336, 0.007761955261230469, 0.008072137832641602, 0.008382320404052734, 0.008692502975463867, 0.009002685546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 7.0, 8.0, 11.0, 8.0, 24.0, 15.0, 26.0, 32.0, 34.0, 33.0, 52.0, 42.0, 51.0, 41.0, 42.0, 66.0, 49.0, 51.0, 66.0, 38.0, 46.0, 50.0, 20.0, 23.0, 36.0, 23.0, 15.0, 14.0, 10.0, 11.0, 16.0, 9.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.304813385009766e-06, -5.165114998817444e-06, -5.025416612625122e-06, -4.8857182264328e-06, -4.7460198402404785e-06, -4.606321454048157e-06, -4.466623067855835e-06, -4.326924681663513e-06, -4.187226295471191e-06, -4.04752790927887e-06, -3.907829523086548e-06, -3.768131136894226e-06, -3.6284327507019043e-06, -3.4887343645095825e-06, -3.3490359783172607e-06, -3.209337592124939e-06, -3.069639205932617e-06, -2.9299408197402954e-06, -2.7902424335479736e-06, -2.650544047355652e-06, -2.51084566116333e-06, -2.3711472749710083e-06, -2.2314488887786865e-06, -2.0917505025863647e-06, -1.952052116394043e-06, -1.8123537302017212e-06, -1.6726553440093994e-06, -1.5329569578170776e-06, -1.3932585716247559e-06, -1.253560185432434e-06, -1.1138617992401123e-06, -9.741634130477905e-07, -8.344650268554688e-07, -6.94766640663147e-07, -5.550682544708252e-07, -4.153698682785034e-07, -2.7567148208618164e-07, -1.3597309589385986e-07, 3.725290298461914e-09, 1.434236764907837e-07, 2.8312206268310547e-07, 4.2282044887542725e-07, 5.62518835067749e-07, 7.022172212600708e-07, 8.419156074523926e-07, 9.816139936447144e-07, 1.1213123798370361e-06, 1.261010766029358e-06, 1.4007091522216797e-06, 1.5404075384140015e-06, 1.6801059246063232e-06, 1.819804310798645e-06, 1.959502696990967e-06, 2.0992010831832886e-06, 2.2388994693756104e-06, 2.378597855567932e-06, 2.518296241760254e-06, 2.6579946279525757e-06, 2.7976930141448975e-06, 2.9373914003372192e-06, 3.077089786529541e-06, 3.216788172721863e-06, 3.3564865589141846e-06, 3.4961849451065063e-06, 3.635883331298828e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 18.0, 24.0, 32.0, 39.0, 79.0, 153.0, 264.0, 528.0, 1286.0, 3360.0, 11448.0, 50262.0, 247177.0, 524059.0, 163556.0, 33544.0, 8114.0, 2559.0, 1002.0, 449.0, 231.0, 128.0, 81.0, 51.0, 35.0, 17.0, 14.0, 7.0, 1.0, 5.0, 5.0, 0.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01245880126953125, -0.012096285820007324, -0.011733770370483398, -0.011371254920959473, -0.011008739471435547, -0.010646224021911621, -0.010283708572387695, -0.00992119312286377, -0.009558677673339844, -0.009196162223815918, -0.008833646774291992, -0.008471131324768066, -0.00810861587524414, -0.007746100425720215, -0.007383584976196289, -0.007021069526672363, -0.0066585540771484375, -0.006296038627624512, -0.005933523178100586, -0.00557100772857666, -0.005208492279052734, -0.004845976829528809, -0.004483461380004883, -0.004120945930480957, -0.0037584304809570312, -0.0033959150314331055, -0.0030333995819091797, -0.002670884132385254, -0.002308368682861328, -0.0019458532333374023, -0.0015833377838134766, -0.0012208223342895508, -0.000858306884765625, -0.0004957914352416992, -0.00013327598571777344, 0.00022923946380615234, 0.0005917549133300781, 0.0009542703628540039, 0.0013167858123779297, 0.0016793012619018555, 0.0020418167114257812, 0.002404332160949707, 0.002766847610473633, 0.0031293630599975586, 0.0034918785095214844, 0.00385439395904541, 0.004216909408569336, 0.004579424858093262, 0.0049419403076171875, 0.005304455757141113, 0.005666971206665039, 0.006029486656188965, 0.006392002105712891, 0.006754517555236816, 0.007117033004760742, 0.007479548454284668, 0.007842063903808594, 0.00820457935333252, 0.008567094802856445, 0.008929610252380371, 0.009292125701904297, 0.009654641151428223, 0.010017156600952148, 0.010379672050476074, 0.0107421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 12.0, 9.0, 12.0, 16.0, 18.0, 21.0, 25.0, 31.0, 44.0, 44.0, 42.0, 48.0, 40.0, 60.0, 69.0, 56.0, 60.0, 62.0, 51.0, 53.0, 33.0, 40.0, 27.0, 32.0, 20.0, 13.0, 8.0, 10.0, 13.0, 6.0, 11.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0104827880859375, -0.01013195514678955, -0.009781122207641602, -0.009430289268493652, -0.009079456329345703, -0.008728623390197754, -0.008377790451049805, -0.008026957511901855, -0.007676124572753906, -0.007325291633605957, -0.006974458694458008, -0.006623625755310059, -0.006272792816162109, -0.00592195987701416, -0.005571126937866211, -0.005220293998718262, -0.0048694610595703125, -0.004518628120422363, -0.004167795181274414, -0.003816962242126465, -0.0034661293029785156, -0.0031152963638305664, -0.002764463424682617, -0.002413630485534668, -0.0020627975463867188, -0.0017119646072387695, -0.0013611316680908203, -0.001010298728942871, -0.0006594657897949219, -0.00030863285064697266, 4.220008850097656e-05, 0.0003930330276489258, 0.000743865966796875, 0.0010946989059448242, 0.0014455318450927734, 0.0017963647842407227, 0.002147197723388672, 0.002498030662536621, 0.0028488636016845703, 0.0031996965408325195, 0.0035505294799804688, 0.003901362419128418, 0.004252195358276367, 0.004603028297424316, 0.004953861236572266, 0.005304694175720215, 0.005655527114868164, 0.006006360054016113, 0.0063571929931640625, 0.006708025932312012, 0.007058858871459961, 0.00740969181060791, 0.007760524749755859, 0.008111357688903809, 0.008462190628051758, 0.008813023567199707, 0.009163856506347656, 0.009514689445495605, 0.009865522384643555, 0.010216355323791504, 0.010567188262939453, 0.010918021202087402, 0.011268854141235352, 0.0116196870803833, 0.01197052001953125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 8.0, 13.0, 15.0, 22.0, 62.0, 126.0, 192.0, 210.0, 135.0, 95.0, 57.0, 34.0, 21.0, 7.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35261350870132446, -0.3387903571128845, -0.3249672055244446, -0.31114405393600464, -0.2973209023475647, -0.28349775075912476, -0.2696745991706848, -0.25585147738456726, -0.24202832579612732, -0.22820517420768738, -0.21438202261924744, -0.2005588710308075, -0.18673573434352875, -0.1729125827550888, -0.15908943116664886, -0.14526629447937012, -0.13144312798976898, -0.11761997640132904, -0.1037968322634697, -0.08997368067502975, -0.07615053653717041, -0.06232738494873047, -0.04850423336029053, -0.03468108922243118, -0.02085793763399124, -0.007034788839519024, 0.006788359954953194, 0.020611509680747986, 0.03443465754389763, 0.04825780540704727, 0.06208095699548721, 0.07590410113334656, 0.0897272527217865, 0.10355040431022644, 0.11737354844808578, 0.13119670748710632, 0.14501984417438507, 0.158842995762825, 0.17266614735126495, 0.1864892840385437, 0.20031243562698364, 0.21413558721542358, 0.22795873880386353, 0.24178189039230347, 0.2556050419807434, 0.26942819356918335, 0.2832513451576233, 0.29707446694374084, 0.3108976483345032, 0.3247207999229431, 0.33854395151138306, 0.352367103099823, 0.36619025468826294, 0.3800134062767029, 0.3938365578651428, 0.4076596796512604, 0.4214828312397003, 0.43530598282814026, 0.4491291344165802, 0.46295228600502014, 0.4767754375934601, 0.49059855937957764, 0.5044217109680176, 0.5182448625564575, 0.5320680141448975]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 9.0, 10.0, 13.0, 17.0, 11.0, 13.0, 16.0, 29.0, 20.0, 25.0, 22.0, 29.0, 39.0, 37.0, 36.0, 43.0, 57.0, 55.0, 52.0, 49.0, 38.0, 42.0, 36.0, 45.0, 30.0, 19.0, 31.0, 19.0, 19.0, 18.0, 16.0, 19.0, 16.0, 16.0, 8.0, 5.0, 8.0, 10.0, 4.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3543928265571594, -0.34270575642585754, -0.33101871609687805, -0.31933164596557617, -0.3076446056365967, -0.2959575355052948, -0.2842704653739929, -0.2725834250450134, -0.26089635491371155, -0.24920929968357086, -0.23752224445343018, -0.2258351743221283, -0.2141481190919876, -0.20246106386184692, -0.19077400863170624, -0.17908695340156555, -0.16739989817142487, -0.15571284294128418, -0.1440257877111435, -0.1323387324810028, -0.12065166234970093, -0.10896460711956024, -0.09727755188941956, -0.08559048920869827, -0.07390343397855759, -0.0622163750231266, -0.05052931606769562, -0.03884226083755493, -0.027155201882123947, -0.015468142926692963, -0.0037810876965522766, 0.007905974984169006, 0.019593030214309692, 0.03128008916974068, 0.04296714812517166, 0.05465420335531235, 0.06634126603603363, 0.07802832126617432, 0.089715376496315, 0.10140243917703629, 0.11308949440717697, 0.12477654963731766, 0.13646361231803894, 0.14815066754817963, 0.1598377227783203, 0.1715247929096222, 0.18321183323860168, 0.19489890336990356, 0.20658595860004425, 0.21827301383018494, 0.22996006906032562, 0.2416471242904663, 0.2533341944217682, 0.26502126455307007, 0.27670830488204956, 0.28839537501335144, 0.30008241534233093, 0.3117694854736328, 0.3234565258026123, 0.3351435959339142, 0.3468306362628937, 0.35851770639419556, 0.37020474672317505, 0.38189181685447693, 0.3935788869857788]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 13.0, 21.0, 14.0, 25.0, 45.0, 85.0, 137.0, 247.0, 529.0, 1330.0, 6193.0, 4152258.0, 29697.0, 2181.0, 734.0, 322.0, 166.0, 107.0, 50.0, 35.0, 22.0, 12.0, 12.0, 7.0, 4.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.08700942993164062, -0.08386993408203125, -0.08073043823242188, -0.0775909423828125, -0.07445144653320312, -0.07131195068359375, -0.06817245483398438, -0.065032958984375, -0.061893463134765625, -0.05875396728515625, -0.055614471435546875, -0.0524749755859375, -0.049335479736328125, -0.04619598388671875, -0.043056488037109375, -0.0399169921875, -0.036777496337890625, -0.03363800048828125, -0.030498504638671875, -0.0273590087890625, -0.024219512939453125, -0.02108001708984375, -0.017940521240234375, -0.014801025390625, -0.011661529541015625, -0.00852203369140625, -0.005382537841796875, -0.0022430419921875, 0.000896453857421875, 0.00403594970703125, 0.007175445556640625, 0.01031494140625, 0.013454437255859375, 0.01659393310546875, 0.019733428955078125, 0.0228729248046875, 0.026012420654296875, 0.02915191650390625, 0.032291412353515625, 0.035430908203125, 0.038570404052734375, 0.04170989990234375, 0.044849395751953125, 0.0479888916015625, 0.051128387451171875, 0.05426788330078125, 0.057407379150390625, 0.060546875, 0.06368637084960938, 0.06682586669921875, 0.06996536254882812, 0.0731048583984375, 0.07624435424804688, 0.07938385009765625, 0.08252334594726562, 0.085662841796875, 0.08880233764648438, 0.09194183349609375, 0.09508132934570312, 0.0982208251953125, 0.10136032104492188, 0.10449981689453125, 0.10763931274414062, 0.11077880859375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 5.0, 15.0, 13.0, 19.0, 24.0, 35.0, 24.0, 43.0, 52.0, 58.0, 76.0, 75.0, 64.0, 88.0, 64.0, 63.0, 54.0, 46.0, 37.0, 34.0, 29.0, 21.0, 12.0, 9.0, 9.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.036468505859375, -0.035358428955078125, -0.03424835205078125, -0.033138275146484375, -0.0320281982421875, -0.030918121337890625, -0.02980804443359375, -0.028697967529296875, -0.027587890625, -0.026477813720703125, -0.02536773681640625, -0.024257659912109375, -0.0231475830078125, -0.022037506103515625, -0.02092742919921875, -0.019817352294921875, -0.018707275390625, -0.017597198486328125, -0.01648712158203125, -0.015377044677734375, -0.0142669677734375, -0.013156890869140625, -0.01204681396484375, -0.010936737060546875, -0.00982666015625, -0.008716583251953125, -0.00760650634765625, -0.006496429443359375, -0.0053863525390625, -0.004276275634765625, -0.00316619873046875, -0.002056121826171875, -0.000946044921875, 0.000164031982421875, 0.00127410888671875, 0.002384185791015625, 0.0034942626953125, 0.004604339599609375, 0.00571441650390625, 0.006824493408203125, 0.0079345703125, 0.009044647216796875, 0.01015472412109375, 0.011264801025390625, 0.0123748779296875, 0.013484954833984375, 0.01459503173828125, 0.015705108642578125, 0.016815185546875, 0.017925262451171875, 0.01903533935546875, 0.020145416259765625, 0.0212554931640625, 0.022365570068359375, 0.02347564697265625, 0.024585723876953125, 0.02569580078125, 0.026805877685546875, 0.02791595458984375, 0.029026031494140625, 0.0301361083984375, 0.031246185302734375, 0.03235626220703125, 0.033466339111328125, 0.034576416015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 7.0, 6.0, 12.0, 9.0, 9.0, 18.0, 16.0, 25.0, 33.0, 52.0, 55.0, 68.0, 81.0, 135.0, 156.0, 224.0, 310.0, 439.0, 747.0, 1321.0, 3159.0, 12629.0, 343108.0, 3807621.0, 16477.0, 3565.0, 1391.0, 861.0, 478.0, 350.0, 223.0, 152.0, 110.0, 91.0, 74.0, 67.0, 50.0, 50.0, 23.0, 22.0, 18.0, 24.0, 12.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037200927734375, -0.03587532043457031, -0.034549713134765625, -0.03322410583496094, -0.03189849853515625, -0.030572891235351562, -0.029247283935546875, -0.027921676635742188, -0.0265960693359375, -0.025270462036132812, -0.023944854736328125, -0.022619247436523438, -0.02129364013671875, -0.019968032836914062, -0.018642425537109375, -0.017316818237304688, -0.0159912109375, -0.014665603637695312, -0.013339996337890625, -0.012014389038085938, -0.01068878173828125, -0.009363174438476562, -0.008037567138671875, -0.0067119598388671875, -0.0053863525390625, -0.0040607452392578125, -0.002735137939453125, -0.0014095306396484375, -8.392333984375e-05, 0.0012416839599609375, 0.002567291259765625, 0.0038928985595703125, 0.005218505859375, 0.0065441131591796875, 0.007869720458984375, 0.009195327758789062, 0.01052093505859375, 0.011846542358398438, 0.013172149658203125, 0.014497756958007812, 0.0158233642578125, 0.017148971557617188, 0.018474578857421875, 0.019800186157226562, 0.02112579345703125, 0.022451400756835938, 0.023777008056640625, 0.025102615356445312, 0.02642822265625, 0.027753829956054688, 0.029079437255859375, 0.030405044555664062, 0.03173065185546875, 0.03305625915527344, 0.034381866455078125, 0.03570747375488281, 0.0370330810546875, 0.03835868835449219, 0.039684295654296875, 0.04100990295410156, 0.04233551025390625, 0.04366111755371094, 0.044986724853515625, 0.04631233215332031, 0.047637939453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 11.0, 47.0, 135.0, 3588.0, 209.0, 43.0, 24.0, 7.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0194091796875, -0.018954038619995117, -0.018498897552490234, -0.01804375648498535, -0.01758861541748047, -0.017133474349975586, -0.016678333282470703, -0.01622319221496582, -0.015768051147460938, -0.015312910079956055, -0.014857769012451172, -0.014402627944946289, -0.013947486877441406, -0.013492345809936523, -0.01303720474243164, -0.012582063674926758, -0.012126922607421875, -0.011671781539916992, -0.01121664047241211, -0.010761499404907227, -0.010306358337402344, -0.009851217269897461, -0.009396076202392578, -0.008940935134887695, -0.008485794067382812, -0.00803065299987793, -0.007575511932373047, -0.007120370864868164, -0.006665229797363281, -0.0062100887298583984, -0.005754947662353516, -0.005299806594848633, -0.00484466552734375, -0.004389524459838867, -0.003934383392333984, -0.0034792423248291016, -0.0030241012573242188, -0.002568960189819336, -0.002113819122314453, -0.0016586780548095703, -0.0012035369873046875, -0.0007483959197998047, -0.0002932548522949219, 0.00016188621520996094, 0.0006170272827148438, 0.0010721683502197266, 0.0015273094177246094, 0.001982450485229492, 0.002437591552734375, 0.002892732620239258, 0.0033478736877441406, 0.0038030147552490234, 0.004258155822753906, 0.004713296890258789, 0.005168437957763672, 0.005623579025268555, 0.0060787200927734375, 0.00653386116027832, 0.006989002227783203, 0.007444143295288086, 0.007899284362792969, 0.008354425430297852, 0.008809566497802734, 0.009264707565307617, 0.0097198486328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 21.0, 29.0, 55.0, 116.0, 227.0, 263.0, 165.0, 72.0, 39.0, 9.0, 7.0, 1.0, 0.0, 1.0], "bins": [-0.11476375162601471, -0.11268938332796097, -0.11061502248048782, -0.10854065418243408, -0.10646628588438034, -0.1043919175863266, -0.10231755673885345, -0.10024318844079971, -0.09816882014274597, -0.09609445184469223, -0.09402009099721909, -0.09194572269916534, -0.0898713544011116, -0.08779698610305786, -0.08572262525558472, -0.08364825695753098, -0.08157389611005783, -0.07949952781200409, -0.07742516696453094, -0.0753507986664772, -0.07327643036842346, -0.07120206952095032, -0.06912770122289658, -0.06705333292484283, -0.06497897207736969, -0.06290460377931595, -0.060830239206552505, -0.05875587463378906, -0.05668150633573532, -0.05460714176297188, -0.052532777190208435, -0.050458408892154694, -0.04838404059410095, -0.04630967602133751, -0.04423530772328377, -0.042160943150520325, -0.04008657485246658, -0.03801221027970314, -0.0359378457069397, -0.033863477408885956, -0.03178911656141281, -0.02971475012600422, -0.027640383690595627, -0.025566019117832184, -0.02349165268242359, -0.021417286247015, -0.019342921674251556, -0.017268555238842964, -0.015194186940789223, -0.01311982050538063, -0.011045455001294613, -0.008971089497208595, -0.006896723061800003, -0.004822356626391411, -0.0027479911223053932, -0.0006736256182193756, 0.0014007408171892166, 0.0034751067869365215, 0.0055494727566838264, 0.007623838726431131, 0.009698204696178436, 0.011772571131587029, 0.013846936635673046, 0.015921302139759064, 0.017995668575167656]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 8.0, 8.0, 16.0, 23.0, 14.0, 28.0, 23.0, 20.0, 29.0, 30.0, 38.0, 39.0, 45.0, 41.0, 41.0, 50.0, 49.0, 61.0, 44.0, 47.0, 32.0, 33.0, 28.0, 32.0, 28.0, 37.0, 22.0, 15.0, 19.0, 15.0, 10.0, 15.0, 7.0, 4.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01711338758468628, -0.01656441017985344, -0.01601543091237545, -0.015466452576220036, -0.014917474240064621, -0.014368495903909206, -0.013819517567753792, -0.013270539231598377, -0.012721560895442963, -0.012172582559287548, -0.011623604223132133, -0.011074625886976719, -0.010525647550821304, -0.00997666921466589, -0.009427690878510475, -0.00887871254235506, -0.008329734206199646, -0.007780755870044231, -0.007231777533888817, -0.006682799197733402, -0.006133820861577988, -0.005584842525422573, -0.0050358641892671585, -0.004486885853111744, -0.003937907516956329, -0.0033889291808009148, -0.0028399508446455, -0.0022909725084900856, -0.001741994172334671, -0.0011930158361792564, -0.0006440375000238419, -9.505916386842728e-05, 0.0004539191722869873, 0.0010028975084424019, 0.0015518758445978165, 0.002100854180753231, 0.0026498325169086456, 0.00319881085306406, 0.003747789189219475, 0.004296767525374889, 0.004845745861530304, 0.0053947241976857185, 0.005943702533841133, 0.006492680869996548, 0.007041659206151962, 0.007590637542307377, 0.008139615878462791, 0.008688594214618206, 0.00923757255077362, 0.009786550886929035, 0.01033552922308445, 0.010884507559239864, 0.011433485895395279, 0.011982464231550694, 0.012531442567706108, 0.013080420903861523, 0.013629399240016937, 0.014178377576172352, 0.014727355912327766, 0.015276334248483181, 0.015825312584638596, 0.016374289989471436, 0.016923269256949425, 0.017472248524427414, 0.018021225929260254]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 11.0, 19.0, 9.0, 30.0, 35.0, 56.0, 87.0, 100.0, 176.0, 260.0, 416.0, 689.0, 1192.0, 2240.0, 4878.0, 11838.0, 32226.0, 110666.0, 438137.0, 326295.0, 77182.0, 24160.0, 9239.0, 3975.0, 1891.0, 1065.0, 552.0, 381.0, 261.0, 161.0, 99.0, 72.0, 51.0, 35.0, 21.0, 14.0, 9.0, 9.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.052032470703125, -0.05049610137939453, -0.04895973205566406, -0.047423362731933594, -0.045886993408203125, -0.044350624084472656, -0.04281425476074219, -0.04127788543701172, -0.03974151611328125, -0.03820514678955078, -0.03666877746582031, -0.035132408142089844, -0.033596038818359375, -0.032059669494628906, -0.030523300170898438, -0.02898693084716797, -0.0274505615234375, -0.02591419219970703, -0.024377822875976562, -0.022841453552246094, -0.021305084228515625, -0.019768714904785156, -0.018232345581054688, -0.01669597625732422, -0.01515960693359375, -0.013623237609863281, -0.012086868286132812, -0.010550498962402344, -0.009014129638671875, -0.007477760314941406, -0.0059413909912109375, -0.004405021667480469, -0.00286865234375, -0.0013322830200195312, 0.0002040863037109375, 0.0017404556274414062, 0.003276824951171875, 0.004813194274902344, 0.0063495635986328125, 0.007885932922363281, 0.00942230224609375, 0.010958671569824219, 0.012495040893554688, 0.014031410217285156, 0.015567779541015625, 0.017104148864746094, 0.018640518188476562, 0.02017688751220703, 0.0217132568359375, 0.02324962615966797, 0.024785995483398438, 0.026322364807128906, 0.027858734130859375, 0.029395103454589844, 0.030931472778320312, 0.03246784210205078, 0.03400421142578125, 0.03554058074951172, 0.03707695007324219, 0.038613319396972656, 0.040149688720703125, 0.041686058044433594, 0.04322242736816406, 0.04475879669189453, 0.046295166015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 10.0, 8.0, 15.0, 22.0, 25.0, 32.0, 38.0, 41.0, 42.0, 60.0, 73.0, 73.0, 71.0, 81.0, 71.0, 52.0, 64.0, 39.0, 42.0, 30.0, 22.0, 27.0, 12.0, 11.0, 7.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03496837615966797, -0.03386497497558594, -0.032761573791503906, -0.031658172607421875, -0.030554771423339844, -0.029451370239257812, -0.02834796905517578, -0.02724456787109375, -0.02614116668701172, -0.025037765502929688, -0.023934364318847656, -0.022830963134765625, -0.021727561950683594, -0.020624160766601562, -0.01952075958251953, -0.0184173583984375, -0.01731395721435547, -0.016210556030273438, -0.015107154846191406, -0.014003753662109375, -0.012900352478027344, -0.011796951293945312, -0.010693550109863281, -0.00959014892578125, -0.008486747741699219, -0.0073833465576171875, -0.006279945373535156, -0.005176544189453125, -0.004073143005371094, -0.0029697418212890625, -0.0018663406372070312, -0.000762939453125, 0.00034046173095703125, 0.0014438629150390625, 0.0025472640991210938, 0.003650665283203125, 0.004754066467285156, 0.0058574676513671875, 0.006960868835449219, 0.00806427001953125, 0.009167671203613281, 0.010271072387695312, 0.011374473571777344, 0.012477874755859375, 0.013581275939941406, 0.014684677124023438, 0.01578807830810547, 0.0168914794921875, 0.01799488067626953, 0.019098281860351562, 0.020201683044433594, 0.021305084228515625, 0.022408485412597656, 0.023511886596679688, 0.02461528778076172, 0.02571868896484375, 0.02682209014892578, 0.027925491333007812, 0.029028892517089844, 0.030132293701171875, 0.031235694885253906, 0.03233909606933594, 0.03344249725341797, 0.0345458984375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 4.0, 14.0, 12.0, 22.0, 28.0, 43.0, 41.0, 67.0, 125.0, 174.0, 283.0, 576.0, 1231.0, 3492.0, 11392.0, 51830.0, 500800.0, 417326.0, 45220.0, 10116.0, 3137.0, 1205.0, 590.0, 278.0, 159.0, 99.0, 70.0, 48.0, 36.0, 30.0, 29.0, 17.0, 11.0, 4.0, 12.0, 6.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052093505859375, -0.05023050308227539, -0.04836750030517578, -0.04650449752807617, -0.04464149475097656, -0.04277849197387695, -0.040915489196777344, -0.039052486419677734, -0.037189483642578125, -0.035326480865478516, -0.033463478088378906, -0.0316004753112793, -0.029737472534179688, -0.027874469757080078, -0.02601146697998047, -0.02414846420288086, -0.02228546142578125, -0.02042245864868164, -0.01855945587158203, -0.016696453094482422, -0.014833450317382812, -0.012970447540283203, -0.011107444763183594, -0.009244441986083984, -0.007381439208984375, -0.005518436431884766, -0.0036554336547851562, -0.0017924308776855469, 7.05718994140625e-05, 0.0019335746765136719, 0.0037965774536132812, 0.005659580230712891, 0.0075225830078125, 0.00938558578491211, 0.011248588562011719, 0.013111591339111328, 0.014974594116210938, 0.016837596893310547, 0.018700599670410156, 0.020563602447509766, 0.022426605224609375, 0.024289608001708984, 0.026152610778808594, 0.028015613555908203, 0.029878616333007812, 0.03174161911010742, 0.03360462188720703, 0.03546762466430664, 0.03733062744140625, 0.03919363021850586, 0.04105663299560547, 0.04291963577270508, 0.04478263854980469, 0.0466456413269043, 0.048508644104003906, 0.050371646881103516, 0.052234649658203125, 0.054097652435302734, 0.055960655212402344, 0.05782365798950195, 0.05968666076660156, 0.06154966354370117, 0.06341266632080078, 0.06527566909790039, 0.067138671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 10.0, 17.0, 11.0, 10.0, 17.0, 23.0, 27.0, 35.0, 20.0, 39.0, 25.0, 42.0, 40.0, 30.0, 48.0, 37.0, 36.0, 47.0, 48.0, 34.0, 36.0, 30.0, 33.0, 43.0, 38.0, 29.0, 17.0, 26.0, 20.0, 16.0, 16.0, 18.0, 13.0, 12.0, 15.0, 7.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0716552734375, -0.06933403015136719, -0.06701278686523438, -0.06469154357910156, -0.06237030029296875, -0.06004905700683594, -0.057727813720703125, -0.05540657043457031, -0.0530853271484375, -0.05076408386230469, -0.048442840576171875, -0.04612159729003906, -0.04380035400390625, -0.04147911071777344, -0.039157867431640625, -0.03683662414550781, -0.034515380859375, -0.03219413757324219, -0.029872894287109375, -0.027551651000976562, -0.02523040771484375, -0.022909164428710938, -0.020587921142578125, -0.018266677856445312, -0.0159454345703125, -0.013624191284179688, -0.011302947998046875, -0.008981704711914062, -0.00666046142578125, -0.0043392181396484375, -0.002017974853515625, 0.0003032684326171875, 0.00262451171875, 0.0049457550048828125, 0.007266998291015625, 0.009588241577148438, 0.01190948486328125, 0.014230728149414062, 0.016551971435546875, 0.018873214721679688, 0.0211944580078125, 0.023515701293945312, 0.025836944580078125, 0.028158187866210938, 0.03047943115234375, 0.03280067443847656, 0.035121917724609375, 0.03744316101074219, 0.039764404296875, 0.04208564758300781, 0.044406890869140625, 0.04672813415527344, 0.04904937744140625, 0.05137062072753906, 0.053691864013671875, 0.05601310729980469, 0.0583343505859375, 0.06065559387207031, 0.06297683715820312, 0.06529808044433594, 0.06761932373046875, 0.06994056701660156, 0.07226181030273438, 0.07458305358886719, 0.076904296875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 11.0, 5.0, 12.0, 9.0, 14.0, 17.0, 34.0, 35.0, 63.0, 112.0, 208.0, 510.0, 1447.0, 6181.0, 51314.0, 750374.0, 218433.0, 15493.0, 2773.0, 826.0, 303.0, 125.0, 71.0, 52.0, 25.0, 20.0, 17.0, 12.0, 13.0, 13.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0187835693359375, -0.01820993423461914, -0.01763629913330078, -0.017062664031982422, -0.016489028930664062, -0.015915393829345703, -0.015341758728027344, -0.014768123626708984, -0.014194488525390625, -0.013620853424072266, -0.013047218322753906, -0.012473583221435547, -0.011899948120117188, -0.011326313018798828, -0.010752677917480469, -0.01017904281616211, -0.00960540771484375, -0.00903177261352539, -0.008458137512207031, -0.007884502410888672, -0.0073108673095703125, -0.006737232208251953, -0.006163597106933594, -0.005589962005615234, -0.005016326904296875, -0.004442691802978516, -0.0038690567016601562, -0.003295421600341797, -0.0027217864990234375, -0.002148151397705078, -0.0015745162963867188, -0.0010008811950683594, -0.00042724609375, 0.00014638900756835938, 0.0007200241088867188, 0.0012936592102050781, 0.0018672943115234375, 0.002440929412841797, 0.0030145645141601562, 0.0035881996154785156, 0.004161834716796875, 0.004735469818115234, 0.005309104919433594, 0.005882740020751953, 0.0064563751220703125, 0.007030010223388672, 0.007603645324707031, 0.00817728042602539, 0.00875091552734375, 0.00932455062866211, 0.009898185729980469, 0.010471820831298828, 0.011045455932617188, 0.011619091033935547, 0.012192726135253906, 0.012766361236572266, 0.013339996337890625, 0.013913631439208984, 0.014487266540527344, 0.015060901641845703, 0.015634536743164062, 0.016208171844482422, 0.01678180694580078, 0.01735544204711914, 0.0179290771484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 3.0, 16.0, 7.0, 13.0, 16.0, 25.0, 20.0, 23.0, 13.0, 35.0, 35.0, 46.0, 36.0, 42.0, 27.0, 61.0, 53.0, 54.0, 46.0, 50.0, 45.0, 25.0, 51.0, 36.0, 40.0, 36.0, 25.0, 12.0, 30.0, 14.0, 11.0, 16.0, 4.0, 8.0, 2.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.645196557044983e-06, -3.5353004932403564e-06, -3.42540442943573e-06, -3.3155083656311035e-06, -3.205612301826477e-06, -3.0957162380218506e-06, -2.985820174217224e-06, -2.8759241104125977e-06, -2.766028046607971e-06, -2.6561319828033447e-06, -2.5462359189987183e-06, -2.436339855194092e-06, -2.3264437913894653e-06, -2.216547727584839e-06, -2.1066516637802124e-06, -1.996755599975586e-06, -1.8868595361709595e-06, -1.776963472366333e-06, -1.6670674085617065e-06, -1.55717134475708e-06, -1.4472752809524536e-06, -1.3373792171478271e-06, -1.2274831533432007e-06, -1.1175870895385742e-06, -1.0076910257339478e-06, -8.977949619293213e-07, -7.878988981246948e-07, -6.780028343200684e-07, -5.681067705154419e-07, -4.5821070671081543e-07, -3.4831464290618896e-07, -2.384185791015625e-07, -1.2852251529693604e-07, -1.862645149230957e-08, 9.12696123123169e-08, 2.0116567611694336e-07, 3.110617399215698e-07, 4.209578037261963e-07, 5.308538675308228e-07, 6.407499313354492e-07, 7.506459951400757e-07, 8.605420589447021e-07, 9.704381227493286e-07, 1.080334186553955e-06, 1.1902302503585815e-06, 1.300126314163208e-06, 1.4100223779678345e-06, 1.519918441772461e-06, 1.6298145055770874e-06, 1.7397105693817139e-06, 1.8496066331863403e-06, 1.959502696990967e-06, 2.0693987607955933e-06, 2.1792948246002197e-06, 2.289190888404846e-06, 2.3990869522094727e-06, 2.508983016014099e-06, 2.6188790798187256e-06, 2.728775143623352e-06, 2.8386712074279785e-06, 2.948567271232605e-06, 3.0584633350372314e-06, 3.168359398841858e-06, 3.2782554626464844e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 4.0, 6.0, 11.0, 13.0, 15.0, 29.0, 33.0, 68.0, 84.0, 161.0, 301.0, 537.0, 1170.0, 2952.0, 10875.0, 71725.0, 568921.0, 341849.0, 38800.0, 6956.0, 2071.0, 882.0, 465.0, 243.0, 131.0, 62.0, 44.0, 41.0, 23.0, 20.0, 14.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0137176513671875, -0.013300061225891113, -0.012882471084594727, -0.01246488094329834, -0.012047290802001953, -0.011629700660705566, -0.01121211051940918, -0.010794520378112793, -0.010376930236816406, -0.00995934009552002, -0.009541749954223633, -0.009124159812927246, -0.00870656967163086, -0.008288979530334473, -0.007871389389038086, -0.007453799247741699, -0.0070362091064453125, -0.006618618965148926, -0.006201028823852539, -0.005783438682556152, -0.005365848541259766, -0.004948258399963379, -0.004530668258666992, -0.0041130781173706055, -0.0036954879760742188, -0.003277897834777832, -0.0028603076934814453, -0.0024427175521850586, -0.002025127410888672, -0.0016075372695922852, -0.0011899471282958984, -0.0007723569869995117, -0.000354766845703125, 6.282329559326172e-05, 0.00048041343688964844, 0.0008980035781860352, 0.0013155937194824219, 0.0017331838607788086, 0.0021507740020751953, 0.002568364143371582, 0.0029859542846679688, 0.0034035444259643555, 0.003821134567260742, 0.004238724708557129, 0.004656314849853516, 0.005073904991149902, 0.005491495132446289, 0.005909085273742676, 0.0063266754150390625, 0.006744265556335449, 0.007161855697631836, 0.007579445838928223, 0.00799703598022461, 0.008414626121520996, 0.008832216262817383, 0.00924980640411377, 0.009667396545410156, 0.010084986686706543, 0.01050257682800293, 0.010920166969299316, 0.011337757110595703, 0.01175534725189209, 0.012172937393188477, 0.012590527534484863, 0.01300811767578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 12.0, 20.0, 22.0, 30.0, 30.0, 51.0, 71.0, 106.0, 112.0, 123.0, 124.0, 79.0, 68.0, 37.0, 31.0, 25.0, 15.0, 11.0, 7.0, 8.0, 0.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01436614990234375, -0.013744473457336426, -0.013122797012329102, -0.012501120567321777, -0.011879444122314453, -0.011257767677307129, -0.010636091232299805, -0.01001441478729248, -0.009392738342285156, -0.008771061897277832, -0.008149385452270508, -0.007527709007263184, -0.006906032562255859, -0.006284356117248535, -0.005662679672241211, -0.005041003227233887, -0.0044193267822265625, -0.0037976503372192383, -0.003175973892211914, -0.00255429744720459, -0.0019326210021972656, -0.0013109445571899414, -0.0006892681121826172, -6.759166717529297e-05, 0.0005540847778320312, 0.0011757612228393555, 0.0017974376678466797, 0.002419114112854004, 0.003040790557861328, 0.0036624670028686523, 0.0042841434478759766, 0.004905819892883301, 0.005527496337890625, 0.006149172782897949, 0.0067708492279052734, 0.007392525672912598, 0.008014202117919922, 0.008635878562927246, 0.00925755500793457, 0.009879231452941895, 0.010500907897949219, 0.011122584342956543, 0.011744260787963867, 0.012365937232971191, 0.012987613677978516, 0.01360929012298584, 0.014230966567993164, 0.014852643013000488, 0.015474319458007812, 0.016095995903015137, 0.01671767234802246, 0.017339348793029785, 0.01796102523803711, 0.018582701683044434, 0.019204378128051758, 0.019826054573059082, 0.020447731018066406, 0.02106940746307373, 0.021691083908081055, 0.02231276035308838, 0.022934436798095703, 0.023556113243103027, 0.02417778968811035, 0.024799466133117676, 0.025421142578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 15.0, 18.0, 19.0, 53.0, 64.0, 93.0, 122.0, 163.0, 139.0, 100.0, 78.0, 46.0, 33.0, 16.0, 19.0, 10.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29850900173187256, -0.2884170711040497, -0.2783251404762268, -0.26823320984840393, -0.25814127922058105, -0.24804934859275818, -0.2379574030637741, -0.22786547243595123, -0.21777354180812836, -0.20768161118030548, -0.1975896805524826, -0.18749774992465973, -0.17740580439567566, -0.16731387376785278, -0.1572219431400299, -0.14713001251220703, -0.13703808188438416, -0.12694615125656128, -0.1168542206287384, -0.10676228255033493, -0.09667035192251205, -0.08657842129468918, -0.0764864832162857, -0.06639455258846283, -0.056302621960639954, -0.04621069133281708, -0.0361187569797039, -0.026026824489235878, -0.015934891998767853, -0.005842961370944977, 0.004248972982168198, 0.014340907335281372, 0.024432837963104248, 0.034524768590927124, 0.0446167029440403, 0.05470863729715347, 0.06480056792497635, 0.07489249855279922, 0.0849844366312027, 0.09507636725902557, 0.10516829788684845, 0.11526022851467133, 0.1253521591424942, 0.13544408977031708, 0.14553603529930115, 0.15562796592712402, 0.1657198965549469, 0.17581182718276978, 0.18590375781059265, 0.19599568843841553, 0.2060876190662384, 0.21617954969406128, 0.22627148032188416, 0.23636341094970703, 0.2464553564786911, 0.2565472722053528, 0.26663923263549805, 0.2767311632633209, 0.2868230938911438, 0.2969150245189667, 0.30700695514678955, 0.3170988857746124, 0.3271908164024353, 0.33728277683258057, 0.34737467765808105]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 6.0, 5.0, 11.0, 11.0, 10.0, 12.0, 11.0, 25.0, 26.0, 19.0, 26.0, 38.0, 35.0, 45.0, 37.0, 52.0, 47.0, 45.0, 61.0, 71.0, 56.0, 48.0, 43.0, 38.0, 35.0, 26.0, 31.0, 24.0, 21.0, 17.0, 14.0, 14.0, 10.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.4649689793586731, -0.4517395496368408, -0.43851009011268616, -0.4252806603908539, -0.4120512008666992, -0.39882177114486694, -0.38559234142303467, -0.37236288189888, -0.35913345217704773, -0.34590402245521545, -0.3326745629310608, -0.3194451332092285, -0.30621567368507385, -0.2929862439632416, -0.2797567844390869, -0.26652735471725464, -0.25329792499542236, -0.2400684803724289, -0.22683903574943542, -0.21360960602760315, -0.20038016140460968, -0.1871507167816162, -0.17392127215862274, -0.16069182753562927, -0.1474623680114746, -0.13423292338848114, -0.12100348621606827, -0.1077740415930748, -0.09454460442066193, -0.08131515979766846, -0.06808571517467499, -0.054856278002262115, -0.04162684082984924, -0.028397399932146072, -0.015167957171797752, -0.0019385144114494324, 0.011290926486253738, 0.02452036738395691, 0.03774981200695038, 0.05097924917936325, 0.06420869380235672, 0.07743813842535019, 0.09066757559776306, 0.10389702022075653, 0.11712646484375, 0.13035589456558228, 0.14358535408973694, 0.1568147838115692, 0.17004422843456268, 0.18327367305755615, 0.19650311768054962, 0.2097325623035431, 0.22296199202537537, 0.23619143664836884, 0.2494208812713623, 0.2626503109931946, 0.27587977051734924, 0.2891092002391815, 0.3023386597633362, 0.31556808948516846, 0.3287975490093231, 0.3420269787311554, 0.35525643825531006, 0.36848586797714233, 0.3817152976989746]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 11.0, 6.0, 8.0, 14.0, 37.0, 32.0, 30.0, 58.0, 96.0, 233.0, 967.0, 4189302.0, 2840.0, 290.0, 131.0, 59.0, 55.0, 37.0, 25.0, 16.0, 10.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.3140830993652344, -0.30272674560546875, -0.2913703918457031, -0.2800140380859375, -0.2686576843261719, -0.25730133056640625, -0.24594497680664062, -0.234588623046875, -0.22323226928710938, -0.21187591552734375, -0.20051956176757812, -0.1891632080078125, -0.17780685424804688, -0.16645050048828125, -0.15509414672851562, -0.14373779296875, -0.13238143920898438, -0.12102508544921875, -0.10966873168945312, -0.0983123779296875, -0.08695602416992188, -0.07559967041015625, -0.06424331665039062, -0.052886962890625, -0.041530609130859375, -0.03017425537109375, -0.018817901611328125, -0.0074615478515625, 0.003894805908203125, 0.01525115966796875, 0.026607513427734375, 0.0379638671875, 0.049320220947265625, 0.06067657470703125, 0.07203292846679688, 0.0833892822265625, 0.09474563598632812, 0.10610198974609375, 0.11745834350585938, 0.128814697265625, 0.14017105102539062, 0.15152740478515625, 0.16288375854492188, 0.1742401123046875, 0.18559646606445312, 0.19695281982421875, 0.20830917358398438, 0.21966552734375, 0.23102188110351562, 0.24237823486328125, 0.2537345886230469, 0.2650909423828125, 0.2764472961425781, 0.28780364990234375, 0.2991600036621094, 0.310516357421875, 0.3218727111816406, 0.33322906494140625, 0.3445854187011719, 0.3559417724609375, 0.3672981262207031, 0.37865447998046875, 0.3900108337402344, 0.4013671875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 9.0, 6.0, 10.0, 8.0, 18.0, 28.0, 30.0, 34.0, 42.0, 44.0, 63.0, 78.0, 57.0, 84.0, 77.0, 73.0, 55.0, 55.0, 59.0, 30.0, 39.0, 30.0, 16.0, 10.0, 13.0, 7.0, 5.0, 2.0, 3.0, 6.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0382080078125, -0.037077903747558594, -0.03594779968261719, -0.03481769561767578, -0.033687591552734375, -0.03255748748779297, -0.03142738342285156, -0.030297279357910156, -0.02916717529296875, -0.028037071228027344, -0.026906967163085938, -0.02577686309814453, -0.024646759033203125, -0.02351665496826172, -0.022386550903320312, -0.021256446838378906, -0.0201263427734375, -0.018996238708496094, -0.017866134643554688, -0.01673603057861328, -0.015605926513671875, -0.014475822448730469, -0.013345718383789062, -0.012215614318847656, -0.01108551025390625, -0.009955406188964844, -0.008825302124023438, -0.007695198059082031, -0.006565093994140625, -0.005434989929199219, -0.0043048858642578125, -0.0031747817993164062, -0.002044677734375, -0.0009145736694335938, 0.0002155303955078125, 0.0013456344604492188, 0.002475738525390625, 0.0036058425903320312, 0.0047359466552734375, 0.005866050720214844, 0.00699615478515625, 0.008126258850097656, 0.009256362915039062, 0.010386466979980469, 0.011516571044921875, 0.012646675109863281, 0.013776779174804688, 0.014906883239746094, 0.0160369873046875, 0.017167091369628906, 0.018297195434570312, 0.01942729949951172, 0.020557403564453125, 0.02168750762939453, 0.022817611694335938, 0.023947715759277344, 0.02507781982421875, 0.026207923889160156, 0.027338027954101562, 0.02846813201904297, 0.029598236083984375, 0.03072834014892578, 0.03185844421386719, 0.032988548278808594, 0.03411865234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 9.0, 17.0, 32.0, 39.0, 44.0, 72.0, 82.0, 122.0, 134.0, 218.0, 311.0, 531.0, 760.0, 1391.0, 2497.0, 5522.0, 18960.0, 3648442.0, 484981.0, 18462.0, 5418.0, 2523.0, 1286.0, 780.0, 483.0, 320.0, 223.0, 144.0, 106.0, 80.0, 70.0, 72.0, 40.0, 32.0, 20.0, 9.0, 12.0, 6.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.031890869140625, -0.030861854553222656, -0.029832839965820312, -0.02880382537841797, -0.027774810791015625, -0.02674579620361328, -0.025716781616210938, -0.024687767028808594, -0.02365875244140625, -0.022629737854003906, -0.021600723266601562, -0.02057170867919922, -0.019542694091796875, -0.01851367950439453, -0.017484664916992188, -0.016455650329589844, -0.0154266357421875, -0.014397621154785156, -0.013368606567382812, -0.012339591979980469, -0.011310577392578125, -0.010281562805175781, -0.009252548217773438, -0.008223533630371094, -0.00719451904296875, -0.006165504455566406, -0.0051364898681640625, -0.004107475280761719, -0.003078460693359375, -0.0020494461059570312, -0.0010204315185546875, 8.58306884765625e-06, 0.00103759765625, 0.0020666122436523438, 0.0030956268310546875, 0.004124641418457031, 0.005153656005859375, 0.006182670593261719, 0.0072116851806640625, 0.008240699768066406, 0.00926971435546875, 0.010298728942871094, 0.011327743530273438, 0.012356758117675781, 0.013385772705078125, 0.014414787292480469, 0.015443801879882812, 0.016472816467285156, 0.0175018310546875, 0.018530845642089844, 0.019559860229492188, 0.02058887481689453, 0.021617889404296875, 0.02264690399169922, 0.023675918579101562, 0.024704933166503906, 0.02573394775390625, 0.026762962341308594, 0.027791976928710938, 0.02882099151611328, 0.029850006103515625, 0.03087902069091797, 0.03190803527832031, 0.032937049865722656, 0.033966064453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 12.0, 44.0, 279.0, 3634.0, 58.0, 15.0, 2.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015655517578125, -0.015152215957641602, -0.014648914337158203, -0.014145612716674805, -0.013642311096191406, -0.013139009475708008, -0.01263570785522461, -0.012132406234741211, -0.011629104614257812, -0.011125802993774414, -0.010622501373291016, -0.010119199752807617, -0.009615898132324219, -0.00911259651184082, -0.008609294891357422, -0.008105993270874023, -0.007602691650390625, -0.0070993900299072266, -0.006596088409423828, -0.00609278678894043, -0.005589485168457031, -0.005086183547973633, -0.004582881927490234, -0.004079580307006836, -0.0035762786865234375, -0.003072977066040039, -0.0025696754455566406, -0.002066373825073242, -0.0015630722045898438, -0.0010597705841064453, -0.0005564689636230469, -5.316734313964844e-05, 0.00045013427734375, 0.0009534358978271484, 0.0014567375183105469, 0.0019600391387939453, 0.0024633407592773438, 0.002966642379760742, 0.0034699440002441406, 0.003973245620727539, 0.0044765472412109375, 0.004979848861694336, 0.005483150482177734, 0.005986452102661133, 0.006489753723144531, 0.00699305534362793, 0.007496356964111328, 0.007999658584594727, 0.008502960205078125, 0.009006261825561523, 0.009509563446044922, 0.01001286506652832, 0.010516166687011719, 0.011019468307495117, 0.011522769927978516, 0.012026071548461914, 0.012529373168945312, 0.013032674789428711, 0.01353597640991211, 0.014039278030395508, 0.014542579650878906, 0.015045881271362305, 0.015549182891845703, 0.0160524845123291, 0.0165557861328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 38.0, 85.0, 237.0, 347.0, 194.0, 69.0, 24.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051758598536252975, -0.049242254346609116, -0.046725913882255554, -0.044209569692611694, -0.041693225502967834, -0.03917688503861427, -0.03666054084897041, -0.03414420038461685, -0.03162785619497299, -0.02911151386797428, -0.02659517154097557, -0.02407882735133171, -0.021562485024333, -0.01904614269733429, -0.01652979850769043, -0.014013456180691719, -0.011497113853693008, -0.008980771526694298, -0.0064644282683730125, -0.003948085475713015, -0.0014317426830530167, 0.001084599643945694, 0.0036009429022669792, 0.0061172861605882645, 0.008633628487586975, 0.011149970814585686, 0.013666314072906971, 0.016182657331228256, 0.018698999658226967, 0.021215341985225677, 0.023731686174869537, 0.026248028501868248, 0.028764374554157257, 0.03128071874380112, 0.03379705920815468, 0.03631340339779854, 0.0388297438621521, 0.04134608805179596, 0.04386243224143982, 0.04637877643108368, 0.04889511689543724, 0.0514114610850811, 0.05392780154943466, 0.05644414573907852, 0.05896048992872238, 0.06147683039307594, 0.0639931708574295, 0.06650951504707336, 0.06902585923671722, 0.07154220342636108, 0.07405854761600494, 0.0765748843550682, 0.07909122854471207, 0.08160757273435593, 0.08412391692399979, 0.08664026111364365, 0.08915659785270691, 0.09167294204235077, 0.09418928623199463, 0.09670562297105789, 0.09922196716070175, 0.10173831135034561, 0.10425465553998947, 0.10677099972963333, 0.10928734391927719]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 13.0, 11.0, 7.0, 15.0, 14.0, 14.0, 22.0, 22.0, 24.0, 31.0, 21.0, 37.0, 39.0, 45.0, 39.0, 38.0, 49.0, 50.0, 43.0, 39.0, 42.0, 50.0, 32.0, 32.0, 38.0, 38.0, 41.0, 14.0, 24.0, 23.0, 12.0, 19.0, 10.0, 13.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02038675546646118, -0.01981344074010849, -0.019240127876400948, -0.018666815012693405, -0.018093500286340714, -0.017520185559988022, -0.01694687269628048, -0.016373559832572937, -0.015800245106220245, -0.015226931311190128, -0.014653617516160011, -0.014080303721129894, -0.013506989926099777, -0.01293367613106966, -0.012360362336039543, -0.011787048541009426, -0.011213734745979309, -0.010640420950949192, -0.010067107155919075, -0.009493793360888958, -0.008920479565858841, -0.008347165770828724, -0.007773851975798607, -0.00720053818076849, -0.006627224385738373, -0.006053910590708256, -0.005480596795678139, -0.004907283000648022, -0.004333969205617905, -0.0037606554105877876, -0.0031873416155576706, -0.0026140278205275536, -0.0020407140254974365, -0.0014674002304673195, -0.0008940864354372025, -0.0003207726404070854, 0.0002525411546230316, 0.0008258549496531487, 0.0013991687446832657, 0.0019724825397133827, 0.0025457963347434998, 0.003119110129773617, 0.003692423924803734, 0.004265737719833851, 0.004839051514863968, 0.005412365309894085, 0.005985679104924202, 0.006558992899954319, 0.007132306694984436, 0.007705620490014553, 0.00827893428504467, 0.008852248080074787, 0.009425561875104904, 0.009998875670135021, 0.010572189465165138, 0.011145503260195255, 0.011718817055225372, 0.01229213085025549, 0.012865444645285606, 0.013438758440315723, 0.01401207223534584, 0.014585386030375957, 0.015158699825406075, 0.015732012689113617, 0.01630532741546631]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 6.0, 6.0, 9.0, 7.0, 14.0, 23.0, 39.0, 46.0, 54.0, 71.0, 96.0, 133.0, 249.0, 392.0, 516.0, 867.0, 1685.0, 3242.0, 8843.0, 63006.0, 830989.0, 117809.0, 11850.0, 3854.0, 1842.0, 1026.0, 624.0, 383.0, 256.0, 164.0, 125.0, 86.0, 44.0, 48.0, 31.0, 32.0, 27.0, 8.0, 14.0, 7.0, 3.0, 4.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0921630859375, -0.08924674987792969, -0.08633041381835938, -0.08341407775878906, -0.08049774169921875, -0.07758140563964844, -0.07466506958007812, -0.07174873352050781, -0.0688323974609375, -0.06591606140136719, -0.06299972534179688, -0.06008338928222656, -0.05716705322265625, -0.05425071716308594, -0.051334381103515625, -0.04841804504394531, -0.045501708984375, -0.04258537292480469, -0.039669036865234375, -0.03675270080566406, -0.03383636474609375, -0.030920028686523438, -0.028003692626953125, -0.025087356567382812, -0.0221710205078125, -0.019254684448242188, -0.016338348388671875, -0.013422012329101562, -0.01050567626953125, -0.0075893402099609375, -0.004673004150390625, -0.0017566680908203125, 0.00115966796875, 0.0040760040283203125, 0.006992340087890625, 0.009908676147460938, 0.01282501220703125, 0.015741348266601562, 0.018657684326171875, 0.021574020385742188, 0.0244903564453125, 0.027406692504882812, 0.030323028564453125, 0.03323936462402344, 0.03615570068359375, 0.03907203674316406, 0.041988372802734375, 0.04490470886230469, 0.047821044921875, 0.05073738098144531, 0.053653717041015625, 0.05657005310058594, 0.05948638916015625, 0.06240272521972656, 0.06531906127929688, 0.06823539733886719, 0.0711517333984375, 0.07406806945800781, 0.07698440551757812, 0.07990074157714844, 0.08281707763671875, 0.08573341369628906, 0.08864974975585938, 0.09156608581542969, 0.094482421875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 5.0, 6.0, 10.0, 9.0, 20.0, 26.0, 30.0, 27.0, 41.0, 44.0, 47.0, 66.0, 79.0, 76.0, 73.0, 82.0, 61.0, 54.0, 46.0, 46.0, 33.0, 27.0, 28.0, 12.0, 6.0, 11.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.038330078125, -0.03720569610595703, -0.03608131408691406, -0.034956932067871094, -0.033832550048828125, -0.032708168029785156, -0.03158378601074219, -0.03045940399169922, -0.02933502197265625, -0.02821063995361328, -0.027086257934570312, -0.025961875915527344, -0.024837493896484375, -0.023713111877441406, -0.022588729858398438, -0.02146434783935547, -0.0203399658203125, -0.01921558380126953, -0.018091201782226562, -0.016966819763183594, -0.015842437744140625, -0.014718055725097656, -0.013593673706054688, -0.012469291687011719, -0.01134490966796875, -0.010220527648925781, -0.009096145629882812, -0.007971763610839844, -0.006847381591796875, -0.005722999572753906, -0.0045986175537109375, -0.0034742355346679688, -0.002349853515625, -0.0012254714965820312, -0.0001010894775390625, 0.0010232925415039062, 0.002147674560546875, 0.0032720565795898438, 0.0043964385986328125, 0.005520820617675781, 0.00664520263671875, 0.007769584655761719, 0.008893966674804688, 0.010018348693847656, 0.011142730712890625, 0.012267112731933594, 0.013391494750976562, 0.014515876770019531, 0.0156402587890625, 0.01676464080810547, 0.017889022827148438, 0.019013404846191406, 0.020137786865234375, 0.021262168884277344, 0.022386550903320312, 0.02351093292236328, 0.02463531494140625, 0.02575969696044922, 0.026884078979492188, 0.028008460998535156, 0.029132843017578125, 0.030257225036621094, 0.03138160705566406, 0.03250598907470703, 0.03363037109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 6.0, 19.0, 20.0, 30.0, 39.0, 42.0, 96.0, 137.0, 197.0, 353.0, 649.0, 1248.0, 2615.0, 8955.0, 162104.0, 842583.0, 21706.0, 4099.0, 1612.0, 873.0, 430.0, 277.0, 185.0, 77.0, 59.0, 49.0, 32.0, 16.0, 16.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09405517578125, -0.0908355712890625, -0.087615966796875, -0.0843963623046875, -0.0811767578125, -0.0779571533203125, -0.074737548828125, -0.0715179443359375, -0.06829833984375, -0.0650787353515625, -0.061859130859375, -0.0586395263671875, -0.055419921875, -0.0522003173828125, -0.048980712890625, -0.0457611083984375, -0.04254150390625, -0.0393218994140625, -0.036102294921875, -0.0328826904296875, -0.0296630859375, -0.0264434814453125, -0.023223876953125, -0.0200042724609375, -0.01678466796875, -0.0135650634765625, -0.010345458984375, -0.0071258544921875, -0.00390625, -0.0006866455078125, 0.002532958984375, 0.0057525634765625, 0.00897216796875, 0.0121917724609375, 0.015411376953125, 0.0186309814453125, 0.0218505859375, 0.0250701904296875, 0.028289794921875, 0.0315093994140625, 0.03472900390625, 0.0379486083984375, 0.041168212890625, 0.0443878173828125, 0.047607421875, 0.0508270263671875, 0.054046630859375, 0.0572662353515625, 0.06048583984375, 0.0637054443359375, 0.066925048828125, 0.0701446533203125, 0.0733642578125, 0.0765838623046875, 0.079803466796875, 0.0830230712890625, 0.08624267578125, 0.0894622802734375, 0.092681884765625, 0.0959014892578125, 0.09912109375, 0.1023406982421875, 0.105560302734375, 0.1087799072265625, 0.11199951171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 9.0, 12.0, 12.0, 10.0, 17.0, 17.0, 33.0, 32.0, 39.0, 40.0, 59.0, 53.0, 55.0, 72.0, 51.0, 53.0, 52.0, 59.0, 39.0, 39.0, 51.0, 34.0, 34.0, 29.0, 24.0, 16.0, 14.0, 12.0, 11.0, 7.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11834716796875, -0.1147623062133789, -0.11117744445800781, -0.10759258270263672, -0.10400772094726562, -0.10042285919189453, -0.09683799743652344, -0.09325313568115234, -0.08966827392578125, -0.08608341217041016, -0.08249855041503906, -0.07891368865966797, -0.07532882690429688, -0.07174396514892578, -0.06815910339355469, -0.0645742416381836, -0.0609893798828125, -0.057404518127441406, -0.05381965637207031, -0.05023479461669922, -0.046649932861328125, -0.04306507110595703, -0.03948020935058594, -0.035895347595214844, -0.03231048583984375, -0.028725624084472656, -0.025140762329101562, -0.02155590057373047, -0.017971038818359375, -0.014386177062988281, -0.010801315307617188, -0.007216453552246094, -0.003631591796875, -4.673004150390625e-05, 0.0035381317138671875, 0.007122993469238281, 0.010707855224609375, 0.014292716979980469, 0.017877578735351562, 0.021462440490722656, 0.02504730224609375, 0.028632164001464844, 0.03221702575683594, 0.03580188751220703, 0.039386749267578125, 0.04297161102294922, 0.04655647277832031, 0.050141334533691406, 0.0537261962890625, 0.057311058044433594, 0.06089591979980469, 0.06448078155517578, 0.06806564331054688, 0.07165050506591797, 0.07523536682128906, 0.07882022857666016, 0.08240509033203125, 0.08598995208740234, 0.08957481384277344, 0.09315967559814453, 0.09674453735351562, 0.10032939910888672, 0.10391426086425781, 0.1074991226196289, 0.111083984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 6.0, 8.0, 21.0, 39.0, 56.0, 147.0, 492.0, 1767.0, 17648.0, 950401.0, 73330.0, 3456.0, 720.0, 246.0, 110.0, 43.0, 19.0, 10.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0270843505859375, -0.025890111923217773, -0.024695873260498047, -0.02350163459777832, -0.022307395935058594, -0.021113157272338867, -0.01991891860961914, -0.018724679946899414, -0.017530441284179688, -0.01633620262145996, -0.015141963958740234, -0.013947725296020508, -0.012753486633300781, -0.011559247970581055, -0.010365009307861328, -0.009170770645141602, -0.007976531982421875, -0.0067822933197021484, -0.005588054656982422, -0.004393815994262695, -0.0031995773315429688, -0.002005338668823242, -0.0008111000061035156, 0.00038313865661621094, 0.0015773773193359375, 0.002771615982055664, 0.003965854644775391, 0.005160093307495117, 0.006354331970214844, 0.00754857063293457, 0.008742809295654297, 0.009937047958374023, 0.01113128662109375, 0.012325525283813477, 0.013519763946533203, 0.01471400260925293, 0.015908241271972656, 0.017102479934692383, 0.01829671859741211, 0.019490957260131836, 0.020685195922851562, 0.02187943458557129, 0.023073673248291016, 0.024267911911010742, 0.02546215057373047, 0.026656389236450195, 0.027850627899169922, 0.02904486656188965, 0.030239105224609375, 0.0314333438873291, 0.03262758255004883, 0.033821821212768555, 0.03501605987548828, 0.03621029853820801, 0.037404537200927734, 0.03859877586364746, 0.03979301452636719, 0.040987253189086914, 0.04218149185180664, 0.04337573051452637, 0.044569969177246094, 0.04576420783996582, 0.04695844650268555, 0.04815268516540527, 0.049346923828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 7.0, 5.0, 10.0, 15.0, 38.0, 38.0, 61.0, 63.0, 125.0, 104.0, 129.0, 129.0, 84.0, 78.0, 26.0, 35.0, 22.0, 9.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.355726271867752e-05, -1.3226643204689026e-05, -1.2896023690700531e-05, -1.2565404176712036e-05, -1.2234784662723541e-05, -1.1904165148735046e-05, -1.1573545634746552e-05, -1.1242926120758057e-05, -1.0912306606769562e-05, -1.0581687092781067e-05, -1.0251067578792572e-05, -9.920448064804077e-06, -9.589828550815582e-06, -9.259209036827087e-06, -8.928589522838593e-06, -8.597970008850098e-06, -8.267350494861603e-06, -7.936730980873108e-06, -7.606111466884613e-06, -7.275491952896118e-06, -6.944872438907623e-06, -6.614252924919128e-06, -6.2836334109306335e-06, -5.953013896942139e-06, -5.622394382953644e-06, -5.291774868965149e-06, -4.961155354976654e-06, -4.630535840988159e-06, -4.299916326999664e-06, -3.9692968130111694e-06, -3.6386772990226746e-06, -3.3080577850341797e-06, -2.977438271045685e-06, -2.64681875705719e-06, -2.316199243068695e-06, -1.9855797290802e-06, -1.6549602150917053e-06, -1.3243407011032104e-06, -9.937211871147156e-07, -6.631016731262207e-07, -3.3248215913772583e-07, -1.862645149230957e-09, 3.287568688392639e-07, 6.593763828277588e-07, 9.899958968162537e-07, 1.3206154108047485e-06, 1.6512349247932434e-06, 1.9818544387817383e-06, 2.312473952770233e-06, 2.643093466758728e-06, 2.973712980747223e-06, 3.3043324947357178e-06, 3.6349520087242126e-06, 3.9655715227127075e-06, 4.296191036701202e-06, 4.626810550689697e-06, 4.957430064678192e-06, 5.288049578666687e-06, 5.618669092655182e-06, 5.949288606643677e-06, 6.279908120632172e-06, 6.6105276346206665e-06, 6.941147148609161e-06, 7.271766662597656e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 5.0, 9.0, 16.0, 25.0, 38.0, 83.0, 167.0, 354.0, 934.0, 2893.0, 17488.0, 906621.0, 111501.0, 5878.0, 1543.0, 537.0, 230.0, 98.0, 51.0, 28.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.03852033615112305, -0.037306785583496094, -0.03609323501586914, -0.03487968444824219, -0.033666133880615234, -0.03245258331298828, -0.031239032745361328, -0.030025482177734375, -0.028811931610107422, -0.02759838104248047, -0.026384830474853516, -0.025171279907226562, -0.02395772933959961, -0.022744178771972656, -0.021530628204345703, -0.02031707763671875, -0.019103527069091797, -0.017889976501464844, -0.01667642593383789, -0.015462875366210938, -0.014249324798583984, -0.013035774230957031, -0.011822223663330078, -0.010608673095703125, -0.009395122528076172, -0.008181571960449219, -0.006968021392822266, -0.0057544708251953125, -0.004540920257568359, -0.0033273696899414062, -0.002113819122314453, -0.0009002685546875, 0.0003132820129394531, 0.0015268325805664062, 0.0027403831481933594, 0.0039539337158203125, 0.005167484283447266, 0.006381034851074219, 0.007594585418701172, 0.008808135986328125, 0.010021686553955078, 0.011235237121582031, 0.012448787689208984, 0.013662338256835938, 0.01487588882446289, 0.016089439392089844, 0.017302989959716797, 0.01851654052734375, 0.019730091094970703, 0.020943641662597656, 0.02215719223022461, 0.023370742797851562, 0.024584293365478516, 0.02579784393310547, 0.027011394500732422, 0.028224945068359375, 0.029438495635986328, 0.03065204620361328, 0.031865596771240234, 0.03307914733886719, 0.03429269790649414, 0.035506248474121094, 0.03671979904174805, 0.037933349609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 6.0, 15.0, 20.0, 70.0, 215.0, 323.0, 201.0, 61.0, 30.0, 15.0, 6.0, 5.0, 9.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07843017578125, -0.07628011703491211, -0.07413005828857422, -0.07197999954223633, -0.06982994079589844, -0.06767988204956055, -0.06552982330322266, -0.06337976455688477, -0.061229705810546875, -0.059079647064208984, -0.056929588317871094, -0.0547795295715332, -0.05262947082519531, -0.05047941207885742, -0.04832935333251953, -0.04617929458618164, -0.04402923583984375, -0.04187917709350586, -0.03972911834716797, -0.03757905960083008, -0.03542900085449219, -0.0332789421081543, -0.031128883361816406, -0.028978824615478516, -0.026828765869140625, -0.024678707122802734, -0.022528648376464844, -0.020378589630126953, -0.018228530883789062, -0.016078472137451172, -0.013928413391113281, -0.01177835464477539, -0.0096282958984375, -0.007478237152099609, -0.005328178405761719, -0.003178119659423828, -0.0010280609130859375, 0.0011219978332519531, 0.0032720565795898438, 0.005422115325927734, 0.007572174072265625, 0.009722232818603516, 0.011872291564941406, 0.014022350311279297, 0.016172409057617188, 0.018322467803955078, 0.02047252655029297, 0.02262258529663086, 0.02477264404296875, 0.02692270278930664, 0.02907276153564453, 0.031222820281982422, 0.03337287902832031, 0.0355229377746582, 0.037672996520996094, 0.039823055267333984, 0.041973114013671875, 0.044123172760009766, 0.046273231506347656, 0.04842329025268555, 0.05057334899902344, 0.05272340774536133, 0.05487346649169922, 0.05702352523803711, 0.059173583984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 8.0, 20.0, 64.0, 101.0, 229.0, 308.0, 178.0, 67.0, 20.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1404783725738525, -1.1170368194580078, -1.0935951471328735, -1.0701534748077393, -1.0467119216918945, -1.0232703685760498, -0.9998286962509155, -0.976387083530426, -0.9529454708099365, -0.929503858089447, -0.9060622453689575, -0.882620632648468, -0.8591790199279785, -0.835737407207489, -0.8122957944869995, -0.78885418176651, -0.7654125690460205, -0.741970956325531, -0.7185293436050415, -0.695087730884552, -0.6716461181640625, -0.648204505443573, -0.6247628927230835, -0.601321280002594, -0.5778796672821045, -0.554438054561615, -0.5309964418411255, -0.507554829120636, -0.4841132164001465, -0.460671603679657, -0.4372299909591675, -0.413788378238678, -0.3903467059135437, -0.3669050931930542, -0.3434634804725647, -0.3200218677520752, -0.2965802550315857, -0.2731386423110962, -0.2496970295906067, -0.2262554168701172, -0.20281380414962769, -0.17937219142913818, -0.15593057870864868, -0.13248896598815918, -0.10904735326766968, -0.08560574054718018, -0.062164127826690674, -0.03872251510620117, -0.01528090238571167, 0.008160710334777832, 0.031602323055267334, 0.055043935775756836, 0.07848554849624634, 0.10192716121673584, 0.12536877393722534, 0.14881038665771484, 0.17225199937820435, 0.19569361209869385, 0.21913522481918335, 0.24257683753967285, 0.26601845026016235, 0.28946006298065186, 0.31290167570114136, 0.33634328842163086, 0.35978490114212036]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 13.0, 13.0, 12.0, 15.0, 17.0, 22.0, 22.0, 19.0, 26.0, 22.0, 36.0, 41.0, 38.0, 52.0, 42.0, 41.0, 46.0, 47.0, 55.0, 38.0, 40.0, 32.0, 36.0, 45.0, 30.0, 31.0, 23.0, 25.0, 14.0, 20.0, 10.0, 8.0, 15.0, 10.0, 12.0, 6.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.4403841495513916, -0.4279022812843323, -0.41542044281959534, -0.402938574552536, -0.3904567360877991, -0.37797486782073975, -0.3654929995536804, -0.3530111610889435, -0.34052929282188416, -0.32804742455482483, -0.3155655860900879, -0.30308371782302856, -0.2906018793582916, -0.2781200110912323, -0.26563817262649536, -0.25315630435943604, -0.2406744509935379, -0.22819259762763977, -0.21571074426174164, -0.2032288908958435, -0.19074702262878418, -0.17826516926288605, -0.16578331589698792, -0.1533014476299286, -0.14081960916519165, -0.12833775579929352, -0.11585589498281479, -0.10337404161691666, -0.09089218080043793, -0.0784103274345398, -0.06592847406864166, -0.05344661325216293, -0.040964752435684204, -0.028482895344495773, -0.016001040115952492, -0.00351918488740921, 0.00896267220377922, 0.02144452929496765, 0.033926382660865784, 0.04640824347734451, 0.058890096843242645, 0.07137195020914078, 0.0838538110256195, 0.09633566439151764, 0.10881751775741577, 0.1212993785738945, 0.13378122448921204, 0.14626309275627136, 0.1587449461221695, 0.17122679948806763, 0.18370865285396576, 0.1961905062198639, 0.20867237448692322, 0.22115422785282135, 0.23363608121871948, 0.2461179494857788, 0.25859978795051575, 0.2710816562175751, 0.283563494682312, 0.29604536294937134, 0.3085272014141083, 0.3210090696811676, 0.33349090814590454, 0.34597277641296387, 0.3584546446800232]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 9.0, 9.0, 28.0, 25.0, 42.0, 40.0, 58.0, 78.0, 200.0, 2534.0, 4188755.0, 2035.0, 165.0, 76.0, 68.0, 43.0, 38.0, 26.0, 15.0, 11.0, 9.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.19721412658691406, -0.18947219848632812, -0.1817302703857422, -0.17398834228515625, -0.1662464141845703, -0.15850448608398438, -0.15076255798339844, -0.1430206298828125, -0.13527870178222656, -0.12753677368164062, -0.11979484558105469, -0.11205291748046875, -0.10431098937988281, -0.09656906127929688, -0.08882713317871094, -0.081085205078125, -0.07334327697753906, -0.06560134887695312, -0.05785942077636719, -0.05011749267578125, -0.04237556457519531, -0.034633636474609375, -0.026891708374023438, -0.0191497802734375, -0.011407852172851562, -0.003665924072265625, 0.0040760040283203125, 0.01181793212890625, 0.019559860229492188, 0.027301788330078125, 0.03504371643066406, 0.04278564453125, 0.05052757263183594, 0.058269500732421875, 0.06601142883300781, 0.07375335693359375, 0.08149528503417969, 0.08923721313476562, 0.09697914123535156, 0.1047210693359375, 0.11246299743652344, 0.12020492553710938, 0.1279468536376953, 0.13568878173828125, 0.1434307098388672, 0.15117263793945312, 0.15891456604003906, 0.166656494140625, 0.17439842224121094, 0.18214035034179688, 0.1898822784423828, 0.19762420654296875, 0.2053661346435547, 0.21310806274414062, 0.22084999084472656, 0.2285919189453125, 0.23633384704589844, 0.24407577514648438, 0.2518177032470703, 0.25955963134765625, 0.2673015594482422, 0.2750434875488281, 0.28278541564941406, 0.29052734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 9.0, 5.0, 12.0, 23.0, 14.0, 23.0, 35.0, 39.0, 52.0, 53.0, 55.0, 66.0, 78.0, 76.0, 77.0, 64.0, 64.0, 55.0, 46.0, 26.0, 23.0, 19.0, 20.0, 21.0, 10.0, 8.0, 5.0, 3.0, 0.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.03399658203125, -0.03294515609741211, -0.03189373016357422, -0.030842304229736328, -0.029790878295898438, -0.028739452362060547, -0.027688026428222656, -0.026636600494384766, -0.025585174560546875, -0.024533748626708984, -0.023482322692871094, -0.022430896759033203, -0.021379470825195312, -0.020328044891357422, -0.01927661895751953, -0.01822519302368164, -0.01717376708984375, -0.01612234115600586, -0.015070915222167969, -0.014019489288330078, -0.012968063354492188, -0.011916637420654297, -0.010865211486816406, -0.009813785552978516, -0.008762359619140625, -0.007710933685302734, -0.006659507751464844, -0.005608081817626953, -0.0045566558837890625, -0.003505229949951172, -0.0024538040161132812, -0.0014023780822753906, -0.0003509521484375, 0.0007004737854003906, 0.0017518997192382812, 0.002803325653076172, 0.0038547515869140625, 0.004906177520751953, 0.005957603454589844, 0.007009029388427734, 0.008060455322265625, 0.009111881256103516, 0.010163307189941406, 0.011214733123779297, 0.012266159057617188, 0.013317584991455078, 0.014369010925292969, 0.01542043685913086, 0.01647186279296875, 0.01752328872680664, 0.01857471466064453, 0.019626140594482422, 0.020677566528320312, 0.021728992462158203, 0.022780418395996094, 0.023831844329833984, 0.024883270263671875, 0.025934696197509766, 0.026986122131347656, 0.028037548065185547, 0.029088973999023438, 0.030140399932861328, 0.03119182586669922, 0.03224325180053711, 0.033294677734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 17.0, 28.0, 30.0, 42.0, 53.0, 72.0, 97.0, 136.0, 199.0, 253.0, 459.0, 744.0, 1513.0, 3510.0, 11920.0, 209953.0, 3937620.0, 18584.0, 4648.0, 1861.0, 866.0, 507.0, 315.0, 205.0, 152.0, 125.0, 78.0, 68.0, 46.0, 33.0, 28.0, 22.0, 17.0, 11.0, 7.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.050872802734375, -0.04942464828491211, -0.04797649383544922, -0.04652833938598633, -0.04508018493652344, -0.04363203048706055, -0.042183876037597656, -0.040735721588134766, -0.039287567138671875, -0.037839412689208984, -0.036391258239746094, -0.0349431037902832, -0.03349494934082031, -0.03204679489135742, -0.03059864044189453, -0.02915048599243164, -0.02770233154296875, -0.02625417709350586, -0.02480602264404297, -0.023357868194580078, -0.021909713745117188, -0.020461559295654297, -0.019013404846191406, -0.017565250396728516, -0.016117095947265625, -0.014668941497802734, -0.013220787048339844, -0.011772632598876953, -0.010324478149414062, -0.008876323699951172, -0.007428169250488281, -0.005980014801025391, -0.0045318603515625, -0.0030837059020996094, -0.0016355514526367188, -0.00018739700317382812, 0.0012607574462890625, 0.002708911895751953, 0.004157066345214844, 0.005605220794677734, 0.007053375244140625, 0.008501529693603516, 0.009949684143066406, 0.011397838592529297, 0.012845993041992188, 0.014294147491455078, 0.01574230194091797, 0.01719045639038086, 0.01863861083984375, 0.02008676528930664, 0.02153491973876953, 0.022983074188232422, 0.024431228637695312, 0.025879383087158203, 0.027327537536621094, 0.028775691986083984, 0.030223846435546875, 0.031672000885009766, 0.033120155334472656, 0.03456830978393555, 0.03601646423339844, 0.03746461868286133, 0.03891277313232422, 0.04036092758178711, 0.04180908203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 8.0, 8.0, 18.0, 92.0, 3711.0, 181.0, 37.0, 12.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.03146934509277344, -0.030284881591796875, -0.029100418090820312, -0.02791595458984375, -0.026731491088867188, -0.025547027587890625, -0.024362564086914062, -0.0231781005859375, -0.021993637084960938, -0.020809173583984375, -0.019624710083007812, -0.01844024658203125, -0.017255783081054688, -0.016071319580078125, -0.014886856079101562, -0.013702392578125, -0.012517929077148438, -0.011333465576171875, -0.010149002075195312, -0.00896453857421875, -0.0077800750732421875, -0.006595611572265625, -0.0054111480712890625, -0.0042266845703125, -0.0030422210693359375, -0.001857757568359375, -0.0006732940673828125, 0.00051116943359375, 0.0016956329345703125, 0.002880096435546875, 0.0040645599365234375, 0.0052490234375, 0.0064334869384765625, 0.007617950439453125, 0.008802413940429688, 0.00998687744140625, 0.011171340942382812, 0.012355804443359375, 0.013540267944335938, 0.0147247314453125, 0.015909194946289062, 0.017093658447265625, 0.018278121948242188, 0.01946258544921875, 0.020647048950195312, 0.021831512451171875, 0.023015975952148438, 0.024200439453125, 0.025384902954101562, 0.026569366455078125, 0.027753829956054688, 0.02893829345703125, 0.030122756958007812, 0.031307220458984375, 0.03249168395996094, 0.0336761474609375, 0.03486061096191406, 0.036045074462890625, 0.03722953796386719, 0.03841400146484375, 0.03959846496582031, 0.040782928466796875, 0.04196739196777344, 0.04315185546875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 23.0, 42.0, 97.0, 193.0, 258.0, 201.0, 113.0, 46.0, 14.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055754147469997406, -0.05212680995464325, -0.04849947243928909, -0.044872134923934937, -0.04124479740858078, -0.037617459893226624, -0.033990126103162766, -0.03036278858780861, -0.026735451072454453, -0.023108113557100296, -0.01948077604174614, -0.015853440389037132, -0.012226102873682976, -0.00859876535832882, -0.004971429705619812, -0.0013440921902656555, 0.002283245325088501, 0.00591058237478137, 0.00953791942447424, 0.013165256008505821, 0.016792593523859978, 0.020419931039214134, 0.02404726669192314, 0.027674604207277298, 0.031301941722631454, 0.03492927923798561, 0.03855661675333977, 0.042183950543403625, 0.04581128805875778, 0.04943862557411194, 0.053065963089466095, 0.05669330060482025, 0.06032063066959381, 0.06394796818494797, 0.06757530570030212, 0.07120264321565628, 0.07482998073101044, 0.0784573182463646, 0.08208465576171875, 0.08571198582649231, 0.08933933079242706, 0.09296666830778122, 0.09659400582313538, 0.10022134333848953, 0.10384868085384369, 0.10747601836919785, 0.111103355884552, 0.11473068594932556, 0.11835802346467972, 0.12198536098003387, 0.12561269104480743, 0.1292400360107422, 0.13286736607551575, 0.1364947110414505, 0.14012204110622406, 0.1437493860721588, 0.14737671613693237, 0.15100404620170593, 0.15463139116764069, 0.15825872123241425, 0.161886066198349, 0.16551339626312256, 0.1691407412290573, 0.17276807129383087, 0.17639541625976562]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 12.0, 10.0, 29.0, 35.0, 46.0, 50.0, 70.0, 72.0, 79.0, 84.0, 79.0, 68.0, 95.0, 75.0, 54.0, 53.0, 29.0, 16.0, 18.0, 13.0, 4.0, 11.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06794911623001099, -0.06543556600809097, -0.06292201578617096, -0.060408465564250946, -0.05789491534233093, -0.05538136512041092, -0.052867814898490906, -0.05035426467657089, -0.04784071445465088, -0.045327164232730865, -0.04281361401081085, -0.04030006378889084, -0.037786513566970825, -0.03527296334505081, -0.0327594131231308, -0.030245862901210785, -0.02773231267929077, -0.025218762457370758, -0.022705212235450745, -0.02019166201353073, -0.017678111791610718, -0.015164561569690704, -0.012651011347770691, -0.010137461125850677, -0.007623910903930664, -0.005110360682010651, -0.002596810460090637, -8.326023817062378e-05, 0.0024302899837493896, 0.004943840205669403, 0.0074573904275894165, 0.00997094064950943, 0.012484490871429443, 0.014998041093349457, 0.01751159131526947, 0.020025141537189484, 0.022538691759109497, 0.02505224198102951, 0.027565792202949524, 0.030079342424869537, 0.03259289264678955, 0.035106442868709564, 0.03761999309062958, 0.04013354331254959, 0.042647093534469604, 0.04516064375638962, 0.04767419397830963, 0.050187744200229645, 0.05270129442214966, 0.05521484464406967, 0.057728394865989685, 0.0602419450879097, 0.06275549530982971, 0.06526904553174973, 0.06778259575366974, 0.07029614597558975, 0.07280969619750977, 0.07532324641942978, 0.07783679664134979, 0.0803503468632698, 0.08286389708518982, 0.08537744730710983, 0.08789099752902985, 0.09040454775094986, 0.09291809797286987]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 11.0, 10.0, 10.0, 23.0, 27.0, 43.0, 77.0, 109.0, 155.0, 300.0, 575.0, 1035.0, 2400.0, 6730.0, 24240.0, 122766.0, 587782.0, 244103.0, 41459.0, 10325.0, 3362.0, 1383.0, 665.0, 359.0, 208.0, 128.0, 75.0, 50.0, 45.0, 17.0, 24.0, 9.0, 9.0, 8.0, 7.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048065185546875, -0.04663801193237305, -0.045210838317871094, -0.04378366470336914, -0.04235649108886719, -0.040929317474365234, -0.03950214385986328, -0.03807497024536133, -0.036647796630859375, -0.03522062301635742, -0.03379344940185547, -0.032366275787353516, -0.030939102172851562, -0.02951192855834961, -0.028084754943847656, -0.026657581329345703, -0.02523040771484375, -0.023803234100341797, -0.022376060485839844, -0.02094888687133789, -0.019521713256835938, -0.018094539642333984, -0.01666736602783203, -0.015240192413330078, -0.013813018798828125, -0.012385845184326172, -0.010958671569824219, -0.009531497955322266, -0.008104324340820312, -0.006677150726318359, -0.005249977111816406, -0.003822803497314453, -0.0023956298828125, -0.0009684562683105469, 0.00045871734619140625, 0.0018858909606933594, 0.0033130645751953125, 0.004740238189697266, 0.006167411804199219, 0.007594585418701172, 0.009021759033203125, 0.010448932647705078, 0.011876106262207031, 0.013303279876708984, 0.014730453491210938, 0.01615762710571289, 0.017584800720214844, 0.019011974334716797, 0.02043914794921875, 0.021866321563720703, 0.023293495178222656, 0.02472066879272461, 0.026147842407226562, 0.027575016021728516, 0.02900218963623047, 0.030429363250732422, 0.031856536865234375, 0.03328371047973633, 0.03471088409423828, 0.036138057708740234, 0.03756523132324219, 0.03899240493774414, 0.040419578552246094, 0.04184675216674805, 0.04327392578125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 3.0, 9.0, 11.0, 7.0, 13.0, 39.0, 30.0, 29.0, 53.0, 47.0, 59.0, 46.0, 84.0, 76.0, 78.0, 66.0, 59.0, 58.0, 50.0, 34.0, 25.0, 16.0, 27.0, 14.0, 20.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03265380859375, -0.031624794006347656, -0.030595779418945312, -0.02956676483154297, -0.028537750244140625, -0.02750873565673828, -0.026479721069335938, -0.025450706481933594, -0.02442169189453125, -0.023392677307128906, -0.022363662719726562, -0.02133464813232422, -0.020305633544921875, -0.01927661895751953, -0.018247604370117188, -0.017218589782714844, -0.0161895751953125, -0.015160560607910156, -0.014131546020507812, -0.013102531433105469, -0.012073516845703125, -0.011044502258300781, -0.010015487670898438, -0.008986473083496094, -0.00795745849609375, -0.006928443908691406, -0.0058994293212890625, -0.004870414733886719, -0.003841400146484375, -0.0028123855590820312, -0.0017833709716796875, -0.0007543563842773438, 0.000274658203125, 0.0013036727905273438, 0.0023326873779296875, 0.0033617019653320312, 0.004390716552734375, 0.005419731140136719, 0.0064487457275390625, 0.007477760314941406, 0.00850677490234375, 0.009535789489746094, 0.010564804077148438, 0.011593818664550781, 0.012622833251953125, 0.013651847839355469, 0.014680862426757812, 0.015709877014160156, 0.0167388916015625, 0.017767906188964844, 0.018796920776367188, 0.01982593536376953, 0.020854949951171875, 0.02188396453857422, 0.022912979125976562, 0.023941993713378906, 0.02497100830078125, 0.026000022888183594, 0.027029037475585938, 0.02805805206298828, 0.029087066650390625, 0.03011608123779297, 0.031145095825195312, 0.032174110412597656, 0.033203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 13.0, 11.0, 17.0, 15.0, 29.0, 36.0, 56.0, 72.0, 112.0, 180.0, 322.0, 620.0, 1584.0, 5406.0, 36545.0, 564795.0, 403573.0, 27659.0, 4628.0, 1433.0, 547.0, 314.0, 217.0, 102.0, 71.0, 53.0, 43.0, 25.0, 16.0, 20.0, 8.0, 8.0, 4.0, 1.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.059326171875, -0.057578086853027344, -0.05583000183105469, -0.05408191680908203, -0.052333831787109375, -0.05058574676513672, -0.04883766174316406, -0.047089576721191406, -0.04534149169921875, -0.043593406677246094, -0.04184532165527344, -0.04009723663330078, -0.038349151611328125, -0.03660106658935547, -0.03485298156738281, -0.033104896545410156, -0.0313568115234375, -0.029608726501464844, -0.027860641479492188, -0.02611255645751953, -0.024364471435546875, -0.02261638641357422, -0.020868301391601562, -0.019120216369628906, -0.01737213134765625, -0.015624046325683594, -0.013875961303710938, -0.012127876281738281, -0.010379791259765625, -0.008631706237792969, -0.0068836212158203125, -0.005135536193847656, -0.003387451171875, -0.0016393661499023438, 0.0001087188720703125, 0.0018568038940429688, 0.003604888916015625, 0.005352973937988281, 0.0071010589599609375, 0.008849143981933594, 0.01059722900390625, 0.012345314025878906, 0.014093399047851562, 0.01584148406982422, 0.017589569091796875, 0.01933765411376953, 0.021085739135742188, 0.022833824157714844, 0.0245819091796875, 0.026329994201660156, 0.028078079223632812, 0.02982616424560547, 0.031574249267578125, 0.03332233428955078, 0.03507041931152344, 0.036818504333496094, 0.03856658935546875, 0.040314674377441406, 0.04206275939941406, 0.04381084442138672, 0.045558929443359375, 0.04730701446533203, 0.04905509948730469, 0.050803184509277344, 0.05255126953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 6.0, 13.0, 25.0, 20.0, 20.0, 32.0, 38.0, 36.0, 32.0, 49.0, 48.0, 57.0, 57.0, 54.0, 73.0, 52.0, 54.0, 58.0, 59.0, 43.0, 29.0, 26.0, 21.0, 18.0, 22.0, 16.0, 16.0, 4.0, 6.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0841064453125, -0.080810546875, -0.0775146484375, -0.07421875, -0.0709228515625, -0.067626953125, -0.0643310546875, -0.06103515625, -0.0577392578125, -0.054443359375, -0.0511474609375, -0.0478515625, -0.0445556640625, -0.041259765625, -0.0379638671875, -0.03466796875, -0.0313720703125, -0.028076171875, -0.0247802734375, -0.021484375, -0.0181884765625, -0.014892578125, -0.0115966796875, -0.00830078125, -0.0050048828125, -0.001708984375, 0.0015869140625, 0.0048828125, 0.0081787109375, 0.011474609375, 0.0147705078125, 0.01806640625, 0.0213623046875, 0.024658203125, 0.0279541015625, 0.03125, 0.0345458984375, 0.037841796875, 0.0411376953125, 0.04443359375, 0.0477294921875, 0.051025390625, 0.0543212890625, 0.0576171875, 0.0609130859375, 0.064208984375, 0.0675048828125, 0.07080078125, 0.0740966796875, 0.077392578125, 0.0806884765625, 0.083984375, 0.0872802734375, 0.090576171875, 0.0938720703125, 0.09716796875, 0.1004638671875, 0.103759765625, 0.1070556640625, 0.1103515625, 0.1136474609375, 0.116943359375, 0.1202392578125, 0.12353515625, 0.1268310546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 4.0, 8.0, 19.0, 9.0, 42.0, 62.0, 85.0, 154.0, 334.0, 756.0, 2114.0, 11529.0, 250909.0, 752431.0, 24874.0, 3327.0, 1012.0, 395.0, 196.0, 120.0, 66.0, 34.0, 18.0, 15.0, 12.0, 10.0, 3.0, 5.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021453857421875, -0.020876526832580566, -0.020299196243286133, -0.0197218656539917, -0.019144535064697266, -0.018567204475402832, -0.0179898738861084, -0.017412543296813965, -0.01683521270751953, -0.016257882118225098, -0.015680551528930664, -0.01510322093963623, -0.014525890350341797, -0.013948559761047363, -0.01337122917175293, -0.012793898582458496, -0.012216567993164062, -0.011639237403869629, -0.011061906814575195, -0.010484576225280762, -0.009907245635986328, -0.009329915046691895, -0.008752584457397461, -0.008175253868103027, -0.007597923278808594, -0.00702059268951416, -0.0064432621002197266, -0.005865931510925293, -0.005288600921630859, -0.004711270332336426, -0.004133939743041992, -0.0035566091537475586, -0.002979278564453125, -0.0024019479751586914, -0.0018246173858642578, -0.0012472867965698242, -0.0006699562072753906, -9.262561798095703e-05, 0.00048470497131347656, 0.0010620355606079102, 0.0016393661499023438, 0.0022166967391967773, 0.002794027328491211, 0.0033713579177856445, 0.003948688507080078, 0.004526019096374512, 0.005103349685668945, 0.005680680274963379, 0.0062580108642578125, 0.006835341453552246, 0.00741267204284668, 0.007990002632141113, 0.008567333221435547, 0.00914466381072998, 0.009721994400024414, 0.010299324989318848, 0.010876655578613281, 0.011453986167907715, 0.012031316757202148, 0.012608647346496582, 0.013185977935791016, 0.01376330852508545, 0.014340639114379883, 0.014917969703674316, 0.01549530029296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 5.0, 3.0, 7.0, 12.0, 12.0, 23.0, 19.0, 37.0, 36.0, 52.0, 72.0, 54.0, 77.0, 76.0, 83.0, 71.0, 70.0, 58.0, 54.0, 48.0, 35.0, 25.0, 26.0, 16.0, 18.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.68899917602539e-06, -7.511116564273834e-06, -7.333233952522278e-06, -7.1553513407707214e-06, -6.977468729019165e-06, -6.799586117267609e-06, -6.621703505516052e-06, -6.443820893764496e-06, -6.2659382820129395e-06, -6.088055670261383e-06, -5.910173058509827e-06, -5.73229044675827e-06, -5.554407835006714e-06, -5.3765252232551575e-06, -5.198642611503601e-06, -5.020759999752045e-06, -4.842877388000488e-06, -4.664994776248932e-06, -4.4871121644973755e-06, -4.309229552745819e-06, -4.131346940994263e-06, -3.953464329242706e-06, -3.77558171749115e-06, -3.5976991057395935e-06, -3.419816493988037e-06, -3.2419338822364807e-06, -3.0640512704849243e-06, -2.886168658733368e-06, -2.7082860469818115e-06, -2.530403435230255e-06, -2.3525208234786987e-06, -2.1746382117271423e-06, -1.996755599975586e-06, -1.8188729882240295e-06, -1.6409903764724731e-06, -1.4631077647209167e-06, -1.2852251529693604e-06, -1.107342541217804e-06, -9.294599294662476e-07, -7.515773177146912e-07, -5.736947059631348e-07, -3.9581209421157837e-07, -2.1792948246002197e-07, -4.0046870708465576e-08, 1.3783574104309082e-07, 3.157183527946472e-07, 4.936009645462036e-07, 6.7148357629776e-07, 8.493661880493164e-07, 1.0272487998008728e-06, 1.2051314115524292e-06, 1.3830140233039856e-06, 1.560896635055542e-06, 1.7387792468070984e-06, 1.9166618585586548e-06, 2.094544470310211e-06, 2.2724270820617676e-06, 2.450309693813324e-06, 2.6281923055648804e-06, 2.8060749173164368e-06, 2.983957529067993e-06, 3.1618401408195496e-06, 3.339722752571106e-06, 3.5176053643226624e-06, 3.6954879760742188e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 15.0, 23.0, 54.0, 143.0, 467.0, 3433.0, 236309.0, 800344.0, 6749.0, 671.0, 215.0, 73.0, 38.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04156494140625, -0.04047441482543945, -0.039383888244628906, -0.03829336166381836, -0.03720283508300781, -0.036112308502197266, -0.03502178192138672, -0.03393125534057617, -0.032840728759765625, -0.03175020217895508, -0.03065967559814453, -0.029569149017333984, -0.028478622436523438, -0.02738809585571289, -0.026297569274902344, -0.025207042694091797, -0.02411651611328125, -0.023025989532470703, -0.021935462951660156, -0.02084493637084961, -0.019754409790039062, -0.018663883209228516, -0.01757335662841797, -0.016482830047607422, -0.015392303466796875, -0.014301776885986328, -0.013211250305175781, -0.012120723724365234, -0.011030197143554688, -0.00993967056274414, -0.008849143981933594, -0.007758617401123047, -0.0066680908203125, -0.005577564239501953, -0.004487037658691406, -0.0033965110778808594, -0.0023059844970703125, -0.0012154579162597656, -0.00012493133544921875, 0.0009655952453613281, 0.002056121826171875, 0.003146648406982422, 0.004237174987792969, 0.005327701568603516, 0.0064182281494140625, 0.007508754730224609, 0.008599281311035156, 0.009689807891845703, 0.01078033447265625, 0.011870861053466797, 0.012961387634277344, 0.01405191421508789, 0.015142440795898438, 0.016232967376708984, 0.01732349395751953, 0.018414020538330078, 0.019504547119140625, 0.020595073699951172, 0.02168560028076172, 0.022776126861572266, 0.023866653442382812, 0.02495718002319336, 0.026047706604003906, 0.027138233184814453, 0.028228759765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 18.0, 16.0, 36.0, 64.0, 138.0, 165.0, 204.0, 134.0, 85.0, 49.0, 37.0, 25.0, 7.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0170135498046875, -0.015967130661010742, -0.014920711517333984, -0.013874292373657227, -0.012827873229980469, -0.011781454086303711, -0.010735034942626953, -0.009688615798950195, -0.008642196655273438, -0.00759577751159668, -0.006549358367919922, -0.005502939224243164, -0.004456520080566406, -0.0034101009368896484, -0.0023636817932128906, -0.0013172626495361328, -0.000270843505859375, 0.0007755756378173828, 0.0018219947814941406, 0.0028684139251708984, 0.003914833068847656, 0.004961252212524414, 0.006007671356201172, 0.00705409049987793, 0.008100509643554688, 0.009146928787231445, 0.010193347930908203, 0.011239767074584961, 0.012286186218261719, 0.013332605361938477, 0.014379024505615234, 0.015425443649291992, 0.01647186279296875, 0.017518281936645508, 0.018564701080322266, 0.019611120223999023, 0.02065753936767578, 0.02170395851135254, 0.022750377655029297, 0.023796796798706055, 0.024843215942382812, 0.02588963508605957, 0.026936054229736328, 0.027982473373413086, 0.029028892517089844, 0.0300753116607666, 0.03112173080444336, 0.03216814994812012, 0.033214569091796875, 0.03426098823547363, 0.03530740737915039, 0.03635382652282715, 0.037400245666503906, 0.038446664810180664, 0.03949308395385742, 0.04053950309753418, 0.04158592224121094, 0.042632341384887695, 0.04367876052856445, 0.04472517967224121, 0.04577159881591797, 0.04681801795959473, 0.047864437103271484, 0.04891085624694824, 0.049957275390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 13.0, 24.0, 77.0, 175.0, 304.0, 256.0, 113.0, 28.0, 13.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8697724938392639, -0.8503541350364685, -0.8309357166290283, -0.8115173578262329, -0.7920989394187927, -0.7726805806159973, -0.7532621622085571, -0.7338438034057617, -0.7144254446029663, -0.6950070858001709, -0.6755886673927307, -0.6561703085899353, -0.6367518901824951, -0.6173335313796997, -0.5979151725769043, -0.5784967541694641, -0.5590783357620239, -0.5396599769592285, -0.5202415585517883, -0.5008231997489929, -0.4814048111438751, -0.4619864225387573, -0.4425680339336395, -0.42314964532852173, -0.4037312865257263, -0.3843128979206085, -0.3648945093154907, -0.3454761505126953, -0.3260577619075775, -0.3066393733024597, -0.2872209846973419, -0.2678025960922241, -0.2483842670917511, -0.2289658784866333, -0.2095475047826767, -0.1901291161775589, -0.1707107424736023, -0.1512923538684845, -0.1318739652633667, -0.1124555915594101, -0.0930372029542923, -0.0736188217997551, -0.0542004369199276, -0.0347820520401001, -0.015363670885562897, 0.004054710268974304, 0.023473098874092102, 0.042891472578048706, 0.062309861183166504, 0.0817282423377037, 0.1011466234922409, 0.1205650120973587, 0.1399833858013153, 0.1594017744064331, 0.1788201630115509, 0.1982385367155075, 0.2176569253206253, 0.2370753139257431, 0.2564936876296997, 0.2759120762348175, 0.2953304648399353, 0.3147488236427307, 0.3341672420501709, 0.3535856008529663, 0.3730039894580841]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 8.0, 9.0, 8.0, 16.0, 19.0, 20.0, 18.0, 24.0, 21.0, 39.0, 30.0, 40.0, 48.0, 55.0, 47.0, 63.0, 47.0, 61.0, 58.0, 36.0, 31.0, 40.0, 42.0, 23.0, 24.0, 26.0, 20.0, 22.0, 21.0, 23.0, 6.0, 10.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3795636296272278, -0.36788442730903625, -0.3562052249908447, -0.3445260524749756, -0.33284685015678406, -0.32116764783859253, -0.3094884753227234, -0.29780927300453186, -0.28613007068634033, -0.2744508683681488, -0.2627716660499573, -0.25109249353408813, -0.2394132912158966, -0.22773408889770508, -0.21605490148067474, -0.2043757140636444, -0.19269651174545288, -0.18101730942726135, -0.16933812201023102, -0.15765893459320068, -0.14597973227500916, -0.13430052995681763, -0.12262134253978729, -0.11094214767217636, -0.09926295280456543, -0.0875837579369545, -0.07590456306934357, -0.06422536820173264, -0.052546173334121704, -0.04086697846651077, -0.02918778359889984, -0.01750858873128891, -0.0058293938636779785, 0.005849801003932953, 0.017528995871543884, 0.029208190739154816, 0.04088738560676575, 0.05256658047437668, 0.06424577534198761, 0.07592497020959854, 0.08760416507720947, 0.0992833599448204, 0.11096255481243134, 0.12264174968004227, 0.1343209445476532, 0.14600014686584473, 0.15767933428287506, 0.1693585216999054, 0.18103772401809692, 0.19271692633628845, 0.2043961137533188, 0.21607530117034912, 0.22775450348854065, 0.23943370580673218, 0.2511128783226013, 0.26279208064079285, 0.2744712829589844, 0.2861504852771759, 0.29782968759536743, 0.3095088601112366, 0.3211880624294281, 0.33286726474761963, 0.34454643726348877, 0.3562256395816803, 0.3679048418998718]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 12.0, 20.0, 16.0, 33.0, 62.0, 94.0, 157.0, 316.0, 604.0, 1373.0, 3377.0, 10397.0, 55339.0, 3018558.0, 1057087.0, 33570.0, 7933.0, 2641.0, 1191.0, 620.0, 344.0, 209.0, 119.0, 59.0, 52.0, 30.0, 25.0, 17.0, 10.0, 10.0, 7.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06207275390625, -0.060517311096191406, -0.05896186828613281, -0.05740642547607422, -0.055850982666015625, -0.05429553985595703, -0.05274009704589844, -0.051184654235839844, -0.04962921142578125, -0.048073768615722656, -0.04651832580566406, -0.04496288299560547, -0.043407440185546875, -0.04185199737548828, -0.04029655456542969, -0.038741111755371094, -0.0371856689453125, -0.035630226135253906, -0.03407478332519531, -0.03251934051513672, -0.030963897705078125, -0.02940845489501953, -0.027853012084960938, -0.026297569274902344, -0.02474212646484375, -0.023186683654785156, -0.021631240844726562, -0.02007579803466797, -0.018520355224609375, -0.01696491241455078, -0.015409469604492188, -0.013854026794433594, -0.012298583984375, -0.010743141174316406, -0.009187698364257812, -0.007632255554199219, -0.006076812744140625, -0.004521369934082031, -0.0029659271240234375, -0.0014104843139648438, 0.00014495849609375, 0.0017004013061523438, 0.0032558441162109375, 0.004811286926269531, 0.006366729736328125, 0.007922172546386719, 0.009477615356445312, 0.011033058166503906, 0.0125885009765625, 0.014143943786621094, 0.015699386596679688, 0.01725482940673828, 0.018810272216796875, 0.02036571502685547, 0.021921157836914062, 0.023476600646972656, 0.02503204345703125, 0.026587486267089844, 0.028142929077148438, 0.02969837188720703, 0.031253814697265625, 0.03280925750732422, 0.03436470031738281, 0.035920143127441406, 0.0374755859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 7.0, 7.0, 12.0, 9.0, 18.0, 34.0, 34.0, 43.0, 43.0, 60.0, 54.0, 71.0, 76.0, 70.0, 71.0, 78.0, 70.0, 58.0, 37.0, 38.0, 23.0, 27.0, 15.0, 7.0, 5.0, 5.0, 3.0, 2.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.03338623046875, -0.03235197067260742, -0.031317710876464844, -0.030283451080322266, -0.029249191284179688, -0.02821493148803711, -0.02718067169189453, -0.026146411895751953, -0.025112152099609375, -0.024077892303466797, -0.02304363250732422, -0.02200937271118164, -0.020975112915039062, -0.019940853118896484, -0.018906593322753906, -0.017872333526611328, -0.01683807373046875, -0.015803813934326172, -0.014769554138183594, -0.013735294342041016, -0.012701034545898438, -0.01166677474975586, -0.010632514953613281, -0.009598255157470703, -0.008563995361328125, -0.007529735565185547, -0.006495475769042969, -0.005461215972900391, -0.0044269561767578125, -0.0033926963806152344, -0.0023584365844726562, -0.0013241767883300781, -0.0002899169921875, 0.0007443428039550781, 0.0017786026000976562, 0.0028128623962402344, 0.0038471221923828125, 0.004881381988525391, 0.005915641784667969, 0.006949901580810547, 0.007984161376953125, 0.009018421173095703, 0.010052680969238281, 0.01108694076538086, 0.012121200561523438, 0.013155460357666016, 0.014189720153808594, 0.015223979949951172, 0.01625823974609375, 0.017292499542236328, 0.018326759338378906, 0.019361019134521484, 0.020395278930664062, 0.02142953872680664, 0.02246379852294922, 0.023498058319091797, 0.024532318115234375, 0.025566577911376953, 0.02660083770751953, 0.02763509750366211, 0.028669357299804688, 0.029703617095947266, 0.030737876892089844, 0.03177213668823242, 0.032806396484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 5.0, 10.0, 9.0, 21.0, 21.0, 26.0, 49.0, 49.0, 120.0, 278.0, 886.0, 3396.0, 20859.0, 595122.0, 3534720.0, 32085.0, 4733.0, 1093.0, 355.0, 150.0, 60.0, 44.0, 33.0, 21.0, 21.0, 19.0, 20.0, 9.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.07470703125, -0.07263755798339844, -0.07056808471679688, -0.06849861145019531, -0.06642913818359375, -0.06435966491699219, -0.062290191650390625, -0.06022071838378906, -0.0581512451171875, -0.05608177185058594, -0.054012298583984375, -0.05194282531738281, -0.04987335205078125, -0.04780387878417969, -0.045734405517578125, -0.04366493225097656, -0.041595458984375, -0.03952598571777344, -0.037456512451171875, -0.03538703918457031, -0.03331756591796875, -0.031248092651367188, -0.029178619384765625, -0.027109146118164062, -0.0250396728515625, -0.022970199584960938, -0.020900726318359375, -0.018831253051757812, -0.01676177978515625, -0.014692306518554688, -0.012622833251953125, -0.010553359985351562, -0.00848388671875, -0.0064144134521484375, -0.004344940185546875, -0.0022754669189453125, -0.00020599365234375, 0.0018634796142578125, 0.003932952880859375, 0.0060024261474609375, 0.0080718994140625, 0.010141372680664062, 0.012210845947265625, 0.014280319213867188, 0.01634979248046875, 0.018419265747070312, 0.020488739013671875, 0.022558212280273438, 0.024627685546875, 0.026697158813476562, 0.028766632080078125, 0.030836105346679688, 0.03290557861328125, 0.03497505187988281, 0.037044525146484375, 0.03911399841308594, 0.0411834716796875, 0.04325294494628906, 0.045322418212890625, 0.04739189147949219, 0.04946136474609375, 0.05153083801269531, 0.053600311279296875, 0.05566978454589844, 0.0577392578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 3.0, 11.0, 20.0, 13.0, 11.0, 20.0, 33.0, 40.0, 52.0, 154.0, 533.0, 1742.0, 934.0, 242.0, 86.0, 41.0, 32.0, 22.0, 14.0, 18.0, 6.0, 8.0, 6.0, 2.0, 4.0, 6.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049072265625, -0.04746723175048828, -0.04586219787597656, -0.044257164001464844, -0.042652130126953125, -0.041047096252441406, -0.03944206237792969, -0.03783702850341797, -0.03623199462890625, -0.03462696075439453, -0.03302192687988281, -0.031416893005371094, -0.029811859130859375, -0.028206825256347656, -0.026601791381835938, -0.02499675750732422, -0.0233917236328125, -0.02178668975830078, -0.020181655883789062, -0.018576622009277344, -0.016971588134765625, -0.015366554260253906, -0.013761520385742188, -0.012156486511230469, -0.01055145263671875, -0.008946418762207031, -0.0073413848876953125, -0.005736351013183594, -0.004131317138671875, -0.0025262832641601562, -0.0009212493896484375, 0.0006837844848632812, 0.002288818359375, 0.0038938522338867188, 0.0054988861083984375, 0.007103919982910156, 0.008708953857421875, 0.010313987731933594, 0.011919021606445312, 0.013524055480957031, 0.01512908935546875, 0.01673412322998047, 0.018339157104492188, 0.019944190979003906, 0.021549224853515625, 0.023154258728027344, 0.024759292602539062, 0.02636432647705078, 0.0279693603515625, 0.02957439422607422, 0.031179428100585938, 0.032784461975097656, 0.034389495849609375, 0.035994529724121094, 0.03759956359863281, 0.03920459747314453, 0.04080963134765625, 0.04241466522216797, 0.04401969909667969, 0.045624732971191406, 0.047229766845703125, 0.048834800720214844, 0.05043983459472656, 0.05204486846923828, 0.05364990234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 20.0, 82.0, 312.0, 339.0, 151.0, 51.0, 17.0, 10.0, 5.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41352394223213196, -0.39378079771995544, -0.3740376830101013, -0.3542945384979248, -0.3345513939857483, -0.31480827927589417, -0.29506513476371765, -0.2753220200538635, -0.255578875541687, -0.2358357459306717, -0.21609261631965637, -0.19634947180747986, -0.17660634219646454, -0.15686321258544922, -0.1371200680732727, -0.11737693846225739, -0.09763380885124207, -0.07789067924022675, -0.05814754217863083, -0.03840440884232521, -0.018661275506019592, 0.0010818541049957275, 0.020824991166591644, 0.04056812822818756, 0.06031125783920288, 0.0800543874502182, 0.09979752451181412, 0.11954066157341003, 0.13928379118442535, 0.15902692079544067, 0.1787700653076172, 0.1985131949186325, 0.21825635433197021, 0.23799948394298553, 0.25774261355400085, 0.27748575806617737, 0.2972288727760315, 0.316972017288208, 0.3367151618003845, 0.35645830631256104, 0.37620142102241516, 0.3959445655345917, 0.4156876802444458, 0.4354308247566223, 0.45517396926879883, 0.47491708397865295, 0.49466022849082947, 0.5144033432006836, 0.5341464877128601, 0.5538896322250366, 0.5736327767372131, 0.5933758616447449, 0.6131190061569214, 0.6328621506690979, 0.6526052951812744, 0.6723484396934509, 0.6920915842056274, 0.711834728717804, 0.7315778732299805, 0.7513209581375122, 0.7710641026496887, 0.7908072471618652, 0.8105503916740417, 0.8302935361862183, 0.85003662109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 13.0, 17.0, 11.0, 18.0, 12.0, 28.0, 25.0, 23.0, 28.0, 44.0, 25.0, 54.0, 37.0, 53.0, 37.0, 41.0, 45.0, 40.0, 46.0, 44.0, 36.0, 38.0, 30.0, 30.0, 41.0, 26.0, 24.0, 21.0, 20.0, 11.0, 13.0, 10.0, 10.0, 4.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.21093696355819702, -0.2046351581811905, -0.19833336770534515, -0.19203156232833862, -0.1857297718524933, -0.17942796647548676, -0.17312616109848022, -0.1668243706226349, -0.16052256524562836, -0.15422075986862183, -0.1479189693927765, -0.14161716401576996, -0.13531535863876343, -0.1290135681629181, -0.12271176278591156, -0.11640996485948563, -0.11010816693305969, -0.10380636900663376, -0.09750457108020782, -0.0912027657032013, -0.08490096777677536, -0.07859916985034943, -0.0722973644733429, -0.06599556654691696, -0.05969376862049103, -0.053391970694065094, -0.04709016904234886, -0.04078836739063263, -0.034486569464206696, -0.02818477153778076, -0.02188296988606453, -0.015581168234348297, -0.009279370307922363, -0.00297757051885128, 0.003324229270219803, 0.009626029059290886, 0.01592782884836197, 0.022229626774787903, 0.028531428426504135, 0.03483323007822037, 0.0411350280046463, 0.047436825931072235, 0.05373862758278847, 0.0600404292345047, 0.06634222716093063, 0.07264402508735657, 0.0789458304643631, 0.08524762839078903, 0.09154942631721497, 0.0978512242436409, 0.10415302217006683, 0.11045482754707336, 0.1167566254734993, 0.12305842339992523, 0.12936022877693176, 0.1356620192527771, 0.14196382462978363, 0.14826563000679016, 0.1545674204826355, 0.16086922585964203, 0.16717103123664856, 0.1734728217124939, 0.17977462708950043, 0.18607643246650696, 0.1923782229423523]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 16.0, 9.0, 8.0, 23.0, 32.0, 43.0, 59.0, 78.0, 119.0, 170.0, 211.0, 322.0, 520.0, 825.0, 1396.0, 2684.0, 5322.0, 11637.0, 28885.0, 84075.0, 254551.0, 384432.0, 176998.0, 56852.0, 20942.0, 8841.0, 4263.0, 2139.0, 1145.0, 696.0, 424.0, 282.0, 174.0, 121.0, 76.0, 49.0, 38.0, 35.0, 13.0, 10.0, 11.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0242156982421875, -0.023329496383666992, -0.022443294525146484, -0.021557092666625977, -0.02067089080810547, -0.01978468894958496, -0.018898487091064453, -0.018012285232543945, -0.017126083374023438, -0.01623988151550293, -0.015353679656982422, -0.014467477798461914, -0.013581275939941406, -0.012695074081420898, -0.01180887222290039, -0.010922670364379883, -0.010036468505859375, -0.009150266647338867, -0.00826406478881836, -0.0073778629302978516, -0.006491661071777344, -0.005605459213256836, -0.004719257354736328, -0.0038330554962158203, -0.0029468536376953125, -0.0020606517791748047, -0.0011744499206542969, -0.00028824806213378906, 0.0005979537963867188, 0.0014841556549072266, 0.0023703575134277344, 0.003256559371948242, 0.00414276123046875, 0.005028963088989258, 0.005915164947509766, 0.0068013668060302734, 0.007687568664550781, 0.008573770523071289, 0.009459972381591797, 0.010346174240112305, 0.011232376098632812, 0.01211857795715332, 0.013004779815673828, 0.013890981674194336, 0.014777183532714844, 0.01566338539123535, 0.01654958724975586, 0.017435789108276367, 0.018321990966796875, 0.019208192825317383, 0.02009439468383789, 0.0209805965423584, 0.021866798400878906, 0.022753000259399414, 0.023639202117919922, 0.02452540397644043, 0.025411605834960938, 0.026297807693481445, 0.027184009552001953, 0.02807021141052246, 0.02895641326904297, 0.029842615127563477, 0.030728816986083984, 0.03161501884460449, 0.032501220703125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 11.0, 10.0, 8.0, 22.0, 26.0, 27.0, 44.0, 59.0, 43.0, 65.0, 71.0, 71.0, 74.0, 76.0, 68.0, 72.0, 59.0, 40.0, 33.0, 34.0, 19.0, 16.0, 7.0, 17.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0347900390625, -0.033720970153808594, -0.03265190124511719, -0.03158283233642578, -0.030513763427734375, -0.02944469451904297, -0.028375625610351562, -0.027306556701660156, -0.02623748779296875, -0.025168418884277344, -0.024099349975585938, -0.02303028106689453, -0.021961212158203125, -0.02089214324951172, -0.019823074340820312, -0.018754005432128906, -0.0176849365234375, -0.016615867614746094, -0.015546798706054688, -0.014477729797363281, -0.013408660888671875, -0.012339591979980469, -0.011270523071289062, -0.010201454162597656, -0.00913238525390625, -0.008063316345214844, -0.0069942474365234375, -0.005925178527832031, -0.004856109619140625, -0.0037870407104492188, -0.0027179718017578125, -0.0016489028930664062, -0.000579833984375, 0.0004892349243164062, 0.0015583038330078125, 0.0026273727416992188, 0.003696441650390625, 0.004765510559082031, 0.0058345794677734375, 0.006903648376464844, 0.00797271728515625, 0.009041786193847656, 0.010110855102539062, 0.011179924011230469, 0.012248992919921875, 0.013318061828613281, 0.014387130737304688, 0.015456199645996094, 0.0165252685546875, 0.017594337463378906, 0.018663406372070312, 0.01973247528076172, 0.020801544189453125, 0.02187061309814453, 0.022939682006835938, 0.024008750915527344, 0.02507781982421875, 0.026146888732910156, 0.027215957641601562, 0.02828502655029297, 0.029354095458984375, 0.03042316436767578, 0.03149223327636719, 0.032561302185058594, 0.03363037109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 8.0, 15.0, 16.0, 23.0, 29.0, 66.0, 115.0, 179.0, 287.0, 541.0, 1173.0, 2908.0, 12435.0, 198881.0, 781689.0, 40970.0, 5285.0, 1883.0, 901.0, 453.0, 251.0, 151.0, 98.0, 54.0, 53.0, 28.0, 18.0, 16.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059295654296875, -0.057268619537353516, -0.05524158477783203, -0.05321455001831055, -0.05118751525878906, -0.04916048049926758, -0.047133445739746094, -0.04510641098022461, -0.043079376220703125, -0.04105234146118164, -0.039025306701660156, -0.03699827194213867, -0.03497123718261719, -0.0329442024230957, -0.03091716766357422, -0.028890132904052734, -0.02686309814453125, -0.024836063385009766, -0.02280902862548828, -0.020781993865966797, -0.018754959106445312, -0.016727924346923828, -0.014700889587402344, -0.01267385482788086, -0.010646820068359375, -0.00861978530883789, -0.006592750549316406, -0.004565715789794922, -0.0025386810302734375, -0.0005116462707519531, 0.0015153884887695312, 0.0035424232482910156, 0.0055694580078125, 0.007596492767333984, 0.009623527526855469, 0.011650562286376953, 0.013677597045898438, 0.015704631805419922, 0.017731666564941406, 0.01975870132446289, 0.021785736083984375, 0.02381277084350586, 0.025839805603027344, 0.027866840362548828, 0.029893875122070312, 0.0319209098815918, 0.03394794464111328, 0.035974979400634766, 0.03800201416015625, 0.040029048919677734, 0.04205608367919922, 0.0440831184387207, 0.04611015319824219, 0.04813718795776367, 0.050164222717285156, 0.05219125747680664, 0.054218292236328125, 0.05624532699584961, 0.058272361755371094, 0.06029939651489258, 0.06232643127441406, 0.06435346603393555, 0.06638050079345703, 0.06840753555297852, 0.0704345703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 3.0, 7.0, 7.0, 12.0, 16.0, 17.0, 30.0, 27.0, 36.0, 38.0, 47.0, 35.0, 49.0, 51.0, 51.0, 62.0, 48.0, 50.0, 50.0, 56.0, 54.0, 34.0, 25.0, 30.0, 21.0, 26.0, 30.0, 22.0, 10.0, 15.0, 10.0, 6.0, 4.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07647705078125, -0.07359695434570312, -0.07071685791015625, -0.06783676147460938, -0.0649566650390625, -0.062076568603515625, -0.05919647216796875, -0.056316375732421875, -0.053436279296875, -0.050556182861328125, -0.04767608642578125, -0.044795989990234375, -0.0419158935546875, -0.039035797119140625, -0.03615570068359375, -0.033275604248046875, -0.0303955078125, -0.027515411376953125, -0.02463531494140625, -0.021755218505859375, -0.0188751220703125, -0.015995025634765625, -0.01311492919921875, -0.010234832763671875, -0.007354736328125, -0.004474639892578125, -0.00159454345703125, 0.001285552978515625, 0.0041656494140625, 0.007045745849609375, 0.00992584228515625, 0.012805938720703125, 0.01568603515625, 0.018566131591796875, 0.02144622802734375, 0.024326324462890625, 0.0272064208984375, 0.030086517333984375, 0.03296661376953125, 0.035846710205078125, 0.038726806640625, 0.041606903076171875, 0.04448699951171875, 0.047367095947265625, 0.0502471923828125, 0.053127288818359375, 0.05600738525390625, 0.058887481689453125, 0.061767578125, 0.06464767456054688, 0.06752777099609375, 0.07040786743164062, 0.0732879638671875, 0.07616806030273438, 0.07904815673828125, 0.08192825317382812, 0.084808349609375, 0.08768844604492188, 0.09056854248046875, 0.09344863891601562, 0.0963287353515625, 0.09920883178710938, 0.10208892822265625, 0.10496902465820312, 0.10784912109375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 20.0, 12.0, 19.0, 17.0, 33.0, 32.0, 67.0, 105.0, 169.0, 322.0, 718.0, 1777.0, 6151.0, 49037.0, 922425.0, 57682.0, 6532.0, 1886.0, 655.0, 355.0, 180.0, 100.0, 65.0, 49.0, 35.0, 24.0, 17.0, 12.0, 10.0, 6.0, 12.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0243072509765625, -0.02351093292236328, -0.022714614868164062, -0.021918296813964844, -0.021121978759765625, -0.020325660705566406, -0.019529342651367188, -0.01873302459716797, -0.01793670654296875, -0.01714038848876953, -0.016344070434570312, -0.015547752380371094, -0.014751434326171875, -0.013955116271972656, -0.013158798217773438, -0.012362480163574219, -0.011566162109375, -0.010769844055175781, -0.009973526000976562, -0.009177207946777344, -0.008380889892578125, -0.007584571838378906, -0.0067882537841796875, -0.005991935729980469, -0.00519561767578125, -0.004399299621582031, -0.0036029815673828125, -0.0028066635131835938, -0.002010345458984375, -0.0012140274047851562, -0.0004177093505859375, 0.00037860870361328125, 0.0011749267578125, 0.0019712448120117188, 0.0027675628662109375, 0.0035638809204101562, 0.004360198974609375, 0.005156517028808594, 0.0059528350830078125, 0.006749153137207031, 0.00754547119140625, 0.008341789245605469, 0.009138107299804688, 0.009934425354003906, 0.010730743408203125, 0.011527061462402344, 0.012323379516601562, 0.013119697570800781, 0.013916015625, 0.014712333679199219, 0.015508651733398438, 0.016304969787597656, 0.017101287841796875, 0.017897605895996094, 0.018693923950195312, 0.01949024200439453, 0.02028656005859375, 0.02108287811279297, 0.021879196166992188, 0.022675514221191406, 0.023471832275390625, 0.024268150329589844, 0.025064468383789062, 0.02586078643798828, 0.0266571044921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 0.0, 4.0, 7.0, 8.0, 10.0, 15.0, 15.0, 30.0, 17.0, 40.0, 31.0, 42.0, 42.0, 48.0, 68.0, 43.0, 74.0, 58.0, 74.0, 38.0, 53.0, 37.0, 60.0, 28.0, 33.0, 17.0, 36.0, 9.0, 12.0, 15.0, 7.0, 13.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4836273193359375e-06, -5.336478352546692e-06, -5.189329385757446e-06, -5.042180418968201e-06, -4.895031452178955e-06, -4.7478824853897095e-06, -4.600733518600464e-06, -4.453584551811218e-06, -4.306435585021973e-06, -4.159286618232727e-06, -4.0121376514434814e-06, -3.864988684654236e-06, -3.7178397178649902e-06, -3.5706907510757446e-06, -3.423541784286499e-06, -3.2763928174972534e-06, -3.129243850708008e-06, -2.982094883918762e-06, -2.8349459171295166e-06, -2.687796950340271e-06, -2.5406479835510254e-06, -2.3934990167617798e-06, -2.246350049972534e-06, -2.0992010831832886e-06, -1.952052116394043e-06, -1.8049031496047974e-06, -1.6577541828155518e-06, -1.5106052160263062e-06, -1.3634562492370605e-06, -1.216307282447815e-06, -1.0691583156585693e-06, -9.220093488693237e-07, -7.748603820800781e-07, -6.277114152908325e-07, -4.805624485015869e-07, -3.334134817123413e-07, -1.862645149230957e-07, -3.91155481338501e-08, 1.0803341865539551e-07, 2.551823854446411e-07, 4.023313522338867e-07, 5.494803190231323e-07, 6.966292858123779e-07, 8.437782526016235e-07, 9.909272193908691e-07, 1.1380761861801147e-06, 1.2852251529693604e-06, 1.432374119758606e-06, 1.5795230865478516e-06, 1.7266720533370972e-06, 1.8738210201263428e-06, 2.0209699869155884e-06, 2.168118953704834e-06, 2.3152679204940796e-06, 2.462416887283325e-06, 2.609565854072571e-06, 2.7567148208618164e-06, 2.903863787651062e-06, 3.0510127544403076e-06, 3.1981617212295532e-06, 3.345310688018799e-06, 3.4924596548080444e-06, 3.63960862159729e-06, 3.7867575883865356e-06, 3.933906555175781e-06]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 5.0, 14.0, 19.0, 21.0, 33.0, 41.0, 82.0, 127.0, 237.0, 556.0, 1859.0, 10905.0, 387242.0, 629610.0, 14222.0, 2291.0, 630.0, 254.0, 134.0, 86.0, 56.0, 40.0, 18.0, 21.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027069091796875, -0.026250123977661133, -0.025431156158447266, -0.0246121883392334, -0.02379322052001953, -0.022974252700805664, -0.022155284881591797, -0.02133631706237793, -0.020517349243164062, -0.019698381423950195, -0.018879413604736328, -0.01806044578552246, -0.017241477966308594, -0.016422510147094727, -0.01560354232788086, -0.014784574508666992, -0.013965606689453125, -0.013146638870239258, -0.01232767105102539, -0.011508703231811523, -0.010689735412597656, -0.009870767593383789, -0.009051799774169922, -0.008232831954956055, -0.0074138641357421875, -0.00659489631652832, -0.005775928497314453, -0.004956960678100586, -0.004137992858886719, -0.0033190250396728516, -0.0025000572204589844, -0.0016810894012451172, -0.00086212158203125, -4.315376281738281e-05, 0.0007758140563964844, 0.0015947818756103516, 0.0024137496948242188, 0.003232717514038086, 0.004051685333251953, 0.00487065315246582, 0.0056896209716796875, 0.006508588790893555, 0.007327556610107422, 0.008146524429321289, 0.008965492248535156, 0.009784460067749023, 0.01060342788696289, 0.011422395706176758, 0.012241363525390625, 0.013060331344604492, 0.01387929916381836, 0.014698266983032227, 0.015517234802246094, 0.01633620262145996, 0.017155170440673828, 0.017974138259887695, 0.018793106079101562, 0.01961207389831543, 0.020431041717529297, 0.021250009536743164, 0.02206897735595703, 0.0228879451751709, 0.023706912994384766, 0.024525880813598633, 0.0253448486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 24.0, 31.0, 41.0, 69.0, 82.0, 139.0, 141.0, 142.0, 108.0, 72.0, 51.0, 28.0, 21.0, 6.0, 10.0, 5.0, 4.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254669189453125, -0.024540185928344727, -0.023613452911376953, -0.02268671989440918, -0.021759986877441406, -0.020833253860473633, -0.01990652084350586, -0.018979787826538086, -0.018053054809570312, -0.01712632179260254, -0.016199588775634766, -0.015272855758666992, -0.014346122741699219, -0.013419389724731445, -0.012492656707763672, -0.011565923690795898, -0.010639190673828125, -0.009712457656860352, -0.008785724639892578, -0.007858991622924805, -0.006932258605957031, -0.006005525588989258, -0.005078792572021484, -0.004152059555053711, -0.0032253265380859375, -0.002298593521118164, -0.0013718605041503906, -0.0004451274871826172, 0.00048160552978515625, 0.0014083385467529297, 0.002335071563720703, 0.0032618045806884766, 0.00418853759765625, 0.0051152706146240234, 0.006042003631591797, 0.00696873664855957, 0.007895469665527344, 0.008822202682495117, 0.00974893569946289, 0.010675668716430664, 0.011602401733398438, 0.012529134750366211, 0.013455867767333984, 0.014382600784301758, 0.015309333801269531, 0.016236066818237305, 0.017162799835205078, 0.01808953285217285, 0.019016265869140625, 0.0199429988861084, 0.020869731903076172, 0.021796464920043945, 0.02272319793701172, 0.023649930953979492, 0.024576663970947266, 0.02550339698791504, 0.026430130004882812, 0.027356863021850586, 0.02828359603881836, 0.029210329055786133, 0.030137062072753906, 0.03106379508972168, 0.03199052810668945, 0.03291726112365723, 0.033843994140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 14.0, 76.0, 687.0, 213.0, 15.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4092322587966919, -0.35650432109832764, -0.3037763833999634, -0.25104841589927673, -0.19832047820091248, -0.14559254050254822, -0.09286457300186157, -0.040136635303497314, 0.012591302394866943, 0.0653192475438118, 0.11804719269275665, 0.1707751452922821, 0.22350308299064636, 0.2762310206890106, 0.32895898818969727, 0.3816869258880615, 0.4344148635864258, 0.48714280128479004, 0.5398707389831543, 0.5925986766815186, 0.6453266143798828, 0.6980545520782471, 0.7507825493812561, 0.8035104870796204, 0.8562384247779846, 0.9089663624763489, 0.9616943001747131, 1.0144222974777222, 1.0671502351760864, 1.1198781728744507, 1.172606110572815, 1.2253340482711792, 1.278062105178833, 1.3307900428771973, 1.3835179805755615, 1.4362459182739258, 1.48897385597229, 1.5417017936706543, 1.5944297313690186, 1.6471576690673828, 1.699885606765747, 1.7526135444641113, 1.8053414821624756, 1.8580694198608398, 1.910797357559204, 1.9635252952575684, 2.0162532329559326, 2.068981170654297, 2.1217093467712402, 2.1744372844696045, 2.2271652221679688, 2.279893159866333, 2.3326210975646973, 2.3853490352630615, 2.438076972961426, 2.49080491065979, 2.5435328483581543, 2.5962607860565186, 2.648988723754883, 2.701716661453247, 2.7544445991516113, 2.8071725368499756, 2.85990047454834, 2.912628412246704, 2.9653563499450684]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 10.0, 11.0, 13.0, 14.0, 14.0, 19.0, 14.0, 27.0, 35.0, 29.0, 32.0, 41.0, 38.0, 44.0, 54.0, 54.0, 55.0, 64.0, 62.0, 41.0, 40.0, 29.0, 31.0, 41.0, 27.0, 16.0, 29.0, 18.0, 17.0, 13.0, 13.0, 6.0, 7.0, 9.0, 5.0, 4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.33547884225845337, -0.32543352246284485, -0.31538820266723633, -0.3053428828716278, -0.2952975630760193, -0.28525227308273315, -0.27520692348480225, -0.2651616334915161, -0.2551163136959076, -0.24507099390029907, -0.23502567410469055, -0.22498035430908203, -0.2149350494146347, -0.20488972961902618, -0.19484440982341766, -0.18479910492897034, -0.17475377023220062, -0.1647084504365921, -0.15466313064098358, -0.14461782574653625, -0.13457250595092773, -0.12452718615531921, -0.1144818663597107, -0.10443655401468277, -0.09439123421907425, -0.08434591442346573, -0.0743006020784378, -0.06425528228282928, -0.05420996621251106, -0.04416465014219284, -0.03411933034658432, -0.024074018001556396, -0.014028698205947876, -0.003983381204307079, 0.006061935797333717, 0.01610725373029709, 0.02615256980061531, 0.03619788587093353, 0.04624320566654205, 0.05628851801156998, 0.0663338378071785, 0.07637915760278702, 0.08642446994781494, 0.09646978974342346, 0.10651510953903198, 0.1165604218840599, 0.12660574913024902, 0.13665105402469635, 0.14669637382030487, 0.1567416936159134, 0.1667870134115219, 0.17683231830596924, 0.18687763810157776, 0.19692295789718628, 0.2069682776927948, 0.21701359748840332, 0.22705891728401184, 0.23710423707962036, 0.24714955687522888, 0.2571948766708374, 0.2672401964664459, 0.27728551626205444, 0.2873308062553406, 0.2973761260509491, 0.3074214458465576]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 14.0, 29.0, 69.0, 172.0, 387.0, 151502.0, 4041372.0, 423.0, 181.0, 71.0, 40.0, 17.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1494140625, -1.1264419555664062, -1.1034698486328125, -1.0804977416992188, -1.057525634765625, -1.0345535278320312, -1.0115814208984375, -0.9886093139648438, -0.96563720703125, -0.9426651000976562, -0.9196929931640625, -0.8967208862304688, -0.873748779296875, -0.8507766723632812, -0.8278045654296875, -0.8048324584960938, -0.7818603515625, -0.7588882446289062, -0.7359161376953125, -0.7129440307617188, -0.689971923828125, -0.6669998168945312, -0.6440277099609375, -0.6210556030273438, -0.59808349609375, -0.5751113891601562, -0.5521392822265625, -0.5291671752929688, -0.506195068359375, -0.48322296142578125, -0.4602508544921875, -0.43727874755859375, -0.414306640625, -0.39133453369140625, -0.3683624267578125, -0.34539031982421875, -0.322418212890625, -0.29944610595703125, -0.2764739990234375, -0.25350189208984375, -0.23052978515625, -0.20755767822265625, -0.1845855712890625, -0.16161346435546875, -0.138641357421875, -0.11566925048828125, -0.0926971435546875, -0.06972503662109375, -0.0467529296875, -0.02378082275390625, -0.0008087158203125, 0.02216339111328125, 0.045135498046875, 0.06810760498046875, 0.0910797119140625, 0.11405181884765625, 0.13702392578125, 0.15999603271484375, 0.1829681396484375, 0.20594024658203125, 0.228912353515625, 0.25188446044921875, 0.2748565673828125, 0.29782867431640625, 0.32080078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 6.0, 14.0, 19.0, 28.0, 31.0, 41.0, 36.0, 62.0, 62.0, 66.0, 81.0, 86.0, 79.0, 78.0, 58.0, 59.0, 45.0, 30.0, 19.0, 22.0, 19.0, 17.0, 8.0, 9.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.033538818359375, -0.03247213363647461, -0.03140544891357422, -0.030338764190673828, -0.029272079467773438, -0.028205394744873047, -0.027138710021972656, -0.026072025299072266, -0.025005340576171875, -0.023938655853271484, -0.022871971130371094, -0.021805286407470703, -0.020738601684570312, -0.019671916961669922, -0.01860523223876953, -0.01753854751586914, -0.01647186279296875, -0.01540517807006836, -0.014338493347167969, -0.013271808624267578, -0.012205123901367188, -0.011138439178466797, -0.010071754455566406, -0.009005069732666016, -0.007938385009765625, -0.006871700286865234, -0.005805015563964844, -0.004738330841064453, -0.0036716461181640625, -0.002604961395263672, -0.0015382766723632812, -0.0004715919494628906, 0.0005950927734375, 0.0016617774963378906, 0.0027284622192382812, 0.003795146942138672, 0.0048618316650390625, 0.005928516387939453, 0.006995201110839844, 0.008061885833740234, 0.009128570556640625, 0.010195255279541016, 0.011261940002441406, 0.012328624725341797, 0.013395309448242188, 0.014461994171142578, 0.015528678894042969, 0.01659536361694336, 0.01766204833984375, 0.01872873306274414, 0.01979541778564453, 0.020862102508544922, 0.021928787231445312, 0.022995471954345703, 0.024062156677246094, 0.025128841400146484, 0.026195526123046875, 0.027262210845947266, 0.028328895568847656, 0.029395580291748047, 0.030462265014648438, 0.03152894973754883, 0.03259563446044922, 0.03366231918334961, 0.03472900390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 12.0, 10.0, 26.0, 31.0, 48.0, 72.0, 110.0, 156.0, 279.0, 633.0, 2457.0, 20579.0, 3685429.0, 468962.0, 12127.0, 2131.0, 604.0, 280.0, 124.0, 65.0, 53.0, 30.0, 22.0, 11.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09588623046875, -0.09341955184936523, -0.09095287322998047, -0.0884861946105957, -0.08601951599121094, -0.08355283737182617, -0.0810861587524414, -0.07861948013305664, -0.07615280151367188, -0.07368612289428711, -0.07121944427490234, -0.06875276565551758, -0.06628608703613281, -0.06381940841674805, -0.06135272979736328, -0.058886051177978516, -0.05641937255859375, -0.053952693939208984, -0.05148601531982422, -0.04901933670043945, -0.04655265808105469, -0.04408597946166992, -0.041619300842285156, -0.03915262222290039, -0.036685943603515625, -0.03421926498413086, -0.031752586364746094, -0.029285907745361328, -0.026819229125976562, -0.024352550506591797, -0.02188587188720703, -0.019419193267822266, -0.0169525146484375, -0.014485836029052734, -0.012019157409667969, -0.009552478790283203, -0.0070858001708984375, -0.004619121551513672, -0.0021524429321289062, 0.0003142356872558594, 0.002780914306640625, 0.005247592926025391, 0.007714271545410156, 0.010180950164794922, 0.012647628784179688, 0.015114307403564453, 0.01758098602294922, 0.020047664642333984, 0.02251434326171875, 0.024981021881103516, 0.02744770050048828, 0.029914379119873047, 0.03238105773925781, 0.03484773635864258, 0.037314414978027344, 0.03978109359741211, 0.042247772216796875, 0.04471445083618164, 0.047181129455566406, 0.04964780807495117, 0.05211448669433594, 0.0545811653137207, 0.05704784393310547, 0.059514522552490234, 0.061981201171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 10.0, 21.0, 26.0, 56.0, 146.0, 707.0, 2230.0, 635.0, 104.0, 44.0, 26.0, 20.0, 10.0, 11.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0743408203125, -0.0721139907836914, -0.06988716125488281, -0.06766033172607422, -0.06543350219726562, -0.06320667266845703, -0.06097984313964844, -0.058753013610839844, -0.05652618408203125, -0.054299354553222656, -0.05207252502441406, -0.04984569549560547, -0.047618865966796875, -0.04539203643798828, -0.04316520690917969, -0.040938377380371094, -0.0387115478515625, -0.036484718322753906, -0.03425788879394531, -0.03203105926513672, -0.029804229736328125, -0.02757740020751953, -0.025350570678710938, -0.023123741149902344, -0.02089691162109375, -0.018670082092285156, -0.016443252563476562, -0.014216423034667969, -0.011989593505859375, -0.009762763977050781, -0.0075359344482421875, -0.005309104919433594, -0.003082275390625, -0.0008554458618164062, 0.0013713836669921875, 0.0035982131958007812, 0.005825042724609375, 0.008051872253417969, 0.010278701782226562, 0.012505531311035156, 0.01473236083984375, 0.016959190368652344, 0.019186019897460938, 0.02141284942626953, 0.023639678955078125, 0.02586650848388672, 0.028093338012695312, 0.030320167541503906, 0.0325469970703125, 0.034773826599121094, 0.03700065612792969, 0.03922748565673828, 0.041454315185546875, 0.04368114471435547, 0.04590797424316406, 0.048134803771972656, 0.05036163330078125, 0.052588462829589844, 0.05481529235839844, 0.05704212188720703, 0.059268951416015625, 0.06149578094482422, 0.06372261047363281, 0.0659494400024414, 0.06817626953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 7.0, 21.0, 40.0, 207.0, 555.0, 154.0, 18.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5451600551605225, -1.50963294506073, -1.4741058349609375, -1.4385786056518555, -1.403051495552063, -1.3675243854522705, -1.331997275352478, -1.2964701652526855, -1.2609429359436035, -1.225415825843811, -1.1898887157440186, -1.1543614864349365, -1.118834376335144, -1.0833072662353516, -1.047780156135559, -1.0122530460357666, -0.9767258763313293, -0.9411987662315369, -0.9056715965270996, -0.8701444864273071, -0.8346173167228699, -0.7990902066230774, -0.7635630369186401, -0.7280359268188477, -0.6925088167190552, -0.6569817066192627, -0.6214545369148254, -0.585927426815033, -0.5504002571105957, -0.5148731470108032, -0.47934600710868835, -0.4438188672065735, -0.40829163789749146, -0.3727644979953766, -0.3372373580932617, -0.30171024799346924, -0.266183078289032, -0.2306559532880783, -0.19512882828712463, -0.15960168838500977, -0.1240745484828949, -0.08854740858078003, -0.05302027612924576, -0.017493143677711487, 0.01803399622440338, 0.05356113612651825, 0.08908826112747192, 0.12461540102958679, 0.16014254093170166, 0.19566968083381653, 0.2311968207359314, 0.2667239308357239, 0.30225110054016113, 0.3377782106399536, 0.3733053505420685, 0.40883249044418335, 0.4443596303462982, 0.4798867702484131, 0.5154138803482056, 0.5509410500526428, 0.5864681601524353, 0.6219953298568726, 0.657522439956665, 0.6930495500564575, 0.7285767197608948]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 10.0, 15.0, 22.0, 21.0, 28.0, 37.0, 41.0, 50.0, 67.0, 57.0, 59.0, 61.0, 66.0, 67.0, 65.0, 62.0, 37.0, 42.0, 34.0, 25.0, 24.0, 14.0, 18.0, 12.0, 12.0, 16.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24401086568832397, -0.23522941768169403, -0.22644798457622528, -0.21766653656959534, -0.2088850885629654, -0.20010364055633545, -0.1913222074508667, -0.18254075944423676, -0.1737593114376068, -0.16497786343097687, -0.15619643032550812, -0.14741498231887817, -0.13863353431224823, -0.1298520863056183, -0.12107065320014954, -0.11228920519351959, -0.10350777208805084, -0.0947263315320015, -0.08594488352537155, -0.0771634429693222, -0.06838199496269226, -0.059600554406642914, -0.05081911385059357, -0.04203766956925392, -0.033256225287914276, -0.02447478100657463, -0.015693338587880135, -0.006911896169185638, 0.001869548112154007, 0.010650992393493652, 0.019432432949543, 0.028213877230882645, 0.03699532151222229, 0.045776765793561935, 0.05455821007490158, 0.06333965063095093, 0.07212109863758087, 0.08090253919363022, 0.08968397974967957, 0.09846542775630951, 0.10724686831235886, 0.1160283088684082, 0.12480975687503815, 0.1335912048816681, 0.14237263798713684, 0.15115408599376678, 0.15993553400039673, 0.16871696710586548, 0.17749841511249542, 0.18627986311912537, 0.19506129622459412, 0.20384274423122406, 0.212624192237854, 0.22140562534332275, 0.2301870733499527, 0.23896852135658264, 0.2477499544620514, 0.25653138756752014, 0.2653128504753113, 0.27409428358078003, 0.2828757166862488, 0.2916571795940399, 0.30043861269950867, 0.3092200458049774, 0.31800150871276855]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 4.0, 12.0, 10.0, 17.0, 29.0, 37.0, 59.0, 83.0, 163.0, 305.0, 607.0, 1461.0, 4104.0, 22308.0, 546091.0, 447576.0, 19177.0, 3867.0, 1342.0, 588.0, 266.0, 158.0, 93.0, 49.0, 45.0, 25.0, 20.0, 14.0, 7.0, 6.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.134765625, -0.13121604919433594, -0.12766647338867188, -0.12411689758300781, -0.12056732177734375, -0.11701774597167969, -0.11346817016601562, -0.10991859436035156, -0.1063690185546875, -0.10281944274902344, -0.09926986694335938, -0.09572029113769531, -0.09217071533203125, -0.08862113952636719, -0.08507156372070312, -0.08152198791503906, -0.077972412109375, -0.07442283630371094, -0.07087326049804688, -0.06732368469238281, -0.06377410888671875, -0.06022453308105469, -0.056674957275390625, -0.05312538146972656, -0.0495758056640625, -0.04602622985839844, -0.042476654052734375, -0.03892707824707031, -0.03537750244140625, -0.03182792663574219, -0.028278350830078125, -0.024728775024414062, -0.02117919921875, -0.017629623413085938, -0.014080047607421875, -0.010530471801757812, -0.00698089599609375, -0.0034313201904296875, 0.000118255615234375, 0.0036678314208984375, 0.0072174072265625, 0.010766983032226562, 0.014316558837890625, 0.017866134643554688, 0.02141571044921875, 0.024965286254882812, 0.028514862060546875, 0.03206443786621094, 0.035614013671875, 0.03916358947753906, 0.042713165283203125, 0.04626274108886719, 0.04981231689453125, 0.05336189270019531, 0.056911468505859375, 0.06046104431152344, 0.0640106201171875, 0.06756019592285156, 0.07110977172851562, 0.07465934753417969, 0.07820892333984375, 0.08175849914550781, 0.08530807495117188, 0.08885765075683594, 0.0924072265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 7.0, 3.0, 8.0, 5.0, 17.0, 23.0, 28.0, 28.0, 38.0, 43.0, 48.0, 62.0, 69.0, 86.0, 74.0, 71.0, 74.0, 68.0, 45.0, 44.0, 32.0, 33.0, 21.0, 16.0, 14.0, 13.0, 12.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.03338623046875, -0.03229379653930664, -0.03120136260986328, -0.030108928680419922, -0.029016494750976562, -0.027924060821533203, -0.026831626892089844, -0.025739192962646484, -0.024646759033203125, -0.023554325103759766, -0.022461891174316406, -0.021369457244873047, -0.020277023315429688, -0.019184589385986328, -0.01809215545654297, -0.01699972152709961, -0.01590728759765625, -0.01481485366821289, -0.013722419738769531, -0.012629985809326172, -0.011537551879882812, -0.010445117950439453, -0.009352684020996094, -0.008260250091552734, -0.007167816162109375, -0.006075382232666016, -0.004982948303222656, -0.003890514373779297, -0.0027980804443359375, -0.0017056465148925781, -0.0006132125854492188, 0.0004792213439941406, 0.0015716552734375, 0.0026640892028808594, 0.0037565231323242188, 0.004848957061767578, 0.0059413909912109375, 0.007033824920654297, 0.008126258850097656, 0.009218692779541016, 0.010311126708984375, 0.011403560638427734, 0.012495994567871094, 0.013588428497314453, 0.014680862426757812, 0.015773296356201172, 0.01686573028564453, 0.01795816421508789, 0.01905059814453125, 0.02014303207397461, 0.02123546600341797, 0.022327899932861328, 0.023420333862304688, 0.024512767791748047, 0.025605201721191406, 0.026697635650634766, 0.027790069580078125, 0.028882503509521484, 0.029974937438964844, 0.031067371368408203, 0.03215980529785156, 0.03325223922729492, 0.03434467315673828, 0.03543710708618164, 0.036529541015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 3.0, 8.0, 8.0, 9.0, 17.0, 24.0, 44.0, 73.0, 122.0, 251.0, 573.0, 1611.0, 5941.0, 98544.0, 912818.0, 23168.0, 3386.0, 1081.0, 392.0, 195.0, 110.0, 53.0, 40.0, 21.0, 13.0, 11.0, 9.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.12502479553222656, -0.12089920043945312, -0.11677360534667969, -0.11264801025390625, -0.10852241516113281, -0.10439682006835938, -0.10027122497558594, -0.0961456298828125, -0.09202003479003906, -0.08789443969726562, -0.08376884460449219, -0.07964324951171875, -0.07551765441894531, -0.07139205932617188, -0.06726646423339844, -0.063140869140625, -0.05901527404785156, -0.054889678955078125, -0.05076408386230469, -0.04663848876953125, -0.04251289367675781, -0.038387298583984375, -0.03426170349121094, -0.0301361083984375, -0.026010513305664062, -0.021884918212890625, -0.017759323120117188, -0.01363372802734375, -0.009508132934570312, -0.005382537841796875, -0.0012569427490234375, 0.00286865234375, 0.0069942474365234375, 0.011119842529296875, 0.015245437622070312, 0.01937103271484375, 0.023496627807617188, 0.027622222900390625, 0.03174781799316406, 0.0358734130859375, 0.03999900817871094, 0.044124603271484375, 0.04825019836425781, 0.05237579345703125, 0.05650138854980469, 0.060626983642578125, 0.06475257873535156, 0.068878173828125, 0.07300376892089844, 0.07712936401367188, 0.08125495910644531, 0.08538055419921875, 0.08950614929199219, 0.09363174438476562, 0.09775733947753906, 0.1018829345703125, 0.10600852966308594, 0.11013412475585938, 0.11425971984863281, 0.11838531494140625, 0.12251091003417969, 0.12663650512695312, 0.13076210021972656, 0.1348876953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 12.0, 5.0, 8.0, 7.0, 13.0, 18.0, 14.0, 25.0, 37.0, 35.0, 49.0, 44.0, 49.0, 75.0, 54.0, 59.0, 55.0, 67.0, 56.0, 64.0, 36.0, 43.0, 33.0, 29.0, 15.0, 20.0, 24.0, 13.0, 8.0, 4.0, 3.0, 8.0, 6.0, 2.0, 1.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.094482421875, -0.09134769439697266, -0.08821296691894531, -0.08507823944091797, -0.08194351196289062, -0.07880878448486328, -0.07567405700683594, -0.0725393295288086, -0.06940460205078125, -0.0662698745727539, -0.06313514709472656, -0.06000041961669922, -0.056865692138671875, -0.05373096466064453, -0.05059623718261719, -0.047461509704589844, -0.0443267822265625, -0.041192054748535156, -0.03805732727050781, -0.03492259979248047, -0.031787872314453125, -0.02865314483642578, -0.025518417358398438, -0.022383689880371094, -0.01924896240234375, -0.016114234924316406, -0.012979507446289062, -0.009844779968261719, -0.006710052490234375, -0.0035753250122070312, -0.0004405975341796875, 0.0026941299438476562, 0.005828857421875, 0.008963584899902344, 0.012098312377929688, 0.015233039855957031, 0.018367767333984375, 0.02150249481201172, 0.024637222290039062, 0.027771949768066406, 0.03090667724609375, 0.034041404724121094, 0.03717613220214844, 0.04031085968017578, 0.043445587158203125, 0.04658031463623047, 0.04971504211425781, 0.052849769592285156, 0.0559844970703125, 0.059119224548339844, 0.06225395202636719, 0.06538867950439453, 0.06852340698242188, 0.07165813446044922, 0.07479286193847656, 0.0779275894165039, 0.08106231689453125, 0.0841970443725586, 0.08733177185058594, 0.09046649932861328, 0.09360122680664062, 0.09673595428466797, 0.09987068176269531, 0.10300540924072266, 0.10614013671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 6.0, 19.0, 20.0, 44.0, 61.0, 95.0, 175.0, 429.0, 1002.0, 2958.0, 16133.0, 1000129.0, 21867.0, 3543.0, 1054.0, 465.0, 227.0, 110.0, 69.0, 35.0, 27.0, 18.0, 14.0, 10.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.166259765625, -0.16099166870117188, -0.15572357177734375, -0.15045547485351562, -0.1451873779296875, -0.13991928100585938, -0.13465118408203125, -0.12938308715820312, -0.124114990234375, -0.11884689331054688, -0.11357879638671875, -0.10831069946289062, -0.1030426025390625, -0.09777450561523438, -0.09250640869140625, -0.08723831176757812, -0.08197021484375, -0.07670211791992188, -0.07143402099609375, -0.06616592407226562, -0.0608978271484375, -0.055629730224609375, -0.05036163330078125, -0.045093536376953125, -0.039825439453125, -0.034557342529296875, -0.02928924560546875, -0.024021148681640625, -0.0187530517578125, -0.013484954833984375, -0.00821685791015625, -0.002948760986328125, 0.0023193359375, 0.007587432861328125, 0.01285552978515625, 0.018123626708984375, 0.0233917236328125, 0.028659820556640625, 0.03392791748046875, 0.039196014404296875, 0.044464111328125, 0.049732208251953125, 0.05500030517578125, 0.060268402099609375, 0.0655364990234375, 0.07080459594726562, 0.07607269287109375, 0.08134078979492188, 0.08660888671875, 0.09187698364257812, 0.09714508056640625, 0.10241317749023438, 0.1076812744140625, 0.11294937133789062, 0.11821746826171875, 0.12348556518554688, 0.128753662109375, 0.13402175903320312, 0.13928985595703125, 0.14455795288085938, 0.1498260498046875, 0.15509414672851562, 0.16036224365234375, 0.16563034057617188, 0.1708984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 7.0, 10.0, 34.0, 94.0, 295.0, 322.0, 156.0, 43.0, 14.0, 11.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.744529724121094e-05, -4.6370550990104675e-05, -4.529580473899841e-05, -4.422105848789215e-05, -4.314631223678589e-05, -4.2071565985679626e-05, -4.0996819734573364e-05, -3.99220734834671e-05, -3.884732723236084e-05, -3.777258098125458e-05, -3.6697834730148315e-05, -3.562308847904205e-05, -3.454834222793579e-05, -3.347359597682953e-05, -3.2398849725723267e-05, -3.1324103474617004e-05, -3.0249357223510742e-05, -2.917461097240448e-05, -2.8099864721298218e-05, -2.7025118470191956e-05, -2.5950372219085693e-05, -2.487562596797943e-05, -2.380087971687317e-05, -2.2726133465766907e-05, -2.1651387214660645e-05, -2.0576640963554382e-05, -1.950189471244812e-05, -1.8427148461341858e-05, -1.7352402210235596e-05, -1.6277655959129333e-05, -1.5202909708023071e-05, -1.4128163456916809e-05, -1.3053417205810547e-05, -1.1978670954704285e-05, -1.0903924703598022e-05, -9.82917845249176e-06, -8.754432201385498e-06, -7.679685950279236e-06, -6.604939699172974e-06, -5.5301934480667114e-06, -4.455447196960449e-06, -3.380700945854187e-06, -2.305954694747925e-06, -1.2312084436416626e-06, -1.564621925354004e-07, 9.182840585708618e-07, 1.993030309677124e-06, 3.0677765607833862e-06, 4.1425228118896484e-06, 5.217269062995911e-06, 6.292015314102173e-06, 7.366761565208435e-06, 8.441507816314697e-06, 9.51625406742096e-06, 1.0591000318527222e-05, 1.1665746569633484e-05, 1.2740492820739746e-05, 1.3815239071846008e-05, 1.488998532295227e-05, 1.5964731574058533e-05, 1.7039477825164795e-05, 1.8114224076271057e-05, 1.918897032737732e-05, 2.026371657848358e-05, 2.1338462829589844e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 11.0, 13.0, 17.0, 16.0, 21.0, 46.0, 73.0, 129.0, 275.0, 678.0, 1864.0, 8138.0, 583907.0, 442344.0, 7960.0, 1775.0, 637.0, 279.0, 130.0, 80.0, 46.0, 25.0, 21.0, 22.0, 8.0, 4.0, 2.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11474609375, -0.1112680435180664, -0.10778999328613281, -0.10431194305419922, -0.10083389282226562, -0.09735584259033203, -0.09387779235839844, -0.09039974212646484, -0.08692169189453125, -0.08344364166259766, -0.07996559143066406, -0.07648754119873047, -0.07300949096679688, -0.06953144073486328, -0.06605339050292969, -0.0625753402709961, -0.0590972900390625, -0.055619239807128906, -0.05214118957519531, -0.04866313934326172, -0.045185089111328125, -0.04170703887939453, -0.03822898864746094, -0.034750938415527344, -0.03127288818359375, -0.027794837951660156, -0.024316787719726562, -0.02083873748779297, -0.017360687255859375, -0.013882637023925781, -0.010404586791992188, -0.006926536560058594, -0.003448486328125, 2.956390380859375e-05, 0.0035076141357421875, 0.006985664367675781, 0.010463714599609375, 0.013941764831542969, 0.017419815063476562, 0.020897865295410156, 0.02437591552734375, 0.027853965759277344, 0.03133201599121094, 0.03481006622314453, 0.038288116455078125, 0.04176616668701172, 0.04524421691894531, 0.048722267150878906, 0.0522003173828125, 0.055678367614746094, 0.05915641784667969, 0.06263446807861328, 0.06611251831054688, 0.06959056854248047, 0.07306861877441406, 0.07654666900634766, 0.08002471923828125, 0.08350276947021484, 0.08698081970214844, 0.09045886993408203, 0.09393692016601562, 0.09741497039794922, 0.10089302062988281, 0.1043710708618164, 0.10784912109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 15.0, 14.0, 26.0, 48.0, 109.0, 236.0, 269.0, 126.0, 52.0, 31.0, 13.0, 11.0, 6.0, 4.0, 7.0, 1.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08648681640625, -0.08415699005126953, -0.08182716369628906, -0.0794973373413086, -0.07716751098632812, -0.07483768463134766, -0.07250785827636719, -0.07017803192138672, -0.06784820556640625, -0.06551837921142578, -0.06318855285644531, -0.060858726501464844, -0.058528900146484375, -0.056199073791503906, -0.05386924743652344, -0.05153942108154297, -0.0492095947265625, -0.04687976837158203, -0.04454994201660156, -0.042220115661621094, -0.039890289306640625, -0.037560462951660156, -0.03523063659667969, -0.03290081024169922, -0.03057098388671875, -0.02824115753173828, -0.025911331176757812, -0.023581504821777344, -0.021251678466796875, -0.018921852111816406, -0.016592025756835938, -0.014262199401855469, -0.011932373046875, -0.009602546691894531, -0.0072727203369140625, -0.004942893981933594, -0.002613067626953125, -0.00028324127197265625, 0.0020465850830078125, 0.004376411437988281, 0.00670623779296875, 0.009036064147949219, 0.011365890502929688, 0.013695716857910156, 0.016025543212890625, 0.018355369567871094, 0.020685195922851562, 0.02301502227783203, 0.0253448486328125, 0.02767467498779297, 0.030004501342773438, 0.032334327697753906, 0.034664154052734375, 0.036993980407714844, 0.03932380676269531, 0.04165363311767578, 0.04398345947265625, 0.04631328582763672, 0.04864311218261719, 0.050972938537597656, 0.053302764892578125, 0.055632591247558594, 0.05796241760253906, 0.06029224395751953, 0.0626220703125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 98.0, 673.0, 140.0, 52.0, 21.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1362041234970093, -1.0447371006011963, -0.9532701373100281, -0.8618031144142151, -0.7703361511230469, -0.6788691282272339, -0.5874021053314209, -0.4959351420402527, -0.4044681191444397, -0.3130011260509491, -0.2215341180562973, -0.1300671100616455, -0.03860011696815491, 0.05286687612533569, 0.14433389902114868, 0.2358008623123169, 0.3272678852081299, 0.4187348783016205, 0.5102018713951111, 0.6016688942909241, 0.6931358575820923, 0.7846028804779053, 0.8760699033737183, 0.9675368666648865, 1.0590038299560547, 1.1504708528518677, 1.2419378757476807, 1.333404779434204, 1.424871802330017, 1.51633882522583, 1.607805848121643, 1.699272871017456, 1.7907397747039795, 1.8822067975997925, 1.9736738204956055, 2.065140724182129, 2.1566078662872314, 2.248074769973755, 2.3395419120788574, 2.431008815765381, 2.5224757194519043, 2.6139426231384277, 2.7054097652435303, 2.7968766689300537, 2.8883438110351562, 2.9798107147216797, 3.071277618408203, 3.1627447605133057, 3.254211902618408, 3.3456788063049316, 3.437145948410034, 3.5286128520965576, 3.62007999420166, 3.7115468978881836, 3.803013801574707, 3.8944809436798096, 3.985947847366333, 4.0774149894714355, 4.168881893157959, 4.260348796844482, 4.351815700531006, 4.4432830810546875, 4.534749984741211, 4.626216888427734, 4.717683792114258]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 11.0, 10.0, 22.0, 19.0, 29.0, 44.0, 49.0, 63.0, 57.0, 78.0, 104.0, 109.0, 73.0, 63.0, 45.0, 52.0, 35.0, 30.0, 24.0, 21.0, 22.0, 6.0, 9.0, 5.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7244210839271545, -0.7024327516555786, -0.6804443597793579, -0.658456027507782, -0.636467695236206, -0.6144793033599854, -0.5924909710884094, -0.5705026388168335, -0.5485142469406128, -0.5265259146690369, -0.5045375227928162, -0.48254919052124023, -0.4605608582496643, -0.438572496175766, -0.4165841341018677, -0.39459580183029175, -0.3726074695587158, -0.3506191074848175, -0.3286307752132416, -0.30664241313934326, -0.28465408086776733, -0.262665718793869, -0.2406773567199707, -0.21868900954723358, -0.19670066237449646, -0.17471231520175934, -0.15272396802902222, -0.1307356059551239, -0.10874725878238678, -0.08675891160964966, -0.06477054953575134, -0.04278220236301422, -0.020793795585632324, 0.0011945553123950958, 0.023182906210422516, 0.045171260833740234, 0.06715960800647736, 0.08914795517921448, 0.11113631725311279, 0.13312466442584991, 0.15511301159858704, 0.17710135877132416, 0.19908970594406128, 0.2210780680179596, 0.24306641519069672, 0.26505476236343384, 0.28704312443733215, 0.30903148651123047, 0.3310198187828064, 0.3530081808567047, 0.37499651312828064, 0.39698487520217896, 0.4189732074737549, 0.4409615695476532, 0.4629499316215515, 0.48493826389312744, 0.5069266557693481, 0.5289149880409241, 0.5509033799171448, 0.5728917121887207, 0.5948800444602966, 0.6168683767318726, 0.6388567686080933, 0.6608451008796692, 0.6828334331512451]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 4.0, 2.0, 10.0, 9.0, 15.0, 37.0, 32.0, 64.0, 99.0, 196.0, 475.0, 3337.0, 3964889.0, 222695.0, 1600.0, 396.0, 157.0, 84.0, 63.0, 44.0, 20.0, 21.0, 8.0, 8.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2125244140625, -0.20642662048339844, -0.20032882690429688, -0.1942310333251953, -0.18813323974609375, -0.1820354461669922, -0.17593765258789062, -0.16983985900878906, -0.1637420654296875, -0.15764427185058594, -0.15154647827148438, -0.1454486846923828, -0.13935089111328125, -0.1332530975341797, -0.12715530395507812, -0.12105751037597656, -0.114959716796875, -0.10886192321777344, -0.10276412963867188, -0.09666633605957031, -0.09056854248046875, -0.08447074890136719, -0.07837295532226562, -0.07227516174316406, -0.0661773681640625, -0.06007957458496094, -0.053981781005859375, -0.04788398742675781, -0.04178619384765625, -0.03568840026855469, -0.029590606689453125, -0.023492813110351562, -0.01739501953125, -0.011297225952148438, -0.005199432373046875, 0.0008983612060546875, 0.00699615478515625, 0.013093948364257812, 0.019191741943359375, 0.025289535522460938, 0.0313873291015625, 0.03748512268066406, 0.043582916259765625, 0.04968070983886719, 0.05577850341796875, 0.06187629699707031, 0.06797409057617188, 0.07407188415527344, 0.080169677734375, 0.08626747131347656, 0.09236526489257812, 0.09846305847167969, 0.10456085205078125, 0.11065864562988281, 0.11675643920898438, 0.12285423278808594, 0.1289520263671875, 0.13504981994628906, 0.14114761352539062, 0.1472454071044922, 0.15334320068359375, 0.1594409942626953, 0.16553878784179688, 0.17163658142089844, 0.177734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 13.0, 20.0, 22.0, 34.0, 32.0, 38.0, 60.0, 48.0, 63.0, 73.0, 92.0, 57.0, 74.0, 53.0, 63.0, 45.0, 45.0, 35.0, 22.0, 18.0, 16.0, 13.0, 10.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0289459228515625, -0.027945280075073242, -0.026944637298583984, -0.025943994522094727, -0.02494335174560547, -0.02394270896911621, -0.022942066192626953, -0.021941423416137695, -0.020940780639648438, -0.01994013786315918, -0.018939495086669922, -0.017938852310180664, -0.016938209533691406, -0.01593756675720215, -0.01493692398071289, -0.013936281204223633, -0.012935638427734375, -0.011934995651245117, -0.01093435287475586, -0.009933710098266602, -0.008933067321777344, -0.007932424545288086, -0.006931781768798828, -0.00593113899230957, -0.0049304962158203125, -0.003929853439331055, -0.002929210662841797, -0.001928567886352539, -0.0009279251098632812, 7.271766662597656e-05, 0.0010733604431152344, 0.002074003219604492, 0.00307464599609375, 0.004075288772583008, 0.005075931549072266, 0.0060765743255615234, 0.007077217102050781, 0.008077859878540039, 0.009078502655029297, 0.010079145431518555, 0.011079788208007812, 0.01208043098449707, 0.013081073760986328, 0.014081716537475586, 0.015082359313964844, 0.0160830020904541, 0.01708364486694336, 0.018084287643432617, 0.019084930419921875, 0.020085573196411133, 0.02108621597290039, 0.02208685874938965, 0.023087501525878906, 0.024088144302368164, 0.025088787078857422, 0.02608942985534668, 0.027090072631835938, 0.028090715408325195, 0.029091358184814453, 0.03009200096130371, 0.03109264373779297, 0.03209328651428223, 0.033093929290771484, 0.03409457206726074, 0.03509521484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 11.0, 14.0, 25.0, 33.0, 44.0, 65.0, 95.0, 188.0, 454.0, 1600.0, 33615.0, 4143972.0, 12707.0, 977.0, 248.0, 81.0, 46.0, 25.0, 21.0, 13.0, 15.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13271331787109375, -0.1265106201171875, -0.12030792236328125, -0.114105224609375, -0.10790252685546875, -0.1016998291015625, -0.09549713134765625, -0.08929443359375, -0.08309173583984375, -0.0768890380859375, -0.07068634033203125, -0.064483642578125, -0.05828094482421875, -0.0520782470703125, -0.04587554931640625, -0.0396728515625, -0.03347015380859375, -0.0272674560546875, -0.02106475830078125, -0.014862060546875, -0.00865936279296875, -0.0024566650390625, 0.00374603271484375, 0.00994873046875, 0.01615142822265625, 0.0223541259765625, 0.02855682373046875, 0.034759521484375, 0.04096221923828125, 0.0471649169921875, 0.05336761474609375, 0.0595703125, 0.06577301025390625, 0.0719757080078125, 0.07817840576171875, 0.084381103515625, 0.09058380126953125, 0.0967864990234375, 0.10298919677734375, 0.10919189453125, 0.11539459228515625, 0.1215972900390625, 0.12779998779296875, 0.134002685546875, 0.14020538330078125, 0.1464080810546875, 0.15261077880859375, 0.1588134765625, 0.16501617431640625, 0.1712188720703125, 0.17742156982421875, 0.183624267578125, 0.18982696533203125, 0.1960296630859375, 0.20223236083984375, 0.20843505859375, 0.21463775634765625, 0.2208404541015625, 0.22704315185546875, 0.233245849609375, 0.23944854736328125, 0.2456512451171875, 0.25185394287109375, 0.258056640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 9.0, 17.0, 27.0, 91.0, 353.0, 2727.0, 670.0, 97.0, 42.0, 18.0, 9.0, 7.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2152099609375, -0.20990657806396484, -0.2046031951904297, -0.19929981231689453, -0.19399642944335938, -0.18869304656982422, -0.18338966369628906, -0.1780862808227539, -0.17278289794921875, -0.1674795150756836, -0.16217613220214844, -0.15687274932861328, -0.15156936645507812, -0.14626598358154297, -0.1409626007080078, -0.13565921783447266, -0.1303558349609375, -0.12505245208740234, -0.11974906921386719, -0.11444568634033203, -0.10914230346679688, -0.10383892059326172, -0.09853553771972656, -0.0932321548461914, -0.08792877197265625, -0.0826253890991211, -0.07732200622558594, -0.07201862335205078, -0.06671524047851562, -0.06141185760498047, -0.05610847473144531, -0.050805091857910156, -0.045501708984375, -0.040198326110839844, -0.03489494323730469, -0.02959156036376953, -0.024288177490234375, -0.01898479461669922, -0.013681411743164062, -0.008378028869628906, -0.00307464599609375, 0.0022287368774414062, 0.0075321197509765625, 0.012835502624511719, 0.018138885498046875, 0.02344226837158203, 0.028745651245117188, 0.034049034118652344, 0.0393524169921875, 0.044655799865722656, 0.04995918273925781, 0.05526256561279297, 0.060565948486328125, 0.06586933135986328, 0.07117271423339844, 0.0764760971069336, 0.08177947998046875, 0.0870828628540039, 0.09238624572753906, 0.09768962860107422, 0.10299301147460938, 0.10829639434814453, 0.11359977722167969, 0.11890316009521484, 0.12420654296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 7.0, 2.0, 9.0, 13.0, 29.0, 48.0, 70.0, 136.0, 304.0, 243.0, 102.0, 19.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9359114170074463, -0.9024567604064941, -0.8690021634101868, -0.8355475664138794, -0.8020929098129272, -0.7686382532119751, -0.7351836562156677, -0.7017290592193604, -0.6682744026184082, -0.634819746017456, -0.6013651490211487, -0.5679105520248413, -0.5344558954238892, -0.501001238822937, -0.46754664182662964, -0.4340920150279999, -0.4006373882293701, -0.36718276143074036, -0.3337281346321106, -0.30027350783348083, -0.2668188810348511, -0.2333642542362213, -0.19990962743759155, -0.1664550006389618, -0.13300037384033203, -0.09954574704170227, -0.06609112024307251, -0.03263649344444275, 0.0008181333541870117, 0.03427276015281677, 0.06772738695144653, 0.1011820137500763, 0.1346367597579956, 0.16809138655662537, 0.20154601335525513, 0.2350006401538849, 0.26845526695251465, 0.3019098937511444, 0.33536452054977417, 0.36881914734840393, 0.4022737741470337, 0.43572840094566345, 0.4691830277442932, 0.5026376247406006, 0.5360922813415527, 0.5695469379425049, 0.6030015349388123, 0.6364561319351196, 0.6699107885360718, 0.7033654451370239, 0.7368200421333313, 0.7702746391296387, 0.8037292957305908, 0.837183952331543, 0.8706385493278503, 0.9040931463241577, 0.9375478029251099, 0.971002459526062, 1.0044569969177246, 1.0379116535186768, 1.071366310119629, 1.104820966720581, 1.1382756233215332, 1.1717301607131958, 1.205184817314148]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 4.0, 8.0, 7.0, 7.0, 10.0, 12.0, 15.0, 18.0, 36.0, 22.0, 27.0, 35.0, 37.0, 50.0, 45.0, 51.0, 46.0, 65.0, 46.0, 47.0, 44.0, 34.0, 39.0, 52.0, 30.0, 29.0, 31.0, 15.0, 13.0, 13.0, 15.0, 20.0, 17.0, 11.0, 8.0, 11.0, 6.0, 7.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3829692006111145, -0.36958047747612, -0.3561917543411255, -0.34280306100845337, -0.32941433787345886, -0.31602561473846436, -0.30263689160346985, -0.28924816846847534, -0.2758594751358032, -0.2624707520008087, -0.2490820437669754, -0.2356933206319809, -0.22230461239814758, -0.20891588926315308, -0.19552716612815857, -0.18213845789432526, -0.16874973475933075, -0.15536101162433624, -0.14197230339050293, -0.12858358025550842, -0.11519487202167511, -0.1018061488866806, -0.0884174332022667, -0.07502871751785278, -0.06164000183343887, -0.04825128614902496, -0.03486257046461105, -0.021473851054906845, -0.008085135370492935, 0.005303584039211273, 0.018692299723625183, 0.03208101540803909, 0.045469731092453, 0.05885844677686691, 0.07224716246128082, 0.08563588559627533, 0.09902459383010864, 0.11241331696510315, 0.12580204010009766, 0.13919074833393097, 0.15257945656776428, 0.1659681797027588, 0.1793568879365921, 0.1927456110715866, 0.20613431930541992, 0.21952304244041443, 0.23291176557540894, 0.24630047380924225, 0.25968921184539795, 0.27307793498039246, 0.28646665811538696, 0.2998553514480591, 0.3132440745830536, 0.3266327977180481, 0.3400215208530426, 0.3534102439880371, 0.36679893732070923, 0.38018766045570374, 0.39357638359069824, 0.40696507692337036, 0.42035380005836487, 0.4337425231933594, 0.4471312463283539, 0.4605199694633484, 0.4739086627960205]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 6.0, 6.0, 23.0, 22.0, 32.0, 56.0, 69.0, 128.0, 236.0, 316.0, 506.0, 888.0, 1519.0, 2900.0, 5217.0, 10896.0, 23653.0, 55663.0, 139813.0, 301805.0, 285137.0, 126920.0, 50177.0, 21265.0, 9873.0, 5105.0, 2625.0, 1453.0, 873.0, 504.0, 311.0, 189.0, 119.0, 70.0, 57.0, 37.0, 22.0, 19.0, 12.0, 10.0, 4.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.035491943359375, -0.034476280212402344, -0.03346061706542969, -0.03244495391845703, -0.031429290771484375, -0.03041362762451172, -0.029397964477539062, -0.028382301330566406, -0.02736663818359375, -0.026350975036621094, -0.025335311889648438, -0.02431964874267578, -0.023303985595703125, -0.02228832244873047, -0.021272659301757812, -0.020256996154785156, -0.0192413330078125, -0.018225669860839844, -0.017210006713867188, -0.01619434356689453, -0.015178680419921875, -0.014163017272949219, -0.013147354125976562, -0.012131690979003906, -0.01111602783203125, -0.010100364685058594, -0.009084701538085938, -0.008069038391113281, -0.007053375244140625, -0.006037712097167969, -0.0050220489501953125, -0.004006385803222656, -0.00299072265625, -0.0019750595092773438, -0.0009593963623046875, 5.626678466796875e-05, 0.001071929931640625, 0.0020875930786132812, 0.0031032562255859375, 0.004118919372558594, 0.00513458251953125, 0.006150245666503906, 0.0071659088134765625, 0.008181571960449219, 0.009197235107421875, 0.010212898254394531, 0.011228561401367188, 0.012244224548339844, 0.0132598876953125, 0.014275550842285156, 0.015291213989257812, 0.01630687713623047, 0.017322540283203125, 0.01833820343017578, 0.019353866577148438, 0.020369529724121094, 0.02138519287109375, 0.022400856018066406, 0.023416519165039062, 0.02443218231201172, 0.025447845458984375, 0.02646350860595703, 0.027479171752929688, 0.028494834899902344, 0.029510498046875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 8.0, 17.0, 9.0, 21.0, 17.0, 30.0, 27.0, 30.0, 30.0, 45.0, 47.0, 57.0, 37.0, 56.0, 58.0, 55.0, 49.0, 50.0, 47.0, 57.0, 40.0, 34.0, 38.0, 20.0, 25.0, 23.0, 13.0, 10.0, 14.0, 6.0, 3.0, 2.0, 10.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0283966064453125, -0.027385950088500977, -0.026375293731689453, -0.02536463737487793, -0.024353981018066406, -0.023343324661254883, -0.02233266830444336, -0.021322011947631836, -0.020311355590820312, -0.01930069923400879, -0.018290042877197266, -0.017279386520385742, -0.01626873016357422, -0.015258073806762695, -0.014247417449951172, -0.013236761093139648, -0.012226104736328125, -0.011215448379516602, -0.010204792022705078, -0.009194135665893555, -0.008183479309082031, -0.007172822952270508, -0.006162166595458984, -0.005151510238647461, -0.0041408538818359375, -0.003130197525024414, -0.0021195411682128906, -0.0011088848114013672, -9.822845458984375e-05, 0.0009124279022216797, 0.0019230842590332031, 0.0029337406158447266, 0.00394439697265625, 0.0049550533294677734, 0.005965709686279297, 0.00697636604309082, 0.007987022399902344, 0.008997678756713867, 0.01000833511352539, 0.011018991470336914, 0.012029647827148438, 0.013040304183959961, 0.014050960540771484, 0.015061616897583008, 0.01607227325439453, 0.017082929611206055, 0.018093585968017578, 0.0191042423248291, 0.020114898681640625, 0.02112555503845215, 0.022136211395263672, 0.023146867752075195, 0.02415752410888672, 0.025168180465698242, 0.026178836822509766, 0.02718949317932129, 0.028200149536132812, 0.029210805892944336, 0.03022146224975586, 0.031232118606567383, 0.032242774963378906, 0.03325343132019043, 0.03426408767700195, 0.03527474403381348, 0.036285400390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 2.0, 7.0, 10.0, 7.0, 13.0, 15.0, 22.0, 40.0, 60.0, 65.0, 129.0, 230.0, 486.0, 1125.0, 3205.0, 15055.0, 606629.0, 402186.0, 14031.0, 3095.0, 1078.0, 484.0, 227.0, 117.0, 79.0, 39.0, 33.0, 18.0, 15.0, 5.0, 7.0, 7.0, 10.0, 2.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1661376953125, -0.16094207763671875, -0.1557464599609375, -0.15055084228515625, -0.145355224609375, -0.14015960693359375, -0.1349639892578125, -0.12976837158203125, -0.12457275390625, -0.11937713623046875, -0.1141815185546875, -0.10898590087890625, -0.103790283203125, -0.09859466552734375, -0.0933990478515625, -0.08820343017578125, -0.0830078125, -0.07781219482421875, -0.0726165771484375, -0.06742095947265625, -0.062225341796875, -0.05702972412109375, -0.0518341064453125, -0.04663848876953125, -0.04144287109375, -0.03624725341796875, -0.0310516357421875, -0.02585601806640625, -0.020660400390625, -0.01546478271484375, -0.0102691650390625, -0.00507354736328125, 0.0001220703125, 0.00531768798828125, 0.0105133056640625, 0.01570892333984375, 0.020904541015625, 0.02610015869140625, 0.0312957763671875, 0.03649139404296875, 0.04168701171875, 0.04688262939453125, 0.0520782470703125, 0.05727386474609375, 0.062469482421875, 0.06766510009765625, 0.0728607177734375, 0.07805633544921875, 0.083251953125, 0.08844757080078125, 0.0936431884765625, 0.09883880615234375, 0.104034423828125, 0.10923004150390625, 0.1144256591796875, 0.11962127685546875, 0.12481689453125, 0.13001251220703125, 0.1352081298828125, 0.14040374755859375, 0.145599365234375, 0.15079498291015625, 0.1559906005859375, 0.16118621826171875, 0.1663818359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 12.0, 11.0, 12.0, 11.0, 21.0, 29.0, 41.0, 39.0, 63.0, 56.0, 66.0, 65.0, 72.0, 85.0, 68.0, 63.0, 55.0, 52.0, 47.0, 31.0, 22.0, 10.0, 18.0, 10.0, 6.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.20751953125, -0.2014923095703125, -0.195465087890625, -0.1894378662109375, -0.18341064453125, -0.1773834228515625, -0.171356201171875, -0.1653289794921875, -0.1593017578125, -0.1532745361328125, -0.147247314453125, -0.1412200927734375, -0.13519287109375, -0.1291656494140625, -0.123138427734375, -0.1171112060546875, -0.111083984375, -0.1050567626953125, -0.099029541015625, -0.0930023193359375, -0.08697509765625, -0.0809478759765625, -0.074920654296875, -0.0688934326171875, -0.0628662109375, -0.0568389892578125, -0.050811767578125, -0.0447845458984375, -0.03875732421875, -0.0327301025390625, -0.026702880859375, -0.0206756591796875, -0.0146484375, -0.0086212158203125, -0.002593994140625, 0.0034332275390625, 0.00946044921875, 0.0154876708984375, 0.021514892578125, 0.0275421142578125, 0.0335693359375, 0.0395965576171875, 0.045623779296875, 0.0516510009765625, 0.05767822265625, 0.0637054443359375, 0.069732666015625, 0.0757598876953125, 0.081787109375, 0.0878143310546875, 0.093841552734375, 0.0998687744140625, 0.10589599609375, 0.1119232177734375, 0.117950439453125, 0.1239776611328125, 0.1300048828125, 0.1360321044921875, 0.142059326171875, 0.1480865478515625, 0.15411376953125, 0.1601409912109375, 0.166168212890625, 0.1721954345703125, 0.17822265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 15.0, 18.0, 43.0, 48.0, 79.0, 127.0, 236.0, 410.0, 771.0, 1658.0, 3771.0, 9913.0, 34791.0, 915207.0, 58566.0, 13672.0, 4961.0, 2106.0, 965.0, 486.0, 254.0, 165.0, 103.0, 71.0, 27.0, 26.0, 15.0, 11.0, 4.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11749267578125, -0.11428642272949219, -0.11108016967773438, -0.10787391662597656, -0.10466766357421875, -0.10146141052246094, -0.09825515747070312, -0.09504890441894531, -0.0918426513671875, -0.08863639831542969, -0.08543014526367188, -0.08222389221191406, -0.07901763916015625, -0.07581138610839844, -0.07260513305664062, -0.06939888000488281, -0.066192626953125, -0.06298637390136719, -0.059780120849609375, -0.05657386779785156, -0.05336761474609375, -0.05016136169433594, -0.046955108642578125, -0.04374885559082031, -0.0405426025390625, -0.03733634948730469, -0.034130096435546875, -0.030923843383789062, -0.02771759033203125, -0.024511337280273438, -0.021305084228515625, -0.018098831176757812, -0.014892578125, -0.011686325073242188, -0.008480072021484375, -0.0052738189697265625, -0.00206756591796875, 0.0011386871337890625, 0.004344940185546875, 0.0075511932373046875, 0.0107574462890625, 0.013963699340820312, 0.017169952392578125, 0.020376205444335938, 0.02358245849609375, 0.026788711547851562, 0.029994964599609375, 0.03320121765136719, 0.036407470703125, 0.03961372375488281, 0.042819976806640625, 0.04602622985839844, 0.04923248291015625, 0.05243873596191406, 0.055644989013671875, 0.05885124206542969, 0.0620574951171875, 0.06526374816894531, 0.06847000122070312, 0.07167625427246094, 0.07488250732421875, 0.07808876037597656, 0.08129501342773438, 0.08450126647949219, 0.08770751953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 4.0, 14.0, 24.0, 25.0, 113.0, 384.0, 296.0, 70.0, 29.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4849853515625e-05, -6.322190165519714e-05, -6.159394979476929e-05, -5.996599793434143e-05, -5.8338046073913574e-05, -5.671009421348572e-05, -5.508214235305786e-05, -5.3454190492630005e-05, -5.182623863220215e-05, -5.019828677177429e-05, -4.8570334911346436e-05, -4.694238305091858e-05, -4.531443119049072e-05, -4.3686479330062866e-05, -4.205852746963501e-05, -4.043057560920715e-05, -3.88026237487793e-05, -3.717467188835144e-05, -3.5546720027923584e-05, -3.391876816749573e-05, -3.229081630706787e-05, -3.0662864446640015e-05, -2.9034912586212158e-05, -2.7406960725784302e-05, -2.5779008865356445e-05, -2.415105700492859e-05, -2.2523105144500732e-05, -2.0895153284072876e-05, -1.926720142364502e-05, -1.7639249563217163e-05, -1.6011297702789307e-05, -1.438334584236145e-05, -1.2755393981933594e-05, -1.1127442121505737e-05, -9.499490261077881e-06, -7.871538400650024e-06, -6.243586540222168e-06, -4.6156346797943115e-06, -2.987682819366455e-06, -1.3597309589385986e-06, 2.682209014892578e-07, 1.8961727619171143e-06, 3.5241246223449707e-06, 5.152076482772827e-06, 6.780028343200684e-06, 8.40798020362854e-06, 1.0035932064056396e-05, 1.1663883924484253e-05, 1.329183578491211e-05, 1.4919787645339966e-05, 1.6547739505767822e-05, 1.817569136619568e-05, 1.9803643226623535e-05, 2.143159508705139e-05, 2.3059546947479248e-05, 2.4687498807907104e-05, 2.631545066833496e-05, 2.7943402528762817e-05, 2.9571354389190674e-05, 3.119930624961853e-05, 3.282725811004639e-05, 3.445520997047424e-05, 3.60831618309021e-05, 3.7711113691329956e-05, 3.933906555175781e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 7.0, 2.0, 4.0, 8.0, 9.0, 26.0, 20.0, 63.0, 94.0, 192.0, 353.0, 904.0, 2406.0, 6961.0, 26171.0, 919708.0, 71859.0, 13169.0, 4017.0, 1487.0, 525.0, 265.0, 125.0, 65.0, 33.0, 26.0, 11.0, 13.0, 10.0, 3.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.125244140625, -0.12164020538330078, -0.11803627014160156, -0.11443233489990234, -0.11082839965820312, -0.1072244644165039, -0.10362052917480469, -0.10001659393310547, -0.09641265869140625, -0.09280872344970703, -0.08920478820800781, -0.0856008529663086, -0.08199691772460938, -0.07839298248291016, -0.07478904724121094, -0.07118511199951172, -0.0675811767578125, -0.06397724151611328, -0.06037330627441406, -0.056769371032714844, -0.053165435791015625, -0.049561500549316406, -0.04595756530761719, -0.04235363006591797, -0.03874969482421875, -0.03514575958251953, -0.03154182434082031, -0.027937889099121094, -0.024333953857421875, -0.020730018615722656, -0.017126083374023438, -0.013522148132324219, -0.009918212890625, -0.006314277648925781, -0.0027103424072265625, 0.0008935928344726562, 0.004497528076171875, 0.008101463317871094, 0.011705398559570312, 0.015309333801269531, 0.01891326904296875, 0.02251720428466797, 0.026121139526367188, 0.029725074768066406, 0.033329010009765625, 0.036932945251464844, 0.04053688049316406, 0.04414081573486328, 0.0477447509765625, 0.05134868621826172, 0.05495262145996094, 0.058556556701660156, 0.062160491943359375, 0.0657644271850586, 0.06936836242675781, 0.07297229766845703, 0.07657623291015625, 0.08018016815185547, 0.08378410339355469, 0.0873880386352539, 0.09099197387695312, 0.09459590911865234, 0.09819984436035156, 0.10180377960205078, 0.10540771484375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 3.0, 5.0, 4.0, 5.0, 11.0, 18.0, 9.0, 11.0, 10.0, 47.0, 99.0, 239.0, 276.0, 125.0, 34.0, 13.0, 17.0, 11.0, 4.0, 10.0, 9.0, 10.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07893180847167969, -0.07601547241210938, -0.07309913635253906, -0.07018280029296875, -0.06726646423339844, -0.06435012817382812, -0.06143379211425781, -0.0585174560546875, -0.05560111999511719, -0.052684783935546875, -0.04976844787597656, -0.04685211181640625, -0.04393577575683594, -0.041019439697265625, -0.03810310363769531, -0.035186767578125, -0.03227043151855469, -0.029354095458984375, -0.026437759399414062, -0.02352142333984375, -0.020605087280273438, -0.017688751220703125, -0.014772415161132812, -0.0118560791015625, -0.008939743041992188, -0.006023406982421875, -0.0031070709228515625, -0.00019073486328125, 0.0027256011962890625, 0.005641937255859375, 0.008558273315429688, 0.011474609375, 0.014390945434570312, 0.017307281494140625, 0.020223617553710938, 0.02313995361328125, 0.026056289672851562, 0.028972625732421875, 0.03188896179199219, 0.0348052978515625, 0.03772163391113281, 0.040637969970703125, 0.04355430603027344, 0.04647064208984375, 0.04938697814941406, 0.052303314208984375, 0.05521965026855469, 0.058135986328125, 0.06105232238769531, 0.06396865844726562, 0.06688499450683594, 0.06980133056640625, 0.07271766662597656, 0.07563400268554688, 0.07855033874511719, 0.0814666748046875, 0.08438301086425781, 0.08729934692382812, 0.09021568298339844, 0.09313201904296875, 0.09604835510253906, 0.09896469116210938, 0.10188102722167969, 0.10479736328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 26.0, 88.0, 238.0, 355.0, 144.0, 63.0, 26.0, 13.0, 16.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9866142272949219, -1.92489755153656, -1.8631807565689087, -1.8014640808105469, -1.739747405052185, -1.6780307292938232, -1.6163139343261719, -1.55459725856781, -1.4928805828094482, -1.4311639070510864, -1.369447112083435, -1.3077304363250732, -1.2460137605667114, -1.1842970848083496, -1.1225802898406982, -1.0608636140823364, -0.9991468191146851, -0.9374300837516785, -0.8757134079933167, -0.8139966726303101, -0.7522799968719482, -0.6905632615089417, -0.6288465261459351, -0.5671298503875732, -0.5054131150245667, -0.44369640946388245, -0.38197970390319824, -0.32026296854019165, -0.25854626297950745, -0.19682955741882324, -0.13511282205581665, -0.07339611649513245, -0.011679530143737793, 0.05003718286752701, 0.11175389587879181, 0.1734706163406372, 0.2351873219013214, 0.2969040274620056, 0.3586207628250122, 0.4203374683856964, 0.4820541739463806, 0.5437709093093872, 0.605487585067749, 0.6672043204307556, 0.7289210557937622, 0.790637731552124, 0.8523544669151306, 0.9140712022781372, 0.975787878036499, 1.0375045537948608, 1.0992213487625122, 1.160938024520874, 1.2226547002792358, 1.2843713760375977, 1.346088171005249, 1.4078048467636108, 1.4695215225219727, 1.5312381982803345, 1.5929549932479858, 1.6546716690063477, 1.7163883447647095, 1.7781050205230713, 1.8398218154907227, 1.9015384912490845, 1.9632552862167358]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 5.0, 15.0, 15.0, 19.0, 7.0, 16.0, 16.0, 19.0, 22.0, 20.0, 25.0, 36.0, 34.0, 32.0, 33.0, 66.0, 65.0, 90.0, 59.0, 45.0, 43.0, 43.0, 37.0, 31.0, 31.0, 31.0, 25.0, 23.0, 17.0, 10.0, 11.0, 8.0, 9.0, 8.0, 4.0, 5.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0], "bins": [-0.899845540523529, -0.8758163452148438, -0.8517871499061584, -0.8277579545974731, -0.8037287592887878, -0.7796995639801025, -0.7556703686714172, -0.7316411733627319, -0.7076119780540466, -0.6835827827453613, -0.659553587436676, -0.6355243921279907, -0.6114951968193054, -0.5874660015106201, -0.5634368062019348, -0.5394076108932495, -0.515378475189209, -0.4913492798805237, -0.4673200845718384, -0.4432908892631531, -0.4192616939544678, -0.39523249864578247, -0.37120330333709717, -0.34717410802841187, -0.32314491271972656, -0.29911571741104126, -0.27508652210235596, -0.25105732679367065, -0.22702813148498535, -0.20299893617630005, -0.17896975576877594, -0.15494056046009064, -0.13091135025024414, -0.10688215494155884, -0.08285295963287354, -0.05882377177476883, -0.03479457646608353, -0.010765381157398224, 0.013263806700706482, 0.037293002009391785, 0.06132219731807709, 0.08535139262676239, 0.10938058793544769, 0.1334097683429718, 0.1574389636516571, 0.1814681589603424, 0.2054973542690277, 0.229526549577713, 0.2535557448863983, 0.2775849401950836, 0.3016141355037689, 0.3256433308124542, 0.3496725261211395, 0.37370172142982483, 0.39773088693618774, 0.42176008224487305, 0.44578927755355835, 0.46981847286224365, 0.49384766817092896, 0.5178768634796143, 0.5419060587882996, 0.5659352540969849, 0.5899644494056702, 0.6139936447143555, 0.6380228400230408]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 11.0, 10.0, 8.0, 16.0, 13.0, 14.0, 31.0, 46.0, 58.0, 73.0, 116.0, 174.0, 410.0, 971.0, 3526.0, 18996.0, 376897.0, 3639136.0, 138014.0, 11628.0, 2450.0, 735.0, 335.0, 166.0, 124.0, 94.0, 56.0, 46.0, 30.0, 25.0, 15.0, 18.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.08142280578613281, -0.07898330688476562, -0.07654380798339844, -0.07410430908203125, -0.07166481018066406, -0.06922531127929688, -0.06678581237792969, -0.0643463134765625, -0.06190681457519531, -0.059467315673828125, -0.05702781677246094, -0.05458831787109375, -0.05214881896972656, -0.049709320068359375, -0.04726982116699219, -0.044830322265625, -0.04239082336425781, -0.039951324462890625, -0.03751182556152344, -0.03507232666015625, -0.03263282775878906, -0.030193328857421875, -0.027753829956054688, -0.0253143310546875, -0.022874832153320312, -0.020435333251953125, -0.017995834350585938, -0.01555633544921875, -0.013116836547851562, -0.010677337646484375, -0.008237838745117188, -0.00579833984375, -0.0033588409423828125, -0.000919342041015625, 0.0015201568603515625, 0.00395965576171875, 0.0063991546630859375, 0.008838653564453125, 0.011278152465820312, 0.0137176513671875, 0.016157150268554688, 0.018596649169921875, 0.021036148071289062, 0.02347564697265625, 0.025915145874023438, 0.028354644775390625, 0.030794143676757812, 0.033233642578125, 0.03567314147949219, 0.038112640380859375, 0.04055213928222656, 0.04299163818359375, 0.04543113708496094, 0.047870635986328125, 0.05031013488769531, 0.0527496337890625, 0.05518913269042969, 0.057628631591796875, 0.06006813049316406, 0.06250762939453125, 0.06494712829589844, 0.06738662719726562, 0.06982612609863281, 0.072265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 9.0, 13.0, 14.0, 22.0, 18.0, 21.0, 21.0, 32.0, 40.0, 47.0, 50.0, 48.0, 69.0, 61.0, 56.0, 74.0, 53.0, 55.0, 50.0, 49.0, 26.0, 22.0, 28.0, 24.0, 20.0, 14.0, 13.0, 11.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03350830078125, -0.03244209289550781, -0.031375885009765625, -0.030309677124023438, -0.02924346923828125, -0.028177261352539062, -0.027111053466796875, -0.026044845581054688, -0.0249786376953125, -0.023912429809570312, -0.022846221923828125, -0.021780014038085938, -0.02071380615234375, -0.019647598266601562, -0.018581390380859375, -0.017515182495117188, -0.016448974609375, -0.015382766723632812, -0.014316558837890625, -0.013250350952148438, -0.01218414306640625, -0.011117935180664062, -0.010051727294921875, -0.008985519409179688, -0.0079193115234375, -0.0068531036376953125, -0.005786895751953125, -0.0047206878662109375, -0.00365447998046875, -0.0025882720947265625, -0.001522064208984375, -0.0004558563232421875, 0.0006103515625, 0.0016765594482421875, 0.002742767333984375, 0.0038089752197265625, 0.00487518310546875, 0.0059413909912109375, 0.007007598876953125, 0.008073806762695312, 0.0091400146484375, 0.010206222534179688, 0.011272430419921875, 0.012338638305664062, 0.01340484619140625, 0.014471054077148438, 0.015537261962890625, 0.016603469848632812, 0.017669677734375, 0.018735885620117188, 0.019802093505859375, 0.020868301391601562, 0.02193450927734375, 0.023000717163085938, 0.024066925048828125, 0.025133132934570312, 0.0261993408203125, 0.027265548706054688, 0.028331756591796875, 0.029397964477539062, 0.03046417236328125, 0.03153038024902344, 0.032596588134765625, 0.03366279602050781, 0.03472900390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 9.0, 15.0, 23.0, 30.0, 45.0, 50.0, 76.0, 103.0, 128.0, 227.0, 449.0, 895.0, 6335.0, 3658135.0, 523132.0, 3105.0, 561.0, 283.0, 194.0, 131.0, 94.0, 83.0, 54.0, 35.0, 33.0, 15.0, 15.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.1972827911376953, -0.18936538696289062, -0.18144798278808594, -0.17353057861328125, -0.16561317443847656, -0.15769577026367188, -0.1497783660888672, -0.1418609619140625, -0.1339435577392578, -0.12602615356445312, -0.11810874938964844, -0.11019134521484375, -0.10227394104003906, -0.09435653686523438, -0.08643913269042969, -0.078521728515625, -0.07060432434082031, -0.06268692016601562, -0.05476951599121094, -0.04685211181640625, -0.03893470764160156, -0.031017303466796875, -0.023099899291992188, -0.0151824951171875, -0.0072650909423828125, 0.000652313232421875, 0.008569717407226562, 0.01648712158203125, 0.024404525756835938, 0.032321929931640625, 0.04023933410644531, 0.04815673828125, 0.05607414245605469, 0.06399154663085938, 0.07190895080566406, 0.07982635498046875, 0.08774375915527344, 0.09566116333007812, 0.10357856750488281, 0.1114959716796875, 0.11941337585449219, 0.12733078002929688, 0.13524818420410156, 0.14316558837890625, 0.15108299255371094, 0.15900039672851562, 0.1669178009033203, 0.174835205078125, 0.1827526092529297, 0.19067001342773438, 0.19858741760253906, 0.20650482177734375, 0.21442222595214844, 0.22233963012695312, 0.2302570343017578, 0.2381744384765625, 0.2460918426513672, 0.2540092468261719, 0.26192665100097656, 0.26984405517578125, 0.27776145935058594, 0.2856788635253906, 0.2935962677001953, 0.301513671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 18.0, 33.0, 52.0, 116.0, 486.0, 2227.0, 885.0, 159.0, 54.0, 26.0, 12.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1473388671875, -0.1413593292236328, -0.13537979125976562, -0.12940025329589844, -0.12342071533203125, -0.11744117736816406, -0.11146163940429688, -0.10548210144042969, -0.0995025634765625, -0.09352302551269531, -0.08754348754882812, -0.08156394958496094, -0.07558441162109375, -0.06960487365722656, -0.06362533569335938, -0.05764579772949219, -0.051666259765625, -0.04568672180175781, -0.039707183837890625, -0.03372764587402344, -0.02774810791015625, -0.021768569946289062, -0.015789031982421875, -0.009809494018554688, -0.0038299560546875, 0.0021495819091796875, 0.008129119873046875, 0.014108657836914062, 0.02008819580078125, 0.026067733764648438, 0.032047271728515625, 0.03802680969238281, 0.04400634765625, 0.04998588562011719, 0.055965423583984375, 0.06194496154785156, 0.06792449951171875, 0.07390403747558594, 0.07988357543945312, 0.08586311340332031, 0.0918426513671875, 0.09782218933105469, 0.10380172729492188, 0.10978126525878906, 0.11576080322265625, 0.12174034118652344, 0.12771987915039062, 0.1336994171142578, 0.139678955078125, 0.1456584930419922, 0.15163803100585938, 0.15761756896972656, 0.16359710693359375, 0.16957664489746094, 0.17555618286132812, 0.1815357208251953, 0.1875152587890625, 0.1934947967529297, 0.19947433471679688, 0.20545387268066406, 0.21143341064453125, 0.21741294860839844, 0.22339248657226562, 0.2293720245361328, 0.2353515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 8.0, 9.0, 13.0, 16.0, 29.0, 47.0, 95.0, 175.0, 207.0, 163.0, 112.0, 56.0, 26.0, 19.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.516302466392517, -1.4816023111343384, -1.4469021558761597, -1.4122021198272705, -1.3775019645690918, -1.342801809310913, -1.3081016540527344, -1.2734014987945557, -1.2387014627456665, -1.2040013074874878, -1.169301152229309, -1.13460111618042, -1.0999009609222412, -1.0652008056640625, -1.0305006504058838, -0.9958005547523499, -0.9611003994941711, -0.9264002442359924, -0.8917001485824585, -0.8569999933242798, -0.8222998976707458, -0.7875997424125671, -0.7528996467590332, -0.7181994915008545, -0.6834993362426758, -0.6487991809844971, -0.6140990853309631, -0.5793989300727844, -0.5446988344192505, -0.5099986791610718, -0.47529855370521545, -0.44059842824935913, -0.4058983325958252, -0.37119820713996887, -0.33649808168411255, -0.30179792642593384, -0.2670978307723999, -0.23239769041538239, -0.19769755005836487, -0.16299742460250854, -0.12829729914665222, -0.0935971736907959, -0.05889704078435898, -0.024196907877922058, 0.010503217577934265, 0.04520334303379059, 0.0799034833908081, 0.11460360884666443, 0.14930373430252075, 0.18400385975837708, 0.2187039852142334, 0.2534041404724121, 0.28810423612594604, 0.32280439138412476, 0.3575045168399811, 0.3922046422958374, 0.4269047677516937, 0.46160489320755005, 0.49630501866340637, 0.5310051441192627, 0.5657052993774414, 0.6004053950309753, 0.635105550289154, 0.669805645942688, 0.7045058012008667]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 5.0, 6.0, 11.0, 13.0, 11.0, 7.0, 21.0, 13.0, 11.0, 28.0, 26.0, 29.0, 32.0, 38.0, 38.0, 31.0, 33.0, 55.0, 39.0, 45.0, 50.0, 43.0, 48.0, 37.0, 30.0, 35.0, 35.0, 30.0, 27.0, 21.0, 19.0, 28.0, 20.0, 12.0, 11.0, 8.0, 9.0, 5.0, 2.0, 3.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2868998646736145, -0.27773603796958923, -0.2685721814632416, -0.2594083547592163, -0.25024449825286865, -0.24108067154884338, -0.23191684484481812, -0.22275300323963165, -0.2135891616344452, -0.20442532002925873, -0.19526147842407227, -0.186097651720047, -0.17693381011486053, -0.16776996850967407, -0.1586061418056488, -0.14944230020046234, -0.14027845859527588, -0.13111461699008942, -0.12195078283548355, -0.11278694868087769, -0.10362310707569122, -0.09445926547050476, -0.0852954313158989, -0.07613159716129303, -0.06696775555610657, -0.0578039176762104, -0.04864007979631424, -0.039476241916418076, -0.03031240403652191, -0.021148566156625748, -0.011984728276729584, -0.0028208941221237183, 0.006342947483062744, 0.015506785362958908, 0.024670623242855072, 0.033834461122751236, 0.0429982990026474, 0.052162136882543564, 0.06132597476243973, 0.0704898089170456, 0.07965365052223206, 0.08881749212741852, 0.09798132628202438, 0.10714516043663025, 0.11630900204181671, 0.12547284364700317, 0.13463667035102844, 0.1438005119562149, 0.15296435356140137, 0.16212819516658783, 0.1712920367717743, 0.18045586347579956, 0.18961970508098602, 0.19878354668617249, 0.20794737339019775, 0.21711121499538422, 0.22627505660057068, 0.23543889820575714, 0.2446027398109436, 0.25376656651496887, 0.26293039321899414, 0.2720942497253418, 0.28125807642936707, 0.29042190313339233, 0.29958575963974]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 7.0, 19.0, 13.0, 32.0, 41.0, 54.0, 87.0, 152.0, 278.0, 427.0, 760.0, 1312.0, 2376.0, 4505.0, 8872.0, 19264.0, 44956.0, 117326.0, 306672.0, 324307.0, 127834.0, 48627.0, 20681.0, 9562.0, 4707.0, 2386.0, 1378.0, 742.0, 428.0, 266.0, 139.0, 111.0, 69.0, 56.0, 31.0, 18.0, 15.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050018310546875, -0.04829597473144531, -0.046573638916015625, -0.04485130310058594, -0.04312896728515625, -0.04140663146972656, -0.039684295654296875, -0.03796195983886719, -0.0362396240234375, -0.03451728820800781, -0.032794952392578125, -0.031072616577148438, -0.02935028076171875, -0.027627944946289062, -0.025905609130859375, -0.024183273315429688, -0.0224609375, -0.020738601684570312, -0.019016265869140625, -0.017293930053710938, -0.01557159423828125, -0.013849258422851562, -0.012126922607421875, -0.010404586791992188, -0.0086822509765625, -0.0069599151611328125, -0.005237579345703125, -0.0035152435302734375, -0.00179290771484375, -7.05718994140625e-05, 0.001651763916015625, 0.0033740997314453125, 0.005096435546875, 0.0068187713623046875, 0.008541107177734375, 0.010263442993164062, 0.01198577880859375, 0.013708114624023438, 0.015430450439453125, 0.017152786254882812, 0.0188751220703125, 0.020597457885742188, 0.022319793701171875, 0.024042129516601562, 0.02576446533203125, 0.027486801147460938, 0.029209136962890625, 0.030931472778320312, 0.03265380859375, 0.03437614440917969, 0.036098480224609375, 0.03782081604003906, 0.03954315185546875, 0.04126548767089844, 0.042987823486328125, 0.04471015930175781, 0.0464324951171875, 0.04815483093261719, 0.049877166748046875, 0.05159950256347656, 0.05332183837890625, 0.05504417419433594, 0.056766510009765625, 0.05848884582519531, 0.060211181640625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 12.0, 11.0, 22.0, 15.0, 28.0, 23.0, 22.0, 43.0, 27.0, 45.0, 61.0, 46.0, 64.0, 59.0, 69.0, 65.0, 41.0, 50.0, 41.0, 26.0, 32.0, 41.0, 24.0, 26.0, 19.0, 13.0, 14.0, 11.0, 11.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.033599853515625, -0.03251934051513672, -0.03143882751464844, -0.030358314514160156, -0.029277801513671875, -0.028197288513183594, -0.027116775512695312, -0.02603626251220703, -0.02495574951171875, -0.02387523651123047, -0.022794723510742188, -0.021714210510253906, -0.020633697509765625, -0.019553184509277344, -0.018472671508789062, -0.01739215850830078, -0.0163116455078125, -0.015231132507324219, -0.014150619506835938, -0.013070106506347656, -0.011989593505859375, -0.010909080505371094, -0.009828567504882812, -0.008748054504394531, -0.00766754150390625, -0.006587028503417969, -0.0055065155029296875, -0.004426002502441406, -0.003345489501953125, -0.0022649765014648438, -0.0011844635009765625, -0.00010395050048828125, 0.0009765625, 0.0020570755004882812, 0.0031375885009765625, 0.004218101501464844, 0.005298614501953125, 0.006379127502441406, 0.0074596405029296875, 0.008540153503417969, 0.00962066650390625, 0.010701179504394531, 0.011781692504882812, 0.012862205505371094, 0.013942718505859375, 0.015023231506347656, 0.016103744506835938, 0.01718425750732422, 0.0182647705078125, 0.01934528350830078, 0.020425796508789062, 0.021506309509277344, 0.022586822509765625, 0.023667335510253906, 0.024747848510742188, 0.02582836151123047, 0.02690887451171875, 0.02798938751220703, 0.029069900512695312, 0.030150413513183594, 0.031230926513671875, 0.032311439514160156, 0.03339195251464844, 0.03447246551513672, 0.035552978515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 13.0, 12.0, 15.0, 32.0, 51.0, 73.0, 94.0, 111.0, 204.0, 315.0, 488.0, 839.0, 1540.0, 3302.0, 9292.0, 35324.0, 244159.0, 654762.0, 72635.0, 15264.0, 5100.0, 2099.0, 1068.0, 577.0, 371.0, 262.0, 165.0, 112.0, 81.0, 55.0, 34.0, 28.0, 20.0, 13.0, 14.0, 10.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10455322265625, -0.10056400299072266, -0.09657478332519531, -0.09258556365966797, -0.08859634399414062, -0.08460712432861328, -0.08061790466308594, -0.0766286849975586, -0.07263946533203125, -0.0686502456665039, -0.06466102600097656, -0.06067180633544922, -0.056682586669921875, -0.05269336700439453, -0.04870414733886719, -0.044714927673339844, -0.0407257080078125, -0.036736488342285156, -0.03274726867675781, -0.02875804901123047, -0.024768829345703125, -0.02077960968017578, -0.016790390014648438, -0.012801170349121094, -0.00881195068359375, -0.004822731018066406, -0.0008335113525390625, 0.0031557083129882812, 0.007144927978515625, 0.011134147644042969, 0.015123367309570312, 0.019112586975097656, 0.023101806640625, 0.027091026306152344, 0.031080245971679688, 0.03506946563720703, 0.039058685302734375, 0.04304790496826172, 0.04703712463378906, 0.051026344299316406, 0.05501556396484375, 0.059004783630371094, 0.06299400329589844, 0.06698322296142578, 0.07097244262695312, 0.07496166229248047, 0.07895088195800781, 0.08294010162353516, 0.0869293212890625, 0.09091854095458984, 0.09490776062011719, 0.09889698028564453, 0.10288619995117188, 0.10687541961669922, 0.11086463928222656, 0.1148538589477539, 0.11884307861328125, 0.1228322982788086, 0.12682151794433594, 0.13081073760986328, 0.13479995727539062, 0.13878917694091797, 0.1427783966064453, 0.14676761627197266, 0.1507568359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 8.0, 7.0, 9.0, 10.0, 11.0, 20.0, 11.0, 22.0, 17.0, 24.0, 35.0, 33.0, 36.0, 36.0, 38.0, 44.0, 49.0, 44.0, 42.0, 43.0, 42.0, 48.0, 34.0, 32.0, 32.0, 38.0, 35.0, 26.0, 21.0, 23.0, 19.0, 17.0, 15.0, 19.0, 8.0, 8.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.10797119140625, -0.10443878173828125, -0.1009063720703125, -0.09737396240234375, -0.093841552734375, -0.09030914306640625, -0.0867767333984375, -0.08324432373046875, -0.0797119140625, -0.07617950439453125, -0.0726470947265625, -0.06911468505859375, -0.065582275390625, -0.06204986572265625, -0.0585174560546875, -0.05498504638671875, -0.05145263671875, -0.04792022705078125, -0.0443878173828125, -0.04085540771484375, -0.037322998046875, -0.03379058837890625, -0.0302581787109375, -0.02672576904296875, -0.023193359375, -0.01966094970703125, -0.0161285400390625, -0.01259613037109375, -0.009063720703125, -0.00553131103515625, -0.0019989013671875, 0.00153350830078125, 0.00506591796875, 0.00859832763671875, 0.0121307373046875, 0.01566314697265625, 0.019195556640625, 0.02272796630859375, 0.0262603759765625, 0.02979278564453125, 0.0333251953125, 0.03685760498046875, 0.0403900146484375, 0.04392242431640625, 0.047454833984375, 0.05098724365234375, 0.0545196533203125, 0.05805206298828125, 0.06158447265625, 0.06511688232421875, 0.0686492919921875, 0.07218170166015625, 0.075714111328125, 0.07924652099609375, 0.0827789306640625, 0.08631134033203125, 0.08984375, 0.09337615966796875, 0.0969085693359375, 0.10044097900390625, 0.103973388671875, 0.10750579833984375, 0.1110382080078125, 0.11457061767578125, 0.11810302734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 15.0, 18.0, 23.0, 22.0, 55.0, 54.0, 103.0, 104.0, 145.0, 229.0, 348.0, 545.0, 826.0, 1467.0, 2390.0, 4312.0, 8384.0, 18202.0, 48589.0, 339138.0, 532032.0, 52448.0, 19352.0, 8834.0, 4413.0, 2374.0, 1423.0, 883.0, 572.0, 373.0, 248.0, 170.0, 122.0, 91.0, 59.0, 43.0, 36.0, 20.0, 16.0, 16.0, 17.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.05572509765625, -0.05392932891845703, -0.05213356018066406, -0.050337791442871094, -0.048542022705078125, -0.046746253967285156, -0.04495048522949219, -0.04315471649169922, -0.04135894775390625, -0.03956317901611328, -0.03776741027832031, -0.035971641540527344, -0.034175872802734375, -0.032380104064941406, -0.030584335327148438, -0.02878856658935547, -0.0269927978515625, -0.02519702911376953, -0.023401260375976562, -0.021605491638183594, -0.019809722900390625, -0.018013954162597656, -0.016218185424804688, -0.014422416687011719, -0.01262664794921875, -0.010830879211425781, -0.009035110473632812, -0.007239341735839844, -0.005443572998046875, -0.0036478042602539062, -0.0018520355224609375, -5.626678466796875e-05, 0.001739501953125, 0.0035352706909179688, 0.0053310394287109375, 0.007126808166503906, 0.008922576904296875, 0.010718345642089844, 0.012514114379882812, 0.014309883117675781, 0.01610565185546875, 0.01790142059326172, 0.019697189331054688, 0.021492958068847656, 0.023288726806640625, 0.025084495544433594, 0.026880264282226562, 0.02867603302001953, 0.0304718017578125, 0.03226757049560547, 0.03406333923339844, 0.035859107971191406, 0.037654876708984375, 0.039450645446777344, 0.04124641418457031, 0.04304218292236328, 0.04483795166015625, 0.04663372039794922, 0.04842948913574219, 0.050225257873535156, 0.052021026611328125, 0.053816795349121094, 0.05561256408691406, 0.05740833282470703, 0.0592041015625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 11.0, 9.0, 7.0, 24.0, 24.0, 60.0, 181.0, 288.0, 214.0, 69.0, 37.0, 15.0, 15.0, 11.0, 8.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-05, -4.4920481741428375e-05, -4.334934055805206e-05, -4.177819937467575e-05, -4.020705819129944e-05, -3.8635917007923126e-05, -3.7064775824546814e-05, -3.54936346411705e-05, -3.392249345779419e-05, -3.235135227441788e-05, -3.0780211091041565e-05, -2.9209069907665253e-05, -2.763792872428894e-05, -2.6066787540912628e-05, -2.4495646357536316e-05, -2.2924505174160004e-05, -2.135336399078369e-05, -1.978222280740738e-05, -1.8211081624031067e-05, -1.6639940440654755e-05, -1.5068799257278442e-05, -1.349765807390213e-05, -1.1926516890525818e-05, -1.0355375707149506e-05, -8.784234523773193e-06, -7.213093340396881e-06, -5.641952157020569e-06, -4.070810973644257e-06, -2.4996697902679443e-06, -9.285286068916321e-07, 6.426125764846802e-07, 2.2137537598609924e-06, 3.7848949432373047e-06, 5.356036126613617e-06, 6.927177309989929e-06, 8.498318493366241e-06, 1.0069459676742554e-05, 1.1640600860118866e-05, 1.3211742043495178e-05, 1.478288322687149e-05, 1.6354024410247803e-05, 1.7925165593624115e-05, 1.9496306777000427e-05, 2.106744796037674e-05, 2.2638589143753052e-05, 2.4209730327129364e-05, 2.5780871510505676e-05, 2.735201269388199e-05, 2.89231538772583e-05, 3.0494295060634613e-05, 3.2065436244010925e-05, 3.363657742738724e-05, 3.520771861076355e-05, 3.677885979413986e-05, 3.8350000977516174e-05, 3.9921142160892487e-05, 4.14922833442688e-05, 4.306342452764511e-05, 4.463456571102142e-05, 4.6205706894397736e-05, 4.777684807777405e-05, 4.934798926115036e-05, 5.091913044452667e-05, 5.2490271627902985e-05, 5.40614128112793e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 11.0, 8.0, 16.0, 13.0, 23.0, 29.0, 58.0, 99.0, 113.0, 258.0, 393.0, 796.0, 1746.0, 4354.0, 12768.0, 53491.0, 787947.0, 152092.0, 22453.0, 6826.0, 2582.0, 1112.0, 575.0, 320.0, 169.0, 96.0, 68.0, 37.0, 31.0, 16.0, 19.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09372520446777344, -0.09077072143554688, -0.08781623840332031, -0.08486175537109375, -0.08190727233886719, -0.07895278930664062, -0.07599830627441406, -0.0730438232421875, -0.07008934020996094, -0.06713485717773438, -0.06418037414550781, -0.06122589111328125, -0.05827140808105469, -0.055316925048828125, -0.05236244201660156, -0.049407958984375, -0.04645347595214844, -0.043498992919921875, -0.04054450988769531, -0.03759002685546875, -0.03463554382324219, -0.031681060791015625, -0.028726577758789062, -0.0257720947265625, -0.022817611694335938, -0.019863128662109375, -0.016908645629882812, -0.01395416259765625, -0.010999679565429688, -0.008045196533203125, -0.0050907135009765625, -0.00213623046875, 0.0008182525634765625, 0.003772735595703125, 0.0067272186279296875, 0.00968170166015625, 0.012636184692382812, 0.015590667724609375, 0.018545150756835938, 0.0214996337890625, 0.024454116821289062, 0.027408599853515625, 0.030363082885742188, 0.03331756591796875, 0.03627204895019531, 0.039226531982421875, 0.04218101501464844, 0.045135498046875, 0.04808998107910156, 0.051044464111328125, 0.05399894714355469, 0.05695343017578125, 0.05990791320800781, 0.06286239624023438, 0.06581687927246094, 0.0687713623046875, 0.07172584533691406, 0.07468032836914062, 0.07763481140136719, 0.08058929443359375, 0.08354377746582031, 0.08649826049804688, 0.08945274353027344, 0.0924072265625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 5.0, 1.0, 6.0, 1.0, 7.0, 9.0, 3.0, 11.0, 6.0, 20.0, 17.0, 14.0, 37.0, 61.0, 66.0, 94.0, 103.0, 117.0, 118.0, 84.0, 56.0, 43.0, 27.0, 25.0, 15.0, 7.0, 10.0, 8.0, 7.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05517578125, -0.053218841552734375, -0.05126190185546875, -0.049304962158203125, -0.0473480224609375, -0.045391082763671875, -0.04343414306640625, -0.041477203369140625, -0.039520263671875, -0.037563323974609375, -0.03560638427734375, -0.033649444580078125, -0.0316925048828125, -0.029735565185546875, -0.02777862548828125, -0.025821685791015625, -0.02386474609375, -0.021907806396484375, -0.01995086669921875, -0.017993927001953125, -0.0160369873046875, -0.014080047607421875, -0.01212310791015625, -0.010166168212890625, -0.008209228515625, -0.006252288818359375, -0.00429534912109375, -0.002338409423828125, -0.0003814697265625, 0.001575469970703125, 0.00353240966796875, 0.005489349365234375, 0.0074462890625, 0.009403228759765625, 0.01136016845703125, 0.013317108154296875, 0.0152740478515625, 0.017230987548828125, 0.01918792724609375, 0.021144866943359375, 0.023101806640625, 0.025058746337890625, 0.02701568603515625, 0.028972625732421875, 0.0309295654296875, 0.032886505126953125, 0.03484344482421875, 0.036800384521484375, 0.03875732421875, 0.040714263916015625, 0.04267120361328125, 0.044628143310546875, 0.0465850830078125, 0.048542022705078125, 0.05049896240234375, 0.052455902099609375, 0.054412841796875, 0.056369781494140625, 0.05832672119140625, 0.060283660888671875, 0.0622406005859375, 0.06419754028320312, 0.06615447998046875, 0.06811141967773438, 0.070068359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 4.0, 23.0, 33.0, 77.0, 128.0, 285.0, 193.0, 107.0, 56.0, 29.0, 25.0, 14.0, 10.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8750150799751282, -0.8281829953193665, -0.78135085105896, -0.7345187664031982, -0.6876866221427917, -0.64085453748703, -0.5940223932266235, -0.5471903085708618, -0.5003582239151001, -0.453526109457016, -0.4066939949989319, -0.35986191034317017, -0.31302976608276367, -0.26619768142700195, -0.21936556696891785, -0.17253345251083374, -0.12570130825042725, -0.07886919379234314, -0.03203708678483963, 0.01479502022266388, 0.061627134680747986, 0.10845924913883209, 0.155291348695755, 0.2021234631538391, 0.24895557761192322, 0.2957876920700073, 0.34261980652809143, 0.38945192098617554, 0.43628400564193726, 0.48311614990234375, 0.5299482345581055, 0.5767803192138672, 0.6236125230789185, 0.6704446077346802, 0.7172767519950867, 0.7641088366508484, 0.8109409809112549, 0.8577730655670166, 0.9046051502227783, 0.9514372944831848, 0.9982694387435913, 1.045101523399353, 1.0919336080551147, 1.138765811920166, 1.1855978965759277, 1.2324299812316895, 1.2792620658874512, 1.326094150543213, 1.3729262351989746, 1.4197583198547363, 1.466590404510498, 1.5134226083755493, 1.560254693031311, 1.6070867776870728, 1.6539188623428345, 1.7007510662078857, 1.7475831508636475, 1.7944152355194092, 1.841247320175171, 1.8880795240402222, 1.9349116086959839, 1.9817436933517456, 2.028575897216797, 2.0754079818725586, 2.1222400665283203]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 8.0, 2.0, 9.0, 10.0, 13.0, 18.0, 23.0, 28.0, 22.0, 33.0, 28.0, 38.0, 27.0, 50.0, 33.0, 62.0, 81.0, 67.0, 70.0, 51.0, 34.0, 39.0, 42.0, 28.0, 26.0, 22.0, 18.0, 19.0, 12.0, 9.0, 14.0, 11.0, 8.0, 7.0, 7.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5673937797546387, -0.5503169298171997, -0.5332400798797607, -0.5161632895469666, -0.4990864396095276, -0.4820095896720886, -0.46493273973464966, -0.4478558897972107, -0.4307790696620941, -0.41370221972465515, -0.3966253995895386, -0.3795485496520996, -0.36247169971466064, -0.34539487957954407, -0.3283180296421051, -0.3112412095069885, -0.29416435956954956, -0.2770875096321106, -0.260010689496994, -0.24293383955955505, -0.22585700452327728, -0.2087801694869995, -0.19170331954956055, -0.17462648451328278, -0.157549649477005, -0.14047281444072723, -0.12339597195386887, -0.1063191294670105, -0.08924229443073273, -0.07216545939445496, -0.05508861690759659, -0.03801177442073822, -0.020934998989105225, -0.003858160227537155, 0.013218678534030914, 0.030295517295598984, 0.04737235605716705, 0.06444919109344482, 0.08152603358030319, 0.09860287606716156, 0.11567971110343933, 0.1327565461397171, 0.14983338117599487, 0.16691023111343384, 0.1839870661497116, 0.20106390118598938, 0.21814075112342834, 0.23521758615970612, 0.2522944211959839, 0.26937127113342285, 0.28644809126853943, 0.3035249412059784, 0.32060176134109497, 0.33767861127853394, 0.3547554612159729, 0.37183231115341187, 0.38890913128852844, 0.4059859812259674, 0.423062801361084, 0.44013965129852295, 0.4572165012359619, 0.4742933213710785, 0.49137017130851746, 0.508446991443634, 0.525523841381073]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 6.0, 7.0, 6.0, 15.0, 15.0, 17.0, 16.0, 26.0, 40.0, 48.0, 81.0, 164.0, 255.0, 484.0, 1002.0, 2249.0, 5502.0, 17820.0, 109298.0, 2231203.0, 1721710.0, 79575.0, 15655.0, 5004.0, 2033.0, 912.0, 480.0, 244.0, 134.0, 92.0, 60.0, 40.0, 22.0, 14.0, 15.0, 6.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.0648193359375, -0.0625, -0.0601806640625, -0.057861328125, -0.0555419921875, -0.05322265625, -0.0509033203125, -0.048583984375, -0.0462646484375, -0.0439453125, -0.0416259765625, -0.039306640625, -0.0369873046875, -0.03466796875, -0.0323486328125, -0.030029296875, -0.0277099609375, -0.025390625, -0.0230712890625, -0.020751953125, -0.0184326171875, -0.01611328125, -0.0137939453125, -0.011474609375, -0.0091552734375, -0.0068359375, -0.0045166015625, -0.002197265625, 0.0001220703125, 0.00244140625, 0.0047607421875, 0.007080078125, 0.0093994140625, 0.01171875, 0.0140380859375, 0.016357421875, 0.0186767578125, 0.02099609375, 0.0233154296875, 0.025634765625, 0.0279541015625, 0.0302734375, 0.0325927734375, 0.034912109375, 0.0372314453125, 0.03955078125, 0.0418701171875, 0.044189453125, 0.0465087890625, 0.048828125, 0.0511474609375, 0.053466796875, 0.0557861328125, 0.05810546875, 0.0604248046875, 0.062744140625, 0.0650634765625, 0.0673828125, 0.0697021484375, 0.072021484375, 0.0743408203125, 0.07666015625, 0.0789794921875, 0.081298828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 3.0, 13.0, 4.0, 11.0, 12.0, 15.0, 26.0, 25.0, 25.0, 36.0, 33.0, 45.0, 46.0, 55.0, 54.0, 65.0, 59.0, 56.0, 54.0, 47.0, 42.0, 47.0, 42.0, 34.0, 23.0, 25.0, 25.0, 16.0, 9.0, 11.0, 8.0, 6.0, 9.0, 4.0, 3.0, 6.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.033050537109375, -0.031972408294677734, -0.03089427947998047, -0.029816150665283203, -0.028738021850585938, -0.027659893035888672, -0.026581764221191406, -0.02550363540649414, -0.024425506591796875, -0.02334737777709961, -0.022269248962402344, -0.021191120147705078, -0.020112991333007812, -0.019034862518310547, -0.01795673370361328, -0.016878604888916016, -0.01580047607421875, -0.014722347259521484, -0.013644218444824219, -0.012566089630126953, -0.011487960815429688, -0.010409832000732422, -0.009331703186035156, -0.00825357437133789, -0.007175445556640625, -0.006097316741943359, -0.005019187927246094, -0.003941059112548828, -0.0028629302978515625, -0.0017848014831542969, -0.0007066726684570312, 0.0003714561462402344, 0.0014495849609375, 0.0025277137756347656, 0.0036058425903320312, 0.004683971405029297, 0.0057621002197265625, 0.006840229034423828, 0.007918357849121094, 0.00899648666381836, 0.010074615478515625, 0.01115274429321289, 0.012230873107910156, 0.013309001922607422, 0.014387130737304688, 0.015465259552001953, 0.01654338836669922, 0.017621517181396484, 0.01869964599609375, 0.019777774810791016, 0.02085590362548828, 0.021934032440185547, 0.023012161254882812, 0.024090290069580078, 0.025168418884277344, 0.02624654769897461, 0.027324676513671875, 0.02840280532836914, 0.029480934143066406, 0.030559062957763672, 0.03163719177246094, 0.0327153205871582, 0.03379344940185547, 0.034871578216552734, 0.03594970703125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 10.0, 13.0, 19.0, 25.0, 33.0, 31.0, 58.0, 77.0, 123.0, 148.0, 244.0, 359.0, 587.0, 1366.0, 11165.0, 3913069.0, 259888.0, 4562.0, 1027.0, 475.0, 282.0, 189.0, 145.0, 104.0, 77.0, 53.0, 34.0, 29.0, 21.0, 17.0, 11.0, 6.0, 11.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.338134765625, -0.3281402587890625, -0.318145751953125, -0.3081512451171875, -0.29815673828125, -0.2881622314453125, -0.278167724609375, -0.2681732177734375, -0.2581787109375, -0.2481842041015625, -0.238189697265625, -0.2281951904296875, -0.21820068359375, -0.2082061767578125, -0.198211669921875, -0.1882171630859375, -0.17822265625, -0.1682281494140625, -0.158233642578125, -0.1482391357421875, -0.13824462890625, -0.1282501220703125, -0.118255615234375, -0.1082611083984375, -0.0982666015625, -0.0882720947265625, -0.078277587890625, -0.0682830810546875, -0.05828857421875, -0.0482940673828125, -0.038299560546875, -0.0283050537109375, -0.018310546875, -0.0083160400390625, 0.001678466796875, 0.0116729736328125, 0.02166748046875, 0.0316619873046875, 0.041656494140625, 0.0516510009765625, 0.0616455078125, 0.0716400146484375, 0.081634521484375, 0.0916290283203125, 0.10162353515625, 0.1116180419921875, 0.121612548828125, 0.1316070556640625, 0.1416015625, 0.1515960693359375, 0.161590576171875, 0.1715850830078125, 0.18157958984375, 0.1915740966796875, 0.201568603515625, 0.2115631103515625, 0.2215576171875, 0.2315521240234375, 0.241546630859375, 0.2515411376953125, 0.26153564453125, 0.2715301513671875, 0.281524658203125, 0.2915191650390625, 0.301513671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 11.0, 17.0, 44.0, 134.0, 627.0, 2361.0, 650.0, 145.0, 44.0, 20.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.27637481689453125, -0.2675933837890625, -0.25881195068359375, -0.250030517578125, -0.24124908447265625, -0.2324676513671875, -0.22368621826171875, -0.21490478515625, -0.20612335205078125, -0.1973419189453125, -0.18856048583984375, -0.179779052734375, -0.17099761962890625, -0.1622161865234375, -0.15343475341796875, -0.1446533203125, -0.13587188720703125, -0.1270904541015625, -0.11830902099609375, -0.109527587890625, -0.10074615478515625, -0.0919647216796875, -0.08318328857421875, -0.07440185546875, -0.06562042236328125, -0.0568389892578125, -0.04805755615234375, -0.039276123046875, -0.03049468994140625, -0.0217132568359375, -0.01293182373046875, -0.004150390625, 0.00463104248046875, 0.0134124755859375, 0.02219390869140625, 0.030975341796875, 0.03975677490234375, 0.0485382080078125, 0.05731964111328125, 0.06610107421875, 0.07488250732421875, 0.0836639404296875, 0.09244537353515625, 0.101226806640625, 0.11000823974609375, 0.1187896728515625, 0.12757110595703125, 0.1363525390625, 0.14513397216796875, 0.1539154052734375, 0.16269683837890625, 0.171478271484375, 0.18025970458984375, 0.1890411376953125, 0.19782257080078125, 0.20660400390625, 0.21538543701171875, 0.2241668701171875, 0.23294830322265625, 0.241729736328125, 0.25051116943359375, 0.2592926025390625, 0.26807403564453125, 0.27685546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 14.0, 17.0, 37.0, 66.0, 176.0, 292.0, 219.0, 108.0, 35.0, 14.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4648717641830444, -1.4002680778503418, -1.3356645107269287, -1.271060824394226, -1.2064571380615234, -1.1418535709381104, -1.0772498846054077, -1.012646198272705, -0.9480425715446472, -0.8834389448165894, -0.8188352584838867, -0.7542316317558289, -0.689628005027771, -0.6250243186950684, -0.5604206919670105, -0.49581703543663025, -0.43121337890625, -0.36660972237586975, -0.3020060658454895, -0.23740243911743164, -0.1727987825870514, -0.10819512605667114, -0.04359149932861328, 0.021012157201766968, 0.08561581373214722, 0.15021947026252747, 0.21482311189174652, 0.2794267535209656, 0.3440304100513458, 0.4086340665817261, 0.47323769330978394, 0.5378413200378418, 0.6024448871612549, 0.6670485138893127, 0.7316522002220154, 0.7962558269500732, 0.8608595132827759, 0.9254631400108337, 0.9900667667388916, 1.0546704530715942, 1.1192741394042969, 1.1838778257369995, 1.2484813928604126, 1.3130850791931152, 1.3776887655258179, 1.4422924518585205, 1.5068960189819336, 1.5714997053146362, 1.6361032724380493, 1.700706958770752, 1.765310525894165, 1.8299142122268677, 1.8945178985595703, 1.9591214656829834, 2.0237250328063965, 2.0883288383483887, 2.1529324054718018, 2.217535972595215, 2.282139778137207, 2.34674334526062, 2.411346912384033, 2.4759507179260254, 2.5405542850494385, 2.6051578521728516, 2.6697616577148438]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 6.0, 10.0, 17.0, 21.0, 34.0, 40.0, 49.0, 60.0, 76.0, 80.0, 69.0, 96.0, 82.0, 80.0, 75.0, 54.0, 42.0, 27.0, 26.0, 12.0, 10.0, 12.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8500900864601135, -0.8251577615737915, -0.8002253770828247, -0.7752930521965027, -0.7503606677055359, -0.7254283428192139, -0.7004959583282471, -0.675563633441925, -0.6506312489509583, -0.6256989240646362, -0.6007665395736694, -0.5758342146873474, -0.5509018301963806, -0.5259695053100586, -0.5010371208190918, -0.4761047959327698, -0.45117244124412537, -0.42624008655548096, -0.40130773186683655, -0.37637537717819214, -0.35144302248954773, -0.3265106678009033, -0.3015783429145813, -0.2766459584236145, -0.2517136335372925, -0.22678127884864807, -0.20184892416000366, -0.17691656947135925, -0.15198421478271484, -0.12705186009407043, -0.10211952030658722, -0.07718716561794281, -0.05225479602813721, -0.027322443202137947, -0.002390090376138687, 0.022542260587215424, 0.04747461527585983, 0.07240696996450424, 0.09733931720256805, 0.12227167189121246, 0.14720402657985687, 0.17213638126850128, 0.1970687359571457, 0.2220010757446289, 0.24693343043327332, 0.2718657851219177, 0.29679813981056213, 0.32173049449920654, 0.34666284918785095, 0.37159520387649536, 0.39652755856513977, 0.4214599132537842, 0.4463922679424286, 0.471324622631073, 0.496256947517395, 0.5211893320083618, 0.5461216568946838, 0.5710539817810059, 0.5959863662719727, 0.6209186911582947, 0.6458510756492615, 0.6707834005355835, 0.6957157850265503, 0.7206481099128723, 0.7455804944038391]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 7.0, 16.0, 15.0, 28.0, 46.0, 75.0, 88.0, 143.0, 189.0, 347.0, 532.0, 860.0, 1541.0, 2854.0, 5442.0, 11054.0, 22711.0, 50966.0, 117432.0, 247681.0, 292971.0, 161351.0, 70724.0, 31270.0, 14585.0, 7134.0, 3680.0, 2028.0, 1145.0, 617.0, 361.0, 245.0, 146.0, 79.0, 70.0, 38.0, 26.0, 18.0, 9.0, 8.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0574951171875, -0.05581378936767578, -0.05413246154785156, -0.052451133728027344, -0.050769805908203125, -0.049088478088378906, -0.04740715026855469, -0.04572582244873047, -0.04404449462890625, -0.04236316680908203, -0.04068183898925781, -0.039000511169433594, -0.037319183349609375, -0.035637855529785156, -0.03395652770996094, -0.03227519989013672, -0.0305938720703125, -0.02891254425048828, -0.027231216430664062, -0.025549888610839844, -0.023868560791015625, -0.022187232971191406, -0.020505905151367188, -0.01882457733154297, -0.01714324951171875, -0.015461921691894531, -0.013780593872070312, -0.012099266052246094, -0.010417938232421875, -0.008736610412597656, -0.0070552825927734375, -0.005373954772949219, -0.003692626953125, -0.0020112991333007812, -0.0003299713134765625, 0.0013513565063476562, 0.003032684326171875, 0.004714012145996094, 0.0063953399658203125, 0.008076667785644531, 0.00975799560546875, 0.011439323425292969, 0.013120651245117188, 0.014801979064941406, 0.016483306884765625, 0.018164634704589844, 0.019845962524414062, 0.02152729034423828, 0.0232086181640625, 0.02488994598388672, 0.026571273803710938, 0.028252601623535156, 0.029933929443359375, 0.031615257263183594, 0.03329658508300781, 0.03497791290283203, 0.03665924072265625, 0.03834056854248047, 0.04002189636230469, 0.041703224182128906, 0.043384552001953125, 0.045065879821777344, 0.04674720764160156, 0.04842853546142578, 0.05010986328125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 7.0, 13.0, 6.0, 10.0, 14.0, 17.0, 20.0, 22.0, 35.0, 40.0, 27.0, 47.0, 39.0, 45.0, 53.0, 62.0, 40.0, 49.0, 49.0, 51.0, 40.0, 52.0, 34.0, 43.0, 25.0, 23.0, 21.0, 13.0, 24.0, 14.0, 12.0, 11.0, 8.0, 6.0, 2.0, 8.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.03253173828125, -0.03145265579223633, -0.030373573303222656, -0.029294490814208984, -0.028215408325195312, -0.02713632583618164, -0.02605724334716797, -0.024978160858154297, -0.023899078369140625, -0.022819995880126953, -0.02174091339111328, -0.02066183090209961, -0.019582748413085938, -0.018503665924072266, -0.017424583435058594, -0.016345500946044922, -0.01526641845703125, -0.014187335968017578, -0.013108253479003906, -0.012029170989990234, -0.010950088500976562, -0.00987100601196289, -0.008791923522949219, -0.007712841033935547, -0.006633758544921875, -0.005554676055908203, -0.004475593566894531, -0.0033965110778808594, -0.0023174285888671875, -0.0012383460998535156, -0.00015926361083984375, 0.0009198188781738281, 0.0019989013671875, 0.003077983856201172, 0.004157066345214844, 0.005236148834228516, 0.0063152313232421875, 0.007394313812255859, 0.008473396301269531, 0.009552478790283203, 0.010631561279296875, 0.011710643768310547, 0.012789726257324219, 0.01386880874633789, 0.014947891235351562, 0.016026973724365234, 0.017106056213378906, 0.018185138702392578, 0.01926422119140625, 0.020343303680419922, 0.021422386169433594, 0.022501468658447266, 0.023580551147460938, 0.02465963363647461, 0.02573871612548828, 0.026817798614501953, 0.027896881103515625, 0.028975963592529297, 0.03005504608154297, 0.03113412857055664, 0.03221321105957031, 0.033292293548583984, 0.034371376037597656, 0.03545045852661133, 0.036529541015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 4.0, 7.0, 21.0, 9.0, 18.0, 41.0, 43.0, 64.0, 111.0, 160.0, 320.0, 558.0, 1262.0, 3061.0, 9061.0, 41309.0, 265839.0, 619171.0, 83702.0, 15864.0, 4434.0, 1730.0, 769.0, 386.0, 215.0, 108.0, 87.0, 47.0, 39.0, 28.0, 22.0, 11.0, 7.0, 5.0, 8.0, 5.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13720703125, -0.13280868530273438, -0.12841033935546875, -0.12401199340820312, -0.1196136474609375, -0.11521530151367188, -0.11081695556640625, -0.10641860961914062, -0.102020263671875, -0.09762191772460938, -0.09322357177734375, -0.08882522583007812, -0.0844268798828125, -0.08002853393554688, -0.07563018798828125, -0.07123184204101562, -0.06683349609375, -0.062435150146484375, -0.05803680419921875, -0.053638458251953125, -0.0492401123046875, -0.044841766357421875, -0.04044342041015625, -0.036045074462890625, -0.031646728515625, -0.027248382568359375, -0.02285003662109375, -0.018451690673828125, -0.0140533447265625, -0.009654998779296875, -0.00525665283203125, -0.000858306884765625, 0.0035400390625, 0.007938385009765625, 0.01233673095703125, 0.016735076904296875, 0.0211334228515625, 0.025531768798828125, 0.02993011474609375, 0.034328460693359375, 0.038726806640625, 0.043125152587890625, 0.04752349853515625, 0.051921844482421875, 0.0563201904296875, 0.060718536376953125, 0.06511688232421875, 0.06951522827148438, 0.07391357421875, 0.07831192016601562, 0.08271026611328125, 0.08710861206054688, 0.0915069580078125, 0.09590530395507812, 0.10030364990234375, 0.10470199584960938, 0.109100341796875, 0.11349868774414062, 0.11789703369140625, 0.12229537963867188, 0.1266937255859375, 0.13109207153320312, 0.13549041748046875, 0.13988876342773438, 0.144287109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 4.0, 15.0, 16.0, 25.0, 20.0, 31.0, 26.0, 35.0, 52.0, 39.0, 46.0, 44.0, 52.0, 50.0, 51.0, 49.0, 52.0, 59.0, 52.0, 39.0, 35.0, 47.0, 33.0, 22.0, 18.0, 16.0, 12.0, 9.0, 5.0, 4.0, 8.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1224365234375, -0.11798095703125, -0.113525390625, -0.10906982421875, -0.1046142578125, -0.10015869140625, -0.095703125, -0.09124755859375, -0.0867919921875, -0.08233642578125, -0.077880859375, -0.07342529296875, -0.0689697265625, -0.06451416015625, -0.06005859375, -0.05560302734375, -0.0511474609375, -0.04669189453125, -0.042236328125, -0.03778076171875, -0.0333251953125, -0.02886962890625, -0.0244140625, -0.01995849609375, -0.0155029296875, -0.01104736328125, -0.006591796875, -0.00213623046875, 0.0023193359375, 0.00677490234375, 0.01123046875, 0.01568603515625, 0.0201416015625, 0.02459716796875, 0.029052734375, 0.03350830078125, 0.0379638671875, 0.04241943359375, 0.046875, 0.05133056640625, 0.0557861328125, 0.06024169921875, 0.064697265625, 0.06915283203125, 0.0736083984375, 0.07806396484375, 0.08251953125, 0.08697509765625, 0.0914306640625, 0.09588623046875, 0.100341796875, 0.10479736328125, 0.1092529296875, 0.11370849609375, 0.1181640625, 0.12261962890625, 0.1270751953125, 0.13153076171875, 0.135986328125, 0.14044189453125, 0.1448974609375, 0.14935302734375, 0.15380859375, 0.15826416015625, 0.1627197265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 16.0, 18.0, 24.0, 49.0, 87.0, 131.0, 213.0, 336.0, 634.0, 1270.0, 2523.0, 5522.0, 13512.0, 38083.0, 145168.0, 645673.0, 135435.0, 36430.0, 12924.0, 5381.0, 2413.0, 1173.0, 668.0, 353.0, 184.0, 110.0, 73.0, 53.0, 25.0, 20.0, 11.0, 8.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057891845703125, -0.05585908889770508, -0.053826332092285156, -0.051793575286865234, -0.04976081848144531, -0.04772806167602539, -0.04569530487060547, -0.04366254806518555, -0.041629791259765625, -0.0395970344543457, -0.03756427764892578, -0.03553152084350586, -0.03349876403808594, -0.031466007232666016, -0.029433250427246094, -0.027400493621826172, -0.02536773681640625, -0.023334980010986328, -0.021302223205566406, -0.019269466400146484, -0.017236709594726562, -0.01520395278930664, -0.013171195983886719, -0.011138439178466797, -0.009105682373046875, -0.007072925567626953, -0.005040168762207031, -0.0030074119567871094, -0.0009746551513671875, 0.0010581016540527344, 0.0030908584594726562, 0.005123615264892578, 0.0071563720703125, 0.009189128875732422, 0.011221885681152344, 0.013254642486572266, 0.015287399291992188, 0.01732015609741211, 0.01935291290283203, 0.021385669708251953, 0.023418426513671875, 0.025451183319091797, 0.02748394012451172, 0.02951669692993164, 0.03154945373535156, 0.033582210540771484, 0.035614967346191406, 0.03764772415161133, 0.03968048095703125, 0.04171323776245117, 0.043745994567871094, 0.045778751373291016, 0.04781150817871094, 0.04984426498413086, 0.05187702178955078, 0.0539097785949707, 0.055942535400390625, 0.05797529220581055, 0.06000804901123047, 0.06204080581665039, 0.06407356262207031, 0.06610631942749023, 0.06813907623291016, 0.07017183303833008, 0.07220458984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 3.0, 8.0, 15.0, 11.0, 21.0, 24.0, 27.0, 50.0, 62.0, 101.0, 151.0, 172.0, 98.0, 74.0, 52.0, 38.0, 12.0, 13.0, 12.0, 8.0, 4.0, 6.0, 5.0, 3.0, 3.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.057718276977539e-05, -2.9489398002624512e-05, -2.8401613235473633e-05, -2.7313828468322754e-05, -2.6226043701171875e-05, -2.5138258934020996e-05, -2.4050474166870117e-05, -2.2962689399719238e-05, -2.187490463256836e-05, -2.078711986541748e-05, -1.96993350982666e-05, -1.8611550331115723e-05, -1.7523765563964844e-05, -1.6435980796813965e-05, -1.5348196029663086e-05, -1.4260411262512207e-05, -1.3172626495361328e-05, -1.208484172821045e-05, -1.099705696105957e-05, -9.909272193908691e-06, -8.821487426757812e-06, -7.733702659606934e-06, -6.645917892456055e-06, -5.558133125305176e-06, -4.470348358154297e-06, -3.382563591003418e-06, -2.294778823852539e-06, -1.2069940567016602e-06, -1.1920928955078125e-07, 9.685754776000977e-07, 2.0563602447509766e-06, 3.1441450119018555e-06, 4.231929779052734e-06, 5.319714546203613e-06, 6.407499313354492e-06, 7.495284080505371e-06, 8.58306884765625e-06, 9.670853614807129e-06, 1.0758638381958008e-05, 1.1846423149108887e-05, 1.2934207916259766e-05, 1.4021992683410645e-05, 1.5109777450561523e-05, 1.6197562217712402e-05, 1.728534698486328e-05, 1.837313175201416e-05, 1.946091651916504e-05, 2.0548701286315918e-05, 2.1636486053466797e-05, 2.2724270820617676e-05, 2.3812055587768555e-05, 2.4899840354919434e-05, 2.5987625122070312e-05, 2.707540988922119e-05, 2.816319465637207e-05, 2.925097942352295e-05, 3.0338764190673828e-05, 3.142654895782471e-05, 3.2514333724975586e-05, 3.3602118492126465e-05, 3.4689903259277344e-05, 3.577768802642822e-05, 3.68654727935791e-05, 3.795325756072998e-05, 3.904104232788086e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 9.0, 3.0, 5.0, 7.0, 9.0, 16.0, 24.0, 31.0, 64.0, 97.0, 150.0, 219.0, 422.0, 769.0, 1584.0, 3769.0, 9935.0, 33426.0, 161287.0, 683410.0, 113013.0, 25972.0, 8146.0, 3206.0, 1395.0, 687.0, 337.0, 208.0, 134.0, 73.0, 56.0, 39.0, 18.0, 10.0, 14.0, 6.0, 5.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08221435546875, -0.07975292205810547, -0.07729148864746094, -0.0748300552368164, -0.07236862182617188, -0.06990718841552734, -0.06744575500488281, -0.06498432159423828, -0.06252288818359375, -0.06006145477294922, -0.05760002136230469, -0.055138587951660156, -0.052677154541015625, -0.050215721130371094, -0.04775428771972656, -0.04529285430908203, -0.0428314208984375, -0.04036998748779297, -0.03790855407714844, -0.035447120666503906, -0.032985687255859375, -0.030524253845214844, -0.028062820434570312, -0.02560138702392578, -0.02313995361328125, -0.02067852020263672, -0.018217086791992188, -0.015755653381347656, -0.013294219970703125, -0.010832786560058594, -0.008371353149414062, -0.005909919738769531, -0.003448486328125, -0.0009870529174804688, 0.0014743804931640625, 0.003935813903808594, 0.006397247314453125, 0.008858680725097656, 0.011320114135742188, 0.013781547546386719, 0.01624298095703125, 0.01870441436767578, 0.021165847778320312, 0.023627281188964844, 0.026088714599609375, 0.028550148010253906, 0.031011581420898438, 0.03347301483154297, 0.0359344482421875, 0.03839588165283203, 0.04085731506347656, 0.043318748474121094, 0.045780181884765625, 0.048241615295410156, 0.05070304870605469, 0.05316448211669922, 0.05562591552734375, 0.05808734893798828, 0.06054878234863281, 0.06301021575927734, 0.06547164916992188, 0.0679330825805664, 0.07039451599121094, 0.07285594940185547, 0.0753173828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 4.0, 5.0, 10.0, 13.0, 13.0, 17.0, 22.0, 29.0, 22.0, 37.0, 40.0, 71.0, 62.0, 101.0, 75.0, 76.0, 81.0, 66.0, 51.0, 33.0, 40.0, 30.0, 17.0, 15.0, 11.0, 15.0, 5.0, 7.0, 6.0, 7.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.059051513671875, -0.05743408203125, -0.055816650390625, -0.05419921875, -0.052581787109375, -0.05096435546875, -0.049346923828125, -0.0477294921875, -0.046112060546875, -0.04449462890625, -0.042877197265625, -0.041259765625, -0.039642333984375, -0.03802490234375, -0.036407470703125, -0.0347900390625, -0.033172607421875, -0.03155517578125, -0.029937744140625, -0.0283203125, -0.026702880859375, -0.02508544921875, -0.023468017578125, -0.0218505859375, -0.020233154296875, -0.01861572265625, -0.016998291015625, -0.015380859375, -0.013763427734375, -0.01214599609375, -0.010528564453125, -0.0089111328125, -0.007293701171875, -0.00567626953125, -0.004058837890625, -0.00244140625, -0.000823974609375, 0.00079345703125, 0.002410888671875, 0.0040283203125, 0.005645751953125, 0.00726318359375, 0.008880615234375, 0.010498046875, 0.012115478515625, 0.01373291015625, 0.015350341796875, 0.0169677734375, 0.018585205078125, 0.02020263671875, 0.021820068359375, 0.0234375, 0.025054931640625, 0.02667236328125, 0.028289794921875, 0.0299072265625, 0.031524658203125, 0.03314208984375, 0.034759521484375, 0.036376953125, 0.037994384765625, 0.03961181640625, 0.041229248046875, 0.0428466796875, 0.044464111328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 11.0, 23.0, 51.0, 84.0, 120.0, 261.0, 177.0, 107.0, 76.0, 38.0, 18.0, 11.0, 13.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4934729039669037, -0.4513281583786011, -0.40918341279029846, -0.36703866720199585, -0.32489389181137085, -0.2827491760253906, -0.24060440063476562, -0.198459655046463, -0.1563149094581604, -0.11417016386985779, -0.07202541083097458, -0.02988065779209137, 0.012264087796211243, 0.054408833384513855, 0.09655359387397766, 0.13869833946228027, 0.18084308505058289, 0.2229878306388855, 0.2651325762271881, 0.3072773218154907, 0.3494220972061157, 0.39156681299209595, 0.43371158838272095, 0.47585633397102356, 0.5180010795593262, 0.5601458549499512, 0.6022905707359314, 0.6444353461265564, 0.6865800619125366, 0.7287248373031616, 0.7708696126937866, 0.8130143284797668, 0.8551591634750366, 0.8973039388656616, 0.9394486546516418, 0.9815934300422668, 1.023738145828247, 1.065882921218872, 1.108027696609497, 1.150172472000122, 1.1923171281814575, 1.2344619035720825, 1.2766066789627075, 1.318751335144043, 1.360896110534668, 1.403040885925293, 1.445185661315918, 1.487330436706543, 1.529475212097168, 1.571619987487793, 1.613764762878418, 1.6559094190597534, 1.6980541944503784, 1.7401989698410034, 1.7823437452316284, 1.8244884014129639, 1.8666331768035889, 1.9087779521942139, 1.9509227275848389, 1.9930673837661743, 2.035212278366089, 2.0773568153381348, 2.1195015907287598, 2.1616463661193848, 2.2037911415100098]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 0.0, 4.0, 6.0, 11.0, 11.0, 15.0, 21.0, 14.0, 15.0, 26.0, 25.0, 28.0, 21.0, 32.0, 38.0, 53.0, 62.0, 87.0, 82.0, 71.0, 44.0, 39.0, 38.0, 28.0, 37.0, 30.0, 22.0, 25.0, 23.0, 15.0, 13.0, 11.0, 12.0, 11.0, 2.0, 4.0, 7.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.568529486656189, -0.5504900813102722, -0.5324506759643555, -0.5144112706184387, -0.49637189507484436, -0.4783324897289276, -0.46029311418533325, -0.4422537088394165, -0.42421430349349976, -0.406174898147583, -0.38813549280166626, -0.3700961172580719, -0.35205671191215515, -0.3340173065662384, -0.31597793102264404, -0.2979385256767273, -0.27989912033081055, -0.2618597149848938, -0.24382032454013824, -0.2257809340953827, -0.20774152874946594, -0.1897021234035492, -0.17166273295879364, -0.15362334251403809, -0.13558393716812134, -0.11754453927278519, -0.09950514137744904, -0.08146574348211288, -0.06342634558677673, -0.04538694769144058, -0.02734754979610443, -0.009308159351348877, 0.008731245994567871, 0.026770643889904022, 0.04481004178524017, 0.06284943968057632, 0.08088883757591248, 0.09892823547124863, 0.11696763336658478, 0.13500702381134033, 0.15304642915725708, 0.17108583450317383, 0.18912522494792938, 0.20716461539268494, 0.22520402073860168, 0.24324342608451843, 0.2612828016281128, 0.27932220697402954, 0.2973616123199463, 0.31540101766586304, 0.3334404230117798, 0.35147979855537415, 0.3695192039012909, 0.38755860924720764, 0.405597984790802, 0.42363739013671875, 0.4416767954826355, 0.45971620082855225, 0.477755606174469, 0.49579498171806335, 0.5138343572616577, 0.5318737626075745, 0.5499131679534912, 0.567952573299408, 0.5859919786453247]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 17.0, 22.0, 23.0, 38.0, 83.0, 142.0, 244.0, 443.0, 860.0, 1815.0, 4304.0, 11984.0, 53973.0, 729405.0, 3096913.0, 250051.0, 29660.0, 8270.0, 3150.0, 1411.0, 642.0, 352.0, 196.0, 97.0, 57.0, 34.0, 33.0, 15.0, 7.0, 13.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.11981201171875, -0.116912841796875, -0.114013671875, -0.111114501953125, -0.10821533203125, -0.105316162109375, -0.1024169921875, -0.099517822265625, -0.09661865234375, -0.093719482421875, -0.0908203125, -0.087921142578125, -0.08502197265625, -0.082122802734375, -0.0792236328125, -0.076324462890625, -0.07342529296875, -0.070526123046875, -0.067626953125, -0.064727783203125, -0.06182861328125, -0.058929443359375, -0.0560302734375, -0.053131103515625, -0.05023193359375, -0.047332763671875, -0.04443359375, -0.041534423828125, -0.03863525390625, -0.035736083984375, -0.0328369140625, -0.029937744140625, -0.02703857421875, -0.024139404296875, -0.021240234375, -0.018341064453125, -0.01544189453125, -0.012542724609375, -0.0096435546875, -0.006744384765625, -0.00384521484375, -0.000946044921875, 0.001953125, 0.004852294921875, 0.00775146484375, 0.010650634765625, 0.0135498046875, 0.016448974609375, 0.01934814453125, 0.022247314453125, 0.025146484375, 0.028045654296875, 0.03094482421875, 0.033843994140625, 0.0367431640625, 0.039642333984375, 0.04254150390625, 0.045440673828125, 0.04833984375, 0.051239013671875, 0.05413818359375, 0.057037353515625, 0.0599365234375, 0.062835693359375, 0.06573486328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 7.0, 10.0, 12.0, 12.0, 20.0, 16.0, 26.0, 39.0, 39.0, 36.0, 30.0, 47.0, 52.0, 58.0, 59.0, 45.0, 50.0, 49.0, 36.0, 58.0, 40.0, 45.0, 26.0, 35.0, 21.0, 24.0, 19.0, 18.0, 16.0, 10.0, 7.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.038330078125, -0.03711509704589844, -0.035900115966796875, -0.03468513488769531, -0.03347015380859375, -0.03225517272949219, -0.031040191650390625, -0.029825210571289062, -0.0286102294921875, -0.027395248413085938, -0.026180267333984375, -0.024965286254882812, -0.02375030517578125, -0.022535324096679688, -0.021320343017578125, -0.020105361938476562, -0.018890380859375, -0.017675399780273438, -0.016460418701171875, -0.015245437622070312, -0.01403045654296875, -0.012815475463867188, -0.011600494384765625, -0.010385513305664062, -0.0091705322265625, -0.007955551147460938, -0.006740570068359375, -0.0055255889892578125, -0.00431060791015625, -0.0030956268310546875, -0.001880645751953125, -0.0006656646728515625, 0.00054931640625, 0.0017642974853515625, 0.002979278564453125, 0.0041942596435546875, 0.00540924072265625, 0.0066242218017578125, 0.007839202880859375, 0.009054183959960938, 0.0102691650390625, 0.011484146118164062, 0.012699127197265625, 0.013914108276367188, 0.01512908935546875, 0.016344070434570312, 0.017559051513671875, 0.018774032592773438, 0.019989013671875, 0.021203994750976562, 0.022418975830078125, 0.023633956909179688, 0.02484893798828125, 0.026063919067382812, 0.027278900146484375, 0.028493881225585938, 0.0297088623046875, 0.030923843383789062, 0.032138824462890625, 0.03335380554199219, 0.03456878662109375, 0.03578376770019531, 0.036998748779296875, 0.03821372985839844, 0.0394287109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 9.0, 23.0, 38.0, 98.0, 217.0, 576.0, 2553.0, 63035.0, 4113957.0, 11652.0, 1434.0, 395.0, 156.0, 70.0, 29.0, 17.0, 7.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6262741088867188, -0.6080169677734375, -0.5897598266601562, -0.571502685546875, -0.5532455444335938, -0.5349884033203125, -0.5167312622070312, -0.49847412109375, -0.48021697998046875, -0.4619598388671875, -0.44370269775390625, -0.425445556640625, -0.40718841552734375, -0.3889312744140625, -0.37067413330078125, -0.3524169921875, -0.33415985107421875, -0.3159027099609375, -0.29764556884765625, -0.279388427734375, -0.26113128662109375, -0.2428741455078125, -0.22461700439453125, -0.20635986328125, -0.18810272216796875, -0.1698455810546875, -0.15158843994140625, -0.133331298828125, -0.11507415771484375, -0.0968170166015625, -0.07855987548828125, -0.060302734375, -0.04204559326171875, -0.0237884521484375, -0.00553131103515625, 0.012725830078125, 0.03098297119140625, 0.0492401123046875, 0.06749725341796875, 0.08575439453125, 0.10401153564453125, 0.1222686767578125, 0.14052581787109375, 0.158782958984375, 0.17704010009765625, 0.1952972412109375, 0.21355438232421875, 0.2318115234375, 0.25006866455078125, 0.2683258056640625, 0.28658294677734375, 0.304840087890625, 0.32309722900390625, 0.3413543701171875, 0.35961151123046875, 0.37786865234375, 0.39612579345703125, 0.4143829345703125, 0.43264007568359375, 0.450897216796875, 0.46915435791015625, 0.4874114990234375, 0.5056686401367188, 0.52392578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 8.0, 17.0, 39.0, 63.0, 198.0, 575.0, 1843.0, 912.0, 239.0, 72.0, 40.0, 23.0, 12.0, 9.0, 6.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257080078125, -0.2169017791748047, -0.20809555053710938, -0.19928932189941406, -0.19048309326171875, -0.18167686462402344, -0.17287063598632812, -0.1640644073486328, -0.1552581787109375, -0.1464519500732422, -0.13764572143554688, -0.12883949279785156, -0.12003326416015625, -0.11122703552246094, -0.10242080688476562, -0.09361457824707031, -0.084808349609375, -0.07600212097167969, -0.06719589233398438, -0.05838966369628906, -0.04958343505859375, -0.04077720642089844, -0.031970977783203125, -0.023164749145507812, -0.0143585205078125, -0.0055522918701171875, 0.003253936767578125, 0.012060165405273438, 0.02086639404296875, 0.029672622680664062, 0.038478851318359375, 0.04728507995605469, 0.05609130859375, 0.06489753723144531, 0.07370376586914062, 0.08250999450683594, 0.09131622314453125, 0.10012245178222656, 0.10892868041992188, 0.11773490905761719, 0.1265411376953125, 0.1353473663330078, 0.14415359497070312, 0.15295982360839844, 0.16176605224609375, 0.17057228088378906, 0.17937850952148438, 0.1881847381591797, 0.196990966796875, 0.2057971954345703, 0.21460342407226562, 0.22340965270996094, 0.23221588134765625, 0.24102210998535156, 0.24982833862304688, 0.2586345672607422, 0.2674407958984375, 0.2762470245361328, 0.2850532531738281, 0.29385948181152344, 0.30266571044921875, 0.31147193908691406, 0.3202781677246094, 0.3290843963623047, 0.337890625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 0.0, 4.0, 4.0, 10.0, 14.0, 21.0, 26.0, 32.0, 59.0, 88.0, 118.0, 125.0, 114.0, 110.0, 84.0, 67.0, 41.0, 29.0, 19.0, 13.0, 10.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3822675943374634, -1.3486002683639526, -1.314932942390442, -1.2812657356262207, -1.24759840965271, -1.2139310836791992, -1.1802637577056885, -1.1465964317321777, -1.112929105758667, -1.0792617797851562, -1.0455944538116455, -1.0119272470474243, -0.9782599210739136, -0.9445925951004028, -0.9109252691268921, -0.8772579431533813, -0.8435907363891602, -0.8099234104156494, -0.7762561440467834, -0.7425888180732727, -0.7089215517044067, -0.675254225730896, -0.6415868997573853, -0.6079195737838745, -0.5742523074150085, -0.5405849814414978, -0.5069177150726318, -0.4732503890991211, -0.43958309292793274, -0.4059157967567444, -0.37224847078323364, -0.3385811746120453, -0.3049139976501465, -0.27124670147895813, -0.23757939040660858, -0.20391207933425903, -0.17024478316307068, -0.13657748699188232, -0.10291017591953278, -0.06924286484718323, -0.03557556867599487, -0.0019082650542259216, 0.03175903856754303, 0.06542634218931198, 0.09909364581108093, 0.1327609419822693, 0.16642825305461884, 0.20009556412696838, 0.23376286029815674, 0.2674301564693451, 0.30109745264053345, 0.3347647786140442, 0.36843207478523254, 0.4020993709564209, 0.43576669692993164, 0.46943399310112, 0.5031012892723083, 0.5367686152458191, 0.5704358816146851, 0.6041032075881958, 0.6377705335617065, 0.6714377999305725, 0.7051051259040833, 0.7387723922729492, 0.77243971824646]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 12.0, 12.0, 19.0, 18.0, 17.0, 22.0, 23.0, 39.0, 38.0, 37.0, 44.0, 59.0, 45.0, 59.0, 49.0, 51.0, 47.0, 62.0, 56.0, 38.0, 37.0, 32.0, 28.0, 22.0, 27.0, 18.0, 18.0, 12.0, 10.0, 10.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7562676668167114, -0.7345211505889893, -0.7127746343612671, -0.6910281181335449, -0.6692816019058228, -0.6475350260734558, -0.6257885098457336, -0.6040419936180115, -0.5822954773902893, -0.5605489611625671, -0.538802444934845, -0.5170559287071228, -0.49530938267707825, -0.4735628664493561, -0.4518163204193115, -0.43006980419158936, -0.4083232879638672, -0.386576771736145, -0.36483025550842285, -0.3430837094783783, -0.32133719325065613, -0.29959067702293396, -0.2778441309928894, -0.25609761476516724, -0.23435109853744507, -0.2126045823097229, -0.19085805118083954, -0.16911152005195618, -0.147365003824234, -0.12561848759651184, -0.10387195646762848, -0.08212542533874512, -0.060378849506378174, -0.03863232582807541, -0.016885802149772644, 0.004860721528530121, 0.026607245206832886, 0.04835376888513565, 0.07010029256343842, 0.09184682369232178, 0.11359333992004395, 0.1353398561477661, 0.15708638727664948, 0.17883291840553284, 0.200579434633255, 0.22232595086097717, 0.24407248198986053, 0.2658190131187439, 0.28756552934646606, 0.30931204557418823, 0.3310585618019104, 0.35280510783195496, 0.3745516240596771, 0.3962981402873993, 0.41804468631744385, 0.439791202545166, 0.4615377187728882, 0.48328423500061035, 0.5050307512283325, 0.5267772674560547, 0.5485237836837769, 0.5702703595161438, 0.592016875743866, 0.6137633919715881, 0.6355099081993103]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 10.0, 13.0, 14.0, 29.0, 39.0, 52.0, 96.0, 112.0, 149.0, 287.0, 400.0, 653.0, 1101.0, 1717.0, 3125.0, 5426.0, 9812.0, 18907.0, 36958.0, 75812.0, 157703.0, 273821.0, 230336.0, 116156.0, 55566.0, 27637.0, 14320.0, 7590.0, 4341.0, 2350.0, 1505.0, 917.0, 538.0, 381.0, 230.0, 153.0, 111.0, 58.0, 44.0, 29.0, 19.0, 8.0, 12.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.056304931640625, -0.054476261138916016, -0.05264759063720703, -0.05081892013549805, -0.04899024963378906, -0.04716157913208008, -0.045332908630371094, -0.04350423812866211, -0.041675567626953125, -0.03984689712524414, -0.038018226623535156, -0.03618955612182617, -0.03436088562011719, -0.0325322151184082, -0.03070354461669922, -0.028874874114990234, -0.02704620361328125, -0.025217533111572266, -0.02338886260986328, -0.021560192108154297, -0.019731521606445312, -0.017902851104736328, -0.016074180603027344, -0.01424551010131836, -0.012416839599609375, -0.01058816909790039, -0.008759498596191406, -0.006930828094482422, -0.0051021575927734375, -0.003273487091064453, -0.0014448165893554688, 0.0003838539123535156, 0.0022125244140625, 0.004041194915771484, 0.005869865417480469, 0.007698535919189453, 0.009527206420898438, 0.011355876922607422, 0.013184547424316406, 0.01501321792602539, 0.016841888427734375, 0.01867055892944336, 0.020499229431152344, 0.022327899932861328, 0.024156570434570312, 0.025985240936279297, 0.02781391143798828, 0.029642581939697266, 0.03147125244140625, 0.033299922943115234, 0.03512859344482422, 0.0369572639465332, 0.03878593444824219, 0.04061460494995117, 0.042443275451660156, 0.04427194595336914, 0.046100616455078125, 0.04792928695678711, 0.049757957458496094, 0.05158662796020508, 0.05341529846191406, 0.05524396896362305, 0.05707263946533203, 0.058901309967041016, 0.06072998046875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 15.0, 9.0, 13.0, 17.0, 14.0, 25.0, 20.0, 30.0, 30.0, 35.0, 31.0, 37.0, 58.0, 41.0, 46.0, 53.0, 62.0, 48.0, 42.0, 50.0, 36.0, 44.0, 37.0, 21.0, 26.0, 28.0, 21.0, 18.0, 17.0, 12.0, 12.0, 5.0, 8.0, 4.0, 4.0, 6.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.050262451171875, -0.0487065315246582, -0.047150611877441406, -0.04559469223022461, -0.04403877258300781, -0.042482852935791016, -0.04092693328857422, -0.03937101364135742, -0.037815093994140625, -0.03625917434692383, -0.03470325469970703, -0.033147335052490234, -0.03159141540527344, -0.03003549575805664, -0.028479576110839844, -0.026923656463623047, -0.02536773681640625, -0.023811817169189453, -0.022255897521972656, -0.02069997787475586, -0.019144058227539062, -0.017588138580322266, -0.01603221893310547, -0.014476299285888672, -0.012920379638671875, -0.011364459991455078, -0.009808540344238281, -0.008252620697021484, -0.0066967010498046875, -0.005140781402587891, -0.0035848617553710938, -0.002028942108154297, -0.0004730224609375, 0.0010828971862792969, 0.0026388168334960938, 0.004194736480712891, 0.0057506561279296875, 0.007306575775146484, 0.008862495422363281, 0.010418415069580078, 0.011974334716796875, 0.013530254364013672, 0.015086174011230469, 0.016642093658447266, 0.018198013305664062, 0.01975393295288086, 0.021309852600097656, 0.022865772247314453, 0.02442169189453125, 0.025977611541748047, 0.027533531188964844, 0.02908945083618164, 0.030645370483398438, 0.032201290130615234, 0.03375720977783203, 0.03531312942504883, 0.036869049072265625, 0.03842496871948242, 0.03998088836669922, 0.041536808013916016, 0.04309272766113281, 0.04464864730834961, 0.046204566955566406, 0.0477604866027832, 0.04931640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 13.0, 15.0, 15.0, 34.0, 40.0, 57.0, 68.0, 137.0, 234.0, 404.0, 764.0, 2012.0, 6756.0, 36941.0, 405675.0, 546047.0, 38370.0, 7118.0, 1994.0, 799.0, 385.0, 202.0, 137.0, 95.0, 58.0, 54.0, 30.0, 20.0, 19.0, 8.0, 12.0, 6.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2174072265625, -0.2106151580810547, -0.20382308959960938, -0.19703102111816406, -0.19023895263671875, -0.18344688415527344, -0.17665481567382812, -0.1698627471923828, -0.1630706787109375, -0.1562786102294922, -0.14948654174804688, -0.14269447326660156, -0.13590240478515625, -0.12911033630371094, -0.12231826782226562, -0.11552619934082031, -0.108734130859375, -0.10194206237792969, -0.09514999389648438, -0.08835792541503906, -0.08156585693359375, -0.07477378845214844, -0.06798171997070312, -0.06118965148925781, -0.0543975830078125, -0.04760551452636719, -0.040813446044921875, -0.03402137756347656, -0.02722930908203125, -0.020437240600585938, -0.013645172119140625, -0.0068531036376953125, -6.103515625e-05, 0.0067310333251953125, 0.013523101806640625, 0.020315170288085938, 0.02710723876953125, 0.03389930725097656, 0.040691375732421875, 0.04748344421386719, 0.0542755126953125, 0.06106758117675781, 0.06785964965820312, 0.07465171813964844, 0.08144378662109375, 0.08823585510253906, 0.09502792358398438, 0.10181999206542969, 0.108612060546875, 0.11540412902832031, 0.12219619750976562, 0.12898826599121094, 0.13578033447265625, 0.14257240295410156, 0.14936447143554688, 0.1561565399169922, 0.1629486083984375, 0.1697406768798828, 0.17653274536132812, 0.18332481384277344, 0.19011688232421875, 0.19690895080566406, 0.20370101928710938, 0.2104930877685547, 0.21728515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 6.0, 8.0, 7.0, 12.0, 16.0, 6.0, 22.0, 25.0, 19.0, 36.0, 42.0, 49.0, 52.0, 53.0, 62.0, 55.0, 63.0, 62.0, 63.0, 61.0, 45.0, 45.0, 30.0, 32.0, 22.0, 22.0, 18.0, 20.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.239990234375, -0.2322998046875, -0.224609375, -0.2169189453125, -0.209228515625, -0.2015380859375, -0.19384765625, -0.1861572265625, -0.178466796875, -0.1707763671875, -0.1630859375, -0.1553955078125, -0.147705078125, -0.1400146484375, -0.13232421875, -0.1246337890625, -0.116943359375, -0.1092529296875, -0.1015625, -0.0938720703125, -0.086181640625, -0.0784912109375, -0.07080078125, -0.0631103515625, -0.055419921875, -0.0477294921875, -0.0400390625, -0.0323486328125, -0.024658203125, -0.0169677734375, -0.00927734375, -0.0015869140625, 0.006103515625, 0.0137939453125, 0.021484375, 0.0291748046875, 0.036865234375, 0.0445556640625, 0.05224609375, 0.0599365234375, 0.067626953125, 0.0753173828125, 0.0830078125, 0.0906982421875, 0.098388671875, 0.1060791015625, 0.11376953125, 0.1214599609375, 0.129150390625, 0.1368408203125, 0.14453125, 0.1522216796875, 0.159912109375, 0.1676025390625, 0.17529296875, 0.1829833984375, 0.190673828125, 0.1983642578125, 0.2060546875, 0.2137451171875, 0.221435546875, 0.2291259765625, 0.23681640625, 0.2445068359375, 0.252197265625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 18.0, 21.0, 33.0, 47.0, 76.0, 85.0, 142.0, 195.0, 355.0, 532.0, 902.0, 1838.0, 3896.0, 9040.0, 24829.0, 81495.0, 634541.0, 212359.0, 49283.0, 16218.0, 6332.0, 2876.0, 1453.0, 752.0, 415.0, 228.0, 180.0, 127.0, 77.0, 48.0, 38.0, 22.0, 21.0, 11.0, 11.0, 10.0, 3.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0634765625, -0.061415672302246094, -0.05935478210449219, -0.05729389190673828, -0.055233001708984375, -0.05317211151123047, -0.05111122131347656, -0.049050331115722656, -0.04698944091796875, -0.044928550720214844, -0.04286766052246094, -0.04080677032470703, -0.038745880126953125, -0.03668498992919922, -0.03462409973144531, -0.032563209533691406, -0.0305023193359375, -0.028441429138183594, -0.026380538940429688, -0.02431964874267578, -0.022258758544921875, -0.02019786834716797, -0.018136978149414062, -0.016076087951660156, -0.01401519775390625, -0.011954307556152344, -0.009893417358398438, -0.007832527160644531, -0.005771636962890625, -0.0037107467651367188, -0.0016498565673828125, 0.00041103363037109375, 0.002471923828125, 0.004532814025878906, 0.0065937042236328125, 0.008654594421386719, 0.010715484619140625, 0.012776374816894531, 0.014837265014648438, 0.016898155212402344, 0.01895904541015625, 0.021019935607910156, 0.023080825805664062, 0.02514171600341797, 0.027202606201171875, 0.02926349639892578, 0.03132438659667969, 0.033385276794433594, 0.0354461669921875, 0.037507057189941406, 0.03956794738769531, 0.04162883758544922, 0.043689727783203125, 0.04575061798095703, 0.04781150817871094, 0.049872398376464844, 0.05193328857421875, 0.053994178771972656, 0.05605506896972656, 0.05811595916748047, 0.060176849365234375, 0.06223773956298828, 0.06429862976074219, 0.0663595199584961, 0.06842041015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 1.0, 3.0, 4.0, 10.0, 9.0, 5.0, 11.0, 10.0, 18.0, 25.0, 33.0, 37.0, 40.0, 88.0, 115.0, 161.0, 116.0, 96.0, 58.0, 36.0, 27.0, 16.0, 21.0, 13.0, 6.0, 5.0, 9.0, 5.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4497509002685547e-05, -2.345070242881775e-05, -2.240389585494995e-05, -2.1357089281082153e-05, -2.0310282707214355e-05, -1.9263476133346558e-05, -1.821666955947876e-05, -1.7169862985610962e-05, -1.6123056411743164e-05, -1.5076249837875366e-05, -1.4029443264007568e-05, -1.298263669013977e-05, -1.1935830116271973e-05, -1.0889023542404175e-05, -9.842216968536377e-06, -8.795410394668579e-06, -7.748603820800781e-06, -6.701797246932983e-06, -5.6549906730651855e-06, -4.608184099197388e-06, -3.56137752532959e-06, -2.514570951461792e-06, -1.4677643775939941e-06, -4.209578037261963e-07, 6.258487701416016e-07, 1.6726553440093994e-06, 2.7194619178771973e-06, 3.766268491744995e-06, 4.813075065612793e-06, 5.859881639480591e-06, 6.906688213348389e-06, 7.953494787216187e-06, 9.000301361083984e-06, 1.0047107934951782e-05, 1.109391450881958e-05, 1.2140721082687378e-05, 1.3187527656555176e-05, 1.4234334230422974e-05, 1.528114080429077e-05, 1.632794737815857e-05, 1.7374753952026367e-05, 1.8421560525894165e-05, 1.9468367099761963e-05, 2.051517367362976e-05, 2.156198024749756e-05, 2.2608786821365356e-05, 2.3655593395233154e-05, 2.4702399969100952e-05, 2.574920654296875e-05, 2.6796013116836548e-05, 2.7842819690704346e-05, 2.8889626264572144e-05, 2.993643283843994e-05, 3.098323941230774e-05, 3.203004598617554e-05, 3.3076852560043335e-05, 3.412365913391113e-05, 3.517046570777893e-05, 3.621727228164673e-05, 3.7264078855514526e-05, 3.8310885429382324e-05, 3.935769200325012e-05, 4.040449857711792e-05, 4.145130515098572e-05, 4.2498111724853516e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 9.0, 12.0, 32.0, 44.0, 58.0, 87.0, 209.0, 367.0, 1069.0, 3656.0, 20363.0, 218241.0, 756030.0, 39592.0, 6144.0, 1566.0, 509.0, 260.0, 110.0, 74.0, 38.0, 27.0, 10.0, 19.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12205982208251953, -0.11814308166503906, -0.1142263412475586, -0.11030960083007812, -0.10639286041259766, -0.10247611999511719, -0.09855937957763672, -0.09464263916015625, -0.09072589874267578, -0.08680915832519531, -0.08289241790771484, -0.07897567749023438, -0.0750589370727539, -0.07114219665527344, -0.06722545623779297, -0.0633087158203125, -0.05939197540283203, -0.05547523498535156, -0.051558494567871094, -0.047641754150390625, -0.043725013732910156, -0.03980827331542969, -0.03589153289794922, -0.03197479248046875, -0.02805805206298828, -0.024141311645507812, -0.020224571228027344, -0.016307830810546875, -0.012391090393066406, -0.008474349975585938, -0.004557609558105469, -0.000640869140625, 0.0032758712768554688, 0.0071926116943359375, 0.011109352111816406, 0.015026092529296875, 0.018942832946777344, 0.022859573364257812, 0.02677631378173828, 0.03069305419921875, 0.03460979461669922, 0.03852653503417969, 0.042443275451660156, 0.046360015869140625, 0.050276756286621094, 0.05419349670410156, 0.05811023712158203, 0.0620269775390625, 0.06594371795654297, 0.06986045837402344, 0.0737771987915039, 0.07769393920898438, 0.08161067962646484, 0.08552742004394531, 0.08944416046142578, 0.09336090087890625, 0.09727764129638672, 0.10119438171386719, 0.10511112213134766, 0.10902786254882812, 0.1129446029663086, 0.11686134338378906, 0.12077808380126953, 0.12469482421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 11.0, 9.0, 16.0, 17.0, 26.0, 25.0, 37.0, 59.0, 87.0, 112.0, 158.0, 127.0, 84.0, 53.0, 40.0, 33.0, 32.0, 12.0, 14.0, 8.0, 7.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08455562591552734, -0.08195304870605469, -0.07935047149658203, -0.07674789428710938, -0.07414531707763672, -0.07154273986816406, -0.0689401626586914, -0.06633758544921875, -0.0637350082397461, -0.06113243103027344, -0.05852985382080078, -0.055927276611328125, -0.05332469940185547, -0.05072212219238281, -0.048119544982910156, -0.0455169677734375, -0.042914390563964844, -0.04031181335449219, -0.03770923614501953, -0.035106658935546875, -0.03250408172607422, -0.029901504516601562, -0.027298927307128906, -0.02469635009765625, -0.022093772888183594, -0.019491195678710938, -0.01688861846923828, -0.014286041259765625, -0.011683464050292969, -0.009080886840820312, -0.006478309631347656, -0.003875732421875, -0.0012731552124023438, 0.0013294219970703125, 0.003931999206542969, 0.006534576416015625, 0.009137153625488281, 0.011739730834960938, 0.014342308044433594, 0.01694488525390625, 0.019547462463378906, 0.022150039672851562, 0.02475261688232422, 0.027355194091796875, 0.02995777130126953, 0.03256034851074219, 0.035162925720214844, 0.0377655029296875, 0.040368080139160156, 0.04297065734863281, 0.04557323455810547, 0.048175811767578125, 0.05077838897705078, 0.05338096618652344, 0.055983543395996094, 0.05858612060546875, 0.061188697814941406, 0.06379127502441406, 0.06639385223388672, 0.06899642944335938, 0.07159900665283203, 0.07420158386230469, 0.07680416107177734, 0.07940673828125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 15.0, 29.0, 74.0, 152.0, 380.0, 169.0, 99.0, 45.0, 22.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5809786319732666, -1.5139507055282593, -1.446922779083252, -1.3798949718475342, -1.3128670454025269, -1.2458391189575195, -1.1788111925125122, -1.1117832660675049, -1.044755458831787, -0.9777275323867798, -0.9106996655464172, -0.8436717391014099, -0.7766438722610474, -0.70961594581604, -0.6425880193710327, -0.5755600929260254, -0.5085321664810181, -0.44150426983833313, -0.3744763731956482, -0.30744844675064087, -0.24042055010795593, -0.173392653465271, -0.10636472702026367, -0.039336830377578735, 0.0276910662651062, 0.09471897035837173, 0.16174687445163727, 0.2287747859954834, 0.29580268263816833, 0.36283057928085327, 0.4298585057258606, 0.49688640236854553, 0.5639142990112305, 0.6309422254562378, 0.6979700922966003, 0.7649980187416077, 0.8320258855819702, 0.8990538120269775, 0.9660817384719849, 1.0331096649169922, 1.10013747215271, 1.1671653985977173, 1.2341933250427246, 1.3012211322784424, 1.3682490587234497, 1.435276985168457, 1.5023049116134644, 1.5693328380584717, 1.636360764503479, 1.7033886909484863, 1.7704166173934937, 1.837444543838501, 1.9044723510742188, 1.971500277519226, 2.0385282039642334, 2.105556011199951, 2.172584056854248, 2.239611864089966, 2.3066399097442627, 2.3736677169799805, 2.4406957626342773, 2.507723569869995, 2.574751377105713, 2.6417794227600098, 2.7088072299957275]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 1.0, 7.0, 8.0, 15.0, 17.0, 16.0, 18.0, 20.0, 23.0, 21.0, 27.0, 33.0, 36.0, 25.0, 52.0, 73.0, 102.0, 86.0, 66.0, 51.0, 38.0, 30.0, 28.0, 33.0, 18.0, 20.0, 16.0, 21.0, 16.0, 14.0, 14.0, 17.0, 9.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9006272554397583, -0.8724240064620972, -0.844220757484436, -0.8160175085067749, -0.7878142595291138, -0.7596110105514526, -0.7314077615737915, -0.7032045125961304, -0.6750012636184692, -0.6467980146408081, -0.618594765663147, -0.5903915166854858, -0.5621882677078247, -0.5339850187301636, -0.5057817697525024, -0.4775785207748413, -0.4493752717971802, -0.42117202281951904, -0.3929687738418579, -0.3647655248641968, -0.33656227588653564, -0.3083590269088745, -0.2801557779312134, -0.25195252895355225, -0.2237492799758911, -0.19554603099822998, -0.16734278202056885, -0.13913953304290771, -0.11093628406524658, -0.08273303508758545, -0.054529786109924316, -0.026326537132263184, 0.0018766522407531738, 0.030079901218414307, 0.05828315019607544, 0.08648639917373657, 0.1146896481513977, 0.14289289712905884, 0.17109614610671997, 0.1992993950843811, 0.22750264406204224, 0.25570589303970337, 0.2839091420173645, 0.31211239099502563, 0.34031563997268677, 0.3685188889503479, 0.39672213792800903, 0.42492538690567017, 0.4531286358833313, 0.48133188486099243, 0.5095351338386536, 0.5377383828163147, 0.5659416317939758, 0.594144880771637, 0.6223481297492981, 0.6505513787269592, 0.6787546277046204, 0.7069578766822815, 0.7351611256599426, 0.7633643746376038, 0.7915676236152649, 0.819770872592926, 0.8479741215705872, 0.8761773705482483, 0.9043806195259094]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 5.0, 9.0, 6.0, 7.0, 11.0, 12.0, 27.0, 30.0, 47.0, 72.0, 98.0, 138.0, 231.0, 331.0, 598.0, 1090.0, 2130.0, 4436.0, 11037.0, 42694.0, 485616.0, 3169058.0, 414566.0, 41494.0, 11391.0, 4436.0, 2076.0, 1131.0, 603.0, 362.0, 220.0, 103.0, 66.0, 49.0, 29.0, 25.0, 9.0, 11.0, 8.0, 6.0, 7.0, 1.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12760543823242188, -0.12410736083984375, -0.12060928344726562, -0.1171112060546875, -0.11361312866210938, -0.11011505126953125, -0.10661697387695312, -0.103118896484375, -0.09962081909179688, -0.09612274169921875, -0.09262466430664062, -0.0891265869140625, -0.08562850952148438, -0.08213043212890625, -0.07863235473632812, -0.07513427734375, -0.07163619995117188, -0.06813812255859375, -0.06464004516601562, -0.0611419677734375, -0.057643890380859375, -0.05414581298828125, -0.050647735595703125, -0.047149658203125, -0.043651580810546875, -0.04015350341796875, -0.036655426025390625, -0.0331573486328125, -0.029659271240234375, -0.02616119384765625, -0.022663116455078125, -0.0191650390625, -0.015666961669921875, -0.01216888427734375, -0.008670806884765625, -0.0051727294921875, -0.001674652099609375, 0.00182342529296875, 0.005321502685546875, 0.008819580078125, 0.012317657470703125, 0.01581573486328125, 0.019313812255859375, 0.0228118896484375, 0.026309967041015625, 0.02980804443359375, 0.033306121826171875, 0.03680419921875, 0.040302276611328125, 0.04380035400390625, 0.047298431396484375, 0.0507965087890625, 0.054294586181640625, 0.05779266357421875, 0.061290740966796875, 0.064788818359375, 0.06828689575195312, 0.07178497314453125, 0.07528305053710938, 0.0787811279296875, 0.08227920532226562, 0.08577728271484375, 0.08927536010742188, 0.0927734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 6.0, 7.0, 6.0, 8.0, 11.0, 26.0, 26.0, 24.0, 27.0, 28.0, 26.0, 35.0, 47.0, 47.0, 30.0, 48.0, 58.0, 50.0, 52.0, 47.0, 40.0, 43.0, 43.0, 27.0, 32.0, 33.0, 23.0, 22.0, 28.0, 11.0, 11.0, 4.0, 7.0, 8.0, 8.0, 9.0, 5.0, 7.0, 5.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043701171875, -0.042272090911865234, -0.04084300994873047, -0.0394139289855957, -0.03798484802246094, -0.03655576705932617, -0.035126686096191406, -0.03369760513305664, -0.032268524169921875, -0.03083944320678711, -0.029410362243652344, -0.027981281280517578, -0.026552200317382812, -0.025123119354248047, -0.02369403839111328, -0.022264957427978516, -0.02083587646484375, -0.019406795501708984, -0.01797771453857422, -0.016548633575439453, -0.015119552612304688, -0.013690471649169922, -0.012261390686035156, -0.01083230972290039, -0.009403228759765625, -0.00797414779663086, -0.006545066833496094, -0.005115985870361328, -0.0036869049072265625, -0.002257823944091797, -0.0008287429809570312, 0.0006003379821777344, 0.0020294189453125, 0.0034584999084472656, 0.004887580871582031, 0.006316661834716797, 0.0077457427978515625, 0.009174823760986328, 0.010603904724121094, 0.01203298568725586, 0.013462066650390625, 0.01489114761352539, 0.016320228576660156, 0.017749309539794922, 0.019178390502929688, 0.020607471466064453, 0.02203655242919922, 0.023465633392333984, 0.02489471435546875, 0.026323795318603516, 0.02775287628173828, 0.029181957244873047, 0.030611038208007812, 0.03204011917114258, 0.033469200134277344, 0.03489828109741211, 0.036327362060546875, 0.03775644302368164, 0.039185523986816406, 0.04061460494995117, 0.04204368591308594, 0.0434727668762207, 0.04490184783935547, 0.046330928802490234, 0.047760009765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 13.0, 21.0, 46.0, 72.0, 134.0, 298.0, 751.0, 2360.0, 14265.0, 3684884.0, 480228.0, 8310.0, 1726.0, 606.0, 267.0, 134.0, 67.0, 40.0, 15.0, 11.0, 9.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5373306274414062, -0.5219268798828125, -0.5065231323242188, -0.491119384765625, -0.47571563720703125, -0.4603118896484375, -0.44490814208984375, -0.42950439453125, -0.41410064697265625, -0.3986968994140625, -0.38329315185546875, -0.367889404296875, -0.35248565673828125, -0.3370819091796875, -0.32167816162109375, -0.3062744140625, -0.29087066650390625, -0.2754669189453125, -0.26006317138671875, -0.244659423828125, -0.22925567626953125, -0.2138519287109375, -0.19844818115234375, -0.18304443359375, -0.16764068603515625, -0.1522369384765625, -0.13683319091796875, -0.121429443359375, -0.10602569580078125, -0.0906219482421875, -0.07521820068359375, -0.059814453125, -0.04441070556640625, -0.0290069580078125, -0.01360321044921875, 0.001800537109375, 0.01720428466796875, 0.0326080322265625, 0.04801177978515625, 0.06341552734375, 0.07881927490234375, 0.0942230224609375, 0.10962677001953125, 0.125030517578125, 0.14043426513671875, 0.1558380126953125, 0.17124176025390625, 0.1866455078125, 0.20204925537109375, 0.2174530029296875, 0.23285675048828125, 0.248260498046875, 0.26366424560546875, 0.2790679931640625, 0.29447174072265625, 0.30987548828125, 0.32527923583984375, 0.3406829833984375, 0.35608673095703125, 0.371490478515625, 0.38689422607421875, 0.4022979736328125, 0.41770172119140625, 0.43310546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 6.0, 1.0, 9.0, 9.0, 13.0, 25.0, 51.0, 81.0, 198.0, 553.0, 1462.0, 1064.0, 339.0, 127.0, 54.0, 29.0, 22.0, 7.0, 5.0, 8.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279052734375, -0.2696876525878906, -0.26032257080078125, -0.2509574890136719, -0.2415924072265625, -0.23222732543945312, -0.22286224365234375, -0.21349716186523438, -0.204132080078125, -0.19476699829101562, -0.18540191650390625, -0.17603683471679688, -0.1666717529296875, -0.15730667114257812, -0.14794158935546875, -0.13857650756835938, -0.12921142578125, -0.11984634399414062, -0.11048126220703125, -0.10111618041992188, -0.0917510986328125, -0.08238601684570312, -0.07302093505859375, -0.06365585327148438, -0.054290771484375, -0.044925689697265625, -0.03556060791015625, -0.026195526123046875, -0.0168304443359375, -0.007465362548828125, 0.00189971923828125, 0.011264801025390625, 0.0206298828125, 0.029994964599609375, 0.03936004638671875, 0.048725128173828125, 0.0580902099609375, 0.06745529174804688, 0.07682037353515625, 0.08618545532226562, 0.095550537109375, 0.10491561889648438, 0.11428070068359375, 0.12364578247070312, 0.1330108642578125, 0.14237594604492188, 0.15174102783203125, 0.16110610961914062, 0.17047119140625, 0.17983627319335938, 0.18920135498046875, 0.19856643676757812, 0.2079315185546875, 0.21729660034179688, 0.22666168212890625, 0.23602676391601562, 0.245391845703125, 0.2547569274902344, 0.26412200927734375, 0.2734870910644531, 0.2828521728515625, 0.2922172546386719, 0.30158233642578125, 0.3109474182128906, 0.3203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 13.0, 20.0, 64.0, 149.0, 308.0, 261.0, 119.0, 43.0, 15.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.625086307525635, -5.520579814910889, -5.416073322296143, -5.311567306518555, -5.207060813903809, -5.1025543212890625, -4.998047828674316, -4.89354133605957, -4.789034843444824, -4.684528350830078, -4.580021858215332, -4.475515365600586, -4.371009349822998, -4.266502857208252, -4.161996364593506, -4.05748987197876, -3.952983856201172, -3.848477363586426, -3.743971109390259, -3.6394646167755127, -3.5349581241607666, -3.4304518699645996, -3.3259453773498535, -3.2214388847351074, -3.1169323921203613, -3.0124258995056152, -2.9079196453094482, -2.803413152694702, -2.698906660079956, -2.594400405883789, -2.489893913269043, -2.385387420654297, -2.28088116645813, -2.176374673843384, -2.071868419647217, -1.9673619270324707, -1.8628555536270142, -1.7583491802215576, -1.6538426876068115, -1.549336314201355, -1.4448299407958984, -1.340323567390442, -1.2358170747756958, -1.1313107013702393, -1.0268043279647827, -0.9222978949546814, -0.8177914619445801, -0.7132850885391235, -0.6087785959243774, -0.5042721629142761, -0.3997657895088196, -0.29525935649871826, -0.19075295329093933, -0.0862465500831604, 0.018259882926940918, 0.12276625633239746, 0.22727268934249878, 0.3317790925502777, 0.43628549575805664, 0.540791928768158, 0.6452983617782593, 0.7498047351837158, 0.8543111681938171, 0.9588175415992737, 1.063323974609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 22.0, 27.0, 10.0, 20.0, 16.0, 18.0, 28.0, 36.0, 24.0, 38.0, 44.0, 48.0, 49.0, 65.0, 67.0, 56.0, 51.0, 46.0, 45.0, 30.0, 44.0, 34.0, 30.0, 27.0, 21.0, 16.0, 11.0, 7.0, 14.0, 11.0, 4.0, 2.0, 9.0, 8.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7457953095436096, -0.7195703387260437, -0.693345308303833, -0.6671203374862671, -0.6408953666687012, -0.6146703958511353, -0.5884453654289246, -0.5622203946113586, -0.535995364189148, -0.509770393371582, -0.4835453927516937, -0.4573203921318054, -0.4310954213142395, -0.4048704206943512, -0.3786454200744629, -0.352420449256897, -0.32619547843933105, -0.29997047781944275, -0.27374550700187683, -0.24752050638198853, -0.2212955206632614, -0.1950705349445343, -0.168845534324646, -0.14262054860591888, -0.11639556288719177, -0.09017057716846466, -0.06394558399915695, -0.03772059082984924, -0.011495605111122131, 0.01472938060760498, 0.040954381227493286, 0.0671793669462204, 0.09340429306030273, 0.11962927877902985, 0.14585426449775696, 0.17207926511764526, 0.19830425083637238, 0.2245292365550995, 0.2507542371749878, 0.2769792079925537, 0.303204208612442, 0.3294292092323303, 0.35565418004989624, 0.38187918066978455, 0.40810418128967285, 0.43432915210723877, 0.4605541527271271, 0.4867791533470154, 0.5130041241645813, 0.5392290949821472, 0.5654541254043579, 0.5916790962219238, 0.6179040670394897, 0.6441290378570557, 0.6703540682792664, 0.6965790390968323, 0.722804069519043, 0.7490290403366089, 0.7752540707588196, 0.8014790415763855, 0.8277040123939514, 0.8539290428161621, 0.880154013633728, 0.906378984451294, 0.9326039552688599]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 5.0, 8.0, 9.0, 10.0, 28.0, 33.0, 49.0, 129.0, 200.0, 303.0, 532.0, 1069.0, 2068.0, 4323.0, 9510.0, 22632.0, 61150.0, 189650.0, 423118.0, 218213.0, 69753.0, 25700.0, 10461.0, 4774.0, 2212.0, 1127.0, 611.0, 370.0, 205.0, 110.0, 63.0, 53.0, 33.0, 17.0, 8.0, 10.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11285400390625, -0.10903644561767578, -0.10521888732910156, -0.10140132904052734, -0.09758377075195312, -0.0937662124633789, -0.08994865417480469, -0.08613109588623047, -0.08231353759765625, -0.07849597930908203, -0.07467842102050781, -0.0708608627319336, -0.06704330444335938, -0.06322574615478516, -0.05940818786621094, -0.05559062957763672, -0.0517730712890625, -0.04795551300048828, -0.04413795471191406, -0.040320396423339844, -0.036502838134765625, -0.032685279846191406, -0.028867721557617188, -0.02505016326904297, -0.02123260498046875, -0.01741504669189453, -0.013597488403320312, -0.009779930114746094, -0.005962371826171875, -0.0021448135375976562, 0.0016727447509765625, 0.005490303039550781, 0.009307861328125, 0.013125419616699219, 0.016942977905273438, 0.020760536193847656, 0.024578094482421875, 0.028395652770996094, 0.03221321105957031, 0.03603076934814453, 0.03984832763671875, 0.04366588592529297, 0.04748344421386719, 0.051301002502441406, 0.055118560791015625, 0.058936119079589844, 0.06275367736816406, 0.06657123565673828, 0.0703887939453125, 0.07420635223388672, 0.07802391052246094, 0.08184146881103516, 0.08565902709960938, 0.0894765853881836, 0.09329414367675781, 0.09711170196533203, 0.10092926025390625, 0.10474681854248047, 0.10856437683105469, 0.1123819351196289, 0.11619949340820312, 0.12001705169677734, 0.12383460998535156, 0.12765216827392578, 0.1314697265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 11.0, 7.0, 11.0, 13.0, 23.0, 25.0, 38.0, 36.0, 37.0, 47.0, 39.0, 45.0, 55.0, 57.0, 44.0, 46.0, 50.0, 46.0, 46.0, 49.0, 43.0, 28.0, 24.0, 32.0, 29.0, 26.0, 26.0, 10.0, 13.0, 8.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056121826171875, -0.05418825149536133, -0.052254676818847656, -0.050321102142333984, -0.04838752746582031, -0.04645395278930664, -0.04452037811279297, -0.0425868034362793, -0.040653228759765625, -0.03871965408325195, -0.03678607940673828, -0.03485250473022461, -0.03291893005371094, -0.030985355377197266, -0.029051780700683594, -0.027118206024169922, -0.02518463134765625, -0.023251056671142578, -0.021317481994628906, -0.019383907318115234, -0.017450332641601562, -0.01551675796508789, -0.013583183288574219, -0.011649608612060547, -0.009716033935546875, -0.007782459259033203, -0.005848884582519531, -0.003915309906005859, -0.0019817352294921875, -4.8160552978515625e-05, 0.0018854141235351562, 0.003818988800048828, 0.0057525634765625, 0.007686138153076172, 0.009619712829589844, 0.011553287506103516, 0.013486862182617188, 0.01542043685913086, 0.01735401153564453, 0.019287586212158203, 0.021221160888671875, 0.023154735565185547, 0.02508831024169922, 0.02702188491821289, 0.028955459594726562, 0.030889034271240234, 0.032822608947753906, 0.03475618362426758, 0.03668975830078125, 0.03862333297729492, 0.040556907653808594, 0.042490482330322266, 0.04442405700683594, 0.04635763168334961, 0.04829120635986328, 0.05022478103637695, 0.052158355712890625, 0.0540919303894043, 0.05602550506591797, 0.05795907974243164, 0.05989265441894531, 0.061826229095458984, 0.06375980377197266, 0.06569337844848633, 0.067626953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 13.0, 19.0, 20.0, 40.0, 50.0, 87.0, 113.0, 237.0, 423.0, 936.0, 2378.0, 10900.0, 146213.0, 841167.0, 38067.0, 4979.0, 1520.0, 626.0, 307.0, 150.0, 107.0, 72.0, 45.0, 24.0, 12.0, 19.0, 10.0, 3.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.36785125732421875, -0.3567962646484375, -0.34574127197265625, -0.334686279296875, -0.32363128662109375, -0.3125762939453125, -0.30152130126953125, -0.29046630859375, -0.27941131591796875, -0.2683563232421875, -0.25730133056640625, -0.246246337890625, -0.23519134521484375, -0.2241363525390625, -0.21308135986328125, -0.2020263671875, -0.19097137451171875, -0.1799163818359375, -0.16886138916015625, -0.157806396484375, -0.14675140380859375, -0.1356964111328125, -0.12464141845703125, -0.11358642578125, -0.10253143310546875, -0.0914764404296875, -0.08042144775390625, -0.069366455078125, -0.05831146240234375, -0.0472564697265625, -0.03620147705078125, -0.025146484375, -0.01409149169921875, -0.0030364990234375, 0.00801849365234375, 0.019073486328125, 0.03012847900390625, 0.0411834716796875, 0.05223846435546875, 0.06329345703125, 0.07434844970703125, 0.0854034423828125, 0.09645843505859375, 0.107513427734375, 0.11856842041015625, 0.1296234130859375, 0.14067840576171875, 0.1517333984375, 0.16278839111328125, 0.1738433837890625, 0.18489837646484375, 0.195953369140625, 0.20700836181640625, 0.2180633544921875, 0.22911834716796875, 0.24017333984375, 0.25122833251953125, 0.2622833251953125, 0.27333831787109375, 0.284393310546875, 0.29544830322265625, 0.3065032958984375, 0.31755828857421875, 0.32861328125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 11.0, 11.0, 13.0, 9.0, 18.0, 17.0, 19.0, 20.0, 26.0, 32.0, 43.0, 43.0, 45.0, 50.0, 39.0, 55.0, 70.0, 48.0, 54.0, 36.0, 49.0, 40.0, 35.0, 40.0, 29.0, 21.0, 23.0, 18.0, 11.0, 13.0, 12.0, 8.0, 7.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.23836898803710938, -0.23101043701171875, -0.22365188598632812, -0.2162933349609375, -0.20893478393554688, -0.20157623291015625, -0.19421768188476562, -0.186859130859375, -0.17950057983398438, -0.17214202880859375, -0.16478347778320312, -0.1574249267578125, -0.15006637573242188, -0.14270782470703125, -0.13534927368164062, -0.12799072265625, -0.12063217163085938, -0.11327362060546875, -0.10591506958007812, -0.0985565185546875, -0.09119796752929688, -0.08383941650390625, -0.07648086547851562, -0.069122314453125, -0.061763763427734375, -0.05440521240234375, -0.047046661376953125, -0.0396881103515625, -0.032329559326171875, -0.02497100830078125, -0.017612457275390625, -0.01025390625, -0.002895355224609375, 0.00446319580078125, 0.011821746826171875, 0.0191802978515625, 0.026538848876953125, 0.03389739990234375, 0.041255950927734375, 0.048614501953125, 0.055973052978515625, 0.06333160400390625, 0.07069015502929688, 0.0780487060546875, 0.08540725708007812, 0.09276580810546875, 0.10012435913085938, 0.10748291015625, 0.11484146118164062, 0.12220001220703125, 0.12955856323242188, 0.1369171142578125, 0.14427566528320312, 0.15163421630859375, 0.15899276733398438, 0.166351318359375, 0.17370986938476562, 0.18106842041015625, 0.18842697143554688, 0.1957855224609375, 0.20314407348632812, 0.21050262451171875, 0.21786117553710938, 0.2252197265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 6.0, 6.0, 11.0, 13.0, 16.0, 30.0, 36.0, 61.0, 70.0, 113.0, 156.0, 246.0, 418.0, 670.0, 1192.0, 2638.0, 5891.0, 16457.0, 57588.0, 565137.0, 316011.0, 54857.0, 15528.0, 5794.0, 2450.0, 1229.0, 690.0, 424.0, 265.0, 169.0, 100.0, 84.0, 52.0, 40.0, 34.0, 14.0, 13.0, 9.0, 4.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0592041015625, -0.05716133117675781, -0.055118560791015625, -0.05307579040527344, -0.05103302001953125, -0.04899024963378906, -0.046947479248046875, -0.04490470886230469, -0.0428619384765625, -0.04081916809082031, -0.038776397705078125, -0.03673362731933594, -0.03469085693359375, -0.03264808654785156, -0.030605316162109375, -0.028562545776367188, -0.026519775390625, -0.024477005004882812, -0.022434234619140625, -0.020391464233398438, -0.01834869384765625, -0.016305923461914062, -0.014263153076171875, -0.012220382690429688, -0.0101776123046875, -0.008134841918945312, -0.006092071533203125, -0.0040493011474609375, -0.00200653076171875, 3.62396240234375e-05, 0.002079010009765625, 0.0041217803955078125, 0.00616455078125, 0.008207321166992188, 0.010250091552734375, 0.012292861938476562, 0.01433563232421875, 0.016378402709960938, 0.018421173095703125, 0.020463943481445312, 0.0225067138671875, 0.024549484252929688, 0.026592254638671875, 0.028635025024414062, 0.03067779541015625, 0.03272056579589844, 0.034763336181640625, 0.03680610656738281, 0.038848876953125, 0.04089164733886719, 0.042934417724609375, 0.04497718811035156, 0.04701995849609375, 0.04906272888183594, 0.051105499267578125, 0.05314826965332031, 0.0551910400390625, 0.05723381042480469, 0.059276580810546875, 0.06131935119628906, 0.06336212158203125, 0.06540489196777344, 0.06744766235351562, 0.06949043273925781, 0.071533203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 7.0, 11.0, 13.0, 22.0, 23.0, 34.0, 47.0, 69.0, 82.0, 104.0, 105.0, 111.0, 72.0, 51.0, 44.0, 38.0, 35.0, 20.0, 16.0, 14.0, 14.0, 11.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.057718276977539e-05, -2.9607675969600677e-05, -2.8638169169425964e-05, -2.766866236925125e-05, -2.6699155569076538e-05, -2.5729648768901825e-05, -2.4760141968727112e-05, -2.37906351685524e-05, -2.2821128368377686e-05, -2.1851621568202972e-05, -2.088211476802826e-05, -1.9912607967853546e-05, -1.8943101167678833e-05, -1.797359436750412e-05, -1.7004087567329407e-05, -1.6034580767154694e-05, -1.506507396697998e-05, -1.4095567166805267e-05, -1.3126060366630554e-05, -1.2156553566455841e-05, -1.1187046766281128e-05, -1.0217539966106415e-05, -9.248033165931702e-06, -8.278526365756989e-06, -7.309019565582275e-06, -6.339512765407562e-06, -5.370005965232849e-06, -4.400499165058136e-06, -3.430992364883423e-06, -2.4614855647087097e-06, -1.4919787645339966e-06, -5.224719643592834e-07, 4.470348358154297e-07, 1.4165416359901428e-06, 2.386048436164856e-06, 3.355555236339569e-06, 4.325062036514282e-06, 5.294568836688995e-06, 6.2640756368637085e-06, 7.233582437038422e-06, 8.203089237213135e-06, 9.172596037387848e-06, 1.0142102837562561e-05, 1.1111609637737274e-05, 1.2081116437911987e-05, 1.30506232380867e-05, 1.4020130038261414e-05, 1.4989636838436127e-05, 1.595914363861084e-05, 1.6928650438785553e-05, 1.7898157238960266e-05, 1.886766403913498e-05, 1.9837170839309692e-05, 2.0806677639484406e-05, 2.177618443965912e-05, 2.2745691239833832e-05, 2.3715198040008545e-05, 2.4684704840183258e-05, 2.565421164035797e-05, 2.6623718440532684e-05, 2.7593225240707397e-05, 2.856273204088211e-05, 2.9532238841056824e-05, 3.0501745641231537e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 19.0, 14.0, 25.0, 36.0, 58.0, 85.0, 140.0, 219.0, 311.0, 611.0, 1265.0, 3273.0, 10690.0, 48798.0, 632928.0, 294698.0, 40411.0, 9360.0, 2901.0, 1213.0, 556.0, 325.0, 208.0, 109.0, 83.0, 61.0, 37.0, 22.0, 25.0, 16.0, 13.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.076171875, -0.07371044158935547, -0.07124900817871094, -0.0687875747680664, -0.06632614135742188, -0.06386470794677734, -0.06140327453613281, -0.05894184112548828, -0.05648040771484375, -0.05401897430419922, -0.05155754089355469, -0.049096107482910156, -0.046634674072265625, -0.044173240661621094, -0.04171180725097656, -0.03925037384033203, -0.0367889404296875, -0.03432750701904297, -0.03186607360839844, -0.029404640197753906, -0.026943206787109375, -0.024481773376464844, -0.022020339965820312, -0.01955890655517578, -0.01709747314453125, -0.014636039733886719, -0.012174606323242188, -0.009713172912597656, -0.007251739501953125, -0.004790306091308594, -0.0023288726806640625, 0.00013256072998046875, 0.002593994140625, 0.005055427551269531, 0.0075168609619140625, 0.009978294372558594, 0.012439727783203125, 0.014901161193847656, 0.017362594604492188, 0.01982402801513672, 0.02228546142578125, 0.02474689483642578, 0.027208328247070312, 0.029669761657714844, 0.032131195068359375, 0.034592628479003906, 0.03705406188964844, 0.03951549530029297, 0.0419769287109375, 0.04443836212158203, 0.04689979553222656, 0.049361228942871094, 0.051822662353515625, 0.054284095764160156, 0.05674552917480469, 0.05920696258544922, 0.06166839599609375, 0.06412982940673828, 0.06659126281738281, 0.06905269622802734, 0.07151412963867188, 0.0739755630493164, 0.07643699645996094, 0.07889842987060547, 0.08135986328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 9.0, 3.0, 10.0, 12.0, 17.0, 9.0, 12.0, 23.0, 26.0, 33.0, 46.0, 55.0, 44.0, 44.0, 101.0, 105.0, 72.0, 62.0, 48.0, 48.0, 34.0, 31.0, 22.0, 26.0, 21.0, 18.0, 7.0, 15.0, 5.0, 9.0, 7.0, 1.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043212890625, -0.04173469543457031, -0.040256500244140625, -0.03877830505371094, -0.03730010986328125, -0.03582191467285156, -0.034343719482421875, -0.03286552429199219, -0.0313873291015625, -0.029909133911132812, -0.028430938720703125, -0.026952743530273438, -0.02547454833984375, -0.023996353149414062, -0.022518157958984375, -0.021039962768554688, -0.019561767578125, -0.018083572387695312, -0.016605377197265625, -0.015127182006835938, -0.01364898681640625, -0.012170791625976562, -0.010692596435546875, -0.009214401245117188, -0.0077362060546875, -0.0062580108642578125, -0.004779815673828125, -0.0033016204833984375, -0.00182342529296875, -0.0003452301025390625, 0.001132965087890625, 0.0026111602783203125, 0.00408935546875, 0.0055675506591796875, 0.007045745849609375, 0.008523941040039062, 0.01000213623046875, 0.011480331420898438, 0.012958526611328125, 0.014436721801757812, 0.0159149169921875, 0.017393112182617188, 0.018871307373046875, 0.020349502563476562, 0.02182769775390625, 0.023305892944335938, 0.024784088134765625, 0.026262283325195312, 0.027740478515625, 0.029218673706054688, 0.030696868896484375, 0.03217506408691406, 0.03365325927734375, 0.03513145446777344, 0.036609649658203125, 0.03808784484863281, 0.0395660400390625, 0.04104423522949219, 0.042522430419921875, 0.04400062561035156, 0.04547882080078125, 0.04695701599121094, 0.048435211181640625, 0.04991340637207031, 0.0513916015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 12.0, 16.0, 36.0, 54.0, 98.0, 218.0, 346.0, 102.0, 55.0, 27.0, 15.0, 7.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7580373287200928, -1.690746545791626, -1.6234556436538696, -1.5561648607254028, -1.4888739585876465, -1.4215831756591797, -1.354292392730713, -1.287001609802246, -1.2197107076644897, -1.152419924736023, -1.0851290225982666, -1.0178382396697998, -0.9505473971366882, -0.8832565546035767, -0.8159657716751099, -0.7486749291419983, -0.6813840866088867, -0.6140932440757751, -0.5468024015426636, -0.4795116186141968, -0.4122207760810852, -0.34492993354797363, -0.27763912081718445, -0.21034830808639526, -0.1430574655532837, -0.07576663792133331, -0.008475810289382935, 0.058815017342567444, 0.12610584497451782, 0.1933966875076294, 0.2606875002384186, 0.32797831296920776, 0.39526891708374023, 0.4625597596168518, 0.5298506021499634, 0.5971413850784302, 0.6644322276115417, 0.7317230701446533, 0.7990138530731201, 0.8663046956062317, 0.9335955381393433, 1.00088632106781, 1.0681772232055664, 1.1354680061340332, 1.2027587890625, 1.2700496912002563, 1.3373404741287231, 1.4046313762664795, 1.4719221591949463, 1.539212942123413, 1.6065038442611694, 1.6737946271896362, 1.7410855293273926, 1.8083763122558594, 1.8756670951843262, 1.942957878112793, 2.0102486610412598, 2.0775394439697266, 2.1448302268981934, 2.2121212482452393, 2.279412031173706, 2.346702814102173, 2.4139935970306396, 2.4812843799591064, 2.5485754013061523]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 5.0, 10.0, 7.0, 13.0, 14.0, 15.0, 22.0, 28.0, 26.0, 20.0, 27.0, 35.0, 42.0, 60.0, 137.0, 160.0, 46.0, 44.0, 36.0, 38.0, 27.0, 28.0, 24.0, 30.0, 18.0, 19.0, 13.0, 13.0, 7.0, 7.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.088390827178955, -1.0543274879455566, -1.0202640295028687, -0.9862006306648254, -0.9521372318267822, -0.918073832988739, -0.8840104341506958, -0.8499470949172974, -0.8158836364746094, -0.7818202376365662, -0.747756838798523, -0.7136934399604797, -0.6796300411224365, -0.6455666422843933, -0.6115032434463501, -0.5774399042129517, -0.5433765053749084, -0.5093131065368652, -0.475249707698822, -0.4411863088607788, -0.4071229100227356, -0.3730595111846924, -0.33899614214897156, -0.30493274331092834, -0.27086934447288513, -0.23680594563484192, -0.2027425467967987, -0.1686791628599167, -0.13461576402187347, -0.10055236518383026, -0.06648898124694824, -0.03242558240890503, 0.0016378164291381836, 0.0357012115418911, 0.06976460665464401, 0.10382799804210663, 0.13789139688014984, 0.17195479571819305, 0.20601817965507507, 0.2400815784931183, 0.2741449773311615, 0.3082083761692047, 0.3422717750072479, 0.37633514404296875, 0.41039854288101196, 0.4444619417190552, 0.4785253405570984, 0.5125887393951416, 0.5466521382331848, 0.580715537071228, 0.6147789359092712, 0.6488423347473145, 0.6829057335853577, 0.7169691324234009, 0.7510324716567993, 0.7850959300994873, 0.8191592693328857, 0.853222668170929, 0.8872860670089722, 0.9213494658470154, 0.9554128646850586, 0.9894762635231018, 1.023539662361145, 1.0576030015945435, 1.0916664600372314]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 1.0, 2.0, 4.0, 9.0, 14.0, 17.0, 14.0, 23.0, 38.0, 55.0, 80.0, 118.0, 193.0, 309.0, 527.0, 903.0, 1603.0, 2786.0, 5497.0, 11760.0, 27830.0, 87330.0, 438235.0, 2170330.0, 1174983.0, 188204.0, 48030.0, 18063.0, 8188.0, 4060.0, 2103.0, 1203.0, 675.0, 422.0, 257.0, 138.0, 98.0, 55.0, 47.0, 36.0, 19.0, 13.0, 1.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.0944967269897461, -0.09109306335449219, -0.08768939971923828, -0.08428573608398438, -0.08088207244873047, -0.07747840881347656, -0.07407474517822266, -0.07067108154296875, -0.06726741790771484, -0.06386375427246094, -0.06046009063720703, -0.057056427001953125, -0.05365276336669922, -0.05024909973144531, -0.046845436096191406, -0.0434417724609375, -0.040038108825683594, -0.03663444519042969, -0.03323078155517578, -0.029827117919921875, -0.02642345428466797, -0.023019790649414062, -0.019616127014160156, -0.01621246337890625, -0.012808799743652344, -0.009405136108398438, -0.006001472473144531, -0.002597808837890625, 0.0008058547973632812, 0.0042095184326171875, 0.007613182067871094, 0.011016845703125, 0.014420509338378906, 0.017824172973632812, 0.02122783660888672, 0.024631500244140625, 0.02803516387939453, 0.03143882751464844, 0.034842491149902344, 0.03824615478515625, 0.041649818420410156, 0.04505348205566406, 0.04845714569091797, 0.051860809326171875, 0.05526447296142578, 0.05866813659667969, 0.062071800231933594, 0.0654754638671875, 0.0688791275024414, 0.07228279113769531, 0.07568645477294922, 0.07909011840820312, 0.08249378204345703, 0.08589744567871094, 0.08930110931396484, 0.09270477294921875, 0.09610843658447266, 0.09951210021972656, 0.10291576385498047, 0.10631942749023438, 0.10972309112548828, 0.11312675476074219, 0.1165304183959961, 0.11993408203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 6.0, 12.0, 20.0, 22.0, 18.0, 27.0, 22.0, 35.0, 33.0, 36.0, 35.0, 51.0, 48.0, 56.0, 54.0, 56.0, 66.0, 51.0, 50.0, 41.0, 45.0, 34.0, 33.0, 29.0, 28.0, 13.0, 19.0, 13.0, 7.0, 6.0, 4.0, 6.0, 2.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041107177734375, -0.03932332992553711, -0.03753948211669922, -0.03575563430786133, -0.03397178649902344, -0.03218793869018555, -0.030404090881347656, -0.028620243072509766, -0.026836395263671875, -0.025052547454833984, -0.023268699645996094, -0.021484851837158203, -0.019701004028320312, -0.017917156219482422, -0.01613330841064453, -0.01434946060180664, -0.01256561279296875, -0.01078176498413086, -0.008997917175292969, -0.007214069366455078, -0.0054302215576171875, -0.003646373748779297, -0.0018625259399414062, -7.867813110351562e-05, 0.001705169677734375, 0.0034890174865722656, 0.005272865295410156, 0.007056713104248047, 0.008840560913085938, 0.010624408721923828, 0.012408256530761719, 0.01419210433959961, 0.0159759521484375, 0.01775979995727539, 0.01954364776611328, 0.021327495574951172, 0.023111343383789062, 0.024895191192626953, 0.026679039001464844, 0.028462886810302734, 0.030246734619140625, 0.032030582427978516, 0.033814430236816406, 0.0355982780456543, 0.03738212585449219, 0.03916597366333008, 0.04094982147216797, 0.04273366928100586, 0.04451751708984375, 0.04630136489868164, 0.04808521270751953, 0.04986906051635742, 0.05165290832519531, 0.0534367561340332, 0.055220603942871094, 0.057004451751708984, 0.058788299560546875, 0.060572147369384766, 0.062355995178222656, 0.06413984298706055, 0.06592369079589844, 0.06770753860473633, 0.06949138641357422, 0.07127523422241211, 0.07305908203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 10.0, 12.0, 23.0, 28.0, 71.0, 95.0, 143.0, 291.0, 597.0, 1405.0, 5400.0, 113876.0, 4038819.0, 28109.0, 3329.0, 966.0, 483.0, 250.0, 135.0, 70.0, 45.0, 36.0, 22.0, 18.0, 11.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.693359375, -0.6719131469726562, -0.6504669189453125, -0.6290206909179688, -0.607574462890625, -0.5861282348632812, -0.5646820068359375, -0.5432357788085938, -0.52178955078125, -0.5003433227539062, -0.4788970947265625, -0.45745086669921875, -0.436004638671875, -0.41455841064453125, -0.3931121826171875, -0.37166595458984375, -0.3502197265625, -0.32877349853515625, -0.3073272705078125, -0.28588104248046875, -0.264434814453125, -0.24298858642578125, -0.2215423583984375, -0.20009613037109375, -0.17864990234375, -0.15720367431640625, -0.1357574462890625, -0.11431121826171875, -0.092864990234375, -0.07141876220703125, -0.0499725341796875, -0.02852630615234375, -0.007080078125, 0.01436614990234375, 0.0358123779296875, 0.05725860595703125, 0.078704833984375, 0.10015106201171875, 0.1215972900390625, 0.14304351806640625, 0.16448974609375, 0.18593597412109375, 0.2073822021484375, 0.22882843017578125, 0.250274658203125, 0.27172088623046875, 0.2931671142578125, 0.31461334228515625, 0.3360595703125, 0.35750579833984375, 0.3789520263671875, 0.40039825439453125, 0.421844482421875, 0.44329071044921875, 0.4647369384765625, 0.48618316650390625, 0.50762939453125, 0.5290756225585938, 0.5505218505859375, 0.5719680786132812, 0.593414306640625, 0.6148605346679688, 0.6363067626953125, 0.6577529907226562, 0.67919921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 4.0, 2.0, 6.0, 5.0, 4.0, 22.0, 18.0, 33.0, 43.0, 60.0, 123.0, 191.0, 302.0, 606.0, 907.0, 690.0, 383.0, 231.0, 161.0, 78.0, 67.0, 40.0, 28.0, 28.0, 10.0, 15.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3330078125, -0.3233795166015625, -0.313751220703125, -0.3041229248046875, -0.29449462890625, -0.2848663330078125, -0.275238037109375, -0.2656097412109375, -0.2559814453125, -0.2463531494140625, -0.236724853515625, -0.2270965576171875, -0.21746826171875, -0.2078399658203125, -0.198211669921875, -0.1885833740234375, -0.178955078125, -0.1693267822265625, -0.159698486328125, -0.1500701904296875, -0.14044189453125, -0.1308135986328125, -0.121185302734375, -0.1115570068359375, -0.1019287109375, -0.0923004150390625, -0.082672119140625, -0.0730438232421875, -0.06341552734375, -0.0537872314453125, -0.044158935546875, -0.0345306396484375, -0.02490234375, -0.0152740478515625, -0.005645751953125, 0.0039825439453125, 0.01361083984375, 0.0232391357421875, 0.032867431640625, 0.0424957275390625, 0.0521240234375, 0.0617523193359375, 0.071380615234375, 0.0810089111328125, 0.09063720703125, 0.1002655029296875, 0.109893798828125, 0.1195220947265625, 0.129150390625, 0.1387786865234375, 0.148406982421875, 0.1580352783203125, 0.16766357421875, 0.1772918701171875, 0.186920166015625, 0.1965484619140625, 0.2061767578125, 0.2158050537109375, 0.225433349609375, 0.2350616455078125, 0.24468994140625, 0.2543182373046875, 0.263946533203125, 0.2735748291015625, 0.283203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 14.0, 16.0, 40.0, 84.0, 153.0, 245.0, 208.0, 116.0, 65.0, 24.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.000347137451172, -4.860213756561279, -4.720080852508545, -4.579947471618652, -4.43981409072876, -4.299680709838867, -4.159547805786133, -4.01941442489624, -3.8792812824249268, -3.7391481399536133, -3.5990147590637207, -3.4588816165924072, -3.3187484741210938, -3.178615093231201, -3.0384819507598877, -2.898348808288574, -2.7582154273986816, -2.618082284927368, -2.4779489040374756, -2.337815761566162, -2.1976823806762695, -2.057549238204956, -1.9174160957336426, -1.7772828340530396, -1.6371495723724365, -1.4970163106918335, -1.3568830490112305, -1.216749906539917, -1.076616644859314, -0.9364833831787109, -0.7963501811027527, -0.6562169790267944, -0.5160841941833496, -0.37595096230506897, -0.23581773042678833, -0.09568449854850769, 0.04444873332977295, 0.18458199501037598, 0.32471519708633423, 0.4648483991622925, 0.6049816608428955, 0.7451149225234985, 0.8852481245994568, 1.025381326675415, 1.165514588356018, 1.305647850036621, 1.4457809925079346, 1.5859142541885376, 1.7260475158691406, 1.8661807775497437, 2.0063140392303467, 2.14644718170166, 2.2865805625915527, 2.426713705062866, 2.5668468475341797, 2.7069802284240723, 2.8471133708953857, 2.987246513366699, 3.127379894256592, 3.2675130367279053, 3.4076461791992188, 3.5477795600891113, 3.687912702560425, 3.8280458450317383, 3.968179225921631]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 15.0, 13.0, 17.0, 17.0, 24.0, 34.0, 28.0, 39.0, 44.0, 50.0, 51.0, 72.0, 55.0, 63.0, 70.0, 55.0, 48.0, 64.0, 37.0, 36.0, 38.0, 29.0, 23.0, 12.0, 16.0, 11.0, 4.0, 9.0, 3.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.582747459411621, -1.5295206308364868, -1.476293683052063, -1.4230668544769287, -1.3698399066925049, -1.3166130781173706, -1.2633862495422363, -1.2101593017578125, -1.1569323539733887, -1.1037055253982544, -1.0504785776138306, -0.9972517490386963, -0.9440248012542725, -0.8907979726791382, -0.8375710844993591, -0.7843441963195801, -0.7311173677444458, -0.6778904795646667, -0.6246635913848877, -0.5714367628097534, -0.5182098150253296, -0.4649829566478729, -0.41175609827041626, -0.3585292100906372, -0.30530232191085815, -0.2520754337310791, -0.19884856045246124, -0.14562168717384338, -0.09239479899406433, -0.03916791081428528, 0.014058947563171387, 0.06728583574295044, 0.12051272392272949, 0.17373961210250854, 0.2269664853811264, 0.28019335865974426, 0.3334202468395233, 0.38664713501930237, 0.43987399339675903, 0.4931008815765381, 0.5463277697563171, 0.5995546579360962, 0.6527815461158752, 0.7060084342956543, 0.7592352628707886, 0.8124622106552124, 0.8656890392303467, 0.9189159274101257, 0.9721428155899048, 1.025369644165039, 1.078596591949463, 1.1318234205245972, 1.185050368309021, 1.2382771968841553, 1.291504144668579, 1.3447309732437134, 1.3979578018188477, 1.451184630393982, 1.5044115781784058, 1.55763840675354, 1.6108653545379639, 1.6640921831130981, 1.7173190116882324, 1.7705459594726562, 1.82377290725708]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 14.0, 13.0, 25.0, 31.0, 55.0, 100.0, 207.0, 455.0, 1079.0, 3002.0, 10256.0, 56911.0, 710287.0, 230974.0, 25869.0, 5883.0, 1890.0, 797.0, 308.0, 178.0, 76.0, 51.0, 38.0, 15.0, 10.0, 9.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.2482147216796875, -0.239593505859375, -0.2309722900390625, -0.22235107421875, -0.2137298583984375, -0.205108642578125, -0.1964874267578125, -0.1878662109375, -0.1792449951171875, -0.170623779296875, -0.1620025634765625, -0.15338134765625, -0.1447601318359375, -0.136138916015625, -0.1275177001953125, -0.118896484375, -0.1102752685546875, -0.101654052734375, -0.0930328369140625, -0.08441162109375, -0.0757904052734375, -0.067169189453125, -0.0585479736328125, -0.0499267578125, -0.0413055419921875, -0.032684326171875, -0.0240631103515625, -0.01544189453125, -0.0068206787109375, 0.001800537109375, 0.0104217529296875, 0.01904296875, 0.0276641845703125, 0.036285400390625, 0.0449066162109375, 0.05352783203125, 0.0621490478515625, 0.070770263671875, 0.0793914794921875, 0.0880126953125, 0.0966339111328125, 0.105255126953125, 0.1138763427734375, 0.12249755859375, 0.1311187744140625, 0.139739990234375, 0.1483612060546875, 0.156982421875, 0.1656036376953125, 0.174224853515625, 0.1828460693359375, 0.19146728515625, 0.2000885009765625, 0.208709716796875, 0.2173309326171875, 0.2259521484375, 0.2345733642578125, 0.243194580078125, 0.2518157958984375, 0.26043701171875, 0.2690582275390625, 0.277679443359375, 0.2863006591796875, 0.294921875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 7.0, 13.0, 13.0, 17.0, 36.0, 29.0, 42.0, 42.0, 52.0, 56.0, 65.0, 68.0, 69.0, 73.0, 67.0, 68.0, 57.0, 50.0, 31.0, 29.0, 25.0, 19.0, 9.0, 14.0, 8.0, 7.0, 7.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09698677062988281, -0.09357070922851562, -0.09015464782714844, -0.08673858642578125, -0.08332252502441406, -0.07990646362304688, -0.07649040222167969, -0.0730743408203125, -0.06965827941894531, -0.06624221801757812, -0.06282615661621094, -0.05941009521484375, -0.05599403381347656, -0.052577972412109375, -0.04916191101074219, -0.045745849609375, -0.04232978820800781, -0.038913726806640625, -0.03549766540527344, -0.03208160400390625, -0.028665542602539062, -0.025249481201171875, -0.021833419799804688, -0.0184173583984375, -0.015001296997070312, -0.011585235595703125, -0.008169174194335938, -0.00475311279296875, -0.0013370513916015625, 0.002079010009765625, 0.0054950714111328125, 0.0089111328125, 0.012327194213867188, 0.015743255615234375, 0.019159317016601562, 0.02257537841796875, 0.025991439819335938, 0.029407501220703125, 0.03282356262207031, 0.0362396240234375, 0.03965568542480469, 0.043071746826171875, 0.04648780822753906, 0.04990386962890625, 0.05331993103027344, 0.056735992431640625, 0.06015205383300781, 0.063568115234375, 0.06698417663574219, 0.07040023803710938, 0.07381629943847656, 0.07723236083984375, 0.08064842224121094, 0.08406448364257812, 0.08748054504394531, 0.0908966064453125, 0.09431266784667969, 0.09772872924804688, 0.10114479064941406, 0.10456085205078125, 0.10797691345214844, 0.11139297485351562, 0.11480903625488281, 0.11822509765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 9.0, 7.0, 20.0, 21.0, 25.0, 36.0, 44.0, 65.0, 109.0, 165.0, 282.0, 526.0, 1148.0, 3053.0, 12753.0, 115223.0, 874233.0, 31555.0, 5627.0, 1868.0, 757.0, 388.0, 215.0, 98.0, 83.0, 51.0, 38.0, 33.0, 26.0, 13.0, 20.0, 16.0, 6.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23249053955078125, -0.2242584228515625, -0.21602630615234375, -0.207794189453125, -0.19956207275390625, -0.1913299560546875, -0.18309783935546875, -0.17486572265625, -0.16663360595703125, -0.1584014892578125, -0.15016937255859375, -0.141937255859375, -0.13370513916015625, -0.1254730224609375, -0.11724090576171875, -0.1090087890625, -0.10077667236328125, -0.0925445556640625, -0.08431243896484375, -0.076080322265625, -0.06784820556640625, -0.0596160888671875, -0.05138397216796875, -0.04315185546875, -0.03491973876953125, -0.0266876220703125, -0.01845550537109375, -0.010223388671875, -0.00199127197265625, 0.0062408447265625, 0.01447296142578125, 0.022705078125, 0.03093719482421875, 0.0391693115234375, 0.04740142822265625, 0.055633544921875, 0.06386566162109375, 0.0720977783203125, 0.08032989501953125, 0.08856201171875, 0.09679412841796875, 0.1050262451171875, 0.11325836181640625, 0.121490478515625, 0.12972259521484375, 0.1379547119140625, 0.14618682861328125, 0.1544189453125, 0.16265106201171875, 0.1708831787109375, 0.17911529541015625, 0.187347412109375, 0.19557952880859375, 0.2038116455078125, 0.21204376220703125, 0.22027587890625, 0.22850799560546875, 0.2367401123046875, 0.24497222900390625, 0.253204345703125, 0.26143646240234375, 0.2696685791015625, 0.27790069580078125, 0.2861328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 5.0, 11.0, 13.0, 4.0, 17.0, 14.0, 27.0, 24.0, 22.0, 27.0, 33.0, 62.0, 84.0, 101.0, 98.0, 89.0, 66.0, 59.0, 39.0, 36.0, 36.0, 31.0, 17.0, 12.0, 16.0, 12.0, 15.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.445068359375, -0.43184661865234375, -0.4186248779296875, -0.40540313720703125, -0.392181396484375, -0.37895965576171875, -0.3657379150390625, -0.35251617431640625, -0.33929443359375, -0.32607269287109375, -0.3128509521484375, -0.29962921142578125, -0.286407470703125, -0.27318572998046875, -0.2599639892578125, -0.24674224853515625, -0.2335205078125, -0.22029876708984375, -0.2070770263671875, -0.19385528564453125, -0.180633544921875, -0.16741180419921875, -0.1541900634765625, -0.14096832275390625, -0.12774658203125, -0.11452484130859375, -0.1013031005859375, -0.08808135986328125, -0.074859619140625, -0.06163787841796875, -0.0484161376953125, -0.03519439697265625, -0.02197265625, -0.00875091552734375, 0.0044708251953125, 0.01769256591796875, 0.030914306640625, 0.04413604736328125, 0.0573577880859375, 0.07057952880859375, 0.08380126953125, 0.09702301025390625, 0.1102447509765625, 0.12346649169921875, 0.136688232421875, 0.14990997314453125, 0.1631317138671875, 0.17635345458984375, 0.1895751953125, 0.20279693603515625, 0.2160186767578125, 0.22924041748046875, 0.242462158203125, 0.25568389892578125, 0.2689056396484375, 0.28212738037109375, 0.29534912109375, 0.30857086181640625, 0.3217926025390625, 0.33501434326171875, 0.348236083984375, 0.36145782470703125, 0.3746795654296875, 0.38790130615234375, 0.401123046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 15.0, 19.0, 30.0, 32.0, 51.0, 85.0, 157.0, 336.0, 847.0, 2619.0, 12464.0, 202634.0, 807606.0, 16792.0, 3059.0, 979.0, 394.0, 162.0, 82.0, 60.0, 38.0, 25.0, 19.0, 11.0, 9.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07568359375, -0.07324790954589844, -0.07081222534179688, -0.06837654113769531, -0.06594085693359375, -0.06350517272949219, -0.061069488525390625, -0.05863380432128906, -0.0561981201171875, -0.05376243591308594, -0.051326751708984375, -0.04889106750488281, -0.04645538330078125, -0.04401969909667969, -0.041584014892578125, -0.03914833068847656, -0.036712646484375, -0.03427696228027344, -0.031841278076171875, -0.029405593872070312, -0.02696990966796875, -0.024534225463867188, -0.022098541259765625, -0.019662857055664062, -0.0172271728515625, -0.014791488647460938, -0.012355804443359375, -0.009920120239257812, -0.00748443603515625, -0.0050487518310546875, -0.002613067626953125, -0.0001773834228515625, 0.00225830078125, 0.0046939849853515625, 0.007129669189453125, 0.009565353393554688, 0.01200103759765625, 0.014436721801757812, 0.016872406005859375, 0.019308090209960938, 0.0217437744140625, 0.024179458618164062, 0.026615142822265625, 0.029050827026367188, 0.03148651123046875, 0.03392219543457031, 0.036357879638671875, 0.03879356384277344, 0.041229248046875, 0.04366493225097656, 0.046100616455078125, 0.04853630065917969, 0.05097198486328125, 0.05340766906738281, 0.055843353271484375, 0.05827903747558594, 0.0607147216796875, 0.06315040588378906, 0.06558609008789062, 0.06802177429199219, 0.07045745849609375, 0.07289314270019531, 0.07532882690429688, 0.07776451110839844, 0.0802001953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 8.0, 7.0, 5.0, 14.0, 16.0, 28.0, 30.0, 36.0, 62.0, 64.0, 117.0, 131.0, 123.0, 107.0, 64.0, 52.0, 24.0, 20.0, 23.0, 12.0, 12.0, 9.0, 7.0, 6.0, 7.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.2989697754383087e-05, -2.2197142243385315e-05, -2.1404586732387543e-05, -2.061203122138977e-05, -1.9819475710391998e-05, -1.9026920199394226e-05, -1.8234364688396454e-05, -1.744180917739868e-05, -1.664925366640091e-05, -1.5856698155403137e-05, -1.5064142644405365e-05, -1.4271587133407593e-05, -1.347903162240982e-05, -1.2686476111412048e-05, -1.1893920600414276e-05, -1.1101365089416504e-05, -1.0308809578418732e-05, -9.51625406742096e-06, -8.723698556423187e-06, -7.931143045425415e-06, -7.138587534427643e-06, -6.346032023429871e-06, -5.553476512432098e-06, -4.760921001434326e-06, -3.968365490436554e-06, -3.1758099794387817e-06, -2.3832544684410095e-06, -1.5906989574432373e-06, -7.981434464454651e-07, -5.587935447692871e-09, 7.869675755500793e-07, 1.5795230865478516e-06, 2.3720785975456238e-06, 3.164634108543396e-06, 3.957189619541168e-06, 4.7497451305389404e-06, 5.542300641536713e-06, 6.334856152534485e-06, 7.127411663532257e-06, 7.91996717453003e-06, 8.712522685527802e-06, 9.505078196525574e-06, 1.0297633707523346e-05, 1.1090189218521118e-05, 1.188274472951889e-05, 1.2675300240516663e-05, 1.3467855751514435e-05, 1.4260411262512207e-05, 1.505296677350998e-05, 1.584552228450775e-05, 1.6638077795505524e-05, 1.7430633306503296e-05, 1.8223188817501068e-05, 1.901574432849884e-05, 1.9808299839496613e-05, 2.0600855350494385e-05, 2.1393410861492157e-05, 2.218596637248993e-05, 2.29785218834877e-05, 2.3771077394485474e-05, 2.4563632905483246e-05, 2.5356188416481018e-05, 2.614874392747879e-05, 2.6941299438476562e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 5.0, 14.0, 16.0, 31.0, 40.0, 57.0, 110.0, 155.0, 301.0, 545.0, 1085.0, 2253.0, 5781.0, 16865.0, 72680.0, 816033.0, 99525.0, 20812.0, 6819.0, 2678.0, 1305.0, 583.0, 360.0, 178.0, 109.0, 75.0, 44.0, 24.0, 16.0, 15.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0303955078125, -0.029106616973876953, -0.027817726135253906, -0.02652883529663086, -0.025239944458007812, -0.023951053619384766, -0.02266216278076172, -0.021373271942138672, -0.020084381103515625, -0.018795490264892578, -0.01750659942626953, -0.016217708587646484, -0.014928817749023438, -0.01363992691040039, -0.012351036071777344, -0.011062145233154297, -0.00977325439453125, -0.008484363555908203, -0.007195472717285156, -0.005906581878662109, -0.0046176910400390625, -0.0033288002014160156, -0.0020399093627929688, -0.0007510185241699219, 0.000537872314453125, 0.0018267631530761719, 0.0031156539916992188, 0.004404544830322266, 0.0056934356689453125, 0.006982326507568359, 0.008271217346191406, 0.009560108184814453, 0.0108489990234375, 0.012137889862060547, 0.013426780700683594, 0.01471567153930664, 0.016004562377929688, 0.017293453216552734, 0.01858234405517578, 0.019871234893798828, 0.021160125732421875, 0.022449016571044922, 0.02373790740966797, 0.025026798248291016, 0.026315689086914062, 0.02760457992553711, 0.028893470764160156, 0.030182361602783203, 0.03147125244140625, 0.0327601432800293, 0.034049034118652344, 0.03533792495727539, 0.03662681579589844, 0.037915706634521484, 0.03920459747314453, 0.04049348831176758, 0.041782379150390625, 0.04307126998901367, 0.04436016082763672, 0.045649051666259766, 0.04693794250488281, 0.04822683334350586, 0.049515724182128906, 0.05080461502075195, 0.052093505859375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 0.0, 7.0, 5.0, 9.0, 24.0, 20.0, 31.0, 42.0, 49.0, 98.0, 137.0, 133.0, 138.0, 99.0, 51.0, 34.0, 26.0, 26.0, 22.0, 21.0, 11.0, 6.0, 5.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041107177734375, -0.03943014144897461, -0.03775310516357422, -0.03607606887817383, -0.03439903259277344, -0.03272199630737305, -0.031044960021972656, -0.029367923736572266, -0.027690887451171875, -0.026013851165771484, -0.024336814880371094, -0.022659778594970703, -0.020982742309570312, -0.019305706024169922, -0.01762866973876953, -0.01595163345336914, -0.01427459716796875, -0.01259756088256836, -0.010920524597167969, -0.009243488311767578, -0.0075664520263671875, -0.005889415740966797, -0.004212379455566406, -0.0025353431701660156, -0.000858306884765625, 0.0008187294006347656, 0.0024957656860351562, 0.004172801971435547, 0.0058498382568359375, 0.007526874542236328, 0.009203910827636719, 0.01088094711303711, 0.0125579833984375, 0.01423501968383789, 0.01591205596923828, 0.017589092254638672, 0.019266128540039062, 0.020943164825439453, 0.022620201110839844, 0.024297237396240234, 0.025974273681640625, 0.027651309967041016, 0.029328346252441406, 0.031005382537841797, 0.03268241882324219, 0.03435945510864258, 0.03603649139404297, 0.03771352767944336, 0.03939056396484375, 0.04106760025024414, 0.04274463653564453, 0.04442167282104492, 0.04609870910644531, 0.0477757453918457, 0.049452781677246094, 0.051129817962646484, 0.052806854248046875, 0.054483890533447266, 0.056160926818847656, 0.05783796310424805, 0.05951499938964844, 0.06119203567504883, 0.06286907196044922, 0.06454610824584961, 0.06622314453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 13.0, 27.0, 63.0, 149.0, 598.0, 98.0, 31.0, 13.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.519035816192627, -3.4270524978637695, -3.335068941116333, -3.2430856227874756, -3.151102304458618, -3.0591187477111816, -2.967135429382324, -2.875152111053467, -2.7831687927246094, -2.691185474395752, -2.5992019176483154, -2.507218599319458, -2.4152352809906006, -2.323251724243164, -2.2312684059143066, -2.139285087585449, -2.0473015308380127, -1.9553180932998657, -1.8633347749710083, -1.7713513374328613, -1.679368019104004, -1.587384581565857, -1.49540114402771, -1.4034178256988525, -1.3114343881607056, -1.2194509506225586, -1.1274676322937012, -1.0354841947555542, -0.943500816822052, -0.8515174388885498, -0.7595340013504028, -0.6675506234169006, -0.5755672454833984, -0.48358386754989624, -0.39160045981407166, -0.29961705207824707, -0.20763367414474487, -0.11565029621124268, -0.023666858673095703, 0.0683165192604065, 0.1602998971939087, 0.2522832751274109, 0.3442666828632355, 0.43625009059906006, 0.5282334685325623, 0.6202168464660645, 0.7122002840042114, 0.8041836619377136, 0.8961670398712158, 0.988150417804718, 1.0801337957382202, 1.1721172332763672, 1.2641005516052246, 1.3560839891433716, 1.4480674266815186, 1.540050745010376, 1.632034182548523, 1.72401762008667, 1.8160009384155273, 1.9079843759536743, 1.9999678134918213, 2.0919511318206787, 2.1839346885681152, 2.2759180068969727, 2.36790132522583]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 7.0, 10.0, 11.0, 8.0, 15.0, 13.0, 17.0, 22.0, 11.0, 30.0, 30.0, 25.0, 26.0, 78.0, 335.0, 79.0, 31.0, 37.0, 26.0, 28.0, 21.0, 12.0, 14.0, 23.0, 13.0, 12.0, 10.0, 5.0, 5.0, 4.0, 3.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8351212739944458, -0.804752767086029, -0.7743842601776123, -0.7440156936645508, -0.713647186756134, -0.6832786798477173, -0.6529101133346558, -0.622541606426239, -0.5921730995178223, -0.5618045926094055, -0.5314360857009888, -0.5010675191879272, -0.4706990122795105, -0.44033050537109375, -0.4099619686603546, -0.3795934319496155, -0.34922492504119873, -0.318856418132782, -0.28848788142204285, -0.2581193447113037, -0.22775083780288696, -0.19738231599330902, -0.16701379418373108, -0.13664527237415314, -0.1062767505645752, -0.07590822875499725, -0.04553970694541931, -0.01517118513584137, 0.015197336673736572, 0.045565858483314514, 0.07593438029289246, 0.1063029021024704, 0.13667142391204834, 0.16703994572162628, 0.19740846753120422, 0.22777698934078217, 0.2581455111503601, 0.28851401805877686, 0.318882554769516, 0.3492510914802551, 0.3796195983886719, 0.4099881052970886, 0.44035664200782776, 0.4707251787185669, 0.5010936856269836, 0.5314621925354004, 0.5618307590484619, 0.5921992659568787, 0.6225677728652954, 0.6529362797737122, 0.6833047866821289, 0.7136733531951904, 0.7440418601036072, 0.7744103670120239, 0.8047789335250854, 0.8351474404335022, 0.865515947341919, 0.8958844542503357, 0.9262529611587524, 0.956621527671814, 0.9869900345802307, 1.0173585414886475, 1.047727108001709, 1.078095555305481, 1.1084641218185425]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 6.0, 8.0, 13.0, 14.0, 18.0, 18.0, 25.0, 28.0, 51.0, 61.0, 160.0, 279.0, 89.0, 42.0, 43.0, 34.0, 28.0, 18.0, 25.0, 7.0, 9.0, 8.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12310791015625, -0.11889171600341797, -0.11467552185058594, -0.1104593276977539, -0.10624313354492188, -0.10202693939208984, -0.09781074523925781, -0.09359455108642578, -0.08937835693359375, -0.08516216278076172, -0.08094596862792969, -0.07672977447509766, -0.07251358032226562, -0.0682973861694336, -0.06408119201660156, -0.05986499786376953, -0.0556488037109375, -0.05143260955810547, -0.04721641540527344, -0.043000221252441406, -0.038784027099609375, -0.034567832946777344, -0.030351638793945312, -0.02613544464111328, -0.02191925048828125, -0.01770305633544922, -0.013486862182617188, -0.009270668029785156, -0.005054473876953125, -0.0008382797241210938, 0.0033779144287109375, 0.007594108581542969, 0.011810302734375, 0.01602649688720703, 0.020242691040039062, 0.024458885192871094, 0.028675079345703125, 0.032891273498535156, 0.03710746765136719, 0.04132366180419922, 0.04553985595703125, 0.04975605010986328, 0.05397224426269531, 0.058188438415527344, 0.062404632568359375, 0.0666208267211914, 0.07083702087402344, 0.07505321502685547, 0.0792694091796875, 0.08348560333251953, 0.08770179748535156, 0.0919179916381836, 0.09613418579101562, 0.10035037994384766, 0.10456657409667969, 0.10878276824951172, 0.11299896240234375, 0.11721515655517578, 0.12143135070800781, 0.12564754486083984, 0.12986373901367188, 0.1340799331665039, 0.13829612731933594, 0.14251232147216797, 0.146728515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 5.0, 12.0, 24.0, 32.0, 51.0, 106.0, 304.0, 954.0, 5300.0, 8338845.0, 39332.0, 2596.0, 589.0, 227.0, 80.0, 43.0, 29.0, 8.0, 8.0, 2.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73725426197052, -1.6924943923950195, -1.6477344036102295, -1.602974534034729, -1.5582146644592285, -1.5134546756744385, -1.468694806098938, -1.4239349365234375, -1.3791749477386475, -1.334415078163147, -1.289655089378357, -1.2448952198028564, -1.2001352310180664, -1.155375361442566, -1.1106154918670654, -1.0658555030822754, -1.021095633506775, -0.9763357043266296, -0.9315757751464844, -0.8868159055709839, -0.8420559763908386, -0.7972960472106934, -0.7525361776351929, -0.7077762484550476, -0.6630163192749023, -0.6182563900947571, -0.5734964609146118, -0.5287365913391113, -0.48397666215896606, -0.4392167329788208, -0.3944568336009979, -0.34969693422317505, -0.3049370050430298, -0.2601770758628845, -0.21541717648506165, -0.17065726220607758, -0.1258973479270935, -0.08113743364810944, -0.036377519369125366, 0.00838238000869751, 0.05314230918884277, 0.09790222346782684, 0.1426621377468109, 0.18742205202579498, 0.23218196630477905, 0.2769418954849243, 0.3217017948627472, 0.36646169424057007, 0.41122162342071533, 0.4559815526008606, 0.5007414817810059, 0.5455013513565063, 0.5902612805366516, 0.6350212097167969, 0.6797810792922974, 0.7245410084724426, 0.7693009376525879, 0.8140608668327332, 0.8588207960128784, 0.9035806655883789, 0.9483405947685242, 0.9931005239486694, 1.03786039352417, 1.08262038230896, 1.1273802518844604]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 10.0, 5.0, 3.0, 7.0, 2.0, 9.0, 4.0, 1.0, 11.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6668081879615784, -0.6346549987792969, -0.6025018692016602, -0.5703486800193787, -0.5381954908370972, -0.5060423612594604, -0.47388917207717896, -0.44173598289489746, -0.40958282351493835, -0.37742966413497925, -0.34527647495269775, -0.31312331557273865, -0.28097015619277954, -0.24881696701049805, -0.21666380763053894, -0.18451063334941864, -0.15235745906829834, -0.12020428478717804, -0.08805111795663834, -0.05589795112609863, -0.023744776844978333, 0.008408397436141968, 0.040561556816101074, 0.07271473109722137, 0.10486790537834167, 0.13702107965946198, 0.16917425394058228, 0.20132741332054138, 0.23348058760166168, 0.265633761882782, 0.2977869212627411, 0.3299400806427002, 0.36209332942962646, 0.39424648880958557, 0.42639967799186707, 0.45855283737182617, 0.49070602655410767, 0.5228592157363892, 0.5550123453140259, 0.5871655344963074, 0.6193187236785889, 0.6514719128608704, 0.6836250424385071, 0.7157782316207886, 0.7479314208030701, 0.7800846099853516, 0.8122377395629883, 0.8443909287452698, 0.8765440583229065, 0.908697247505188, 0.9408503770828247, 0.9730035662651062, 1.0051567554473877, 1.0373098850250244, 1.0694630146026611, 1.1016162633895874, 1.1337693929672241, 1.1659225225448608, 1.198075771331787, 1.2302289009094238, 1.2623820304870605, 1.2945352792739868, 1.3266884088516235, 1.3588415384292603, 1.3909947872161865]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 11.0, 8.0, 21.0, 36.0, 50.0, 76.0, 116.0, 170.0, 359.0, 727.0, 1519.0, 3870.0, 12353.0, 53016.0, 254328.0, 156532.0, 29080.0, 7201.0, 2478.0, 1041.0, 530.0, 271.0, 149.0, 96.0, 57.0, 41.0, 36.0, 20.0, 14.0, 1.0, 13.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.046875, -1.0105438232421875, -0.974212646484375, -0.9378814697265625, -0.90155029296875, -0.8652191162109375, -0.828887939453125, -0.7925567626953125, -0.7562255859375, -0.7198944091796875, -0.683563232421875, -0.6472320556640625, -0.61090087890625, -0.5745697021484375, -0.538238525390625, -0.5019073486328125, -0.465576171875, -0.4292449951171875, -0.392913818359375, -0.3565826416015625, -0.32025146484375, -0.2839202880859375, -0.247589111328125, -0.2112579345703125, -0.1749267578125, -0.1385955810546875, -0.102264404296875, -0.0659332275390625, -0.02960205078125, 0.0067291259765625, 0.043060302734375, 0.0793914794921875, 0.11572265625, 0.1520538330078125, 0.188385009765625, 0.2247161865234375, 0.26104736328125, 0.2973785400390625, 0.333709716796875, 0.3700408935546875, 0.4063720703125, 0.4427032470703125, 0.479034423828125, 0.5153656005859375, 0.55169677734375, 0.5880279541015625, 0.624359130859375, 0.6606903076171875, 0.697021484375, 0.7333526611328125, 0.769683837890625, 0.8060150146484375, 0.84234619140625, 0.8786773681640625, 0.915008544921875, 0.9513397216796875, 0.9876708984375, 1.0240020751953125, 1.060333251953125, 1.0966644287109375, 1.13299560546875, 1.1693267822265625, 1.205657958984375, 1.2419891357421875, 1.2783203125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 10.0, 5.0, 15.0, 16.0, 22.0, 28.0, 22.0, 46.0, 63.0, 85.0, 87.0, 94.0, 118.0, 93.0, 72.0, 57.0, 57.0, 35.0, 23.0, 20.0, 14.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1571044921875, -0.15263748168945312, -0.14817047119140625, -0.14370346069335938, -0.1392364501953125, -0.13476943969726562, -0.13030242919921875, -0.12583541870117188, -0.121368408203125, -0.11690139770507812, -0.11243438720703125, -0.10796737670898438, -0.1035003662109375, -0.09903335571289062, -0.09456634521484375, -0.09009933471679688, -0.08563232421875, -0.08116531372070312, -0.07669830322265625, -0.07223129272460938, -0.0677642822265625, -0.06329727172851562, -0.05883026123046875, -0.054363250732421875, -0.049896240234375, -0.045429229736328125, -0.04096221923828125, -0.036495208740234375, -0.0320281982421875, -0.027561187744140625, -0.02309417724609375, -0.018627166748046875, -0.01416015625, -0.009693145751953125, -0.00522613525390625, -0.000759124755859375, 0.0037078857421875, 0.008174896240234375, 0.01264190673828125, 0.017108917236328125, 0.021575927734375, 0.026042938232421875, 0.03050994873046875, 0.034976959228515625, 0.0394439697265625, 0.043910980224609375, 0.04837799072265625, 0.052845001220703125, 0.05731201171875, 0.061779022216796875, 0.06624603271484375, 0.07071304321289062, 0.0751800537109375, 0.07964706420898438, 0.08411407470703125, 0.08858108520507812, 0.093048095703125, 0.09751510620117188, 0.10198211669921875, 0.10644912719726562, 0.1109161376953125, 0.11538314819335938, 0.11985015869140625, 0.12431716918945312, 0.1287841796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 6.0, 9.0, 19.0, 47.0, 117.0, 154.0, 63.0, 28.0, 11.0, 11.0, 6.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.457155227661133, -2.3986170291900635, -2.3400790691375732, -2.281540870666504, -2.2230029106140137, -2.1644647121429443, -2.105926513671875, -2.0473885536193848, -1.9888503551483154, -1.9303122758865356, -1.8717741966247559, -1.8132359981536865, -1.7546979188919067, -1.696159839630127, -1.6376217603683472, -1.5790836811065674, -1.520545482635498, -1.4620074033737183, -1.4034693241119385, -1.3449311256408691, -1.2863930463790894, -1.2278549671173096, -1.1693168878555298, -1.11077880859375, -1.0522407293319702, -0.9937026500701904, -0.9351645112037659, -0.8766264319419861, -0.8180882930755615, -0.7595502138137817, -0.701012134552002, -0.6424739956855774, -0.5839358568191528, -0.525397777557373, -0.4668596386909485, -0.4083215594291687, -0.34978342056274414, -0.29124534130096436, -0.23270723223686218, -0.17416912317276, -0.11563101410865784, -0.05709290876984596, 0.0014451965689659119, 0.05998329818248749, 0.11852140724658966, 0.17705950140953064, 0.2355976104736328, 0.294135719537735, 0.35267382860183716, 0.41121193766593933, 0.4697500467300415, 0.5282881259918213, 0.5868262648582458, 0.6453643441200256, 0.7039024829864502, 0.76244056224823, 0.8209786415100098, 0.8795167207717896, 0.9380548596382141, 0.9965929388999939, 1.0551310777664185, 1.1136691570281982, 1.172207236289978, 1.2307453155517578, 1.2892835140228271]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 9.0, 8.0, 17.0, 47.0, 95.0, 129.0, 70.0, 30.0, 9.0, 5.0, 7.0, 7.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7965117692947388, -0.773281455039978, -0.7500510811805725, -0.7268207669258118, -0.7035903930664062, -0.6803600788116455, -0.6571297645568848, -0.633899450302124, -0.6106690764427185, -0.5874387621879578, -0.5642083883285522, -0.5409780740737915, -0.5177477598190308, -0.49451738595962524, -0.4712870717048645, -0.44805672764778137, -0.42482638359069824, -0.4015960395336151, -0.378365695476532, -0.35513538122177124, -0.3319050371646881, -0.308674693107605, -0.28544437885284424, -0.2622140347957611, -0.23898369073867798, -0.21575334668159485, -0.1925230175256729, -0.16929268836975098, -0.14606234431266785, -0.12283200770616531, -0.09960167109966278, -0.07637134194374084, -0.053140997886657715, -0.029910661280155182, -0.006680324673652649, 0.016550011932849884, 0.03978034853935242, 0.06301068514585495, 0.08624102175235748, 0.10947135090827942, 0.13270169496536255, 0.15593203902244568, 0.17916236817836761, 0.20239269733428955, 0.22562304139137268, 0.2488533854484558, 0.27208369970321655, 0.2953140437602997, 0.3185443878173828, 0.34177473187446594, 0.3650050759315491, 0.3882353901863098, 0.41146573424339294, 0.4346960783004761, 0.4579263925552368, 0.48115673661231995, 0.5043870806694031, 0.5276173949241638, 0.5508477687835693, 0.5740780830383301, 0.5973083972930908, 0.6205387711524963, 0.6437690854072571, 0.6669994592666626, 0.6902297735214233]}, "_wandb": {"runtime": 3622}} \ No newline at end of file