diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.5258, "train/learning_rate": 5.068289786223278e-06, "train/epoch": 16.82, "train/global_step": 15000, "_runtime": 98095, "_timestamp": 1646759334, "_step": 15009, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 12.0, 29.0, 30160.0, 218.0, 32.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-204.0, -200.2578125, -196.515625, -192.7734375, -189.03125, -185.2890625, -181.546875, -177.8046875, -174.0625, -170.3203125, -166.578125, -162.8359375, -159.09375, -155.3515625, -151.609375, -147.8671875, -144.125, -140.3828125, -136.640625, -132.8984375, -129.15625, -125.4140625, -121.671875, -117.9296875, -114.1875, -110.4453125, -106.703125, -102.9609375, -99.21875, -95.4765625, -91.734375, -87.9921875, -84.25, -80.5078125, -76.765625, -73.0234375, -69.28125, -65.5390625, -61.796875, -58.0546875, -54.3125, -50.5703125, -46.828125, -43.0859375, -39.34375, -35.6015625, -31.859375, -28.1171875, -24.375, -20.6328125, -16.890625, -13.1484375, -9.40625, -5.6640625, -1.921875, 1.8203125, 5.5625, 9.3046875, 13.046875, 16.7890625, 20.53125, 24.2734375, 28.015625, 31.7578125, 35.5]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 8.0, 10.0, 12.0, 7.0, 8.0, 18.0, 15.0, 10.0, 11.0, 15.0, 16.0, 24.0, 21.0, 27.0, 27.0, 22.0, 39.0, 34.0, 47.0, 43.0, 44.0, 41.0, 33.0, 47.0, 33.0, 55.0, 32.0, 37.0, 31.0, 20.0, 19.0, 34.0, 27.0, 18.0, 12.0, 16.0, 15.0, 9.0, 12.0, 12.0, 13.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-58.242820739746094, -56.97196960449219, -55.70111846923828, -54.430267333984375, -53.15941619873047, -51.88856506347656, -50.617713928222656, -49.346866607666016, -48.07601547241211, -46.8051643371582, -45.5343132019043, -44.26346206665039, -42.992610931396484, -41.721763610839844, -40.45091247558594, -39.18006134033203, -37.909210205078125, -36.63835906982422, -35.36750793457031, -34.096656799316406, -32.8258056640625, -31.554956436157227, -30.28410530090332, -29.013256072998047, -27.742401123046875, -26.47154998779297, -25.200698852539062, -23.929847717285156, -22.658998489379883, -21.388147354125977, -20.11729621887207, -18.846446990966797, -17.575593948364258, -16.30474281311035, -15.033892631530762, -13.763041496276855, -12.492191314697266, -11.22134017944336, -9.950489044189453, -8.679638862609863, -7.408787727355957, -6.137937068939209, -4.867086410522461, -3.5962352752685547, -2.3253846168518066, -1.0545339584350586, 0.21631717681884766, 1.4871673583984375, 2.7580184936523438, 4.028869152069092, 5.29971981048584, 6.570570945739746, 7.841421604156494, 9.112272262573242, 10.383123397827148, 11.653973579406738, 12.924824714660645, 14.19567584991455, 15.46652603149414, 16.737377166748047, 18.008228302001953, 19.27907943725586, 20.549930572509766, 21.82077980041504, 23.091630935668945]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 10.0, 9.0, 11.0, 10.0, 15.0, 9.0, 24.0, 16.0, 25.0, 21.0, 31.0, 25.0, 35.0, 31.0, 27.0, 39.0, 39.0, 35.0, 41.0, 40.0, 42.0, 47.0, 37.0, 38.0, 31.0, 36.0, 35.0, 36.0, 43.0, 30.0, 19.0, 14.0, 23.0, 12.0, 14.0, 14.0, 12.0, 8.0, 7.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.22478103637695, -37.84811019897461, -36.471435546875, -35.094764709472656, -33.71809387207031, -32.3414192199707, -30.96474838256836, -29.588075637817383, -28.211402893066406, -26.83473014831543, -25.458059310913086, -24.08138656616211, -22.704713821411133, -21.328041076660156, -19.951370239257812, -18.574697494506836, -17.198026657104492, -15.821354866027832, -14.444682121276855, -13.068010330200195, -11.691337585449219, -10.314665794372559, -8.937994003295898, -7.561321258544922, -6.184649467468262, -4.807977199554443, -3.431305170059204, -2.054633140563965, -0.6779608726501465, 0.6987113952636719, 2.075383186340332, 3.4520559310913086, 4.828727722167969, 6.205399990081787, 7.5820722579956055, 8.958744049072266, 10.335416793823242, 11.712088584899902, 13.088760375976562, 14.465433120727539, 15.8421049118042, 17.21877670288086, 18.595449447631836, 19.972122192382812, 21.348793029785156, 22.725465774536133, 24.10213851928711, 25.478809356689453, 26.85548210144043, 28.232154846191406, 29.60882568359375, 30.985498428344727, 32.3621711730957, 33.73884201049805, 35.115516662597656, 36.4921875, 37.868858337402344, 39.24552917480469, 40.6222038269043, 41.99887466430664, 43.375545501708984, 44.752220153808594, 46.12889099121094, 47.50556182861328, 48.88223648071289]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 25.0, 25.0, 35.0, 59.0, 69.0, 131.0, 198.0, 339.0, 505.0, 848.0, 1367.0, 2121.0, 3390.0, 5243.0, 7777.0, 11615.0, 17170.0, 24596.0, 34286.0, 46270.0, 60108.0, 75241.0, 89448.0, 101241.0, 126627.0, 95908.0, 84113.0, 69515.0, 55165.0, 40889.0, 30012.0, 21089.0, 14654.0, 9856.0, 6604.0, 4347.0, 2808.0, 1772.0, 1187.0, 738.0, 422.0, 270.0, 170.0, 120.0, 62.0, 46.0, 27.0, 17.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0], "bins": [-161.375, -156.669921875, -151.96484375, -147.259765625, -142.5546875, -137.849609375, -133.14453125, -128.439453125, -123.734375, -119.029296875, -114.32421875, -109.619140625, -104.9140625, -100.208984375, -95.50390625, -90.798828125, -86.09375, -81.388671875, -76.68359375, -71.978515625, -67.2734375, -62.568359375, -57.86328125, -53.158203125, -48.453125, -43.748046875, -39.04296875, -34.337890625, -29.6328125, -24.927734375, -20.22265625, -15.517578125, -10.8125, -6.107421875, -1.40234375, 3.302734375, 8.0078125, 12.712890625, 17.41796875, 22.123046875, 26.828125, 31.533203125, 36.23828125, 40.943359375, 45.6484375, 50.353515625, 55.05859375, 59.763671875, 64.46875, 69.173828125, 73.87890625, 78.583984375, 83.2890625, 87.994140625, 92.69921875, 97.404296875, 102.109375, 106.814453125, 111.51953125, 116.224609375, 120.9296875, 125.634765625, 130.33984375, 135.044921875, 139.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 7.0, 5.0, 10.0, 7.0, 8.0, 10.0, 10.0, 9.0, 10.0, 14.0, 22.0, 22.0, 18.0, 25.0, 21.0, 29.0, 35.0, 39.0, 37.0, 29.0, 45.0, 36.0, 50.0, 50.0, 35.0, 32.0, 34.0, 31.0, 35.0, 33.0, 25.0, 17.0, 30.0, 17.0, 23.0, 20.0, 11.0, 15.0, 17.0, 17.0, 7.0, 8.0, 10.0, 10.0, 9.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.90625, -57.91845703125, -55.9306640625, -53.94287109375, -51.955078125, -49.96728515625, -47.9794921875, -45.99169921875, -44.00390625, -42.01611328125, -40.0283203125, -38.04052734375, -36.052734375, -34.06494140625, -32.0771484375, -30.08935546875, -28.1015625, -26.11376953125, -24.1259765625, -22.13818359375, -20.150390625, -18.16259765625, -16.1748046875, -14.18701171875, -12.19921875, -10.21142578125, -8.2236328125, -6.23583984375, -4.248046875, -2.26025390625, -0.2724609375, 1.71533203125, 3.703125, 5.69091796875, 7.6787109375, 9.66650390625, 11.654296875, 13.64208984375, 15.6298828125, 17.61767578125, 19.60546875, 21.59326171875, 23.5810546875, 25.56884765625, 27.556640625, 29.54443359375, 31.5322265625, 33.52001953125, 35.5078125, 37.49560546875, 39.4833984375, 41.47119140625, 43.458984375, 45.44677734375, 47.4345703125, 49.42236328125, 51.41015625, 53.39794921875, 55.3857421875, 57.37353515625, 59.361328125, 61.34912109375, 63.3369140625, 65.32470703125, 67.3125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 3.0, 5.0, 4.0, 5.0, 6.0, 11.0, 14.0, 11.0, 15.0, 20.0, 17.0, 31.0, 35.0, 35.0, 27.0, 38.0, 44.0, 47.0, 39.0, 56.0, 42.0, 45.0, 54.0, 44.0, 46.0, 37.0, 43.0, 35.0, 25.0, 19.0, 25.0, 17.0, 22.0, 11.0, 17.0, 11.0, 13.0, 7.0, 7.0, 2.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.55672836303711, -47.03756332397461, -45.518394470214844, -43.999229431152344, -42.48006057739258, -40.96089553833008, -39.44172668457031, -37.92256164550781, -36.40339660644531, -34.88423156738281, -33.36506271362305, -31.845897674560547, -30.32672882080078, -28.80756378173828, -27.28839683532715, -25.769229888916016, -24.25006103515625, -22.730894088745117, -21.211727142333984, -19.692562103271484, -18.17339324951172, -16.65422821044922, -15.135061264038086, -13.615894317626953, -12.09672737121582, -10.577560424804688, -9.058393478393555, -7.539227485656738, -6.0200605392456055, -4.500893592834473, -2.9817276000976562, -1.4625606536865234, 0.056610107421875, 1.5757768154144287, 3.0949435234069824, 4.614109992980957, 6.13327693939209, 7.652443885803223, 9.171609878540039, 10.690776824951172, 12.209943771362305, 13.729110717773438, 15.24827766418457, 16.767444610595703, 18.286609649658203, 19.80577850341797, 21.32494354248047, 22.8441104888916, 24.363277435302734, 25.882444381713867, 27.401611328125, 28.9207763671875, 30.439945220947266, 31.959110260009766, 33.47827911376953, 34.99744415283203, 36.51660919189453, 38.03577423095703, 39.5549430847168, 41.0741081237793, 42.59327697753906, 44.11244201660156, 45.63160705566406, 47.15077590942383, 48.669944763183594]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 8.0, 12.0, 14.0, 18.0, 14.0, 13.0, 24.0, 18.0, 23.0, 21.0, 28.0, 24.0, 30.0, 36.0, 44.0, 46.0, 50.0, 29.0, 44.0, 48.0, 42.0, 36.0, 18.0, 49.0, 35.0, 31.0, 46.0, 18.0, 16.0, 26.0, 21.0, 16.0, 24.0, 9.0, 11.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0], "bins": [-51.44761657714844, -49.96538162231445, -48.4831428527832, -47.00090789794922, -45.51866912841797, -44.036434173583984, -42.55419921875, -41.07196044921875, -39.589725494384766, -38.10749053955078, -36.62525177001953, -35.14301681518555, -33.66078186035156, -32.17854309082031, -30.696308135986328, -29.21407127380371, -27.731834411621094, -26.249597549438477, -24.76736068725586, -23.285125732421875, -21.802888870239258, -20.32065200805664, -18.838417053222656, -17.35618019104004, -15.873943328857422, -14.391706466674805, -12.909470558166504, -11.427234649658203, -9.944997787475586, -8.462760925292969, -6.980525016784668, -5.498289108276367, -4.01605224609375, -2.533815860748291, -1.051579475402832, 0.43065690994262695, 1.912893295288086, 3.395129680633545, 4.877366065979004, 6.359601974487305, 7.841838836669922, 9.324075698852539, 10.80631160736084, 12.28854751586914, 13.770784378051758, 15.253021240234375, 16.73525619506836, 18.217493057250977, 19.699729919433594, 21.18196678161621, 22.664203643798828, 24.146438598632812, 25.62867546081543, 27.110912322998047, 28.59314727783203, 30.07538414001465, 31.557621002197266, 33.03985595703125, 34.5220947265625, 36.004329681396484, 37.48656463623047, 38.96880340576172, 40.4510383605957, 41.93327331542969, 43.41551208496094]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 20.0, 25.0, 37.0, 52.0, 93.0, 149.0, 275.0, 339.0, 609.0, 943.0, 1510.0, 2436.0, 3865.0, 6211.0, 9995.0, 16294.0, 26501.0, 43423.0, 70672.0, 117489.0, 193413.0, 320495.0, 528809.0, 787279.0, 772325.0, 512200.0, 309424.0, 186214.0, 111785.0, 67434.0, 40454.0, 24690.0, 14972.0, 9217.0, 5618.0, 3455.0, 2140.0, 1253.0, 834.0, 513.0, 289.0, 214.0, 128.0, 72.0, 38.0, 39.0, 15.0, 10.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -76.2255859375, -73.763671875, -71.3017578125, -68.83984375, -66.3779296875, -63.916015625, -61.4541015625, -58.9921875, -56.5302734375, -54.068359375, -51.6064453125, -49.14453125, -46.6826171875, -44.220703125, -41.7587890625, -39.296875, -36.8349609375, -34.373046875, -31.9111328125, -29.44921875, -26.9873046875, -24.525390625, -22.0634765625, -19.6015625, -17.1396484375, -14.677734375, -12.2158203125, -9.75390625, -7.2919921875, -4.830078125, -2.3681640625, 0.09375, 2.5556640625, 5.017578125, 7.4794921875, 9.94140625, 12.4033203125, 14.865234375, 17.3271484375, 19.7890625, 22.2509765625, 24.712890625, 27.1748046875, 29.63671875, 32.0986328125, 34.560546875, 37.0224609375, 39.484375, 41.9462890625, 44.408203125, 46.8701171875, 49.33203125, 51.7939453125, 54.255859375, 56.7177734375, 59.1796875, 61.6416015625, 64.103515625, 66.5654296875, 69.02734375, 71.4892578125, 73.951171875, 76.4130859375, 78.875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 10.0, 11.0, 6.0, 7.0, 13.0, 17.0, 25.0, 12.0, 16.0, 19.0, 25.0, 30.0, 26.0, 25.0, 27.0, 45.0, 42.0, 31.0, 40.0, 39.0, 38.0, 41.0, 48.0, 41.0, 38.0, 26.0, 29.0, 27.0, 37.0, 17.0, 27.0, 26.0, 21.0, 22.0, 19.0, 8.0, 8.0, 8.0, 14.0, 5.0, 7.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-41.8125, -40.55517578125, -39.2978515625, -38.04052734375, -36.783203125, -35.52587890625, -34.2685546875, -33.01123046875, -31.75390625, -30.49658203125, -29.2392578125, -27.98193359375, -26.724609375, -25.46728515625, -24.2099609375, -22.95263671875, -21.6953125, -20.43798828125, -19.1806640625, -17.92333984375, -16.666015625, -15.40869140625, -14.1513671875, -12.89404296875, -11.63671875, -10.37939453125, -9.1220703125, -7.86474609375, -6.607421875, -5.35009765625, -4.0927734375, -2.83544921875, -1.578125, -0.32080078125, 0.9365234375, 2.19384765625, 3.451171875, 4.70849609375, 5.9658203125, 7.22314453125, 8.48046875, 9.73779296875, 10.9951171875, 12.25244140625, 13.509765625, 14.76708984375, 16.0244140625, 17.28173828125, 18.5390625, 19.79638671875, 21.0537109375, 22.31103515625, 23.568359375, 24.82568359375, 26.0830078125, 27.34033203125, 28.59765625, 29.85498046875, 31.1123046875, 32.36962890625, 33.626953125, 34.88427734375, 36.1416015625, 37.39892578125, 38.65625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 17.0, 27.0, 41.0, 68.0, 79.0, 139.0, 221.0, 366.0, 567.0, 937.0, 1559.0, 2673.0, 4364.0, 7335.0, 11855.0, 20233.0, 33330.0, 55258.0, 91577.0, 147523.0, 235897.0, 361487.0, 516783.0, 649434.0, 637974.0, 494972.0, 341776.0, 222490.0, 139409.0, 85942.0, 51698.0, 31423.0, 18455.0, 11160.0, 6912.0, 4024.0, 2446.0, 1461.0, 918.0, 539.0, 314.0, 223.0, 123.0, 78.0, 48.0, 32.0, 21.0, 20.0, 14.0, 7.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-48.0625, -46.5087890625, -44.955078125, -43.4013671875, -41.84765625, -40.2939453125, -38.740234375, -37.1865234375, -35.6328125, -34.0791015625, -32.525390625, -30.9716796875, -29.41796875, -27.8642578125, -26.310546875, -24.7568359375, -23.203125, -21.6494140625, -20.095703125, -18.5419921875, -16.98828125, -15.4345703125, -13.880859375, -12.3271484375, -10.7734375, -9.2197265625, -7.666015625, -6.1123046875, -4.55859375, -3.0048828125, -1.451171875, 0.1025390625, 1.65625, 3.2099609375, 4.763671875, 6.3173828125, 7.87109375, 9.4248046875, 10.978515625, 12.5322265625, 14.0859375, 15.6396484375, 17.193359375, 18.7470703125, 20.30078125, 21.8544921875, 23.408203125, 24.9619140625, 26.515625, 28.0693359375, 29.623046875, 31.1767578125, 32.73046875, 34.2841796875, 35.837890625, 37.3916015625, 38.9453125, 40.4990234375, 42.052734375, 43.6064453125, 45.16015625, 46.7138671875, 48.267578125, 49.8212890625, 51.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 13.0, 3.0, 15.0, 15.0, 17.0, 24.0, 31.0, 34.0, 52.0, 39.0, 77.0, 81.0, 94.0, 125.0, 129.0, 154.0, 186.0, 207.0, 186.0, 213.0, 244.0, 224.0, 216.0, 231.0, 205.0, 219.0, 165.0, 147.0, 140.0, 117.0, 83.0, 84.0, 63.0, 50.0, 44.0, 31.0, 18.0, 15.0, 17.0, 7.0, 14.0, 11.0, 8.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -20.01171875, -19.3671875, -18.72265625, -18.078125, -17.43359375, -16.7890625, -16.14453125, -15.5, -14.85546875, -14.2109375, -13.56640625, -12.921875, -12.27734375, -11.6328125, -10.98828125, -10.34375, -9.69921875, -9.0546875, -8.41015625, -7.765625, -7.12109375, -6.4765625, -5.83203125, -5.1875, -4.54296875, -3.8984375, -3.25390625, -2.609375, -1.96484375, -1.3203125, -0.67578125, -0.03125, 0.61328125, 1.2578125, 1.90234375, 2.546875, 3.19140625, 3.8359375, 4.48046875, 5.125, 5.76953125, 6.4140625, 7.05859375, 7.703125, 8.34765625, 8.9921875, 9.63671875, 10.28125, 10.92578125, 11.5703125, 12.21484375, 12.859375, 13.50390625, 14.1484375, 14.79296875, 15.4375, 16.08203125, 16.7265625, 17.37109375, 18.015625, 18.66015625, 19.3046875, 19.94921875, 20.59375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 13.0, 15.0, 19.0, 20.0, 24.0, 25.0, 41.0, 44.0, 46.0, 58.0, 58.0, 45.0, 44.0, 54.0, 68.0, 39.0, 49.0, 40.0, 40.0, 31.0, 39.0, 21.0, 26.0, 21.0, 15.0, 22.0, 18.0, 18.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.5589714050293, -50.855369567871094, -49.15176773071289, -47.44816589355469, -45.744564056396484, -44.04096221923828, -42.33735656738281, -40.633758544921875, -38.930152893066406, -37.2265510559082, -35.52294921875, -33.8193473815918, -32.115745544433594, -30.41214370727539, -28.708539962768555, -27.00493812561035, -25.30133819580078, -23.597736358642578, -21.894134521484375, -20.190532684326172, -18.48693084716797, -16.783329010009766, -15.07972526550293, -13.376123428344727, -11.672521591186523, -9.96891975402832, -8.265317916870117, -6.561715126037598, -4.8581132888793945, -3.1545114517211914, -1.4509086608886719, 0.25269317626953125, 1.9562950134277344, 3.6598970890045166, 5.363499164581299, 7.06710147857666, 8.770703315734863, 10.474305152893066, 12.177907943725586, 13.881509780883789, 15.585111618041992, 17.288713455200195, 18.9923152923584, 20.695919036865234, 22.399520874023438, 24.10312271118164, 25.806724548339844, 27.510326385498047, 29.21392822265625, 30.917530059814453, 32.621131896972656, 34.32473373413086, 36.02833557128906, 37.731937408447266, 39.43553924560547, 41.13914489746094, 42.842742919921875, 44.54634475708008, 46.24994659423828, 47.953548431396484, 49.65715026855469, 51.36075210571289, 53.064353942871094, 54.76795959472656, 56.471561431884766]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 8.0, 8.0, 5.0, 15.0, 12.0, 10.0, 14.0, 11.0, 20.0, 12.0, 21.0, 19.0, 31.0, 36.0, 33.0, 47.0, 32.0, 42.0, 51.0, 30.0, 32.0, 31.0, 46.0, 37.0, 40.0, 42.0, 37.0, 33.0, 29.0, 29.0, 25.0, 21.0, 20.0, 17.0, 27.0, 14.0, 13.0, 7.0, 9.0, 9.0, 3.0, 4.0, 2.0, 0.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-47.955162048339844, -46.58327102661133, -45.21137619018555, -43.83948516845703, -42.46759033203125, -41.095699310302734, -39.72380828857422, -38.35191345214844, -36.980018615722656, -35.60812759399414, -34.23623275756836, -32.864341735839844, -31.492446899414062, -30.120555877685547, -28.7486629486084, -27.37677001953125, -26.004878997802734, -24.632986068725586, -23.261093139648438, -21.889202117919922, -20.51730728149414, -19.145416259765625, -17.773523330688477, -16.401630401611328, -15.02973747253418, -13.657844543457031, -12.285951614379883, -10.91405963897705, -9.542166709899902, -8.170273780822754, -6.798381805419922, -5.426488876342773, -4.054599761962891, -2.6827070713043213, -1.310814380645752, 0.06107807159423828, 1.4329710006713867, 2.804863929748535, 4.176755905151367, 5.548648834228516, 6.920541763305664, 8.292434692382812, 9.664327621459961, 11.036219596862793, 12.408112525939941, 13.78000545501709, 15.151897430419922, 16.52379035949707, 17.89568328857422, 19.267576217651367, 20.639469146728516, 22.01136016845703, 23.383255004882812, 24.755146026611328, 26.127038955688477, 27.498931884765625, 28.870824813842773, 30.242717742919922, 31.61461067199707, 32.98650360107422, 34.358394622802734, 35.730289459228516, 37.10218048095703, 38.47407531738281, 39.84596633911133]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 14.0, 21.0, 39.0, 44.0, 71.0, 107.0, 163.0, 238.0, 397.0, 611.0, 930.0, 1363.0, 2189.0, 3275.0, 5170.0, 7678.0, 12117.0, 18816.0, 29531.0, 47621.0, 78676.0, 127177.0, 179032.0, 182505.0, 132928.0, 81872.0, 50047.0, 30402.0, 19418.0, 12609.0, 8209.0, 5391.0, 3501.0, 2268.0, 1447.0, 926.0, 615.0, 402.0, 251.0, 169.0, 123.0, 61.0, 46.0, 30.0, 14.0, 18.0, 4.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-72.0625, -69.8818359375, -67.701171875, -65.5205078125, -63.33984375, -61.1591796875, -58.978515625, -56.7978515625, -54.6171875, -52.4365234375, -50.255859375, -48.0751953125, -45.89453125, -43.7138671875, -41.533203125, -39.3525390625, -37.171875, -34.9912109375, -32.810546875, -30.6298828125, -28.44921875, -26.2685546875, -24.087890625, -21.9072265625, -19.7265625, -17.5458984375, -15.365234375, -13.1845703125, -11.00390625, -8.8232421875, -6.642578125, -4.4619140625, -2.28125, -0.1005859375, 2.080078125, 4.2607421875, 6.44140625, 8.6220703125, 10.802734375, 12.9833984375, 15.1640625, 17.3447265625, 19.525390625, 21.7060546875, 23.88671875, 26.0673828125, 28.248046875, 30.4287109375, 32.609375, 34.7900390625, 36.970703125, 39.1513671875, 41.33203125, 43.5126953125, 45.693359375, 47.8740234375, 50.0546875, 52.2353515625, 54.416015625, 56.5966796875, 58.77734375, 60.9580078125, 63.138671875, 65.3193359375, 67.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 7.0, 11.0, 4.0, 6.0, 7.0, 12.0, 10.0, 10.0, 20.0, 19.0, 20.0, 29.0, 29.0, 41.0, 40.0, 26.0, 42.0, 37.0, 34.0, 32.0, 41.0, 45.0, 39.0, 50.0, 45.0, 37.0, 38.0, 31.0, 34.0, 23.0, 28.0, 28.0, 24.0, 14.0, 11.0, 17.0, 13.0, 10.0, 6.0, 7.0, 1.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 5.0], "bins": [-45.78125, -44.54638671875, -43.3115234375, -42.07666015625, -40.841796875, -39.60693359375, -38.3720703125, -37.13720703125, -35.90234375, -34.66748046875, -33.4326171875, -32.19775390625, -30.962890625, -29.72802734375, -28.4931640625, -27.25830078125, -26.0234375, -24.78857421875, -23.5537109375, -22.31884765625, -21.083984375, -19.84912109375, -18.6142578125, -17.37939453125, -16.14453125, -14.90966796875, -13.6748046875, -12.43994140625, -11.205078125, -9.97021484375, -8.7353515625, -7.50048828125, -6.265625, -5.03076171875, -3.7958984375, -2.56103515625, -1.326171875, -0.09130859375, 1.1435546875, 2.37841796875, 3.61328125, 4.84814453125, 6.0830078125, 7.31787109375, 8.552734375, 9.78759765625, 11.0224609375, 12.25732421875, 13.4921875, 14.72705078125, 15.9619140625, 17.19677734375, 18.431640625, 19.66650390625, 20.9013671875, 22.13623046875, 23.37109375, 24.60595703125, 25.8408203125, 27.07568359375, 28.310546875, 29.54541015625, 30.7802734375, 32.01513671875, 33.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 4.0, 9.0, 13.0, 18.0, 30.0, 36.0, 61.0, 70.0, 109.0, 173.0, 196.0, 380.0, 531.0, 751.0, 1086.0, 1657.0, 2575.0, 3910.0, 6251.0, 9744.0, 15968.0, 26566.0, 45571.0, 85470.0, 164166.0, 255535.0, 192641.0, 101553.0, 53644.0, 30438.0, 18055.0, 11160.0, 7198.0, 4483.0, 2869.0, 1873.0, 1134.0, 858.0, 536.0, 392.0, 251.0, 198.0, 118.0, 76.0, 60.0, 37.0, 26.0, 17.0, 20.0, 11.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 5.0], "bins": [-93.625, -90.755859375, -87.88671875, -85.017578125, -82.1484375, -79.279296875, -76.41015625, -73.541015625, -70.671875, -67.802734375, -64.93359375, -62.064453125, -59.1953125, -56.326171875, -53.45703125, -50.587890625, -47.71875, -44.849609375, -41.98046875, -39.111328125, -36.2421875, -33.373046875, -30.50390625, -27.634765625, -24.765625, -21.896484375, -19.02734375, -16.158203125, -13.2890625, -10.419921875, -7.55078125, -4.681640625, -1.8125, 1.056640625, 3.92578125, 6.794921875, 9.6640625, 12.533203125, 15.40234375, 18.271484375, 21.140625, 24.009765625, 26.87890625, 29.748046875, 32.6171875, 35.486328125, 38.35546875, 41.224609375, 44.09375, 46.962890625, 49.83203125, 52.701171875, 55.5703125, 58.439453125, 61.30859375, 64.177734375, 67.046875, 69.916015625, 72.78515625, 75.654296875, 78.5234375, 81.392578125, 84.26171875, 87.130859375, 90.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 8.0, 13.0, 15.0, 22.0, 18.0, 17.0, 23.0, 19.0, 24.0, 36.0, 35.0, 34.0, 25.0, 32.0, 29.0, 36.0, 38.0, 37.0, 40.0, 35.0, 47.0, 51.0, 40.0, 36.0, 36.0, 31.0, 36.0, 27.0, 23.0, 30.0, 9.0, 18.0, 14.0, 14.0, 2.0, 15.0, 4.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.609375, -26.753662109375, -25.89794921875, -25.042236328125, -24.1865234375, -23.330810546875, -22.47509765625, -21.619384765625, -20.763671875, -19.907958984375, -19.05224609375, -18.196533203125, -17.3408203125, -16.485107421875, -15.62939453125, -14.773681640625, -13.91796875, -13.062255859375, -12.20654296875, -11.350830078125, -10.4951171875, -9.639404296875, -8.78369140625, -7.927978515625, -7.072265625, -6.216552734375, -5.36083984375, -4.505126953125, -3.6494140625, -2.793701171875, -1.93798828125, -1.082275390625, -0.2265625, 0.629150390625, 1.48486328125, 2.340576171875, 3.1962890625, 4.052001953125, 4.90771484375, 5.763427734375, 6.619140625, 7.474853515625, 8.33056640625, 9.186279296875, 10.0419921875, 10.897705078125, 11.75341796875, 12.609130859375, 13.46484375, 14.320556640625, 15.17626953125, 16.031982421875, 16.8876953125, 17.743408203125, 18.59912109375, 19.454833984375, 20.310546875, 21.166259765625, 22.02197265625, 22.877685546875, 23.7333984375, 24.589111328125, 25.44482421875, 26.300537109375, 27.15625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 14.0, 15.0, 25.0, 33.0, 52.0, 52.0, 92.0, 152.0, 236.0, 300.0, 564.0, 918.0, 1525.0, 2820.0, 5294.0, 10068.0, 20319.0, 43603.0, 97125.0, 206720.0, 294559.0, 193679.0, 89912.0, 40455.0, 19289.0, 9192.0, 4980.0, 2683.0, 1510.0, 887.0, 537.0, 324.0, 212.0, 118.0, 92.0, 68.0, 34.0, 31.0, 20.0, 14.0, 13.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.625, -41.3115234375, -39.998046875, -38.6845703125, -37.37109375, -36.0576171875, -34.744140625, -33.4306640625, -32.1171875, -30.8037109375, -29.490234375, -28.1767578125, -26.86328125, -25.5498046875, -24.236328125, -22.9228515625, -21.609375, -20.2958984375, -18.982421875, -17.6689453125, -16.35546875, -15.0419921875, -13.728515625, -12.4150390625, -11.1015625, -9.7880859375, -8.474609375, -7.1611328125, -5.84765625, -4.5341796875, -3.220703125, -1.9072265625, -0.59375, 0.7197265625, 2.033203125, 3.3466796875, 4.66015625, 5.9736328125, 7.287109375, 8.6005859375, 9.9140625, 11.2275390625, 12.541015625, 13.8544921875, 15.16796875, 16.4814453125, 17.794921875, 19.1083984375, 20.421875, 21.7353515625, 23.048828125, 24.3623046875, 25.67578125, 26.9892578125, 28.302734375, 29.6162109375, 30.9296875, 32.2431640625, 33.556640625, 34.8701171875, 36.18359375, 37.4970703125, 38.810546875, 40.1240234375, 41.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 12.0, 11.0, 28.0, 34.0, 104.0, 156.0, 203.0, 176.0, 99.0, 62.0, 28.0, 28.0, 8.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007694244384765625, -0.007504522800445557, -0.007314801216125488, -0.00712507963180542, -0.0069353580474853516, -0.006745636463165283, -0.006555914878845215, -0.0063661932945251465, -0.006176471710205078, -0.00598675012588501, -0.005797028541564941, -0.005607306957244873, -0.005417585372924805, -0.005227863788604736, -0.005038142204284668, -0.0048484206199646, -0.004658699035644531, -0.004468977451324463, -0.0042792558670043945, -0.004089534282684326, -0.003899812698364258, -0.0037100911140441895, -0.003520369529724121, -0.0033306479454040527, -0.0031409263610839844, -0.002951204776763916, -0.0027614831924438477, -0.0025717616081237793, -0.002382040023803711, -0.0021923184394836426, -0.0020025968551635742, -0.0018128752708435059, -0.0016231536865234375, -0.0014334321022033691, -0.0012437105178833008, -0.0010539889335632324, -0.0008642673492431641, -0.0006745457649230957, -0.00048482418060302734, -0.000295102596282959, -0.00010538101196289062, 8.434057235717773e-05, 0.0002740621566772461, 0.00046378374099731445, 0.0006535053253173828, 0.0008432269096374512, 0.0010329484939575195, 0.0012226700782775879, 0.0014123916625976562, 0.0016021132469177246, 0.001791834831237793, 0.0019815564155578613, 0.0021712779998779297, 0.002360999584197998, 0.0025507211685180664, 0.0027404427528381348, 0.002930164337158203, 0.0031198859214782715, 0.00330960750579834, 0.003499329090118408, 0.0036890506744384766, 0.003878772258758545, 0.004068493843078613, 0.004258215427398682, 0.00444793701171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 12.0, 13.0, 6.0, 21.0, 22.0, 33.0, 43.0, 71.0, 98.0, 144.0, 263.0, 384.0, 583.0, 1032.0, 1878.0, 3133.0, 5843.0, 10738.0, 19964.0, 37650.0, 68236.0, 115371.0, 169329.0, 195367.0, 164929.0, 111178.0, 65043.0, 35332.0, 18950.0, 10007.0, 5457.0, 3028.0, 1742.0, 979.0, 592.0, 399.0, 218.0, 153.0, 98.0, 73.0, 45.0, 28.0, 18.0, 13.0, 9.0, 15.0, 6.0, 6.0, 8.0, 1.0, 2.0, 0.0, 2.0], "bins": [-40.125, -38.96044921875, -37.7958984375, -36.63134765625, -35.466796875, -34.30224609375, -33.1376953125, -31.97314453125, -30.80859375, -29.64404296875, -28.4794921875, -27.31494140625, -26.150390625, -24.98583984375, -23.8212890625, -22.65673828125, -21.4921875, -20.32763671875, -19.1630859375, -17.99853515625, -16.833984375, -15.66943359375, -14.5048828125, -13.34033203125, -12.17578125, -11.01123046875, -9.8466796875, -8.68212890625, -7.517578125, -6.35302734375, -5.1884765625, -4.02392578125, -2.859375, -1.69482421875, -0.5302734375, 0.63427734375, 1.798828125, 2.96337890625, 4.1279296875, 5.29248046875, 6.45703125, 7.62158203125, 8.7861328125, 9.95068359375, 11.115234375, 12.27978515625, 13.4443359375, 14.60888671875, 15.7734375, 16.93798828125, 18.1025390625, 19.26708984375, 20.431640625, 21.59619140625, 22.7607421875, 23.92529296875, 25.08984375, 26.25439453125, 27.4189453125, 28.58349609375, 29.748046875, 30.91259765625, 32.0771484375, 33.24169921875, 34.40625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 2.0, 1.0, 2.0, 11.0, 6.0, 14.0, 14.0, 20.0, 16.0, 34.0, 28.0, 21.0, 33.0, 48.0, 52.0, 58.0, 38.0, 54.0, 59.0, 69.0, 54.0, 44.0, 49.0, 49.0, 44.0, 31.0, 31.0, 20.0, 19.0, 17.0, 16.0, 7.0, 6.0, 9.0, 7.0, 0.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3704833984375, -11.967529296875, -11.5645751953125, -11.16162109375, -10.7586669921875, -10.355712890625, -9.9527587890625, -9.5498046875, -9.1468505859375, -8.743896484375, -8.3409423828125, -7.93798828125, -7.5350341796875, -7.132080078125, -6.7291259765625, -6.326171875, -5.9232177734375, -5.520263671875, -5.1173095703125, -4.71435546875, -4.3114013671875, -3.908447265625, -3.5054931640625, -3.1025390625, -2.6995849609375, -2.296630859375, -1.8936767578125, -1.49072265625, -1.0877685546875, -0.684814453125, -0.2818603515625, 0.12109375, 0.5240478515625, 0.927001953125, 1.3299560546875, 1.73291015625, 2.1358642578125, 2.538818359375, 2.9417724609375, 3.3447265625, 3.7476806640625, 4.150634765625, 4.5535888671875, 4.95654296875, 5.3594970703125, 5.762451171875, 6.1654052734375, 6.568359375, 6.9713134765625, 7.374267578125, 7.7772216796875, 8.18017578125, 8.5831298828125, 8.986083984375, 9.3890380859375, 9.7919921875, 10.1949462890625, 10.597900390625, 11.0008544921875, 11.40380859375, 11.8067626953125, 12.209716796875, 12.6126708984375, 13.015625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 11.0, 9.0, 12.0, 19.0, 15.0, 33.0, 25.0, 33.0, 45.0, 38.0, 52.0, 52.0, 55.0, 59.0, 46.0, 58.0, 75.0, 33.0, 49.0, 50.0, 31.0, 34.0, 20.0, 25.0, 21.0, 16.0, 18.0, 10.0, 10.0, 9.0, 13.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.54157257080078, -48.033504486083984, -46.52544021606445, -45.017372131347656, -43.509307861328125, -42.00123977661133, -40.49317169189453, -38.985107421875, -37.47704315185547, -35.96897506713867, -34.46091079711914, -32.952842712402344, -31.444778442382812, -29.936710357666016, -28.42864418029785, -26.920578002929688, -25.41250991821289, -23.904443740844727, -22.396377563476562, -20.888309478759766, -19.380245208740234, -17.872177124023438, -16.364110946655273, -14.85604476928711, -13.347978591918945, -11.839912414550781, -10.331846237182617, -8.823779106140137, -7.315712928771973, -5.807646751403809, -4.299579620361328, -2.791513442993164, -1.2834510803222656, 0.22461533546447754, 1.7326817512512207, 3.240748405456543, 4.748814582824707, 6.256880760192871, 7.764947891235352, 9.273014068603516, 10.78108024597168, 12.289146423339844, 13.797212600708008, 15.305279731750488, 16.81334686279297, 18.3214111328125, 19.829479217529297, 21.33754539489746, 22.845611572265625, 24.35367774963379, 25.861743927001953, 27.36981201171875, 28.87787628173828, 30.385944366455078, 31.894010543823242, 33.402076721191406, 34.91014099121094, 36.418209075927734, 37.926273345947266, 39.43434143066406, 40.942405700683594, 42.45047378540039, 43.95854187011719, 45.46660614013672, 46.974674224853516]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 10.0, 8.0, 10.0, 23.0, 9.0, 9.0, 8.0, 19.0, 19.0, 19.0, 26.0, 22.0, 18.0, 33.0, 47.0, 34.0, 52.0, 40.0, 36.0, 35.0, 31.0, 39.0, 45.0, 40.0, 35.0, 37.0, 56.0, 31.0, 18.0, 21.0, 23.0, 19.0, 21.0, 17.0, 13.0, 16.0, 14.0, 7.0, 7.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-40.58488082885742, -39.42475128173828, -38.26462173461914, -37.1044921875, -35.94436264038086, -34.78423309326172, -33.62410354614258, -32.46397399902344, -31.303844451904297, -30.143714904785156, -28.983585357666016, -27.823455810546875, -26.663326263427734, -25.503196716308594, -24.343067169189453, -23.182937622070312, -22.02280616760254, -20.8626766204834, -19.702547073364258, -18.542417526245117, -17.382287979125977, -16.222158432006836, -15.062027931213379, -13.901898384094238, -12.741768836975098, -11.581639289855957, -10.421509742736816, -9.26137924194336, -8.101249694824219, -6.941120624542236, -5.7809906005859375, -4.620861053466797, -3.4607315063476562, -2.3006019592285156, -1.140472173690796, 0.019657611846923828, 1.1797871589660645, 2.339916706085205, 3.500046730041504, 4.6601762771606445, 5.820305824279785, 6.980435371398926, 8.140564918518066, 9.300695419311523, 10.460824966430664, 11.620954513549805, 12.781084060668945, 13.941213607788086, 15.101343154907227, 16.261472702026367, 17.421602249145508, 18.58173179626465, 19.74186134338379, 20.90199089050293, 22.062122344970703, 23.222251892089844, 24.382381439208984, 25.542510986328125, 26.702640533447266, 27.862770080566406, 29.022899627685547, 30.183029174804688, 31.343158721923828, 32.50328826904297, 33.66341781616211]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 7.0, 12.0, 15.0, 33.0, 34.0, 50.0, 78.0, 163.0, 201.0, 305.0, 528.0, 795.0, 1191.0, 1896.0, 3124.0, 4759.0, 7258.0, 11451.0, 17487.0, 26634.0, 39100.0, 55328.0, 75192.0, 94269.0, 110395.0, 117948.0, 113353.0, 99236.0, 79780.0, 60058.0, 42763.0, 29409.0, 19882.0, 12851.0, 8228.0, 5421.0, 3368.0, 2159.0, 1419.0, 806.0, 573.0, 352.0, 220.0, 169.0, 88.0, 52.0, 46.0, 18.0, 16.0, 19.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0], "bins": [-47.8125, -46.34716796875, -44.8818359375, -43.41650390625, -41.951171875, -40.48583984375, -39.0205078125, -37.55517578125, -36.08984375, -34.62451171875, -33.1591796875, -31.69384765625, -30.228515625, -28.76318359375, -27.2978515625, -25.83251953125, -24.3671875, -22.90185546875, -21.4365234375, -19.97119140625, -18.505859375, -17.04052734375, -15.5751953125, -14.10986328125, -12.64453125, -11.17919921875, -9.7138671875, -8.24853515625, -6.783203125, -5.31787109375, -3.8525390625, -2.38720703125, -0.921875, 0.54345703125, 2.0087890625, 3.47412109375, 4.939453125, 6.40478515625, 7.8701171875, 9.33544921875, 10.80078125, 12.26611328125, 13.7314453125, 15.19677734375, 16.662109375, 18.12744140625, 19.5927734375, 21.05810546875, 22.5234375, 23.98876953125, 25.4541015625, 26.91943359375, 28.384765625, 29.85009765625, 31.3154296875, 32.78076171875, 34.24609375, 35.71142578125, 37.1767578125, 38.64208984375, 40.107421875, 41.57275390625, 43.0380859375, 44.50341796875, 45.96875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 5.0, 6.0, 9.0, 11.0, 14.0, 9.0, 9.0, 15.0, 19.0, 20.0, 15.0, 23.0, 31.0, 26.0, 30.0, 29.0, 31.0, 35.0, 41.0, 51.0, 43.0, 29.0, 34.0, 49.0, 33.0, 48.0, 40.0, 37.0, 28.0, 25.0, 32.0, 24.0, 17.0, 16.0, 10.0, 21.0, 16.0, 14.0, 12.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 3.0], "bins": [-37.03125, -35.975341796875, -34.91943359375, -33.863525390625, -32.8076171875, -31.751708984375, -30.69580078125, -29.639892578125, -28.583984375, -27.528076171875, -26.47216796875, -25.416259765625, -24.3603515625, -23.304443359375, -22.24853515625, -21.192626953125, -20.13671875, -19.080810546875, -18.02490234375, -16.968994140625, -15.9130859375, -14.857177734375, -13.80126953125, -12.745361328125, -11.689453125, -10.633544921875, -9.57763671875, -8.521728515625, -7.4658203125, -6.409912109375, -5.35400390625, -4.298095703125, -3.2421875, -2.186279296875, -1.13037109375, -0.074462890625, 0.9814453125, 2.037353515625, 3.09326171875, 4.149169921875, 5.205078125, 6.260986328125, 7.31689453125, 8.372802734375, 9.4287109375, 10.484619140625, 11.54052734375, 12.596435546875, 13.65234375, 14.708251953125, 15.76416015625, 16.820068359375, 17.8759765625, 18.931884765625, 19.98779296875, 21.043701171875, 22.099609375, 23.155517578125, 24.21142578125, 25.267333984375, 26.3232421875, 27.379150390625, 28.43505859375, 29.490966796875, 30.546875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 6.0, 24.0, 31.0, 37.0, 78.0, 138.0, 233.0, 386.0, 658.0, 1146.0, 1985.0, 3439.0, 6278.0, 10776.0, 18044.0, 29903.0, 47372.0, 70692.0, 97786.0, 122984.0, 136800.0, 133736.0, 115352.0, 88330.0, 61432.0, 40073.0, 25012.0, 14879.0, 8915.0, 5167.0, 2893.0, 1622.0, 959.0, 562.0, 314.0, 223.0, 111.0, 56.0, 47.0, 27.0, 22.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0, -48.4287109375, -46.857421875, -45.2861328125, -43.71484375, -42.1435546875, -40.572265625, -39.0009765625, -37.4296875, -35.8583984375, -34.287109375, -32.7158203125, -31.14453125, -29.5732421875, -28.001953125, -26.4306640625, -24.859375, -23.2880859375, -21.716796875, -20.1455078125, -18.57421875, -17.0029296875, -15.431640625, -13.8603515625, -12.2890625, -10.7177734375, -9.146484375, -7.5751953125, -6.00390625, -4.4326171875, -2.861328125, -1.2900390625, 0.28125, 1.8525390625, 3.423828125, 4.9951171875, 6.56640625, 8.1376953125, 9.708984375, 11.2802734375, 12.8515625, 14.4228515625, 15.994140625, 17.5654296875, 19.13671875, 20.7080078125, 22.279296875, 23.8505859375, 25.421875, 26.9931640625, 28.564453125, 30.1357421875, 31.70703125, 33.2783203125, 34.849609375, 36.4208984375, 37.9921875, 39.5634765625, 41.134765625, 42.7060546875, 44.27734375, 45.8486328125, 47.419921875, 48.9912109375, 50.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 6.0, 9.0, 9.0, 10.0, 14.0, 16.0, 17.0, 22.0, 26.0, 29.0, 25.0, 23.0, 32.0, 46.0, 37.0, 46.0, 49.0, 41.0, 49.0, 42.0, 41.0, 28.0, 31.0, 30.0, 24.0, 32.0, 28.0, 34.0, 27.0, 35.0, 19.0, 26.0, 9.0, 15.0, 10.0, 14.0, 17.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.59619140625, -22.8642578125, -22.13232421875, -21.400390625, -20.66845703125, -19.9365234375, -19.20458984375, -18.47265625, -17.74072265625, -17.0087890625, -16.27685546875, -15.544921875, -14.81298828125, -14.0810546875, -13.34912109375, -12.6171875, -11.88525390625, -11.1533203125, -10.42138671875, -9.689453125, -8.95751953125, -8.2255859375, -7.49365234375, -6.76171875, -6.02978515625, -5.2978515625, -4.56591796875, -3.833984375, -3.10205078125, -2.3701171875, -1.63818359375, -0.90625, -0.17431640625, 0.5576171875, 1.28955078125, 2.021484375, 2.75341796875, 3.4853515625, 4.21728515625, 4.94921875, 5.68115234375, 6.4130859375, 7.14501953125, 7.876953125, 8.60888671875, 9.3408203125, 10.07275390625, 10.8046875, 11.53662109375, 12.2685546875, 13.00048828125, 13.732421875, 14.46435546875, 15.1962890625, 15.92822265625, 16.66015625, 17.39208984375, 18.1240234375, 18.85595703125, 19.587890625, 20.31982421875, 21.0517578125, 21.78369140625, 22.515625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 7.0, 15.0, 28.0, 33.0, 53.0, 75.0, 80.0, 128.0, 157.0, 231.0, 370.0, 516.0, 769.0, 1313.0, 2150.0, 3949.0, 7366.0, 14507.0, 30301.0, 62441.0, 122172.0, 200716.0, 231380.0, 174566.0, 97784.0, 48611.0, 23334.0, 11333.0, 5837.0, 3185.0, 1899.0, 1078.0, 648.0, 465.0, 292.0, 238.0, 121.0, 95.0, 83.0, 63.0, 37.0, 31.0, 28.0, 20.0, 9.0, 11.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-28.296875, -27.3935546875, -26.490234375, -25.5869140625, -24.68359375, -23.7802734375, -22.876953125, -21.9736328125, -21.0703125, -20.1669921875, -19.263671875, -18.3603515625, -17.45703125, -16.5537109375, -15.650390625, -14.7470703125, -13.84375, -12.9404296875, -12.037109375, -11.1337890625, -10.23046875, -9.3271484375, -8.423828125, -7.5205078125, -6.6171875, -5.7138671875, -4.810546875, -3.9072265625, -3.00390625, -2.1005859375, -1.197265625, -0.2939453125, 0.609375, 1.5126953125, 2.416015625, 3.3193359375, 4.22265625, 5.1259765625, 6.029296875, 6.9326171875, 7.8359375, 8.7392578125, 9.642578125, 10.5458984375, 11.44921875, 12.3525390625, 13.255859375, 14.1591796875, 15.0625, 15.9658203125, 16.869140625, 17.7724609375, 18.67578125, 19.5791015625, 20.482421875, 21.3857421875, 22.2890625, 23.1923828125, 24.095703125, 24.9990234375, 25.90234375, 26.8056640625, 27.708984375, 28.6123046875, 29.515625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 13.0, 6.0, 18.0, 18.0, 26.0, 35.0, 45.0, 51.0, 61.0, 86.0, 82.0, 91.0, 92.0, 83.0, 60.0, 57.0, 35.0, 34.0, 21.0, 15.0, 15.0, 9.0, 6.0, 1.0, 10.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029392242431640625, -0.0028423964977264404, -0.0027455687522888184, -0.0026487410068511963, -0.0025519132614135742, -0.002455085515975952, -0.00235825777053833, -0.002261430025100708, -0.002164602279663086, -0.002067774534225464, -0.001970946788787842, -0.0018741190433502197, -0.0017772912979125977, -0.0016804635524749756, -0.0015836358070373535, -0.0014868080615997314, -0.0013899803161621094, -0.0012931525707244873, -0.0011963248252868652, -0.0010994970798492432, -0.001002669334411621, -0.000905841588973999, -0.000809013843536377, -0.0007121860980987549, -0.0006153583526611328, -0.0005185306072235107, -0.00042170286178588867, -0.0003248751163482666, -0.00022804737091064453, -0.00013121962547302246, -3.439188003540039e-05, 6.243586540222168e-05, 0.00015926361083984375, 0.0002560913562774658, 0.0003529191017150879, 0.00044974684715270996, 0.000546574592590332, 0.0006434023380279541, 0.0007402300834655762, 0.0008370578289031982, 0.0009338855743408203, 0.0010307133197784424, 0.0011275410652160645, 0.0012243688106536865, 0.0013211965560913086, 0.0014180243015289307, 0.0015148520469665527, 0.0016116797924041748, 0.0017085075378417969, 0.001805335283279419, 0.001902163028717041, 0.001998990774154663, 0.002095818519592285, 0.0021926462650299072, 0.0022894740104675293, 0.0023863017559051514, 0.0024831295013427734, 0.0025799572467803955, 0.0026767849922180176, 0.0027736127376556396, 0.0028704404830932617, 0.002967268228530884, 0.003064095973968506, 0.003160923719406128, 0.00325775146484375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 13.0, 18.0, 34.0, 44.0, 75.0, 92.0, 145.0, 200.0, 331.0, 457.0, 721.0, 1118.0, 1830.0, 2879.0, 4767.0, 8029.0, 13350.0, 22974.0, 38804.0, 64802.0, 103760.0, 146971.0, 172121.0, 157665.0, 117788.0, 76332.0, 45982.0, 27282.0, 15967.0, 9280.0, 5486.0, 3359.0, 2041.0, 1309.0, 878.0, 573.0, 354.0, 243.0, 144.0, 105.0, 64.0, 45.0, 35.0, 27.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0], "bins": [-20.140625, -19.52392578125, -18.9072265625, -18.29052734375, -17.673828125, -17.05712890625, -16.4404296875, -15.82373046875, -15.20703125, -14.59033203125, -13.9736328125, -13.35693359375, -12.740234375, -12.12353515625, -11.5068359375, -10.89013671875, -10.2734375, -9.65673828125, -9.0400390625, -8.42333984375, -7.806640625, -7.18994140625, -6.5732421875, -5.95654296875, -5.33984375, -4.72314453125, -4.1064453125, -3.48974609375, -2.873046875, -2.25634765625, -1.6396484375, -1.02294921875, -0.40625, 0.21044921875, 0.8271484375, 1.44384765625, 2.060546875, 2.67724609375, 3.2939453125, 3.91064453125, 4.52734375, 5.14404296875, 5.7607421875, 6.37744140625, 6.994140625, 7.61083984375, 8.2275390625, 8.84423828125, 9.4609375, 10.07763671875, 10.6943359375, 11.31103515625, 11.927734375, 12.54443359375, 13.1611328125, 13.77783203125, 14.39453125, 15.01123046875, 15.6279296875, 16.24462890625, 16.861328125, 17.47802734375, 18.0947265625, 18.71142578125, 19.328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 4.0, 3.0, 13.0, 18.0, 15.0, 15.0, 20.0, 23.0, 14.0, 37.0, 38.0, 43.0, 48.0, 48.0, 52.0, 45.0, 47.0, 53.0, 45.0, 54.0, 34.0, 42.0, 35.0, 32.0, 34.0, 35.0, 24.0, 24.0, 18.0, 15.0, 10.0, 12.0, 6.0, 6.0, 3.0, 1.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91015625, -6.686279296875, -6.46240234375, -6.238525390625, -6.0146484375, -5.790771484375, -5.56689453125, -5.343017578125, -5.119140625, -4.895263671875, -4.67138671875, -4.447509765625, -4.2236328125, -3.999755859375, -3.77587890625, -3.552001953125, -3.328125, -3.104248046875, -2.88037109375, -2.656494140625, -2.4326171875, -2.208740234375, -1.98486328125, -1.760986328125, -1.537109375, -1.313232421875, -1.08935546875, -0.865478515625, -0.6416015625, -0.417724609375, -0.19384765625, 0.030029296875, 0.25390625, 0.477783203125, 0.70166015625, 0.925537109375, 1.1494140625, 1.373291015625, 1.59716796875, 1.821044921875, 2.044921875, 2.268798828125, 2.49267578125, 2.716552734375, 2.9404296875, 3.164306640625, 3.38818359375, 3.612060546875, 3.8359375, 4.059814453125, 4.28369140625, 4.507568359375, 4.7314453125, 4.955322265625, 5.17919921875, 5.403076171875, 5.626953125, 5.850830078125, 6.07470703125, 6.298583984375, 6.5224609375, 6.746337890625, 6.97021484375, 7.194091796875, 7.41796875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 5.0, 7.0, 4.0, 9.0, 22.0, 17.0, 29.0, 24.0, 39.0, 32.0, 35.0, 45.0, 54.0, 58.0, 57.0, 56.0, 51.0, 50.0, 46.0, 56.0, 43.0, 43.0, 30.0, 26.0, 23.0, 27.0, 24.0, 17.0, 13.0, 13.0, 9.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.233482360839844, -38.822452545166016, -37.41141891479492, -36.000389099121094, -34.58935546875, -33.17832565307617, -31.76729393005371, -30.35626220703125, -28.94523048400879, -27.534198760986328, -26.123167037963867, -24.712135314941406, -23.301105499267578, -21.890071868896484, -20.479042053222656, -19.068010330200195, -17.656978607177734, -16.245946884155273, -14.834915161132812, -13.423884391784668, -12.012852668762207, -10.601820945739746, -9.190790176391602, -7.779758453369141, -6.36872673034668, -4.957695007324219, -3.546663761138916, -2.1356325149536133, -0.7246007919311523, 0.6864309310913086, 2.097461700439453, 3.508493423461914, 4.919521331787109, 6.33055305480957, 7.741584300994873, 9.152615547180176, 10.563647270202637, 11.974678993225098, 13.385709762573242, 14.796741485595703, 16.207773208618164, 17.618804931640625, 19.029836654663086, 20.440868377685547, 21.851898193359375, 23.26293182373047, 24.673961639404297, 26.084993362426758, 27.49602508544922, 28.90705680847168, 30.31808853149414, 31.72911834716797, 33.14015197753906, 34.55118179321289, 35.96221160888672, 37.37324523925781, 38.784278869628906, 40.195308685302734, 41.60634231567383, 43.017372131347656, 44.42840576171875, 45.83943557739258, 47.250465393066406, 48.6614990234375, 50.07252883911133]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 9.0, 5.0, 6.0, 7.0, 10.0, 8.0, 10.0, 16.0, 6.0, 11.0, 17.0, 18.0, 19.0, 25.0, 38.0, 39.0, 19.0, 41.0, 36.0, 47.0, 36.0, 37.0, 42.0, 44.0, 49.0, 41.0, 45.0, 32.0, 24.0, 31.0, 36.0, 23.0, 25.0, 15.0, 23.0, 21.0, 17.0, 22.0, 14.0, 6.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-40.91275405883789, -39.78478240966797, -38.65681076049805, -37.528839111328125, -36.4008674621582, -35.27289581298828, -34.14492416381836, -33.01695251464844, -31.888978958129883, -30.76100730895996, -29.63303565979004, -28.505064010620117, -27.377090454101562, -26.24911880493164, -25.12114715576172, -23.993175506591797, -22.865203857421875, -21.737232208251953, -20.60926055908203, -19.48128890991211, -18.353317260742188, -17.225345611572266, -16.09737205505371, -14.969400405883789, -13.841428756713867, -12.713457107543945, -11.585485458374023, -10.457512855529785, -9.329541206359863, -8.201569557189941, -7.073597431182861, -5.945625305175781, -4.817649841308594, -3.6896779537200928, -2.561706066131592, -1.4337341785430908, -0.30576229095458984, 0.822209358215332, 1.950181484222412, 3.078153610229492, 4.206125259399414, 5.334096908569336, 6.462069034576416, 7.590041160583496, 8.718012809753418, 9.84598445892334, 10.973957061767578, 12.1019287109375, 13.229900360107422, 14.357872009277344, 15.485843658447266, 16.613815307617188, 17.74178695678711, 18.86975860595703, 19.997732162475586, 21.125703811645508, 22.25367546081543, 23.38164710998535, 24.509618759155273, 25.637590408325195, 26.76556396484375, 27.893535614013672, 29.021507263183594, 30.149478912353516, 31.277450561523438]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 18.0, 34.0, 43.0, 60.0, 88.0, 144.0, 215.0, 316.0, 471.0, 722.0, 1197.0, 1820.0, 2963.0, 4814.0, 7859.0, 12766.0, 21281.0, 35084.0, 58698.0, 99158.0, 168897.0, 292391.0, 493190.0, 748890.0, 804589.0, 580676.0, 352488.0, 207352.0, 121112.0, 71273.0, 42173.0, 25336.0, 15114.0, 9113.0, 5374.0, 3261.0, 1954.0, 1260.0, 752.0, 488.0, 277.0, 190.0, 118.0, 86.0, 52.0, 38.0, 21.0, 19.0, 10.0, 10.0, 2.0, 2.0, 2.0], "bins": [-54.0625, -52.52490234375, -50.9873046875, -49.44970703125, -47.912109375, -46.37451171875, -44.8369140625, -43.29931640625, -41.76171875, -40.22412109375, -38.6865234375, -37.14892578125, -35.611328125, -34.07373046875, -32.5361328125, -30.99853515625, -29.4609375, -27.92333984375, -26.3857421875, -24.84814453125, -23.310546875, -21.77294921875, -20.2353515625, -18.69775390625, -17.16015625, -15.62255859375, -14.0849609375, -12.54736328125, -11.009765625, -9.47216796875, -7.9345703125, -6.39697265625, -4.859375, -3.32177734375, -1.7841796875, -0.24658203125, 1.291015625, 2.82861328125, 4.3662109375, 5.90380859375, 7.44140625, 8.97900390625, 10.5166015625, 12.05419921875, 13.591796875, 15.12939453125, 16.6669921875, 18.20458984375, 19.7421875, 21.27978515625, 22.8173828125, 24.35498046875, 25.892578125, 27.43017578125, 28.9677734375, 30.50537109375, 32.04296875, 33.58056640625, 35.1181640625, 36.65576171875, 38.193359375, 39.73095703125, 41.2685546875, 42.80615234375, 44.34375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 1.0, 4.0, 6.0, 7.0, 13.0, 10.0, 3.0, 12.0, 11.0, 16.0, 14.0, 13.0, 20.0, 28.0, 26.0, 29.0, 41.0, 36.0, 36.0, 47.0, 36.0, 39.0, 39.0, 50.0, 47.0, 52.0, 34.0, 31.0, 32.0, 23.0, 36.0, 30.0, 24.0, 25.0, 14.0, 22.0, 19.0, 10.0, 14.0, 14.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-29.4375, -28.629150390625, -27.82080078125, -27.012451171875, -26.2041015625, -25.395751953125, -24.58740234375, -23.779052734375, -22.970703125, -22.162353515625, -21.35400390625, -20.545654296875, -19.7373046875, -18.928955078125, -18.12060546875, -17.312255859375, -16.50390625, -15.695556640625, -14.88720703125, -14.078857421875, -13.2705078125, -12.462158203125, -11.65380859375, -10.845458984375, -10.037109375, -9.228759765625, -8.42041015625, -7.612060546875, -6.8037109375, -5.995361328125, -5.18701171875, -4.378662109375, -3.5703125, -2.761962890625, -1.95361328125, -1.145263671875, -0.3369140625, 0.471435546875, 1.27978515625, 2.088134765625, 2.896484375, 3.704833984375, 4.51318359375, 5.321533203125, 6.1298828125, 6.938232421875, 7.74658203125, 8.554931640625, 9.36328125, 10.171630859375, 10.97998046875, 11.788330078125, 12.5966796875, 13.405029296875, 14.21337890625, 15.021728515625, 15.830078125, 16.638427734375, 17.44677734375, 18.255126953125, 19.0634765625, 19.871826171875, 20.68017578125, 21.488525390625, 22.296875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 10.0, 18.0, 22.0, 21.0, 48.0, 87.0, 125.0, 180.0, 308.0, 606.0, 1008.0, 1826.0, 3350.0, 5958.0, 11064.0, 20526.0, 38176.0, 72667.0, 135413.0, 248043.0, 431045.0, 670883.0, 820532.0, 696986.0, 456845.0, 265053.0, 145910.0, 77410.0, 41512.0, 22055.0, 11951.0, 6351.0, 3620.0, 1989.0, 1111.0, 621.0, 398.0, 208.0, 140.0, 81.0, 36.0, 25.0, 21.0, 16.0, 13.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.03125, -39.77099609375, -38.5107421875, -37.25048828125, -35.990234375, -34.72998046875, -33.4697265625, -32.20947265625, -30.94921875, -29.68896484375, -28.4287109375, -27.16845703125, -25.908203125, -24.64794921875, -23.3876953125, -22.12744140625, -20.8671875, -19.60693359375, -18.3466796875, -17.08642578125, -15.826171875, -14.56591796875, -13.3056640625, -12.04541015625, -10.78515625, -9.52490234375, -8.2646484375, -7.00439453125, -5.744140625, -4.48388671875, -3.2236328125, -1.96337890625, -0.703125, 0.55712890625, 1.8173828125, 3.07763671875, 4.337890625, 5.59814453125, 6.8583984375, 8.11865234375, 9.37890625, 10.63916015625, 11.8994140625, 13.15966796875, 14.419921875, 15.68017578125, 16.9404296875, 18.20068359375, 19.4609375, 20.72119140625, 21.9814453125, 23.24169921875, 24.501953125, 25.76220703125, 27.0224609375, 28.28271484375, 29.54296875, 30.80322265625, 32.0634765625, 33.32373046875, 34.583984375, 35.84423828125, 37.1044921875, 38.36474609375, 39.625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 14.0, 30.0, 24.0, 41.0, 46.0, 67.0, 69.0, 94.0, 98.0, 130.0, 148.0, 180.0, 180.0, 200.0, 235.0, 270.0, 288.0, 227.0, 258.0, 236.0, 216.0, 202.0, 167.0, 124.0, 95.0, 84.0, 67.0, 60.0, 57.0, 41.0, 25.0, 21.0, 17.0, 17.0, 4.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.688232421875, -14.22021484375, -13.752197265625, -13.2841796875, -12.816162109375, -12.34814453125, -11.880126953125, -11.412109375, -10.944091796875, -10.47607421875, -10.008056640625, -9.5400390625, -9.072021484375, -8.60400390625, -8.135986328125, -7.66796875, -7.199951171875, -6.73193359375, -6.263916015625, -5.7958984375, -5.327880859375, -4.85986328125, -4.391845703125, -3.923828125, -3.455810546875, -2.98779296875, -2.519775390625, -2.0517578125, -1.583740234375, -1.11572265625, -0.647705078125, -0.1796875, 0.288330078125, 0.75634765625, 1.224365234375, 1.6923828125, 2.160400390625, 2.62841796875, 3.096435546875, 3.564453125, 4.032470703125, 4.50048828125, 4.968505859375, 5.4365234375, 5.904541015625, 6.37255859375, 6.840576171875, 7.30859375, 7.776611328125, 8.24462890625, 8.712646484375, 9.1806640625, 9.648681640625, 10.11669921875, 10.584716796875, 11.052734375, 11.520751953125, 11.98876953125, 12.456787109375, 12.9248046875, 13.392822265625, 13.86083984375, 14.328857421875, 14.796875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 2.0, 14.0, 3.0, 11.0, 12.0, 15.0, 24.0, 24.0, 32.0, 42.0, 41.0, 42.0, 35.0, 40.0, 52.0, 66.0, 54.0, 64.0, 48.0, 54.0, 47.0, 39.0, 39.0, 32.0, 25.0, 31.0, 15.0, 22.0, 16.0, 10.0, 8.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.40579605102539, -28.250099182128906, -27.094402313232422, -25.938703536987305, -24.78300666809082, -23.627309799194336, -22.47161102294922, -21.315914154052734, -20.16021728515625, -19.004520416259766, -17.84882354736328, -16.693124771118164, -15.53742790222168, -14.381731033325195, -13.226033210754395, -12.070335388183594, -10.91463851928711, -9.758941650390625, -8.603243827819824, -7.447546482086182, -6.291849136352539, -5.1361517906188965, -3.980454444885254, -2.824756622314453, -1.6690597534179688, -0.5133624076843262, 0.6423349380493164, 1.798032283782959, 2.9537296295166016, 4.109426975250244, 5.265124320983887, 6.4208221435546875, 7.576515197753906, 8.73221206665039, 9.887909889221191, 11.043607711791992, 12.199304580688477, 13.355001449584961, 14.510699272155762, 15.666397094726562, 16.822093963623047, 17.97779083251953, 19.133487701416016, 20.289186477661133, 21.444883346557617, 22.6005802154541, 23.75627899169922, 24.911975860595703, 26.067672729492188, 27.223369598388672, 28.379066467285156, 29.534765243530273, 30.690462112426758, 31.846158981323242, 33.00185775756836, 34.157554626464844, 35.31325149536133, 36.46894836425781, 37.6246452331543, 38.78034210205078, 39.93604278564453, 41.091739654541016, 42.2474365234375, 43.403133392333984, 44.55883026123047]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 10.0, 7.0, 6.0, 9.0, 6.0, 18.0, 21.0, 26.0, 26.0, 26.0, 25.0, 21.0, 39.0, 39.0, 35.0, 43.0, 38.0, 35.0, 52.0, 45.0, 28.0, 37.0, 44.0, 44.0, 42.0, 33.0, 29.0, 26.0, 29.0, 24.0, 25.0, 16.0, 17.0, 14.0, 8.0, 9.0, 11.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-31.140579223632812, -30.188535690307617, -29.236492156982422, -28.28445053100586, -27.332406997680664, -26.38036346435547, -25.428321838378906, -24.47627830505371, -23.524234771728516, -22.57219123840332, -21.620147705078125, -20.668106079101562, -19.716062545776367, -18.764019012451172, -17.81197738647461, -16.859933853149414, -15.907890319824219, -14.955846786499023, -14.003804206848145, -13.051761627197266, -12.09971809387207, -11.147674560546875, -10.195631980895996, -9.243589401245117, -8.291545867919922, -7.339502811431885, -6.387459754943848, -5.4354166984558105, -4.483373641967773, -3.5313305854797363, -2.579287528991699, -1.627244472503662, -0.6751995086669922, 0.2768435478210449, 1.228886604309082, 2.180929660797119, 3.1329727172851562, 4.085015773773193, 5.0370588302612305, 5.989101886749268, 6.941144943237305, 7.893187999725342, 8.845231056213379, 9.797273635864258, 10.749317169189453, 11.701360702514648, 12.653403282165527, 13.605445861816406, 14.557489395141602, 15.509532928466797, 16.46157455444336, 17.413618087768555, 18.36566162109375, 19.317705154418945, 20.26974868774414, 21.221790313720703, 22.1738338470459, 23.125877380371094, 24.077919006347656, 25.02996253967285, 25.982006072998047, 26.934049606323242, 27.886093139648438, 28.838134765625, 29.790178298950195]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 5.0, 14.0, 20.0, 29.0, 31.0, 69.0, 109.0, 152.0, 271.0, 441.0, 735.0, 1230.0, 2119.0, 3577.0, 6233.0, 11135.0, 18571.0, 30696.0, 50133.0, 77452.0, 111214.0, 140879.0, 152386.0, 138337.0, 107848.0, 74506.0, 47997.0, 29425.0, 17821.0, 10457.0, 6167.0, 3487.0, 1969.0, 1192.0, 739.0, 444.0, 233.0, 153.0, 95.0, 73.0, 35.0, 26.0, 13.0, 10.0, 14.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.9375, -64.875, -62.8125, -60.75, -58.6875, -56.625, -54.5625, -52.5, -50.4375, -48.375, -46.3125, -44.25, -42.1875, -40.125, -38.0625, -36.0, -33.9375, -31.875, -29.8125, -27.75, -25.6875, -23.625, -21.5625, -19.5, -17.4375, -15.375, -13.3125, -11.25, -9.1875, -7.125, -5.0625, -3.0, -0.9375, 1.125, 3.1875, 5.25, 7.3125, 9.375, 11.4375, 13.5, 15.5625, 17.625, 19.6875, 21.75, 23.8125, 25.875, 27.9375, 30.0, 32.0625, 34.125, 36.1875, 38.25, 40.3125, 42.375, 44.4375, 46.5, 48.5625, 50.625, 52.6875, 54.75, 56.8125, 58.875, 60.9375, 63.0, 65.0625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 4.0, 5.0, 2.0, 3.0, 9.0, 6.0, 5.0, 18.0, 14.0, 19.0, 21.0, 15.0, 19.0, 25.0, 24.0, 34.0, 32.0, 35.0, 33.0, 30.0, 40.0, 45.0, 40.0, 43.0, 39.0, 43.0, 41.0, 42.0, 26.0, 37.0, 25.0, 32.0, 22.0, 22.0, 17.0, 27.0, 14.0, 19.0, 11.0, 10.0, 5.0, 9.0, 4.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-20.5625, -19.95654296875, -19.3505859375, -18.74462890625, -18.138671875, -17.53271484375, -16.9267578125, -16.32080078125, -15.71484375, -15.10888671875, -14.5029296875, -13.89697265625, -13.291015625, -12.68505859375, -12.0791015625, -11.47314453125, -10.8671875, -10.26123046875, -9.6552734375, -9.04931640625, -8.443359375, -7.83740234375, -7.2314453125, -6.62548828125, -6.01953125, -5.41357421875, -4.8076171875, -4.20166015625, -3.595703125, -2.98974609375, -2.3837890625, -1.77783203125, -1.171875, -0.56591796875, 0.0400390625, 0.64599609375, 1.251953125, 1.85791015625, 2.4638671875, 3.06982421875, 3.67578125, 4.28173828125, 4.8876953125, 5.49365234375, 6.099609375, 6.70556640625, 7.3115234375, 7.91748046875, 8.5234375, 9.12939453125, 9.7353515625, 10.34130859375, 10.947265625, 11.55322265625, 12.1591796875, 12.76513671875, 13.37109375, 13.97705078125, 14.5830078125, 15.18896484375, 15.794921875, 16.40087890625, 17.0068359375, 17.61279296875, 18.21875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 15.0, 14.0, 17.0, 22.0, 47.0, 96.0, 101.0, 198.0, 330.0, 484.0, 755.0, 1230.0, 1897.0, 2997.0, 4809.0, 7669.0, 12967.0, 21192.0, 34601.0, 57754.0, 94939.0, 146880.0, 188409.0, 169864.0, 116935.0, 72346.0, 43341.0, 26557.0, 15799.0, 9887.0, 6033.0, 3812.0, 2434.0, 1508.0, 995.0, 577.0, 383.0, 238.0, 157.0, 101.0, 60.0, 34.0, 20.0, 20.0, 14.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.8125, -69.6181640625, -67.423828125, -65.2294921875, -63.03515625, -60.8408203125, -58.646484375, -56.4521484375, -54.2578125, -52.0634765625, -49.869140625, -47.6748046875, -45.48046875, -43.2861328125, -41.091796875, -38.8974609375, -36.703125, -34.5087890625, -32.314453125, -30.1201171875, -27.92578125, -25.7314453125, -23.537109375, -21.3427734375, -19.1484375, -16.9541015625, -14.759765625, -12.5654296875, -10.37109375, -8.1767578125, -5.982421875, -3.7880859375, -1.59375, 0.6005859375, 2.794921875, 4.9892578125, 7.18359375, 9.3779296875, 11.572265625, 13.7666015625, 15.9609375, 18.1552734375, 20.349609375, 22.5439453125, 24.73828125, 26.9326171875, 29.126953125, 31.3212890625, 33.515625, 35.7099609375, 37.904296875, 40.0986328125, 42.29296875, 44.4873046875, 46.681640625, 48.8759765625, 51.0703125, 53.2646484375, 55.458984375, 57.6533203125, 59.84765625, 62.0419921875, 64.236328125, 66.4306640625, 68.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 4.0, 15.0, 7.0, 10.0, 16.0, 18.0, 23.0, 24.0, 31.0, 24.0, 25.0, 33.0, 37.0, 31.0, 38.0, 45.0, 44.0, 35.0, 32.0, 41.0, 36.0, 41.0, 33.0, 35.0, 26.0, 47.0, 37.0, 30.0, 28.0, 26.0, 25.0, 21.0, 15.0, 13.0, 8.0, 11.0, 2.0, 2.0, 8.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8515625, -14.3096923828125, -13.767822265625, -13.2259521484375, -12.68408203125, -12.1422119140625, -11.600341796875, -11.0584716796875, -10.5166015625, -9.9747314453125, -9.432861328125, -8.8909912109375, -8.34912109375, -7.8072509765625, -7.265380859375, -6.7235107421875, -6.181640625, -5.6397705078125, -5.097900390625, -4.5560302734375, -4.01416015625, -3.4722900390625, -2.930419921875, -2.3885498046875, -1.8466796875, -1.3048095703125, -0.762939453125, -0.2210693359375, 0.32080078125, 0.8626708984375, 1.404541015625, 1.9464111328125, 2.48828125, 3.0301513671875, 3.572021484375, 4.1138916015625, 4.65576171875, 5.1976318359375, 5.739501953125, 6.2813720703125, 6.8232421875, 7.3651123046875, 7.906982421875, 8.4488525390625, 8.99072265625, 9.5325927734375, 10.074462890625, 10.6163330078125, 11.158203125, 11.7000732421875, 12.241943359375, 12.7838134765625, 13.32568359375, 13.8675537109375, 14.409423828125, 14.9512939453125, 15.4931640625, 16.0350341796875, 16.576904296875, 17.1187744140625, 17.66064453125, 18.2025146484375, 18.744384765625, 19.2862548828125, 19.828125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 9.0, 17.0, 14.0, 21.0, 37.0, 50.0, 70.0, 89.0, 155.0, 168.0, 267.0, 393.0, 609.0, 852.0, 1307.0, 2097.0, 3635.0, 6763.0, 13749.0, 32039.0, 92044.0, 324319.0, 383908.0, 113928.0, 37795.0, 15916.0, 7673.0, 4089.0, 2351.0, 1320.0, 871.0, 562.0, 423.0, 284.0, 181.0, 136.0, 128.0, 68.0, 62.0, 51.0, 21.0, 25.0, 17.0, 15.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-62.46875, -60.52197265625, -58.5751953125, -56.62841796875, -54.681640625, -52.73486328125, -50.7880859375, -48.84130859375, -46.89453125, -44.94775390625, -43.0009765625, -41.05419921875, -39.107421875, -37.16064453125, -35.2138671875, -33.26708984375, -31.3203125, -29.37353515625, -27.4267578125, -25.47998046875, -23.533203125, -21.58642578125, -19.6396484375, -17.69287109375, -15.74609375, -13.79931640625, -11.8525390625, -9.90576171875, -7.958984375, -6.01220703125, -4.0654296875, -2.11865234375, -0.171875, 1.77490234375, 3.7216796875, 5.66845703125, 7.615234375, 9.56201171875, 11.5087890625, 13.45556640625, 15.40234375, 17.34912109375, 19.2958984375, 21.24267578125, 23.189453125, 25.13623046875, 27.0830078125, 29.02978515625, 30.9765625, 32.92333984375, 34.8701171875, 36.81689453125, 38.763671875, 40.71044921875, 42.6572265625, 44.60400390625, 46.55078125, 48.49755859375, 50.4443359375, 52.39111328125, 54.337890625, 56.28466796875, 58.2314453125, 60.17822265625, 62.125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 3.0, 8.0, 13.0, 13.0, 20.0, 21.0, 25.0, 36.0, 69.0, 84.0, 109.0, 129.0, 123.0, 102.0, 77.0, 51.0, 30.0, 22.0, 10.0, 18.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005649566650390625, -0.0054724812507629395, -0.005295395851135254, -0.005118310451507568, -0.004941225051879883, -0.004764139652252197, -0.004587054252624512, -0.004409968852996826, -0.004232883453369141, -0.004055798053741455, -0.0038787126541137695, -0.003701627254486084, -0.0035245418548583984, -0.003347456455230713, -0.0031703710556030273, -0.002993285655975342, -0.0028162002563476562, -0.0026391148567199707, -0.002462029457092285, -0.0022849440574645996, -0.002107858657836914, -0.0019307732582092285, -0.001753687858581543, -0.0015766024589538574, -0.0013995170593261719, -0.0012224316596984863, -0.0010453462600708008, -0.0008682608604431152, -0.0006911754608154297, -0.0005140900611877441, -0.0003370046615600586, -0.00015991926193237305, 1.71661376953125e-05, 0.00019425153732299805, 0.0003713369369506836, 0.0005484223365783691, 0.0007255077362060547, 0.0009025931358337402, 0.0010796785354614258, 0.0012567639350891113, 0.0014338493347167969, 0.0016109347343444824, 0.001788020133972168, 0.0019651055335998535, 0.002142190933227539, 0.0023192763328552246, 0.00249636173248291, 0.0026734471321105957, 0.0028505325317382812, 0.003027617931365967, 0.0032047033309936523, 0.003381788730621338, 0.0035588741302490234, 0.003735959529876709, 0.0039130449295043945, 0.00409013032913208, 0.004267215728759766, 0.004444301128387451, 0.004621386528015137, 0.004798471927642822, 0.004975557327270508, 0.005152642726898193, 0.005329728126525879, 0.0055068135261535645, 0.00568389892578125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 10.0, 16.0, 10.0, 23.0, 29.0, 45.0, 60.0, 84.0, 90.0, 122.0, 156.0, 212.0, 301.0, 425.0, 578.0, 841.0, 1114.0, 1771.0, 2765.0, 4595.0, 8464.0, 17606.0, 42407.0, 111086.0, 257671.0, 314130.0, 166599.0, 64011.0, 25612.0, 11467.0, 5897.0, 3378.0, 2175.0, 1382.0, 939.0, 689.0, 478.0, 355.0, 251.0, 198.0, 135.0, 99.0, 80.0, 54.0, 35.0, 40.0, 21.0, 20.0, 15.0, 2.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-32.40625, -31.3681640625, -30.330078125, -29.2919921875, -28.25390625, -27.2158203125, -26.177734375, -25.1396484375, -24.1015625, -23.0634765625, -22.025390625, -20.9873046875, -19.94921875, -18.9111328125, -17.873046875, -16.8349609375, -15.796875, -14.7587890625, -13.720703125, -12.6826171875, -11.64453125, -10.6064453125, -9.568359375, -8.5302734375, -7.4921875, -6.4541015625, -5.416015625, -4.3779296875, -3.33984375, -2.3017578125, -1.263671875, -0.2255859375, 0.8125, 1.8505859375, 2.888671875, 3.9267578125, 4.96484375, 6.0029296875, 7.041015625, 8.0791015625, 9.1171875, 10.1552734375, 11.193359375, 12.2314453125, 13.26953125, 14.3076171875, 15.345703125, 16.3837890625, 17.421875, 18.4599609375, 19.498046875, 20.5361328125, 21.57421875, 22.6123046875, 23.650390625, 24.6884765625, 25.7265625, 26.7646484375, 27.802734375, 28.8408203125, 29.87890625, 30.9169921875, 31.955078125, 32.9931640625, 34.03125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 9.0, 12.0, 12.0, 21.0, 27.0, 39.0, 67.0, 87.0, 118.0, 124.0, 110.0, 90.0, 66.0, 49.0, 43.0, 30.0, 21.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 7.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.6365966796875, -12.249755859375, -11.8629150390625, -11.47607421875, -11.0892333984375, -10.702392578125, -10.3155517578125, -9.9287109375, -9.5418701171875, -9.155029296875, -8.7681884765625, -8.38134765625, -7.9945068359375, -7.607666015625, -7.2208251953125, -6.833984375, -6.4471435546875, -6.060302734375, -5.6734619140625, -5.28662109375, -4.8997802734375, -4.512939453125, -4.1260986328125, -3.7392578125, -3.3524169921875, -2.965576171875, -2.5787353515625, -2.19189453125, -1.8050537109375, -1.418212890625, -1.0313720703125, -0.64453125, -0.2576904296875, 0.129150390625, 0.5159912109375, 0.90283203125, 1.2896728515625, 1.676513671875, 2.0633544921875, 2.4501953125, 2.8370361328125, 3.223876953125, 3.6107177734375, 3.99755859375, 4.3843994140625, 4.771240234375, 5.1580810546875, 5.544921875, 5.9317626953125, 6.318603515625, 6.7054443359375, 7.09228515625, 7.4791259765625, 7.865966796875, 8.2528076171875, 8.6396484375, 9.0264892578125, 9.413330078125, 9.8001708984375, 10.18701171875, 10.5738525390625, 10.960693359375, 11.3475341796875, 11.734375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 5.0, 7.0, 4.0, 9.0, 14.0, 9.0, 8.0, 23.0, 15.0, 20.0, 20.0, 39.0, 44.0, 40.0, 38.0, 45.0, 43.0, 48.0, 59.0, 52.0, 52.0, 61.0, 55.0, 39.0, 33.0, 34.0, 31.0, 32.0, 25.0, 19.0, 13.0, 11.0, 11.0, 10.0, 6.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.93026351928711, -20.15152359008789, -19.372785568237305, -18.59404754638672, -17.8153076171875, -17.03656768798828, -16.257829666137695, -15.479090690612793, -14.70035171508789, -13.921612739562988, -13.142873764038086, -12.364134788513184, -11.585395812988281, -10.806656837463379, -10.027917861938477, -9.249178886413574, -8.470439910888672, -7.6917009353637695, -6.912961959838867, -6.134222984313965, -5.3554840087890625, -4.57674503326416, -3.798006057739258, -3.0192670822143555, -2.240528106689453, -1.4617891311645508, -0.6830501556396484, 0.0956888198852539, 0.8744277954101562, 1.6531667709350586, 2.431905746459961, 3.2106447219848633, 3.9893856048583984, 4.768124580383301, 5.546863555908203, 6.3256025314331055, 7.104341506958008, 7.88308048248291, 8.661819458007812, 9.440558433532715, 10.219297409057617, 10.99803638458252, 11.776775360107422, 12.555514335632324, 13.334253311157227, 14.112992286682129, 14.891731262207031, 15.670470237731934, 16.449209213256836, 17.227947235107422, 18.00668716430664, 18.78542709350586, 19.564165115356445, 20.34290313720703, 21.12164306640625, 21.90038299560547, 22.679121017456055, 23.45785903930664, 24.23659896850586, 25.015338897705078, 25.794076919555664, 26.57281494140625, 27.35155487060547, 28.130294799804688, 28.909032821655273]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 7.0, 2.0, 8.0, 4.0, 9.0, 7.0, 11.0, 17.0, 20.0, 16.0, 17.0, 13.0, 18.0, 26.0, 21.0, 34.0, 33.0, 34.0, 34.0, 36.0, 37.0, 54.0, 45.0, 34.0, 27.0, 35.0, 41.0, 24.0, 42.0, 35.0, 35.0, 25.0, 26.0, 37.0, 19.0, 21.0, 11.0, 15.0, 14.0, 5.0, 8.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-18.94991683959961, -18.35383415222168, -17.757753372192383, -17.161670684814453, -16.565587997436523, -15.96950626373291, -15.373424530029297, -14.777341842651367, -14.181260108947754, -13.58517837524414, -12.989095687866211, -12.393013954162598, -11.796932220458984, -11.200849533081055, -10.604767799377441, -10.008686065673828, -9.412603378295898, -8.816521644592285, -8.220438957214355, -7.624357223510742, -7.028275012969971, -6.432192802429199, -5.836111068725586, -5.2400288581848145, -4.643946647644043, -4.0478644371032715, -3.451782464981079, -2.8557004928588867, -2.2596182823181152, -1.6635360717773438, -1.0674540996551514, -0.471372127532959, 0.12471199035644531, 0.7207940816879272, 1.3168761730194092, 1.9129582643508911, 2.509040355682373, 3.1051225662231445, 3.701204538345337, 4.297286510467529, 4.893368721008301, 5.489450931549072, 6.085533142089844, 6.681614875793457, 7.2776970863342285, 7.873779296875, 8.469861030578613, 9.065942764282227, 9.662025451660156, 10.25810718536377, 10.8541898727417, 11.450271606445312, 12.046354293823242, 12.642436027526855, 13.238517761230469, 13.834600448608398, 14.430682182312012, 15.026763916015625, 15.622846603393555, 16.218929290771484, 16.81501007080078, 17.41109275817871, 18.00717544555664, 18.603256225585938, 19.199338912963867]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 11.0, 10.0, 17.0, 14.0, 23.0, 31.0, 65.0, 99.0, 124.0, 185.0, 303.0, 400.0, 687.0, 987.0, 1536.0, 2315.0, 3568.0, 5245.0, 8097.0, 12217.0, 18713.0, 27616.0, 39665.0, 56286.0, 75608.0, 96796.0, 113196.0, 119923.0, 113718.0, 96491.0, 75889.0, 56172.0, 39708.0, 27481.0, 18799.0, 12576.0, 8121.0, 5455.0, 3556.0, 2344.0, 1591.0, 987.0, 677.0, 422.0, 278.0, 174.0, 135.0, 100.0, 48.0, 46.0, 20.0, 16.0, 10.0, 4.0, 4.0, 1.0, 3.0], "bins": [-18.65625, -18.1156005859375, -17.574951171875, -17.0343017578125, -16.49365234375, -15.9530029296875, -15.412353515625, -14.8717041015625, -14.3310546875, -13.7904052734375, -13.249755859375, -12.7091064453125, -12.16845703125, -11.6278076171875, -11.087158203125, -10.5465087890625, -10.005859375, -9.4652099609375, -8.924560546875, -8.3839111328125, -7.84326171875, -7.3026123046875, -6.761962890625, -6.2213134765625, -5.6806640625, -5.1400146484375, -4.599365234375, -4.0587158203125, -3.51806640625, -2.9774169921875, -2.436767578125, -1.8961181640625, -1.35546875, -0.8148193359375, -0.274169921875, 0.2664794921875, 0.80712890625, 1.3477783203125, 1.888427734375, 2.4290771484375, 2.9697265625, 3.5103759765625, 4.051025390625, 4.5916748046875, 5.13232421875, 5.6729736328125, 6.213623046875, 6.7542724609375, 7.294921875, 7.8355712890625, 8.376220703125, 8.9168701171875, 9.45751953125, 9.9981689453125, 10.538818359375, 11.0794677734375, 11.6201171875, 12.1607666015625, 12.701416015625, 13.2420654296875, 13.78271484375, 14.3233642578125, 14.864013671875, 15.4046630859375, 15.9453125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 4.0, 7.0, 12.0, 11.0, 16.0, 13.0, 13.0, 16.0, 17.0, 21.0, 22.0, 24.0, 25.0, 25.0, 41.0, 30.0, 38.0, 45.0, 37.0, 44.0, 38.0, 29.0, 35.0, 36.0, 28.0, 31.0, 44.0, 40.0, 31.0, 32.0, 24.0, 28.0, 16.0, 17.0, 19.0, 15.0, 13.0, 12.0, 7.0, 6.0, 8.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.0625, -16.50830078125, -15.9541015625, -15.39990234375, -14.845703125, -14.29150390625, -13.7373046875, -13.18310546875, -12.62890625, -12.07470703125, -11.5205078125, -10.96630859375, -10.412109375, -9.85791015625, -9.3037109375, -8.74951171875, -8.1953125, -7.64111328125, -7.0869140625, -6.53271484375, -5.978515625, -5.42431640625, -4.8701171875, -4.31591796875, -3.76171875, -3.20751953125, -2.6533203125, -2.09912109375, -1.544921875, -0.99072265625, -0.4365234375, 0.11767578125, 0.671875, 1.22607421875, 1.7802734375, 2.33447265625, 2.888671875, 3.44287109375, 3.9970703125, 4.55126953125, 5.10546875, 5.65966796875, 6.2138671875, 6.76806640625, 7.322265625, 7.87646484375, 8.4306640625, 8.98486328125, 9.5390625, 10.09326171875, 10.6474609375, 11.20166015625, 11.755859375, 12.31005859375, 12.8642578125, 13.41845703125, 13.97265625, 14.52685546875, 15.0810546875, 15.63525390625, 16.189453125, 16.74365234375, 17.2978515625, 17.85205078125, 18.40625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 11.0, 17.0, 35.0, 28.0, 58.0, 74.0, 145.0, 241.0, 350.0, 582.0, 963.0, 1604.0, 2644.0, 4558.0, 7877.0, 14256.0, 25127.0, 44033.0, 75277.0, 119143.0, 164357.0, 180092.0, 151866.0, 104894.0, 64333.0, 37105.0, 20903.0, 11626.0, 6774.0, 3809.0, 2389.0, 1340.0, 783.0, 442.0, 324.0, 191.0, 115.0, 73.0, 36.0, 33.0, 17.0, 12.0, 6.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.46875, -25.650390625, -24.83203125, -24.013671875, -23.1953125, -22.376953125, -21.55859375, -20.740234375, -19.921875, -19.103515625, -18.28515625, -17.466796875, -16.6484375, -15.830078125, -15.01171875, -14.193359375, -13.375, -12.556640625, -11.73828125, -10.919921875, -10.1015625, -9.283203125, -8.46484375, -7.646484375, -6.828125, -6.009765625, -5.19140625, -4.373046875, -3.5546875, -2.736328125, -1.91796875, -1.099609375, -0.28125, 0.537109375, 1.35546875, 2.173828125, 2.9921875, 3.810546875, 4.62890625, 5.447265625, 6.265625, 7.083984375, 7.90234375, 8.720703125, 9.5390625, 10.357421875, 11.17578125, 11.994140625, 12.8125, 13.630859375, 14.44921875, 15.267578125, 16.0859375, 16.904296875, 17.72265625, 18.541015625, 19.359375, 20.177734375, 20.99609375, 21.814453125, 22.6328125, 23.451171875, 24.26953125, 25.087890625, 25.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 0.0, 4.0, 6.0, 7.0, 8.0, 6.0, 8.0, 10.0, 11.0, 24.0, 23.0, 28.0, 20.0, 23.0, 24.0, 40.0, 39.0, 35.0, 37.0, 43.0, 50.0, 39.0, 51.0, 42.0, 33.0, 43.0, 34.0, 37.0, 34.0, 35.0, 34.0, 27.0, 24.0, 22.0, 15.0, 10.0, 15.0, 9.0, 8.0, 7.0, 9.0, 11.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.8624267578125, -11.443603515625, -11.0247802734375, -10.60595703125, -10.1871337890625, -9.768310546875, -9.3494873046875, -8.9306640625, -8.5118408203125, -8.093017578125, -7.6741943359375, -7.25537109375, -6.8365478515625, -6.417724609375, -5.9989013671875, -5.580078125, -5.1612548828125, -4.742431640625, -4.3236083984375, -3.90478515625, -3.4859619140625, -3.067138671875, -2.6483154296875, -2.2294921875, -1.8106689453125, -1.391845703125, -0.9730224609375, -0.55419921875, -0.1353759765625, 0.283447265625, 0.7022705078125, 1.12109375, 1.5399169921875, 1.958740234375, 2.3775634765625, 2.79638671875, 3.2152099609375, 3.634033203125, 4.0528564453125, 4.4716796875, 4.8905029296875, 5.309326171875, 5.7281494140625, 6.14697265625, 6.5657958984375, 6.984619140625, 7.4034423828125, 7.822265625, 8.2410888671875, 8.659912109375, 9.0787353515625, 9.49755859375, 9.9163818359375, 10.335205078125, 10.7540283203125, 11.1728515625, 11.5916748046875, 12.010498046875, 12.4293212890625, 12.84814453125, 13.2669677734375, 13.685791015625, 14.1046142578125, 14.5234375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 9.0, 13.0, 20.0, 25.0, 38.0, 60.0, 93.0, 113.0, 155.0, 242.0, 349.0, 580.0, 830.0, 1265.0, 2088.0, 3493.0, 6147.0, 10677.0, 18756.0, 35132.0, 65036.0, 115011.0, 182545.0, 212501.0, 166419.0, 101228.0, 55814.0, 30455.0, 16500.0, 9117.0, 5374.0, 3127.0, 1917.0, 1181.0, 720.0, 502.0, 311.0, 215.0, 149.0, 108.0, 68.0, 50.0, 38.0, 26.0, 19.0, 13.0, 7.0, 4.0, 0.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.703125, -16.1533203125, -15.603515625, -15.0537109375, -14.50390625, -13.9541015625, -13.404296875, -12.8544921875, -12.3046875, -11.7548828125, -11.205078125, -10.6552734375, -10.10546875, -9.5556640625, -9.005859375, -8.4560546875, -7.90625, -7.3564453125, -6.806640625, -6.2568359375, -5.70703125, -5.1572265625, -4.607421875, -4.0576171875, -3.5078125, -2.9580078125, -2.408203125, -1.8583984375, -1.30859375, -0.7587890625, -0.208984375, 0.3408203125, 0.890625, 1.4404296875, 1.990234375, 2.5400390625, 3.08984375, 3.6396484375, 4.189453125, 4.7392578125, 5.2890625, 5.8388671875, 6.388671875, 6.9384765625, 7.48828125, 8.0380859375, 8.587890625, 9.1376953125, 9.6875, 10.2373046875, 10.787109375, 11.3369140625, 11.88671875, 12.4365234375, 12.986328125, 13.5361328125, 14.0859375, 14.6357421875, 15.185546875, 15.7353515625, 16.28515625, 16.8349609375, 17.384765625, 17.9345703125, 18.484375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 12.0, 20.0, 28.0, 28.0, 33.0, 47.0, 57.0, 59.0, 72.0, 68.0, 83.0, 86.0, 67.0, 54.0, 62.0, 50.0, 31.0, 40.0, 21.0, 12.0, 9.0, 8.0, 13.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00156402587890625, -0.0015097260475158691, -0.0014554262161254883, -0.0014011263847351074, -0.0013468265533447266, -0.0012925267219543457, -0.0012382268905639648, -0.001183927059173584, -0.0011296272277832031, -0.0010753273963928223, -0.0010210275650024414, -0.0009667277336120605, -0.0009124279022216797, -0.0008581280708312988, -0.000803828239440918, -0.0007495284080505371, -0.0006952285766601562, -0.0006409287452697754, -0.0005866289138793945, -0.0005323290824890137, -0.0004780292510986328, -0.00042372941970825195, -0.0003694295883178711, -0.00031512975692749023, -0.0002608299255371094, -0.00020653009414672852, -0.00015223026275634766, -9.79304313659668e-05, -4.363059997558594e-05, 1.0669231414794922e-05, 6.496906280517578e-05, 0.00011926889419555664, 0.0001735687255859375, 0.00022786855697631836, 0.0002821683883666992, 0.0003364682197570801, 0.00039076805114746094, 0.0004450678825378418, 0.0004993677139282227, 0.0005536675453186035, 0.0006079673767089844, 0.0006622672080993652, 0.0007165670394897461, 0.000770866870880127, 0.0008251667022705078, 0.0008794665336608887, 0.0009337663650512695, 0.0009880661964416504, 0.0010423660278320312, 0.0010966658592224121, 0.001150965690612793, 0.0012052655220031738, 0.0012595653533935547, 0.0013138651847839355, 0.0013681650161743164, 0.0014224648475646973, 0.0014767646789550781, 0.001531064510345459, 0.0015853643417358398, 0.0016396641731262207, 0.0016939640045166016, 0.0017482638359069824, 0.0018025636672973633, 0.0018568634986877441, 0.001911163330078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 22.0, 21.0, 42.0, 56.0, 81.0, 118.0, 172.0, 239.0, 417.0, 544.0, 847.0, 1200.0, 1898.0, 2775.0, 4056.0, 6241.0, 9315.0, 14092.0, 21533.0, 32821.0, 49374.0, 72942.0, 102212.0, 130032.0, 141953.0, 130610.0, 102833.0, 74225.0, 50517.0, 33132.0, 21663.0, 14257.0, 9361.0, 6267.0, 4104.0, 2726.0, 1915.0, 1283.0, 855.0, 584.0, 405.0, 267.0, 179.0, 120.0, 75.0, 59.0, 40.0, 30.0, 20.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.32568359375, -9.9873046875, -9.64892578125, -9.310546875, -8.97216796875, -8.6337890625, -8.29541015625, -7.95703125, -7.61865234375, -7.2802734375, -6.94189453125, -6.603515625, -6.26513671875, -5.9267578125, -5.58837890625, -5.25, -4.91162109375, -4.5732421875, -4.23486328125, -3.896484375, -3.55810546875, -3.2197265625, -2.88134765625, -2.54296875, -2.20458984375, -1.8662109375, -1.52783203125, -1.189453125, -0.85107421875, -0.5126953125, -0.17431640625, 0.1640625, 0.50244140625, 0.8408203125, 1.17919921875, 1.517578125, 1.85595703125, 2.1943359375, 2.53271484375, 2.87109375, 3.20947265625, 3.5478515625, 3.88623046875, 4.224609375, 4.56298828125, 4.9013671875, 5.23974609375, 5.578125, 5.91650390625, 6.2548828125, 6.59326171875, 6.931640625, 7.27001953125, 7.6083984375, 7.94677734375, 8.28515625, 8.62353515625, 8.9619140625, 9.30029296875, 9.638671875, 9.97705078125, 10.3154296875, 10.65380859375, 10.9921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 16.0, 10.0, 12.0, 16.0, 25.0, 29.0, 30.0, 36.0, 26.0, 43.0, 44.0, 46.0, 50.0, 70.0, 61.0, 72.0, 55.0, 58.0, 58.0, 43.0, 28.0, 44.0, 23.0, 13.0, 14.0, 12.0, 16.0, 7.0, 4.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.03515625, -5.8533935546875, -5.671630859375, -5.4898681640625, -5.30810546875, -5.1263427734375, -4.944580078125, -4.7628173828125, -4.5810546875, -4.3992919921875, -4.217529296875, -4.0357666015625, -3.85400390625, -3.6722412109375, -3.490478515625, -3.3087158203125, -3.126953125, -2.9451904296875, -2.763427734375, -2.5816650390625, -2.39990234375, -2.2181396484375, -2.036376953125, -1.8546142578125, -1.6728515625, -1.4910888671875, -1.309326171875, -1.1275634765625, -0.94580078125, -0.7640380859375, -0.582275390625, -0.4005126953125, -0.21875, -0.0369873046875, 0.144775390625, 0.3265380859375, 0.50830078125, 0.6900634765625, 0.871826171875, 1.0535888671875, 1.2353515625, 1.4171142578125, 1.598876953125, 1.7806396484375, 1.96240234375, 2.1441650390625, 2.325927734375, 2.5076904296875, 2.689453125, 2.8712158203125, 3.052978515625, 3.2347412109375, 3.41650390625, 3.5982666015625, 3.780029296875, 3.9617919921875, 4.1435546875, 4.3253173828125, 4.507080078125, 4.6888427734375, 4.87060546875, 5.0523681640625, 5.234130859375, 5.4158935546875, 5.59765625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 8.0, 15.0, 11.0, 20.0, 21.0, 23.0, 18.0, 27.0, 35.0, 33.0, 39.0, 59.0, 52.0, 49.0, 52.0, 71.0, 64.0, 51.0, 52.0, 41.0, 40.0, 28.0, 28.0, 20.0, 28.0, 16.0, 20.0, 17.0, 15.0, 8.0, 5.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.777170181274414, -20.99321937561035, -20.209270477294922, -19.42531967163086, -18.641368865966797, -17.857418060302734, -17.073467254638672, -16.289518356323242, -15.50556755065918, -14.721616744995117, -13.937666893005371, -13.153717041015625, -12.369766235351562, -11.5858154296875, -10.801865577697754, -10.017915725708008, -9.233964920043945, -8.450014114379883, -7.666064262390137, -6.882113933563232, -6.098163604736328, -5.314213275909424, -4.5302629470825195, -3.7463126182556152, -2.962362289428711, -2.1784119606018066, -1.3944616317749023, -0.610511302947998, 0.17343902587890625, 0.9573893547058105, 1.7413396835327148, 2.525290012359619, 3.3092403411865234, 4.093190670013428, 4.877140998840332, 5.661091327667236, 6.445041656494141, 7.228991985321045, 8.01294231414795, 8.796892166137695, 9.580842971801758, 10.36479377746582, 11.148743629455566, 11.932693481445312, 12.716644287109375, 13.500595092773438, 14.284544944763184, 15.06849479675293, 15.852445602416992, 16.636396408081055, 17.420345306396484, 18.204296112060547, 18.98824691772461, 19.772197723388672, 20.556148529052734, 21.340097427368164, 22.124048233032227, 22.90799903869629, 23.69194793701172, 24.47589874267578, 25.259849548339844, 26.043800354003906, 26.82775115966797, 27.6117000579834, 28.39565086364746]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 5.0, 6.0, 16.0, 9.0, 12.0, 14.0, 14.0, 20.0, 23.0, 20.0, 23.0, 23.0, 38.0, 37.0, 22.0, 37.0, 31.0, 43.0, 36.0, 39.0, 42.0, 39.0, 40.0, 40.0, 32.0, 31.0, 31.0, 33.0, 30.0, 23.0, 20.0, 26.0, 20.0, 14.0, 20.0, 15.0, 11.0, 9.0, 7.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-18.282730102539062, -17.698646545410156, -17.11456298828125, -16.530481338500977, -15.94639778137207, -15.362314224243164, -14.778231620788574, -14.194149017333984, -13.610065460205078, -13.025981903076172, -12.441899299621582, -11.857816696166992, -11.273733139038086, -10.68964958190918, -10.10556697845459, -9.521484375, -8.937400817871094, -8.353317260742188, -7.769234657287598, -7.18515157699585, -6.601068496704102, -6.0169854164123535, -5.4329023361206055, -4.848819255828857, -4.264736175537109, -3.6806530952453613, -3.0965700149536133, -2.5124869346618652, -1.9284038543701172, -1.3443207740783691, -0.7602376937866211, -0.17615461349487305, 0.4079265594482422, 0.9920096397399902, 1.5760927200317383, 2.1601758003234863, 2.7442588806152344, 3.3283419609069824, 3.9124250411987305, 4.4965081214904785, 5.080591201782227, 5.664674282073975, 6.248757362365723, 6.832840442657471, 7.416923522949219, 8.001007080078125, 8.585089683532715, 9.169172286987305, 9.753255844116211, 10.337339401245117, 10.921422004699707, 11.505504608154297, 12.089588165283203, 12.67367172241211, 13.2577543258667, 13.841836929321289, 14.425920486450195, 15.010004043579102, 15.594086647033691, 16.17816925048828, 16.762252807617188, 17.346336364746094, 17.930419921875, 18.514501571655273, 19.09858512878418]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 9.0, 13.0, 22.0, 33.0, 39.0, 58.0, 104.0, 141.0, 251.0, 349.0, 522.0, 842.0, 1383.0, 2239.0, 3751.0, 6390.0, 10906.0, 19303.0, 34865.0, 65121.0, 126112.0, 251957.0, 498013.0, 840633.0, 944350.0, 661286.0, 352082.0, 175014.0, 89538.0, 47293.0, 25764.0, 14798.0, 8389.0, 4886.0, 2889.0, 1837.0, 1134.0, 678.0, 458.0, 240.0, 197.0, 134.0, 85.0, 55.0, 36.0, 24.0, 23.0, 7.0, 8.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.46875, -20.781494140625, -20.09423828125, -19.406982421875, -18.7197265625, -18.032470703125, -17.34521484375, -16.657958984375, -15.970703125, -15.283447265625, -14.59619140625, -13.908935546875, -13.2216796875, -12.534423828125, -11.84716796875, -11.159912109375, -10.47265625, -9.785400390625, -9.09814453125, -8.410888671875, -7.7236328125, -7.036376953125, -6.34912109375, -5.661865234375, -4.974609375, -4.287353515625, -3.60009765625, -2.912841796875, -2.2255859375, -1.538330078125, -0.85107421875, -0.163818359375, 0.5234375, 1.210693359375, 1.89794921875, 2.585205078125, 3.2724609375, 3.959716796875, 4.64697265625, 5.334228515625, 6.021484375, 6.708740234375, 7.39599609375, 8.083251953125, 8.7705078125, 9.457763671875, 10.14501953125, 10.832275390625, 11.51953125, 12.206787109375, 12.89404296875, 13.581298828125, 14.2685546875, 14.955810546875, 15.64306640625, 16.330322265625, 17.017578125, 17.704833984375, 18.39208984375, 19.079345703125, 19.7666015625, 20.453857421875, 21.14111328125, 21.828369140625, 22.515625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 13.0, 8.0, 7.0, 9.0, 21.0, 13.0, 22.0, 18.0, 23.0, 27.0, 20.0, 31.0, 26.0, 34.0, 40.0, 33.0, 41.0, 39.0, 44.0, 45.0, 54.0, 42.0, 37.0, 36.0, 24.0, 33.0, 39.0, 29.0, 21.0, 35.0, 12.0, 17.0, 16.0, 19.0, 11.0, 9.0, 9.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.125, -13.6710205078125, -13.217041015625, -12.7630615234375, -12.30908203125, -11.8551025390625, -11.401123046875, -10.9471435546875, -10.4931640625, -10.0391845703125, -9.585205078125, -9.1312255859375, -8.67724609375, -8.2232666015625, -7.769287109375, -7.3153076171875, -6.861328125, -6.4073486328125, -5.953369140625, -5.4993896484375, -5.04541015625, -4.5914306640625, -4.137451171875, -3.6834716796875, -3.2294921875, -2.7755126953125, -2.321533203125, -1.8675537109375, -1.41357421875, -0.9595947265625, -0.505615234375, -0.0516357421875, 0.40234375, 0.8563232421875, 1.310302734375, 1.7642822265625, 2.21826171875, 2.6722412109375, 3.126220703125, 3.5802001953125, 4.0341796875, 4.4881591796875, 4.942138671875, 5.3961181640625, 5.85009765625, 6.3040771484375, 6.758056640625, 7.2120361328125, 7.666015625, 8.1199951171875, 8.573974609375, 9.0279541015625, 9.48193359375, 9.9359130859375, 10.389892578125, 10.8438720703125, 11.2978515625, 11.7518310546875, 12.205810546875, 12.6597900390625, 13.11376953125, 13.5677490234375, 14.021728515625, 14.4757080078125, 14.9296875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 12.0, 11.0, 23.0, 25.0, 44.0, 74.0, 131.0, 197.0, 270.0, 476.0, 726.0, 1137.0, 1881.0, 3106.0, 5307.0, 8765.0, 14902.0, 25829.0, 45126.0, 77991.0, 136778.0, 232662.0, 385400.0, 585130.0, 738348.0, 686736.0, 493560.0, 310828.0, 184725.0, 106539.0, 61912.0, 35458.0, 20369.0, 11808.0, 6877.0, 4359.0, 2604.0, 1551.0, 938.0, 598.0, 375.0, 262.0, 164.0, 108.0, 63.0, 32.0, 27.0, 18.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.494140625, -16.92578125, -16.357421875, -15.7890625, -15.220703125, -14.65234375, -14.083984375, -13.515625, -12.947265625, -12.37890625, -11.810546875, -11.2421875, -10.673828125, -10.10546875, -9.537109375, -8.96875, -8.400390625, -7.83203125, -7.263671875, -6.6953125, -6.126953125, -5.55859375, -4.990234375, -4.421875, -3.853515625, -3.28515625, -2.716796875, -2.1484375, -1.580078125, -1.01171875, -0.443359375, 0.125, 0.693359375, 1.26171875, 1.830078125, 2.3984375, 2.966796875, 3.53515625, 4.103515625, 4.671875, 5.240234375, 5.80859375, 6.376953125, 6.9453125, 7.513671875, 8.08203125, 8.650390625, 9.21875, 9.787109375, 10.35546875, 10.923828125, 11.4921875, 12.060546875, 12.62890625, 13.197265625, 13.765625, 14.333984375, 14.90234375, 15.470703125, 16.0390625, 16.607421875, 17.17578125, 17.744140625, 18.3125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 4.0, 12.0, 7.0, 11.0, 18.0, 27.0, 31.0, 36.0, 45.0, 53.0, 80.0, 112.0, 133.0, 142.0, 154.0, 196.0, 191.0, 227.0, 263.0, 268.0, 263.0, 258.0, 244.0, 207.0, 175.0, 152.0, 155.0, 102.0, 103.0, 99.0, 76.0, 56.0, 36.0, 33.0, 28.0, 20.0, 19.0, 11.0, 7.0, 4.0, 4.0, 5.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.91156005859375, -6.6707763671875, -6.42999267578125, -6.189208984375, -5.94842529296875, -5.7076416015625, -5.46685791015625, -5.22607421875, -4.98529052734375, -4.7445068359375, -4.50372314453125, -4.262939453125, -4.02215576171875, -3.7813720703125, -3.54058837890625, -3.2998046875, -3.05902099609375, -2.8182373046875, -2.57745361328125, -2.336669921875, -2.09588623046875, -1.8551025390625, -1.61431884765625, -1.37353515625, -1.13275146484375, -0.8919677734375, -0.65118408203125, -0.410400390625, -0.16961669921875, 0.0711669921875, 0.31195068359375, 0.552734375, 0.79351806640625, 1.0343017578125, 1.27508544921875, 1.515869140625, 1.75665283203125, 1.9974365234375, 2.23822021484375, 2.47900390625, 2.71978759765625, 2.9605712890625, 3.20135498046875, 3.442138671875, 3.68292236328125, 3.9237060546875, 4.16448974609375, 4.4052734375, 4.64605712890625, 4.8868408203125, 5.12762451171875, 5.368408203125, 5.60919189453125, 5.8499755859375, 6.09075927734375, 6.33154296875, 6.57232666015625, 6.8131103515625, 7.05389404296875, 7.294677734375, 7.53546142578125, 7.7762451171875, 8.01702880859375, 8.2578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 11.0, 10.0, 9.0, 11.0, 17.0, 18.0, 17.0, 25.0, 33.0, 31.0, 33.0, 43.0, 58.0, 66.0, 57.0, 72.0, 54.0, 57.0, 61.0, 64.0, 43.0, 35.0, 35.0, 40.0, 21.0, 17.0, 17.0, 10.0, 5.0, 5.0, 7.0, 6.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.756803512573242, -16.042152404785156, -15.327502250671387, -14.6128511428833, -13.898200988769531, -13.183549880981445, -12.46889877319336, -11.754247665405273, -11.039597511291504, -10.324946403503418, -9.610296249389648, -8.895645141601562, -8.180994033813477, -7.466343879699707, -6.751692771911621, -6.037042140960693, -5.322391510009766, -4.607740879058838, -3.893090009689331, -3.178439140319824, -2.4637885093688965, -1.7491378784179688, -1.0344867706298828, -0.3198361396789551, 0.39481449127197266, 1.10946524143219, 1.8241159915924072, 2.538766860961914, 3.253417491912842, 3.9680681228637695, 4.6827192306518555, 5.397369861602783, 6.112022399902344, 6.8266730308532715, 7.541323661804199, 8.255974769592285, 8.970624923706055, 9.68527603149414, 10.399927139282227, 11.114578247070312, 11.829228401184082, 12.543879508972168, 13.258529663085938, 13.973180770874023, 14.68783187866211, 15.402482032775879, 16.11713409423828, 16.831783294677734, 17.54643440246582, 18.261085510253906, 18.975736618041992, 19.690387725830078, 20.40503692626953, 21.119688034057617, 21.834339141845703, 22.54899024963379, 23.263641357421875, 23.97829246520996, 24.692943572998047, 25.4075927734375, 26.122243881225586, 26.836894989013672, 27.551546096801758, 28.266197204589844, 28.980846405029297]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 7.0, 12.0, 6.0, 10.0, 7.0, 8.0, 15.0, 9.0, 20.0, 20.0, 18.0, 20.0, 24.0, 30.0, 26.0, 37.0, 21.0, 31.0, 40.0, 35.0, 43.0, 33.0, 46.0, 31.0, 39.0, 52.0, 43.0, 30.0, 27.0, 26.0, 27.0, 35.0, 22.0, 15.0, 24.0, 15.0, 10.0, 21.0, 12.0, 14.0, 10.0, 8.0, 8.0, 2.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.44165802001953, -15.951186180114746, -15.460715293884277, -14.970243453979492, -14.479771614074707, -13.989299774169922, -13.498828887939453, -13.008357048034668, -12.517885208129883, -12.027413368225098, -11.536942481994629, -11.046470642089844, -10.555998802185059, -10.065526962280273, -9.575056076049805, -9.08458423614502, -8.59411334991455, -8.103641510009766, -7.613170146942139, -7.122698783874512, -6.632226943969727, -6.1417555809021, -5.651284217834473, -5.1608123779296875, -4.6703410148620605, -4.179869651794434, -3.6893978118896484, -3.1989264488220215, -2.7084548473358154, -2.2179832458496094, -1.7275118827819824, -1.2370402812957764, -0.7465677261352539, -0.2560961842536926, 0.23437535762786865, 0.7248468399047852, 1.2153184413909912, 1.7057900428771973, 2.196261405944824, 2.6867330074310303, 3.1772046089172363, 3.6676762104034424, 4.158147811889648, 4.648619174957275, 5.139090538024902, 5.6295623779296875, 6.1200337409973145, 6.610505104064941, 7.100976943969727, 7.5914483070373535, 8.08191967010498, 8.572391510009766, 9.06286334991455, 9.553335189819336, 10.043806076049805, 10.53427791595459, 11.024749755859375, 11.51522159576416, 12.005692481994629, 12.496164321899414, 12.9866361618042, 13.477108001708984, 13.967578887939453, 14.458050727844238, 14.948521614074707]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 17.0, 23.0, 29.0, 45.0, 58.0, 102.0, 153.0, 230.0, 324.0, 502.0, 737.0, 1156.0, 1718.0, 2676.0, 4212.0, 6861.0, 10942.0, 17867.0, 29504.0, 49723.0, 83332.0, 135872.0, 192615.0, 186923.0, 127350.0, 77428.0, 45942.0, 27489.0, 16899.0, 10314.0, 6211.0, 3981.0, 2553.0, 1669.0, 1043.0, 666.0, 462.0, 299.0, 202.0, 128.0, 84.0, 69.0, 38.0, 30.0, 22.0, 18.0, 7.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0], "bins": [-53.875, -52.287109375, -50.69921875, -49.111328125, -47.5234375, -45.935546875, -44.34765625, -42.759765625, -41.171875, -39.583984375, -37.99609375, -36.408203125, -34.8203125, -33.232421875, -31.64453125, -30.056640625, -28.46875, -26.880859375, -25.29296875, -23.705078125, -22.1171875, -20.529296875, -18.94140625, -17.353515625, -15.765625, -14.177734375, -12.58984375, -11.001953125, -9.4140625, -7.826171875, -6.23828125, -4.650390625, -3.0625, -1.474609375, 0.11328125, 1.701171875, 3.2890625, 4.876953125, 6.46484375, 8.052734375, 9.640625, 11.228515625, 12.81640625, 14.404296875, 15.9921875, 17.580078125, 19.16796875, 20.755859375, 22.34375, 23.931640625, 25.51953125, 27.107421875, 28.6953125, 30.283203125, 31.87109375, 33.458984375, 35.046875, 36.634765625, 38.22265625, 39.810546875, 41.3984375, 42.986328125, 44.57421875, 46.162109375, 47.75]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 11.0, 14.0, 10.0, 12.0, 15.0, 10.0, 11.0, 18.0, 25.0, 25.0, 35.0, 29.0, 40.0, 30.0, 29.0, 46.0, 41.0, 44.0, 46.0, 28.0, 32.0, 47.0, 28.0, 39.0, 52.0, 32.0, 29.0, 32.0, 24.0, 22.0, 17.0, 20.0, 15.0, 11.0, 13.0, 15.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.567138671875, -12.14990234375, -11.732666015625, -11.3154296875, -10.898193359375, -10.48095703125, -10.063720703125, -9.646484375, -9.229248046875, -8.81201171875, -8.394775390625, -7.9775390625, -7.560302734375, -7.14306640625, -6.725830078125, -6.30859375, -5.891357421875, -5.47412109375, -5.056884765625, -4.6396484375, -4.222412109375, -3.80517578125, -3.387939453125, -2.970703125, -2.553466796875, -2.13623046875, -1.718994140625, -1.3017578125, -0.884521484375, -0.46728515625, -0.050048828125, 0.3671875, 0.784423828125, 1.20166015625, 1.618896484375, 2.0361328125, 2.453369140625, 2.87060546875, 3.287841796875, 3.705078125, 4.122314453125, 4.53955078125, 4.956787109375, 5.3740234375, 5.791259765625, 6.20849609375, 6.625732421875, 7.04296875, 7.460205078125, 7.87744140625, 8.294677734375, 8.7119140625, 9.129150390625, 9.54638671875, 9.963623046875, 10.380859375, 10.798095703125, 11.21533203125, 11.632568359375, 12.0498046875, 12.467041015625, 12.88427734375, 13.301513671875, 13.71875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 18.0, 23.0, 30.0, 47.0, 65.0, 98.0, 141.0, 205.0, 341.0, 530.0, 819.0, 1257.0, 1917.0, 3119.0, 5194.0, 8650.0, 15001.0, 26320.0, 48678.0, 91981.0, 177534.0, 261423.0, 188151.0, 98045.0, 51674.0, 28061.0, 15794.0, 9039.0, 5421.0, 3307.0, 2016.0, 1304.0, 784.0, 524.0, 342.0, 223.0, 156.0, 86.0, 78.0, 47.0, 33.0, 27.0, 16.0, 10.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-50.1875, -48.54443359375, -46.9013671875, -45.25830078125, -43.615234375, -41.97216796875, -40.3291015625, -38.68603515625, -37.04296875, -35.39990234375, -33.7568359375, -32.11376953125, -30.470703125, -28.82763671875, -27.1845703125, -25.54150390625, -23.8984375, -22.25537109375, -20.6123046875, -18.96923828125, -17.326171875, -15.68310546875, -14.0400390625, -12.39697265625, -10.75390625, -9.11083984375, -7.4677734375, -5.82470703125, -4.181640625, -2.53857421875, -0.8955078125, 0.74755859375, 2.390625, 4.03369140625, 5.6767578125, 7.31982421875, 8.962890625, 10.60595703125, 12.2490234375, 13.89208984375, 15.53515625, 17.17822265625, 18.8212890625, 20.46435546875, 22.107421875, 23.75048828125, 25.3935546875, 27.03662109375, 28.6796875, 30.32275390625, 31.9658203125, 33.60888671875, 35.251953125, 36.89501953125, 38.5380859375, 40.18115234375, 41.82421875, 43.46728515625, 45.1103515625, 46.75341796875, 48.396484375, 50.03955078125, 51.6826171875, 53.32568359375, 54.96875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 6.0, 3.0, 7.0, 11.0, 13.0, 18.0, 19.0, 18.0, 27.0, 27.0, 34.0, 45.0, 40.0, 46.0, 43.0, 43.0, 48.0, 43.0, 62.0, 39.0, 43.0, 55.0, 37.0, 27.0, 36.0, 33.0, 37.0, 30.0, 18.0, 17.0, 20.0, 13.0, 15.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -10.0281982421875, -9.665771484375, -9.3033447265625, -8.94091796875, -8.5784912109375, -8.216064453125, -7.8536376953125, -7.4912109375, -7.1287841796875, -6.766357421875, -6.4039306640625, -6.04150390625, -5.6790771484375, -5.316650390625, -4.9542236328125, -4.591796875, -4.2293701171875, -3.866943359375, -3.5045166015625, -3.14208984375, -2.7796630859375, -2.417236328125, -2.0548095703125, -1.6923828125, -1.3299560546875, -0.967529296875, -0.6051025390625, -0.24267578125, 0.1197509765625, 0.482177734375, 0.8446044921875, 1.20703125, 1.5694580078125, 1.931884765625, 2.2943115234375, 2.65673828125, 3.0191650390625, 3.381591796875, 3.7440185546875, 4.1064453125, 4.4688720703125, 4.831298828125, 5.1937255859375, 5.55615234375, 5.9185791015625, 6.281005859375, 6.6434326171875, 7.005859375, 7.3682861328125, 7.730712890625, 8.0931396484375, 8.45556640625, 8.8179931640625, 9.180419921875, 9.5428466796875, 9.9052734375, 10.2677001953125, 10.630126953125, 10.9925537109375, 11.35498046875, 11.7174072265625, 12.079833984375, 12.4422607421875, 12.8046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 15.0, 12.0, 41.0, 60.0, 77.0, 110.0, 148.0, 231.0, 346.0, 531.0, 757.0, 1231.0, 1917.0, 3209.0, 5513.0, 9689.0, 19914.0, 52765.0, 225760.0, 530416.0, 125548.0, 35235.0, 15135.0, 7856.0, 4540.0, 2717.0, 1664.0, 1077.0, 723.0, 431.0, 293.0, 195.0, 94.0, 91.0, 60.0, 62.0, 25.0, 17.0, 10.0, 13.0, 8.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.375, -66.3828125, -64.390625, -62.3984375, -60.40625, -58.4140625, -56.421875, -54.4296875, -52.4375, -50.4453125, -48.453125, -46.4609375, -44.46875, -42.4765625, -40.484375, -38.4921875, -36.5, -34.5078125, -32.515625, -30.5234375, -28.53125, -26.5390625, -24.546875, -22.5546875, -20.5625, -18.5703125, -16.578125, -14.5859375, -12.59375, -10.6015625, -8.609375, -6.6171875, -4.625, -2.6328125, -0.640625, 1.3515625, 3.34375, 5.3359375, 7.328125, 9.3203125, 11.3125, 13.3046875, 15.296875, 17.2890625, 19.28125, 21.2734375, 23.265625, 25.2578125, 27.25, 29.2421875, 31.234375, 33.2265625, 35.21875, 37.2109375, 39.203125, 41.1953125, 43.1875, 45.1796875, 47.171875, 49.1640625, 51.15625, 53.1484375, 55.140625, 57.1328125, 59.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 2.0, 5.0, 9.0, 7.0, 11.0, 8.0, 16.0, 25.0, 22.0, 45.0, 56.0, 126.0, 201.0, 204.0, 95.0, 53.0, 25.0, 18.0, 15.0, 11.0, 7.0, 9.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005359649658203125, -0.005191922187805176, -0.0050241947174072266, -0.004856467247009277, -0.004688739776611328, -0.004521012306213379, -0.00435328483581543, -0.0041855573654174805, -0.004017829895019531, -0.003850102424621582, -0.003682374954223633, -0.0035146474838256836, -0.0033469200134277344, -0.003179192543029785, -0.003011465072631836, -0.0028437376022338867, -0.0026760101318359375, -0.0025082826614379883, -0.002340555191040039, -0.00217282772064209, -0.0020051002502441406, -0.0018373727798461914, -0.0016696453094482422, -0.001501917839050293, -0.0013341903686523438, -0.0011664628982543945, -0.0009987354278564453, -0.0008310079574584961, -0.0006632804870605469, -0.0004955530166625977, -0.00032782554626464844, -0.00016009807586669922, 7.62939453125e-06, 0.00017535686492919922, 0.00034308433532714844, 0.0005108118057250977, 0.0006785392761230469, 0.0008462667465209961, 0.0010139942169189453, 0.0011817216873168945, 0.0013494491577148438, 0.001517176628112793, 0.0016849040985107422, 0.0018526315689086914, 0.0020203590393066406, 0.00218808650970459, 0.002355813980102539, 0.0025235414505004883, 0.0026912689208984375, 0.0028589963912963867, 0.003026723861694336, 0.003194451332092285, 0.0033621788024902344, 0.0035299062728881836, 0.003697633743286133, 0.003865361213684082, 0.004033088684082031, 0.0042008161544799805, 0.00436854362487793, 0.004536271095275879, 0.004703998565673828, 0.004871726036071777, 0.0050394535064697266, 0.005207180976867676, 0.005374908447265625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 4.0, 5.0, 6.0, 14.0, 9.0, 16.0, 23.0, 27.0, 58.0, 65.0, 126.0, 201.0, 256.0, 435.0, 692.0, 1118.0, 1775.0, 2922.0, 5036.0, 8551.0, 15089.0, 27969.0, 54827.0, 113401.0, 213150.0, 256957.0, 170330.0, 83515.0, 40932.0, 21552.0, 11986.0, 6979.0, 4055.0, 2421.0, 1511.0, 932.0, 555.0, 328.0, 254.0, 156.0, 111.0, 63.0, 50.0, 29.0, 27.0, 18.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.745361328125, -19.02197265625, -18.298583984375, -17.5751953125, -16.851806640625, -16.12841796875, -15.405029296875, -14.681640625, -13.958251953125, -13.23486328125, -12.511474609375, -11.7880859375, -11.064697265625, -10.34130859375, -9.617919921875, -8.89453125, -8.171142578125, -7.44775390625, -6.724365234375, -6.0009765625, -5.277587890625, -4.55419921875, -3.830810546875, -3.107421875, -2.384033203125, -1.66064453125, -0.937255859375, -0.2138671875, 0.509521484375, 1.23291015625, 1.956298828125, 2.6796875, 3.403076171875, 4.12646484375, 4.849853515625, 5.5732421875, 6.296630859375, 7.02001953125, 7.743408203125, 8.466796875, 9.190185546875, 9.91357421875, 10.636962890625, 11.3603515625, 12.083740234375, 12.80712890625, 13.530517578125, 14.25390625, 14.977294921875, 15.70068359375, 16.424072265625, 17.1474609375, 17.870849609375, 18.59423828125, 19.317626953125, 20.041015625, 20.764404296875, 21.48779296875, 22.211181640625, 22.9345703125, 23.657958984375, 24.38134765625, 25.104736328125, 25.828125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 11.0, 3.0, 13.0, 7.0, 4.0, 13.0, 14.0, 16.0, 20.0, 33.0, 38.0, 45.0, 33.0, 62.0, 64.0, 66.0, 62.0, 70.0, 75.0, 51.0, 51.0, 52.0, 26.0, 28.0, 20.0, 23.0, 21.0, 9.0, 13.0, 16.0, 8.0, 5.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.296875, -7.0692138671875, -6.841552734375, -6.6138916015625, -6.38623046875, -6.1585693359375, -5.930908203125, -5.7032470703125, -5.4755859375, -5.2479248046875, -5.020263671875, -4.7926025390625, -4.56494140625, -4.3372802734375, -4.109619140625, -3.8819580078125, -3.654296875, -3.4266357421875, -3.198974609375, -2.9713134765625, -2.74365234375, -2.5159912109375, -2.288330078125, -2.0606689453125, -1.8330078125, -1.6053466796875, -1.377685546875, -1.1500244140625, -0.92236328125, -0.6947021484375, -0.467041015625, -0.2393798828125, -0.01171875, 0.2159423828125, 0.443603515625, 0.6712646484375, 0.89892578125, 1.1265869140625, 1.354248046875, 1.5819091796875, 1.8095703125, 2.0372314453125, 2.264892578125, 2.4925537109375, 2.72021484375, 2.9478759765625, 3.175537109375, 3.4031982421875, 3.630859375, 3.8585205078125, 4.086181640625, 4.3138427734375, 4.54150390625, 4.7691650390625, 4.996826171875, 5.2244873046875, 5.4521484375, 5.6798095703125, 5.907470703125, 6.1351318359375, 6.36279296875, 6.5904541015625, 6.818115234375, 7.0457763671875, 7.2734375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 7.0, 6.0, 13.0, 15.0, 16.0, 26.0, 32.0, 33.0, 24.0, 34.0, 40.0, 41.0, 62.0, 50.0, 68.0, 67.0, 63.0, 63.0, 40.0, 53.0, 43.0, 44.0, 26.0, 21.0, 21.0, 14.0, 12.0, 12.0, 16.0, 17.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.731992721557617, -17.144939422607422, -16.557886123657227, -15.970832824707031, -15.383779525756836, -14.79672622680664, -14.209672927856445, -13.62261962890625, -13.035566329956055, -12.44851303100586, -11.861459732055664, -11.274406433105469, -10.687353134155273, -10.100299835205078, -9.513246536254883, -8.926193237304688, -8.339139938354492, -7.752086639404297, -7.165033340454102, -6.577980041503906, -5.990926742553711, -5.403873443603516, -4.81682014465332, -4.229766845703125, -3.6427135467529297, -3.0556602478027344, -2.468606948852539, -1.8815536499023438, -1.2945003509521484, -0.7074470520019531, -0.12039375305175781, 0.4666595458984375, 1.0537109375, 1.6407642364501953, 2.2278175354003906, 2.814870834350586, 3.4019241333007812, 3.9889774322509766, 4.576030731201172, 5.163084030151367, 5.7501373291015625, 6.337190628051758, 6.924243927001953, 7.511297225952148, 8.098350524902344, 8.685403823852539, 9.272457122802734, 9.85951042175293, 10.446563720703125, 11.03361701965332, 11.620670318603516, 12.207723617553711, 12.794776916503906, 13.381830215454102, 13.968883514404297, 14.555936813354492, 15.142990112304688, 15.730043411254883, 16.317096710205078, 16.904150009155273, 17.49120330810547, 18.078256607055664, 18.66530990600586, 19.252363204956055, 19.83941650390625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 10.0, 9.0, 3.0, 11.0, 8.0, 12.0, 15.0, 20.0, 21.0, 21.0, 24.0, 43.0, 25.0, 26.0, 27.0, 39.0, 35.0, 35.0, 43.0, 32.0, 36.0, 42.0, 40.0, 35.0, 37.0, 29.0, 46.0, 30.0, 29.0, 28.0, 31.0, 21.0, 12.0, 18.0, 18.0, 8.0, 13.0, 14.0, 13.0, 6.0, 6.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.537544250488281, -13.119582176208496, -12.701620101928711, -12.283658027648926, -11.86569595336914, -11.447732925415039, -11.029770851135254, -10.611808776855469, -10.193846702575684, -9.775884628295898, -9.357922554016113, -8.939960479736328, -8.521997451782227, -8.104036331176758, -7.686073303222656, -7.268111228942871, -6.850149154663086, -6.432187080383301, -6.014225006103516, -5.596262454986572, -5.178300380706787, -4.760338306427002, -4.342375755310059, -3.9244136810302734, -3.5064516067504883, -3.088489532470703, -2.670527219772339, -2.2525649070739746, -1.8346028327941895, -1.4166407585144043, -0.99867844581604, -0.5807161331176758, -0.16275405883789062, 0.2552081346511841, 0.6731703281402588, 1.0911325216293335, 1.5090947151184082, 1.9270567893981934, 2.3450191020965576, 2.762981414794922, 3.180943489074707, 3.598905563354492, 4.016867637634277, 4.434830188751221, 4.852792263031006, 5.270754337310791, 5.688716888427734, 6.1066789627075195, 6.524641036987305, 6.94260311126709, 7.360565185546875, 7.778527736663818, 8.196489334106445, 8.614452362060547, 9.032414436340332, 9.450376510620117, 9.868338584899902, 10.286300659179688, 10.704262733459473, 11.122224807739258, 11.54018783569336, 11.958148956298828, 12.37611198425293, 12.794074058532715, 13.2120361328125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 15.0, 17.0, 35.0, 43.0, 43.0, 68.0, 117.0, 188.0, 263.0, 420.0, 584.0, 966.0, 1453.0, 2194.0, 3312.0, 5101.0, 7665.0, 11510.0, 17013.0, 25047.0, 36329.0, 51203.0, 69625.0, 89380.0, 106633.0, 116517.0, 114517.0, 101045.0, 81939.0, 62711.0, 45189.0, 31718.0, 21828.0, 14578.0, 10102.0, 6569.0, 4261.0, 2892.0, 1855.0, 1244.0, 809.0, 539.0, 328.0, 239.0, 147.0, 99.0, 64.0, 53.0, 21.0, 20.0, 18.0, 15.0, 7.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.84375, -10.5133056640625, -10.182861328125, -9.8524169921875, -9.52197265625, -9.1915283203125, -8.861083984375, -8.5306396484375, -8.2001953125, -7.8697509765625, -7.539306640625, -7.2088623046875, -6.87841796875, -6.5479736328125, -6.217529296875, -5.8870849609375, -5.556640625, -5.2261962890625, -4.895751953125, -4.5653076171875, -4.23486328125, -3.9044189453125, -3.573974609375, -3.2435302734375, -2.9130859375, -2.5826416015625, -2.252197265625, -1.9217529296875, -1.59130859375, -1.2608642578125, -0.930419921875, -0.5999755859375, -0.26953125, 0.0609130859375, 0.391357421875, 0.7218017578125, 1.05224609375, 1.3826904296875, 1.713134765625, 2.0435791015625, 2.3740234375, 2.7044677734375, 3.034912109375, 3.3653564453125, 3.69580078125, 4.0262451171875, 4.356689453125, 4.6871337890625, 5.017578125, 5.3480224609375, 5.678466796875, 6.0089111328125, 6.33935546875, 6.6697998046875, 7.000244140625, 7.3306884765625, 7.6611328125, 7.9915771484375, 8.322021484375, 8.6524658203125, 8.98291015625, 9.3133544921875, 9.643798828125, 9.9742431640625, 10.3046875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 7.0, 12.0, 7.0, 7.0, 15.0, 11.0, 17.0, 32.0, 25.0, 20.0, 22.0, 23.0, 39.0, 43.0, 41.0, 33.0, 31.0, 32.0, 41.0, 50.0, 39.0, 38.0, 34.0, 38.0, 24.0, 33.0, 41.0, 41.0, 20.0, 34.0, 26.0, 22.0, 16.0, 14.0, 7.0, 6.0, 9.0, 6.0, 10.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0703125, -12.662353515625, -12.25439453125, -11.846435546875, -11.4384765625, -11.030517578125, -10.62255859375, -10.214599609375, -9.806640625, -9.398681640625, -8.99072265625, -8.582763671875, -8.1748046875, -7.766845703125, -7.35888671875, -6.950927734375, -6.54296875, -6.135009765625, -5.72705078125, -5.319091796875, -4.9111328125, -4.503173828125, -4.09521484375, -3.687255859375, -3.279296875, -2.871337890625, -2.46337890625, -2.055419921875, -1.6474609375, -1.239501953125, -0.83154296875, -0.423583984375, -0.015625, 0.392333984375, 0.80029296875, 1.208251953125, 1.6162109375, 2.024169921875, 2.43212890625, 2.840087890625, 3.248046875, 3.656005859375, 4.06396484375, 4.471923828125, 4.8798828125, 5.287841796875, 5.69580078125, 6.103759765625, 6.51171875, 6.919677734375, 7.32763671875, 7.735595703125, 8.1435546875, 8.551513671875, 8.95947265625, 9.367431640625, 9.775390625, 10.183349609375, 10.59130859375, 10.999267578125, 11.4072265625, 11.815185546875, 12.22314453125, 12.631103515625, 13.0390625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 7.0, 9.0, 10.0, 17.0, 35.0, 43.0, 61.0, 125.0, 170.0, 234.0, 377.0, 561.0, 797.0, 1199.0, 1813.0, 2798.0, 4238.0, 6656.0, 10348.0, 16055.0, 25578.0, 38449.0, 57980.0, 82791.0, 109264.0, 130881.0, 136108.0, 121355.0, 96107.0, 69374.0, 46867.0, 31312.0, 20035.0, 12936.0, 8303.0, 5302.0, 3459.0, 2277.0, 1502.0, 1035.0, 660.0, 470.0, 321.0, 193.0, 143.0, 103.0, 73.0, 43.0, 29.0, 17.0, 17.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-11.234375, -10.885986328125, -10.53759765625, -10.189208984375, -9.8408203125, -9.492431640625, -9.14404296875, -8.795654296875, -8.447265625, -8.098876953125, -7.75048828125, -7.402099609375, -7.0537109375, -6.705322265625, -6.35693359375, -6.008544921875, -5.66015625, -5.311767578125, -4.96337890625, -4.614990234375, -4.2666015625, -3.918212890625, -3.56982421875, -3.221435546875, -2.873046875, -2.524658203125, -2.17626953125, -1.827880859375, -1.4794921875, -1.131103515625, -0.78271484375, -0.434326171875, -0.0859375, 0.262451171875, 0.61083984375, 0.959228515625, 1.3076171875, 1.656005859375, 2.00439453125, 2.352783203125, 2.701171875, 3.049560546875, 3.39794921875, 3.746337890625, 4.0947265625, 4.443115234375, 4.79150390625, 5.139892578125, 5.48828125, 5.836669921875, 6.18505859375, 6.533447265625, 6.8818359375, 7.230224609375, 7.57861328125, 7.927001953125, 8.275390625, 8.623779296875, 8.97216796875, 9.320556640625, 9.6689453125, 10.017333984375, 10.36572265625, 10.714111328125, 11.0625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 9.0, 6.0, 10.0, 17.0, 9.0, 12.0, 13.0, 14.0, 21.0, 19.0, 22.0, 34.0, 34.0, 27.0, 30.0, 39.0, 36.0, 33.0, 45.0, 34.0, 48.0, 45.0, 33.0, 33.0, 26.0, 34.0, 35.0, 30.0, 27.0, 33.0, 31.0, 21.0, 22.0, 24.0, 15.0, 7.0, 9.0, 14.0, 7.0, 10.0, 3.0, 6.0, 11.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-9.0390625, -8.7698974609375, -8.500732421875, -8.2315673828125, -7.96240234375, -7.6932373046875, -7.424072265625, -7.1549072265625, -6.8857421875, -6.6165771484375, -6.347412109375, -6.0782470703125, -5.80908203125, -5.5399169921875, -5.270751953125, -5.0015869140625, -4.732421875, -4.4632568359375, -4.194091796875, -3.9249267578125, -3.65576171875, -3.3865966796875, -3.117431640625, -2.8482666015625, -2.5791015625, -2.3099365234375, -2.040771484375, -1.7716064453125, -1.50244140625, -1.2332763671875, -0.964111328125, -0.6949462890625, -0.42578125, -0.1566162109375, 0.112548828125, 0.3817138671875, 0.65087890625, 0.9200439453125, 1.189208984375, 1.4583740234375, 1.7275390625, 1.9967041015625, 2.265869140625, 2.5350341796875, 2.80419921875, 3.0733642578125, 3.342529296875, 3.6116943359375, 3.880859375, 4.1500244140625, 4.419189453125, 4.6883544921875, 4.95751953125, 5.2266845703125, 5.495849609375, 5.7650146484375, 6.0341796875, 6.3033447265625, 6.572509765625, 6.8416748046875, 7.11083984375, 7.3800048828125, 7.649169921875, 7.9183349609375, 8.1875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 4.0, 0.0, 9.0, 2.0, 7.0, 9.0, 24.0, 22.0, 37.0, 52.0, 81.0, 127.0, 198.0, 293.0, 499.0, 781.0, 1201.0, 2093.0, 3707.0, 6459.0, 11743.0, 21699.0, 41113.0, 79188.0, 144675.0, 215558.0, 213364.0, 141148.0, 77006.0, 40080.0, 21103.0, 11237.0, 6240.0, 3561.0, 2063.0, 1165.0, 728.0, 454.0, 267.0, 201.0, 128.0, 85.0, 43.0, 41.0, 20.0, 18.0, 6.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4609375, -12.0308837890625, -11.600830078125, -11.1707763671875, -10.74072265625, -10.3106689453125, -9.880615234375, -9.4505615234375, -9.0205078125, -8.5904541015625, -8.160400390625, -7.7303466796875, -7.30029296875, -6.8702392578125, -6.440185546875, -6.0101318359375, -5.580078125, -5.1500244140625, -4.719970703125, -4.2899169921875, -3.85986328125, -3.4298095703125, -2.999755859375, -2.5697021484375, -2.1396484375, -1.7095947265625, -1.279541015625, -0.8494873046875, -0.41943359375, 0.0106201171875, 0.440673828125, 0.8707275390625, 1.30078125, 1.7308349609375, 2.160888671875, 2.5909423828125, 3.02099609375, 3.4510498046875, 3.881103515625, 4.3111572265625, 4.7412109375, 5.1712646484375, 5.601318359375, 6.0313720703125, 6.46142578125, 6.8914794921875, 7.321533203125, 7.7515869140625, 8.181640625, 8.6116943359375, 9.041748046875, 9.4718017578125, 9.90185546875, 10.3319091796875, 10.761962890625, 11.1920166015625, 11.6220703125, 12.0521240234375, 12.482177734375, 12.9122314453125, 13.34228515625, 13.7723388671875, 14.202392578125, 14.6324462890625, 15.0625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 7.0, 11.0, 14.0, 18.0, 30.0, 35.0, 42.0, 56.0, 60.0, 77.0, 91.0, 93.0, 84.0, 70.0, 66.0, 58.0, 45.0, 37.0, 25.0, 25.0, 19.0, 16.0, 6.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010709762573242188, -0.0010169297456741333, -0.0009628832340240479, -0.0009088367223739624, -0.000854790210723877, -0.0008007436990737915, -0.0007466971874237061, -0.0006926506757736206, -0.0006386041641235352, -0.0005845576524734497, -0.0005305111408233643, -0.0004764646291732788, -0.00042241811752319336, -0.0003683716058731079, -0.00031432509422302246, -0.000260278582572937, -0.00020623207092285156, -0.0001521855592727661, -9.813904762268066e-05, -4.4092535972595215e-05, 9.953975677490234e-06, 6.400048732757568e-05, 0.00011804699897766113, 0.00017209351062774658, 0.00022614002227783203, 0.0002801865339279175, 0.00033423304557800293, 0.0003882795572280884, 0.00044232606887817383, 0.0004963725805282593, 0.0005504190921783447, 0.0006044656038284302, 0.0006585121154785156, 0.0007125586271286011, 0.0007666051387786865, 0.000820651650428772, 0.0008746981620788574, 0.0009287446737289429, 0.0009827911853790283, 0.0010368376970291138, 0.0010908842086791992, 0.0011449307203292847, 0.0011989772319793701, 0.0012530237436294556, 0.001307070255279541, 0.0013611167669296265, 0.001415163278579712, 0.0014692097902297974, 0.0015232563018798828, 0.0015773028135299683, 0.0016313493251800537, 0.0016853958368301392, 0.0017394423484802246, 0.00179348886013031, 0.0018475353717803955, 0.001901581883430481, 0.0019556283950805664, 0.002009674906730652, 0.0020637214183807373, 0.0021177679300308228, 0.002171814441680908, 0.0022258609533309937, 0.002279907464981079, 0.0023339539766311646, 0.00238800048828125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 7.0, 16.0, 11.0, 22.0, 31.0, 48.0, 71.0, 115.0, 160.0, 224.0, 421.0, 674.0, 1202.0, 2137.0, 4205.0, 8099.0, 16358.0, 33959.0, 70540.0, 141798.0, 229378.0, 235063.0, 152643.0, 77791.0, 37156.0, 17665.0, 8761.0, 4519.0, 2301.0, 1263.0, 702.0, 429.0, 255.0, 180.0, 115.0, 73.0, 47.0, 31.0, 22.0, 12.0, 17.0, 5.0, 7.0, 5.0, 6.0, 7.0, 0.0, 3.0, 0.0, 1.0], "bins": [-16.203125, -15.740966796875, -15.27880859375, -14.816650390625, -14.3544921875, -13.892333984375, -13.43017578125, -12.968017578125, -12.505859375, -12.043701171875, -11.58154296875, -11.119384765625, -10.6572265625, -10.195068359375, -9.73291015625, -9.270751953125, -8.80859375, -8.346435546875, -7.88427734375, -7.422119140625, -6.9599609375, -6.497802734375, -6.03564453125, -5.573486328125, -5.111328125, -4.649169921875, -4.18701171875, -3.724853515625, -3.2626953125, -2.800537109375, -2.33837890625, -1.876220703125, -1.4140625, -0.951904296875, -0.48974609375, -0.027587890625, 0.4345703125, 0.896728515625, 1.35888671875, 1.821044921875, 2.283203125, 2.745361328125, 3.20751953125, 3.669677734375, 4.1318359375, 4.593994140625, 5.05615234375, 5.518310546875, 5.98046875, 6.442626953125, 6.90478515625, 7.366943359375, 7.8291015625, 8.291259765625, 8.75341796875, 9.215576171875, 9.677734375, 10.139892578125, 10.60205078125, 11.064208984375, 11.5263671875, 11.988525390625, 12.45068359375, 12.912841796875, 13.375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 7.0, 12.0, 5.0, 14.0, 15.0, 15.0, 15.0, 21.0, 19.0, 26.0, 20.0, 36.0, 36.0, 35.0, 37.0, 58.0, 58.0, 55.0, 69.0, 50.0, 52.0, 53.0, 66.0, 35.0, 29.0, 35.0, 28.0, 16.0, 13.0, 16.0, 16.0, 7.0, 13.0, 3.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.275390625, -3.1685791015625, -3.061767578125, -2.9549560546875, -2.84814453125, -2.7413330078125, -2.634521484375, -2.5277099609375, -2.4208984375, -2.3140869140625, -2.207275390625, -2.1004638671875, -1.99365234375, -1.8868408203125, -1.780029296875, -1.6732177734375, -1.56640625, -1.4595947265625, -1.352783203125, -1.2459716796875, -1.13916015625, -1.0323486328125, -0.925537109375, -0.8187255859375, -0.7119140625, -0.6051025390625, -0.498291015625, -0.3914794921875, -0.28466796875, -0.1778564453125, -0.071044921875, 0.0357666015625, 0.142578125, 0.2493896484375, 0.356201171875, 0.4630126953125, 0.56982421875, 0.6766357421875, 0.783447265625, 0.8902587890625, 0.9970703125, 1.1038818359375, 1.210693359375, 1.3175048828125, 1.42431640625, 1.5311279296875, 1.637939453125, 1.7447509765625, 1.8515625, 1.9583740234375, 2.065185546875, 2.1719970703125, 2.27880859375, 2.3856201171875, 2.492431640625, 2.5992431640625, 2.7060546875, 2.8128662109375, 2.919677734375, 3.0264892578125, 3.13330078125, 3.2401123046875, 3.346923828125, 3.4537353515625, 3.560546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 6.0, 10.0, 7.0, 8.0, 16.0, 20.0, 19.0, 35.0, 30.0, 30.0, 49.0, 38.0, 63.0, 66.0, 64.0, 56.0, 73.0, 66.0, 57.0, 51.0, 49.0, 33.0, 24.0, 28.0, 22.0, 16.0, 10.0, 15.0, 12.0, 9.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.925884246826172, -18.344158172607422, -17.762432098388672, -17.180706024169922, -16.598979949951172, -16.017255783081055, -15.435529708862305, -14.853803634643555, -14.272077560424805, -13.690351486206055, -13.108625411987305, -12.526900291442871, -11.945174217224121, -11.363448143005371, -10.781723022460938, -10.199996948242188, -9.618270874023438, -9.036544799804688, -8.454818725585938, -7.873093605041504, -7.291367530822754, -6.709641456604004, -6.127915859222412, -5.54619026184082, -4.96446418762207, -4.38273811340332, -3.8010125160217285, -3.2192866802215576, -2.6375608444213867, -2.055835008621216, -1.474109172821045, -0.8923835754394531, -0.3106575012207031, 0.2710683345794678, 0.8527941703796387, 1.4345200061798096, 2.0162458419799805, 2.5979716777801514, 3.1796975135803223, 3.761423110961914, 4.343149185180664, 4.924875259399414, 5.506600856781006, 6.088326454162598, 6.670052528381348, 7.251778602600098, 7.8335041999816895, 8.415229797363281, 8.996955871582031, 9.578681945800781, 10.160408020019531, 10.742133140563965, 11.323859214782715, 11.905585289001465, 12.487310409545898, 13.069036483764648, 13.650762557983398, 14.232488632202148, 14.814214706420898, 15.395939826965332, 15.977665901184082, 16.559391021728516, 17.141117095947266, 17.722843170166016, 18.304569244384766]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 6.0, 6.0, 11.0, 12.0, 12.0, 11.0, 14.0, 14.0, 17.0, 16.0, 27.0, 18.0, 21.0, 24.0, 28.0, 35.0, 27.0, 36.0, 36.0, 33.0, 34.0, 39.0, 48.0, 33.0, 38.0, 35.0, 28.0, 39.0, 29.0, 20.0, 25.0, 16.0, 30.0, 27.0, 20.0, 14.0, 20.0, 14.0, 12.0, 11.0, 5.0, 13.0, 5.0, 9.0, 10.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.267414093017578, -10.8882417678833, -10.509069442749023, -10.129897117614746, -9.750724792480469, -9.371553421020508, -8.99238109588623, -8.613208770751953, -8.234036445617676, -7.854864120483398, -7.475691795349121, -7.096519947052002, -6.717347621917725, -6.338175296783447, -5.959003448486328, -5.579831123352051, -5.200658798217773, -4.821486473083496, -4.442314147949219, -4.0631422996521, -3.6839699745178223, -3.304797649383545, -2.9256255626678467, -2.5464534759521484, -2.167281150817871, -1.7881089448928833, -1.4089367389678955, -1.0297645330429077, -0.6505923271179199, -0.27142012119293213, 0.10775208473205566, 0.4869241714477539, 0.8660955429077148, 1.2452677488327026, 1.6244399547576904, 2.0036120414733887, 2.382784366607666, 2.7619566917419434, 3.1411287784576416, 3.52030086517334, 3.899473190307617, 4.2786455154418945, 4.657817840576172, 5.036989688873291, 5.416162014007568, 5.795334339141846, 6.174506187438965, 6.553678512573242, 6.9328508377075195, 7.312023162841797, 7.691195487976074, 8.070367813110352, 8.449539184570312, 8.82871150970459, 9.207883834838867, 9.587056159973145, 9.966228485107422, 10.3454008102417, 10.724573135375977, 11.103745460510254, 11.482917785644531, 11.862089157104492, 12.24126148223877, 12.620433807373047, 12.999606132507324]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 23.0, 34.0, 47.0, 63.0, 112.0, 147.0, 261.0, 425.0, 646.0, 1032.0, 1734.0, 2861.0, 4728.0, 7842.0, 12972.0, 22349.0, 37767.0, 66672.0, 119785.0, 221210.0, 407467.0, 672667.0, 842449.0, 730747.0, 466408.0, 255253.0, 137538.0, 75797.0, 43165.0, 24901.0, 14655.0, 8839.0, 5226.0, 3237.0, 1966.0, 1171.0, 760.0, 500.0, 311.0, 168.0, 133.0, 80.0, 44.0, 22.0, 16.0, 11.0, 7.0, 9.0, 2.0, 3.0, 2.0, 2.0], "bins": [-12.875, -12.5030517578125, -12.131103515625, -11.7591552734375, -11.38720703125, -11.0152587890625, -10.643310546875, -10.2713623046875, -9.8994140625, -9.5274658203125, -9.155517578125, -8.7835693359375, -8.41162109375, -8.0396728515625, -7.667724609375, -7.2957763671875, -6.923828125, -6.5518798828125, -6.179931640625, -5.8079833984375, -5.43603515625, -5.0640869140625, -4.692138671875, -4.3201904296875, -3.9482421875, -3.5762939453125, -3.204345703125, -2.8323974609375, -2.46044921875, -2.0885009765625, -1.716552734375, -1.3446044921875, -0.97265625, -0.6007080078125, -0.228759765625, 0.1431884765625, 0.51513671875, 0.8870849609375, 1.259033203125, 1.6309814453125, 2.0029296875, 2.3748779296875, 2.746826171875, 3.1187744140625, 3.49072265625, 3.8626708984375, 4.234619140625, 4.6065673828125, 4.978515625, 5.3504638671875, 5.722412109375, 6.0943603515625, 6.46630859375, 6.8382568359375, 7.210205078125, 7.5821533203125, 7.9541015625, 8.3260498046875, 8.697998046875, 9.0699462890625, 9.44189453125, 9.8138427734375, 10.185791015625, 10.5577392578125, 10.9296875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 3.0, 7.0, 8.0, 9.0, 9.0, 10.0, 14.0, 15.0, 18.0, 12.0, 16.0, 32.0, 23.0, 25.0, 29.0, 28.0, 31.0, 39.0, 36.0, 33.0, 30.0, 33.0, 37.0, 40.0, 44.0, 32.0, 39.0, 41.0, 24.0, 25.0, 29.0, 27.0, 32.0, 22.0, 22.0, 19.0, 16.0, 12.0, 12.0, 11.0, 13.0, 9.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-9.390625, -9.1121826171875, -8.833740234375, -8.5552978515625, -8.27685546875, -7.9984130859375, -7.719970703125, -7.4415283203125, -7.1630859375, -6.8846435546875, -6.606201171875, -6.3277587890625, -6.04931640625, -5.7708740234375, -5.492431640625, -5.2139892578125, -4.935546875, -4.6571044921875, -4.378662109375, -4.1002197265625, -3.82177734375, -3.5433349609375, -3.264892578125, -2.9864501953125, -2.7080078125, -2.4295654296875, -2.151123046875, -1.8726806640625, -1.59423828125, -1.3157958984375, -1.037353515625, -0.7589111328125, -0.48046875, -0.2020263671875, 0.076416015625, 0.3548583984375, 0.63330078125, 0.9117431640625, 1.190185546875, 1.4686279296875, 1.7470703125, 2.0255126953125, 2.303955078125, 2.5823974609375, 2.86083984375, 3.1392822265625, 3.417724609375, 3.6961669921875, 3.974609375, 4.2530517578125, 4.531494140625, 4.8099365234375, 5.08837890625, 5.3668212890625, 5.645263671875, 5.9237060546875, 6.2021484375, 6.4805908203125, 6.759033203125, 7.0374755859375, 7.31591796875, 7.5943603515625, 7.872802734375, 8.1512451171875, 8.4296875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 15.0, 6.0, 9.0, 13.0, 34.0, 32.0, 80.0, 114.0, 195.0, 317.0, 583.0, 980.0, 1920.0, 3210.0, 6255.0, 11884.0, 22534.0, 44803.0, 90057.0, 184016.0, 365729.0, 673924.0, 955697.0, 831436.0, 494061.0, 253448.0, 125490.0, 62254.0, 31148.0, 15625.0, 8379.0, 4444.0, 2360.0, 1394.0, 781.0, 407.0, 260.0, 166.0, 81.0, 54.0, 35.0, 27.0, 15.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.30029296875, -13.8349609375, -13.36962890625, -12.904296875, -12.43896484375, -11.9736328125, -11.50830078125, -11.04296875, -10.57763671875, -10.1123046875, -9.64697265625, -9.181640625, -8.71630859375, -8.2509765625, -7.78564453125, -7.3203125, -6.85498046875, -6.3896484375, -5.92431640625, -5.458984375, -4.99365234375, -4.5283203125, -4.06298828125, -3.59765625, -3.13232421875, -2.6669921875, -2.20166015625, -1.736328125, -1.27099609375, -0.8056640625, -0.34033203125, 0.125, 0.59033203125, 1.0556640625, 1.52099609375, 1.986328125, 2.45166015625, 2.9169921875, 3.38232421875, 3.84765625, 4.31298828125, 4.7783203125, 5.24365234375, 5.708984375, 6.17431640625, 6.6396484375, 7.10498046875, 7.5703125, 8.03564453125, 8.5009765625, 8.96630859375, 9.431640625, 9.89697265625, 10.3623046875, 10.82763671875, 11.29296875, 11.75830078125, 12.2236328125, 12.68896484375, 13.154296875, 13.61962890625, 14.0849609375, 14.55029296875, 15.015625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 6.0, 18.0, 25.0, 33.0, 34.0, 56.0, 93.0, 89.0, 140.0, 161.0, 184.0, 234.0, 258.0, 302.0, 320.0, 285.0, 323.0, 306.0, 210.0, 206.0, 166.0, 135.0, 115.0, 80.0, 75.0, 55.0, 42.0, 24.0, 21.0, 18.0, 18.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6717529296875, -4.491943359375, -4.3121337890625, -4.13232421875, -3.9525146484375, -3.772705078125, -3.5928955078125, -3.4130859375, -3.2332763671875, -3.053466796875, -2.8736572265625, -2.69384765625, -2.5140380859375, -2.334228515625, -2.1544189453125, -1.974609375, -1.7947998046875, -1.614990234375, -1.4351806640625, -1.25537109375, -1.0755615234375, -0.895751953125, -0.7159423828125, -0.5361328125, -0.3563232421875, -0.176513671875, 0.0032958984375, 0.18310546875, 0.3629150390625, 0.542724609375, 0.7225341796875, 0.90234375, 1.0821533203125, 1.261962890625, 1.4417724609375, 1.62158203125, 1.8013916015625, 1.981201171875, 2.1610107421875, 2.3408203125, 2.5206298828125, 2.700439453125, 2.8802490234375, 3.06005859375, 3.2398681640625, 3.419677734375, 3.5994873046875, 3.779296875, 3.9591064453125, 4.138916015625, 4.3187255859375, 4.49853515625, 4.6783447265625, 4.858154296875, 5.0379638671875, 5.2177734375, 5.3975830078125, 5.577392578125, 5.7572021484375, 5.93701171875, 6.1168212890625, 6.296630859375, 6.4764404296875, 6.65625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 13.0, 12.0, 22.0, 27.0, 22.0, 34.0, 37.0, 47.0, 48.0, 56.0, 77.0, 67.0, 66.0, 68.0, 60.0, 47.0, 42.0, 42.0, 38.0, 35.0, 30.0, 21.0, 21.0, 12.0, 10.0, 10.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.35306739807129, -15.859697341918945, -15.366327285766602, -14.872958183288574, -14.37958812713623, -13.886218070983887, -13.392848014831543, -12.899478912353516, -12.406108856201172, -11.912738800048828, -11.419368743896484, -10.925999641418457, -10.432629585266113, -9.93925952911377, -9.445889472961426, -8.952520370483398, -8.459150314331055, -7.965780258178711, -7.472410678863525, -6.979040622711182, -6.485671043395996, -5.992300987243652, -5.498930931091309, -5.005561351776123, -4.512190818786621, -4.018820762634277, -3.525451183319092, -3.032081127166748, -2.5387115478515625, -2.0453414916992188, -1.551971673965454, -1.0586018562316895, -0.5652322769165039, -0.07186242938041687, 0.42150741815567017, 0.9148772954940796, 1.4082471132278442, 1.9016170501708984, 2.394986867904663, 2.8883566856384277, 3.3817265033721924, 3.875096321105957, 4.368466377258301, 4.861835956573486, 5.35520601272583, 5.848575592041016, 6.341945648193359, 6.835315704345703, 7.328685283660889, 7.822055339813232, 8.315424919128418, 8.808794975280762, 9.302165031433105, 9.795534133911133, 10.288904190063477, 10.78227424621582, 11.275644302368164, 11.769014358520508, 12.262384414672852, 12.755753517150879, 13.249123573303223, 13.742493629455566, 14.23586368560791, 14.729232788085938, 15.222602844238281]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 7.0, 11.0, 5.0, 12.0, 13.0, 20.0, 28.0, 30.0, 24.0, 25.0, 32.0, 33.0, 36.0, 45.0, 38.0, 41.0, 41.0, 42.0, 45.0, 34.0, 35.0, 40.0, 36.0, 36.0, 34.0, 28.0, 30.0, 28.0, 20.0, 25.0, 19.0, 18.0, 11.0, 11.0, 14.0, 11.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.916070938110352, -10.57299518585205, -10.22991943359375, -9.88684368133545, -9.543767929077148, -9.200692176818848, -8.857616424560547, -8.514540672302246, -8.171464920043945, -7.8283891677856445, -7.485313415527344, -7.142237663269043, -6.799161911010742, -6.456086158752441, -6.113010406494141, -5.76993465423584, -5.426858901977539, -5.083783149719238, -4.7407073974609375, -4.397631645202637, -4.054555892944336, -3.711480140686035, -3.3684043884277344, -3.0253286361694336, -2.682252883911133, -2.339177131652832, -1.9961013793945312, -1.6530256271362305, -1.3099498748779297, -0.9668741226196289, -0.6237983703613281, -0.28072261810302734, 0.062354087829589844, 0.4054298400878906, 0.7485055923461914, 1.0915813446044922, 1.434657096862793, 1.7777328491210938, 2.1208086013793945, 2.4638843536376953, 2.806960105895996, 3.150035858154297, 3.4931116104125977, 3.8361873626708984, 4.179263114929199, 4.5223388671875, 4.865414619445801, 5.208490371704102, 5.551566123962402, 5.894641876220703, 6.237717628479004, 6.580793380737305, 6.9238691329956055, 7.266944885253906, 7.610020637512207, 7.953096389770508, 8.296172142028809, 8.63924789428711, 8.98232364654541, 9.325399398803711, 9.668475151062012, 10.011550903320312, 10.354626655578613, 10.697702407836914, 11.040778160095215]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 21.0, 15.0, 30.0, 42.0, 66.0, 88.0, 128.0, 169.0, 242.0, 348.0, 440.0, 606.0, 930.0, 1328.0, 2095.0, 3140.0, 4886.0, 8178.0, 14342.0, 29209.0, 71116.0, 198042.0, 357410.0, 210879.0, 75655.0, 30505.0, 15035.0, 8460.0, 5157.0, 3281.0, 2184.0, 1368.0, 904.0, 642.0, 471.0, 341.0, 240.0, 175.0, 112.0, 85.0, 42.0, 43.0, 26.0, 21.0, 16.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-33.78125, -32.6748046875, -31.568359375, -30.4619140625, -29.35546875, -28.2490234375, -27.142578125, -26.0361328125, -24.9296875, -23.8232421875, -22.716796875, -21.6103515625, -20.50390625, -19.3974609375, -18.291015625, -17.1845703125, -16.078125, -14.9716796875, -13.865234375, -12.7587890625, -11.65234375, -10.5458984375, -9.439453125, -8.3330078125, -7.2265625, -6.1201171875, -5.013671875, -3.9072265625, -2.80078125, -1.6943359375, -0.587890625, 0.5185546875, 1.625, 2.7314453125, 3.837890625, 4.9443359375, 6.05078125, 7.1572265625, 8.263671875, 9.3701171875, 10.4765625, 11.5830078125, 12.689453125, 13.7958984375, 14.90234375, 16.0087890625, 17.115234375, 18.2216796875, 19.328125, 20.4345703125, 21.541015625, 22.6474609375, 23.75390625, 24.8603515625, 25.966796875, 27.0732421875, 28.1796875, 29.2861328125, 30.392578125, 31.4990234375, 32.60546875, 33.7119140625, 34.818359375, 35.9248046875, 37.03125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 7.0, 3.0, 8.0, 6.0, 6.0, 6.0, 16.0, 14.0, 18.0, 21.0, 18.0, 33.0, 31.0, 30.0, 34.0, 31.0, 37.0, 43.0, 46.0, 34.0, 35.0, 34.0, 38.0, 35.0, 42.0, 45.0, 44.0, 41.0, 25.0, 26.0, 28.0, 22.0, 25.0, 18.0, 22.0, 15.0, 13.0, 14.0, 8.0, 6.0, 7.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.09375, -9.7830810546875, -9.472412109375, -9.1617431640625, -8.85107421875, -8.5404052734375, -8.229736328125, -7.9190673828125, -7.6083984375, -7.2977294921875, -6.987060546875, -6.6763916015625, -6.36572265625, -6.0550537109375, -5.744384765625, -5.4337158203125, -5.123046875, -4.8123779296875, -4.501708984375, -4.1910400390625, -3.88037109375, -3.5697021484375, -3.259033203125, -2.9483642578125, -2.6376953125, -2.3270263671875, -2.016357421875, -1.7056884765625, -1.39501953125, -1.0843505859375, -0.773681640625, -0.4630126953125, -0.15234375, 0.1583251953125, 0.468994140625, 0.7796630859375, 1.09033203125, 1.4010009765625, 1.711669921875, 2.0223388671875, 2.3330078125, 2.6436767578125, 2.954345703125, 3.2650146484375, 3.57568359375, 3.8863525390625, 4.197021484375, 4.5076904296875, 4.818359375, 5.1290283203125, 5.439697265625, 5.7503662109375, 6.06103515625, 6.3717041015625, 6.682373046875, 6.9930419921875, 7.3037109375, 7.6143798828125, 7.925048828125, 8.2357177734375, 8.54638671875, 8.8570556640625, 9.167724609375, 9.4783935546875, 9.7890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 21.0, 14.0, 27.0, 55.0, 69.0, 119.0, 199.0, 354.0, 500.0, 771.0, 1372.0, 2199.0, 3706.0, 6576.0, 11647.0, 22201.0, 46851.0, 115482.0, 302284.0, 311853.0, 121886.0, 49024.0, 22885.0, 12069.0, 6735.0, 3749.0, 2281.0, 1365.0, 842.0, 544.0, 325.0, 204.0, 124.0, 82.0, 44.0, 24.0, 15.0, 8.0, 9.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-34.90625, -33.88037109375, -32.8544921875, -31.82861328125, -30.802734375, -29.77685546875, -28.7509765625, -27.72509765625, -26.69921875, -25.67333984375, -24.6474609375, -23.62158203125, -22.595703125, -21.56982421875, -20.5439453125, -19.51806640625, -18.4921875, -17.46630859375, -16.4404296875, -15.41455078125, -14.388671875, -13.36279296875, -12.3369140625, -11.31103515625, -10.28515625, -9.25927734375, -8.2333984375, -7.20751953125, -6.181640625, -5.15576171875, -4.1298828125, -3.10400390625, -2.078125, -1.05224609375, -0.0263671875, 0.99951171875, 2.025390625, 3.05126953125, 4.0771484375, 5.10302734375, 6.12890625, 7.15478515625, 8.1806640625, 9.20654296875, 10.232421875, 11.25830078125, 12.2841796875, 13.31005859375, 14.3359375, 15.36181640625, 16.3876953125, 17.41357421875, 18.439453125, 19.46533203125, 20.4912109375, 21.51708984375, 22.54296875, 23.56884765625, 24.5947265625, 25.62060546875, 26.646484375, 27.67236328125, 28.6982421875, 29.72412109375, 30.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 6.0, 9.0, 12.0, 14.0, 23.0, 15.0, 29.0, 24.0, 27.0, 38.0, 38.0, 56.0, 35.0, 48.0, 44.0, 52.0, 57.0, 46.0, 39.0, 61.0, 37.0, 43.0, 37.0, 32.0, 31.0, 27.0, 20.0, 20.0, 15.0, 16.0, 12.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.93505859375, -8.6826171875, -8.43017578125, -8.177734375, -7.92529296875, -7.6728515625, -7.42041015625, -7.16796875, -6.91552734375, -6.6630859375, -6.41064453125, -6.158203125, -5.90576171875, -5.6533203125, -5.40087890625, -5.1484375, -4.89599609375, -4.6435546875, -4.39111328125, -4.138671875, -3.88623046875, -3.6337890625, -3.38134765625, -3.12890625, -2.87646484375, -2.6240234375, -2.37158203125, -2.119140625, -1.86669921875, -1.6142578125, -1.36181640625, -1.109375, -0.85693359375, -0.6044921875, -0.35205078125, -0.099609375, 0.15283203125, 0.4052734375, 0.65771484375, 0.91015625, 1.16259765625, 1.4150390625, 1.66748046875, 1.919921875, 2.17236328125, 2.4248046875, 2.67724609375, 2.9296875, 3.18212890625, 3.4345703125, 3.68701171875, 3.939453125, 4.19189453125, 4.4443359375, 4.69677734375, 4.94921875, 5.20166015625, 5.4541015625, 5.70654296875, 5.958984375, 6.21142578125, 6.4638671875, 6.71630859375, 6.96875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 25.0, 25.0, 33.0, 54.0, 83.0, 130.0, 169.0, 281.0, 380.0, 620.0, 955.0, 1488.0, 2471.0, 3965.0, 6912.0, 13229.0, 28187.0, 75232.0, 239899.0, 409027.0, 164285.0, 53671.0, 21813.0, 10506.0, 5873.0, 3480.0, 2012.0, 1246.0, 853.0, 579.0, 348.0, 234.0, 152.0, 100.0, 79.0, 37.0, 36.0, 19.0, 18.0, 12.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.73291015625, -17.1845703125, -16.63623046875, -16.087890625, -15.53955078125, -14.9912109375, -14.44287109375, -13.89453125, -13.34619140625, -12.7978515625, -12.24951171875, -11.701171875, -11.15283203125, -10.6044921875, -10.05615234375, -9.5078125, -8.95947265625, -8.4111328125, -7.86279296875, -7.314453125, -6.76611328125, -6.2177734375, -5.66943359375, -5.12109375, -4.57275390625, -4.0244140625, -3.47607421875, -2.927734375, -2.37939453125, -1.8310546875, -1.28271484375, -0.734375, -0.18603515625, 0.3623046875, 0.91064453125, 1.458984375, 2.00732421875, 2.5556640625, 3.10400390625, 3.65234375, 4.20068359375, 4.7490234375, 5.29736328125, 5.845703125, 6.39404296875, 6.9423828125, 7.49072265625, 8.0390625, 8.58740234375, 9.1357421875, 9.68408203125, 10.232421875, 10.78076171875, 11.3291015625, 11.87744140625, 12.42578125, 12.97412109375, 13.5224609375, 14.07080078125, 14.619140625, 15.16748046875, 15.7158203125, 16.26416015625, 16.8125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 13.0, 15.0, 32.0, 54.0, 113.0, 208.0, 239.0, 133.0, 69.0, 24.0, 19.0, 12.0, 10.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001354217529296875, -0.0013023614883422852, -0.0012505054473876953, -0.0011986494064331055, -0.0011467933654785156, -0.0010949373245239258, -0.001043081283569336, -0.000991225242614746, -0.0009393692016601562, -0.0008875131607055664, -0.0008356571197509766, -0.0007838010787963867, -0.0007319450378417969, -0.000680088996887207, -0.0006282329559326172, -0.0005763769149780273, -0.0005245208740234375, -0.00047266483306884766, -0.0004208087921142578, -0.00036895275115966797, -0.0003170967102050781, -0.0002652406692504883, -0.00021338462829589844, -0.0001615285873413086, -0.00010967254638671875, -5.7816505432128906e-05, -5.9604644775390625e-06, 4.589557647705078e-05, 9.775161743164062e-05, 0.00014960765838623047, 0.0002014636993408203, 0.00025331974029541016, 0.00030517578125, 0.00035703182220458984, 0.0004088878631591797, 0.00046074390411376953, 0.0005125999450683594, 0.0005644559860229492, 0.0006163120269775391, 0.0006681680679321289, 0.0007200241088867188, 0.0007718801498413086, 0.0008237361907958984, 0.0008755922317504883, 0.0009274482727050781, 0.000979304313659668, 0.0010311603546142578, 0.0010830163955688477, 0.0011348724365234375, 0.0011867284774780273, 0.0012385845184326172, 0.001290440559387207, 0.0013422966003417969, 0.0013941526412963867, 0.0014460086822509766, 0.0014978647232055664, 0.0015497207641601562, 0.001601576805114746, 0.001653432846069336, 0.0017052888870239258, 0.0017571449279785156, 0.0018090009689331055, 0.0018608570098876953, 0.0019127130508422852, 0.001964569091796875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 21.0, 25.0, 27.0, 42.0, 49.0, 92.0, 129.0, 189.0, 282.0, 383.0, 512.0, 775.0, 1145.0, 1684.0, 2394.0, 3477.0, 5543.0, 8707.0, 14192.0, 24289.0, 43735.0, 81277.0, 148599.0, 220437.0, 204474.0, 125885.0, 67957.0, 36777.0, 20851.0, 12106.0, 7511.0, 4847.0, 3155.0, 2081.0, 1532.0, 1052.0, 706.0, 464.0, 346.0, 253.0, 167.0, 119.0, 77.0, 54.0, 54.0, 15.0, 21.0, 13.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0], "bins": [-10.6953125, -10.37939453125, -10.0634765625, -9.74755859375, -9.431640625, -9.11572265625, -8.7998046875, -8.48388671875, -8.16796875, -7.85205078125, -7.5361328125, -7.22021484375, -6.904296875, -6.58837890625, -6.2724609375, -5.95654296875, -5.640625, -5.32470703125, -5.0087890625, -4.69287109375, -4.376953125, -4.06103515625, -3.7451171875, -3.42919921875, -3.11328125, -2.79736328125, -2.4814453125, -2.16552734375, -1.849609375, -1.53369140625, -1.2177734375, -0.90185546875, -0.5859375, -0.27001953125, 0.0458984375, 0.36181640625, 0.677734375, 0.99365234375, 1.3095703125, 1.62548828125, 1.94140625, 2.25732421875, 2.5732421875, 2.88916015625, 3.205078125, 3.52099609375, 3.8369140625, 4.15283203125, 4.46875, 4.78466796875, 5.1005859375, 5.41650390625, 5.732421875, 6.04833984375, 6.3642578125, 6.68017578125, 6.99609375, 7.31201171875, 7.6279296875, 7.94384765625, 8.259765625, 8.57568359375, 8.8916015625, 9.20751953125, 9.5234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 10.0, 14.0, 12.0, 12.0, 24.0, 25.0, 27.0, 46.0, 46.0, 47.0, 56.0, 65.0, 63.0, 65.0, 73.0, 58.0, 48.0, 46.0, 29.0, 35.0, 34.0, 20.0, 20.0, 20.0, 10.0, 10.0, 15.0, 9.0, 5.0, 7.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.77734375, -3.6678466796875, -3.558349609375, -3.4488525390625, -3.33935546875, -3.2298583984375, -3.120361328125, -3.0108642578125, -2.9013671875, -2.7918701171875, -2.682373046875, -2.5728759765625, -2.46337890625, -2.3538818359375, -2.244384765625, -2.1348876953125, -2.025390625, -1.9158935546875, -1.806396484375, -1.6968994140625, -1.58740234375, -1.4779052734375, -1.368408203125, -1.2589111328125, -1.1494140625, -1.0399169921875, -0.930419921875, -0.8209228515625, -0.71142578125, -0.6019287109375, -0.492431640625, -0.3829345703125, -0.2734375, -0.1639404296875, -0.054443359375, 0.0550537109375, 0.16455078125, 0.2740478515625, 0.383544921875, 0.4930419921875, 0.6025390625, 0.7120361328125, 0.821533203125, 0.9310302734375, 1.04052734375, 1.1500244140625, 1.259521484375, 1.3690185546875, 1.478515625, 1.5880126953125, 1.697509765625, 1.8070068359375, 1.91650390625, 2.0260009765625, 2.135498046875, 2.2449951171875, 2.3544921875, 2.4639892578125, 2.573486328125, 2.6829833984375, 2.79248046875, 2.9019775390625, 3.011474609375, 3.1209716796875, 3.23046875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 5.0, 10.0, 15.0, 18.0, 30.0, 27.0, 41.0, 33.0, 33.0, 56.0, 43.0, 58.0, 56.0, 67.0, 59.0, 46.0, 45.0, 57.0, 44.0, 36.0, 36.0, 29.0, 36.0, 22.0, 15.0, 15.0, 11.0, 11.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.397262573242188, -11.993739128112793, -11.590215682983398, -11.18669319152832, -10.783169746398926, -10.379646301269531, -9.976123809814453, -9.572600364685059, -9.169076919555664, -8.76555347442627, -8.362030029296875, -7.958507537841797, -7.554984092712402, -7.151460647583008, -6.7479376792907715, -6.344414710998535, -5.940891265869141, -5.537367820739746, -5.13384485244751, -4.730321884155273, -4.326798439025879, -3.9232752323150635, -3.519752025604248, -3.1162288188934326, -2.712705612182617, -2.3091824054718018, -1.9056591987609863, -1.502135992050171, -1.0986127853393555, -0.69508957862854, -0.2915663719177246, 0.11195683479309082, 0.5154809951782227, 0.9190042018890381, 1.3225274085998535, 1.726050615310669, 2.1295738220214844, 2.5330970287323, 2.9366202354431152, 3.3401434421539307, 3.743666648864746, 4.147190093994141, 4.550713062286377, 4.954236030578613, 5.357759475708008, 5.761282920837402, 6.164805889129639, 6.568328857421875, 6.9718523025512695, 7.375375747680664, 7.7788987159729, 8.182421684265137, 8.585945129394531, 8.989468574523926, 9.39299201965332, 9.796514511108398, 10.200037956237793, 10.603561401367188, 11.007083892822266, 11.41060733795166, 11.814130783081055, 12.21765422821045, 12.621177673339844, 13.024700164794922, 13.428223609924316]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 9.0, 6.0, 9.0, 6.0, 24.0, 20.0, 15.0, 12.0, 25.0, 30.0, 23.0, 34.0, 47.0, 31.0, 40.0, 42.0, 42.0, 33.0, 29.0, 41.0, 41.0, 44.0, 38.0, 24.0, 42.0, 27.0, 34.0, 30.0, 23.0, 18.0, 15.0, 34.0, 16.0, 13.0, 18.0, 8.0, 10.0, 3.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.400344848632812, -9.10395622253418, -8.807567596435547, -8.511178970336914, -8.214790344238281, -7.918401718139648, -7.622012615203857, -7.325623989105225, -7.029235363006592, -6.732846736907959, -6.436458110809326, -6.140069484710693, -5.843680381774902, -5.5472917556762695, -5.250903129577637, -4.954514503479004, -4.658125877380371, -4.361737251281738, -4.0653486251831055, -3.7689597606658936, -3.4725711345672607, -3.176182508468628, -2.879793643951416, -2.583405017852783, -2.2870163917541504, -1.9906277656555176, -1.6942390203475952, -1.3978502750396729, -1.10146164894104, -0.8050730228424072, -0.5086842775344849, -0.2122955322265625, 0.08409404754638672, 0.3804827332496643, 0.6768714189529419, 0.9732601046562195, 1.269648790359497, 1.5660374164581299, 1.8624261617660522, 2.1588149070739746, 2.4552035331726074, 2.7515921592712402, 3.047980785369873, 3.344369649887085, 3.6407582759857178, 3.9371469020843506, 4.2335357666015625, 4.529924392700195, 4.826313018798828, 5.122701644897461, 5.419090270996094, 5.715478897094727, 6.011867523193359, 6.308256149291992, 6.604645252227783, 6.901033878326416, 7.197422504425049, 7.493811130523682, 7.7901997566223145, 8.086588859558105, 8.382977485656738, 8.679366111755371, 8.975754737854004, 9.272143363952637, 9.56853199005127]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 7.0, 14.0, 16.0, 33.0, 50.0, 75.0, 117.0, 153.0, 242.0, 360.0, 596.0, 888.0, 1447.0, 2242.0, 3461.0, 5398.0, 8505.0, 13307.0, 21045.0, 32578.0, 48962.0, 70915.0, 98560.0, 124216.0, 136167.0, 130083.0, 107818.0, 80482.0, 56051.0, 37048.0, 24173.0, 15801.0, 10124.0, 6410.0, 4009.0, 2570.0, 1594.0, 1081.0, 667.0, 437.0, 293.0, 200.0, 118.0, 102.0, 59.0, 29.0, 22.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-9.2890625, -9.01318359375, -8.7373046875, -8.46142578125, -8.185546875, -7.90966796875, -7.6337890625, -7.35791015625, -7.08203125, -6.80615234375, -6.5302734375, -6.25439453125, -5.978515625, -5.70263671875, -5.4267578125, -5.15087890625, -4.875, -4.59912109375, -4.3232421875, -4.04736328125, -3.771484375, -3.49560546875, -3.2197265625, -2.94384765625, -2.66796875, -2.39208984375, -2.1162109375, -1.84033203125, -1.564453125, -1.28857421875, -1.0126953125, -0.73681640625, -0.4609375, -0.18505859375, 0.0908203125, 0.36669921875, 0.642578125, 0.91845703125, 1.1943359375, 1.47021484375, 1.74609375, 2.02197265625, 2.2978515625, 2.57373046875, 2.849609375, 3.12548828125, 3.4013671875, 3.67724609375, 3.953125, 4.22900390625, 4.5048828125, 4.78076171875, 5.056640625, 5.33251953125, 5.6083984375, 5.88427734375, 6.16015625, 6.43603515625, 6.7119140625, 6.98779296875, 7.263671875, 7.53955078125, 7.8154296875, 8.09130859375, 8.3671875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 6.0, 4.0, 4.0, 3.0, 9.0, 7.0, 15.0, 11.0, 24.0, 16.0, 25.0, 24.0, 25.0, 27.0, 32.0, 45.0, 33.0, 38.0, 33.0, 42.0, 43.0, 38.0, 42.0, 31.0, 37.0, 40.0, 29.0, 30.0, 32.0, 25.0, 27.0, 23.0, 29.0, 22.0, 17.0, 18.0, 20.0, 12.0, 14.0, 7.0, 9.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.71875, -9.438232421875, -9.15771484375, -8.877197265625, -8.5966796875, -8.316162109375, -8.03564453125, -7.755126953125, -7.474609375, -7.194091796875, -6.91357421875, -6.633056640625, -6.3525390625, -6.072021484375, -5.79150390625, -5.510986328125, -5.23046875, -4.949951171875, -4.66943359375, -4.388916015625, -4.1083984375, -3.827880859375, -3.54736328125, -3.266845703125, -2.986328125, -2.705810546875, -2.42529296875, -2.144775390625, -1.8642578125, -1.583740234375, -1.30322265625, -1.022705078125, -0.7421875, -0.461669921875, -0.18115234375, 0.099365234375, 0.3798828125, 0.660400390625, 0.94091796875, 1.221435546875, 1.501953125, 1.782470703125, 2.06298828125, 2.343505859375, 2.6240234375, 2.904541015625, 3.18505859375, 3.465576171875, 3.74609375, 4.026611328125, 4.30712890625, 4.587646484375, 4.8681640625, 5.148681640625, 5.42919921875, 5.709716796875, 5.990234375, 6.270751953125, 6.55126953125, 6.831787109375, 7.1123046875, 7.392822265625, 7.67333984375, 7.953857421875, 8.234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 12.0, 21.0, 26.0, 52.0, 58.0, 111.0, 186.0, 268.0, 404.0, 678.0, 1112.0, 1969.0, 3129.0, 5303.0, 8832.0, 15104.0, 25813.0, 42076.0, 68583.0, 102174.0, 138942.0, 159001.0, 148712.0, 117667.0, 80353.0, 51055.0, 31179.0, 18562.0, 11075.0, 6389.0, 3845.0, 2258.0, 1357.0, 833.0, 532.0, 324.0, 219.0, 134.0, 78.0, 57.0, 26.0, 16.0, 14.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.44775390625, -8.1533203125, -7.85888671875, -7.564453125, -7.27001953125, -6.9755859375, -6.68115234375, -6.38671875, -6.09228515625, -5.7978515625, -5.50341796875, -5.208984375, -4.91455078125, -4.6201171875, -4.32568359375, -4.03125, -3.73681640625, -3.4423828125, -3.14794921875, -2.853515625, -2.55908203125, -2.2646484375, -1.97021484375, -1.67578125, -1.38134765625, -1.0869140625, -0.79248046875, -0.498046875, -0.20361328125, 0.0908203125, 0.38525390625, 0.6796875, 0.97412109375, 1.2685546875, 1.56298828125, 1.857421875, 2.15185546875, 2.4462890625, 2.74072265625, 3.03515625, 3.32958984375, 3.6240234375, 3.91845703125, 4.212890625, 4.50732421875, 4.8017578125, 5.09619140625, 5.390625, 5.68505859375, 5.9794921875, 6.27392578125, 6.568359375, 6.86279296875, 7.1572265625, 7.45166015625, 7.74609375, 8.04052734375, 8.3349609375, 8.62939453125, 8.923828125, 9.21826171875, 9.5126953125, 9.80712890625, 10.1015625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 8.0, 8.0, 19.0, 19.0, 16.0, 14.0, 19.0, 28.0, 32.0, 30.0, 37.0, 41.0, 27.0, 38.0, 34.0, 37.0, 57.0, 52.0, 41.0, 32.0, 39.0, 34.0, 38.0, 32.0, 38.0, 39.0, 28.0, 23.0, 17.0, 24.0, 12.0, 18.0, 15.0, 9.0, 6.0, 6.0, 11.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.07421875, -6.8753662109375, -6.676513671875, -6.4776611328125, -6.27880859375, -6.0799560546875, -5.881103515625, -5.6822509765625, -5.4833984375, -5.2845458984375, -5.085693359375, -4.8868408203125, -4.68798828125, -4.4891357421875, -4.290283203125, -4.0914306640625, -3.892578125, -3.6937255859375, -3.494873046875, -3.2960205078125, -3.09716796875, -2.8983154296875, -2.699462890625, -2.5006103515625, -2.3017578125, -2.1029052734375, -1.904052734375, -1.7052001953125, -1.50634765625, -1.3074951171875, -1.108642578125, -0.9097900390625, -0.7109375, -0.5120849609375, -0.313232421875, -0.1143798828125, 0.08447265625, 0.2833251953125, 0.482177734375, 0.6810302734375, 0.8798828125, 1.0787353515625, 1.277587890625, 1.4764404296875, 1.67529296875, 1.8741455078125, 2.072998046875, 2.2718505859375, 2.470703125, 2.6695556640625, 2.868408203125, 3.0672607421875, 3.26611328125, 3.4649658203125, 3.663818359375, 3.8626708984375, 4.0615234375, 4.2603759765625, 4.459228515625, 4.6580810546875, 4.85693359375, 5.0557861328125, 5.254638671875, 5.4534912109375, 5.65234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 20.0, 17.0, 27.0, 37.0, 45.0, 71.0, 138.0, 156.0, 234.0, 373.0, 590.0, 909.0, 1360.0, 2501.0, 4270.0, 7608.0, 14135.0, 27343.0, 57002.0, 121707.0, 225898.0, 259061.0, 165541.0, 79884.0, 37500.0, 18634.0, 9844.0, 5453.0, 3174.0, 1875.0, 1128.0, 702.0, 414.0, 295.0, 204.0, 131.0, 77.0, 59.0, 34.0, 22.0, 21.0, 17.0, 11.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.880615234375, -8.60498046875, -8.329345703125, -8.0537109375, -7.778076171875, -7.50244140625, -7.226806640625, -6.951171875, -6.675537109375, -6.39990234375, -6.124267578125, -5.8486328125, -5.572998046875, -5.29736328125, -5.021728515625, -4.74609375, -4.470458984375, -4.19482421875, -3.919189453125, -3.6435546875, -3.367919921875, -3.09228515625, -2.816650390625, -2.541015625, -2.265380859375, -1.98974609375, -1.714111328125, -1.4384765625, -1.162841796875, -0.88720703125, -0.611572265625, -0.3359375, -0.060302734375, 0.21533203125, 0.490966796875, 0.7666015625, 1.042236328125, 1.31787109375, 1.593505859375, 1.869140625, 2.144775390625, 2.42041015625, 2.696044921875, 2.9716796875, 3.247314453125, 3.52294921875, 3.798583984375, 4.07421875, 4.349853515625, 4.62548828125, 4.901123046875, 5.1767578125, 5.452392578125, 5.72802734375, 6.003662109375, 6.279296875, 6.554931640625, 6.83056640625, 7.106201171875, 7.3818359375, 7.657470703125, 7.93310546875, 8.208740234375, 8.484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 6.0, 14.0, 13.0, 12.0, 17.0, 29.0, 31.0, 32.0, 49.0, 68.0, 68.0, 79.0, 70.0, 69.0, 65.0, 67.0, 63.0, 53.0, 34.0, 27.0, 23.0, 19.0, 13.0, 15.0, 9.0, 10.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0009379386901855469, -0.0009131729602813721, -0.0008884072303771973, -0.0008636415004730225, -0.0008388757705688477, -0.0008141100406646729, -0.000789344310760498, -0.0007645785808563232, -0.0007398128509521484, -0.0007150471210479736, -0.0006902813911437988, -0.000665515661239624, -0.0006407499313354492, -0.0006159842014312744, -0.0005912184715270996, -0.0005664527416229248, -0.00054168701171875, -0.0005169212818145752, -0.0004921555519104004, -0.0004673898220062256, -0.0004426240921020508, -0.000417858362197876, -0.00039309263229370117, -0.00036832690238952637, -0.00034356117248535156, -0.00031879544258117676, -0.00029402971267700195, -0.00026926398277282715, -0.00024449825286865234, -0.00021973252296447754, -0.00019496679306030273, -0.00017020106315612793, -0.00014543533325195312, -0.00012066960334777832, -9.590387344360352e-05, -7.113814353942871e-05, -4.6372413635253906e-05, -2.16066837310791e-05, 3.159046173095703e-06, 2.7924776077270508e-05, 5.269050598144531e-05, 7.745623588562012e-05, 0.00010222196578979492, 0.00012698769569396973, 0.00015175342559814453, 0.00017651915550231934, 0.00020128488540649414, 0.00022605061531066895, 0.00025081634521484375, 0.00027558207511901855, 0.00030034780502319336, 0.00032511353492736816, 0.00034987926483154297, 0.0003746449947357178, 0.0003994107246398926, 0.0004241764545440674, 0.0004489421844482422, 0.000473707914352417, 0.0004984736442565918, 0.0005232393741607666, 0.0005480051040649414, 0.0005727708339691162, 0.000597536563873291, 0.0006223022937774658, 0.0006470680236816406]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 26.0, 31.0, 61.0, 75.0, 150.0, 258.0, 379.0, 699.0, 1232.0, 2080.0, 3736.0, 6542.0, 12153.0, 22525.0, 42240.0, 79699.0, 141819.0, 205604.0, 207591.0, 145187.0, 81722.0, 43383.0, 23300.0, 12351.0, 6795.0, 3671.0, 2225.0, 1228.0, 711.0, 415.0, 285.0, 134.0, 74.0, 68.0, 34.0, 17.0, 22.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4609375, -7.24163818359375, -7.0223388671875, -6.80303955078125, -6.583740234375, -6.36444091796875, -6.1451416015625, -5.92584228515625, -5.70654296875, -5.48724365234375, -5.2679443359375, -5.04864501953125, -4.829345703125, -4.61004638671875, -4.3907470703125, -4.17144775390625, -3.9521484375, -3.73284912109375, -3.5135498046875, -3.29425048828125, -3.074951171875, -2.85565185546875, -2.6363525390625, -2.41705322265625, -2.19775390625, -1.97845458984375, -1.7591552734375, -1.53985595703125, -1.320556640625, -1.10125732421875, -0.8819580078125, -0.66265869140625, -0.443359375, -0.22406005859375, -0.0047607421875, 0.21453857421875, 0.433837890625, 0.65313720703125, 0.8724365234375, 1.09173583984375, 1.31103515625, 1.53033447265625, 1.7496337890625, 1.96893310546875, 2.188232421875, 2.40753173828125, 2.6268310546875, 2.84613037109375, 3.0654296875, 3.28472900390625, 3.5040283203125, 3.72332763671875, 3.942626953125, 4.16192626953125, 4.3812255859375, 4.60052490234375, 4.81982421875, 5.03912353515625, 5.2584228515625, 5.47772216796875, 5.697021484375, 5.91632080078125, 6.1356201171875, 6.35491943359375, 6.57421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 12.0, 14.0, 12.0, 29.0, 28.0, 33.0, 52.0, 35.0, 80.0, 68.0, 74.0, 74.0, 62.0, 64.0, 65.0, 62.0, 35.0, 45.0, 31.0, 18.0, 19.0, 6.0, 15.0, 2.0, 4.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.705078125, -2.62939453125, -2.5537109375, -2.47802734375, -2.40234375, -2.32666015625, -2.2509765625, -2.17529296875, -2.099609375, -2.02392578125, -1.9482421875, -1.87255859375, -1.796875, -1.72119140625, -1.6455078125, -1.56982421875, -1.494140625, -1.41845703125, -1.3427734375, -1.26708984375, -1.19140625, -1.11572265625, -1.0400390625, -0.96435546875, -0.888671875, -0.81298828125, -0.7373046875, -0.66162109375, -0.5859375, -0.51025390625, -0.4345703125, -0.35888671875, -0.283203125, -0.20751953125, -0.1318359375, -0.05615234375, 0.01953125, 0.09521484375, 0.1708984375, 0.24658203125, 0.322265625, 0.39794921875, 0.4736328125, 0.54931640625, 0.625, 0.70068359375, 0.7763671875, 0.85205078125, 0.927734375, 1.00341796875, 1.0791015625, 1.15478515625, 1.23046875, 1.30615234375, 1.3818359375, 1.45751953125, 1.533203125, 1.60888671875, 1.6845703125, 1.76025390625, 1.8359375, 1.91162109375, 1.9873046875, 2.06298828125, 2.138671875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 6.0, 6.0, 9.0, 11.0, 16.0, 9.0, 30.0, 23.0, 33.0, 34.0, 38.0, 39.0, 50.0, 44.0, 58.0, 57.0, 48.0, 53.0, 48.0, 43.0, 47.0, 46.0, 35.0, 40.0, 46.0, 15.0, 22.0, 17.0, 15.0, 15.0, 7.0, 8.0, 11.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.908158302307129, -11.533546447753906, -11.158933639526367, -10.784321784973145, -10.409708976745605, -10.035097122192383, -9.660484313964844, -9.285872459411621, -8.911260604858398, -8.536648750305176, -8.162035942077637, -7.787424087524414, -7.412811279296875, -7.038199424743652, -6.6635870933532715, -6.288974761962891, -5.914361953735352, -5.539749622344971, -5.16513729095459, -4.790525436401367, -4.415912628173828, -4.0413007736206055, -3.6666884422302246, -3.2920761108398438, -2.917463779449463, -2.542851448059082, -2.168239116668701, -1.7936270236968994, -1.4190146923065186, -1.0444023609161377, -0.6697902679443359, -0.2951779365539551, 0.07943439483642578, 0.45404666662216187, 0.828658938407898, 1.2032711505889893, 1.5778834819793701, 1.952495813369751, 2.3271079063415527, 2.7017202377319336, 3.0763325691223145, 3.4509449005126953, 3.825557231903076, 4.200169563293457, 4.57478141784668, 4.949394226074219, 5.324006080627441, 5.698618412017822, 6.073230743408203, 6.447843074798584, 6.822455406188965, 7.1970672607421875, 7.571680068969727, 7.946291923522949, 8.320903778076172, 8.695516586303711, 9.07012939453125, 9.444741249084473, 9.819354057312012, 10.193965911865234, 10.568578720092773, 10.943190574645996, 11.317802429199219, 11.692415237426758, 12.06702709197998]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 9.0, 8.0, 13.0, 7.0, 14.0, 12.0, 15.0, 32.0, 18.0, 19.0, 33.0, 27.0, 35.0, 40.0, 43.0, 37.0, 43.0, 37.0, 41.0, 38.0, 45.0, 41.0, 39.0, 29.0, 31.0, 44.0, 37.0, 27.0, 31.0, 31.0, 24.0, 14.0, 18.0, 18.0, 9.0, 12.0, 3.0, 3.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.542945861816406, -10.234869003295898, -9.926793098449707, -9.6187162399292, -9.310640335083008, -9.0025634765625, -8.694487571716309, -8.3864107131958, -8.07833480834961, -7.77025842666626, -7.46218204498291, -7.1541056632995605, -6.846029281616211, -6.537952423095703, -6.2298760414123535, -5.921799659729004, -5.613722801208496, -5.3056464195251465, -4.997570037841797, -4.689493656158447, -4.381417274475098, -4.07334041595459, -3.7652640342712402, -3.4571876525878906, -3.149111270904541, -2.8410348892211914, -2.532958507537842, -2.224881887435913, -1.9168055057525635, -1.6087291240692139, -1.3006526231765747, -0.9925761222839355, -0.6845006942749023, -0.37642425298690796, -0.06834781169891357, 0.2397286295890808, 0.5478050708770752, 0.8558814525604248, 1.163957953453064, 1.4720344543457031, 1.7801108360290527, 2.0881872177124023, 2.396263599395752, 2.7043402194976807, 3.0124166011810303, 3.32049298286438, 3.6285696029663086, 3.936645984649658, 4.244722366333008, 4.552798748016357, 4.860875129699707, 5.168951511383057, 5.477027893066406, 5.785104751586914, 6.093181133270264, 6.401257514953613, 6.709333896636963, 7.0174102783203125, 7.325486660003662, 7.633563041687012, 7.9416399002075195, 8.249715805053711, 8.557792663574219, 8.865869522094727, 9.173945426940918]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 11.0, 10.0, 14.0, 20.0, 39.0, 52.0, 80.0, 107.0, 155.0, 266.0, 436.0, 634.0, 1033.0, 1647.0, 2600.0, 4257.0, 7141.0, 12318.0, 21712.0, 39254.0, 75224.0, 148606.0, 312483.0, 625358.0, 957229.0, 898150.0, 541000.0, 266716.0, 130012.0, 65902.0, 35453.0, 19619.0, 11044.0, 6498.0, 3596.0, 2274.0, 1245.0, 776.0, 494.0, 310.0, 180.0, 115.0, 81.0, 56.0, 31.0, 23.0, 15.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-11.0, -10.6846923828125, -10.369384765625, -10.0540771484375, -9.73876953125, -9.4234619140625, -9.108154296875, -8.7928466796875, -8.4775390625, -8.1622314453125, -7.846923828125, -7.5316162109375, -7.21630859375, -6.9010009765625, -6.585693359375, -6.2703857421875, -5.955078125, -5.6397705078125, -5.324462890625, -5.0091552734375, -4.69384765625, -4.3785400390625, -4.063232421875, -3.7479248046875, -3.4326171875, -3.1173095703125, -2.802001953125, -2.4866943359375, -2.17138671875, -1.8560791015625, -1.540771484375, -1.2254638671875, -0.91015625, -0.5948486328125, -0.279541015625, 0.0357666015625, 0.35107421875, 0.6663818359375, 0.981689453125, 1.2969970703125, 1.6123046875, 1.9276123046875, 2.242919921875, 2.5582275390625, 2.87353515625, 3.1888427734375, 3.504150390625, 3.8194580078125, 4.134765625, 4.4500732421875, 4.765380859375, 5.0806884765625, 5.39599609375, 5.7113037109375, 6.026611328125, 6.3419189453125, 6.6572265625, 6.9725341796875, 7.287841796875, 7.6031494140625, 7.91845703125, 8.2337646484375, 8.549072265625, 8.8643798828125, 9.1796875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 6.0, 7.0, 9.0, 9.0, 18.0, 14.0, 11.0, 14.0, 29.0, 28.0, 28.0, 36.0, 27.0, 30.0, 51.0, 39.0, 41.0, 35.0, 46.0, 33.0, 34.0, 31.0, 47.0, 35.0, 24.0, 47.0, 38.0, 39.0, 37.0, 24.0, 12.0, 18.0, 22.0, 11.0, 14.0, 14.0, 5.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-7.49609375, -7.2891845703125, -7.082275390625, -6.8753662109375, -6.66845703125, -6.4615478515625, -6.254638671875, -6.0477294921875, -5.8408203125, -5.6339111328125, -5.427001953125, -5.2200927734375, -5.01318359375, -4.8062744140625, -4.599365234375, -4.3924560546875, -4.185546875, -3.9786376953125, -3.771728515625, -3.5648193359375, -3.35791015625, -3.1510009765625, -2.944091796875, -2.7371826171875, -2.5302734375, -2.3233642578125, -2.116455078125, -1.9095458984375, -1.70263671875, -1.4957275390625, -1.288818359375, -1.0819091796875, -0.875, -0.6680908203125, -0.461181640625, -0.2542724609375, -0.04736328125, 0.1595458984375, 0.366455078125, 0.5733642578125, 0.7802734375, 0.9871826171875, 1.194091796875, 1.4010009765625, 1.60791015625, 1.8148193359375, 2.021728515625, 2.2286376953125, 2.435546875, 2.6424560546875, 2.849365234375, 3.0562744140625, 3.26318359375, 3.4700927734375, 3.677001953125, 3.8839111328125, 4.0908203125, 4.2977294921875, 4.504638671875, 4.7115478515625, 4.91845703125, 5.1253662109375, 5.332275390625, 5.5391845703125, 5.74609375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 13.0, 17.0, 27.0, 37.0, 50.0, 84.0, 115.0, 178.0, 277.0, 423.0, 681.0, 1060.0, 1630.0, 2460.0, 3817.0, 6146.0, 9833.0, 16267.0, 26855.0, 45287.0, 76466.0, 130528.0, 221630.0, 369830.0, 571713.0, 743872.0, 700965.0, 498807.0, 311026.0, 185055.0, 108320.0, 63728.0, 37812.0, 22693.0, 13421.0, 8604.0, 5257.0, 3337.0, 2054.0, 1352.0, 905.0, 614.0, 357.0, 228.0, 153.0, 108.0, 63.0, 44.0, 29.0, 24.0, 17.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-8.2890625, -8.03656005859375, -7.7840576171875, -7.53155517578125, -7.279052734375, -7.02655029296875, -6.7740478515625, -6.52154541015625, -6.26904296875, -6.01654052734375, -5.7640380859375, -5.51153564453125, -5.259033203125, -5.00653076171875, -4.7540283203125, -4.50152587890625, -4.2490234375, -3.99652099609375, -3.7440185546875, -3.49151611328125, -3.239013671875, -2.98651123046875, -2.7340087890625, -2.48150634765625, -2.22900390625, -1.97650146484375, -1.7239990234375, -1.47149658203125, -1.218994140625, -0.96649169921875, -0.7139892578125, -0.46148681640625, -0.208984375, 0.04351806640625, 0.2960205078125, 0.54852294921875, 0.801025390625, 1.05352783203125, 1.3060302734375, 1.55853271484375, 1.81103515625, 2.06353759765625, 2.3160400390625, 2.56854248046875, 2.821044921875, 3.07354736328125, 3.3260498046875, 3.57855224609375, 3.8310546875, 4.08355712890625, 4.3360595703125, 4.58856201171875, 4.841064453125, 5.09356689453125, 5.3460693359375, 5.59857177734375, 5.85107421875, 6.10357666015625, 6.3560791015625, 6.60858154296875, 6.861083984375, 7.11358642578125, 7.3660888671875, 7.61859130859375, 7.87109375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 8.0, 7.0, 11.0, 14.0, 23.0, 34.0, 48.0, 43.0, 51.0, 93.0, 119.0, 136.0, 155.0, 192.0, 232.0, 262.0, 285.0, 315.0, 288.0, 245.0, 247.0, 226.0, 206.0, 154.0, 147.0, 108.0, 86.0, 81.0, 63.0, 52.0, 30.0, 31.0, 16.0, 13.0, 19.0, 6.0, 6.0, 7.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.1524658203125, -3.039306640625, -2.9261474609375, -2.81298828125, -2.6998291015625, -2.586669921875, -2.4735107421875, -2.3603515625, -2.2471923828125, -2.134033203125, -2.0208740234375, -1.90771484375, -1.7945556640625, -1.681396484375, -1.5682373046875, -1.455078125, -1.3419189453125, -1.228759765625, -1.1156005859375, -1.00244140625, -0.8892822265625, -0.776123046875, -0.6629638671875, -0.5498046875, -0.4366455078125, -0.323486328125, -0.2103271484375, -0.09716796875, 0.0159912109375, 0.129150390625, 0.2423095703125, 0.35546875, 0.4686279296875, 0.581787109375, 0.6949462890625, 0.80810546875, 0.9212646484375, 1.034423828125, 1.1475830078125, 1.2607421875, 1.3739013671875, 1.487060546875, 1.6002197265625, 1.71337890625, 1.8265380859375, 1.939697265625, 2.0528564453125, 2.166015625, 2.2791748046875, 2.392333984375, 2.5054931640625, 2.61865234375, 2.7318115234375, 2.844970703125, 2.9581298828125, 3.0712890625, 3.1844482421875, 3.297607421875, 3.4107666015625, 3.52392578125, 3.6370849609375, 3.750244140625, 3.8634033203125, 3.9765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 10.0, 6.0, 14.0, 16.0, 9.0, 12.0, 21.0, 27.0, 22.0, 41.0, 36.0, 34.0, 45.0, 53.0, 50.0, 53.0, 46.0, 58.0, 50.0, 50.0, 55.0, 35.0, 36.0, 38.0, 24.0, 32.0, 16.0, 22.0, 25.0, 9.0, 9.0, 9.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.457452774047852, -8.151654243469238, -7.845856189727783, -7.540058135986328, -7.234259605407715, -6.92846155166626, -6.622663497924805, -6.316864967346191, -6.011066913604736, -5.705268859863281, -5.399470329284668, -5.093672275543213, -4.787874221801758, -4.4820756912231445, -4.1762776374816895, -3.8704793453216553, -3.564681053161621, -3.258882761001587, -2.9530844688415527, -2.6472864151000977, -2.3414881229400635, -2.0356898307800293, -1.7298916578292847, -1.42409348487854, -1.1182951927185059, -0.8124969601631165, -0.506698727607727, -0.20090049505233765, 0.10489773750305176, 0.41069602966308594, 0.7164942026138306, 1.0222923755645752, 1.3280916213989258, 1.63388991355896, 1.9396880865097046, 2.245486259460449, 2.5512845516204834, 2.8570828437805176, 3.1628808975219727, 3.468679189682007, 3.774477481842041, 4.080275535583496, 4.386074066162109, 4.6918721199035645, 4.9976701736450195, 5.303468704223633, 5.609266757965088, 5.915064811706543, 6.220863342285156, 6.526661396026611, 6.832459926605225, 7.13825798034668, 7.444056510925293, 7.749854564666748, 8.055652618408203, 8.361451148986816, 8.66724967956543, 8.973048210144043, 9.27884578704834, 9.584644317626953, 9.890442848205566, 10.19624137878418, 10.502038955688477, 10.80783748626709, 11.113635063171387]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 6.0, 17.0, 16.0, 19.0, 16.0, 21.0, 27.0, 39.0, 28.0, 33.0, 42.0, 40.0, 43.0, 45.0, 42.0, 47.0, 44.0, 38.0, 35.0, 48.0, 52.0, 33.0, 31.0, 39.0, 26.0, 30.0, 16.0, 22.0, 27.0, 14.0, 6.0, 9.0, 8.0, 6.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.835714340209961, -8.575971603393555, -8.316227912902832, -8.056485176086426, -7.7967424392700195, -7.536999225616455, -7.277256011962891, -7.017513275146484, -6.75777006149292, -6.4980268478393555, -6.238284111022949, -5.978540897369385, -5.71879768371582, -5.459054946899414, -5.19931173324585, -4.939568519592285, -4.679825782775879, -4.4200825691223145, -4.160339832305908, -3.9005966186523438, -3.6408536434173584, -3.381110668182373, -3.1213674545288086, -2.8616244792938232, -2.601881504058838, -2.3421385288238525, -2.082395553588867, -1.8226523399353027, -1.5629093647003174, -1.303166389465332, -1.0434232950210571, -0.7836802005767822, -0.5239377021789551, -0.26419466733932495, -0.004451632499694824, 0.2552914023399353, 0.5150344371795654, 0.7747774124145508, 1.0345205068588257, 1.2942636013031006, 1.554006576538086, 1.8137495517730713, 2.0734925270080566, 2.333235740661621, 2.5929787158966064, 2.852721691131592, 3.1124649047851562, 3.3722078800201416, 3.631950855255127, 3.8916938304901123, 4.151436805725098, 4.411180019378662, 4.670923233032227, 4.930665969848633, 5.190409183502197, 5.450152397155762, 5.709895133972168, 5.969638347625732, 6.229381084442139, 6.489124298095703, 6.748867034912109, 7.008610248565674, 7.268353462219238, 7.5280961990356445, 7.787839412689209]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 17.0, 35.0, 47.0, 65.0, 104.0, 136.0, 175.0, 263.0, 359.0, 556.0, 856.0, 1196.0, 1871.0, 2950.0, 4450.0, 7020.0, 11354.0, 18270.0, 30919.0, 52407.0, 89371.0, 142906.0, 188940.0, 178475.0, 125435.0, 76238.0, 44589.0, 26520.0, 15865.0, 9553.0, 6074.0, 3892.0, 2469.0, 1622.0, 1116.0, 760.0, 551.0, 333.0, 206.0, 185.0, 121.0, 74.0, 47.0, 35.0, 24.0, 28.0, 15.0, 11.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0], "bins": [-9.859375, -9.5592041015625, -9.259033203125, -8.9588623046875, -8.65869140625, -8.3585205078125, -8.058349609375, -7.7581787109375, -7.4580078125, -7.1578369140625, -6.857666015625, -6.5574951171875, -6.25732421875, -5.9571533203125, -5.656982421875, -5.3568115234375, -5.056640625, -4.7564697265625, -4.456298828125, -4.1561279296875, -3.85595703125, -3.5557861328125, -3.255615234375, -2.9554443359375, -2.6552734375, -2.3551025390625, -2.054931640625, -1.7547607421875, -1.45458984375, -1.1544189453125, -0.854248046875, -0.5540771484375, -0.25390625, 0.0462646484375, 0.346435546875, 0.6466064453125, 0.94677734375, 1.2469482421875, 1.547119140625, 1.8472900390625, 2.1474609375, 2.4476318359375, 2.747802734375, 3.0479736328125, 3.34814453125, 3.6483154296875, 3.948486328125, 4.2486572265625, 4.548828125, 4.8489990234375, 5.149169921875, 5.4493408203125, 5.74951171875, 6.0496826171875, 6.349853515625, 6.6500244140625, 6.9501953125, 7.2503662109375, 7.550537109375, 7.8507080078125, 8.15087890625, 8.4510498046875, 8.751220703125, 9.0513916015625, 9.3515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 10.0, 3.0, 10.0, 15.0, 16.0, 17.0, 25.0, 28.0, 30.0, 29.0, 31.0, 27.0, 39.0, 46.0, 46.0, 45.0, 38.0, 44.0, 40.0, 35.0, 28.0, 51.0, 46.0, 35.0, 41.0, 26.0, 26.0, 24.0, 33.0, 16.0, 12.0, 17.0, 11.0, 6.0, 12.0, 7.0, 9.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.703125, -8.4530029296875, -8.202880859375, -7.9527587890625, -7.70263671875, -7.4525146484375, -7.202392578125, -6.9522705078125, -6.7021484375, -6.4520263671875, -6.201904296875, -5.9517822265625, -5.70166015625, -5.4515380859375, -5.201416015625, -4.9512939453125, -4.701171875, -4.4510498046875, -4.200927734375, -3.9508056640625, -3.70068359375, -3.4505615234375, -3.200439453125, -2.9503173828125, -2.7001953125, -2.4500732421875, -2.199951171875, -1.9498291015625, -1.69970703125, -1.4495849609375, -1.199462890625, -0.9493408203125, -0.69921875, -0.4490966796875, -0.198974609375, 0.0511474609375, 0.30126953125, 0.5513916015625, 0.801513671875, 1.0516357421875, 1.3017578125, 1.5518798828125, 1.802001953125, 2.0521240234375, 2.30224609375, 2.5523681640625, 2.802490234375, 3.0526123046875, 3.302734375, 3.5528564453125, 3.802978515625, 4.0531005859375, 4.30322265625, 4.5533447265625, 4.803466796875, 5.0535888671875, 5.3037109375, 5.5538330078125, 5.803955078125, 6.0540771484375, 6.30419921875, 6.5543212890625, 6.804443359375, 7.0545654296875, 7.3046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 7.0, 10.0, 19.0, 13.0, 36.0, 46.0, 54.0, 83.0, 117.0, 152.0, 216.0, 341.0, 445.0, 647.0, 982.0, 1554.0, 2463.0, 4107.0, 7201.0, 13918.0, 30807.0, 79507.0, 233532.0, 384624.0, 174930.0, 60673.0, 24441.0, 11559.0, 6148.0, 3579.0, 2161.0, 1347.0, 885.0, 579.0, 412.0, 271.0, 194.0, 145.0, 111.0, 66.0, 50.0, 31.0, 26.0, 18.0, 8.0, 9.0, 5.0, 7.0, 6.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-22.5625, -21.88623046875, -21.2099609375, -20.53369140625, -19.857421875, -19.18115234375, -18.5048828125, -17.82861328125, -17.15234375, -16.47607421875, -15.7998046875, -15.12353515625, -14.447265625, -13.77099609375, -13.0947265625, -12.41845703125, -11.7421875, -11.06591796875, -10.3896484375, -9.71337890625, -9.037109375, -8.36083984375, -7.6845703125, -7.00830078125, -6.33203125, -5.65576171875, -4.9794921875, -4.30322265625, -3.626953125, -2.95068359375, -2.2744140625, -1.59814453125, -0.921875, -0.24560546875, 0.4306640625, 1.10693359375, 1.783203125, 2.45947265625, 3.1357421875, 3.81201171875, 4.48828125, 5.16455078125, 5.8408203125, 6.51708984375, 7.193359375, 7.86962890625, 8.5458984375, 9.22216796875, 9.8984375, 10.57470703125, 11.2509765625, 11.92724609375, 12.603515625, 13.27978515625, 13.9560546875, 14.63232421875, 15.30859375, 15.98486328125, 16.6611328125, 17.33740234375, 18.013671875, 18.68994140625, 19.3662109375, 20.04248046875, 20.71875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 8.0, 4.0, 5.0, 10.0, 11.0, 14.0, 8.0, 8.0, 13.0, 25.0, 22.0, 22.0, 29.0, 20.0, 35.0, 34.0, 37.0, 35.0, 36.0, 29.0, 41.0, 46.0, 44.0, 40.0, 39.0, 44.0, 31.0, 39.0, 33.0, 25.0, 28.0, 31.0, 24.0, 12.0, 31.0, 21.0, 12.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.42578125, -4.28167724609375, -4.1375732421875, -3.99346923828125, -3.849365234375, -3.70526123046875, -3.5611572265625, -3.41705322265625, -3.27294921875, -3.12884521484375, -2.9847412109375, -2.84063720703125, -2.696533203125, -2.55242919921875, -2.4083251953125, -2.26422119140625, -2.1201171875, -1.97601318359375, -1.8319091796875, -1.68780517578125, -1.543701171875, -1.39959716796875, -1.2554931640625, -1.11138916015625, -0.96728515625, -0.82318115234375, -0.6790771484375, -0.53497314453125, -0.390869140625, -0.24676513671875, -0.1026611328125, 0.04144287109375, 0.185546875, 0.32965087890625, 0.4737548828125, 0.61785888671875, 0.761962890625, 0.90606689453125, 1.0501708984375, 1.19427490234375, 1.33837890625, 1.48248291015625, 1.6265869140625, 1.77069091796875, 1.914794921875, 2.05889892578125, 2.2030029296875, 2.34710693359375, 2.4912109375, 2.63531494140625, 2.7794189453125, 2.92352294921875, 3.067626953125, 3.21173095703125, 3.3558349609375, 3.49993896484375, 3.64404296875, 3.78814697265625, 3.9322509765625, 4.07635498046875, 4.220458984375, 4.36456298828125, 4.5086669921875, 4.65277099609375, 4.796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 1.0, 1.0, 8.0, 10.0, 11.0, 9.0, 18.0, 20.0, 34.0, 34.0, 59.0, 65.0, 109.0, 165.0, 207.0, 380.0, 502.0, 765.0, 1251.0, 1998.0, 3303.0, 5551.0, 9671.0, 17433.0, 33012.0, 65791.0, 132513.0, 237549.0, 245900.0, 141436.0, 71050.0, 35715.0, 18537.0, 10165.0, 5771.0, 3554.0, 2162.0, 1314.0, 846.0, 549.0, 328.0, 225.0, 149.0, 93.0, 94.0, 56.0, 35.0, 37.0, 20.0, 18.0, 11.0, 4.0, 8.0, 2.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.44921875, -6.24151611328125, -6.0338134765625, -5.82611083984375, -5.618408203125, -5.41070556640625, -5.2030029296875, -4.99530029296875, -4.78759765625, -4.57989501953125, -4.3721923828125, -4.16448974609375, -3.956787109375, -3.74908447265625, -3.5413818359375, -3.33367919921875, -3.1259765625, -2.91827392578125, -2.7105712890625, -2.50286865234375, -2.295166015625, -2.08746337890625, -1.8797607421875, -1.67205810546875, -1.46435546875, -1.25665283203125, -1.0489501953125, -0.84124755859375, -0.633544921875, -0.42584228515625, -0.2181396484375, -0.01043701171875, 0.197265625, 0.40496826171875, 0.6126708984375, 0.82037353515625, 1.028076171875, 1.23577880859375, 1.4434814453125, 1.65118408203125, 1.85888671875, 2.06658935546875, 2.2742919921875, 2.48199462890625, 2.689697265625, 2.89739990234375, 3.1051025390625, 3.31280517578125, 3.5205078125, 3.72821044921875, 3.9359130859375, 4.14361572265625, 4.351318359375, 4.55902099609375, 4.7667236328125, 4.97442626953125, 5.18212890625, 5.38983154296875, 5.5975341796875, 5.80523681640625, 6.012939453125, 6.22064208984375, 6.4283447265625, 6.63604736328125, 6.84375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 8.0, 4.0, 8.0, 8.0, 13.0, 14.0, 18.0, 23.0, 26.0, 35.0, 42.0, 57.0, 63.0, 81.0, 78.0, 77.0, 56.0, 64.0, 58.0, 59.0, 37.0, 18.0, 24.0, 30.0, 24.0, 11.0, 4.0, 10.0, 7.0, 7.0, 4.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.0003516674041748047, -0.0003422833979129791, -0.00033289939165115356, -0.000323515385389328, -0.00031413137912750244, -0.0003047473728656769, -0.0002953633666038513, -0.00028597936034202576, -0.0002765953540802002, -0.00026721134781837463, -0.00025782734155654907, -0.0002484433352947235, -0.00023905932903289795, -0.0002296753227710724, -0.00022029131650924683, -0.00021090731024742126, -0.0002015233039855957, -0.00019213929772377014, -0.00018275529146194458, -0.00017337128520011902, -0.00016398727893829346, -0.0001546032726764679, -0.00014521926641464233, -0.00013583526015281677, -0.0001264512538909912, -0.00011706724762916565, -0.00010768324136734009, -9.829923510551453e-05, -8.891522884368896e-05, -7.95312225818634e-05, -7.014721632003784e-05, -6.076321005821228e-05, -5.137920379638672e-05, -4.199519753456116e-05, -3.2611191272735596e-05, -2.3227185010910034e-05, -1.3843178749084473e-05, -4.459172487258911e-06, 4.92483377456665e-06, 1.4308840036392212e-05, 2.3692846298217773e-05, 3.3076852560043335e-05, 4.2460858821868896e-05, 5.184486508369446e-05, 6.122887134552002e-05, 7.061287760734558e-05, 7.999688386917114e-05, 8.93808901309967e-05, 9.876489639282227e-05, 0.00010814890265464783, 0.00011753290891647339, 0.00012691691517829895, 0.0001363009214401245, 0.00014568492770195007, 0.00015506893396377563, 0.0001644529402256012, 0.00017383694648742676, 0.00018322095274925232, 0.00019260495901107788, 0.00020198896527290344, 0.000211372971534729, 0.00022075697779655457, 0.00023014098405838013, 0.0002395249903202057, 0.00024890899658203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 12.0, 19.0, 21.0, 32.0, 42.0, 70.0, 101.0, 182.0, 278.0, 406.0, 683.0, 1079.0, 1686.0, 2721.0, 4462.0, 6977.0, 11382.0, 18356.0, 29858.0, 47993.0, 75527.0, 113762.0, 151221.0, 165016.0, 140515.0, 100970.0, 66131.0, 41566.0, 25449.0, 15920.0, 9996.0, 6075.0, 3602.0, 2405.0, 1458.0, 927.0, 585.0, 364.0, 259.0, 159.0, 93.0, 59.0, 45.0, 30.0, 21.0, 16.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-4.578125, -4.43658447265625, -4.2950439453125, -4.15350341796875, -4.011962890625, -3.87042236328125, -3.7288818359375, -3.58734130859375, -3.44580078125, -3.30426025390625, -3.1627197265625, -3.02117919921875, -2.879638671875, -2.73809814453125, -2.5965576171875, -2.45501708984375, -2.3134765625, -2.17193603515625, -2.0303955078125, -1.88885498046875, -1.747314453125, -1.60577392578125, -1.4642333984375, -1.32269287109375, -1.18115234375, -1.03961181640625, -0.8980712890625, -0.75653076171875, -0.614990234375, -0.47344970703125, -0.3319091796875, -0.19036865234375, -0.048828125, 0.09271240234375, 0.2342529296875, 0.37579345703125, 0.517333984375, 0.65887451171875, 0.8004150390625, 0.94195556640625, 1.08349609375, 1.22503662109375, 1.3665771484375, 1.50811767578125, 1.649658203125, 1.79119873046875, 1.9327392578125, 2.07427978515625, 2.2158203125, 2.35736083984375, 2.4989013671875, 2.64044189453125, 2.781982421875, 2.92352294921875, 3.0650634765625, 3.20660400390625, 3.34814453125, 3.48968505859375, 3.6312255859375, 3.77276611328125, 3.914306640625, 4.05584716796875, 4.1973876953125, 4.33892822265625, 4.48046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 5.0, 9.0, 13.0, 8.0, 18.0, 26.0, 24.0, 24.0, 28.0, 41.0, 37.0, 58.0, 39.0, 57.0, 75.0, 70.0, 58.0, 61.0, 48.0, 72.0, 41.0, 33.0, 26.0, 16.0, 28.0, 15.0, 17.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.11328125, -2.0491790771484375, -1.985076904296875, -1.9209747314453125, -1.85687255859375, -1.7927703857421875, -1.728668212890625, -1.6645660400390625, -1.6004638671875, -1.5363616943359375, -1.472259521484375, -1.4081573486328125, -1.34405517578125, -1.2799530029296875, -1.215850830078125, -1.1517486572265625, -1.087646484375, -1.0235443115234375, -0.959442138671875, -0.8953399658203125, -0.83123779296875, -0.7671356201171875, -0.703033447265625, -0.6389312744140625, -0.5748291015625, -0.5107269287109375, -0.446624755859375, -0.3825225830078125, -0.31842041015625, -0.2543182373046875, -0.190216064453125, -0.1261138916015625, -0.06201171875, 0.0020904541015625, 0.066192626953125, 0.1302947998046875, 0.19439697265625, 0.2584991455078125, 0.322601318359375, 0.3867034912109375, 0.4508056640625, 0.5149078369140625, 0.579010009765625, 0.6431121826171875, 0.70721435546875, 0.7713165283203125, 0.835418701171875, 0.8995208740234375, 0.963623046875, 1.0277252197265625, 1.091827392578125, 1.1559295654296875, 1.22003173828125, 1.2841339111328125, 1.348236083984375, 1.4123382568359375, 1.4764404296875, 1.5405426025390625, 1.604644775390625, 1.6687469482421875, 1.73284912109375, 1.7969512939453125, 1.861053466796875, 1.9251556396484375, 1.9892578125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 16.0, 5.0, 22.0, 14.0, 22.0, 17.0, 17.0, 33.0, 34.0, 35.0, 46.0, 52.0, 49.0, 59.0, 63.0, 65.0, 59.0, 44.0, 47.0, 36.0, 35.0, 30.0, 32.0, 23.0, 21.0, 24.0, 7.0, 17.0, 19.0, 7.0, 9.0, 5.0, 0.0, 6.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.889204978942871, -8.589778900146484, -8.290352821350098, -7.990926742553711, -7.691500663757324, -7.3920745849609375, -7.092648506164551, -6.793222427368164, -6.493796348571777, -6.194370269775391, -5.894944190979004, -5.595518112182617, -5.2960920333862305, -4.996665954589844, -4.697239875793457, -4.39781379699707, -4.098387718200684, -3.798961639404297, -3.49953556060791, -3.2001094818115234, -2.9006834030151367, -2.60125732421875, -2.3018312454223633, -2.0024051666259766, -1.7029790878295898, -1.4035530090332031, -1.1041269302368164, -0.8047008514404297, -0.505274772644043, -0.20584869384765625, 0.09357738494873047, 0.3930034637451172, 0.6924304962158203, 0.991856575012207, 1.2912826538085938, 1.5907087326049805, 1.8901348114013672, 2.189560890197754, 2.4889869689941406, 2.7884130477905273, 3.087839126586914, 3.387265205383301, 3.6866912841796875, 3.986117362976074, 4.285543441772461, 4.584969520568848, 4.884395599365234, 5.183821678161621, 5.483247756958008, 5.7826738357543945, 6.082099914550781, 6.381525993347168, 6.680952072143555, 6.980378150939941, 7.279804229736328, 7.579230308532715, 7.878656387329102, 8.178082466125488, 8.477508544921875, 8.776934623718262, 9.076360702514648, 9.375786781311035, 9.675212860107422, 9.974638938903809, 10.274065017700195]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 8.0, 0.0, 4.0, 10.0, 8.0, 8.0, 7.0, 16.0, 18.0, 16.0, 26.0, 16.0, 31.0, 26.0, 37.0, 44.0, 41.0, 44.0, 39.0, 44.0, 37.0, 50.0, 40.0, 48.0, 35.0, 39.0, 43.0, 36.0, 29.0, 36.0, 21.0, 21.0, 30.0, 20.0, 18.0, 16.0, 10.0, 8.0, 5.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.668281555175781, -8.42397689819336, -8.179671287536621, -7.935366153717041, -7.691061019897461, -7.446756362915039, -7.202450752258301, -6.958146095275879, -6.713840961456299, -6.469535827636719, -6.225230693817139, -5.980925559997559, -5.7366204261779785, -5.492315292358398, -5.248010635375977, -5.0037055015563965, -4.759400367736816, -4.515095233917236, -4.270790100097656, -4.026484966278076, -3.782180070877075, -3.537874937057495, -3.293569803237915, -3.049264907836914, -2.804959297180176, -2.5606541633605957, -2.3163490295410156, -2.0720438957214355, -1.8277390003204346, -1.5834338665008545, -1.3391287326812744, -1.0948237180709839, -0.8505187034606934, -0.6062136292457581, -0.36190852522850037, -0.11760342121124268, 0.12670165300369263, 0.37100672721862793, 0.615311861038208, 0.8596168756484985, 1.1039220094680786, 1.3482271432876587, 1.5925321578979492, 1.8368372917175293, 2.0811424255371094, 2.3254475593566895, 2.5697526931762695, 2.8140575885772705, 3.0583627223968506, 3.3026678562164307, 3.5469729900360107, 3.7912778854370117, 4.035583019256592, 4.279888153076172, 4.524193286895752, 4.768498420715332, 5.012803554534912, 5.257108688354492, 5.501413822174072, 5.745718955993652, 5.990024089813232, 6.2343292236328125, 6.478633880615234, 6.7229390144348145, 6.9672441482543945]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 36.0, 56.0, 64.0, 101.0, 163.0, 262.0, 414.0, 649.0, 965.0, 1583.0, 2530.0, 4125.0, 6536.0, 10390.0, 16963.0, 26827.0, 42168.0, 62632.0, 89097.0, 116241.0, 135075.0, 135068.0, 118535.0, 92305.0, 65640.0, 43770.0, 28471.0, 18025.0, 11403.0, 6823.0, 4275.0, 2696.0, 1703.0, 1097.0, 665.0, 429.0, 270.0, 145.0, 116.0, 77.0, 47.0, 32.0, 21.0, 11.0, 7.0, 9.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.63873291015625, -6.4102783203125, -6.18182373046875, -5.953369140625, -5.72491455078125, -5.4964599609375, -5.26800537109375, -5.03955078125, -4.81109619140625, -4.5826416015625, -4.35418701171875, -4.125732421875, -3.89727783203125, -3.6688232421875, -3.44036865234375, -3.2119140625, -2.98345947265625, -2.7550048828125, -2.52655029296875, -2.298095703125, -2.06964111328125, -1.8411865234375, -1.61273193359375, -1.38427734375, -1.15582275390625, -0.9273681640625, -0.69891357421875, -0.470458984375, -0.24200439453125, -0.0135498046875, 0.21490478515625, 0.443359375, 0.67181396484375, 0.9002685546875, 1.12872314453125, 1.357177734375, 1.58563232421875, 1.8140869140625, 2.04254150390625, 2.27099609375, 2.49945068359375, 2.7279052734375, 2.95635986328125, 3.184814453125, 3.41326904296875, 3.6417236328125, 3.87017822265625, 4.0986328125, 4.32708740234375, 4.5555419921875, 4.78399658203125, 5.012451171875, 5.24090576171875, 5.4693603515625, 5.69781494140625, 5.92626953125, 6.15472412109375, 6.3831787109375, 6.61163330078125, 6.840087890625, 7.06854248046875, 7.2969970703125, 7.52545166015625, 7.75390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 9.0, 6.0, 5.0, 10.0, 11.0, 11.0, 14.0, 13.0, 20.0, 25.0, 18.0, 32.0, 30.0, 30.0, 37.0, 42.0, 34.0, 46.0, 43.0, 44.0, 31.0, 36.0, 39.0, 46.0, 41.0, 28.0, 38.0, 37.0, 34.0, 32.0, 24.0, 27.0, 15.0, 16.0, 18.0, 18.0, 9.0, 8.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0], "bins": [-8.5234375, -8.291259765625, -8.05908203125, -7.826904296875, -7.5947265625, -7.362548828125, -7.13037109375, -6.898193359375, -6.666015625, -6.433837890625, -6.20166015625, -5.969482421875, -5.7373046875, -5.505126953125, -5.27294921875, -5.040771484375, -4.80859375, -4.576416015625, -4.34423828125, -4.112060546875, -3.8798828125, -3.647705078125, -3.41552734375, -3.183349609375, -2.951171875, -2.718994140625, -2.48681640625, -2.254638671875, -2.0224609375, -1.790283203125, -1.55810546875, -1.325927734375, -1.09375, -0.861572265625, -0.62939453125, -0.397216796875, -0.1650390625, 0.067138671875, 0.29931640625, 0.531494140625, 0.763671875, 0.995849609375, 1.22802734375, 1.460205078125, 1.6923828125, 1.924560546875, 2.15673828125, 2.388916015625, 2.62109375, 2.853271484375, 3.08544921875, 3.317626953125, 3.5498046875, 3.781982421875, 4.01416015625, 4.246337890625, 4.478515625, 4.710693359375, 4.94287109375, 5.175048828125, 5.4072265625, 5.639404296875, 5.87158203125, 6.103759765625, 6.3359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 11.0, 31.0, 46.0, 76.0, 96.0, 143.0, 258.0, 363.0, 537.0, 888.0, 1351.0, 2044.0, 3236.0, 4952.0, 7789.0, 12119.0, 18802.0, 28281.0, 41852.0, 58742.0, 80644.0, 101811.0, 117892.0, 123052.0, 114030.0, 95674.0, 73538.0, 53164.0, 36824.0, 24572.0, 16306.0, 10503.0, 6741.0, 4286.0, 2722.0, 1842.0, 1132.0, 802.0, 455.0, 311.0, 205.0, 124.0, 101.0, 68.0, 42.0, 31.0, 17.0, 14.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.41314697265625, -5.2286376953125, -5.04412841796875, -4.859619140625, -4.67510986328125, -4.4906005859375, -4.30609130859375, -4.12158203125, -3.93707275390625, -3.7525634765625, -3.56805419921875, -3.383544921875, -3.19903564453125, -3.0145263671875, -2.83001708984375, -2.6455078125, -2.46099853515625, -2.2764892578125, -2.09197998046875, -1.907470703125, -1.72296142578125, -1.5384521484375, -1.35394287109375, -1.16943359375, -0.98492431640625, -0.8004150390625, -0.61590576171875, -0.431396484375, -0.24688720703125, -0.0623779296875, 0.12213134765625, 0.306640625, 0.49114990234375, 0.6756591796875, 0.86016845703125, 1.044677734375, 1.22918701171875, 1.4136962890625, 1.59820556640625, 1.78271484375, 1.96722412109375, 2.1517333984375, 2.33624267578125, 2.520751953125, 2.70526123046875, 2.8897705078125, 3.07427978515625, 3.2587890625, 3.44329833984375, 3.6278076171875, 3.81231689453125, 3.996826171875, 4.18133544921875, 4.3658447265625, 4.55035400390625, 4.73486328125, 4.91937255859375, 5.1038818359375, 5.28839111328125, 5.472900390625, 5.65740966796875, 5.8419189453125, 6.02642822265625, 6.2109375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 9.0, 5.0, 9.0, 8.0, 14.0, 15.0, 14.0, 17.0, 17.0, 19.0, 23.0, 31.0, 30.0, 30.0, 29.0, 25.0, 41.0, 35.0, 38.0, 34.0, 28.0, 40.0, 39.0, 46.0, 38.0, 21.0, 42.0, 35.0, 32.0, 25.0, 28.0, 19.0, 22.0, 23.0, 11.0, 21.0, 18.0, 14.0, 12.0, 6.0, 8.0, 6.0, 10.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.57421875, -4.43548583984375, -4.2967529296875, -4.15802001953125, -4.019287109375, -3.88055419921875, -3.7418212890625, -3.60308837890625, -3.46435546875, -3.32562255859375, -3.1868896484375, -3.04815673828125, -2.909423828125, -2.77069091796875, -2.6319580078125, -2.49322509765625, -2.3544921875, -2.21575927734375, -2.0770263671875, -1.93829345703125, -1.799560546875, -1.66082763671875, -1.5220947265625, -1.38336181640625, -1.24462890625, -1.10589599609375, -0.9671630859375, -0.82843017578125, -0.689697265625, -0.55096435546875, -0.4122314453125, -0.27349853515625, -0.134765625, 0.00396728515625, 0.1427001953125, 0.28143310546875, 0.420166015625, 0.55889892578125, 0.6976318359375, 0.83636474609375, 0.97509765625, 1.11383056640625, 1.2525634765625, 1.39129638671875, 1.530029296875, 1.66876220703125, 1.8074951171875, 1.94622802734375, 2.0849609375, 2.22369384765625, 2.3624267578125, 2.50115966796875, 2.639892578125, 2.77862548828125, 2.9173583984375, 3.05609130859375, 3.19482421875, 3.33355712890625, 3.4722900390625, 3.61102294921875, 3.749755859375, 3.88848876953125, 4.0272216796875, 4.16595458984375, 4.3046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 20.0, 22.0, 32.0, 47.0, 80.0, 104.0, 152.0, 227.0, 332.0, 531.0, 863.0, 1339.0, 2326.0, 3933.0, 6799.0, 12679.0, 23401.0, 43207.0, 79074.0, 133019.0, 189633.0, 198024.0, 149508.0, 90853.0, 50519.0, 27390.0, 14877.0, 8203.0, 4600.0, 2472.0, 1598.0, 960.0, 576.0, 371.0, 255.0, 173.0, 123.0, 74.0, 51.0, 29.0, 25.0, 13.0, 8.0, 6.0, 7.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.13671875, -5.9395751953125, -5.742431640625, -5.5452880859375, -5.34814453125, -5.1510009765625, -4.953857421875, -4.7567138671875, -4.5595703125, -4.3624267578125, -4.165283203125, -3.9681396484375, -3.77099609375, -3.5738525390625, -3.376708984375, -3.1795654296875, -2.982421875, -2.7852783203125, -2.588134765625, -2.3909912109375, -2.19384765625, -1.9967041015625, -1.799560546875, -1.6024169921875, -1.4052734375, -1.2081298828125, -1.010986328125, -0.8138427734375, -0.61669921875, -0.4195556640625, -0.222412109375, -0.0252685546875, 0.171875, 0.3690185546875, 0.566162109375, 0.7633056640625, 0.96044921875, 1.1575927734375, 1.354736328125, 1.5518798828125, 1.7490234375, 1.9461669921875, 2.143310546875, 2.3404541015625, 2.53759765625, 2.7347412109375, 2.931884765625, 3.1290283203125, 3.326171875, 3.5233154296875, 3.720458984375, 3.9176025390625, 4.11474609375, 4.3118896484375, 4.509033203125, 4.7061767578125, 4.9033203125, 5.1004638671875, 5.297607421875, 5.4947509765625, 5.69189453125, 5.8890380859375, 6.086181640625, 6.2833251953125, 6.48046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 8.0, 14.0, 14.0, 19.0, 18.0, 22.0, 35.0, 43.0, 59.0, 80.0, 123.0, 88.0, 102.0, 83.0, 78.0, 62.0, 44.0, 29.0, 18.0, 18.0, 10.0, 8.0, 10.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005640983581542969, -0.0005357041954994202, -0.0005073100328445435, -0.00047891587018966675, -0.00045052170753479004, -0.00042212754487991333, -0.0003937333822250366, -0.0003653392195701599, -0.0003369450569152832, -0.0003085508942604065, -0.0002801567316055298, -0.0002517625689506531, -0.00022336840629577637, -0.00019497424364089966, -0.00016658008098602295, -0.00013818591833114624, -0.00010979175567626953, -8.139759302139282e-05, -5.300343036651611e-05, -2.4609267711639404e-05, 3.7848949432373047e-06, 3.2179057598114014e-05, 6.057322025299072e-05, 8.896738290786743e-05, 0.00011736154556274414, 0.00014575570821762085, 0.00017414987087249756, 0.00020254403352737427, 0.00023093819618225098, 0.0002593323588371277, 0.0002877265214920044, 0.0003161206841468811, 0.0003445148468017578, 0.0003729090094566345, 0.00040130317211151123, 0.00042969733476638794, 0.00045809149742126465, 0.00048648566007614136, 0.0005148798227310181, 0.0005432739853858948, 0.0005716681480407715, 0.0006000623106956482, 0.0006284564733505249, 0.0006568506360054016, 0.0006852447986602783, 0.000713638961315155, 0.0007420331239700317, 0.0007704272866249084, 0.0007988214492797852, 0.0008272156119346619, 0.0008556097745895386, 0.0008840039372444153, 0.000912398099899292, 0.0009407922625541687, 0.0009691864252090454, 0.0009975805878639221, 0.0010259747505187988, 0.0010543689131736755, 0.0010827630758285522, 0.001111157238483429, 0.0011395514011383057, 0.0011679455637931824, 0.001196339726448059, 0.0012247338891029358, 0.0012531280517578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 29.0, 28.0, 35.0, 69.0, 99.0, 212.0, 261.0, 483.0, 788.0, 1345.0, 2278.0, 4018.0, 6462.0, 11441.0, 19519.0, 33347.0, 56324.0, 90044.0, 131396.0, 163485.0, 163990.0, 133061.0, 91188.0, 57117.0, 33925.0, 19729.0, 11468.0, 6637.0, 3925.0, 2332.0, 1403.0, 835.0, 478.0, 310.0, 163.0, 118.0, 65.0, 38.0, 31.0, 23.0, 14.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.85546875, -4.69891357421875, -4.5423583984375, -4.38580322265625, -4.229248046875, -4.07269287109375, -3.9161376953125, -3.75958251953125, -3.60302734375, -3.44647216796875, -3.2899169921875, -3.13336181640625, -2.976806640625, -2.82025146484375, -2.6636962890625, -2.50714111328125, -2.3505859375, -2.19403076171875, -2.0374755859375, -1.88092041015625, -1.724365234375, -1.56781005859375, -1.4112548828125, -1.25469970703125, -1.09814453125, -0.94158935546875, -0.7850341796875, -0.62847900390625, -0.471923828125, -0.31536865234375, -0.1588134765625, -0.00225830078125, 0.154296875, 0.31085205078125, 0.4674072265625, 0.62396240234375, 0.780517578125, 0.93707275390625, 1.0936279296875, 1.25018310546875, 1.40673828125, 1.56329345703125, 1.7198486328125, 1.87640380859375, 2.032958984375, 2.18951416015625, 2.3460693359375, 2.50262451171875, 2.6591796875, 2.81573486328125, 2.9722900390625, 3.12884521484375, 3.285400390625, 3.44195556640625, 3.5985107421875, 3.75506591796875, 3.91162109375, 4.06817626953125, 4.2247314453125, 4.38128662109375, 4.537841796875, 4.69439697265625, 4.8509521484375, 5.00750732421875, 5.1640625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 4.0, 9.0, 3.0, 11.0, 20.0, 20.0, 29.0, 25.0, 29.0, 39.0, 37.0, 49.0, 44.0, 58.0, 55.0, 63.0, 72.0, 54.0, 50.0, 53.0, 40.0, 34.0, 31.0, 32.0, 24.0, 22.0, 27.0, 16.0, 11.0, 3.0, 6.0, 3.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.81689453125, -1.7548828125, -1.69287109375, -1.630859375, -1.56884765625, -1.5068359375, -1.44482421875, -1.3828125, -1.32080078125, -1.2587890625, -1.19677734375, -1.134765625, -1.07275390625, -1.0107421875, -0.94873046875, -0.88671875, -0.82470703125, -0.7626953125, -0.70068359375, -0.638671875, -0.57666015625, -0.5146484375, -0.45263671875, -0.390625, -0.32861328125, -0.2666015625, -0.20458984375, -0.142578125, -0.08056640625, -0.0185546875, 0.04345703125, 0.10546875, 0.16748046875, 0.2294921875, 0.29150390625, 0.353515625, 0.41552734375, 0.4775390625, 0.53955078125, 0.6015625, 0.66357421875, 0.7255859375, 0.78759765625, 0.849609375, 0.91162109375, 0.9736328125, 1.03564453125, 1.09765625, 1.15966796875, 1.2216796875, 1.28369140625, 1.345703125, 1.40771484375, 1.4697265625, 1.53173828125, 1.59375, 1.65576171875, 1.7177734375, 1.77978515625, 1.841796875, 1.90380859375, 1.9658203125, 2.02783203125, 2.08984375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 7.0, 10.0, 4.0, 9.0, 9.0, 20.0, 11.0, 11.0, 20.0, 29.0, 29.0, 27.0, 35.0, 40.0, 58.0, 47.0, 51.0, 55.0, 56.0, 47.0, 47.0, 54.0, 38.0, 33.0, 46.0, 37.0, 21.0, 28.0, 19.0, 15.0, 16.0, 14.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.72874927520752, -8.447918891906738, -8.167088508605957, -7.886258602142334, -7.605428218841553, -7.3245978355407715, -7.043767929077148, -6.762937545776367, -6.482107162475586, -6.201276779174805, -5.920446395874023, -5.6396164894104, -5.358786106109619, -5.077955722808838, -4.797125816345215, -4.516295433044434, -4.235465049743652, -3.954634666442871, -3.673804521560669, -3.392974376678467, -3.1121439933776855, -2.8313136100769043, -2.550483465194702, -2.2696533203125, -1.9888229370117188, -1.707992672920227, -1.4271624088287354, -1.1463321447372437, -0.865501880645752, -0.5846716165542603, -0.30384135246276855, -0.023011088371276855, 0.25781917572021484, 0.5386494398117065, 0.8194797039031982, 1.10030996799469, 1.3811402320861816, 1.6619704961776733, 1.942800760269165, 2.223630905151367, 2.5044612884521484, 2.7852916717529297, 3.066121816635132, 3.346951961517334, 3.6277823448181152, 3.9086127281188965, 4.1894426345825195, 4.470273017883301, 4.751103401184082, 5.031933784484863, 5.3127641677856445, 5.593594074249268, 5.874424457550049, 6.15525484085083, 6.436084747314453, 6.716915130615234, 6.997745513916016, 7.278575897216797, 7.559406280517578, 7.840236186981201, 8.12106704711914, 8.401896476745605, 8.682726860046387, 8.963557243347168, 9.24438762664795]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 3.0, 7.0, 8.0, 5.0, 8.0, 6.0, 18.0, 16.0, 13.0, 17.0, 20.0, 21.0, 29.0, 20.0, 25.0, 37.0, 26.0, 36.0, 41.0, 36.0, 39.0, 42.0, 36.0, 43.0, 36.0, 36.0, 33.0, 30.0, 38.0, 33.0, 53.0, 21.0, 22.0, 29.0, 14.0, 18.0, 16.0, 12.0, 10.0, 10.0, 3.0, 10.0, 6.0, 2.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.567232608795166, -7.347975730895996, -7.128719329833984, -6.9094624519348145, -6.690206050872803, -6.470949172973633, -6.251692771911621, -6.032435894012451, -5.8131794929504395, -5.5939226150512695, -5.374666213989258, -5.155409336090088, -4.936152935028076, -4.716896057128906, -4.4976396560668945, -4.278382778167725, -4.059125900268555, -3.839869260787964, -3.620612621307373, -3.4013559818267822, -3.1820993423461914, -2.9628424644470215, -2.7435860633850098, -2.52432918548584, -2.305072784423828, -2.0858161449432373, -1.8665595054626465, -1.6473028659820557, -1.4280462265014648, -1.2087894678115845, -0.9895328283309937, -0.7702761888504028, -0.5510196685791016, -0.33176302909851074, -0.11250635981559753, 0.10675030946731567, 0.3260069489479065, 0.5452636480331421, 0.7645202875137329, 0.9837769269943237, 1.2030335664749146, 1.4222902059555054, 1.6415468454360962, 1.8608036041259766, 2.0800602436065674, 2.299316883087158, 2.518573522567749, 2.73783016204834, 2.9570868015289307, 3.1763434410095215, 3.3956000804901123, 3.614856719970703, 3.834113359451294, 4.053369998931885, 4.272626876831055, 4.491883277893066, 4.711140155792236, 4.930397033691406, 5.149653434753418, 5.368910312652588, 5.5881667137146, 5.8074235916137695, 6.026679992675781, 6.245936870574951, 6.465193271636963]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 14.0, 23.0, 25.0, 44.0, 54.0, 107.0, 164.0, 228.0, 368.0, 584.0, 997.0, 1617.0, 2695.0, 4408.0, 7576.0, 13339.0, 24039.0, 46071.0, 91898.0, 194552.0, 423329.0, 825026.0, 1055337.0, 765403.0, 382508.0, 175601.0, 83415.0, 42030.0, 22697.0, 12466.0, 6974.0, 4157.0, 2491.0, 1560.0, 963.0, 564.0, 342.0, 223.0, 128.0, 88.0, 60.0, 40.0, 21.0, 16.0, 13.0, 14.0, 4.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.781005859375, -7.50732421875, -7.233642578125, -6.9599609375, -6.686279296875, -6.41259765625, -6.138916015625, -5.865234375, -5.591552734375, -5.31787109375, -5.044189453125, -4.7705078125, -4.496826171875, -4.22314453125, -3.949462890625, -3.67578125, -3.402099609375, -3.12841796875, -2.854736328125, -2.5810546875, -2.307373046875, -2.03369140625, -1.760009765625, -1.486328125, -1.212646484375, -0.93896484375, -0.665283203125, -0.3916015625, -0.117919921875, 0.15576171875, 0.429443359375, 0.703125, 0.976806640625, 1.25048828125, 1.524169921875, 1.7978515625, 2.071533203125, 2.34521484375, 2.618896484375, 2.892578125, 3.166259765625, 3.43994140625, 3.713623046875, 3.9873046875, 4.260986328125, 4.53466796875, 4.808349609375, 5.08203125, 5.355712890625, 5.62939453125, 5.903076171875, 6.1767578125, 6.450439453125, 6.72412109375, 6.997802734375, 7.271484375, 7.545166015625, 7.81884765625, 8.092529296875, 8.3662109375, 8.639892578125, 8.91357421875, 9.187255859375, 9.4609375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 7.0, 8.0, 3.0, 8.0, 10.0, 12.0, 12.0, 15.0, 20.0, 26.0, 16.0, 19.0, 21.0, 21.0, 36.0, 34.0, 30.0, 35.0, 46.0, 39.0, 50.0, 37.0, 30.0, 42.0, 34.0, 51.0, 35.0, 34.0, 39.0, 39.0, 37.0, 27.0, 17.0, 12.0, 16.0, 16.0, 21.0, 12.0, 8.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.19921875, -5.0399169921875, -4.880615234375, -4.7213134765625, -4.56201171875, -4.4027099609375, -4.243408203125, -4.0841064453125, -3.9248046875, -3.7655029296875, -3.606201171875, -3.4468994140625, -3.28759765625, -3.1282958984375, -2.968994140625, -2.8096923828125, -2.650390625, -2.4910888671875, -2.331787109375, -2.1724853515625, -2.01318359375, -1.8538818359375, -1.694580078125, -1.5352783203125, -1.3759765625, -1.2166748046875, -1.057373046875, -0.8980712890625, -0.73876953125, -0.5794677734375, -0.420166015625, -0.2608642578125, -0.1015625, 0.0577392578125, 0.217041015625, 0.3763427734375, 0.53564453125, 0.6949462890625, 0.854248046875, 1.0135498046875, 1.1728515625, 1.3321533203125, 1.491455078125, 1.6507568359375, 1.81005859375, 1.9693603515625, 2.128662109375, 2.2879638671875, 2.447265625, 2.6065673828125, 2.765869140625, 2.9251708984375, 3.08447265625, 3.2437744140625, 3.403076171875, 3.5623779296875, 3.7216796875, 3.8809814453125, 4.040283203125, 4.1995849609375, 4.35888671875, 4.5181884765625, 4.677490234375, 4.8367919921875, 4.99609375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 12.0, 17.0, 26.0, 36.0, 48.0, 70.0, 100.0, 165.0, 267.0, 383.0, 586.0, 893.0, 1353.0, 2171.0, 3624.0, 5987.0, 9772.0, 16627.0, 28222.0, 50388.0, 91728.0, 171235.0, 317893.0, 567945.0, 841816.0, 835389.0, 557480.0, 313184.0, 167994.0, 90580.0, 49265.0, 28195.0, 16075.0, 9459.0, 5711.0, 3434.0, 2248.0, 1355.0, 893.0, 564.0, 346.0, 247.0, 172.0, 110.0, 66.0, 41.0, 37.0, 26.0, 19.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-7.8984375, -7.6514892578125, -7.404541015625, -7.1575927734375, -6.91064453125, -6.6636962890625, -6.416748046875, -6.1697998046875, -5.9228515625, -5.6759033203125, -5.428955078125, -5.1820068359375, -4.93505859375, -4.6881103515625, -4.441162109375, -4.1942138671875, -3.947265625, -3.7003173828125, -3.453369140625, -3.2064208984375, -2.95947265625, -2.7125244140625, -2.465576171875, -2.2186279296875, -1.9716796875, -1.7247314453125, -1.477783203125, -1.2308349609375, -0.98388671875, -0.7369384765625, -0.489990234375, -0.2430419921875, 0.00390625, 0.2508544921875, 0.497802734375, 0.7447509765625, 0.99169921875, 1.2386474609375, 1.485595703125, 1.7325439453125, 1.9794921875, 2.2264404296875, 2.473388671875, 2.7203369140625, 2.96728515625, 3.2142333984375, 3.461181640625, 3.7081298828125, 3.955078125, 4.2020263671875, 4.448974609375, 4.6959228515625, 4.94287109375, 5.1898193359375, 5.436767578125, 5.6837158203125, 5.9306640625, 6.1776123046875, 6.424560546875, 6.6715087890625, 6.91845703125, 7.1654052734375, 7.412353515625, 7.6593017578125, 7.90625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 11.0, 20.0, 17.0, 31.0, 40.0, 38.0, 54.0, 77.0, 94.0, 117.0, 146.0, 143.0, 197.0, 242.0, 279.0, 294.0, 298.0, 273.0, 291.0, 204.0, 209.0, 185.0, 152.0, 131.0, 105.0, 72.0, 80.0, 49.0, 37.0, 34.0, 32.0, 23.0, 21.0, 15.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.666015625, -2.57318115234375, -2.4803466796875, -2.38751220703125, -2.294677734375, -2.20184326171875, -2.1090087890625, -2.01617431640625, -1.92333984375, -1.83050537109375, -1.7376708984375, -1.64483642578125, -1.552001953125, -1.45916748046875, -1.3663330078125, -1.27349853515625, -1.1806640625, -1.08782958984375, -0.9949951171875, -0.90216064453125, -0.809326171875, -0.71649169921875, -0.6236572265625, -0.53082275390625, -0.43798828125, -0.34515380859375, -0.2523193359375, -0.15948486328125, -0.066650390625, 0.02618408203125, 0.1190185546875, 0.21185302734375, 0.3046875, 0.39752197265625, 0.4903564453125, 0.58319091796875, 0.676025390625, 0.76885986328125, 0.8616943359375, 0.95452880859375, 1.04736328125, 1.14019775390625, 1.2330322265625, 1.32586669921875, 1.418701171875, 1.51153564453125, 1.6043701171875, 1.69720458984375, 1.7900390625, 1.88287353515625, 1.9757080078125, 2.06854248046875, 2.161376953125, 2.25421142578125, 2.3470458984375, 2.43988037109375, 2.53271484375, 2.62554931640625, 2.7183837890625, 2.81121826171875, 2.904052734375, 2.99688720703125, 3.0897216796875, 3.18255615234375, 3.275390625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 15.0, 12.0, 11.0, 14.0, 19.0, 28.0, 27.0, 32.0, 32.0, 39.0, 38.0, 40.0, 56.0, 67.0, 67.0, 56.0, 51.0, 66.0, 43.0, 52.0, 41.0, 35.0, 26.0, 20.0, 25.0, 18.0, 10.0, 10.0, 7.0, 7.0, 10.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.182652473449707, -9.896796226501465, -9.610940933227539, -9.325084686279297, -9.039228439331055, -8.753372192382812, -8.467516899108887, -8.181660652160645, -7.895804405212402, -7.609948635101318, -7.324092388153076, -7.038236618041992, -6.75238037109375, -6.466524600982666, -6.180668830871582, -5.89481258392334, -5.608956813812256, -5.323101043701172, -5.03724479675293, -4.751389026641846, -4.4655327796936035, -4.1796770095825195, -3.8938210010528564, -3.6079649925231934, -3.3221089839935303, -3.036252975463867, -2.750396966934204, -2.464540958404541, -2.178685188293457, -1.8928290605545044, -1.6069731712341309, -1.3211171627044678, -1.0352611541748047, -0.7494051456451416, -0.4635491967201233, -0.17769324779510498, 0.1081627607345581, 0.3940187692642212, 0.6798746585845947, 0.9657306671142578, 1.251586675643921, 1.537442684173584, 1.823298692703247, 2.10915470123291, 2.395010471343994, 2.6808667182922363, 2.9667224884033203, 3.2525784969329834, 3.5384345054626465, 3.8242905139923096, 4.110146522521973, 4.396002292633057, 4.681858539581299, 4.967714309692383, 5.253570556640625, 5.539426326751709, 5.825282096862793, 6.111137866973877, 6.396994113922119, 6.682849884033203, 6.968706130981445, 7.254561901092529, 7.540417671203613, 7.8262739181518555, 8.112130165100098]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 11.0, 8.0, 10.0, 13.0, 18.0, 16.0, 30.0, 24.0, 25.0, 23.0, 42.0, 34.0, 37.0, 34.0, 38.0, 46.0, 47.0, 47.0, 27.0, 37.0, 40.0, 34.0, 32.0, 43.0, 33.0, 34.0, 31.0, 28.0, 24.0, 15.0, 26.0, 16.0, 14.0, 9.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.041364669799805, -5.8413872718811035, -5.641409873962402, -5.441432952880859, -5.241455554962158, -5.041478157043457, -4.841501235961914, -4.641523838043213, -4.441546440124512, -4.2415690422058105, -4.041591644287109, -3.8416147232055664, -3.6416373252868652, -3.441659927368164, -3.241682767868042, -3.04170560836792, -2.8417282104492188, -2.6417508125305176, -2.4417736530303955, -2.2417964935302734, -2.0418190956115723, -1.8418418169021606, -1.641864538192749, -1.4418872594833374, -1.2419099807739258, -1.0419327020645142, -0.8419554233551025, -0.6419781446456909, -0.4420008659362793, -0.24202358722686768, -0.042046308517456055, 0.15793097019195557, 0.357907772064209, 0.5578850507736206, 0.7578623294830322, 0.9578396081924438, 1.1578168869018555, 1.357794165611267, 1.5577714443206787, 1.7577487230300903, 1.957726001739502, 2.157703399658203, 2.357680559158325, 2.5576577186584473, 2.7576351165771484, 2.9576125144958496, 3.1575896739959717, 3.3575668334960938, 3.557544231414795, 3.757521629333496, 3.957498788833618, 4.15747594833374, 4.357453346252441, 4.557430744171143, 4.757408142089844, 4.957385063171387, 5.157362461090088, 5.357339859008789, 5.557316780090332, 5.757294178009033, 5.957271575927734, 6.1572489738464355, 6.357226371765137, 6.55720329284668, 6.757180690765381]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 2.0, 7.0, 11.0, 12.0, 22.0, 22.0, 21.0, 31.0, 49.0, 58.0, 102.0, 107.0, 166.0, 214.0, 325.0, 497.0, 687.0, 967.0, 1475.0, 2250.0, 3623.0, 6228.0, 11967.0, 26220.0, 62385.0, 155953.0, 295129.0, 262569.0, 122678.0, 49334.0, 20683.0, 9864.0, 5415.0, 3184.0, 1988.0, 1275.0, 946.0, 628.0, 402.0, 328.0, 193.0, 143.0, 89.0, 78.0, 59.0, 44.0, 37.0, 25.0, 23.0, 13.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.921875, -10.55615234375, -10.1904296875, -9.82470703125, -9.458984375, -9.09326171875, -8.7275390625, -8.36181640625, -7.99609375, -7.63037109375, -7.2646484375, -6.89892578125, -6.533203125, -6.16748046875, -5.8017578125, -5.43603515625, -5.0703125, -4.70458984375, -4.3388671875, -3.97314453125, -3.607421875, -3.24169921875, -2.8759765625, -2.51025390625, -2.14453125, -1.77880859375, -1.4130859375, -1.04736328125, -0.681640625, -0.31591796875, 0.0498046875, 0.41552734375, 0.78125, 1.14697265625, 1.5126953125, 1.87841796875, 2.244140625, 2.60986328125, 2.9755859375, 3.34130859375, 3.70703125, 4.07275390625, 4.4384765625, 4.80419921875, 5.169921875, 5.53564453125, 5.9013671875, 6.26708984375, 6.6328125, 6.99853515625, 7.3642578125, 7.72998046875, 8.095703125, 8.46142578125, 8.8271484375, 9.19287109375, 9.55859375, 9.92431640625, 10.2900390625, 10.65576171875, 11.021484375, 11.38720703125, 11.7529296875, 12.11865234375, 12.484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 13.0, 12.0, 12.0, 17.0, 18.0, 19.0, 21.0, 26.0, 32.0, 24.0, 24.0, 37.0, 33.0, 51.0, 36.0, 43.0, 34.0, 31.0, 37.0, 39.0, 50.0, 36.0, 36.0, 27.0, 42.0, 25.0, 32.0, 28.0, 20.0, 18.0, 24.0, 15.0, 20.0, 14.0, 11.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.96630859375, -5.7724609375, -5.57861328125, -5.384765625, -5.19091796875, -4.9970703125, -4.80322265625, -4.609375, -4.41552734375, -4.2216796875, -4.02783203125, -3.833984375, -3.64013671875, -3.4462890625, -3.25244140625, -3.05859375, -2.86474609375, -2.6708984375, -2.47705078125, -2.283203125, -2.08935546875, -1.8955078125, -1.70166015625, -1.5078125, -1.31396484375, -1.1201171875, -0.92626953125, -0.732421875, -0.53857421875, -0.3447265625, -0.15087890625, 0.04296875, 0.23681640625, 0.4306640625, 0.62451171875, 0.818359375, 1.01220703125, 1.2060546875, 1.39990234375, 1.59375, 1.78759765625, 1.9814453125, 2.17529296875, 2.369140625, 2.56298828125, 2.7568359375, 2.95068359375, 3.14453125, 3.33837890625, 3.5322265625, 3.72607421875, 3.919921875, 4.11376953125, 4.3076171875, 4.50146484375, 4.6953125, 4.88916015625, 5.0830078125, 5.27685546875, 5.470703125, 5.66455078125, 5.8583984375, 6.05224609375, 6.24609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 8.0, 5.0, 7.0, 11.0, 23.0, 18.0, 33.0, 31.0, 61.0, 69.0, 96.0, 111.0, 175.0, 230.0, 346.0, 534.0, 897.0, 1352.0, 2181.0, 3926.0, 7516.0, 17012.0, 50680.0, 190612.0, 462122.0, 216227.0, 56908.0, 18663.0, 8046.0, 4127.0, 2318.0, 1396.0, 881.0, 541.0, 434.0, 288.0, 186.0, 133.0, 75.0, 72.0, 59.0, 40.0, 39.0, 22.0, 11.0, 12.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-17.90625, -17.320068359375, -16.73388671875, -16.147705078125, -15.5615234375, -14.975341796875, -14.38916015625, -13.802978515625, -13.216796875, -12.630615234375, -12.04443359375, -11.458251953125, -10.8720703125, -10.285888671875, -9.69970703125, -9.113525390625, -8.52734375, -7.941162109375, -7.35498046875, -6.768798828125, -6.1826171875, -5.596435546875, -5.01025390625, -4.424072265625, -3.837890625, -3.251708984375, -2.66552734375, -2.079345703125, -1.4931640625, -0.906982421875, -0.32080078125, 0.265380859375, 0.8515625, 1.437744140625, 2.02392578125, 2.610107421875, 3.1962890625, 3.782470703125, 4.36865234375, 4.954833984375, 5.541015625, 6.127197265625, 6.71337890625, 7.299560546875, 7.8857421875, 8.471923828125, 9.05810546875, 9.644287109375, 10.23046875, 10.816650390625, 11.40283203125, 11.989013671875, 12.5751953125, 13.161376953125, 13.74755859375, 14.333740234375, 14.919921875, 15.506103515625, 16.09228515625, 16.678466796875, 17.2646484375, 17.850830078125, 18.43701171875, 19.023193359375, 19.609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 6.0, 12.0, 18.0, 11.0, 17.0, 16.0, 15.0, 26.0, 28.0, 25.0, 24.0, 25.0, 33.0, 28.0, 41.0, 48.0, 32.0, 41.0, 49.0, 31.0, 43.0, 44.0, 42.0, 35.0, 31.0, 43.0, 32.0, 26.0, 36.0, 20.0, 18.0, 12.0, 14.0, 12.0, 10.0, 5.0, 7.0, 11.0, 4.0, 6.0, 3.0, 5.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.9210205078125, -3.799072265625, -3.6771240234375, -3.55517578125, -3.4332275390625, -3.311279296875, -3.1893310546875, -3.0673828125, -2.9454345703125, -2.823486328125, -2.7015380859375, -2.57958984375, -2.4576416015625, -2.335693359375, -2.2137451171875, -2.091796875, -1.9698486328125, -1.847900390625, -1.7259521484375, -1.60400390625, -1.4820556640625, -1.360107421875, -1.2381591796875, -1.1162109375, -0.9942626953125, -0.872314453125, -0.7503662109375, -0.62841796875, -0.5064697265625, -0.384521484375, -0.2625732421875, -0.140625, -0.0186767578125, 0.103271484375, 0.2252197265625, 0.34716796875, 0.4691162109375, 0.591064453125, 0.7130126953125, 0.8349609375, 0.9569091796875, 1.078857421875, 1.2008056640625, 1.32275390625, 1.4447021484375, 1.566650390625, 1.6885986328125, 1.810546875, 1.9324951171875, 2.054443359375, 2.1763916015625, 2.29833984375, 2.4202880859375, 2.542236328125, 2.6641845703125, 2.7861328125, 2.9080810546875, 3.030029296875, 3.1519775390625, 3.27392578125, 3.3958740234375, 3.517822265625, 3.6397705078125, 3.76171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 7.0, 4.0, 4.0, 8.0, 16.0, 22.0, 14.0, 41.0, 50.0, 53.0, 113.0, 128.0, 217.0, 303.0, 455.0, 705.0, 1115.0, 1805.0, 3185.0, 6411.0, 14657.0, 46160.0, 202113.0, 512033.0, 187342.0, 43492.0, 14159.0, 6070.0, 3016.0, 1731.0, 1129.0, 652.0, 427.0, 287.0, 187.0, 127.0, 88.0, 63.0, 62.0, 37.0, 18.0, 16.0, 15.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.265625, -10.9388427734375, -10.612060546875, -10.2852783203125, -9.95849609375, -9.6317138671875, -9.304931640625, -8.9781494140625, -8.6513671875, -8.3245849609375, -7.997802734375, -7.6710205078125, -7.34423828125, -7.0174560546875, -6.690673828125, -6.3638916015625, -6.037109375, -5.7103271484375, -5.383544921875, -5.0567626953125, -4.72998046875, -4.4031982421875, -4.076416015625, -3.7496337890625, -3.4228515625, -3.0960693359375, -2.769287109375, -2.4425048828125, -2.11572265625, -1.7889404296875, -1.462158203125, -1.1353759765625, -0.80859375, -0.4818115234375, -0.155029296875, 0.1717529296875, 0.49853515625, 0.8253173828125, 1.152099609375, 1.4788818359375, 1.8056640625, 2.1324462890625, 2.459228515625, 2.7860107421875, 3.11279296875, 3.4395751953125, 3.766357421875, 4.0931396484375, 4.419921875, 4.7467041015625, 5.073486328125, 5.4002685546875, 5.72705078125, 6.0538330078125, 6.380615234375, 6.7073974609375, 7.0341796875, 7.3609619140625, 7.687744140625, 8.0145263671875, 8.34130859375, 8.6680908203125, 8.994873046875, 9.3216552734375, 9.6484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 10.0, 26.0, 32.0, 88.0, 143.0, 239.0, 223.0, 122.0, 44.0, 28.0, 12.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0008563995361328125, -0.0008358955383300781, -0.0008153915405273438, -0.0007948875427246094, -0.000774383544921875, -0.0007538795471191406, -0.0007333755493164062, -0.0007128715515136719, -0.0006923675537109375, -0.0006718635559082031, -0.0006513595581054688, -0.0006308555603027344, -0.0006103515625, -0.0005898475646972656, -0.0005693435668945312, -0.0005488395690917969, -0.0005283355712890625, -0.0005078315734863281, -0.00048732757568359375, -0.0004668235778808594, -0.000446319580078125, -0.0004258155822753906, -0.00040531158447265625, -0.0003848075866699219, -0.0003643035888671875, -0.0003437995910644531, -0.00032329559326171875, -0.0003027915954589844, -0.00028228759765625, -0.0002617835998535156, -0.00024127960205078125, -0.00022077560424804688, -0.0002002716064453125, -0.00017976760864257812, -0.00015926361083984375, -0.00013875961303710938, -0.000118255615234375, -9.775161743164062e-05, -7.724761962890625e-05, -5.6743621826171875e-05, -3.62396240234375e-05, -1.5735626220703125e-05, 4.76837158203125e-06, 2.5272369384765625e-05, 4.57763671875e-05, 6.628036499023438e-05, 8.678436279296875e-05, 0.00010728836059570312, 0.0001277923583984375, 0.00014829635620117188, 0.00016880035400390625, 0.00018930435180664062, 0.000209808349609375, 0.00023031234741210938, 0.00025081634521484375, 0.0002713203430175781, 0.0002918243408203125, 0.0003123283386230469, 0.00033283233642578125, 0.0003533363342285156, 0.00037384033203125, 0.0003943443298339844, 0.00041484832763671875, 0.0004353523254394531, 0.0004558563232421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 15.0, 15.0, 14.0, 19.0, 47.0, 53.0, 84.0, 105.0, 134.0, 206.0, 297.0, 427.0, 593.0, 873.0, 1240.0, 1823.0, 2855.0, 5383.0, 12513.0, 39146.0, 145940.0, 397497.0, 304171.0, 89602.0, 24777.0, 8921.0, 4211.0, 2380.0, 1603.0, 1067.0, 715.0, 535.0, 384.0, 249.0, 191.0, 136.0, 93.0, 66.0, 42.0, 31.0, 25.0, 20.0, 13.0, 13.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.53125, -8.25439453125, -7.9775390625, -7.70068359375, -7.423828125, -7.14697265625, -6.8701171875, -6.59326171875, -6.31640625, -6.03955078125, -5.7626953125, -5.48583984375, -5.208984375, -4.93212890625, -4.6552734375, -4.37841796875, -4.1015625, -3.82470703125, -3.5478515625, -3.27099609375, -2.994140625, -2.71728515625, -2.4404296875, -2.16357421875, -1.88671875, -1.60986328125, -1.3330078125, -1.05615234375, -0.779296875, -0.50244140625, -0.2255859375, 0.05126953125, 0.328125, 0.60498046875, 0.8818359375, 1.15869140625, 1.435546875, 1.71240234375, 1.9892578125, 2.26611328125, 2.54296875, 2.81982421875, 3.0966796875, 3.37353515625, 3.650390625, 3.92724609375, 4.2041015625, 4.48095703125, 4.7578125, 5.03466796875, 5.3115234375, 5.58837890625, 5.865234375, 6.14208984375, 6.4189453125, 6.69580078125, 6.97265625, 7.24951171875, 7.5263671875, 7.80322265625, 8.080078125, 8.35693359375, 8.6337890625, 8.91064453125, 9.1875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 6.0, 17.0, 22.0, 45.0, 46.0, 62.0, 117.0, 150.0, 128.0, 116.0, 105.0, 62.0, 45.0, 21.0, 16.0, 11.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.8524169921875, -3.751708984375, -3.6510009765625, -3.55029296875, -3.4495849609375, -3.348876953125, -3.2481689453125, -3.1474609375, -3.0467529296875, -2.946044921875, -2.8453369140625, -2.74462890625, -2.6439208984375, -2.543212890625, -2.4425048828125, -2.341796875, -2.2410888671875, -2.140380859375, -2.0396728515625, -1.93896484375, -1.8382568359375, -1.737548828125, -1.6368408203125, -1.5361328125, -1.4354248046875, -1.334716796875, -1.2340087890625, -1.13330078125, -1.0325927734375, -0.931884765625, -0.8311767578125, -0.73046875, -0.6297607421875, -0.529052734375, -0.4283447265625, -0.32763671875, -0.2269287109375, -0.126220703125, -0.0255126953125, 0.0751953125, 0.1759033203125, 0.276611328125, 0.3773193359375, 0.47802734375, 0.5787353515625, 0.679443359375, 0.7801513671875, 0.880859375, 0.9815673828125, 1.082275390625, 1.1829833984375, 1.28369140625, 1.3843994140625, 1.485107421875, 1.5858154296875, 1.6865234375, 1.7872314453125, 1.887939453125, 1.9886474609375, 2.08935546875, 2.1900634765625, 2.290771484375, 2.3914794921875, 2.4921875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 10.0, 9.0, 7.0, 13.0, 17.0, 25.0, 24.0, 35.0, 37.0, 28.0, 37.0, 37.0, 61.0, 43.0, 52.0, 57.0, 45.0, 64.0, 60.0, 46.0, 55.0, 30.0, 32.0, 28.0, 26.0, 22.0, 15.0, 13.0, 12.0, 10.0, 18.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.566675186157227, -9.304231643676758, -9.041787147521973, -8.779343605041504, -8.516899108886719, -8.25445556640625, -7.992011547088623, -7.729567527770996, -7.467123508453369, -7.204679489135742, -6.942235469818115, -6.679791450500488, -6.4173479080200195, -6.154903411865234, -5.892459869384766, -5.630015850067139, -5.367571830749512, -5.105127811431885, -4.842683792114258, -4.580239772796631, -4.317795753479004, -4.055352210998535, -3.792908191680908, -3.5304641723632812, -3.2680201530456543, -3.0055761337280273, -2.7431321144104004, -2.4806883335113525, -2.2182443141937256, -1.9558002948760986, -1.6933563947677612, -1.4309124946594238, -1.1684694290161133, -0.9060254693031311, -0.6435815095901489, -0.38113754987716675, -0.11869359016418457, 0.14375042915344238, 0.4061943292617798, 0.6686382293701172, 0.9310822486877441, 1.193526268005371, 1.4559701681137085, 1.718414068222046, 1.9808580875396729, 2.2433021068573, 2.5057458877563477, 2.7681899070739746, 3.0306339263916016, 3.2930779457092285, 3.5555219650268555, 3.8179657459259033, 4.080410003662109, 4.342853546142578, 4.605297565460205, 4.867741584777832, 5.130185604095459, 5.392629623413086, 5.655073642730713, 5.91751766204834, 6.179961204528809, 6.442405700683594, 6.7048492431640625, 6.9672932624816895, 7.229737281799316]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 11.0, 6.0, 7.0, 6.0, 10.0, 9.0, 24.0, 19.0, 30.0, 20.0, 25.0, 31.0, 25.0, 36.0, 34.0, 39.0, 30.0, 53.0, 41.0, 38.0, 44.0, 46.0, 33.0, 34.0, 31.0, 41.0, 32.0, 36.0, 24.0, 29.0, 35.0, 25.0, 15.0, 13.0, 13.0, 5.0, 11.0, 6.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39036226272583, -5.20006799697876, -5.0097737312316895, -4.819479465484619, -4.629185199737549, -4.4388909339904785, -4.24859619140625, -4.05830192565918, -3.8680078983306885, -3.677713632583618, -3.487419366836548, -3.2971248626708984, -3.106830596923828, -2.916536331176758, -2.7262420654296875, -2.535947799682617, -2.345653533935547, -2.1553592681884766, -1.9650650024414062, -1.7747706174850464, -1.584476351737976, -1.3941820859909058, -1.203887701034546, -1.0135934352874756, -0.8232991695404053, -0.633004903793335, -0.4427105784416199, -0.2524162530899048, -0.06212198734283447, 0.12817227840423584, 0.3184666633605957, 0.508760929107666, 0.6990556716918945, 0.8893499374389648, 1.0796442031860352, 1.269938588142395, 1.4602328538894653, 1.6505271196365356, 1.8408215045928955, 2.031115770339966, 2.221410036087036, 2.4117043018341064, 2.6019985675811768, 2.792293071746826, 2.9825873374938965, 3.172881603240967, 3.363175868988037, 3.5534701347351074, 3.7437644004821777, 3.934058666229248, 4.124352931976318, 4.314647197723389, 4.504941463470459, 4.695235729217529, 4.885530471801758, 5.075824737548828, 5.266119003295898, 5.456413269042969, 5.646707534790039, 5.837001800537109, 6.02729606628418, 6.21759033203125, 6.40788459777832, 6.598178863525391, 6.788473129272461]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 11.0, 31.0, 43.0, 51.0, 84.0, 137.0, 189.0, 297.0, 427.0, 647.0, 962.0, 1390.0, 2251.0, 3602.0, 5561.0, 8837.0, 13770.0, 21888.0, 33952.0, 52084.0, 76169.0, 104075.0, 128284.0, 138219.0, 128039.0, 104106.0, 76889.0, 52283.0, 34102.0, 21942.0, 13783.0, 8595.0, 5617.0, 3486.0, 2323.0, 1461.0, 997.0, 703.0, 453.0, 270.0, 182.0, 135.0, 79.0, 55.0, 37.0, 25.0, 11.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.66796875, -6.46893310546875, -6.2698974609375, -6.07086181640625, -5.871826171875, -5.67279052734375, -5.4737548828125, -5.27471923828125, -5.07568359375, -4.87664794921875, -4.6776123046875, -4.47857666015625, -4.279541015625, -4.08050537109375, -3.8814697265625, -3.68243408203125, -3.4833984375, -3.28436279296875, -3.0853271484375, -2.88629150390625, -2.687255859375, -2.48822021484375, -2.2891845703125, -2.09014892578125, -1.89111328125, -1.69207763671875, -1.4930419921875, -1.29400634765625, -1.094970703125, -0.89593505859375, -0.6968994140625, -0.49786376953125, -0.298828125, -0.09979248046875, 0.0992431640625, 0.29827880859375, 0.497314453125, 0.69635009765625, 0.8953857421875, 1.09442138671875, 1.29345703125, 1.49249267578125, 1.6915283203125, 1.89056396484375, 2.089599609375, 2.28863525390625, 2.4876708984375, 2.68670654296875, 2.8857421875, 3.08477783203125, 3.2838134765625, 3.48284912109375, 3.681884765625, 3.88092041015625, 4.0799560546875, 4.27899169921875, 4.47802734375, 4.67706298828125, 4.8760986328125, 5.07513427734375, 5.274169921875, 5.47320556640625, 5.6722412109375, 5.87127685546875, 6.0703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 10.0, 8.0, 6.0, 6.0, 15.0, 19.0, 20.0, 25.0, 21.0, 24.0, 30.0, 32.0, 32.0, 32.0, 54.0, 43.0, 41.0, 55.0, 52.0, 33.0, 44.0, 41.0, 42.0, 44.0, 38.0, 30.0, 33.0, 32.0, 25.0, 27.0, 23.0, 9.0, 12.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.765625, -5.5518798828125, -5.338134765625, -5.1243896484375, -4.91064453125, -4.6968994140625, -4.483154296875, -4.2694091796875, -4.0556640625, -3.8419189453125, -3.628173828125, -3.4144287109375, -3.20068359375, -2.9869384765625, -2.773193359375, -2.5594482421875, -2.345703125, -2.1319580078125, -1.918212890625, -1.7044677734375, -1.49072265625, -1.2769775390625, -1.063232421875, -0.8494873046875, -0.6357421875, -0.4219970703125, -0.208251953125, 0.0054931640625, 0.21923828125, 0.4329833984375, 0.646728515625, 0.8604736328125, 1.07421875, 1.2879638671875, 1.501708984375, 1.7154541015625, 1.92919921875, 2.1429443359375, 2.356689453125, 2.5704345703125, 2.7841796875, 2.9979248046875, 3.211669921875, 3.4254150390625, 3.63916015625, 3.8529052734375, 4.066650390625, 4.2803955078125, 4.494140625, 4.7078857421875, 4.921630859375, 5.1353759765625, 5.34912109375, 5.5628662109375, 5.776611328125, 5.9903564453125, 6.2041015625, 6.4178466796875, 6.631591796875, 6.8453369140625, 7.05908203125, 7.2728271484375, 7.486572265625, 7.7003173828125, 7.9140625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 21.0, 32.0, 50.0, 49.0, 78.0, 148.0, 212.0, 316.0, 469.0, 737.0, 1105.0, 1646.0, 2463.0, 3812.0, 5770.0, 8536.0, 13126.0, 19310.0, 28227.0, 41317.0, 58517.0, 79131.0, 99490.0, 114942.0, 120704.0, 111722.0, 94094.0, 73080.0, 53982.0, 37682.0, 26040.0, 17283.0, 11631.0, 7720.0, 5123.0, 3399.0, 2263.0, 1472.0, 932.0, 677.0, 401.0, 299.0, 184.0, 119.0, 89.0, 55.0, 36.0, 26.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0], "bins": [-5.46875, -5.30963134765625, -5.1505126953125, -4.99139404296875, -4.832275390625, -4.67315673828125, -4.5140380859375, -4.35491943359375, -4.19580078125, -4.03668212890625, -3.8775634765625, -3.71844482421875, -3.559326171875, -3.40020751953125, -3.2410888671875, -3.08197021484375, -2.9228515625, -2.76373291015625, -2.6046142578125, -2.44549560546875, -2.286376953125, -2.12725830078125, -1.9681396484375, -1.80902099609375, -1.64990234375, -1.49078369140625, -1.3316650390625, -1.17254638671875, -1.013427734375, -0.85430908203125, -0.6951904296875, -0.53607177734375, -0.376953125, -0.21783447265625, -0.0587158203125, 0.10040283203125, 0.259521484375, 0.41864013671875, 0.5777587890625, 0.73687744140625, 0.89599609375, 1.05511474609375, 1.2142333984375, 1.37335205078125, 1.532470703125, 1.69158935546875, 1.8507080078125, 2.00982666015625, 2.1689453125, 2.32806396484375, 2.4871826171875, 2.64630126953125, 2.805419921875, 2.96453857421875, 3.1236572265625, 3.28277587890625, 3.44189453125, 3.60101318359375, 3.7601318359375, 3.91925048828125, 4.078369140625, 4.23748779296875, 4.3966064453125, 4.55572509765625, 4.71484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 2.0, 3.0, 3.0, 17.0, 8.0, 9.0, 13.0, 16.0, 24.0, 10.0, 22.0, 15.0, 27.0, 28.0, 25.0, 36.0, 34.0, 31.0, 41.0, 42.0, 31.0, 45.0, 36.0, 53.0, 42.0, 48.0, 42.0, 32.0, 35.0, 31.0, 16.0, 23.0, 33.0, 26.0, 16.0, 22.0, 13.0, 9.0, 7.0, 6.0, 8.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.203125, -4.0819091796875, -3.960693359375, -3.8394775390625, -3.71826171875, -3.5970458984375, -3.475830078125, -3.3546142578125, -3.2333984375, -3.1121826171875, -2.990966796875, -2.8697509765625, -2.74853515625, -2.6273193359375, -2.506103515625, -2.3848876953125, -2.263671875, -2.1424560546875, -2.021240234375, -1.9000244140625, -1.77880859375, -1.6575927734375, -1.536376953125, -1.4151611328125, -1.2939453125, -1.1727294921875, -1.051513671875, -0.9302978515625, -0.80908203125, -0.6878662109375, -0.566650390625, -0.4454345703125, -0.32421875, -0.2030029296875, -0.081787109375, 0.0394287109375, 0.16064453125, 0.2818603515625, 0.403076171875, 0.5242919921875, 0.6455078125, 0.7667236328125, 0.887939453125, 1.0091552734375, 1.13037109375, 1.2515869140625, 1.372802734375, 1.4940185546875, 1.615234375, 1.7364501953125, 1.857666015625, 1.9788818359375, 2.10009765625, 2.2213134765625, 2.342529296875, 2.4637451171875, 2.5849609375, 2.7061767578125, 2.827392578125, 2.9486083984375, 3.06982421875, 3.1910400390625, 3.312255859375, 3.4334716796875, 3.5546875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 13.0, 26.0, 24.0, 39.0, 69.0, 80.0, 141.0, 217.0, 345.0, 488.0, 778.0, 1242.0, 1963.0, 3248.0, 5271.0, 8884.0, 15127.0, 25896.0, 45427.0, 76952.0, 124855.0, 173985.0, 186140.0, 146174.0, 95021.0, 56435.0, 32839.0, 18793.0, 11129.0, 6425.0, 3980.0, 2429.0, 1521.0, 919.0, 599.0, 358.0, 245.0, 169.0, 101.0, 66.0, 58.0, 24.0, 24.0, 13.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.2274169921875, -4.072021484375, -3.9166259765625, -3.76123046875, -3.6058349609375, -3.450439453125, -3.2950439453125, -3.1396484375, -2.9842529296875, -2.828857421875, -2.6734619140625, -2.51806640625, -2.3626708984375, -2.207275390625, -2.0518798828125, -1.896484375, -1.7410888671875, -1.585693359375, -1.4302978515625, -1.27490234375, -1.1195068359375, -0.964111328125, -0.8087158203125, -0.6533203125, -0.4979248046875, -0.342529296875, -0.1871337890625, -0.03173828125, 0.1236572265625, 0.279052734375, 0.4344482421875, 0.58984375, 0.7452392578125, 0.900634765625, 1.0560302734375, 1.21142578125, 1.3668212890625, 1.522216796875, 1.6776123046875, 1.8330078125, 1.9884033203125, 2.143798828125, 2.2991943359375, 2.45458984375, 2.6099853515625, 2.765380859375, 2.9207763671875, 3.076171875, 3.2315673828125, 3.386962890625, 3.5423583984375, 3.69775390625, 3.8531494140625, 4.008544921875, 4.1639404296875, 4.3193359375, 4.4747314453125, 4.630126953125, 4.7855224609375, 4.94091796875, 5.0963134765625, 5.251708984375, 5.4071044921875, 5.5625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 8.0, 8.0, 12.0, 22.0, 24.0, 37.0, 35.0, 45.0, 66.0, 62.0, 56.0, 73.0, 66.0, 84.0, 62.0, 56.0, 46.0, 44.0, 35.0, 30.0, 29.0, 19.0, 11.0, 16.0, 16.0, 4.0, 9.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.0006461143493652344, -0.0006294958293437958, -0.0006128773093223572, -0.0005962587893009186, -0.00057964026927948, -0.0005630217492580414, -0.0005464032292366028, -0.0005297847092151642, -0.0005131661891937256, -0.000496547669172287, -0.0004799291491508484, -0.0004633106291294098, -0.0004466921091079712, -0.0004300735890865326, -0.000413455069065094, -0.0003968365490436554, -0.0003802180290222168, -0.0003635995090007782, -0.0003469809889793396, -0.000330362468957901, -0.0003137439489364624, -0.0002971254289150238, -0.0002805069088935852, -0.0002638883888721466, -0.000247269868850708, -0.0002306513488292694, -0.0002140328288078308, -0.0001974143087863922, -0.0001807957887649536, -0.00016417726874351501, -0.00014755874872207642, -0.00013094022870063782, -0.00011432170867919922, -9.770318865776062e-05, -8.108466863632202e-05, -6.446614861488342e-05, -4.7847628593444824e-05, -3.1229108572006226e-05, -1.4610588550567627e-05, 2.0079314708709717e-06, 1.862645149230957e-05, 3.524497151374817e-05, 5.186349153518677e-05, 6.848201155662537e-05, 8.510053157806396e-05, 0.00010171905159950256, 0.00011833757162094116, 0.00013495609164237976, 0.00015157461166381836, 0.00016819313168525696, 0.00018481165170669556, 0.00020143017172813416, 0.00021804869174957275, 0.00023466721177101135, 0.00025128573179244995, 0.00026790425181388855, 0.00028452277183532715, 0.00030114129185676575, 0.00031775981187820435, 0.00033437833189964294, 0.00035099685192108154, 0.00036761537194252014, 0.00038423389196395874, 0.00040085241198539734, 0.00041747093200683594]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 13.0, 13.0, 19.0, 37.0, 45.0, 84.0, 139.0, 185.0, 275.0, 455.0, 653.0, 1017.0, 1679.0, 2560.0, 4248.0, 7225.0, 12082.0, 20518.0, 34969.0, 58138.0, 92729.0, 133142.0, 162509.0, 161527.0, 128924.0, 88339.0, 54974.0, 33274.0, 19612.0, 11500.0, 6692.0, 4127.0, 2542.0, 1546.0, 990.0, 568.0, 379.0, 289.0, 172.0, 128.0, 74.0, 39.0, 36.0, 32.0, 21.0, 11.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.74560546875, -3.6162109375, -3.48681640625, -3.357421875, -3.22802734375, -3.0986328125, -2.96923828125, -2.83984375, -2.71044921875, -2.5810546875, -2.45166015625, -2.322265625, -2.19287109375, -2.0634765625, -1.93408203125, -1.8046875, -1.67529296875, -1.5458984375, -1.41650390625, -1.287109375, -1.15771484375, -1.0283203125, -0.89892578125, -0.76953125, -0.64013671875, -0.5107421875, -0.38134765625, -0.251953125, -0.12255859375, 0.0068359375, 0.13623046875, 0.265625, 0.39501953125, 0.5244140625, 0.65380859375, 0.783203125, 0.91259765625, 1.0419921875, 1.17138671875, 1.30078125, 1.43017578125, 1.5595703125, 1.68896484375, 1.818359375, 1.94775390625, 2.0771484375, 2.20654296875, 2.3359375, 2.46533203125, 2.5947265625, 2.72412109375, 2.853515625, 2.98291015625, 3.1123046875, 3.24169921875, 3.37109375, 3.50048828125, 3.6298828125, 3.75927734375, 3.888671875, 4.01806640625, 4.1474609375, 4.27685546875, 4.40625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 15.0, 6.0, 10.0, 17.0, 17.0, 24.0, 37.0, 33.0, 39.0, 35.0, 43.0, 48.0, 51.0, 51.0, 45.0, 53.0, 41.0, 38.0, 42.0, 34.0, 50.0, 41.0, 30.0, 35.0, 22.0, 20.0, 19.0, 18.0, 18.0, 12.0, 5.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.2044219970703125, -1.161773681640625, -1.1191253662109375, -1.07647705078125, -1.0338287353515625, -0.991180419921875, -0.9485321044921875, -0.9058837890625, -0.8632354736328125, -0.820587158203125, -0.7779388427734375, -0.73529052734375, -0.6926422119140625, -0.649993896484375, -0.6073455810546875, -0.564697265625, -0.5220489501953125, -0.479400634765625, -0.4367523193359375, -0.39410400390625, -0.3514556884765625, -0.308807373046875, -0.2661590576171875, -0.2235107421875, -0.1808624267578125, -0.138214111328125, -0.0955657958984375, -0.05291748046875, -0.0102691650390625, 0.032379150390625, 0.0750274658203125, 0.11767578125, 0.1603240966796875, 0.202972412109375, 0.2456207275390625, 0.28826904296875, 0.3309173583984375, 0.373565673828125, 0.4162139892578125, 0.4588623046875, 0.5015106201171875, 0.544158935546875, 0.5868072509765625, 0.62945556640625, 0.6721038818359375, 0.714752197265625, 0.7574005126953125, 0.800048828125, 0.8426971435546875, 0.885345458984375, 0.9279937744140625, 0.97064208984375, 1.0132904052734375, 1.055938720703125, 1.0985870361328125, 1.1412353515625, 1.1838836669921875, 1.226531982421875, 1.2691802978515625, 1.31182861328125, 1.3544769287109375, 1.397125244140625, 1.4397735595703125, 1.482421875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 9.0, 7.0, 16.0, 21.0, 23.0, 30.0, 44.0, 39.0, 43.0, 49.0, 43.0, 54.0, 60.0, 47.0, 68.0, 59.0, 47.0, 48.0, 48.0, 46.0, 30.0, 25.0, 23.0, 16.0, 24.0, 6.0, 11.0, 16.0, 7.0, 8.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.07490348815918, -8.797059059143066, -8.519214630126953, -8.24137020111084, -7.963525772094727, -7.685681343078613, -7.407836437225342, -7.1299920082092285, -6.852147579193115, -6.574303150177002, -6.296458721160889, -6.018614292144775, -5.740769386291504, -5.462924957275391, -5.185080528259277, -4.907236099243164, -4.629391670227051, -4.3515472412109375, -4.073702812194824, -3.795858144760132, -3.5180137157440186, -3.2401692867279053, -2.962324619293213, -2.6844801902770996, -2.4066357612609863, -2.128791332244873, -1.8509467840194702, -1.5731022357940674, -1.295257806777954, -1.0174133777618408, -0.739568829536438, -0.46172428131103516, -0.18388080596923828, 0.09396368265151978, 0.37180817127227783, 0.6496526598930359, 0.927497148513794, 1.2053415775299072, 1.48318612575531, 1.761030673980713, 2.038875102996826, 2.3167195320129395, 2.5945639610290527, 2.872408628463745, 3.1502530574798584, 3.4280974864959717, 3.705942153930664, 3.9837865829467773, 4.261631011962891, 4.539475440979004, 4.817319869995117, 5.0951642990112305, 5.373008728027344, 5.650853157043457, 5.9286980628967285, 6.206542491912842, 6.484386920928955, 6.762231349945068, 7.040075778961182, 7.317920207977295, 7.595765113830566, 7.87360954284668, 8.151453971862793, 8.429298400878906, 8.70714282989502]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 10.0, 7.0, 9.0, 14.0, 16.0, 9.0, 20.0, 21.0, 17.0, 21.0, 29.0, 24.0, 25.0, 28.0, 35.0, 34.0, 37.0, 31.0, 33.0, 44.0, 43.0, 45.0, 40.0, 37.0, 40.0, 31.0, 22.0, 35.0, 27.0, 38.0, 32.0, 22.0, 18.0, 21.0, 16.0, 14.0, 12.0, 8.0, 7.0, 9.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.588812828063965, -6.406785011291504, -6.224756717681885, -6.042728900909424, -5.860701084136963, -5.678673267364502, -5.496644973754883, -5.314617156982422, -5.132589340209961, -4.9505615234375, -4.768533229827881, -4.58650541305542, -4.404477596282959, -4.222449779510498, -4.040421485900879, -3.858393669128418, -3.676365613937378, -3.494337558746338, -3.312309741973877, -3.130281686782837, -2.948253870010376, -2.766225814819336, -2.584197998046875, -2.402169942855835, -2.220141887664795, -2.038113832473755, -1.856086015701294, -1.674057960510254, -1.492030143737793, -1.310002088546753, -1.1279741525650024, -0.945946216583252, -0.763918399810791, -0.5818904638290405, -0.39986249804496765, -0.21783453226089478, -0.03580659627914429, 0.1462213397026062, 0.32824933528900146, 0.510277271270752, 0.6923052072525024, 0.8743331432342529, 1.0563610792160034, 1.238389015197754, 1.420417070388794, 1.6024448871612549, 1.784472942352295, 1.9665008783340454, 2.148528814315796, 2.330556869506836, 2.512584686279297, 2.694612741470337, 2.876640558242798, 3.058668613433838, 3.240696430206299, 3.422724485397339, 3.604752540588379, 3.786780595779419, 3.96880841255188, 4.15083646774292, 4.332864284515381, 4.514892101287842, 4.696920394897461, 4.878948211669922, 5.060976028442383]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 11.0, 10.0, 28.0, 28.0, 44.0, 58.0, 88.0, 131.0, 199.0, 327.0, 475.0, 759.0, 1116.0, 1873.0, 3093.0, 5478.0, 9362.0, 16935.0, 32273.0, 64017.0, 134403.0, 302214.0, 670881.0, 1087862.0, 948878.0, 491293.0, 217082.0, 99008.0, 48071.0, 25054.0, 13826.0, 7592.0, 4525.0, 2606.0, 1732.0, 958.0, 703.0, 411.0, 281.0, 199.0, 113.0, 74.0, 60.0, 44.0, 37.0, 23.0, 9.0, 14.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.0859375, -6.84814453125, -6.6103515625, -6.37255859375, -6.134765625, -5.89697265625, -5.6591796875, -5.42138671875, -5.18359375, -4.94580078125, -4.7080078125, -4.47021484375, -4.232421875, -3.99462890625, -3.7568359375, -3.51904296875, -3.28125, -3.04345703125, -2.8056640625, -2.56787109375, -2.330078125, -2.09228515625, -1.8544921875, -1.61669921875, -1.37890625, -1.14111328125, -0.9033203125, -0.66552734375, -0.427734375, -0.18994140625, 0.0478515625, 0.28564453125, 0.5234375, 0.76123046875, 0.9990234375, 1.23681640625, 1.474609375, 1.71240234375, 1.9501953125, 2.18798828125, 2.42578125, 2.66357421875, 2.9013671875, 3.13916015625, 3.376953125, 3.61474609375, 3.8525390625, 4.09033203125, 4.328125, 4.56591796875, 4.8037109375, 5.04150390625, 5.279296875, 5.51708984375, 5.7548828125, 5.99267578125, 6.23046875, 6.46826171875, 6.7060546875, 6.94384765625, 7.181640625, 7.41943359375, 7.6572265625, 7.89501953125, 8.1328125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 7.0, 10.0, 13.0, 22.0, 21.0, 18.0, 18.0, 29.0, 35.0, 28.0, 27.0, 29.0, 28.0, 30.0, 42.0, 36.0, 41.0, 45.0, 52.0, 44.0, 49.0, 42.0, 35.0, 37.0, 29.0, 37.0, 24.0, 25.0, 26.0, 18.0, 20.0, 18.0, 13.0, 11.0, 10.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.25, -5.1103515625, -4.970703125, -4.8310546875, -4.69140625, -4.5517578125, -4.412109375, -4.2724609375, -4.1328125, -3.9931640625, -3.853515625, -3.7138671875, -3.57421875, -3.4345703125, -3.294921875, -3.1552734375, -3.015625, -2.8759765625, -2.736328125, -2.5966796875, -2.45703125, -2.3173828125, -2.177734375, -2.0380859375, -1.8984375, -1.7587890625, -1.619140625, -1.4794921875, -1.33984375, -1.2001953125, -1.060546875, -0.9208984375, -0.78125, -0.6416015625, -0.501953125, -0.3623046875, -0.22265625, -0.0830078125, 0.056640625, 0.1962890625, 0.3359375, 0.4755859375, 0.615234375, 0.7548828125, 0.89453125, 1.0341796875, 1.173828125, 1.3134765625, 1.453125, 1.5927734375, 1.732421875, 1.8720703125, 2.01171875, 2.1513671875, 2.291015625, 2.4306640625, 2.5703125, 2.7099609375, 2.849609375, 2.9892578125, 3.12890625, 3.2685546875, 3.408203125, 3.5478515625, 3.6875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 9.0, 9.0, 11.0, 17.0, 29.0, 51.0, 74.0, 95.0, 152.0, 245.0, 389.0, 510.0, 863.0, 1312.0, 1935.0, 3159.0, 5055.0, 8305.0, 14021.0, 24441.0, 42661.0, 77885.0, 148480.0, 283034.0, 532400.0, 872063.0, 912395.0, 586691.0, 313271.0, 163557.0, 87140.0, 47479.0, 26838.0, 15453.0, 9264.0, 5648.0, 3334.0, 2195.0, 1335.0, 888.0, 509.0, 350.0, 246.0, 164.0, 92.0, 83.0, 44.0, 33.0, 21.0, 17.0, 9.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0], "bins": [-7.2265625, -7.00811767578125, -6.7896728515625, -6.57122802734375, -6.352783203125, -6.13433837890625, -5.9158935546875, -5.69744873046875, -5.47900390625, -5.26055908203125, -5.0421142578125, -4.82366943359375, -4.605224609375, -4.38677978515625, -4.1683349609375, -3.94989013671875, -3.7314453125, -3.51300048828125, -3.2945556640625, -3.07611083984375, -2.857666015625, -2.63922119140625, -2.4207763671875, -2.20233154296875, -1.98388671875, -1.76544189453125, -1.5469970703125, -1.32855224609375, -1.110107421875, -0.89166259765625, -0.6732177734375, -0.45477294921875, -0.236328125, -0.01788330078125, 0.2005615234375, 0.41900634765625, 0.637451171875, 0.85589599609375, 1.0743408203125, 1.29278564453125, 1.51123046875, 1.72967529296875, 1.9481201171875, 2.16656494140625, 2.385009765625, 2.60345458984375, 2.8218994140625, 3.04034423828125, 3.2587890625, 3.47723388671875, 3.6956787109375, 3.91412353515625, 4.132568359375, 4.35101318359375, 4.5694580078125, 4.78790283203125, 5.00634765625, 5.22479248046875, 5.4432373046875, 5.66168212890625, 5.880126953125, 6.09857177734375, 6.3170166015625, 6.53546142578125, 6.75390625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 6.0, 3.0, 15.0, 23.0, 23.0, 24.0, 36.0, 48.0, 55.0, 63.0, 89.0, 112.0, 131.0, 166.0, 174.0, 203.0, 245.0, 284.0, 258.0, 290.0, 269.0, 253.0, 198.0, 186.0, 145.0, 142.0, 118.0, 74.0, 92.0, 68.0, 60.0, 41.0, 31.0, 27.0, 30.0, 15.0, 16.0, 6.0, 11.0, 11.0, 3.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.076171875, -2.004486083984375, -1.93280029296875, -1.861114501953125, -1.7894287109375, -1.717742919921875, -1.64605712890625, -1.574371337890625, -1.502685546875, -1.430999755859375, -1.35931396484375, -1.287628173828125, -1.2159423828125, -1.144256591796875, -1.07257080078125, -1.000885009765625, -0.92919921875, -0.857513427734375, -0.78582763671875, -0.714141845703125, -0.6424560546875, -0.570770263671875, -0.49908447265625, -0.427398681640625, -0.355712890625, -0.284027099609375, -0.21234130859375, -0.140655517578125, -0.0689697265625, 0.002716064453125, 0.07440185546875, 0.146087646484375, 0.2177734375, 0.289459228515625, 0.36114501953125, 0.432830810546875, 0.5045166015625, 0.576202392578125, 0.64788818359375, 0.719573974609375, 0.791259765625, 0.862945556640625, 0.93463134765625, 1.006317138671875, 1.0780029296875, 1.149688720703125, 1.22137451171875, 1.293060302734375, 1.36474609375, 1.436431884765625, 1.50811767578125, 1.579803466796875, 1.6514892578125, 1.723175048828125, 1.79486083984375, 1.866546630859375, 1.938232421875, 2.009918212890625, 2.08160400390625, 2.153289794921875, 2.2249755859375, 2.296661376953125, 2.36834716796875, 2.440032958984375, 2.51171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 8.0, 10.0, 13.0, 14.0, 26.0, 28.0, 22.0, 37.0, 39.0, 36.0, 46.0, 58.0, 60.0, 62.0, 77.0, 56.0, 52.0, 51.0, 54.0, 59.0, 32.0, 29.0, 26.0, 18.0, 17.0, 7.0, 12.0, 7.0, 11.0, 3.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.877823829650879, -8.616966247558594, -8.356109619140625, -8.09525203704834, -7.834394454956055, -7.573537349700928, -7.312680244445801, -7.051822662353516, -6.790965557098389, -6.530108451843262, -6.269250869750977, -6.00839376449585, -5.747536659240723, -5.4866790771484375, -5.2258219718933105, -4.964964866638184, -4.704107284545898, -4.4432501792907715, -4.182392597198486, -3.9215354919433594, -3.6606781482696533, -3.3998208045959473, -3.1389636993408203, -2.8781063556671143, -2.617249011993408, -2.356391668319702, -2.095534324645996, -1.8346772193908691, -1.573819875717163, -1.312962532043457, -1.0521053075790405, -0.791248083114624, -0.5303916931152344, -0.2695344090461731, -0.008677124977111816, 0.25218015909194946, 0.5130374431610107, 0.7738947868347168, 1.0347520112991333, 1.2956092357635498, 1.5564665794372559, 1.817323923110962, 2.078181266784668, 2.339038372039795, 2.599895715713501, 2.860753059387207, 3.121610164642334, 3.38246750831604, 3.643324851989746, 3.904182195663452, 4.165039539337158, 4.425896644592285, 4.68675422668457, 4.947611331939697, 5.208468437194824, 5.469326019287109, 5.730183124542236, 5.991040229797363, 6.251897811889648, 6.512754917144775, 6.773612022399902, 7.0344696044921875, 7.2953267097473145, 7.556183815002441, 7.817041397094727]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 4.0, 16.0, 23.0, 15.0, 27.0, 18.0, 34.0, 25.0, 24.0, 28.0, 52.0, 43.0, 27.0, 39.0, 48.0, 49.0, 45.0, 47.0, 41.0, 50.0, 34.0, 25.0, 36.0, 43.0, 33.0, 26.0, 25.0, 23.0, 21.0, 20.0, 18.0, 6.0, 9.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0543532371521, -5.8705925941467285, -5.686831951141357, -5.503071308135986, -5.319310665130615, -5.135549545288086, -4.951788902282715, -4.768028259277344, -4.584267616271973, -4.400506973266602, -4.2167463302612305, -4.032985687255859, -3.849224805831909, -3.665464162826538, -3.481703519821167, -3.297942638397217, -3.114182233810425, -2.9304215908050537, -2.7466609477996826, -2.5629000663757324, -2.3791394233703613, -2.1953787803649902, -2.011618137359619, -1.8278573751449585, -1.6440967321395874, -1.4603360891342163, -1.2765753269195557, -1.0928146839141846, -0.9090539813041687, -0.7252932786941528, -0.5415326356887817, -0.3577718734741211, -0.17401123046875, 0.009749457240104675, 0.19351014494895935, 0.37727081775665283, 0.5610315203666687, 0.7447922229766846, 0.9285528659820557, 1.1123136281967163, 1.2960742712020874, 1.4798349142074585, 1.6635956764221191, 1.8473563194274902, 2.0311169624328613, 2.2148776054382324, 2.3986382484436035, 2.5823991298675537, 2.766159772872925, 2.949920415878296, 3.133681058883667, 3.317441940307617, 3.5012025833129883, 3.6849632263183594, 3.8687238693237305, 4.052484512329102, 4.236245155334473, 4.420005798339844, 4.603766441345215, 4.787527084350586, 4.971287727355957, 5.155048370361328, 5.338809013366699, 5.5225701332092285, 5.7063307762146]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 20.0, 33.0, 49.0, 64.0, 125.0, 181.0, 265.0, 397.0, 711.0, 1108.0, 1772.0, 2823.0, 4639.0, 7949.0, 13946.0, 25404.0, 45720.0, 82470.0, 139336.0, 196834.0, 198004.0, 138956.0, 82526.0, 45506.0, 25271.0, 14100.0, 8101.0, 4631.0, 2867.0, 1748.0, 1106.0, 694.0, 404.0, 298.0, 187.0, 103.0, 54.0, 45.0, 37.0, 18.0, 11.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.46771240234375, -5.2791748046875, -5.09063720703125, -4.902099609375, -4.71356201171875, -4.5250244140625, -4.33648681640625, -4.14794921875, -3.95941162109375, -3.7708740234375, -3.58233642578125, -3.393798828125, -3.20526123046875, -3.0167236328125, -2.82818603515625, -2.6396484375, -2.45111083984375, -2.2625732421875, -2.07403564453125, -1.885498046875, -1.69696044921875, -1.5084228515625, -1.31988525390625, -1.13134765625, -0.94281005859375, -0.7542724609375, -0.56573486328125, -0.377197265625, -0.18865966796875, -0.0001220703125, 0.18841552734375, 0.376953125, 0.56549072265625, 0.7540283203125, 0.94256591796875, 1.131103515625, 1.31964111328125, 1.5081787109375, 1.69671630859375, 1.88525390625, 2.07379150390625, 2.2623291015625, 2.45086669921875, 2.639404296875, 2.82794189453125, 3.0164794921875, 3.20501708984375, 3.3935546875, 3.58209228515625, 3.7706298828125, 3.95916748046875, 4.147705078125, 4.33624267578125, 4.5247802734375, 4.71331787109375, 4.90185546875, 5.09039306640625, 5.2789306640625, 5.46746826171875, 5.656005859375, 5.84454345703125, 6.0330810546875, 6.22161865234375, 6.41015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 6.0, 19.0, 15.0, 13.0, 21.0, 20.0, 27.0, 22.0, 30.0, 39.0, 33.0, 41.0, 48.0, 31.0, 40.0, 38.0, 55.0, 57.0, 45.0, 49.0, 31.0, 33.0, 43.0, 35.0, 39.0, 26.0, 29.0, 30.0, 13.0, 15.0, 9.0, 11.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.57421875, -6.383544921875, -6.19287109375, -6.002197265625, -5.8115234375, -5.620849609375, -5.43017578125, -5.239501953125, -5.048828125, -4.858154296875, -4.66748046875, -4.476806640625, -4.2861328125, -4.095458984375, -3.90478515625, -3.714111328125, -3.5234375, -3.332763671875, -3.14208984375, -2.951416015625, -2.7607421875, -2.570068359375, -2.37939453125, -2.188720703125, -1.998046875, -1.807373046875, -1.61669921875, -1.426025390625, -1.2353515625, -1.044677734375, -0.85400390625, -0.663330078125, -0.47265625, -0.281982421875, -0.09130859375, 0.099365234375, 0.2900390625, 0.480712890625, 0.67138671875, 0.862060546875, 1.052734375, 1.243408203125, 1.43408203125, 1.624755859375, 1.8154296875, 2.006103515625, 2.19677734375, 2.387451171875, 2.578125, 2.768798828125, 2.95947265625, 3.150146484375, 3.3408203125, 3.531494140625, 3.72216796875, 3.912841796875, 4.103515625, 4.294189453125, 4.48486328125, 4.675537109375, 4.8662109375, 5.056884765625, 5.24755859375, 5.438232421875, 5.62890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 5.0, 10.0, 8.0, 6.0, 20.0, 25.0, 39.0, 75.0, 119.0, 166.0, 216.0, 304.0, 439.0, 690.0, 1248.0, 2101.0, 3735.0, 7246.0, 16155.0, 40665.0, 117668.0, 321090.0, 334313.0, 125415.0, 42990.0, 16925.0, 7448.0, 3802.0, 2140.0, 1287.0, 742.0, 475.0, 334.0, 197.0, 139.0, 110.0, 54.0, 53.0, 29.0, 25.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 6.0], "bins": [-14.671875, -14.275634765625, -13.87939453125, -13.483154296875, -13.0869140625, -12.690673828125, -12.29443359375, -11.898193359375, -11.501953125, -11.105712890625, -10.70947265625, -10.313232421875, -9.9169921875, -9.520751953125, -9.12451171875, -8.728271484375, -8.33203125, -7.935791015625, -7.53955078125, -7.143310546875, -6.7470703125, -6.350830078125, -5.95458984375, -5.558349609375, -5.162109375, -4.765869140625, -4.36962890625, -3.973388671875, -3.5771484375, -3.180908203125, -2.78466796875, -2.388427734375, -1.9921875, -1.595947265625, -1.19970703125, -0.803466796875, -0.4072265625, -0.010986328125, 0.38525390625, 0.781494140625, 1.177734375, 1.573974609375, 1.97021484375, 2.366455078125, 2.7626953125, 3.158935546875, 3.55517578125, 3.951416015625, 4.34765625, 4.743896484375, 5.14013671875, 5.536376953125, 5.9326171875, 6.328857421875, 6.72509765625, 7.121337890625, 7.517578125, 7.913818359375, 8.31005859375, 8.706298828125, 9.1025390625, 9.498779296875, 9.89501953125, 10.291259765625, 10.6875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 8.0, 5.0, 1.0, 10.0, 11.0, 8.0, 14.0, 17.0, 14.0, 24.0, 24.0, 18.0, 20.0, 30.0, 36.0, 26.0, 23.0, 49.0, 43.0, 39.0, 40.0, 49.0, 44.0, 33.0, 34.0, 39.0, 34.0, 29.0, 33.0, 29.0, 36.0, 19.0, 20.0, 33.0, 16.0, 11.0, 12.0, 16.0, 14.0, 3.0, 14.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.078125, -2.975860595703125, -2.87359619140625, -2.771331787109375, -2.6690673828125, -2.566802978515625, -2.46453857421875, -2.362274169921875, -2.260009765625, -2.157745361328125, -2.05548095703125, -1.953216552734375, -1.8509521484375, -1.748687744140625, -1.64642333984375, -1.544158935546875, -1.44189453125, -1.339630126953125, -1.23736572265625, -1.135101318359375, -1.0328369140625, -0.930572509765625, -0.82830810546875, -0.726043701171875, -0.623779296875, -0.521514892578125, -0.41925048828125, -0.316986083984375, -0.2147216796875, -0.112457275390625, -0.01019287109375, 0.092071533203125, 0.1943359375, 0.296600341796875, 0.39886474609375, 0.501129150390625, 0.6033935546875, 0.705657958984375, 0.80792236328125, 0.910186767578125, 1.012451171875, 1.114715576171875, 1.21697998046875, 1.319244384765625, 1.4215087890625, 1.523773193359375, 1.62603759765625, 1.728302001953125, 1.83056640625, 1.932830810546875, 2.03509521484375, 2.137359619140625, 2.2396240234375, 2.341888427734375, 2.44415283203125, 2.546417236328125, 2.648681640625, 2.750946044921875, 2.85321044921875, 2.955474853515625, 3.0577392578125, 3.160003662109375, 3.26226806640625, 3.364532470703125, 3.466796875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 9.0, 12.0, 22.0, 18.0, 31.0, 39.0, 52.0, 83.0, 120.0, 166.0, 243.0, 353.0, 550.0, 778.0, 1214.0, 1832.0, 3088.0, 5477.0, 10249.0, 20416.0, 44948.0, 108145.0, 251242.0, 314920.0, 159045.0, 65327.0, 28787.0, 13607.0, 7023.0, 3898.0, 2321.0, 1486.0, 964.0, 652.0, 446.0, 301.0, 175.0, 162.0, 109.0, 71.0, 46.0, 38.0, 24.0, 21.0, 19.0, 8.0, 4.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.25164794921875, -4.1009521484375, -3.95025634765625, -3.799560546875, -3.64886474609375, -3.4981689453125, -3.34747314453125, -3.19677734375, -3.04608154296875, -2.8953857421875, -2.74468994140625, -2.593994140625, -2.44329833984375, -2.2926025390625, -2.14190673828125, -1.9912109375, -1.84051513671875, -1.6898193359375, -1.53912353515625, -1.388427734375, -1.23773193359375, -1.0870361328125, -0.93634033203125, -0.78564453125, -0.63494873046875, -0.4842529296875, -0.33355712890625, -0.182861328125, -0.03216552734375, 0.1185302734375, 0.26922607421875, 0.419921875, 0.57061767578125, 0.7213134765625, 0.87200927734375, 1.022705078125, 1.17340087890625, 1.3240966796875, 1.47479248046875, 1.62548828125, 1.77618408203125, 1.9268798828125, 2.07757568359375, 2.228271484375, 2.37896728515625, 2.5296630859375, 2.68035888671875, 2.8310546875, 2.98175048828125, 3.1324462890625, 3.28314208984375, 3.433837890625, 3.58453369140625, 3.7352294921875, 3.88592529296875, 4.03662109375, 4.18731689453125, 4.3380126953125, 4.48870849609375, 4.639404296875, 4.79010009765625, 4.9407958984375, 5.09149169921875, 5.2421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 3.0, 9.0, 12.0, 15.0, 21.0, 27.0, 31.0, 52.0, 52.0, 76.0, 107.0, 108.0, 82.0, 79.0, 85.0, 50.0, 37.0, 26.0, 20.0, 20.0, 12.0, 17.0, 7.0, 5.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00021123886108398438, -0.00020439550280570984, -0.0001975521445274353, -0.00019070878624916077, -0.00018386542797088623, -0.0001770220696926117, -0.00017017871141433716, -0.00016333535313606262, -0.00015649199485778809, -0.00014964863657951355, -0.00014280527830123901, -0.00013596192002296448, -0.00012911856174468994, -0.0001222752034664154, -0.00011543184518814087, -0.00010858848690986633, -0.0001017451286315918, -9.490177035331726e-05, -8.805841207504272e-05, -8.121505379676819e-05, -7.437169551849365e-05, -6.752833724021912e-05, -6.068497896194458e-05, -5.3841620683670044e-05, -4.699826240539551e-05, -4.015490412712097e-05, -3.3311545848846436e-05, -2.64681875705719e-05, -1.9624829292297363e-05, -1.2781471014022827e-05, -5.938112735748291e-06, 9.052455425262451e-07, 7.748603820800781e-06, 1.4591962099075317e-05, 2.1435320377349854e-05, 2.827867865562439e-05, 3.5122036933898926e-05, 4.196539521217346e-05, 4.8808753490448e-05, 5.5652111768722534e-05, 6.249547004699707e-05, 6.93388283252716e-05, 7.618218660354614e-05, 8.302554488182068e-05, 8.986890316009521e-05, 9.671226143836975e-05, 0.00010355561971664429, 0.00011039897799491882, 0.00011724233627319336, 0.0001240856945514679, 0.00013092905282974243, 0.00013777241110801697, 0.0001446157693862915, 0.00015145912766456604, 0.00015830248594284058, 0.0001651458442211151, 0.00017198920249938965, 0.00017883256077766418, 0.00018567591905593872, 0.00019251927733421326, 0.0001993626356124878, 0.00020620599389076233, 0.00021304935216903687, 0.0002198927104473114, 0.00022673606872558594]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 14.0, 16.0, 26.0, 39.0, 55.0, 77.0, 121.0, 137.0, 189.0, 273.0, 381.0, 510.0, 791.0, 1154.0, 1839.0, 3002.0, 5303.0, 9803.0, 19258.0, 39282.0, 80546.0, 157793.0, 239988.0, 222065.0, 131941.0, 65472.0, 32300.0, 15906.0, 8113.0, 4497.0, 2675.0, 1555.0, 1059.0, 672.0, 513.0, 350.0, 214.0, 159.0, 125.0, 94.0, 66.0, 58.0, 38.0, 24.0, 23.0, 10.0, 4.0, 2.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.716796875, -3.600128173828125, -3.48345947265625, -3.366790771484375, -3.2501220703125, -3.133453369140625, -3.01678466796875, -2.900115966796875, -2.783447265625, -2.666778564453125, -2.55010986328125, -2.433441162109375, -2.3167724609375, -2.200103759765625, -2.08343505859375, -1.966766357421875, -1.85009765625, -1.733428955078125, -1.61676025390625, -1.500091552734375, -1.3834228515625, -1.266754150390625, -1.15008544921875, -1.033416748046875, -0.916748046875, -0.800079345703125, -0.68341064453125, -0.566741943359375, -0.4500732421875, -0.333404541015625, -0.21673583984375, -0.100067138671875, 0.0166015625, 0.133270263671875, 0.24993896484375, 0.366607666015625, 0.4832763671875, 0.599945068359375, 0.71661376953125, 0.833282470703125, 0.949951171875, 1.066619873046875, 1.18328857421875, 1.299957275390625, 1.4166259765625, 1.533294677734375, 1.64996337890625, 1.766632080078125, 1.88330078125, 1.999969482421875, 2.11663818359375, 2.233306884765625, 2.3499755859375, 2.466644287109375, 2.58331298828125, 2.699981689453125, 2.816650390625, 2.933319091796875, 3.04998779296875, 3.166656494140625, 3.2833251953125, 3.399993896484375, 3.51666259765625, 3.633331298828125, 3.75]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 15.0, 28.0, 28.0, 34.0, 57.0, 68.0, 89.0, 79.0, 96.0, 89.0, 91.0, 78.0, 65.0, 49.0, 24.0, 20.0, 16.0, 17.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.273468017578125, -1.22760009765625, -1.181732177734375, -1.1358642578125, -1.089996337890625, -1.04412841796875, -0.998260498046875, -0.952392578125, -0.906524658203125, -0.86065673828125, -0.814788818359375, -0.7689208984375, -0.723052978515625, -0.67718505859375, -0.631317138671875, -0.58544921875, -0.539581298828125, -0.49371337890625, -0.447845458984375, -0.4019775390625, -0.356109619140625, -0.31024169921875, -0.264373779296875, -0.218505859375, -0.172637939453125, -0.12677001953125, -0.080902099609375, -0.0350341796875, 0.010833740234375, 0.05670166015625, 0.102569580078125, 0.1484375, 0.194305419921875, 0.24017333984375, 0.286041259765625, 0.3319091796875, 0.377777099609375, 0.42364501953125, 0.469512939453125, 0.515380859375, 0.561248779296875, 0.60711669921875, 0.652984619140625, 0.6988525390625, 0.744720458984375, 0.79058837890625, 0.836456298828125, 0.88232421875, 0.928192138671875, 0.97406005859375, 1.019927978515625, 1.0657958984375, 1.111663818359375, 1.15753173828125, 1.203399658203125, 1.249267578125, 1.295135498046875, 1.34100341796875, 1.386871337890625, 1.4327392578125, 1.478607177734375, 1.52447509765625, 1.570343017578125, 1.6162109375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 2.0, 4.0, 6.0, 9.0, 9.0, 11.0, 18.0, 27.0, 23.0, 31.0, 36.0, 33.0, 44.0, 36.0, 48.0, 64.0, 50.0, 57.0, 59.0, 58.0, 55.0, 54.0, 55.0, 39.0, 35.0, 19.0, 25.0, 17.0, 20.0, 9.0, 4.0, 7.0, 6.0, 3.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.542803764343262, -8.300796508789062, -8.058789253234863, -7.816781997680664, -7.574775218963623, -7.332767963409424, -7.090760707855225, -6.848753452301025, -6.606746673583984, -6.364739418029785, -6.122732162475586, -5.880724906921387, -5.638718128204346, -5.3967108726501465, -5.154703617095947, -4.912696361541748, -4.670689105987549, -4.42868185043335, -4.18667459487915, -3.9446675777435303, -3.70266056060791, -3.460653305053711, -3.2186460494995117, -2.9766387939453125, -2.7346317768096924, -2.492624521255493, -2.250617504119873, -2.008610248565674, -1.7666031122207642, -1.5245959758758545, -1.2825887203216553, -1.0405815839767456, -0.7985744476318359, -0.5565673112869263, -0.3145601153373718, -0.07255291938781738, 0.16945421695709229, 0.41146135330200195, 0.6534686088562012, 0.8954757452011108, 1.1374828815460205, 1.3794900178909302, 1.6214971542358398, 1.863504409790039, 2.1055116653442383, 2.3475186824798584, 2.5895259380340576, 2.8315329551696777, 3.073540210723877, 3.315547466278076, 3.5575544834136963, 3.7995617389678955, 4.041568756103516, 4.283576011657715, 4.525583267211914, 4.767590522766113, 5.0095977783203125, 5.251605033874512, 5.493612289428711, 5.73561954498291, 5.977626323699951, 6.21963357925415, 6.46164083480835, 6.703648090362549, 6.94565486907959]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 12.0, 14.0, 13.0, 23.0, 24.0, 15.0, 21.0, 27.0, 35.0, 36.0, 48.0, 46.0, 30.0, 46.0, 40.0, 44.0, 51.0, 42.0, 42.0, 50.0, 40.0, 33.0, 33.0, 34.0, 42.0, 27.0, 25.0, 21.0, 21.0, 19.0, 10.0, 13.0, 4.0, 10.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.362408638000488, -6.176389694213867, -5.990370750427246, -5.804351329803467, -5.618332386016846, -5.432313442230225, -5.246294021606445, -5.060275077819824, -4.874256134033203, -4.688237190246582, -4.502218246459961, -4.316198825836182, -4.1301798820495605, -3.9441609382629395, -3.7581417560577393, -3.572122573852539, -3.386103630065918, -3.200084686279297, -3.0140655040740967, -2.8280463218688965, -2.6420273780822754, -2.4560084342956543, -2.269989252090454, -2.083970069885254, -1.8979511260986328, -1.7119320631027222, -1.5259130001068115, -1.3398939371109009, -1.1538748741149902, -0.9678558111190796, -0.781836748123169, -0.5958176851272583, -0.40979814529418945, -0.2237790822982788, -0.037760019302368164, 0.14825904369354248, 0.3342781066894531, 0.5202971696853638, 0.7063162326812744, 0.8923352956771851, 1.0783543586730957, 1.2643734216690063, 1.450392484664917, 1.6364115476608276, 1.8224306106567383, 2.0084495544433594, 2.1944687366485596, 2.3804879188537598, 2.566506862640381, 2.752525806427002, 2.938544988632202, 3.1245641708374023, 3.3105831146240234, 3.4966020584106445, 3.6826212406158447, 3.868640422821045, 4.054659366607666, 4.240678310394287, 4.426697731018066, 4.6127166748046875, 4.798735618591309, 4.98475456237793, 5.170773506164551, 5.35679292678833, 5.542811870574951]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 33.0, 23.0, 52.0, 63.0, 108.0, 171.0, 240.0, 351.0, 504.0, 773.0, 1137.0, 1739.0, 2636.0, 3811.0, 5749.0, 8495.0, 12951.0, 19145.0, 28693.0, 41784.0, 61204.0, 85475.0, 111089.0, 129060.0, 130268.0, 113878.0, 89052.0, 64185.0, 44784.0, 30051.0, 20370.0, 13386.0, 8973.0, 6032.0, 3997.0, 2783.0, 1815.0, 1185.0, 778.0, 587.0, 392.0, 252.0, 154.0, 87.0, 81.0, 51.0, 36.0, 24.0, 18.0, 10.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.70703125, -4.56024169921875, -4.4134521484375, -4.26666259765625, -4.119873046875, -3.97308349609375, -3.8262939453125, -3.67950439453125, -3.53271484375, -3.38592529296875, -3.2391357421875, -3.09234619140625, -2.945556640625, -2.79876708984375, -2.6519775390625, -2.50518798828125, -2.3583984375, -2.21160888671875, -2.0648193359375, -1.91802978515625, -1.771240234375, -1.62445068359375, -1.4776611328125, -1.33087158203125, -1.18408203125, -1.03729248046875, -0.8905029296875, -0.74371337890625, -0.596923828125, -0.45013427734375, -0.3033447265625, -0.15655517578125, -0.009765625, 0.13702392578125, 0.2838134765625, 0.43060302734375, 0.577392578125, 0.72418212890625, 0.8709716796875, 1.01776123046875, 1.16455078125, 1.31134033203125, 1.4581298828125, 1.60491943359375, 1.751708984375, 1.89849853515625, 2.0452880859375, 2.19207763671875, 2.3388671875, 2.48565673828125, 2.6324462890625, 2.77923583984375, 2.926025390625, 3.07281494140625, 3.2196044921875, 3.36639404296875, 3.51318359375, 3.65997314453125, 3.8067626953125, 3.95355224609375, 4.100341796875, 4.24713134765625, 4.3939208984375, 4.54071044921875, 4.6875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 5.0, 9.0, 6.0, 13.0, 18.0, 16.0, 19.0, 21.0, 23.0, 24.0, 37.0, 37.0, 31.0, 32.0, 29.0, 43.0, 36.0, 38.0, 29.0, 48.0, 46.0, 38.0, 42.0, 32.0, 37.0, 33.0, 27.0, 36.0, 30.0, 21.0, 23.0, 22.0, 20.0, 22.0, 15.0, 8.0, 8.0, 3.0, 4.0, 2.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.246337890625, -5.08251953125, -4.918701171875, -4.7548828125, -4.591064453125, -4.42724609375, -4.263427734375, -4.099609375, -3.935791015625, -3.77197265625, -3.608154296875, -3.4443359375, -3.280517578125, -3.11669921875, -2.952880859375, -2.7890625, -2.625244140625, -2.46142578125, -2.297607421875, -2.1337890625, -1.969970703125, -1.80615234375, -1.642333984375, -1.478515625, -1.314697265625, -1.15087890625, -0.987060546875, -0.8232421875, -0.659423828125, -0.49560546875, -0.331787109375, -0.16796875, -0.004150390625, 0.15966796875, 0.323486328125, 0.4873046875, 0.651123046875, 0.81494140625, 0.978759765625, 1.142578125, 1.306396484375, 1.47021484375, 1.634033203125, 1.7978515625, 1.961669921875, 2.12548828125, 2.289306640625, 2.453125, 2.616943359375, 2.78076171875, 2.944580078125, 3.1083984375, 3.272216796875, 3.43603515625, 3.599853515625, 3.763671875, 3.927490234375, 4.09130859375, 4.255126953125, 4.4189453125, 4.582763671875, 4.74658203125, 4.910400390625, 5.07421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 24.0, 23.0, 34.0, 56.0, 79.0, 112.0, 231.0, 323.0, 541.0, 774.0, 1275.0, 1922.0, 3071.0, 4830.0, 7625.0, 12061.0, 19416.0, 30418.0, 47458.0, 71044.0, 101230.0, 130792.0, 146831.0, 136164.0, 108627.0, 78080.0, 52448.0, 34441.0, 21511.0, 13474.0, 8681.0, 5512.0, 3350.0, 2238.0, 1410.0, 886.0, 565.0, 354.0, 213.0, 149.0, 103.0, 73.0, 32.0, 24.0, 12.0, 14.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.578125, -4.433349609375, -4.28857421875, -4.143798828125, -3.9990234375, -3.854248046875, -3.70947265625, -3.564697265625, -3.419921875, -3.275146484375, -3.13037109375, -2.985595703125, -2.8408203125, -2.696044921875, -2.55126953125, -2.406494140625, -2.26171875, -2.116943359375, -1.97216796875, -1.827392578125, -1.6826171875, -1.537841796875, -1.39306640625, -1.248291015625, -1.103515625, -0.958740234375, -0.81396484375, -0.669189453125, -0.5244140625, -0.379638671875, -0.23486328125, -0.090087890625, 0.0546875, 0.199462890625, 0.34423828125, 0.489013671875, 0.6337890625, 0.778564453125, 0.92333984375, 1.068115234375, 1.212890625, 1.357666015625, 1.50244140625, 1.647216796875, 1.7919921875, 1.936767578125, 2.08154296875, 2.226318359375, 2.37109375, 2.515869140625, 2.66064453125, 2.805419921875, 2.9501953125, 3.094970703125, 3.23974609375, 3.384521484375, 3.529296875, 3.674072265625, 3.81884765625, 3.963623046875, 4.1083984375, 4.253173828125, 4.39794921875, 4.542724609375, 4.6875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 10.0, 12.0, 8.0, 15.0, 18.0, 18.0, 28.0, 18.0, 27.0, 33.0, 42.0, 37.0, 36.0, 61.0, 45.0, 48.0, 35.0, 43.0, 55.0, 33.0, 45.0, 28.0, 32.0, 39.0, 37.0, 18.0, 27.0, 21.0, 14.0, 17.0, 14.0, 13.0, 14.0, 9.0, 8.0, 7.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.703125, -3.591094970703125, -3.47906494140625, -3.367034912109375, -3.2550048828125, -3.142974853515625, -3.03094482421875, -2.918914794921875, -2.806884765625, -2.694854736328125, -2.58282470703125, -2.470794677734375, -2.3587646484375, -2.246734619140625, -2.13470458984375, -2.022674560546875, -1.91064453125, -1.798614501953125, -1.68658447265625, -1.574554443359375, -1.4625244140625, -1.350494384765625, -1.23846435546875, -1.126434326171875, -1.014404296875, -0.902374267578125, -0.79034423828125, -0.678314208984375, -0.5662841796875, -0.454254150390625, -0.34222412109375, -0.230194091796875, -0.1181640625, -0.006134033203125, 0.10589599609375, 0.217926025390625, 0.3299560546875, 0.441986083984375, 0.55401611328125, 0.666046142578125, 0.778076171875, 0.890106201171875, 1.00213623046875, 1.114166259765625, 1.2261962890625, 1.338226318359375, 1.45025634765625, 1.562286376953125, 1.67431640625, 1.786346435546875, 1.89837646484375, 2.010406494140625, 2.1224365234375, 2.234466552734375, 2.34649658203125, 2.458526611328125, 2.570556640625, 2.682586669921875, 2.79461669921875, 2.906646728515625, 3.0186767578125, 3.130706787109375, 3.24273681640625, 3.354766845703125, 3.466796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 5.0, 15.0, 22.0, 30.0, 41.0, 71.0, 93.0, 156.0, 220.0, 349.0, 522.0, 774.0, 1151.0, 1841.0, 2964.0, 4625.0, 7250.0, 11855.0, 19702.0, 32705.0, 54525.0, 89850.0, 138453.0, 179353.0, 172468.0, 126329.0, 79808.0, 48280.0, 28726.0, 17599.0, 10553.0, 6614.0, 4142.0, 2609.0, 1674.0, 1091.0, 683.0, 484.0, 321.0, 208.0, 116.0, 102.0, 58.0, 41.0, 36.0, 12.0, 8.0, 9.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.0078125, -3.88592529296875, -3.7640380859375, -3.64215087890625, -3.520263671875, -3.39837646484375, -3.2764892578125, -3.15460205078125, -3.03271484375, -2.91082763671875, -2.7889404296875, -2.66705322265625, -2.545166015625, -2.42327880859375, -2.3013916015625, -2.17950439453125, -2.0576171875, -1.93572998046875, -1.8138427734375, -1.69195556640625, -1.570068359375, -1.44818115234375, -1.3262939453125, -1.20440673828125, -1.08251953125, -0.96063232421875, -0.8387451171875, -0.71685791015625, -0.594970703125, -0.47308349609375, -0.3511962890625, -0.22930908203125, -0.107421875, 0.01446533203125, 0.1363525390625, 0.25823974609375, 0.380126953125, 0.50201416015625, 0.6239013671875, 0.74578857421875, 0.86767578125, 0.98956298828125, 1.1114501953125, 1.23333740234375, 1.355224609375, 1.47711181640625, 1.5989990234375, 1.72088623046875, 1.8427734375, 1.96466064453125, 2.0865478515625, 2.20843505859375, 2.330322265625, 2.45220947265625, 2.5740966796875, 2.69598388671875, 2.81787109375, 2.93975830078125, 3.0616455078125, 3.18353271484375, 3.305419921875, 3.42730712890625, 3.5491943359375, 3.67108154296875, 3.79296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 13.0, 27.0, 21.0, 33.0, 47.0, 57.0, 70.0, 79.0, 109.0, 87.0, 94.0, 84.0, 69.0, 37.0, 41.0, 26.0, 21.0, 14.0, 7.0, 6.0, 5.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006833076477050781, -0.0006649717688560486, -0.000646635890007019, -0.0006283000111579895, -0.00060996413230896, -0.0005916282534599304, -0.0005732923746109009, -0.0005549564957618713, -0.0005366206169128418, -0.0005182847380638123, -0.0004999488592147827, -0.0004816129803657532, -0.00046327710151672363, -0.0004449412226676941, -0.00042660534381866455, -0.000408269464969635, -0.00038993358612060547, -0.00037159770727157593, -0.0003532618284225464, -0.00033492594957351685, -0.0003165900707244873, -0.00029825419187545776, -0.0002799183130264282, -0.0002615824341773987, -0.00024324655532836914, -0.0002249106764793396, -0.00020657479763031006, -0.00018823891878128052, -0.00016990303993225098, -0.00015156716108322144, -0.0001332312822341919, -0.00011489540338516235, -9.655952453613281e-05, -7.822364568710327e-05, -5.988776683807373e-05, -4.155188798904419e-05, -2.321600914001465e-05, -4.880130290985107e-06, 1.3455748558044434e-05, 3.1791627407073975e-05, 5.0127506256103516e-05, 6.846338510513306e-05, 8.67992639541626e-05, 0.00010513514280319214, 0.00012347102165222168, 0.00014180690050125122, 0.00016014277935028076, 0.0001784786581993103, 0.00019681453704833984, 0.00021515041589736938, 0.00023348629474639893, 0.00025182217359542847, 0.000270158052444458, 0.00028849393129348755, 0.0003068298101425171, 0.00032516568899154663, 0.00034350156784057617, 0.0003618374466896057, 0.00038017332553863525, 0.0003985092043876648, 0.00041684508323669434, 0.0004351809620857239, 0.0004535168409347534, 0.00047185271978378296, 0.0004901885986328125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 12.0, 14.0, 35.0, 40.0, 53.0, 82.0, 97.0, 195.0, 285.0, 411.0, 639.0, 1087.0, 1724.0, 2804.0, 4533.0, 7647.0, 12563.0, 21371.0, 35591.0, 58260.0, 91549.0, 133517.0, 164338.0, 162358.0, 127138.0, 85669.0, 54132.0, 32758.0, 19666.0, 11736.0, 6997.0, 4314.0, 2570.0, 1588.0, 927.0, 647.0, 385.0, 293.0, 188.0, 114.0, 68.0, 47.0, 37.0, 19.0, 19.0, 5.0, 3.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.228515625, -3.12738037109375, -3.0262451171875, -2.92510986328125, -2.823974609375, -2.72283935546875, -2.6217041015625, -2.52056884765625, -2.41943359375, -2.31829833984375, -2.2171630859375, -2.11602783203125, -2.014892578125, -1.91375732421875, -1.8126220703125, -1.71148681640625, -1.6103515625, -1.50921630859375, -1.4080810546875, -1.30694580078125, -1.205810546875, -1.10467529296875, -1.0035400390625, -0.90240478515625, -0.80126953125, -0.70013427734375, -0.5989990234375, -0.49786376953125, -0.396728515625, -0.29559326171875, -0.1944580078125, -0.09332275390625, 0.0078125, 0.10894775390625, 0.2100830078125, 0.31121826171875, 0.412353515625, 0.51348876953125, 0.6146240234375, 0.71575927734375, 0.81689453125, 0.91802978515625, 1.0191650390625, 1.12030029296875, 1.221435546875, 1.32257080078125, 1.4237060546875, 1.52484130859375, 1.6259765625, 1.72711181640625, 1.8282470703125, 1.92938232421875, 2.030517578125, 2.13165283203125, 2.2327880859375, 2.33392333984375, 2.43505859375, 2.53619384765625, 2.6373291015625, 2.73846435546875, 2.839599609375, 2.94073486328125, 3.0418701171875, 3.14300537109375, 3.244140625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 10.0, 10.0, 19.0, 26.0, 31.0, 35.0, 35.0, 56.0, 60.0, 77.0, 60.0, 82.0, 68.0, 74.0, 67.0, 56.0, 47.0, 34.0, 19.0, 35.0, 21.0, 10.0, 13.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341796875, -1.487457275390625, -1.44073486328125, -1.394012451171875, -1.3472900390625, -1.300567626953125, -1.25384521484375, -1.207122802734375, -1.160400390625, -1.113677978515625, -1.06695556640625, -1.020233154296875, -0.9735107421875, -0.926788330078125, -0.88006591796875, -0.833343505859375, -0.78662109375, -0.739898681640625, -0.69317626953125, -0.646453857421875, -0.5997314453125, -0.553009033203125, -0.50628662109375, -0.459564208984375, -0.412841796875, -0.366119384765625, -0.31939697265625, -0.272674560546875, -0.2259521484375, -0.179229736328125, -0.13250732421875, -0.085784912109375, -0.0390625, 0.007659912109375, 0.05438232421875, 0.101104736328125, 0.1478271484375, 0.194549560546875, 0.24127197265625, 0.287994384765625, 0.334716796875, 0.381439208984375, 0.42816162109375, 0.474884033203125, 0.5216064453125, 0.568328857421875, 0.61505126953125, 0.661773681640625, 0.70849609375, 0.755218505859375, 0.80194091796875, 0.848663330078125, 0.8953857421875, 0.942108154296875, 0.98883056640625, 1.035552978515625, 1.082275390625, 1.128997802734375, 1.17572021484375, 1.222442626953125, 1.2691650390625, 1.315887451171875, 1.36260986328125, 1.409332275390625, 1.4560546875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 10.0, 12.0, 20.0, 14.0, 31.0, 37.0, 27.0, 39.0, 39.0, 45.0, 39.0, 59.0, 58.0, 58.0, 61.0, 55.0, 52.0, 46.0, 57.0, 37.0, 41.0, 31.0, 20.0, 15.0, 14.0, 12.0, 14.0, 7.0, 5.0, 4.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.444511890411377, -7.208479881286621, -6.972447872161865, -6.736415863037109, -6.500383377075195, -6.2643513679504395, -6.028319358825684, -5.792287349700928, -5.556255340576172, -5.320223331451416, -5.08419132232666, -4.848158836364746, -4.61212682723999, -4.376094818115234, -4.1400628089904785, -3.9040307998657227, -3.6679983139038086, -3.4319663047790527, -3.1959340572357178, -2.959902048110962, -2.723869800567627, -2.487837791442871, -2.2518057823181152, -2.0157737731933594, -1.7797415256500244, -1.543709397315979, -1.3076772689819336, -1.0716452598571777, -0.8356131315231323, -0.5995810031890869, -0.36354899406433105, -0.12751686573028564, 0.10851573944091797, 0.344547837972641, 0.580579936504364, 0.8166120052337646, 1.05264413356781, 1.2886762619018555, 1.5247082710266113, 1.7607403993606567, 1.9967725276947021, 2.232804536819458, 2.468836784362793, 2.704868793487549, 2.9409008026123047, 3.1769330501556396, 3.4129650592803955, 3.6489973068237305, 3.8850293159484863, 4.121061325073242, 4.357093334197998, 4.593125343322754, 4.829157829284668, 5.065189838409424, 5.30122184753418, 5.5372538566589355, 5.773285865783691, 6.009317874908447, 6.245349884033203, 6.481382369995117, 6.717414379119873, 6.953446388244629, 7.189478397369385, 7.425510406494141, 7.661542892456055]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 5.0, 9.0, 7.0, 14.0, 15.0, 22.0, 14.0, 32.0, 22.0, 29.0, 28.0, 31.0, 43.0, 47.0, 45.0, 52.0, 49.0, 49.0, 36.0, 35.0, 38.0, 49.0, 35.0, 31.0, 35.0, 33.0, 24.0, 31.0, 23.0, 19.0, 18.0, 22.0, 8.0, 9.0, 11.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.484739303588867, -5.311461925506592, -5.138184547424316, -4.964907169342041, -4.791629791259766, -4.61835241317749, -4.445075035095215, -4.271798133850098, -4.098520278930664, -3.9252429008483887, -3.7519655227661133, -3.578688144683838, -3.4054107666015625, -3.232133388519287, -3.058856248855591, -2.8855788707733154, -2.712301731109619, -2.5390243530273438, -2.3657469749450684, -2.192469596862793, -2.0191922187805176, -1.8459149599075317, -1.672637701034546, -1.4993603229522705, -1.3260829448699951, -1.1528055667877197, -0.9795282483100891, -0.8062509298324585, -0.6329735517501831, -0.4596961736679077, -0.2864189147949219, -0.11314153671264648, 0.060135841369628906, 0.2334131896495819, 0.4066905379295349, 0.5799678564071655, 0.7532452344894409, 0.9265226125717163, 1.0997998714447021, 1.2730772495269775, 1.446354627609253, 1.6196320056915283, 1.7929093837738037, 1.9661866426467896, 2.1394639015197754, 2.312741279602051, 2.486018657684326, 2.6592960357666016, 2.832573413848877, 3.0058507919311523, 3.1791281700134277, 3.352405548095703, 3.5256829261779785, 3.698960304260254, 3.87223744392395, 4.045515060424805, 4.218791961669922, 4.392069339752197, 4.565346717834473, 4.738624095916748, 4.911901473999023, 5.085178852081299, 5.258456230163574, 5.431733131408691, 5.605010986328125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 10.0, 5.0, 14.0, 14.0, 18.0, 27.0, 45.0, 71.0, 115.0, 150.0, 231.0, 367.0, 580.0, 994.0, 1600.0, 2743.0, 4808.0, 8474.0, 16056.0, 30858.0, 64057.0, 142632.0, 338818.0, 789305.0, 1214894.0, 881126.0, 389482.0, 160953.0, 71130.0, 34508.0, 17520.0, 9647.0, 5332.0, 3070.0, 1837.0, 1081.0, 673.0, 388.0, 226.0, 150.0, 95.0, 63.0, 44.0, 27.0, 20.0, 13.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.2265625, -7.995361328125, -7.76416015625, -7.532958984375, -7.3017578125, -7.070556640625, -6.83935546875, -6.608154296875, -6.376953125, -6.145751953125, -5.91455078125, -5.683349609375, -5.4521484375, -5.220947265625, -4.98974609375, -4.758544921875, -4.52734375, -4.296142578125, -4.06494140625, -3.833740234375, -3.6025390625, -3.371337890625, -3.14013671875, -2.908935546875, -2.677734375, -2.446533203125, -2.21533203125, -1.984130859375, -1.7529296875, -1.521728515625, -1.29052734375, -1.059326171875, -0.828125, -0.596923828125, -0.36572265625, -0.134521484375, 0.0966796875, 0.327880859375, 0.55908203125, 0.790283203125, 1.021484375, 1.252685546875, 1.48388671875, 1.715087890625, 1.9462890625, 2.177490234375, 2.40869140625, 2.639892578125, 2.87109375, 3.102294921875, 3.33349609375, 3.564697265625, 3.7958984375, 4.027099609375, 4.25830078125, 4.489501953125, 4.720703125, 4.951904296875, 5.18310546875, 5.414306640625, 5.6455078125, 5.876708984375, 6.10791015625, 6.339111328125, 6.5703125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 9.0, 14.0, 15.0, 14.0, 17.0, 23.0, 22.0, 27.0, 28.0, 39.0, 31.0, 39.0, 42.0, 40.0, 41.0, 38.0, 55.0, 37.0, 56.0, 31.0, 46.0, 44.0, 40.0, 44.0, 23.0, 31.0, 12.0, 30.0, 24.0, 14.0, 15.0, 11.0, 10.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.06719970703125, -3.9468994140625, -3.82659912109375, -3.706298828125, -3.58599853515625, -3.4656982421875, -3.34539794921875, -3.22509765625, -3.10479736328125, -2.9844970703125, -2.86419677734375, -2.743896484375, -2.62359619140625, -2.5032958984375, -2.38299560546875, -2.2626953125, -2.14239501953125, -2.0220947265625, -1.90179443359375, -1.781494140625, -1.66119384765625, -1.5408935546875, -1.42059326171875, -1.30029296875, -1.17999267578125, -1.0596923828125, -0.93939208984375, -0.819091796875, -0.69879150390625, -0.5784912109375, -0.45819091796875, -0.337890625, -0.21759033203125, -0.0972900390625, 0.02301025390625, 0.143310546875, 0.26361083984375, 0.3839111328125, 0.50421142578125, 0.62451171875, 0.74481201171875, 0.8651123046875, 0.98541259765625, 1.105712890625, 1.22601318359375, 1.3463134765625, 1.46661376953125, 1.5869140625, 1.70721435546875, 1.8275146484375, 1.94781494140625, 2.068115234375, 2.18841552734375, 2.3087158203125, 2.42901611328125, 2.54931640625, 2.66961669921875, 2.7899169921875, 2.91021728515625, 3.030517578125, 3.15081787109375, 3.2711181640625, 3.39141845703125, 3.51171875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 12.0, 8.0, 9.0, 13.0, 28.0, 36.0, 52.0, 73.0, 104.0, 165.0, 266.0, 356.0, 555.0, 877.0, 1265.0, 2165.0, 3343.0, 5259.0, 8765.0, 14676.0, 25211.0, 44471.0, 81970.0, 155681.0, 302485.0, 582754.0, 934039.0, 896556.0, 538227.0, 276696.0, 142224.0, 75223.0, 41588.0, 23417.0, 13608.0, 8255.0, 5022.0, 3214.0, 1923.0, 1306.0, 811.0, 542.0, 378.0, 222.0, 151.0, 101.0, 57.0, 49.0, 30.0, 22.0, 14.0, 6.0, 10.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.57012939453125, -5.3707275390625, -5.17132568359375, -4.971923828125, -4.77252197265625, -4.5731201171875, -4.37371826171875, -4.17431640625, -3.97491455078125, -3.7755126953125, -3.57611083984375, -3.376708984375, -3.17730712890625, -2.9779052734375, -2.77850341796875, -2.5791015625, -2.37969970703125, -2.1802978515625, -1.98089599609375, -1.781494140625, -1.58209228515625, -1.3826904296875, -1.18328857421875, -0.98388671875, -0.78448486328125, -0.5850830078125, -0.38568115234375, -0.186279296875, 0.01312255859375, 0.2125244140625, 0.41192626953125, 0.611328125, 0.81072998046875, 1.0101318359375, 1.20953369140625, 1.408935546875, 1.60833740234375, 1.8077392578125, 2.00714111328125, 2.20654296875, 2.40594482421875, 2.6053466796875, 2.80474853515625, 3.004150390625, 3.20355224609375, 3.4029541015625, 3.60235595703125, 3.8017578125, 4.00115966796875, 4.2005615234375, 4.39996337890625, 4.599365234375, 4.79876708984375, 4.9981689453125, 5.19757080078125, 5.39697265625, 5.59637451171875, 5.7957763671875, 5.99517822265625, 6.194580078125, 6.39398193359375, 6.5933837890625, 6.79278564453125, 6.9921875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 12.0, 8.0, 12.0, 17.0, 25.0, 30.0, 39.0, 56.0, 68.0, 83.0, 112.0, 123.0, 164.0, 203.0, 213.0, 247.0, 298.0, 291.0, 273.0, 256.0, 268.0, 224.0, 192.0, 163.0, 148.0, 105.0, 87.0, 68.0, 57.0, 47.0, 42.0, 34.0, 28.0, 15.0, 13.0, 16.0, 13.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.94921875, -1.87994384765625, -1.8106689453125, -1.74139404296875, -1.672119140625, -1.60284423828125, -1.5335693359375, -1.46429443359375, -1.39501953125, -1.32574462890625, -1.2564697265625, -1.18719482421875, -1.117919921875, -1.04864501953125, -0.9793701171875, -0.91009521484375, -0.8408203125, -0.77154541015625, -0.7022705078125, -0.63299560546875, -0.563720703125, -0.49444580078125, -0.4251708984375, -0.35589599609375, -0.28662109375, -0.21734619140625, -0.1480712890625, -0.07879638671875, -0.009521484375, 0.05975341796875, 0.1290283203125, 0.19830322265625, 0.267578125, 0.33685302734375, 0.4061279296875, 0.47540283203125, 0.544677734375, 0.61395263671875, 0.6832275390625, 0.75250244140625, 0.82177734375, 0.89105224609375, 0.9603271484375, 1.02960205078125, 1.098876953125, 1.16815185546875, 1.2374267578125, 1.30670166015625, 1.3759765625, 1.44525146484375, 1.5145263671875, 1.58380126953125, 1.653076171875, 1.72235107421875, 1.7916259765625, 1.86090087890625, 1.93017578125, 1.99945068359375, 2.0687255859375, 2.13800048828125, 2.207275390625, 2.27655029296875, 2.3458251953125, 2.41510009765625, 2.484375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 17.0, 6.0, 12.0, 10.0, 22.0, 15.0, 34.0, 33.0, 29.0, 39.0, 57.0, 67.0, 69.0, 77.0, 47.0, 64.0, 59.0, 60.0, 42.0, 36.0, 29.0, 23.0, 33.0, 25.0, 20.0, 16.0, 9.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.895099639892578, -6.658045291900635, -6.420990943908691, -6.18393611907959, -5.9468817710876465, -5.709827423095703, -5.472772598266602, -5.235718250274658, -4.998663902282715, -4.7616095542907715, -4.524555206298828, -4.287500381469727, -4.050446033477783, -3.81339168548584, -3.5763370990753174, -3.339282512664795, -3.1022281646728516, -2.865173816680908, -2.6281192302703857, -2.3910646438598633, -2.15401029586792, -1.916955828666687, -1.679901361465454, -1.4428468942642212, -1.2057924270629883, -0.9687379598617554, -0.7316834926605225, -0.49462902545928955, -0.25757455825805664, -0.02052009105682373, 0.21653437614440918, 0.4535888433456421, 0.690643310546875, 0.9276977777481079, 1.1647522449493408, 1.4018067121505737, 1.6388611793518066, 1.8759156465530396, 2.1129701137542725, 2.350024700164795, 2.5870790481567383, 2.8241333961486816, 3.061187982559204, 3.2982425689697266, 3.53529691696167, 3.7723512649536133, 4.009406089782715, 4.246460437774658, 4.483514785766602, 4.720569133758545, 4.957623481750488, 5.19467830657959, 5.431732654571533, 5.668787002563477, 5.905841827392578, 6.1428961753845215, 6.379950523376465, 6.617004871368408, 6.854059219360352, 7.091114044189453, 7.3281683921813965, 7.56522274017334, 7.802277565002441, 8.039331436157227, 8.276386260986328]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 8.0, 7.0, 10.0, 8.0, 14.0, 19.0, 12.0, 24.0, 28.0, 19.0, 35.0, 33.0, 34.0, 25.0, 36.0, 26.0, 36.0, 42.0, 29.0, 56.0, 47.0, 32.0, 29.0, 41.0, 38.0, 43.0, 29.0, 18.0, 27.0, 17.0, 24.0, 22.0, 20.0, 11.0, 20.0, 11.0, 15.0, 9.0, 7.0, 10.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-4.4756879806518555, -4.342403888702393, -4.209120273590088, -4.075836181640625, -3.942552328109741, -3.8092684745788574, -3.6759843826293945, -3.5427005290985107, -3.409416675567627, -3.276132822036743, -3.1428487300872803, -3.0095648765563965, -2.8762810230255127, -2.742997169494629, -2.609713077545166, -2.4764292240142822, -2.3431451320648193, -2.2098612785339355, -2.0765771865844727, -1.9432933330535889, -1.810009479522705, -1.6767255067825317, -1.5434415340423584, -1.4101576805114746, -1.2768737077713013, -1.143589735031128, -1.0103058815002441, -0.8770219087600708, -0.7437379956245422, -0.6104540824890137, -0.47717010974884033, -0.34388619661331177, -0.2106022834777832, -0.07731835544109344, 0.055965572595596313, 0.18924951553344727, 0.32253342866897583, 0.4558173418045044, 0.5891013145446777, 0.7223852276802063, 0.8556691408157349, 0.9889530539512634, 1.122236967086792, 1.2555209398269653, 1.3888049125671387, 1.5220887660980225, 1.6553727388381958, 1.7886567115783691, 1.921940565109253, 2.0552244186401367, 2.1885085105895996, 2.3217923641204834, 2.455076217651367, 2.58836030960083, 2.721644163131714, 2.8549280166625977, 2.9882121086120605, 3.1214959621429443, 3.2547800540924072, 3.388063907623291, 3.521347761154175, 3.6546316146850586, 3.7879157066345215, 3.9211995601654053, 4.054483413696289]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 12.0, 13.0, 23.0, 27.0, 45.0, 54.0, 99.0, 130.0, 203.0, 319.0, 531.0, 805.0, 1325.0, 2214.0, 3665.0, 6329.0, 10756.0, 19059.0, 33731.0, 59185.0, 98471.0, 149276.0, 183709.0, 170659.0, 124368.0, 78221.0, 45305.0, 25113.0, 14297.0, 8383.0, 4749.0, 2737.0, 1776.0, 1087.0, 643.0, 432.0, 244.0, 186.0, 129.0, 80.0, 47.0, 38.0, 25.0, 22.0, 8.0, 10.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.88671875, -3.771575927734375, -3.65643310546875, -3.541290283203125, -3.4261474609375, -3.311004638671875, -3.19586181640625, -3.080718994140625, -2.965576171875, -2.850433349609375, -2.73529052734375, -2.620147705078125, -2.5050048828125, -2.389862060546875, -2.27471923828125, -2.159576416015625, -2.04443359375, -1.929290771484375, -1.81414794921875, -1.699005126953125, -1.5838623046875, -1.468719482421875, -1.35357666015625, -1.238433837890625, -1.123291015625, -1.008148193359375, -0.89300537109375, -0.777862548828125, -0.6627197265625, -0.547576904296875, -0.43243408203125, -0.317291259765625, -0.2021484375, -0.087005615234375, 0.02813720703125, 0.143280029296875, 0.2584228515625, 0.373565673828125, 0.48870849609375, 0.603851318359375, 0.718994140625, 0.834136962890625, 0.94927978515625, 1.064422607421875, 1.1795654296875, 1.294708251953125, 1.40985107421875, 1.524993896484375, 1.64013671875, 1.755279541015625, 1.87042236328125, 1.985565185546875, 2.1007080078125, 2.215850830078125, 2.33099365234375, 2.446136474609375, 2.561279296875, 2.676422119140625, 2.79156494140625, 2.906707763671875, 3.0218505859375, 3.136993408203125, 3.25213623046875, 3.367279052734375, 3.482421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 8.0, 5.0, 2.0, 6.0, 9.0, 12.0, 12.0, 9.0, 14.0, 23.0, 19.0, 26.0, 35.0, 28.0, 27.0, 30.0, 27.0, 30.0, 34.0, 43.0, 60.0, 42.0, 40.0, 41.0, 45.0, 39.0, 26.0, 39.0, 32.0, 24.0, 32.0, 20.0, 26.0, 15.0, 27.0, 18.0, 14.0, 10.0, 10.0, 6.0, 7.0, 4.0, 10.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.06640625, -4.92034912109375, -4.7742919921875, -4.62823486328125, -4.482177734375, -4.33612060546875, -4.1900634765625, -4.04400634765625, -3.89794921875, -3.75189208984375, -3.6058349609375, -3.45977783203125, -3.313720703125, -3.16766357421875, -3.0216064453125, -2.87554931640625, -2.7294921875, -2.58343505859375, -2.4373779296875, -2.29132080078125, -2.145263671875, -1.99920654296875, -1.8531494140625, -1.70709228515625, -1.56103515625, -1.41497802734375, -1.2689208984375, -1.12286376953125, -0.976806640625, -0.83074951171875, -0.6846923828125, -0.53863525390625, -0.392578125, -0.24652099609375, -0.1004638671875, 0.04559326171875, 0.191650390625, 0.33770751953125, 0.4837646484375, 0.62982177734375, 0.77587890625, 0.92193603515625, 1.0679931640625, 1.21405029296875, 1.360107421875, 1.50616455078125, 1.6522216796875, 1.79827880859375, 1.9443359375, 2.09039306640625, 2.2364501953125, 2.38250732421875, 2.528564453125, 2.67462158203125, 2.8206787109375, 2.96673583984375, 3.11279296875, 3.25885009765625, 3.4049072265625, 3.55096435546875, 3.697021484375, 3.84307861328125, 3.9891357421875, 4.13519287109375, 4.28125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 16.0, 18.0, 19.0, 22.0, 41.0, 60.0, 88.0, 142.0, 202.0, 296.0, 405.0, 718.0, 995.0, 1688.0, 2804.0, 4685.0, 7808.0, 13534.0, 24145.0, 42485.0, 77732.0, 131885.0, 198771.0, 205036.0, 142055.0, 83174.0, 46972.0, 26493.0, 14950.0, 8370.0, 4890.0, 3039.0, 1753.0, 1067.0, 737.0, 471.0, 340.0, 228.0, 139.0, 94.0, 59.0, 43.0, 26.0, 15.0, 20.0, 10.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.2578125, -4.1162109375, -3.974609375, -3.8330078125, -3.69140625, -3.5498046875, -3.408203125, -3.2666015625, -3.125, -2.9833984375, -2.841796875, -2.7001953125, -2.55859375, -2.4169921875, -2.275390625, -2.1337890625, -1.9921875, -1.8505859375, -1.708984375, -1.5673828125, -1.42578125, -1.2841796875, -1.142578125, -1.0009765625, -0.859375, -0.7177734375, -0.576171875, -0.4345703125, -0.29296875, -0.1513671875, -0.009765625, 0.1318359375, 0.2734375, 0.4150390625, 0.556640625, 0.6982421875, 0.83984375, 0.9814453125, 1.123046875, 1.2646484375, 1.40625, 1.5478515625, 1.689453125, 1.8310546875, 1.97265625, 2.1142578125, 2.255859375, 2.3974609375, 2.5390625, 2.6806640625, 2.822265625, 2.9638671875, 3.10546875, 3.2470703125, 3.388671875, 3.5302734375, 3.671875, 3.8134765625, 3.955078125, 4.0966796875, 4.23828125, 4.3798828125, 4.521484375, 4.6630859375, 4.8046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 1.0, 4.0, 13.0, 14.0, 7.0, 10.0, 17.0, 26.0, 21.0, 26.0, 28.0, 40.0, 45.0, 54.0, 42.0, 36.0, 40.0, 39.0, 50.0, 52.0, 53.0, 32.0, 36.0, 36.0, 36.0, 21.0, 26.0, 28.0, 24.0, 30.0, 14.0, 12.0, 15.0, 19.0, 10.0, 6.0, 5.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.427581787109375, -2.32977294921875, -2.231964111328125, -2.1341552734375, -2.036346435546875, -1.93853759765625, -1.840728759765625, -1.742919921875, -1.645111083984375, -1.54730224609375, -1.449493408203125, -1.3516845703125, -1.253875732421875, -1.15606689453125, -1.058258056640625, -0.96044921875, -0.862640380859375, -0.76483154296875, -0.667022705078125, -0.5692138671875, -0.471405029296875, -0.37359619140625, -0.275787353515625, -0.177978515625, -0.080169677734375, 0.01763916015625, 0.115447998046875, 0.2132568359375, 0.311065673828125, 0.40887451171875, 0.506683349609375, 0.6044921875, 0.702301025390625, 0.80010986328125, 0.897918701171875, 0.9957275390625, 1.093536376953125, 1.19134521484375, 1.289154052734375, 1.386962890625, 1.484771728515625, 1.58258056640625, 1.680389404296875, 1.7781982421875, 1.876007080078125, 1.97381591796875, 2.071624755859375, 2.16943359375, 2.267242431640625, 2.36505126953125, 2.462860107421875, 2.5606689453125, 2.658477783203125, 2.75628662109375, 2.854095458984375, 2.951904296875, 3.049713134765625, 3.14752197265625, 3.245330810546875, 3.3431396484375, 3.440948486328125, 3.53875732421875, 3.636566162109375, 3.734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 8.0, 10.0, 9.0, 14.0, 21.0, 24.0, 21.0, 37.0, 48.0, 71.0, 85.0, 111.0, 155.0, 161.0, 236.0, 325.0, 432.0, 675.0, 957.0, 1543.0, 2801.0, 5892.0, 13767.0, 39002.0, 128879.0, 385418.0, 318343.0, 96399.0, 30216.0, 11202.0, 4881.0, 2519.0, 1362.0, 834.0, 551.0, 357.0, 275.0, 222.0, 148.0, 131.0, 72.0, 76.0, 61.0, 47.0, 30.0, 35.0, 27.0, 23.0, 17.0, 10.0, 3.0, 6.0, 5.0, 5.0, 4.0], "bins": [-5.1953125, -5.04638671875, -4.8974609375, -4.74853515625, -4.599609375, -4.45068359375, -4.3017578125, -4.15283203125, -4.00390625, -3.85498046875, -3.7060546875, -3.55712890625, -3.408203125, -3.25927734375, -3.1103515625, -2.96142578125, -2.8125, -2.66357421875, -2.5146484375, -2.36572265625, -2.216796875, -2.06787109375, -1.9189453125, -1.77001953125, -1.62109375, -1.47216796875, -1.3232421875, -1.17431640625, -1.025390625, -0.87646484375, -0.7275390625, -0.57861328125, -0.4296875, -0.28076171875, -0.1318359375, 0.01708984375, 0.166015625, 0.31494140625, 0.4638671875, 0.61279296875, 0.76171875, 0.91064453125, 1.0595703125, 1.20849609375, 1.357421875, 1.50634765625, 1.6552734375, 1.80419921875, 1.953125, 2.10205078125, 2.2509765625, 2.39990234375, 2.548828125, 2.69775390625, 2.8466796875, 2.99560546875, 3.14453125, 3.29345703125, 3.4423828125, 3.59130859375, 3.740234375, 3.88916015625, 4.0380859375, 4.18701171875, 4.3359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 5.0, 9.0, 5.0, 13.0, 15.0, 17.0, 20.0, 31.0, 36.0, 42.0, 48.0, 56.0, 87.0, 106.0, 67.0, 71.0, 74.0, 76.0, 47.0, 32.0, 31.0, 32.0, 18.0, 11.0, 11.0, 11.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00012039672583341599, -0.00011657737195491791, -0.00011275801807641983, -0.00010893866419792175, -0.00010511931031942368, -0.0001012999564409256, -9.748060256242752e-05, -9.366124868392944e-05, -8.984189480543137e-05, -8.602254092693329e-05, -8.220318704843521e-05, -7.838383316993713e-05, -7.456447929143906e-05, -7.074512541294098e-05, -6.69257715344429e-05, -6.310641765594482e-05, -5.928706377744675e-05, -5.546770989894867e-05, -5.164835602045059e-05, -4.7829002141952515e-05, -4.400964826345444e-05, -4.019029438495636e-05, -3.637094050645828e-05, -3.2551586627960205e-05, -2.8732232749462128e-05, -2.491287887096405e-05, -2.1093524992465973e-05, -1.7274171113967896e-05, -1.3454817235469818e-05, -9.63546335697174e-06, -5.816109478473663e-06, -1.996755599975586e-06, 1.8225982785224915e-06, 5.641952157020569e-06, 9.461306035518646e-06, 1.3280659914016724e-05, 1.71000137925148e-05, 2.091936767101288e-05, 2.4738721549510956e-05, 2.8558075428009033e-05, 3.237742930650711e-05, 3.619678318500519e-05, 4.0016137063503265e-05, 4.383549094200134e-05, 4.765484482049942e-05, 5.14741986989975e-05, 5.5293552577495575e-05, 5.911290645599365e-05, 6.293226033449173e-05, 6.675161421298981e-05, 7.057096809148788e-05, 7.439032196998596e-05, 7.820967584848404e-05, 8.202902972698212e-05, 8.58483836054802e-05, 8.966773748397827e-05, 9.348709136247635e-05, 9.730644524097443e-05, 0.0001011257991194725, 0.00010494515299797058, 0.00010876450687646866, 0.00011258386075496674, 0.00011640321463346481, 0.00012022256851196289]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 18.0, 29.0, 27.0, 51.0, 64.0, 81.0, 125.0, 166.0, 256.0, 355.0, 568.0, 884.0, 1394.0, 2582.0, 4734.0, 9539.0, 21286.0, 51463.0, 125017.0, 249112.0, 283611.0, 167871.0, 72660.0, 29706.0, 12859.0, 6065.0, 3140.0, 1802.0, 1070.0, 603.0, 428.0, 272.0, 188.0, 135.0, 111.0, 70.0, 60.0, 45.0, 23.0, 26.0, 14.0, 6.0, 5.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.017578125, -2.923828125, -2.830078125, -2.736328125, -2.642578125, -2.548828125, -2.455078125, -2.361328125, -2.267578125, -2.173828125, -2.080078125, -1.986328125, -1.892578125, -1.798828125, -1.705078125, -1.611328125, -1.517578125, -1.423828125, -1.330078125, -1.236328125, -1.142578125, -1.048828125, -0.955078125, -0.861328125, -0.767578125, -0.673828125, -0.580078125, -0.486328125, -0.392578125, -0.298828125, -0.205078125, -0.111328125, -0.017578125, 0.076171875, 0.169921875, 0.263671875, 0.357421875, 0.451171875, 0.544921875, 0.638671875, 0.732421875, 0.826171875, 0.919921875, 1.013671875, 1.107421875, 1.201171875, 1.294921875, 1.388671875, 1.482421875, 1.576171875, 1.669921875, 1.763671875, 1.857421875, 1.951171875, 2.044921875, 2.138671875, 2.232421875, 2.326171875, 2.419921875, 2.513671875, 2.607421875, 2.701171875, 2.794921875, 2.888671875, 2.982421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 10.0, 2.0, 6.0, 6.0, 8.0, 11.0, 15.0, 24.0, 21.0, 36.0, 41.0, 40.0, 49.0, 44.0, 58.0, 51.0, 70.0, 73.0, 65.0, 81.0, 60.0, 47.0, 36.0, 34.0, 27.0, 20.0, 12.0, 17.0, 10.0, 11.0, 3.0, 5.0, 1.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73095703125, -0.7072067260742188, -0.6834564208984375, -0.6597061157226562, -0.635955810546875, -0.6122055053710938, -0.5884552001953125, -0.5647048950195312, -0.54095458984375, -0.5172042846679688, -0.4934539794921875, -0.46970367431640625, -0.445953369140625, -0.42220306396484375, -0.3984527587890625, -0.37470245361328125, -0.3509521484375, -0.32720184326171875, -0.3034515380859375, -0.27970123291015625, -0.255950927734375, -0.23220062255859375, -0.2084503173828125, -0.18470001220703125, -0.16094970703125, -0.13719940185546875, -0.1134490966796875, -0.08969879150390625, -0.065948486328125, -0.04219818115234375, -0.0184478759765625, 0.00530242919921875, 0.029052734375, 0.05280303955078125, 0.0765533447265625, 0.10030364990234375, 0.124053955078125, 0.14780426025390625, 0.1715545654296875, 0.19530487060546875, 0.21905517578125, 0.24280548095703125, 0.2665557861328125, 0.29030609130859375, 0.314056396484375, 0.33780670166015625, 0.3615570068359375, 0.38530731201171875, 0.4090576171875, 0.43280792236328125, 0.4565582275390625, 0.48030853271484375, 0.504058837890625, 0.5278091430664062, 0.5515594482421875, 0.5753097534179688, 0.59906005859375, 0.6228103637695312, 0.6465606689453125, 0.6703109741210938, 0.694061279296875, 0.7178115844726562, 0.7415618896484375, 0.7653121948242188, 0.7890625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 12.0, 13.0, 12.0, 12.0, 29.0, 22.0, 32.0, 33.0, 35.0, 51.0, 65.0, 81.0, 62.0, 57.0, 71.0, 68.0, 55.0, 45.0, 45.0, 24.0, 35.0, 28.0, 21.0, 18.0, 14.0, 16.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.946721076965332, -6.700906276702881, -6.45509147644043, -6.2092766761779785, -5.963461875915527, -5.717647075653076, -5.471832275390625, -5.226017951965332, -4.980202674865723, -4.7343878746032715, -4.48857307434082, -4.242758274078369, -3.996943473815918, -3.751128673553467, -3.5053141117095947, -3.2594993114471436, -3.0136847496032715, -2.7678699493408203, -2.522055149078369, -2.276240348815918, -2.030425548553467, -1.7846108675003052, -1.5387961864471436, -1.2929813861846924, -1.0471665859222412, -0.80135178565979, -0.5555370450019836, -0.30972230434417725, -0.06390750408172607, 0.1819072961807251, 0.4277219772338867, 0.6735367774963379, 0.9193515777587891, 1.1651663780212402, 1.4109811782836914, 1.656795859336853, 1.9026106595993042, 2.148425579071045, 2.394240140914917, 2.640054941177368, 2.8858697414398193, 3.1316845417022705, 3.3774993419647217, 3.6233139038085938, 3.869128704071045, 4.114943504333496, 4.360758304595947, 4.606573104858398, 4.85238790512085, 5.098202705383301, 5.344017505645752, 5.589832305908203, 5.835647106170654, 6.0814619064331055, 6.327276229858398, 6.573091506958008, 6.818905830383301, 7.064720630645752, 7.310535430908203, 7.556350231170654, 7.8021650314331055, 8.047979354858398, 8.293794631958008, 8.5396089553833, 8.78542423248291]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 3.0, 3.0, 13.0, 9.0, 6.0, 9.0, 21.0, 16.0, 23.0, 26.0, 32.0, 25.0, 29.0, 31.0, 33.0, 31.0, 26.0, 38.0, 33.0, 50.0, 46.0, 38.0, 35.0, 41.0, 35.0, 32.0, 45.0, 27.0, 27.0, 21.0, 19.0, 23.0, 25.0, 16.0, 18.0, 12.0, 15.0, 6.0, 13.0, 9.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.334875106811523, -4.202536582946777, -4.070198059082031, -3.9378597736358643, -3.805521249771118, -3.673182725906372, -3.540844440460205, -3.408505916595459, -3.276167392730713, -3.143828868865967, -3.0114903450012207, -2.8791520595550537, -2.7468135356903076, -2.6144750118255615, -2.4821367263793945, -2.3497982025146484, -2.2174596786499023, -2.0851211547851562, -1.9527827501296997, -1.8204443454742432, -1.688105821609497, -1.555767297744751, -1.4234288930892944, -1.291090488433838, -1.1587519645690918, -1.0264134407043457, -0.8940750360488892, -0.7617365717887878, -0.6293981075286865, -0.4970596432685852, -0.3647211790084839, -0.23238271474838257, -0.10004377365112305, 0.03229469060897827, 0.1646331548690796, 0.2969716191291809, 0.4293100833892822, 0.5616485476493835, 0.6939870119094849, 0.8263254761695862, 0.9586639404296875, 1.0910024642944336, 1.2233408689498901, 1.3556792736053467, 1.4880177974700928, 1.6203563213348389, 1.7526947259902954, 1.885033130645752, 2.017371654510498, 2.149710178375244, 2.2820487022399902, 2.4143869876861572, 2.5467255115509033, 2.6790640354156494, 2.8114023208618164, 2.9437408447265625, 3.0760793685913086, 3.2084178924560547, 3.340756416320801, 3.4730947017669678, 3.605433225631714, 3.73777174949646, 3.870110034942627, 4.002448558807373, 4.134787082672119]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 8.0, 17.0, 41.0, 47.0, 62.0, 99.0, 146.0, 255.0, 369.0, 634.0, 979.0, 1593.0, 2405.0, 3961.0, 6251.0, 10430.0, 17000.0, 27843.0, 43573.0, 67312.0, 98482.0, 130243.0, 148541.0, 141621.0, 115425.0, 83227.0, 55409.0, 34979.0, 21884.0, 13669.0, 8302.0, 5214.0, 3156.0, 2000.0, 1283.0, 751.0, 479.0, 343.0, 179.0, 121.0, 81.0, 56.0, 32.0, 15.0, 11.0, 9.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.74481201171875, -3.6146240234375, -3.48443603515625, -3.354248046875, -3.22406005859375, -3.0938720703125, -2.96368408203125, -2.83349609375, -2.70330810546875, -2.5731201171875, -2.44293212890625, -2.312744140625, -2.18255615234375, -2.0523681640625, -1.92218017578125, -1.7919921875, -1.66180419921875, -1.5316162109375, -1.40142822265625, -1.271240234375, -1.14105224609375, -1.0108642578125, -0.88067626953125, -0.75048828125, -0.62030029296875, -0.4901123046875, -0.35992431640625, -0.229736328125, -0.09954833984375, 0.0306396484375, 0.16082763671875, 0.291015625, 0.42120361328125, 0.5513916015625, 0.68157958984375, 0.811767578125, 0.94195556640625, 1.0721435546875, 1.20233154296875, 1.33251953125, 1.46270751953125, 1.5928955078125, 1.72308349609375, 1.853271484375, 1.98345947265625, 2.1136474609375, 2.24383544921875, 2.3740234375, 2.50421142578125, 2.6343994140625, 2.76458740234375, 2.894775390625, 3.02496337890625, 3.1551513671875, 3.28533935546875, 3.41552734375, 3.54571533203125, 3.6759033203125, 3.80609130859375, 3.936279296875, 4.06646728515625, 4.1966552734375, 4.32684326171875, 4.45703125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 7.0, 7.0, 19.0, 10.0, 12.0, 12.0, 21.0, 28.0, 28.0, 41.0, 33.0, 35.0, 29.0, 46.0, 49.0, 47.0, 48.0, 34.0, 37.0, 46.0, 39.0, 37.0, 33.0, 39.0, 26.0, 31.0, 23.0, 26.0, 21.0, 20.0, 18.0, 17.0, 16.0, 13.0, 8.0, 6.0, 13.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.732421875, -4.58203125, -4.431640625, -4.28125, -4.130859375, -3.98046875, -3.830078125, -3.6796875, -3.529296875, -3.37890625, -3.228515625, -3.078125, -2.927734375, -2.77734375, -2.626953125, -2.4765625, -2.326171875, -2.17578125, -2.025390625, -1.875, -1.724609375, -1.57421875, -1.423828125, -1.2734375, -1.123046875, -0.97265625, -0.822265625, -0.671875, -0.521484375, -0.37109375, -0.220703125, -0.0703125, 0.080078125, 0.23046875, 0.380859375, 0.53125, 0.681640625, 0.83203125, 0.982421875, 1.1328125, 1.283203125, 1.43359375, 1.583984375, 1.734375, 1.884765625, 2.03515625, 2.185546875, 2.3359375, 2.486328125, 2.63671875, 2.787109375, 2.9375, 3.087890625, 3.23828125, 3.388671875, 3.5390625, 3.689453125, 3.83984375, 3.990234375, 4.140625, 4.291015625, 4.44140625, 4.591796875, 4.7421875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 12.0, 14.0, 18.0, 34.0, 44.0, 59.0, 88.0, 137.0, 223.0, 283.0, 464.0, 711.0, 1062.0, 1640.0, 2541.0, 3964.0, 5866.0, 9282.0, 14340.0, 22221.0, 34133.0, 51154.0, 74495.0, 101226.0, 126048.0, 136800.0, 127594.0, 103872.0, 76430.0, 53360.0, 35173.0, 22857.0, 14834.0, 9786.0, 6201.0, 4005.0, 2591.0, 1709.0, 1140.0, 698.0, 518.0, 352.0, 195.0, 128.0, 84.0, 62.0, 39.0, 17.0, 19.0, 12.0, 10.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.322845458984375, -3.21405029296875, -3.105255126953125, -2.9964599609375, -2.887664794921875, -2.77886962890625, -2.670074462890625, -2.561279296875, -2.452484130859375, -2.34368896484375, -2.234893798828125, -2.1260986328125, -2.017303466796875, -1.90850830078125, -1.799713134765625, -1.69091796875, -1.582122802734375, -1.47332763671875, -1.364532470703125, -1.2557373046875, -1.146942138671875, -1.03814697265625, -0.929351806640625, -0.820556640625, -0.711761474609375, -0.60296630859375, -0.494171142578125, -0.3853759765625, -0.276580810546875, -0.16778564453125, -0.058990478515625, 0.0498046875, 0.158599853515625, 0.26739501953125, 0.376190185546875, 0.4849853515625, 0.593780517578125, 0.70257568359375, 0.811370849609375, 0.920166015625, 1.028961181640625, 1.13775634765625, 1.246551513671875, 1.3553466796875, 1.464141845703125, 1.57293701171875, 1.681732177734375, 1.79052734375, 1.899322509765625, 2.00811767578125, 2.116912841796875, 2.2257080078125, 2.334503173828125, 2.44329833984375, 2.552093505859375, 2.660888671875, 2.769683837890625, 2.87847900390625, 2.987274169921875, 3.0960693359375, 3.204864501953125, 3.31365966796875, 3.422454833984375, 3.53125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 2.0, 12.0, 4.0, 8.0, 13.0, 20.0, 12.0, 24.0, 19.0, 32.0, 26.0, 28.0, 30.0, 50.0, 35.0, 45.0, 27.0, 46.0, 47.0, 50.0, 50.0, 37.0, 36.0, 37.0, 36.0, 33.0, 38.0, 27.0, 18.0, 27.0, 23.0, 21.0, 16.0, 8.0, 11.0, 14.0, 5.0, 4.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0], "bins": [-3.494140625, -3.397308349609375, -3.30047607421875, -3.203643798828125, -3.1068115234375, -3.009979248046875, -2.91314697265625, -2.816314697265625, -2.719482421875, -2.622650146484375, -2.52581787109375, -2.428985595703125, -2.3321533203125, -2.235321044921875, -2.13848876953125, -2.041656494140625, -1.94482421875, -1.847991943359375, -1.75115966796875, -1.654327392578125, -1.5574951171875, -1.460662841796875, -1.36383056640625, -1.266998291015625, -1.170166015625, -1.073333740234375, -0.97650146484375, -0.879669189453125, -0.7828369140625, -0.686004638671875, -0.58917236328125, -0.492340087890625, -0.3955078125, -0.298675537109375, -0.20184326171875, -0.105010986328125, -0.0081787109375, 0.088653564453125, 0.18548583984375, 0.282318115234375, 0.379150390625, 0.475982666015625, 0.57281494140625, 0.669647216796875, 0.7664794921875, 0.863311767578125, 0.96014404296875, 1.056976318359375, 1.15380859375, 1.250640869140625, 1.34747314453125, 1.444305419921875, 1.5411376953125, 1.637969970703125, 1.73480224609375, 1.831634521484375, 1.928466796875, 2.025299072265625, 2.12213134765625, 2.218963623046875, 2.3157958984375, 2.412628173828125, 2.50946044921875, 2.606292724609375, 2.703125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 11.0, 10.0, 12.0, 19.0, 48.0, 74.0, 95.0, 119.0, 231.0, 357.0, 623.0, 1070.0, 1842.0, 3090.0, 5617.0, 10415.0, 19125.0, 36554.0, 66929.0, 116073.0, 173721.0, 201441.0, 167081.0, 108458.0, 62029.0, 33832.0, 17896.0, 9559.0, 5290.0, 2911.0, 1596.0, 915.0, 596.0, 340.0, 200.0, 138.0, 83.0, 48.0, 31.0, 25.0, 17.0, 13.0, 6.0, 4.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.17578125, -3.08355712890625, -2.9913330078125, -2.89910888671875, -2.806884765625, -2.71466064453125, -2.6224365234375, -2.53021240234375, -2.43798828125, -2.34576416015625, -2.2535400390625, -2.16131591796875, -2.069091796875, -1.97686767578125, -1.8846435546875, -1.79241943359375, -1.7001953125, -1.60797119140625, -1.5157470703125, -1.42352294921875, -1.331298828125, -1.23907470703125, -1.1468505859375, -1.05462646484375, -0.96240234375, -0.87017822265625, -0.7779541015625, -0.68572998046875, -0.593505859375, -0.50128173828125, -0.4090576171875, -0.31683349609375, -0.224609375, -0.13238525390625, -0.0401611328125, 0.05206298828125, 0.144287109375, 0.23651123046875, 0.3287353515625, 0.42095947265625, 0.51318359375, 0.60540771484375, 0.6976318359375, 0.78985595703125, 0.882080078125, 0.97430419921875, 1.0665283203125, 1.15875244140625, 1.2509765625, 1.34320068359375, 1.4354248046875, 1.52764892578125, 1.619873046875, 1.71209716796875, 1.8043212890625, 1.89654541015625, 1.98876953125, 2.08099365234375, 2.1732177734375, 2.26544189453125, 2.357666015625, 2.44989013671875, 2.5421142578125, 2.63433837890625, 2.7265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 7.0, 17.0, 18.0, 21.0, 22.0, 38.0, 51.0, 53.0, 81.0, 60.0, 70.0, 75.0, 62.0, 57.0, 64.0, 58.0, 45.0, 36.0, 40.0, 29.0, 27.0, 13.0, 10.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029468536376953125, -0.00028483569622039795, -0.00027498602867126465, -0.00026513636112213135, -0.00025528669357299805, -0.00024543702602386475, -0.00023558735847473145, -0.00022573769092559814, -0.00021588802337646484, -0.00020603835582733154, -0.00019618868827819824, -0.00018633902072906494, -0.00017648935317993164, -0.00016663968563079834, -0.00015679001808166504, -0.00014694035053253174, -0.00013709068298339844, -0.00012724101543426514, -0.00011739134788513184, -0.00010754168033599854, -9.769201278686523e-05, -8.784234523773193e-05, -7.799267768859863e-05, -6.814301013946533e-05, -5.829334259033203e-05, -4.844367504119873e-05, -3.859400749206543e-05, -2.874433994293213e-05, -1.8894672393798828e-05, -9.045004844665527e-06, 8.046627044677734e-07, 1.0654330253601074e-05, 2.0503997802734375e-05, 3.0353665351867676e-05, 4.0203332901000977e-05, 5.005300045013428e-05, 5.990266799926758e-05, 6.975233554840088e-05, 7.960200309753418e-05, 8.945167064666748e-05, 9.930133819580078e-05, 0.00010915100574493408, 0.00011900067329406738, 0.00012885034084320068, 0.00013870000839233398, 0.00014854967594146729, 0.00015839934349060059, 0.0001682490110397339, 0.0001780986785888672, 0.0001879483461380005, 0.0001977980136871338, 0.0002076476812362671, 0.0002174973487854004, 0.0002273470163345337, 0.000237196683883667, 0.0002470463514328003, 0.0002568960189819336, 0.0002667456865310669, 0.0002765953540802002, 0.0002864450216293335, 0.0002962946891784668, 0.0003061443567276001, 0.0003159940242767334, 0.0003258436918258667, 0.000335693359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 26.0, 44.0, 57.0, 77.0, 98.0, 151.0, 255.0, 356.0, 544.0, 856.0, 1327.0, 2157.0, 3420.0, 5691.0, 9428.0, 15817.0, 26063.0, 43444.0, 69710.0, 105108.0, 140381.0, 158396.0, 147279.0, 114396.0, 77895.0, 49458.0, 30129.0, 18168.0, 10800.0, 6574.0, 3841.0, 2344.0, 1507.0, 930.0, 587.0, 375.0, 267.0, 173.0, 113.0, 91.0, 57.0, 41.0, 33.0, 17.0, 12.0, 5.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.328125, -2.25677490234375, -2.1854248046875, -2.11407470703125, -2.042724609375, -1.97137451171875, -1.9000244140625, -1.82867431640625, -1.75732421875, -1.68597412109375, -1.6146240234375, -1.54327392578125, -1.471923828125, -1.40057373046875, -1.3292236328125, -1.25787353515625, -1.1865234375, -1.11517333984375, -1.0438232421875, -0.97247314453125, -0.901123046875, -0.82977294921875, -0.7584228515625, -0.68707275390625, -0.61572265625, -0.54437255859375, -0.4730224609375, -0.40167236328125, -0.330322265625, -0.25897216796875, -0.1876220703125, -0.11627197265625, -0.044921875, 0.02642822265625, 0.0977783203125, 0.16912841796875, 0.240478515625, 0.31182861328125, 0.3831787109375, 0.45452880859375, 0.52587890625, 0.59722900390625, 0.6685791015625, 0.73992919921875, 0.811279296875, 0.88262939453125, 0.9539794921875, 1.02532958984375, 1.0966796875, 1.16802978515625, 1.2393798828125, 1.31072998046875, 1.382080078125, 1.45343017578125, 1.5247802734375, 1.59613037109375, 1.66748046875, 1.73883056640625, 1.8101806640625, 1.88153076171875, 1.952880859375, 2.02423095703125, 2.0955810546875, 2.16693115234375, 2.23828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 3.0, 6.0, 9.0, 13.0, 17.0, 25.0, 25.0, 32.0, 30.0, 37.0, 46.0, 54.0, 47.0, 63.0, 53.0, 67.0, 48.0, 47.0, 49.0, 56.0, 37.0, 47.0, 28.0, 28.0, 25.0, 21.0, 15.0, 10.0, 12.0, 5.0, 10.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8075103759765625, -0.781036376953125, -0.7545623779296875, -0.72808837890625, -0.7016143798828125, -0.675140380859375, -0.6486663818359375, -0.6221923828125, -0.5957183837890625, -0.569244384765625, -0.5427703857421875, -0.51629638671875, -0.4898223876953125, -0.463348388671875, -0.4368743896484375, -0.410400390625, -0.3839263916015625, -0.357452392578125, -0.3309783935546875, -0.30450439453125, -0.2780303955078125, -0.251556396484375, -0.2250823974609375, -0.1986083984375, -0.1721343994140625, -0.145660400390625, -0.1191864013671875, -0.09271240234375, -0.0662384033203125, -0.039764404296875, -0.0132904052734375, 0.01318359375, 0.0396575927734375, 0.066131591796875, 0.0926055908203125, 0.11907958984375, 0.1455535888671875, 0.172027587890625, 0.1985015869140625, 0.2249755859375, 0.2514495849609375, 0.277923583984375, 0.3043975830078125, 0.33087158203125, 0.3573455810546875, 0.383819580078125, 0.4102935791015625, 0.436767578125, 0.4632415771484375, 0.489715576171875, 0.5161895751953125, 0.54266357421875, 0.5691375732421875, 0.595611572265625, 0.6220855712890625, 0.6485595703125, 0.6750335693359375, 0.701507568359375, 0.7279815673828125, 0.75445556640625, 0.7809295654296875, 0.807403564453125, 0.8338775634765625, 0.8603515625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 5.0, 5.0, 6.0, 7.0, 7.0, 9.0, 14.0, 11.0, 17.0, 28.0, 31.0, 29.0, 25.0, 38.0, 48.0, 57.0, 57.0, 48.0, 55.0, 66.0, 69.0, 50.0, 45.0, 39.0, 36.0, 40.0, 21.0, 18.0, 30.0, 14.0, 8.0, 13.0, 10.0, 9.0, 9.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.236756324768066, -7.029432773590088, -6.822109699249268, -6.614786148071289, -6.407463073730469, -6.20013952255249, -5.992815971374512, -5.785492897033691, -5.578169822692871, -5.370846271514893, -5.163523197174072, -4.956199645996094, -4.748876571655273, -4.541553020477295, -4.334229469299316, -4.126906394958496, -3.9195828437805176, -3.712259531021118, -3.5049362182617188, -3.2976126670837402, -3.09028959274292, -2.8829660415649414, -2.675642728805542, -2.4683194160461426, -2.260996103286743, -2.0536727905273438, -1.8463494777679443, -1.6390260457992554, -1.431702733039856, -1.2243794202804565, -1.0170559883117676, -0.8097326755523682, -0.602409839630127, -0.39508649706840515, -0.18776315450668335, 0.01956021785736084, 0.22688353061676025, 0.43420684337615967, 0.6415302753448486, 0.848853588104248, 1.0561769008636475, 1.2635002136230469, 1.4708235263824463, 1.6781469583511353, 1.8854702711105347, 2.0927934646606445, 2.300117015838623, 2.5074403285980225, 2.714763641357422, 2.9220869541168213, 3.1294102668762207, 3.336733818054199, 3.5440568923950195, 3.751380443572998, 3.9587037563323975, 4.166027069091797, 4.373350143432617, 4.580673694610596, 4.787996768951416, 4.9953203201293945, 5.202643394470215, 5.409966945648193, 5.617290496826172, 5.824613571166992, 6.031937122344971]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 20.0, 15.0, 19.0, 22.0, 31.0, 24.0, 28.0, 18.0, 33.0, 29.0, 40.0, 24.0, 40.0, 36.0, 45.0, 42.0, 33.0, 31.0, 41.0, 45.0, 27.0, 34.0, 33.0, 30.0, 40.0, 28.0, 27.0, 22.0, 26.0, 13.0, 14.0, 8.0, 2.0, 12.0, 10.0, 6.0, 5.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.626706600189209, -4.494546890258789, -4.362387657165527, -4.230227947235107, -4.0980682373046875, -3.9659087657928467, -3.833749294281006, -3.701589584350586, -3.569430112838745, -3.4372706413269043, -3.3051109313964844, -3.1729514598846436, -3.0407919883728027, -2.908632278442383, -2.776472806930542, -2.644313335418701, -2.5121536254882812, -2.3799941539764404, -2.2478344440460205, -2.1156749725341797, -1.9835153818130493, -1.851355791091919, -1.7191963195800781, -1.5870367288589478, -1.4548771381378174, -1.322717547416687, -1.1905579566955566, -1.0583984851837158, -0.9262388944625854, -0.7940793037414551, -0.6619197726249695, -0.5297602415084839, -0.3976008892059326, -0.26544132828712463, -0.13328176736831665, -0.001122206449508667, 0.13103735446929932, 0.2631969451904297, 0.3953564763069153, 0.5275160074234009, 0.6596755981445312, 0.7918351888656616, 0.9239947199821472, 1.0561542510986328, 1.1883138418197632, 1.3204734325408936, 1.4526329040527344, 1.5847924947738647, 1.7169520854949951, 1.8491116762161255, 1.9812712669372559, 2.1134307384490967, 2.2455902099609375, 2.3777499198913574, 2.5099093914031982, 2.642068862915039, 2.774228572845459, 2.9063880443573, 3.0385477542877197, 3.1707072257995605, 3.3028669357299805, 3.4350264072418213, 3.567185878753662, 3.699345588684082, 3.831505060195923]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 11.0, 9.0, 13.0, 18.0, 26.0, 31.0, 43.0, 64.0, 101.0, 120.0, 184.0, 233.0, 341.0, 459.0, 729.0, 1041.0, 1559.0, 2314.0, 3691.0, 5992.0, 9715.0, 16304.0, 29938.0, 56523.0, 116635.0, 260214.0, 602316.0, 1091987.0, 1026853.0, 522785.0, 224801.0, 101313.0, 50034.0, 26780.0, 15258.0, 8953.0, 5745.0, 3697.0, 2425.0, 1585.0, 1076.0, 743.0, 512.0, 363.0, 235.0, 170.0, 132.0, 75.0, 47.0, 28.0, 22.0, 19.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-5.9609375, -5.76812744140625, -5.5753173828125, -5.38250732421875, -5.189697265625, -4.99688720703125, -4.8040771484375, -4.61126708984375, -4.41845703125, -4.22564697265625, -4.0328369140625, -3.84002685546875, -3.647216796875, -3.45440673828125, -3.2615966796875, -3.06878662109375, -2.8759765625, -2.68316650390625, -2.4903564453125, -2.29754638671875, -2.104736328125, -1.91192626953125, -1.7191162109375, -1.52630615234375, -1.33349609375, -1.14068603515625, -0.9478759765625, -0.75506591796875, -0.562255859375, -0.36944580078125, -0.1766357421875, 0.01617431640625, 0.208984375, 0.40179443359375, 0.5946044921875, 0.78741455078125, 0.980224609375, 1.17303466796875, 1.3658447265625, 1.55865478515625, 1.75146484375, 1.94427490234375, 2.1370849609375, 2.32989501953125, 2.522705078125, 2.71551513671875, 2.9083251953125, 3.10113525390625, 3.2939453125, 3.48675537109375, 3.6795654296875, 3.87237548828125, 4.065185546875, 4.25799560546875, 4.4508056640625, 4.64361572265625, 4.83642578125, 5.02923583984375, 5.2220458984375, 5.41485595703125, 5.607666015625, 5.80047607421875, 5.9932861328125, 6.18609619140625, 6.37890625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 3.0, 15.0, 20.0, 13.0, 18.0, 14.0, 18.0, 27.0, 22.0, 31.0, 30.0, 35.0, 35.0, 35.0, 42.0, 36.0, 38.0, 35.0, 37.0, 40.0, 30.0, 41.0, 46.0, 32.0, 28.0, 35.0, 30.0, 27.0, 26.0, 26.0, 19.0, 24.0, 9.0, 13.0, 8.0, 7.0, 3.0, 9.0, 10.0, 2.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.208984375, -3.1156005859375, -3.022216796875, -2.9288330078125, -2.83544921875, -2.7420654296875, -2.648681640625, -2.5552978515625, -2.4619140625, -2.3685302734375, -2.275146484375, -2.1817626953125, -2.08837890625, -1.9949951171875, -1.901611328125, -1.8082275390625, -1.71484375, -1.6214599609375, -1.528076171875, -1.4346923828125, -1.34130859375, -1.2479248046875, -1.154541015625, -1.0611572265625, -0.9677734375, -0.8743896484375, -0.781005859375, -0.6876220703125, -0.59423828125, -0.5008544921875, -0.407470703125, -0.3140869140625, -0.220703125, -0.1273193359375, -0.033935546875, 0.0594482421875, 0.15283203125, 0.2462158203125, 0.339599609375, 0.4329833984375, 0.5263671875, 0.6197509765625, 0.713134765625, 0.8065185546875, 0.89990234375, 0.9932861328125, 1.086669921875, 1.1800537109375, 1.2734375, 1.3668212890625, 1.460205078125, 1.5535888671875, 1.64697265625, 1.7403564453125, 1.833740234375, 1.9271240234375, 2.0205078125, 2.1138916015625, 2.207275390625, 2.3006591796875, 2.39404296875, 2.4874267578125, 2.580810546875, 2.6741943359375, 2.767578125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 15.0, 17.0, 36.0, 45.0, 82.0, 106.0, 139.0, 197.0, 298.0, 525.0, 698.0, 1092.0, 1686.0, 2596.0, 4258.0, 7014.0, 12012.0, 21160.0, 38590.0, 73354.0, 146840.0, 306561.0, 649361.0, 1115431.0, 914014.0, 456359.0, 213921.0, 104749.0, 54034.0, 28682.0, 16049.0, 9339.0, 5481.0, 3427.0, 2086.0, 1373.0, 829.0, 577.0, 375.0, 274.0, 176.0, 129.0, 97.0, 56.0, 44.0, 31.0, 18.0, 14.0, 11.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.64453125, -6.44171142578125, -6.2388916015625, -6.03607177734375, -5.833251953125, -5.63043212890625, -5.4276123046875, -5.22479248046875, -5.02197265625, -4.81915283203125, -4.6163330078125, -4.41351318359375, -4.210693359375, -4.00787353515625, -3.8050537109375, -3.60223388671875, -3.3994140625, -3.19659423828125, -2.9937744140625, -2.79095458984375, -2.588134765625, -2.38531494140625, -2.1824951171875, -1.97967529296875, -1.77685546875, -1.57403564453125, -1.3712158203125, -1.16839599609375, -0.965576171875, -0.76275634765625, -0.5599365234375, -0.35711669921875, -0.154296875, 0.04852294921875, 0.2513427734375, 0.45416259765625, 0.656982421875, 0.85980224609375, 1.0626220703125, 1.26544189453125, 1.46826171875, 1.67108154296875, 1.8739013671875, 2.07672119140625, 2.279541015625, 2.48236083984375, 2.6851806640625, 2.88800048828125, 3.0908203125, 3.29364013671875, 3.4964599609375, 3.69927978515625, 3.902099609375, 4.10491943359375, 4.3077392578125, 4.51055908203125, 4.71337890625, 4.91619873046875, 5.1190185546875, 5.32183837890625, 5.524658203125, 5.72747802734375, 5.9302978515625, 6.13311767578125, 6.3359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 15.0, 16.0, 23.0, 26.0, 27.0, 44.0, 60.0, 61.0, 93.0, 107.0, 163.0, 200.0, 246.0, 239.0, 284.0, 316.0, 328.0, 317.0, 266.0, 224.0, 179.0, 156.0, 133.0, 113.0, 86.0, 67.0, 60.0, 34.0, 38.0, 19.0, 22.0, 20.0, 16.0, 14.0, 11.0, 8.0, 0.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.1015625, -2.038299560546875, -1.97503662109375, -1.911773681640625, -1.8485107421875, -1.785247802734375, -1.72198486328125, -1.658721923828125, -1.595458984375, -1.532196044921875, -1.46893310546875, -1.405670166015625, -1.3424072265625, -1.279144287109375, -1.21588134765625, -1.152618408203125, -1.08935546875, -1.026092529296875, -0.96282958984375, -0.899566650390625, -0.8363037109375, -0.773040771484375, -0.70977783203125, -0.646514892578125, -0.583251953125, -0.519989013671875, -0.45672607421875, -0.393463134765625, -0.3302001953125, -0.266937255859375, -0.20367431640625, -0.140411376953125, -0.0771484375, -0.013885498046875, 0.04937744140625, 0.112640380859375, 0.1759033203125, 0.239166259765625, 0.30242919921875, 0.365692138671875, 0.428955078125, 0.492218017578125, 0.55548095703125, 0.618743896484375, 0.6820068359375, 0.745269775390625, 0.80853271484375, 0.871795654296875, 0.93505859375, 0.998321533203125, 1.06158447265625, 1.124847412109375, 1.1881103515625, 1.251373291015625, 1.31463623046875, 1.377899169921875, 1.441162109375, 1.504425048828125, 1.56768798828125, 1.630950927734375, 1.6942138671875, 1.757476806640625, 1.82073974609375, 1.884002685546875, 1.947265625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 12.0, 8.0, 6.0, 14.0, 12.0, 29.0, 27.0, 27.0, 30.0, 38.0, 41.0, 58.0, 67.0, 59.0, 78.0, 69.0, 64.0, 58.0, 43.0, 46.0, 52.0, 34.0, 22.0, 15.0, 18.0, 16.0, 8.0, 9.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.33729362487793, -7.110114097595215, -6.8829345703125, -6.655755043029785, -6.42857551574707, -6.2013959884643555, -5.974216461181641, -5.747036457061768, -5.519856929779053, -5.292677402496338, -5.065497875213623, -4.838318347930908, -4.611138820648193, -4.38395881652832, -4.1567792892456055, -3.9295997619628906, -3.702420473098755, -3.47524094581604, -3.248061418533325, -3.0208816528320312, -2.7937021255493164, -2.5665225982666016, -2.3393430709838867, -2.112163543701172, -1.8849838972091675, -1.6578043699264526, -1.4306247234344482, -1.2034451961517334, -0.9762656092643738, -0.7490860223770142, -0.5219064950942993, -0.2947268486022949, -0.06754732131958008, 0.15963225066661835, 0.3868118226528168, 0.613991379737854, 0.8411709666252136, 1.0683505535125732, 1.295530080795288, 1.5227097272872925, 1.7498892545700073, 1.9770687818527222, 2.2042484283447266, 2.4314279556274414, 2.6586074829101562, 2.885787010192871, 3.112966537475586, 3.34014630317688, 3.5673258304595947, 3.7945053577423096, 4.0216851234436035, 4.248864650726318, 4.476044178009033, 4.703223705291748, 4.930403232574463, 5.157582759857178, 5.384762287139893, 5.611941814422607, 5.839121341705322, 6.066300868988037, 6.293480396270752, 6.520660400390625, 6.74783992767334, 6.975019454956055, 7.2021989822387695]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 5.0, 7.0, 10.0, 14.0, 13.0, 17.0, 13.0, 16.0, 17.0, 24.0, 25.0, 30.0, 29.0, 36.0, 23.0, 28.0, 35.0, 46.0, 41.0, 39.0, 41.0, 30.0, 26.0, 33.0, 35.0, 42.0, 33.0, 39.0, 24.0, 27.0, 30.0, 19.0, 17.0, 19.0, 13.0, 12.0, 12.0, 15.0, 11.0, 12.0, 7.0, 3.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4900124073028564, -3.37502384185791, -3.2600350379943848, -3.1450464725494385, -3.030057668685913, -2.915069103240967, -2.8000802993774414, -2.685091733932495, -2.570103168487549, -2.4551146030426025, -2.340125799179077, -2.225137233734131, -2.1101484298706055, -1.9951598644256592, -1.8801711797714233, -1.7651824951171875, -1.650193691253662, -1.5352050065994263, -1.4202163219451904, -1.3052277565002441, -1.1902389526367188, -1.0752503871917725, -0.9602617025375366, -0.8452730178833008, -0.7302843332290649, -0.6152956485748291, -0.5003069639205933, -0.3853183388710022, -0.27032965421676636, -0.15534096956253052, -0.04035234451293945, 0.07463634014129639, 0.18962502479553223, 0.30461370944976807, 0.4196023643016815, 0.534591019153595, 0.6495797038078308, 0.7645683884620667, 0.8795570135116577, 0.9945456981658936, 1.1095343828201294, 1.2245230674743652, 1.339511752128601, 1.454500436782837, 1.5694890022277832, 1.6844778060913086, 1.7994663715362549, 1.9144550561904907, 2.0294437408447266, 2.144432306289673, 2.2594211101531982, 2.3744096755981445, 2.48939847946167, 2.604387044906616, 2.7193756103515625, 2.834364414215088, 2.9493532180786133, 3.0643417835235596, 3.179330587387085, 3.2943191528320312, 3.4093079566955566, 3.524296522140503, 3.639285087585449, 3.7542738914489746, 3.869262456893921]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 10.0, 8.0, 12.0, 22.0, 17.0, 45.0, 41.0, 66.0, 101.0, 181.0, 227.0, 371.0, 567.0, 918.0, 1568.0, 2902.0, 5948.0, 12240.0, 27831.0, 65342.0, 146070.0, 256771.0, 258499.0, 148325.0, 66591.0, 28422.0, 12339.0, 5801.0, 2977.0, 1627.0, 933.0, 605.0, 348.0, 255.0, 184.0, 118.0, 84.0, 49.0, 38.0, 34.0, 19.0, 6.0, 5.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-5.046875, -4.88922119140625, -4.7315673828125, -4.57391357421875, -4.416259765625, -4.25860595703125, -4.1009521484375, -3.94329833984375, -3.78564453125, -3.62799072265625, -3.4703369140625, -3.31268310546875, -3.155029296875, -2.99737548828125, -2.8397216796875, -2.68206787109375, -2.5244140625, -2.36676025390625, -2.2091064453125, -2.05145263671875, -1.893798828125, -1.73614501953125, -1.5784912109375, -1.42083740234375, -1.26318359375, -1.10552978515625, -0.9478759765625, -0.79022216796875, -0.632568359375, -0.47491455078125, -0.3172607421875, -0.15960693359375, -0.001953125, 0.15570068359375, 0.3133544921875, 0.47100830078125, 0.628662109375, 0.78631591796875, 0.9439697265625, 1.10162353515625, 1.25927734375, 1.41693115234375, 1.5745849609375, 1.73223876953125, 1.889892578125, 2.04754638671875, 2.2052001953125, 2.36285400390625, 2.5205078125, 2.67816162109375, 2.8358154296875, 2.99346923828125, 3.151123046875, 3.30877685546875, 3.4664306640625, 3.62408447265625, 3.78173828125, 3.93939208984375, 4.0970458984375, 4.25469970703125, 4.412353515625, 4.57000732421875, 4.7276611328125, 4.88531494140625, 5.04296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 2.0, 10.0, 14.0, 16.0, 9.0, 13.0, 21.0, 18.0, 21.0, 24.0, 19.0, 41.0, 30.0, 28.0, 41.0, 36.0, 37.0, 39.0, 45.0, 39.0, 36.0, 39.0, 37.0, 39.0, 35.0, 32.0, 31.0, 25.0, 29.0, 29.0, 22.0, 20.0, 16.0, 16.0, 9.0, 15.0, 13.0, 10.0, 8.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.818359375, -3.690521240234375, -3.56268310546875, -3.434844970703125, -3.3070068359375, -3.179168701171875, -3.05133056640625, -2.923492431640625, -2.795654296875, -2.667816162109375, -2.53997802734375, -2.412139892578125, -2.2843017578125, -2.156463623046875, -2.02862548828125, -1.900787353515625, -1.77294921875, -1.645111083984375, -1.51727294921875, -1.389434814453125, -1.2615966796875, -1.133758544921875, -1.00592041015625, -0.878082275390625, -0.750244140625, -0.622406005859375, -0.49456787109375, -0.366729736328125, -0.2388916015625, -0.111053466796875, 0.01678466796875, 0.144622802734375, 0.2724609375, 0.400299072265625, 0.52813720703125, 0.655975341796875, 0.7838134765625, 0.911651611328125, 1.03948974609375, 1.167327880859375, 1.295166015625, 1.423004150390625, 1.55084228515625, 1.678680419921875, 1.8065185546875, 1.934356689453125, 2.06219482421875, 2.190032958984375, 2.31787109375, 2.445709228515625, 2.57354736328125, 2.701385498046875, 2.8292236328125, 2.957061767578125, 3.08489990234375, 3.212738037109375, 3.340576171875, 3.468414306640625, 3.59625244140625, 3.724090576171875, 3.8519287109375, 3.979766845703125, 4.10760498046875, 4.235443115234375, 4.36328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 11.0, 7.0, 11.0, 24.0, 32.0, 38.0, 44.0, 93.0, 113.0, 172.0, 280.0, 370.0, 594.0, 1073.0, 1751.0, 3026.0, 5976.0, 11974.0, 25643.0, 59425.0, 137638.0, 271998.0, 275554.0, 140478.0, 60043.0, 26306.0, 11978.0, 6074.0, 3128.0, 1796.0, 1047.0, 622.0, 388.0, 258.0, 186.0, 123.0, 71.0, 61.0, 36.0, 39.0, 25.0, 16.0, 7.0, 6.0, 12.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.84765625, -5.66497802734375, -5.4822998046875, -5.29962158203125, -5.116943359375, -4.93426513671875, -4.7515869140625, -4.56890869140625, -4.38623046875, -4.20355224609375, -4.0208740234375, -3.83819580078125, -3.655517578125, -3.47283935546875, -3.2901611328125, -3.10748291015625, -2.9248046875, -2.74212646484375, -2.5594482421875, -2.37677001953125, -2.194091796875, -2.01141357421875, -1.8287353515625, -1.64605712890625, -1.46337890625, -1.28070068359375, -1.0980224609375, -0.91534423828125, -0.732666015625, -0.54998779296875, -0.3673095703125, -0.18463134765625, -0.001953125, 0.18072509765625, 0.3634033203125, 0.54608154296875, 0.728759765625, 0.91143798828125, 1.0941162109375, 1.27679443359375, 1.45947265625, 1.64215087890625, 1.8248291015625, 2.00750732421875, 2.190185546875, 2.37286376953125, 2.5555419921875, 2.73822021484375, 2.9208984375, 3.10357666015625, 3.2862548828125, 3.46893310546875, 3.651611328125, 3.83428955078125, 4.0169677734375, 4.19964599609375, 4.38232421875, 4.56500244140625, 4.7476806640625, 4.93035888671875, 5.113037109375, 5.29571533203125, 5.4783935546875, 5.66107177734375, 5.84375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 1.0, 5.0, 7.0, 10.0, 11.0, 12.0, 13.0, 9.0, 15.0, 18.0, 32.0, 24.0, 32.0, 28.0, 26.0, 53.0, 35.0, 38.0, 51.0, 46.0, 33.0, 39.0, 31.0, 39.0, 49.0, 42.0, 37.0, 34.0, 29.0, 32.0, 21.0, 27.0, 15.0, 19.0, 16.0, 7.0, 18.0, 6.0, 10.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.693359375, -2.61199951171875, -2.5306396484375, -2.44927978515625, -2.367919921875, -2.28656005859375, -2.2052001953125, -2.12384033203125, -2.04248046875, -1.96112060546875, -1.8797607421875, -1.79840087890625, -1.717041015625, -1.63568115234375, -1.5543212890625, -1.47296142578125, -1.3916015625, -1.31024169921875, -1.2288818359375, -1.14752197265625, -1.066162109375, -0.98480224609375, -0.9034423828125, -0.82208251953125, -0.74072265625, -0.65936279296875, -0.5780029296875, -0.49664306640625, -0.415283203125, -0.33392333984375, -0.2525634765625, -0.17120361328125, -0.08984375, -0.00848388671875, 0.0728759765625, 0.15423583984375, 0.235595703125, 0.31695556640625, 0.3983154296875, 0.47967529296875, 0.56103515625, 0.64239501953125, 0.7237548828125, 0.80511474609375, 0.886474609375, 0.96783447265625, 1.0491943359375, 1.13055419921875, 1.2119140625, 1.29327392578125, 1.3746337890625, 1.45599365234375, 1.537353515625, 1.61871337890625, 1.7000732421875, 1.78143310546875, 1.86279296875, 1.94415283203125, 2.0255126953125, 2.10687255859375, 2.188232421875, 2.26959228515625, 2.3509521484375, 2.43231201171875, 2.513671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 11.0, 10.0, 11.0, 11.0, 17.0, 21.0, 35.0, 58.0, 81.0, 116.0, 152.0, 214.0, 355.0, 581.0, 1013.0, 1610.0, 2937.0, 5401.0, 10601.0, 22353.0, 48793.0, 111684.0, 236408.0, 296435.0, 168395.0, 75114.0, 33306.0, 15526.0, 7697.0, 4071.0, 2200.0, 1237.0, 730.0, 433.0, 319.0, 195.0, 135.0, 99.0, 53.0, 44.0, 28.0, 21.0, 14.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.509765625, -2.429473876953125, -2.34918212890625, -2.268890380859375, -2.1885986328125, -2.108306884765625, -2.02801513671875, -1.947723388671875, -1.867431640625, -1.787139892578125, -1.70684814453125, -1.626556396484375, -1.5462646484375, -1.465972900390625, -1.38568115234375, -1.305389404296875, -1.22509765625, -1.144805908203125, -1.06451416015625, -0.984222412109375, -0.9039306640625, -0.823638916015625, -0.74334716796875, -0.663055419921875, -0.582763671875, -0.502471923828125, -0.42218017578125, -0.341888427734375, -0.2615966796875, -0.181304931640625, -0.10101318359375, -0.020721435546875, 0.0595703125, 0.139862060546875, 0.22015380859375, 0.300445556640625, 0.3807373046875, 0.461029052734375, 0.54132080078125, 0.621612548828125, 0.701904296875, 0.782196044921875, 0.86248779296875, 0.942779541015625, 1.0230712890625, 1.103363037109375, 1.18365478515625, 1.263946533203125, 1.34423828125, 1.424530029296875, 1.50482177734375, 1.585113525390625, 1.6654052734375, 1.745697021484375, 1.82598876953125, 1.906280517578125, 1.986572265625, 2.066864013671875, 2.14715576171875, 2.227447509765625, 2.3077392578125, 2.388031005859375, 2.46832275390625, 2.548614501953125, 2.62890625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 1.0, 7.0, 5.0, 5.0, 5.0, 10.0, 9.0, 14.0, 13.0, 9.0, 21.0, 27.0, 26.0, 27.0, 30.0, 54.0, 42.0, 65.0, 53.0, 48.0, 57.0, 53.0, 54.0, 52.0, 59.0, 43.0, 31.0, 21.0, 38.0, 22.0, 19.0, 14.0, 17.0, 12.0, 11.0, 0.0, 6.0, 7.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.98377799987793e-05, -9.724870324134827e-05, -9.465962648391724e-05, -9.20705497264862e-05, -8.948147296905518e-05, -8.689239621162415e-05, -8.430331945419312e-05, -8.171424269676208e-05, -7.912516593933105e-05, -7.653608918190002e-05, -7.3947012424469e-05, -7.135793566703796e-05, -6.876885890960693e-05, -6.61797821521759e-05, -6.359070539474487e-05, -6.100162863731384e-05, -5.841255187988281e-05, -5.582347512245178e-05, -5.323439836502075e-05, -5.064532160758972e-05, -4.805624485015869e-05, -4.546716809272766e-05, -4.287809133529663e-05, -4.02890145778656e-05, -3.769993782043457e-05, -3.511086106300354e-05, -3.252178430557251e-05, -2.993270754814148e-05, -2.734363079071045e-05, -2.475455403327942e-05, -2.216547727584839e-05, -1.957640051841736e-05, -1.6987323760986328e-05, -1.4398247003555298e-05, -1.1809170246124268e-05, -9.220093488693237e-06, -6.631016731262207e-06, -4.041939973831177e-06, -1.4528632164001465e-06, 1.1362135410308838e-06, 3.725290298461914e-06, 6.314367055892944e-06, 8.903443813323975e-06, 1.1492520570755005e-05, 1.4081597328186035e-05, 1.6670674085617065e-05, 1.9259750843048096e-05, 2.1848827600479126e-05, 2.4437904357910156e-05, 2.7026981115341187e-05, 2.9616057872772217e-05, 3.220513463020325e-05, 3.479421138763428e-05, 3.738328814506531e-05, 3.997236490249634e-05, 4.256144165992737e-05, 4.51505184173584e-05, 4.773959517478943e-05, 5.032867193222046e-05, 5.291774868965149e-05, 5.550682544708252e-05, 5.809590220451355e-05, 6.068497896194458e-05, 6.327405571937561e-05, 6.586313247680664e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 11.0, 22.0, 22.0, 53.0, 69.0, 143.0, 258.0, 391.0, 698.0, 1248.0, 2268.0, 4146.0, 7844.0, 15136.0, 28895.0, 55253.0, 102177.0, 167691.0, 213372.0, 186004.0, 121175.0, 67031.0, 35747.0, 18298.0, 9503.0, 4932.0, 2644.0, 1508.0, 850.0, 481.0, 260.0, 142.0, 105.0, 67.0, 42.0, 18.0, 13.0, 9.0, 9.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8828125, -1.8251495361328125, -1.767486572265625, -1.7098236083984375, -1.65216064453125, -1.5944976806640625, -1.536834716796875, -1.4791717529296875, -1.4215087890625, -1.3638458251953125, -1.306182861328125, -1.2485198974609375, -1.19085693359375, -1.1331939697265625, -1.075531005859375, -1.0178680419921875, -0.960205078125, -0.9025421142578125, -0.844879150390625, -0.7872161865234375, -0.72955322265625, -0.6718902587890625, -0.614227294921875, -0.5565643310546875, -0.4989013671875, -0.4412384033203125, -0.383575439453125, -0.3259124755859375, -0.26824951171875, -0.2105865478515625, -0.152923583984375, -0.0952606201171875, -0.03759765625, 0.0200653076171875, 0.077728271484375, 0.1353912353515625, 0.19305419921875, 0.2507171630859375, 0.308380126953125, 0.3660430908203125, 0.4237060546875, 0.4813690185546875, 0.539031982421875, 0.5966949462890625, 0.65435791015625, 0.7120208740234375, 0.769683837890625, 0.8273468017578125, 0.885009765625, 0.9426727294921875, 1.000335693359375, 1.0579986572265625, 1.11566162109375, 1.1733245849609375, 1.230987548828125, 1.2886505126953125, 1.3463134765625, 1.4039764404296875, 1.461639404296875, 1.5193023681640625, 1.57696533203125, 1.6346282958984375, 1.692291259765625, 1.7499542236328125, 1.8076171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 12.0, 19.0, 14.0, 12.0, 10.0, 26.0, 28.0, 28.0, 30.0, 32.0, 43.0, 39.0, 41.0, 46.0, 48.0, 57.0, 42.0, 55.0, 47.0, 42.0, 38.0, 40.0, 42.0, 23.0, 30.0, 26.0, 30.0, 20.0, 17.0, 15.0, 5.0, 7.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4327201843261719, -0.41793060302734375, -0.4031410217285156, -0.3883514404296875, -0.3735618591308594, -0.35877227783203125, -0.3439826965332031, -0.329193115234375, -0.3144035339355469, -0.29961395263671875, -0.2848243713378906, -0.2700347900390625, -0.2552452087402344, -0.24045562744140625, -0.22566604614257812, -0.21087646484375, -0.19608688354492188, -0.18129730224609375, -0.16650772094726562, -0.1517181396484375, -0.13692855834960938, -0.12213897705078125, -0.10734939575195312, -0.092559814453125, -0.07777023315429688, -0.06298065185546875, -0.048191070556640625, -0.0334014892578125, -0.018611907958984375, -0.00382232666015625, 0.010967254638671875, 0.0257568359375, 0.040546417236328125, 0.05533599853515625, 0.07012557983398438, 0.0849151611328125, 0.09970474243164062, 0.11449432373046875, 0.12928390502929688, 0.144073486328125, 0.15886306762695312, 0.17365264892578125, 0.18844223022460938, 0.2032318115234375, 0.21802139282226562, 0.23281097412109375, 0.24760055541992188, 0.26239013671875, 0.2771797180175781, 0.29196929931640625, 0.3067588806152344, 0.3215484619140625, 0.3363380432128906, 0.35112762451171875, 0.3659172058105469, 0.380706787109375, 0.3954963684082031, 0.41028594970703125, 0.4250755310058594, 0.4398651123046875, 0.4546546936035156, 0.46944427490234375, 0.4842338562011719, 0.4990234375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 9.0, 8.0, 12.0, 11.0, 13.0, 22.0, 28.0, 20.0, 34.0, 32.0, 39.0, 55.0, 64.0, 59.0, 71.0, 72.0, 59.0, 55.0, 61.0, 44.0, 44.0, 40.0, 30.0, 19.0, 14.0, 16.0, 17.0, 3.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.729515075683594, -6.509955883026123, -6.2903971672058105, -6.07083797454834, -5.851278781890869, -5.631719589233398, -5.412160873413086, -5.192601680755615, -4.9730424880981445, -4.753483295440674, -4.533924579620361, -4.314365386962891, -4.09480619430542, -3.8752472400665283, -3.6556882858276367, -3.436129093170166, -3.2165703773498535, -2.997011423110962, -2.777452230453491, -2.5578932762145996, -2.338334083557129, -2.1187751293182373, -1.8992161750793457, -1.6796571016311646, -1.4600980281829834, -1.2405389547348022, -1.020979881286621, -0.8014209270477295, -0.5818618535995483, -0.3623027801513672, -0.14274382591247559, 0.07681524753570557, 0.2963738441467285, 0.5159329175949097, 0.735491931438446, 0.9550509452819824, 1.1746100187301636, 1.3941690921783447, 1.6137280464172363, 1.8332871198654175, 2.0528461933135986, 2.2724051475524902, 2.491964340209961, 2.7115232944488525, 2.931082248687744, 3.150641441345215, 3.3702003955841064, 3.589759349822998, 3.8093185424804688, 4.0288777351379395, 4.248436450958252, 4.467995643615723, 4.687554836273193, 4.907114028930664, 5.126672744750977, 5.346231937408447, 5.565791130065918, 5.785350322723389, 6.004909038543701, 6.224468231201172, 6.444027423858643, 6.663586616516113, 6.883145332336426, 7.1027045249938965, 7.322263240814209]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 4.0, 7.0, 7.0, 5.0, 16.0, 12.0, 11.0, 17.0, 9.0, 23.0, 17.0, 24.0, 30.0, 29.0, 24.0, 32.0, 34.0, 24.0, 34.0, 40.0, 38.0, 34.0, 48.0, 29.0, 43.0, 27.0, 29.0, 40.0, 32.0, 38.0, 33.0, 19.0, 30.0, 21.0, 19.0, 21.0, 9.0, 15.0, 11.0, 13.0, 11.0, 11.0, 8.0, 4.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4440343379974365, -3.3310611248016357, -3.218087911605835, -3.105114459991455, -2.9921412467956543, -2.8791680335998535, -2.7661948204040527, -2.653221607208252, -2.540248394012451, -2.4272751808166504, -2.3143019676208496, -2.201328754425049, -2.088355302810669, -1.9753820896148682, -1.8624088764190674, -1.7494356632232666, -1.6364622116088867, -1.523488998413086, -1.4105156660079956, -1.2975424528121948, -1.1845691204071045, -1.0715959072113037, -0.9586226940155029, -0.8456494212150574, -0.7326761484146118, -0.6197028756141663, -0.5067296028137207, -0.3937563896179199, -0.28078311681747437, -0.1678098440170288, -0.05483663082122803, 0.05813664197921753, 0.1711101531982422, 0.28408342599868774, 0.3970566689968109, 0.5100299119949341, 0.6230031847953796, 0.7359764575958252, 0.848949670791626, 0.9619229435920715, 1.074896216392517, 1.1878694295883179, 1.3008427619934082, 1.413815975189209, 1.5267891883850098, 1.6397625207901, 1.7527357339859009, 1.8657090663909912, 1.978682279586792, 2.0916554927825928, 2.2046287059783936, 2.3176021575927734, 2.430575370788574, 2.543548583984375, 2.656521797180176, 2.7694950103759766, 2.8824682235717773, 2.995441436767578, 3.108414649963379, 3.2213878631591797, 3.3343613147735596, 3.4473345279693604, 3.560307741165161, 3.673280954360962, 3.786254405975342]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 12.0, 13.0, 11.0, 26.0, 27.0, 56.0, 60.0, 105.0, 153.0, 225.0, 371.0, 577.0, 899.0, 1388.0, 2164.0, 3361.0, 5372.0, 8214.0, 12873.0, 19885.0, 29992.0, 44816.0, 65159.0, 89238.0, 114590.0, 131124.0, 130046.0, 112706.0, 87003.0, 62815.0, 42979.0, 29180.0, 18715.0, 12200.0, 7953.0, 5178.0, 3236.0, 2119.0, 1311.0, 836.0, 519.0, 343.0, 238.0, 155.0, 100.0, 67.0, 40.0, 37.0, 26.0, 21.0, 4.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0], "bins": [-3.3515625, -3.249847412109375, -3.14813232421875, -3.046417236328125, -2.9447021484375, -2.842987060546875, -2.74127197265625, -2.639556884765625, -2.537841796875, -2.436126708984375, -2.33441162109375, -2.232696533203125, -2.1309814453125, -2.029266357421875, -1.92755126953125, -1.825836181640625, -1.72412109375, -1.622406005859375, -1.52069091796875, -1.418975830078125, -1.3172607421875, -1.215545654296875, -1.11383056640625, -1.012115478515625, -0.910400390625, -0.808685302734375, -0.70697021484375, -0.605255126953125, -0.5035400390625, -0.401824951171875, -0.30010986328125, -0.198394775390625, -0.0966796875, 0.005035400390625, 0.10675048828125, 0.208465576171875, 0.3101806640625, 0.411895751953125, 0.51361083984375, 0.615325927734375, 0.717041015625, 0.818756103515625, 0.92047119140625, 1.022186279296875, 1.1239013671875, 1.225616455078125, 1.32733154296875, 1.429046630859375, 1.53076171875, 1.632476806640625, 1.73419189453125, 1.835906982421875, 1.9376220703125, 2.039337158203125, 2.14105224609375, 2.242767333984375, 2.344482421875, 2.446197509765625, 2.54791259765625, 2.649627685546875, 2.7513427734375, 2.853057861328125, 2.95477294921875, 3.056488037109375, 3.158203125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 10.0, 13.0, 10.0, 19.0, 14.0, 16.0, 25.0, 22.0, 32.0, 30.0, 33.0, 35.0, 48.0, 39.0, 38.0, 48.0, 38.0, 58.0, 48.0, 37.0, 42.0, 41.0, 42.0, 34.0, 38.0, 35.0, 21.0, 16.0, 29.0, 12.0, 13.0, 16.0, 13.0, 11.0, 3.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.53057861328125, -4.3853759765625, -4.24017333984375, -4.094970703125, -3.94976806640625, -3.8045654296875, -3.65936279296875, -3.51416015625, -3.36895751953125, -3.2237548828125, -3.07855224609375, -2.933349609375, -2.78814697265625, -2.6429443359375, -2.49774169921875, -2.3525390625, -2.20733642578125, -2.0621337890625, -1.91693115234375, -1.771728515625, -1.62652587890625, -1.4813232421875, -1.33612060546875, -1.19091796875, -1.04571533203125, -0.9005126953125, -0.75531005859375, -0.610107421875, -0.46490478515625, -0.3197021484375, -0.17449951171875, -0.029296875, 0.11590576171875, 0.2611083984375, 0.40631103515625, 0.551513671875, 0.69671630859375, 0.8419189453125, 0.98712158203125, 1.13232421875, 1.27752685546875, 1.4227294921875, 1.56793212890625, 1.713134765625, 1.85833740234375, 2.0035400390625, 2.14874267578125, 2.2939453125, 2.43914794921875, 2.5843505859375, 2.72955322265625, 2.874755859375, 3.01995849609375, 3.1651611328125, 3.31036376953125, 3.45556640625, 3.60076904296875, 3.7459716796875, 3.89117431640625, 4.036376953125, 4.18157958984375, 4.3267822265625, 4.47198486328125, 4.6171875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 10.0, 11.0, 11.0, 30.0, 52.0, 75.0, 125.0, 175.0, 303.0, 450.0, 797.0, 1284.0, 2201.0, 3728.0, 6344.0, 10927.0, 18444.0, 31120.0, 50887.0, 80251.0, 117382.0, 150397.0, 160290.0, 139068.0, 102209.0, 67888.0, 42342.0, 25199.0, 15186.0, 8742.0, 5049.0, 3032.0, 1801.0, 1082.0, 646.0, 380.0, 255.0, 122.0, 106.0, 47.0, 39.0, 22.0, 14.0, 9.0, 12.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.47265625, -3.358062744140625, -3.24346923828125, -3.128875732421875, -3.0142822265625, -2.899688720703125, -2.78509521484375, -2.670501708984375, -2.555908203125, -2.441314697265625, -2.32672119140625, -2.212127685546875, -2.0975341796875, -1.982940673828125, -1.86834716796875, -1.753753662109375, -1.63916015625, -1.524566650390625, -1.40997314453125, -1.295379638671875, -1.1807861328125, -1.066192626953125, -0.95159912109375, -0.837005615234375, -0.722412109375, -0.607818603515625, -0.49322509765625, -0.378631591796875, -0.2640380859375, -0.149444580078125, -0.03485107421875, 0.079742431640625, 0.1943359375, 0.308929443359375, 0.42352294921875, 0.538116455078125, 0.6527099609375, 0.767303466796875, 0.88189697265625, 0.996490478515625, 1.111083984375, 1.225677490234375, 1.34027099609375, 1.454864501953125, 1.5694580078125, 1.684051513671875, 1.79864501953125, 1.913238525390625, 2.02783203125, 2.142425537109375, 2.25701904296875, 2.371612548828125, 2.4862060546875, 2.600799560546875, 2.71539306640625, 2.829986572265625, 2.944580078125, 3.059173583984375, 3.17376708984375, 3.288360595703125, 3.4029541015625, 3.517547607421875, 3.63214111328125, 3.746734619140625, 3.861328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 10.0, 14.0, 6.0, 17.0, 14.0, 10.0, 14.0, 18.0, 15.0, 16.0, 30.0, 35.0, 22.0, 36.0, 37.0, 38.0, 36.0, 39.0, 48.0, 29.0, 43.0, 42.0, 33.0, 48.0, 39.0, 42.0, 43.0, 32.0, 28.0, 23.0, 27.0, 15.0, 17.0, 14.0, 9.0, 11.0, 9.0, 6.0, 4.0, 7.0, 0.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0], "bins": [-2.705078125, -2.62603759765625, -2.5469970703125, -2.46795654296875, -2.388916015625, -2.30987548828125, -2.2308349609375, -2.15179443359375, -2.07275390625, -1.99371337890625, -1.9146728515625, -1.83563232421875, -1.756591796875, -1.67755126953125, -1.5985107421875, -1.51947021484375, -1.4404296875, -1.36138916015625, -1.2823486328125, -1.20330810546875, -1.124267578125, -1.04522705078125, -0.9661865234375, -0.88714599609375, -0.80810546875, -0.72906494140625, -0.6500244140625, -0.57098388671875, -0.491943359375, -0.41290283203125, -0.3338623046875, -0.25482177734375, -0.17578125, -0.09674072265625, -0.0177001953125, 0.06134033203125, 0.140380859375, 0.21942138671875, 0.2984619140625, 0.37750244140625, 0.45654296875, 0.53558349609375, 0.6146240234375, 0.69366455078125, 0.772705078125, 0.85174560546875, 0.9307861328125, 1.00982666015625, 1.0888671875, 1.16790771484375, 1.2469482421875, 1.32598876953125, 1.405029296875, 1.48406982421875, 1.5631103515625, 1.64215087890625, 1.72119140625, 1.80023193359375, 1.8792724609375, 1.95831298828125, 2.037353515625, 2.11639404296875, 2.1954345703125, 2.27447509765625, 2.353515625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 7.0, 8.0, 15.0, 18.0, 27.0, 48.0, 59.0, 77.0, 132.0, 163.0, 282.0, 398.0, 650.0, 937.0, 1494.0, 2463.0, 3846.0, 6478.0, 10698.0, 18872.0, 33004.0, 58539.0, 101316.0, 156439.0, 192381.0, 173292.0, 119685.0, 71013.0, 40150.0, 22858.0, 13097.0, 7589.0, 4695.0, 2768.0, 1799.0, 1095.0, 687.0, 499.0, 330.0, 215.0, 144.0, 96.0, 69.0, 41.0, 30.0, 24.0, 13.0, 9.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.458984375, -2.385955810546875, -2.31292724609375, -2.239898681640625, -2.1668701171875, -2.093841552734375, -2.02081298828125, -1.947784423828125, -1.874755859375, -1.801727294921875, -1.72869873046875, -1.655670166015625, -1.5826416015625, -1.509613037109375, -1.43658447265625, -1.363555908203125, -1.29052734375, -1.217498779296875, -1.14447021484375, -1.071441650390625, -0.9984130859375, -0.925384521484375, -0.85235595703125, -0.779327392578125, -0.706298828125, -0.633270263671875, -0.56024169921875, -0.487213134765625, -0.4141845703125, -0.341156005859375, -0.26812744140625, -0.195098876953125, -0.1220703125, -0.049041748046875, 0.02398681640625, 0.097015380859375, 0.1700439453125, 0.243072509765625, 0.31610107421875, 0.389129638671875, 0.462158203125, 0.535186767578125, 0.60821533203125, 0.681243896484375, 0.7542724609375, 0.827301025390625, 0.90032958984375, 0.973358154296875, 1.04638671875, 1.119415283203125, 1.19244384765625, 1.265472412109375, 1.3385009765625, 1.411529541015625, 1.48455810546875, 1.557586669921875, 1.630615234375, 1.703643798828125, 1.77667236328125, 1.849700927734375, 1.9227294921875, 1.995758056640625, 2.06878662109375, 2.141815185546875, 2.21484375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 5.0, 8.0, 8.0, 6.0, 14.0, 10.0, 12.0, 28.0, 27.0, 23.0, 31.0, 27.0, 40.0, 44.0, 55.0, 57.0, 50.0, 61.0, 61.0, 48.0, 49.0, 46.0, 39.0, 32.0, 31.0, 35.0, 17.0, 25.0, 19.0, 16.0, 12.0, 9.0, 9.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018680095672607422, -0.0001807641237974167, -0.00017472729086875916, -0.00016869045794010162, -0.0001626536250114441, -0.00015661679208278656, -0.00015057995915412903, -0.0001445431262254715, -0.00013850629329681396, -0.00013246946036815643, -0.0001264326274394989, -0.00012039579451084137, -0.00011435896158218384, -0.0001083221286535263, -0.00010228529572486877, -9.624846279621124e-05, -9.021162986755371e-05, -8.417479693889618e-05, -7.813796401023865e-05, -7.210113108158112e-05, -6.606429815292358e-05, -6.002746522426605e-05, -5.399063229560852e-05, -4.795379936695099e-05, -4.191696643829346e-05, -3.5880133509635925e-05, -2.9843300580978394e-05, -2.3806467652320862e-05, -1.776963472366333e-05, -1.1732801795005798e-05, -5.695968866348267e-06, 3.4086406230926514e-07, 6.377696990966797e-06, 1.2414529919624329e-05, 1.845136284828186e-05, 2.4488195776939392e-05, 3.0525028705596924e-05, 3.6561861634254456e-05, 4.259869456291199e-05, 4.863552749156952e-05, 5.467236042022705e-05, 6.070919334888458e-05, 6.674602627754211e-05, 7.278285920619965e-05, 7.881969213485718e-05, 8.485652506351471e-05, 9.089335799217224e-05, 9.693019092082977e-05, 0.0001029670238494873, 0.00010900385677814484, 0.00011504068970680237, 0.0001210775226354599, 0.00012711435556411743, 0.00013315118849277496, 0.0001391880214214325, 0.00014522485435009003, 0.00015126168727874756, 0.0001572985202074051, 0.00016333535313606262, 0.00016937218606472015, 0.00017540901899337769, 0.00018144585192203522, 0.00018748268485069275, 0.00019351951777935028, 0.0001995563507080078]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 13.0, 16.0, 8.0, 28.0, 39.0, 55.0, 77.0, 132.0, 172.0, 265.0, 402.0, 704.0, 1140.0, 2052.0, 3677.0, 6756.0, 12743.0, 24554.0, 49130.0, 94680.0, 163197.0, 216364.0, 198193.0, 128896.0, 70131.0, 35612.0, 18247.0, 9427.0, 5082.0, 2785.0, 1541.0, 914.0, 544.0, 307.0, 208.0, 149.0, 81.0, 58.0, 34.0, 26.0, 14.0, 12.0, 15.0, 12.0, 10.0, 9.0, 8.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.6484375, -2.5650634765625, -2.481689453125, -2.3983154296875, -2.31494140625, -2.2315673828125, -2.148193359375, -2.0648193359375, -1.9814453125, -1.8980712890625, -1.814697265625, -1.7313232421875, -1.64794921875, -1.5645751953125, -1.481201171875, -1.3978271484375, -1.314453125, -1.2310791015625, -1.147705078125, -1.0643310546875, -0.98095703125, -0.8975830078125, -0.814208984375, -0.7308349609375, -0.6474609375, -0.5640869140625, -0.480712890625, -0.3973388671875, -0.31396484375, -0.2305908203125, -0.147216796875, -0.0638427734375, 0.01953125, 0.1029052734375, 0.186279296875, 0.2696533203125, 0.35302734375, 0.4364013671875, 0.519775390625, 0.6031494140625, 0.6865234375, 0.7698974609375, 0.853271484375, 0.9366455078125, 1.02001953125, 1.1033935546875, 1.186767578125, 1.2701416015625, 1.353515625, 1.4368896484375, 1.520263671875, 1.6036376953125, 1.68701171875, 1.7703857421875, 1.853759765625, 1.9371337890625, 2.0205078125, 2.1038818359375, 2.187255859375, 2.2706298828125, 2.35400390625, 2.4373779296875, 2.520751953125, 2.6041259765625, 2.6875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 8.0, 12.0, 16.0, 20.0, 28.0, 30.0, 42.0, 47.0, 44.0, 42.0, 51.0, 56.0, 60.0, 64.0, 60.0, 63.0, 44.0, 48.0, 40.0, 43.0, 37.0, 28.0, 26.0, 16.0, 19.0, 8.0, 5.0, 6.0, 10.0, 9.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8317031860351562, -0.8045196533203125, -0.7773361206054688, -0.750152587890625, -0.7229690551757812, -0.6957855224609375, -0.6686019897460938, -0.64141845703125, -0.6142349243164062, -0.5870513916015625, -0.5598678588867188, -0.532684326171875, -0.5055007934570312, -0.4783172607421875, -0.45113372802734375, -0.4239501953125, -0.39676666259765625, -0.3695831298828125, -0.34239959716796875, -0.315216064453125, -0.28803253173828125, -0.2608489990234375, -0.23366546630859375, -0.20648193359375, -0.17929840087890625, -0.1521148681640625, -0.12493133544921875, -0.097747802734375, -0.07056427001953125, -0.0433807373046875, -0.01619720458984375, 0.010986328125, 0.03816986083984375, 0.0653533935546875, 0.09253692626953125, 0.119720458984375, 0.14690399169921875, 0.1740875244140625, 0.20127105712890625, 0.22845458984375, 0.25563812255859375, 0.2828216552734375, 0.31000518798828125, 0.337188720703125, 0.36437225341796875, 0.3915557861328125, 0.41873931884765625, 0.4459228515625, 0.47310638427734375, 0.5002899169921875, 0.5274734497070312, 0.554656982421875, 0.5818405151367188, 0.6090240478515625, 0.6362075805664062, 0.66339111328125, 0.6905746459960938, 0.7177581787109375, 0.7449417114257812, 0.772125244140625, 0.7993087768554688, 0.8264923095703125, 0.8536758422851562, 0.880859375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 1.0, 10.0, 6.0, 4.0, 5.0, 8.0, 13.0, 12.0, 22.0, 15.0, 19.0, 29.0, 31.0, 49.0, 42.0, 58.0, 54.0, 57.0, 55.0, 66.0, 54.0, 61.0, 56.0, 49.0, 40.0, 42.0, 31.0, 16.0, 26.0, 11.0, 8.0, 11.0, 11.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.5597333908081055, -6.353708267211914, -6.1476826667785645, -5.941657543182373, -5.735631942749023, -5.529606819152832, -5.323581695556641, -5.117556571960449, -4.9115309715271, -4.705505847930908, -4.499480247497559, -4.293455123901367, -4.087430000305176, -3.881404399871826, -3.6753792762756348, -3.4693539142608643, -3.2633285522460938, -3.0573031902313232, -2.8512778282165527, -2.6452527046203613, -2.439227342605591, -2.2332019805908203, -2.027176856994629, -1.8211514949798584, -1.615126132965088, -1.4091007709503174, -1.2030755281448364, -0.9970502257347107, -0.791024923324585, -0.5849995613098145, -0.3789743185043335, -0.17294907569885254, 0.03307628631591797, 0.2391015887260437, 0.44512689113616943, 0.6511521935462952, 0.8571774959564209, 1.0632028579711914, 1.2692281007766724, 1.4752533435821533, 1.6812787055969238, 1.8873040676116943, 2.093329429626465, 2.2993545532226562, 2.5053799152374268, 2.7114052772521973, 2.9174304008483887, 3.123455762863159, 3.3294811248779297, 3.5355064868927, 3.7415318489074707, 3.947556972503662, 4.153582572937012, 4.359607696533203, 4.5656328201293945, 4.771657943725586, 4.9776835441589355, 5.183708667755127, 5.389734268188477, 5.595759391784668, 5.801784515380859, 6.007810115814209, 6.2138352394104, 6.41986083984375, 6.625885963439941]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 7.0, 4.0, 13.0, 16.0, 11.0, 7.0, 23.0, 11.0, 11.0, 22.0, 20.0, 27.0, 24.0, 30.0, 38.0, 27.0, 45.0, 47.0, 44.0, 41.0, 45.0, 44.0, 35.0, 47.0, 32.0, 35.0, 25.0, 19.0, 32.0, 33.0, 27.0, 30.0, 24.0, 10.0, 17.0, 8.0, 23.0, 14.0, 5.0, 5.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7564151287078857, -3.6334409713745117, -3.5104668140411377, -3.3874926567077637, -3.2645184993743896, -3.1415443420410156, -3.0185699462890625, -2.8955960273742676, -2.7726216316223145, -2.6496474742889404, -2.5266733169555664, -2.4036991596221924, -2.2807250022888184, -2.1577508449554443, -2.0347766876220703, -1.9118024110794067, -1.7888283729553223, -1.6658542156219482, -1.5428800582885742, -1.4199059009552002, -1.2969317436218262, -1.1739575862884521, -1.0509833097457886, -0.9280091524124146, -0.8050349950790405, -0.6820608377456665, -0.5590866804122925, -0.4361124634742737, -0.31313830614089966, -0.19016414880752563, -0.06718993186950684, 0.05578422546386719, 0.1787581443786621, 0.30173230171203613, 0.42470648884773254, 0.547680675983429, 0.670654833316803, 0.793628990650177, 0.9166032075881958, 1.0395773649215698, 1.1625515222549438, 1.2855256795883179, 1.408499836921692, 1.5314741134643555, 1.6544482707977295, 1.7774224281311035, 1.9003965854644775, 2.0233707427978516, 2.1463449001312256, 2.2693190574645996, 2.3922932147979736, 2.5152673721313477, 2.6382415294647217, 2.7612156867980957, 2.884190082550049, 3.0071640014648438, 3.130138397216797, 3.253112554550171, 3.376086711883545, 3.499060869216919, 3.622035026550293, 3.745009183883667, 3.867983341217041, 3.990957736968994, 4.113931655883789]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 10.0, 19.0, 22.0, 30.0, 51.0, 62.0, 83.0, 128.0, 184.0, 233.0, 326.0, 441.0, 710.0, 1045.0, 1594.0, 2482.0, 3885.0, 6365.0, 10566.0, 18126.0, 33211.0, 64498.0, 135525.0, 309109.0, 717012.0, 1165761.0, 925460.0, 431697.0, 182455.0, 84255.0, 42637.0, 22699.0, 13077.0, 7660.0, 4612.0, 2842.0, 1826.0, 1171.0, 764.0, 489.0, 360.0, 227.0, 179.0, 115.0, 95.0, 56.0, 40.0, 28.0, 18.0, 10.0, 8.0, 5.0, 10.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.90625, -5.7255859375, -5.544921875, -5.3642578125, -5.18359375, -5.0029296875, -4.822265625, -4.6416015625, -4.4609375, -4.2802734375, -4.099609375, -3.9189453125, -3.73828125, -3.5576171875, -3.376953125, -3.1962890625, -3.015625, -2.8349609375, -2.654296875, -2.4736328125, -2.29296875, -2.1123046875, -1.931640625, -1.7509765625, -1.5703125, -1.3896484375, -1.208984375, -1.0283203125, -0.84765625, -0.6669921875, -0.486328125, -0.3056640625, -0.125, 0.0556640625, 0.236328125, 0.4169921875, 0.59765625, 0.7783203125, 0.958984375, 1.1396484375, 1.3203125, 1.5009765625, 1.681640625, 1.8623046875, 2.04296875, 2.2236328125, 2.404296875, 2.5849609375, 2.765625, 2.9462890625, 3.126953125, 3.3076171875, 3.48828125, 3.6689453125, 3.849609375, 4.0302734375, 4.2109375, 4.3916015625, 4.572265625, 4.7529296875, 4.93359375, 5.1142578125, 5.294921875, 5.4755859375, 5.65625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 12.0, 6.0, 8.0, 8.0, 14.0, 10.0, 21.0, 14.0, 19.0, 20.0, 24.0, 28.0, 38.0, 16.0, 39.0, 37.0, 41.0, 41.0, 33.0, 50.0, 42.0, 42.0, 27.0, 34.0, 43.0, 38.0, 26.0, 23.0, 37.0, 32.0, 23.0, 23.0, 21.0, 19.0, 16.0, 16.0, 7.0, 11.0, 10.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.439788818359375, -2.35418701171875, -2.268585205078125, -2.1829833984375, -2.097381591796875, -2.01177978515625, -1.926177978515625, -1.840576171875, -1.754974365234375, -1.66937255859375, -1.583770751953125, -1.4981689453125, -1.412567138671875, -1.32696533203125, -1.241363525390625, -1.15576171875, -1.070159912109375, -0.98455810546875, -0.898956298828125, -0.8133544921875, -0.727752685546875, -0.64215087890625, -0.556549072265625, -0.470947265625, -0.385345458984375, -0.29974365234375, -0.214141845703125, -0.1285400390625, -0.042938232421875, 0.04266357421875, 0.128265380859375, 0.2138671875, 0.299468994140625, 0.38507080078125, 0.470672607421875, 0.5562744140625, 0.641876220703125, 0.72747802734375, 0.813079833984375, 0.898681640625, 0.984283447265625, 1.06988525390625, 1.155487060546875, 1.2410888671875, 1.326690673828125, 1.41229248046875, 1.497894287109375, 1.58349609375, 1.669097900390625, 1.75469970703125, 1.840301513671875, 1.9259033203125, 2.011505126953125, 2.09710693359375, 2.182708740234375, 2.268310546875, 2.353912353515625, 2.43951416015625, 2.525115966796875, 2.6107177734375, 2.696319580078125, 2.78192138671875, 2.867523193359375, 2.953125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 12.0, 14.0, 26.0, 32.0, 40.0, 59.0, 91.0, 129.0, 202.0, 332.0, 505.0, 710.0, 1075.0, 1772.0, 2659.0, 4461.0, 7353.0, 12579.0, 22691.0, 41700.0, 81873.0, 170895.0, 379486.0, 830819.0, 1207709.0, 762219.0, 343970.0, 156100.0, 74901.0, 38545.0, 20995.0, 11819.0, 6976.0, 4150.0, 2615.0, 1661.0, 1056.0, 711.0, 449.0, 317.0, 191.0, 129.0, 85.0, 54.0, 34.0, 34.0, 13.0, 11.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.6328125, -6.4283447265625, -6.223876953125, -6.0194091796875, -5.81494140625, -5.6104736328125, -5.406005859375, -5.2015380859375, -4.9970703125, -4.7926025390625, -4.588134765625, -4.3836669921875, -4.17919921875, -3.9747314453125, -3.770263671875, -3.5657958984375, -3.361328125, -3.1568603515625, -2.952392578125, -2.7479248046875, -2.54345703125, -2.3389892578125, -2.134521484375, -1.9300537109375, -1.7255859375, -1.5211181640625, -1.316650390625, -1.1121826171875, -0.90771484375, -0.7032470703125, -0.498779296875, -0.2943115234375, -0.08984375, 0.1146240234375, 0.319091796875, 0.5235595703125, 0.72802734375, 0.9324951171875, 1.136962890625, 1.3414306640625, 1.5458984375, 1.7503662109375, 1.954833984375, 2.1593017578125, 2.36376953125, 2.5682373046875, 2.772705078125, 2.9771728515625, 3.181640625, 3.3861083984375, 3.590576171875, 3.7950439453125, 3.99951171875, 4.2039794921875, 4.408447265625, 4.6129150390625, 4.8173828125, 5.0218505859375, 5.226318359375, 5.4307861328125, 5.63525390625, 5.8397216796875, 6.044189453125, 6.2486572265625, 6.453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 10.0, 9.0, 9.0, 5.0, 19.0, 19.0, 35.0, 43.0, 45.0, 74.0, 95.0, 133.0, 159.0, 194.0, 283.0, 323.0, 393.0, 376.0, 374.0, 302.0, 267.0, 209.0, 166.0, 113.0, 88.0, 81.0, 55.0, 62.0, 23.0, 29.0, 17.0, 16.0, 11.0, 11.0, 7.0, 5.0, 5.0, 10.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.16363525390625, -2.0928955078125, -2.02215576171875, -1.951416015625, -1.88067626953125, -1.8099365234375, -1.73919677734375, -1.66845703125, -1.59771728515625, -1.5269775390625, -1.45623779296875, -1.385498046875, -1.31475830078125, -1.2440185546875, -1.17327880859375, -1.1025390625, -1.03179931640625, -0.9610595703125, -0.89031982421875, -0.819580078125, -0.74884033203125, -0.6781005859375, -0.60736083984375, -0.53662109375, -0.46588134765625, -0.3951416015625, -0.32440185546875, -0.253662109375, -0.18292236328125, -0.1121826171875, -0.04144287109375, 0.029296875, 0.10003662109375, 0.1707763671875, 0.24151611328125, 0.312255859375, 0.38299560546875, 0.4537353515625, 0.52447509765625, 0.59521484375, 0.66595458984375, 0.7366943359375, 0.80743408203125, 0.878173828125, 0.94891357421875, 1.0196533203125, 1.09039306640625, 1.1611328125, 1.23187255859375, 1.3026123046875, 1.37335205078125, 1.444091796875, 1.51483154296875, 1.5855712890625, 1.65631103515625, 1.72705078125, 1.79779052734375, 1.8685302734375, 1.93927001953125, 2.010009765625, 2.08074951171875, 2.1514892578125, 2.22222900390625, 2.29296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 10.0, 13.0, 15.0, 11.0, 25.0, 26.0, 27.0, 34.0, 32.0, 63.0, 54.0, 72.0, 75.0, 87.0, 72.0, 67.0, 58.0, 57.0, 37.0, 39.0, 23.0, 24.0, 20.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.557711601257324, -9.31735897064209, -9.077007293701172, -8.836654663085938, -8.59630298614502, -8.355950355529785, -8.115598678588867, -7.875246047973633, -7.634894371032715, -7.394542217254639, -7.1541900634765625, -6.913837909698486, -6.67348575592041, -6.433133602142334, -6.192781448364258, -5.952428817749023, -5.712076663970947, -5.471724510192871, -5.231372356414795, -4.991020202636719, -4.750668048858643, -4.510315895080566, -4.269963264465332, -4.029611587524414, -3.789259195327759, -3.5489070415496826, -3.3085548877716064, -3.068202495574951, -2.827850341796875, -2.587498188018799, -2.3471460342407227, -2.1067938804626465, -1.8664422035217285, -1.6260900497436523, -1.3857378959655762, -1.1453856229782104, -0.9050334692001343, -0.6646813154220581, -0.4243290424346924, -0.1839768886566162, 0.05637526512145996, 0.2967274487018585, 0.5370796322822571, 0.777431845664978, 1.0177839994430542, 1.2581361532211304, 1.498488426208496, 1.7388405799865723, 1.9791927337646484, 2.2195448875427246, 2.459897041320801, 2.700249195098877, 2.940601348876953, 3.1809535026550293, 3.4213058948516846, 3.6616580486297607, 3.902010202407837, 4.142362594604492, 4.382714748382568, 4.6230669021606445, 4.863419055938721, 5.103771209716797, 5.344123363494873, 5.584475517272949, 5.824827671051025]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 3.0, 5.0, 9.0, 17.0, 8.0, 8.0, 13.0, 13.0, 15.0, 17.0, 19.0, 20.0, 17.0, 23.0, 32.0, 25.0, 26.0, 35.0, 26.0, 33.0, 33.0, 34.0, 28.0, 36.0, 31.0, 40.0, 42.0, 38.0, 31.0, 29.0, 47.0, 31.0, 20.0, 17.0, 15.0, 26.0, 20.0, 16.0, 23.0, 16.0, 9.0, 10.0, 6.0, 2.0, 13.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0], "bins": [-3.6355714797973633, -3.5323939323425293, -3.4292166233062744, -3.3260390758514404, -3.2228617668151855, -3.1196842193603516, -3.0165066719055176, -2.9133291244506836, -2.8101518154144287, -2.7069742679595947, -2.60379695892334, -2.500619411468506, -2.397441864013672, -2.294264554977417, -2.191087007522583, -2.087909698486328, -1.9847321510314941, -1.8815547227859497, -1.7783772945404053, -1.6751997470855713, -1.5720223188400269, -1.4688448905944824, -1.3656673431396484, -1.262489914894104, -1.1593124866485596, -1.0561350584030151, -0.9529575705528259, -0.8497800827026367, -0.7466026544570923, -0.6434252262115479, -0.5402477383613586, -0.43707025051116943, -0.3338925838470459, -0.23071512579917908, -0.12753766775131226, -0.024360209703445435, 0.07881724834442139, 0.18199467658996582, 0.28517216444015503, 0.38834965229034424, 0.49152708053588867, 0.5947045087814331, 0.6978819966316223, 0.8010594844818115, 0.904236912727356, 1.0074143409729004, 1.1105918884277344, 1.2137693166732788, 1.3169467449188232, 1.4201241731643677, 1.523301601409912, 1.626479148864746, 1.7296565771102905, 1.832834005355835, 1.936011552810669, 2.039188861846924, 2.142366409301758, 2.245543956756592, 2.3487212657928467, 2.4518988132476807, 2.5550761222839355, 2.6582536697387695, 2.7614312171936035, 2.8646087646484375, 2.9677860736846924]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 14.0, 23.0, 27.0, 23.0, 57.0, 81.0, 123.0, 168.0, 289.0, 388.0, 600.0, 1008.0, 1487.0, 2410.0, 3764.0, 6143.0, 10218.0, 16859.0, 28306.0, 46978.0, 76777.0, 118182.0, 159700.0, 172021.0, 143168.0, 100203.0, 62727.0, 38207.0, 22756.0, 13832.0, 8160.0, 5065.0, 3130.0, 1994.0, 1272.0, 798.0, 514.0, 363.0, 244.0, 151.0, 107.0, 68.0, 43.0, 43.0, 17.0, 17.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.63671875, -2.552459716796875, -2.46820068359375, -2.383941650390625, -2.2996826171875, -2.215423583984375, -2.13116455078125, -2.046905517578125, -1.962646484375, -1.878387451171875, -1.79412841796875, -1.709869384765625, -1.6256103515625, -1.541351318359375, -1.45709228515625, -1.372833251953125, -1.28857421875, -1.204315185546875, -1.12005615234375, -1.035797119140625, -0.9515380859375, -0.867279052734375, -0.78302001953125, -0.698760986328125, -0.614501953125, -0.530242919921875, -0.44598388671875, -0.361724853515625, -0.2774658203125, -0.193206787109375, -0.10894775390625, -0.024688720703125, 0.0595703125, 0.143829345703125, 0.22808837890625, 0.312347412109375, 0.3966064453125, 0.480865478515625, 0.56512451171875, 0.649383544921875, 0.733642578125, 0.817901611328125, 0.90216064453125, 0.986419677734375, 1.0706787109375, 1.154937744140625, 1.23919677734375, 1.323455810546875, 1.40771484375, 1.491973876953125, 1.57623291015625, 1.660491943359375, 1.7447509765625, 1.829010009765625, 1.91326904296875, 1.997528076171875, 2.081787109375, 2.166046142578125, 2.25030517578125, 2.334564208984375, 2.4188232421875, 2.503082275390625, 2.58734130859375, 2.671600341796875, 2.755859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 8.0, 10.0, 9.0, 14.0, 13.0, 11.0, 23.0, 14.0, 22.0, 27.0, 29.0, 32.0, 28.0, 31.0, 32.0, 43.0, 31.0, 30.0, 46.0, 42.0, 37.0, 48.0, 42.0, 50.0, 36.0, 33.0, 45.0, 25.0, 20.0, 19.0, 18.0, 23.0, 16.0, 14.0, 13.0, 15.0, 8.0, 7.0, 8.0, 8.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.895751953125, -3.76806640625, -3.640380859375, -3.5126953125, -3.385009765625, -3.25732421875, -3.129638671875, -3.001953125, -2.874267578125, -2.74658203125, -2.618896484375, -2.4912109375, -2.363525390625, -2.23583984375, -2.108154296875, -1.98046875, -1.852783203125, -1.72509765625, -1.597412109375, -1.4697265625, -1.342041015625, -1.21435546875, -1.086669921875, -0.958984375, -0.831298828125, -0.70361328125, -0.575927734375, -0.4482421875, -0.320556640625, -0.19287109375, -0.065185546875, 0.0625, 0.190185546875, 0.31787109375, 0.445556640625, 0.5732421875, 0.700927734375, 0.82861328125, 0.956298828125, 1.083984375, 1.211669921875, 1.33935546875, 1.467041015625, 1.5947265625, 1.722412109375, 1.85009765625, 1.977783203125, 2.10546875, 2.233154296875, 2.36083984375, 2.488525390625, 2.6162109375, 2.743896484375, 2.87158203125, 2.999267578125, 3.126953125, 3.254638671875, 3.38232421875, 3.510009765625, 3.6376953125, 3.765380859375, 3.89306640625, 4.020751953125, 4.1484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 12.0, 27.0, 45.0, 67.0, 108.0, 183.0, 311.0, 538.0, 896.0, 1640.0, 3281.0, 6349.0, 13309.0, 28714.0, 64424.0, 142757.0, 265850.0, 263109.0, 139440.0, 63047.0, 28286.0, 12855.0, 6283.0, 3171.0, 1681.0, 909.0, 516.0, 292.0, 159.0, 85.0, 57.0, 50.0, 35.0, 21.0, 4.0, 12.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.14453125, -4.9931640625, -4.841796875, -4.6904296875, -4.5390625, -4.3876953125, -4.236328125, -4.0849609375, -3.93359375, -3.7822265625, -3.630859375, -3.4794921875, -3.328125, -3.1767578125, -3.025390625, -2.8740234375, -2.72265625, -2.5712890625, -2.419921875, -2.2685546875, -2.1171875, -1.9658203125, -1.814453125, -1.6630859375, -1.51171875, -1.3603515625, -1.208984375, -1.0576171875, -0.90625, -0.7548828125, -0.603515625, -0.4521484375, -0.30078125, -0.1494140625, 0.001953125, 0.1533203125, 0.3046875, 0.4560546875, 0.607421875, 0.7587890625, 0.91015625, 1.0615234375, 1.212890625, 1.3642578125, 1.515625, 1.6669921875, 1.818359375, 1.9697265625, 2.12109375, 2.2724609375, 2.423828125, 2.5751953125, 2.7265625, 2.8779296875, 3.029296875, 3.1806640625, 3.33203125, 3.4833984375, 3.634765625, 3.7861328125, 3.9375, 4.0888671875, 4.240234375, 4.3916015625, 4.54296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 9.0, 6.0, 15.0, 19.0, 16.0, 17.0, 23.0, 28.0, 21.0, 27.0, 31.0, 29.0, 43.0, 29.0, 42.0, 38.0, 36.0, 44.0, 36.0, 47.0, 31.0, 35.0, 53.0, 31.0, 36.0, 29.0, 27.0, 21.0, 31.0, 25.0, 17.0, 12.0, 11.0, 13.0, 17.0, 9.0, 10.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.20703125, -2.133636474609375, -2.06024169921875, -1.986846923828125, -1.9134521484375, -1.840057373046875, -1.76666259765625, -1.693267822265625, -1.619873046875, -1.546478271484375, -1.47308349609375, -1.399688720703125, -1.3262939453125, -1.252899169921875, -1.17950439453125, -1.106109619140625, -1.03271484375, -0.959320068359375, -0.88592529296875, -0.812530517578125, -0.7391357421875, -0.665740966796875, -0.59234619140625, -0.518951416015625, -0.445556640625, -0.372161865234375, -0.29876708984375, -0.225372314453125, -0.1519775390625, -0.078582763671875, -0.00518798828125, 0.068206787109375, 0.1416015625, 0.214996337890625, 0.28839111328125, 0.361785888671875, 0.4351806640625, 0.508575439453125, 0.58197021484375, 0.655364990234375, 0.728759765625, 0.802154541015625, 0.87554931640625, 0.948944091796875, 1.0223388671875, 1.095733642578125, 1.16912841796875, 1.242523193359375, 1.31591796875, 1.389312744140625, 1.46270751953125, 1.536102294921875, 1.6094970703125, 1.682891845703125, 1.75628662109375, 1.829681396484375, 1.903076171875, 1.976470947265625, 2.04986572265625, 2.123260498046875, 2.1966552734375, 2.270050048828125, 2.34344482421875, 2.416839599609375, 2.490234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 4.0, 10.0, 11.0, 21.0, 22.0, 38.0, 38.0, 53.0, 89.0, 93.0, 165.0, 188.0, 308.0, 477.0, 770.0, 1027.0, 1611.0, 2614.0, 3931.0, 6546.0, 10996.0, 19104.0, 35184.0, 67554.0, 131654.0, 232806.0, 238789.0, 137610.0, 70605.0, 36420.0, 20229.0, 11242.0, 6686.0, 4068.0, 2569.0, 1598.0, 1111.0, 714.0, 490.0, 351.0, 228.0, 157.0, 117.0, 71.0, 50.0, 37.0, 39.0, 24.0, 13.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.693359375, -1.6369781494140625, -1.580596923828125, -1.5242156982421875, -1.46783447265625, -1.4114532470703125, -1.355072021484375, -1.2986907958984375, -1.2423095703125, -1.1859283447265625, -1.129547119140625, -1.0731658935546875, -1.01678466796875, -0.9604034423828125, -0.904022216796875, -0.8476409912109375, -0.791259765625, -0.7348785400390625, -0.678497314453125, -0.6221160888671875, -0.56573486328125, -0.5093536376953125, -0.452972412109375, -0.3965911865234375, -0.3402099609375, -0.2838287353515625, -0.227447509765625, -0.1710662841796875, -0.11468505859375, -0.0583038330078125, -0.001922607421875, 0.0544586181640625, 0.11083984375, 0.1672210693359375, 0.223602294921875, 0.2799835205078125, 0.33636474609375, 0.3927459716796875, 0.449127197265625, 0.5055084228515625, 0.5618896484375, 0.6182708740234375, 0.674652099609375, 0.7310333251953125, 0.78741455078125, 0.8437957763671875, 0.900177001953125, 0.9565582275390625, 1.012939453125, 1.0693206787109375, 1.125701904296875, 1.1820831298828125, 1.23846435546875, 1.2948455810546875, 1.351226806640625, 1.4076080322265625, 1.4639892578125, 1.5203704833984375, 1.576751708984375, 1.6331329345703125, 1.68951416015625, 1.7458953857421875, 1.802276611328125, 1.8586578369140625, 1.9150390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 8.0, 10.0, 13.0, 22.0, 23.0, 30.0, 41.0, 45.0, 48.0, 45.0, 56.0, 51.0, 66.0, 75.0, 68.0, 53.0, 47.0, 58.0, 46.0, 35.0, 22.0, 21.0, 11.0, 18.0, 12.0, 9.0, 7.0, 5.0, 4.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.355213165283203e-05, -7.102359086275101e-05, -6.849505007266998e-05, -6.596650928258896e-05, -6.343796849250793e-05, -6.090942770242691e-05, -5.8380886912345886e-05, -5.585234612226486e-05, -5.332380533218384e-05, -5.0795264542102814e-05, -4.826672375202179e-05, -4.5738182961940765e-05, -4.320964217185974e-05, -4.068110138177872e-05, -3.815256059169769e-05, -3.562401980161667e-05, -3.3095479011535645e-05, -3.056693822145462e-05, -2.8038397431373596e-05, -2.5509856641292572e-05, -2.2981315851211548e-05, -2.0452775061130524e-05, -1.79242342710495e-05, -1.5395693480968475e-05, -1.2867152690887451e-05, -1.0338611900806427e-05, -7.810071110725403e-06, -5.281530320644379e-06, -2.7529895305633545e-06, -2.2444874048233032e-07, 2.304092049598694e-06, 4.832632839679718e-06, 7.361173629760742e-06, 9.889714419841766e-06, 1.241825520992279e-05, 1.4946796000003815e-05, 1.747533679008484e-05, 2.0003877580165863e-05, 2.2532418370246887e-05, 2.506095916032791e-05, 2.7589499950408936e-05, 3.011804074048996e-05, 3.2646581530570984e-05, 3.517512232065201e-05, 3.770366311073303e-05, 4.0232203900814056e-05, 4.276074469089508e-05, 4.5289285480976105e-05, 4.781782627105713e-05, 5.034636706113815e-05, 5.287490785121918e-05, 5.54034486413002e-05, 5.7931989431381226e-05, 6.046053022146225e-05, 6.298907101154327e-05, 6.55176118016243e-05, 6.804615259170532e-05, 7.057469338178635e-05, 7.310323417186737e-05, 7.56317749619484e-05, 7.816031575202942e-05, 8.068885654211044e-05, 8.321739733219147e-05, 8.574593812227249e-05, 8.827447891235352e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 11.0, 18.0, 18.0, 34.0, 47.0, 73.0, 91.0, 134.0, 209.0, 342.0, 477.0, 823.0, 1339.0, 2148.0, 3463.0, 5918.0, 10016.0, 17548.0, 31933.0, 60324.0, 111744.0, 181044.0, 216654.0, 173557.0, 104699.0, 56108.0, 29780.0, 16360.0, 9354.0, 5498.0, 3262.0, 1961.0, 1304.0, 780.0, 511.0, 363.0, 186.0, 126.0, 97.0, 54.0, 39.0, 20.0, 22.0, 17.0, 5.0, 17.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5751953125, -1.526641845703125, -1.47808837890625, -1.429534912109375, -1.3809814453125, -1.332427978515625, -1.28387451171875, -1.235321044921875, -1.186767578125, -1.138214111328125, -1.08966064453125, -1.041107177734375, -0.9925537109375, -0.944000244140625, -0.89544677734375, -0.846893310546875, -0.79833984375, -0.749786376953125, -0.70123291015625, -0.652679443359375, -0.6041259765625, -0.555572509765625, -0.50701904296875, -0.458465576171875, -0.409912109375, -0.361358642578125, -0.31280517578125, -0.264251708984375, -0.2156982421875, -0.167144775390625, -0.11859130859375, -0.070037841796875, -0.021484375, 0.027069091796875, 0.07562255859375, 0.124176025390625, 0.1727294921875, 0.221282958984375, 0.26983642578125, 0.318389892578125, 0.366943359375, 0.415496826171875, 0.46405029296875, 0.512603759765625, 0.5611572265625, 0.609710693359375, 0.65826416015625, 0.706817626953125, 0.75537109375, 0.803924560546875, 0.85247802734375, 0.901031494140625, 0.9495849609375, 0.998138427734375, 1.04669189453125, 1.095245361328125, 1.143798828125, 1.192352294921875, 1.24090576171875, 1.289459228515625, 1.3380126953125, 1.386566162109375, 1.43511962890625, 1.483673095703125, 1.5322265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 3.0, 7.0, 19.0, 12.0, 22.0, 25.0, 33.0, 37.0, 57.0, 53.0, 73.0, 68.0, 70.0, 73.0, 69.0, 67.0, 53.0, 43.0, 46.0, 25.0, 21.0, 29.0, 13.0, 10.0, 14.0, 3.0, 11.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.4990501403808594, -0.48345184326171875, -0.4678535461425781, -0.4522552490234375, -0.4366569519042969, -0.42105865478515625, -0.4054603576660156, -0.389862060546875, -0.3742637634277344, -0.35866546630859375, -0.3430671691894531, -0.3274688720703125, -0.3118705749511719, -0.29627227783203125, -0.2806739807128906, -0.26507568359375, -0.24947738647460938, -0.23387908935546875, -0.21828079223632812, -0.2026824951171875, -0.18708419799804688, -0.17148590087890625, -0.15588760375976562, -0.140289306640625, -0.12469100952148438, -0.10909271240234375, -0.09349441528320312, -0.0778961181640625, -0.062297821044921875, -0.04669952392578125, -0.031101226806640625, -0.0155029296875, 9.5367431640625e-05, 0.01569366455078125, 0.031291961669921875, 0.0468902587890625, 0.062488555908203125, 0.07808685302734375, 0.09368515014648438, 0.109283447265625, 0.12488174438476562, 0.14048004150390625, 0.15607833862304688, 0.1716766357421875, 0.18727493286132812, 0.20287322998046875, 0.21847152709960938, 0.23406982421875, 0.24966812133789062, 0.26526641845703125, 0.2808647155761719, 0.2964630126953125, 0.3120613098144531, 0.32765960693359375, 0.3432579040527344, 0.358856201171875, 0.3744544982910156, 0.39005279541015625, 0.4056510925292969, 0.4212493896484375, 0.4368476867675781, 0.45244598388671875, 0.4680442810058594, 0.483642578125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 6.0, 12.0, 18.0, 10.0, 17.0, 22.0, 32.0, 21.0, 38.0, 51.0, 60.0, 63.0, 66.0, 91.0, 86.0, 70.0, 69.0, 57.0, 46.0, 30.0, 33.0, 30.0, 20.0, 6.0, 6.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.940326690673828, -9.692682266235352, -9.445038795471191, -9.197394371032715, -8.949750900268555, -8.702106475830078, -8.454462051391602, -8.206818580627441, -7.959174156188965, -7.7115302085876465, -7.463886260986328, -7.216241836547852, -6.968597888946533, -6.720953941345215, -6.473309516906738, -6.22566556930542, -5.978021621704102, -5.730377674102783, -5.482733726501465, -5.235089302062988, -4.98744535446167, -4.739801406860352, -4.492156982421875, -4.244513034820557, -3.9968690872192383, -3.74922513961792, -3.5015809535980225, -3.253936767578125, -3.0062928199768066, -2.7586488723754883, -2.511004686355591, -2.2633605003356934, -2.015716552734375, -1.768072485923767, -1.5204284191131592, -1.2727843523025513, -1.0251402854919434, -0.7774962186813354, -0.5298521518707275, -0.28220808506011963, -0.03456401824951172, 0.2130800485610962, 0.4607241153717041, 0.708368182182312, 0.9560122489929199, 1.2036563158035278, 1.4513003826141357, 1.6989444494247437, 1.9465885162353516, 2.19423246383667, 2.4418766498565674, 2.689520835876465, 2.937164783477783, 3.1848087310791016, 3.432452917098999, 3.6800971031188965, 3.927741050720215, 4.175384998321533, 4.423028945922852, 4.670673370361328, 4.9183173179626465, 5.165961265563965, 5.413605690002441, 5.66124963760376, 5.908893585205078]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 6.0, 5.0, 10.0, 10.0, 10.0, 6.0, 15.0, 16.0, 15.0, 18.0, 17.0, 20.0, 14.0, 26.0, 29.0, 29.0, 27.0, 22.0, 34.0, 28.0, 30.0, 42.0, 28.0, 39.0, 29.0, 43.0, 32.0, 34.0, 41.0, 32.0, 40.0, 31.0, 22.0, 20.0, 19.0, 13.0, 20.0, 27.0, 15.0, 10.0, 19.0, 8.0, 8.0, 4.0, 5.0, 11.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0], "bins": [-3.5719351768493652, -3.4707858562469482, -3.369636297225952, -3.268486976623535, -3.167337656021118, -3.066188335418701, -2.965038776397705, -2.863889455795288, -2.762740135192871, -2.661590814590454, -2.560441255569458, -2.459291934967041, -2.358142614364624, -2.256993293762207, -2.155843734741211, -2.054694414138794, -1.9535448551177979, -1.8523954153060913, -1.7512460947036743, -1.6500966548919678, -1.5489473342895508, -1.4477978944778442, -1.3466484546661377, -1.2454991340637207, -1.1443496942520142, -1.0432002544403076, -0.9420509338378906, -0.8409014940261841, -0.7397521138191223, -0.6386027336120605, -0.537453293800354, -0.43630391359329224, -0.33515477180480957, -0.2340053766965866, -0.13285598158836365, -0.03170657157897949, 0.06944280862808228, 0.17059218883514404, 0.2717416286468506, 0.37289100885391235, 0.4740403890609741, 0.5751897692680359, 0.6763391494750977, 0.7774885892868042, 0.878637969493866, 0.9797873497009277, 1.0809367895126343, 1.1820862293243408, 1.2832355499267578, 1.3843849897384644, 1.4855343103408813, 1.586683750152588, 1.6878330707550049, 1.7889825105667114, 1.890131950378418, 1.991281270980835, 2.092430591583252, 2.193579912185669, 2.294729471206665, 2.395878791809082, 2.497028112411499, 2.598177433013916, 2.699326992034912, 2.800476312637329, 2.901625871658325]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 10.0, 11.0, 16.0, 21.0, 31.0, 41.0, 69.0, 90.0, 146.0, 241.0, 400.0, 679.0, 1304.0, 2460.0, 4718.0, 9633.0, 20038.0, 40699.0, 80288.0, 144386.0, 208855.0, 211954.0, 151040.0, 85480.0, 43589.0, 21279.0, 10263.0, 5140.0, 2552.0, 1303.0, 718.0, 386.0, 235.0, 167.0, 82.0, 57.0, 42.0, 42.0, 23.0, 18.0, 11.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.265625, -5.1109619140625, -4.956298828125, -4.8016357421875, -4.64697265625, -4.4923095703125, -4.337646484375, -4.1829833984375, -4.0283203125, -3.8736572265625, -3.718994140625, -3.5643310546875, -3.40966796875, -3.2550048828125, -3.100341796875, -2.9456787109375, -2.791015625, -2.6363525390625, -2.481689453125, -2.3270263671875, -2.17236328125, -2.0177001953125, -1.863037109375, -1.7083740234375, -1.5537109375, -1.3990478515625, -1.244384765625, -1.0897216796875, -0.93505859375, -0.7803955078125, -0.625732421875, -0.4710693359375, -0.31640625, -0.1617431640625, -0.007080078125, 0.1475830078125, 0.30224609375, 0.4569091796875, 0.611572265625, 0.7662353515625, 0.9208984375, 1.0755615234375, 1.230224609375, 1.3848876953125, 1.53955078125, 1.6942138671875, 1.848876953125, 2.0035400390625, 2.158203125, 2.3128662109375, 2.467529296875, 2.6221923828125, 2.77685546875, 2.9315185546875, 3.086181640625, 3.2408447265625, 3.3955078125, 3.5501708984375, 3.704833984375, 3.8594970703125, 4.01416015625, 4.1688232421875, 4.323486328125, 4.4781494140625, 4.6328125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 4.0, 3.0, 12.0, 10.0, 7.0, 15.0, 9.0, 22.0, 14.0, 13.0, 21.0, 38.0, 28.0, 23.0, 23.0, 32.0, 31.0, 37.0, 30.0, 35.0, 35.0, 41.0, 29.0, 46.0, 42.0, 50.0, 40.0, 39.0, 35.0, 32.0, 31.0, 23.0, 14.0, 15.0, 16.0, 19.0, 9.0, 16.0, 15.0, 9.0, 8.0, 11.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.79296875, -3.67401123046875, -3.5550537109375, -3.43609619140625, -3.317138671875, -3.19818115234375, -3.0792236328125, -2.96026611328125, -2.84130859375, -2.72235107421875, -2.6033935546875, -2.48443603515625, -2.365478515625, -2.24652099609375, -2.1275634765625, -2.00860595703125, -1.8896484375, -1.77069091796875, -1.6517333984375, -1.53277587890625, -1.413818359375, -1.29486083984375, -1.1759033203125, -1.05694580078125, -0.93798828125, -0.81903076171875, -0.7000732421875, -0.58111572265625, -0.462158203125, -0.34320068359375, -0.2242431640625, -0.10528564453125, 0.013671875, 0.13262939453125, 0.2515869140625, 0.37054443359375, 0.489501953125, 0.60845947265625, 0.7274169921875, 0.84637451171875, 0.96533203125, 1.08428955078125, 1.2032470703125, 1.32220458984375, 1.441162109375, 1.56011962890625, 1.6790771484375, 1.79803466796875, 1.9169921875, 2.03594970703125, 2.1549072265625, 2.27386474609375, 2.392822265625, 2.51177978515625, 2.6307373046875, 2.74969482421875, 2.86865234375, 2.98760986328125, 3.1065673828125, 3.22552490234375, 3.344482421875, 3.46343994140625, 3.5823974609375, 3.70135498046875, 3.8203125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 8.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 21.0, 21.0, 29.0, 46.0, 64.0, 80.0, 135.0, 171.0, 248.0, 341.0, 451.0, 685.0, 990.0, 1574.0, 2443.0, 4270.0, 7446.0, 13901.0, 25769.0, 49192.0, 90109.0, 148878.0, 199649.0, 192603.0, 135621.0, 78888.0, 43133.0, 22536.0, 12072.0, 6771.0, 3823.0, 2234.0, 1385.0, 943.0, 590.0, 381.0, 280.0, 202.0, 150.0, 107.0, 82.0, 49.0, 41.0, 26.0, 20.0, 19.0, 20.0, 14.0, 5.0, 2.0, 5.0, 2.0, 2.0], "bins": [-4.69140625, -4.552978515625, -4.41455078125, -4.276123046875, -4.1376953125, -3.999267578125, -3.86083984375, -3.722412109375, -3.583984375, -3.445556640625, -3.30712890625, -3.168701171875, -3.0302734375, -2.891845703125, -2.75341796875, -2.614990234375, -2.4765625, -2.338134765625, -2.19970703125, -2.061279296875, -1.9228515625, -1.784423828125, -1.64599609375, -1.507568359375, -1.369140625, -1.230712890625, -1.09228515625, -0.953857421875, -0.8154296875, -0.677001953125, -0.53857421875, -0.400146484375, -0.26171875, -0.123291015625, 0.01513671875, 0.153564453125, 0.2919921875, 0.430419921875, 0.56884765625, 0.707275390625, 0.845703125, 0.984130859375, 1.12255859375, 1.260986328125, 1.3994140625, 1.537841796875, 1.67626953125, 1.814697265625, 1.953125, 2.091552734375, 2.22998046875, 2.368408203125, 2.5068359375, 2.645263671875, 2.78369140625, 2.922119140625, 3.060546875, 3.198974609375, 3.33740234375, 3.475830078125, 3.6142578125, 3.752685546875, 3.89111328125, 4.029541015625, 4.16796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 14.0, 15.0, 17.0, 14.0, 10.0, 17.0, 28.0, 26.0, 34.0, 27.0, 33.0, 32.0, 34.0, 37.0, 36.0, 43.0, 45.0, 44.0, 45.0, 39.0, 50.0, 36.0, 35.0, 36.0, 35.0, 28.0, 21.0, 35.0, 17.0, 16.0, 15.0, 19.0, 16.0, 10.0, 7.0, 5.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.720703125, -2.64007568359375, -2.5594482421875, -2.47882080078125, -2.398193359375, -2.31756591796875, -2.2369384765625, -2.15631103515625, -2.07568359375, -1.99505615234375, -1.9144287109375, -1.83380126953125, -1.753173828125, -1.67254638671875, -1.5919189453125, -1.51129150390625, -1.4306640625, -1.35003662109375, -1.2694091796875, -1.18878173828125, -1.108154296875, -1.02752685546875, -0.9468994140625, -0.86627197265625, -0.78564453125, -0.70501708984375, -0.6243896484375, -0.54376220703125, -0.463134765625, -0.38250732421875, -0.3018798828125, -0.22125244140625, -0.140625, -0.05999755859375, 0.0206298828125, 0.10125732421875, 0.181884765625, 0.26251220703125, 0.3431396484375, 0.42376708984375, 0.50439453125, 0.58502197265625, 0.6656494140625, 0.74627685546875, 0.826904296875, 0.90753173828125, 0.9881591796875, 1.06878662109375, 1.1494140625, 1.23004150390625, 1.3106689453125, 1.39129638671875, 1.471923828125, 1.55255126953125, 1.6331787109375, 1.71380615234375, 1.79443359375, 1.87506103515625, 1.9556884765625, 2.03631591796875, 2.116943359375, 2.19757080078125, 2.2781982421875, 2.35882568359375, 2.439453125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 12.0, 17.0, 31.0, 34.0, 40.0, 68.0, 96.0, 139.0, 225.0, 321.0, 477.0, 674.0, 1072.0, 1766.0, 2825.0, 5208.0, 10283.0, 23304.0, 58100.0, 145348.0, 280048.0, 275963.0, 141000.0, 55981.0, 22656.0, 10029.0, 5071.0, 2780.0, 1743.0, 1074.0, 715.0, 453.0, 314.0, 187.0, 160.0, 113.0, 67.0, 54.0, 32.0, 22.0, 16.0, 9.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4765625, -3.37115478515625, -3.2657470703125, -3.16033935546875, -3.054931640625, -2.94952392578125, -2.8441162109375, -2.73870849609375, -2.63330078125, -2.52789306640625, -2.4224853515625, -2.31707763671875, -2.211669921875, -2.10626220703125, -2.0008544921875, -1.89544677734375, -1.7900390625, -1.68463134765625, -1.5792236328125, -1.47381591796875, -1.368408203125, -1.26300048828125, -1.1575927734375, -1.05218505859375, -0.94677734375, -0.84136962890625, -0.7359619140625, -0.63055419921875, -0.525146484375, -0.41973876953125, -0.3143310546875, -0.20892333984375, -0.103515625, 0.00189208984375, 0.1072998046875, 0.21270751953125, 0.318115234375, 0.42352294921875, 0.5289306640625, 0.63433837890625, 0.73974609375, 0.84515380859375, 0.9505615234375, 1.05596923828125, 1.161376953125, 1.26678466796875, 1.3721923828125, 1.47760009765625, 1.5830078125, 1.68841552734375, 1.7938232421875, 1.89923095703125, 2.004638671875, 2.11004638671875, 2.2154541015625, 2.32086181640625, 2.42626953125, 2.53167724609375, 2.6370849609375, 2.74249267578125, 2.847900390625, 2.95330810546875, 3.0587158203125, 3.16412353515625, 3.26953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 9.0, 8.0, 7.0, 12.0, 16.0, 27.0, 52.0, 64.0, 103.0, 110.0, 115.0, 124.0, 81.0, 79.0, 58.0, 46.0, 31.0, 18.0, 8.0, 6.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00029468536376953125, -0.00028366968035697937, -0.0002726539969444275, -0.0002616383135318756, -0.00025062263011932373, -0.00023960694670677185, -0.00022859126329421997, -0.0002175755798816681, -0.0002065598964691162, -0.00019554421305656433, -0.00018452852964401245, -0.00017351284623146057, -0.0001624971628189087, -0.0001514814794063568, -0.00014046579599380493, -0.00012945011258125305, -0.00011843442916870117, -0.00010741874575614929, -9.640306234359741e-05, -8.538737893104553e-05, -7.437169551849365e-05, -6.335601210594177e-05, -5.234032869338989e-05, -4.132464528083801e-05, -3.0308961868286133e-05, -1.9293278455734253e-05, -8.277595043182373e-06, 2.738088369369507e-06, 1.3753771781921387e-05, 2.4769455194473267e-05, 3.5785138607025146e-05, 4.6800822019577026e-05, 5.7816505432128906e-05, 6.883218884468079e-05, 7.984787225723267e-05, 9.086355566978455e-05, 0.00010187923908233643, 0.0001128949224948883, 0.00012391060590744019, 0.00013492628931999207, 0.00014594197273254395, 0.00015695765614509583, 0.0001679733395576477, 0.00017898902297019958, 0.00019000470638275146, 0.00020102038979530334, 0.00021203607320785522, 0.0002230517566204071, 0.00023406744003295898, 0.00024508312344551086, 0.00025609880685806274, 0.0002671144902706146, 0.0002781301736831665, 0.0002891458570957184, 0.00030016154050827026, 0.00031117722392082214, 0.000322192907333374, 0.0003332085907459259, 0.0003442242741584778, 0.00035523995757102966, 0.00036625564098358154, 0.0003772713243961334, 0.0003882870078086853, 0.0003993026912212372, 0.00041031837463378906]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 4.0, 3.0, 10.0, 12.0, 10.0, 33.0, 26.0, 30.0, 49.0, 69.0, 101.0, 132.0, 163.0, 235.0, 328.0, 475.0, 759.0, 1060.0, 1663.0, 2686.0, 5081.0, 10167.0, 23447.0, 61134.0, 160717.0, 304357.0, 269175.0, 123243.0, 45725.0, 18257.0, 8249.0, 4192.0, 2405.0, 1413.0, 962.0, 661.0, 448.0, 274.0, 218.0, 164.0, 131.0, 72.0, 68.0, 36.0, 32.0, 24.0, 16.0, 14.0, 10.0, 4.0, 10.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.109375, -3.001617431640625, -2.89385986328125, -2.786102294921875, -2.6783447265625, -2.570587158203125, -2.46282958984375, -2.355072021484375, -2.247314453125, -2.139556884765625, -2.03179931640625, -1.924041748046875, -1.8162841796875, -1.708526611328125, -1.60076904296875, -1.493011474609375, -1.38525390625, -1.277496337890625, -1.16973876953125, -1.061981201171875, -0.9542236328125, -0.846466064453125, -0.73870849609375, -0.630950927734375, -0.523193359375, -0.415435791015625, -0.30767822265625, -0.199920654296875, -0.0921630859375, 0.015594482421875, 0.12335205078125, 0.231109619140625, 0.3388671875, 0.446624755859375, 0.55438232421875, 0.662139892578125, 0.7698974609375, 0.877655029296875, 0.98541259765625, 1.093170166015625, 1.200927734375, 1.308685302734375, 1.41644287109375, 1.524200439453125, 1.6319580078125, 1.739715576171875, 1.84747314453125, 1.955230712890625, 2.06298828125, 2.170745849609375, 2.27850341796875, 2.386260986328125, 2.4940185546875, 2.601776123046875, 2.70953369140625, 2.817291259765625, 2.925048828125, 3.032806396484375, 3.14056396484375, 3.248321533203125, 3.3560791015625, 3.463836669921875, 3.57159423828125, 3.679351806640625, 3.787109375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 11.0, 10.0, 15.0, 22.0, 39.0, 47.0, 74.0, 70.0, 83.0, 97.0, 91.0, 86.0, 104.0, 68.0, 56.0, 34.0, 35.0, 13.0, 8.0, 6.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9140625, -0.8826446533203125, -0.851226806640625, -0.8198089599609375, -0.78839111328125, -0.7569732666015625, -0.725555419921875, -0.6941375732421875, -0.6627197265625, -0.6313018798828125, -0.599884033203125, -0.5684661865234375, -0.53704833984375, -0.5056304931640625, -0.474212646484375, -0.4427947998046875, -0.411376953125, -0.3799591064453125, -0.348541259765625, -0.3171234130859375, -0.28570556640625, -0.2542877197265625, -0.222869873046875, -0.1914520263671875, -0.1600341796875, -0.1286163330078125, -0.097198486328125, -0.0657806396484375, -0.03436279296875, -0.0029449462890625, 0.028472900390625, 0.0598907470703125, 0.09130859375, 0.1227264404296875, 0.154144287109375, 0.1855621337890625, 0.21697998046875, 0.2483978271484375, 0.279815673828125, 0.3112335205078125, 0.3426513671875, 0.3740692138671875, 0.405487060546875, 0.4369049072265625, 0.46832275390625, 0.4997406005859375, 0.531158447265625, 0.5625762939453125, 0.593994140625, 0.6254119873046875, 0.656829833984375, 0.6882476806640625, 0.71966552734375, 0.7510833740234375, 0.782501220703125, 0.8139190673828125, 0.8453369140625, 0.8767547607421875, 0.908172607421875, 0.9395904541015625, 0.97100830078125, 1.0024261474609375, 1.033843994140625, 1.0652618408203125, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 8.0, 2.0, 3.0, 12.0, 12.0, 20.0, 14.0, 18.0, 22.0, 37.0, 36.0, 36.0, 57.0, 64.0, 59.0, 77.0, 69.0, 73.0, 59.0, 64.0, 56.0, 41.0, 37.0, 34.0, 24.0, 16.0, 7.0, 13.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.231340408325195, -8.999356269836426, -8.767373085021973, -8.535388946533203, -8.30340576171875, -8.07142162322998, -7.839438438415527, -7.607454299926758, -7.3754706382751465, -7.143486976623535, -6.911503314971924, -6.6795196533203125, -6.447535991668701, -6.21555233001709, -5.98356819152832, -5.751584529876709, -5.519600868225098, -5.287617206573486, -5.055633544921875, -4.823649883270264, -4.591666221618652, -4.359682083129883, -4.12769889831543, -3.89571475982666, -3.663731575012207, -3.4317479133605957, -3.1997642517089844, -2.967780590057373, -2.7357966899871826, -2.5038130283355713, -2.27182936668396, -2.0398454666137695, -1.8078618049621582, -1.5758781433105469, -1.343894362449646, -1.1119107007980347, -0.8799269795417786, -0.6479432582855225, -0.41595959663391113, -0.18397581577301025, 0.048007845878601074, 0.2799915671348572, 0.5119752883911133, 0.7439589500427246, 0.9759426712989807, 1.2079263925552368, 1.4399100542068481, 1.671893835067749, 1.9038774967193604, 2.1358611583709717, 2.367844820022583, 2.5998287200927734, 2.8318123817443848, 3.063796043395996, 3.2957797050476074, 3.5277633666992188, 3.75974702835083, 3.9917306900024414, 4.223714351654053, 4.455698013305664, 4.687681674957275, 4.919665336608887, 5.151649475097656, 5.383633136749268, 5.615616798400879]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 8.0, 4.0, 5.0, 12.0, 8.0, 13.0, 15.0, 8.0, 22.0, 16.0, 23.0, 12.0, 21.0, 24.0, 21.0, 27.0, 28.0, 34.0, 37.0, 38.0, 40.0, 32.0, 41.0, 42.0, 53.0, 28.0, 34.0, 35.0, 33.0, 32.0, 26.0, 31.0, 29.0, 25.0, 23.0, 16.0, 18.0, 12.0, 12.0, 10.0, 10.0, 12.0, 5.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.342905044555664, -3.2374014854431152, -3.1318979263305664, -3.0263943672180176, -2.9208908081054688, -2.81538724899292, -2.70988392829895, -2.6043803691864014, -2.4988768100738525, -2.3933732509613037, -2.287869691848755, -2.182366132736206, -2.0768628120422363, -1.971359133720398, -1.8658556938171387, -1.7603521347045898, -1.654848575592041, -1.5493450164794922, -1.4438414573669434, -1.338338017463684, -1.2328344583511353, -1.1273308992385864, -1.0218274593353271, -0.9163239002227783, -0.8108203411102295, -0.7053167819976807, -0.5998132824897766, -0.49430975317955017, -0.38880622386932373, -0.2833026647567749, -0.17779916524887085, -0.0722956657409668, 0.03320789337158203, 0.13871142268180847, 0.2442149519920349, 0.34971848130226135, 0.4552220106124878, 0.5607255697250366, 0.6662290692329407, 0.7717325687408447, 0.8772361278533936, 0.9827396869659424, 1.0882432460784912, 1.1937466859817505, 1.2992502450942993, 1.4047538042068481, 1.5102572441101074, 1.6157608032226562, 1.721264362335205, 1.826767921447754, 1.9322714805603027, 2.0377750396728516, 2.1432785987854004, 2.248782157897949, 2.354285478591919, 2.4597890377044678, 2.5652925968170166, 2.6707961559295654, 2.7762997150421143, 2.881803274154663, 2.987306594848633, 3.0928101539611816, 3.1983137130737305, 3.3038172721862793, 3.409320831298828]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 5.0, 12.0, 20.0, 15.0, 22.0, 34.0, 57.0, 58.0, 105.0, 137.0, 184.0, 290.0, 386.0, 599.0, 908.0, 1338.0, 1946.0, 3068.0, 4787.0, 7945.0, 13741.0, 24741.0, 47206.0, 97477.0, 221553.0, 558049.0, 1154140.0, 1120302.0, 528408.0, 211373.0, 92585.0, 44845.0, 23650.0, 13120.0, 7628.0, 4730.0, 2912.0, 1915.0, 1285.0, 844.0, 590.0, 384.0, 269.0, 196.0, 113.0, 97.0, 71.0, 41.0, 41.0, 16.0, 13.0, 12.0, 7.0, 8.0, 1.0, 2.0, 3.0], "bins": [-6.5, -6.30865478515625, -6.1173095703125, -5.92596435546875, -5.734619140625, -5.54327392578125, -5.3519287109375, -5.16058349609375, -4.96923828125, -4.77789306640625, -4.5865478515625, -4.39520263671875, -4.203857421875, -4.01251220703125, -3.8211669921875, -3.62982177734375, -3.4384765625, -3.24713134765625, -3.0557861328125, -2.86444091796875, -2.673095703125, -2.48175048828125, -2.2904052734375, -2.09906005859375, -1.90771484375, -1.71636962890625, -1.5250244140625, -1.33367919921875, -1.142333984375, -0.95098876953125, -0.7596435546875, -0.56829833984375, -0.376953125, -0.18560791015625, 0.0057373046875, 0.19708251953125, 0.388427734375, 0.57977294921875, 0.7711181640625, 0.96246337890625, 1.15380859375, 1.34515380859375, 1.5364990234375, 1.72784423828125, 1.919189453125, 2.11053466796875, 2.3018798828125, 2.49322509765625, 2.6845703125, 2.87591552734375, 3.0672607421875, 3.25860595703125, 3.449951171875, 3.64129638671875, 3.8326416015625, 4.02398681640625, 4.21533203125, 4.40667724609375, 4.5980224609375, 4.78936767578125, 4.980712890625, 5.17205810546875, 5.3634033203125, 5.55474853515625, 5.74609375]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 12.0, 6.0, 12.0, 14.0, 17.0, 12.0, 8.0, 18.0, 27.0, 18.0, 17.0, 21.0, 34.0, 26.0, 26.0, 26.0, 26.0, 43.0, 36.0, 37.0, 34.0, 45.0, 45.0, 41.0, 35.0, 39.0, 35.0, 28.0, 37.0, 27.0, 20.0, 24.0, 22.0, 21.0, 12.0, 10.0, 16.0, 15.0, 9.0, 5.0, 6.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.548828125, -2.472869873046875, -2.39691162109375, -2.320953369140625, -2.2449951171875, -2.169036865234375, -2.09307861328125, -2.017120361328125, -1.941162109375, -1.865203857421875, -1.78924560546875, -1.713287353515625, -1.6373291015625, -1.561370849609375, -1.48541259765625, -1.409454345703125, -1.33349609375, -1.257537841796875, -1.18157958984375, -1.105621337890625, -1.0296630859375, -0.953704833984375, -0.87774658203125, -0.801788330078125, -0.725830078125, -0.649871826171875, -0.57391357421875, -0.497955322265625, -0.4219970703125, -0.346038818359375, -0.27008056640625, -0.194122314453125, -0.1181640625, -0.042205810546875, 0.03375244140625, 0.109710693359375, 0.1856689453125, 0.261627197265625, 0.33758544921875, 0.413543701171875, 0.489501953125, 0.565460205078125, 0.64141845703125, 0.717376708984375, 0.7933349609375, 0.869293212890625, 0.94525146484375, 1.021209716796875, 1.09716796875, 1.173126220703125, 1.24908447265625, 1.325042724609375, 1.4010009765625, 1.476959228515625, 1.55291748046875, 1.628875732421875, 1.704833984375, 1.780792236328125, 1.85675048828125, 1.932708740234375, 2.0086669921875, 2.084625244140625, 2.16058349609375, 2.236541748046875, 2.3125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 13.0, 17.0, 12.0, 14.0, 44.0, 72.0, 96.0, 134.0, 225.0, 291.0, 450.0, 712.0, 991.0, 1609.0, 2463.0, 3789.0, 6025.0, 9727.0, 16247.0, 27177.0, 47295.0, 85426.0, 160703.0, 320625.0, 641484.0, 1034483.0, 868500.0, 461940.0, 229935.0, 118966.0, 63683.0, 36316.0, 20888.0, 12667.0, 7726.0, 4805.0, 2997.0, 1996.0, 1265.0, 809.0, 536.0, 367.0, 276.0, 152.0, 106.0, 73.0, 62.0, 26.0, 24.0, 24.0, 9.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.640625, -5.46844482421875, -5.2962646484375, -5.12408447265625, -4.951904296875, -4.77972412109375, -4.6075439453125, -4.43536376953125, -4.26318359375, -4.09100341796875, -3.9188232421875, -3.74664306640625, -3.574462890625, -3.40228271484375, -3.2301025390625, -3.05792236328125, -2.8857421875, -2.71356201171875, -2.5413818359375, -2.36920166015625, -2.197021484375, -2.02484130859375, -1.8526611328125, -1.68048095703125, -1.50830078125, -1.33612060546875, -1.1639404296875, -0.99176025390625, -0.819580078125, -0.64739990234375, -0.4752197265625, -0.30303955078125, -0.130859375, 0.04132080078125, 0.2135009765625, 0.38568115234375, 0.557861328125, 0.73004150390625, 0.9022216796875, 1.07440185546875, 1.24658203125, 1.41876220703125, 1.5909423828125, 1.76312255859375, 1.935302734375, 2.10748291015625, 2.2796630859375, 2.45184326171875, 2.6240234375, 2.79620361328125, 2.9683837890625, 3.14056396484375, 3.312744140625, 3.48492431640625, 3.6571044921875, 3.82928466796875, 4.00146484375, 4.17364501953125, 4.3458251953125, 4.51800537109375, 4.690185546875, 4.86236572265625, 5.0345458984375, 5.20672607421875, 5.37890625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 9.0, 11.0, 14.0, 17.0, 14.0, 24.0, 38.0, 39.0, 53.0, 74.0, 93.0, 122.0, 146.0, 180.0, 202.0, 233.0, 284.0, 285.0, 268.0, 292.0, 271.0, 254.0, 247.0, 194.0, 129.0, 115.0, 90.0, 82.0, 63.0, 30.0, 42.0, 32.0, 25.0, 22.0, 18.0, 15.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6572265625, -1.6015777587890625, -1.545928955078125, -1.4902801513671875, -1.43463134765625, -1.3789825439453125, -1.323333740234375, -1.2676849365234375, -1.2120361328125, -1.1563873291015625, -1.100738525390625, -1.0450897216796875, -0.98944091796875, -0.9337921142578125, -0.878143310546875, -0.8224945068359375, -0.766845703125, -0.7111968994140625, -0.655548095703125, -0.5998992919921875, -0.54425048828125, -0.4886016845703125, -0.432952880859375, -0.3773040771484375, -0.3216552734375, -0.2660064697265625, -0.210357666015625, -0.1547088623046875, -0.09906005859375, -0.0434112548828125, 0.012237548828125, 0.0678863525390625, 0.12353515625, 0.1791839599609375, 0.234832763671875, 0.2904815673828125, 0.34613037109375, 0.4017791748046875, 0.457427978515625, 0.5130767822265625, 0.5687255859375, 0.6243743896484375, 0.680023193359375, 0.7356719970703125, 0.79132080078125, 0.8469696044921875, 0.902618408203125, 0.9582672119140625, 1.013916015625, 1.0695648193359375, 1.125213623046875, 1.1808624267578125, 1.23651123046875, 1.2921600341796875, 1.347808837890625, 1.4034576416015625, 1.4591064453125, 1.5147552490234375, 1.570404052734375, 1.6260528564453125, 1.68170166015625, 1.7373504638671875, 1.792999267578125, 1.8486480712890625, 1.904296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 9.0, 13.0, 19.0, 23.0, 29.0, 34.0, 38.0, 58.0, 66.0, 68.0, 77.0, 77.0, 74.0, 82.0, 56.0, 54.0, 48.0, 41.0, 35.0, 24.0, 17.0, 14.0, 8.0, 1.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.406835556030273, -11.148826599121094, -10.890816688537598, -10.632807731628418, -10.374797821044922, -10.116788864135742, -9.858778953552246, -9.600769996643066, -9.34276008605957, -9.08475112915039, -8.826741218566895, -8.568732261657715, -8.310722351074219, -8.052713394165039, -7.794703960418701, -7.536694526672363, -7.278685569763184, -7.020676136016846, -6.762666702270508, -6.50465726852417, -6.246647834777832, -5.988638877868652, -5.7306294441223145, -5.472620010375977, -5.214610576629639, -4.956601142883301, -4.698591709136963, -4.440582275390625, -4.182573318481445, -3.9245636463165283, -3.6665544509887695, -3.4085450172424316, -3.1505351066589355, -2.8925256729125977, -2.6345162391662598, -2.376507043838501, -2.118497610092163, -1.8604881763458252, -1.6024788618087769, -1.3444695472717285, -1.0864601135253906, -0.8284507393836975, -0.5704413652420044, -0.3124319911003113, -0.054422616958618164, 0.20358681678771973, 0.46159613132476807, 0.7196054458618164, 0.9776148796081543, 1.2356243133544922, 1.4936336278915405, 1.7516429424285889, 2.0096523761749268, 2.2676618099212646, 2.5256710052490234, 2.7836804389953613, 3.041689872741699, 3.299699306488037, 3.557708740234375, 3.815717935562134, 4.073727607727051, 4.3317365646362305, 4.589745998382568, 4.847755432128906, 5.105764865875244]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 7.0, 5.0, 9.0, 11.0, 13.0, 15.0, 17.0, 13.0, 23.0, 24.0, 30.0, 17.0, 27.0, 38.0, 35.0, 38.0, 43.0, 24.0, 40.0, 40.0, 35.0, 32.0, 47.0, 39.0, 33.0, 36.0, 34.0, 25.0, 28.0, 26.0, 28.0, 17.0, 27.0, 27.0, 9.0, 18.0, 6.0, 14.0, 14.0, 4.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.7236645221710205, -3.6212408542633057, -3.518817186355591, -3.416393518447876, -3.313969850540161, -3.2115461826324463, -3.1091222763061523, -3.0066986083984375, -2.9042749404907227, -2.801851272583008, -2.699427604675293, -2.597003936767578, -2.4945802688598633, -2.3921566009521484, -2.2897329330444336, -2.1873092651367188, -2.084885597229004, -1.982461929321289, -1.8800382614135742, -1.7776145935058594, -1.6751909255981445, -1.5727672576904297, -1.4703434705734253, -1.3679198026657104, -1.2654961347579956, -1.1630724668502808, -1.060648798942566, -0.9582250714302063, -0.8558014035224915, -0.7533777356147766, -0.650954008102417, -0.5485303401947021, -0.4461069107055664, -0.34368324279785156, -0.24125954508781433, -0.1388358473777771, -0.036412179470062256, 0.06601148843765259, 0.1684352159500122, 0.27085888385772705, 0.3732825517654419, 0.47570621967315674, 0.5781298875808716, 0.6805536150932312, 0.782977283000946, 0.8854009509086609, 0.9878246784210205, 1.0902483463287354, 1.1926720142364502, 1.295095682144165, 1.3975193500518799, 1.4999430179595947, 1.6023666858673096, 1.7047903537750244, 1.8072141408920288, 1.9096378087997437, 2.012061595916748, 2.114485263824463, 2.2169089317321777, 2.3193325996398926, 2.4217562675476074, 2.5241799354553223, 2.626603603363037, 2.729027271270752, 2.831450939178467]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 12.0, 7.0, 16.0, 22.0, 17.0, 47.0, 53.0, 83.0, 117.0, 163.0, 199.0, 246.0, 376.0, 584.0, 869.0, 1307.0, 2290.0, 4018.0, 7399.0, 14255.0, 28620.0, 57793.0, 112151.0, 189819.0, 233841.0, 180748.0, 103709.0, 53671.0, 26241.0, 13230.0, 6853.0, 3724.0, 2094.0, 1268.0, 836.0, 580.0, 344.0, 252.0, 173.0, 148.0, 99.0, 69.0, 60.0, 45.0, 27.0, 27.0, 14.0, 10.0, 5.0, 11.0, 4.0, 2.0, 4.0], "bins": [-3.7421875, -3.6365966796875, -3.531005859375, -3.4254150390625, -3.31982421875, -3.2142333984375, -3.108642578125, -3.0030517578125, -2.8974609375, -2.7918701171875, -2.686279296875, -2.5806884765625, -2.47509765625, -2.3695068359375, -2.263916015625, -2.1583251953125, -2.052734375, -1.9471435546875, -1.841552734375, -1.7359619140625, -1.63037109375, -1.5247802734375, -1.419189453125, -1.3135986328125, -1.2080078125, -1.1024169921875, -0.996826171875, -0.8912353515625, -0.78564453125, -0.6800537109375, -0.574462890625, -0.4688720703125, -0.36328125, -0.2576904296875, -0.152099609375, -0.0465087890625, 0.05908203125, 0.1646728515625, 0.270263671875, 0.3758544921875, 0.4814453125, 0.5870361328125, 0.692626953125, 0.7982177734375, 0.90380859375, 1.0093994140625, 1.114990234375, 1.2205810546875, 1.326171875, 1.4317626953125, 1.537353515625, 1.6429443359375, 1.74853515625, 1.8541259765625, 1.959716796875, 2.0653076171875, 2.1708984375, 2.2764892578125, 2.382080078125, 2.4876708984375, 2.59326171875, 2.6988525390625, 2.804443359375, 2.9100341796875, 3.015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 9.0, 6.0, 8.0, 7.0, 12.0, 9.0, 12.0, 16.0, 22.0, 19.0, 28.0, 24.0, 32.0, 31.0, 43.0, 28.0, 30.0, 32.0, 32.0, 51.0, 35.0, 39.0, 41.0, 33.0, 38.0, 32.0, 31.0, 33.0, 35.0, 27.0, 38.0, 19.0, 28.0, 16.0, 22.0, 13.0, 11.0, 10.0, 12.0, 5.0, 7.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.83984375, -3.7265625, -3.61328125, -3.5, -3.38671875, -3.2734375, -3.16015625, -3.046875, -2.93359375, -2.8203125, -2.70703125, -2.59375, -2.48046875, -2.3671875, -2.25390625, -2.140625, -2.02734375, -1.9140625, -1.80078125, -1.6875, -1.57421875, -1.4609375, -1.34765625, -1.234375, -1.12109375, -1.0078125, -0.89453125, -0.78125, -0.66796875, -0.5546875, -0.44140625, -0.328125, -0.21484375, -0.1015625, 0.01171875, 0.125, 0.23828125, 0.3515625, 0.46484375, 0.578125, 0.69140625, 0.8046875, 0.91796875, 1.03125, 1.14453125, 1.2578125, 1.37109375, 1.484375, 1.59765625, 1.7109375, 1.82421875, 1.9375, 2.05078125, 2.1640625, 2.27734375, 2.390625, 2.50390625, 2.6171875, 2.73046875, 2.84375, 2.95703125, 3.0703125, 3.18359375, 3.296875, 3.41015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 0.0, 5.0, 10.0, 8.0, 13.0, 18.0, 30.0, 18.0, 30.0, 57.0, 84.0, 146.0, 209.0, 269.0, 437.0, 691.0, 1167.0, 2097.0, 4072.0, 8073.0, 18181.0, 43181.0, 106174.0, 246194.0, 320853.0, 171781.0, 70393.0, 28883.0, 12485.0, 5905.0, 2964.0, 1615.0, 959.0, 508.0, 303.0, 229.0, 156.0, 115.0, 60.0, 60.0, 33.0, 27.0, 19.0, 8.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.21484375, -5.05810546875, -4.9013671875, -4.74462890625, -4.587890625, -4.43115234375, -4.2744140625, -4.11767578125, -3.9609375, -3.80419921875, -3.6474609375, -3.49072265625, -3.333984375, -3.17724609375, -3.0205078125, -2.86376953125, -2.70703125, -2.55029296875, -2.3935546875, -2.23681640625, -2.080078125, -1.92333984375, -1.7666015625, -1.60986328125, -1.453125, -1.29638671875, -1.1396484375, -0.98291015625, -0.826171875, -0.66943359375, -0.5126953125, -0.35595703125, -0.19921875, -0.04248046875, 0.1142578125, 0.27099609375, 0.427734375, 0.58447265625, 0.7412109375, 0.89794921875, 1.0546875, 1.21142578125, 1.3681640625, 1.52490234375, 1.681640625, 1.83837890625, 1.9951171875, 2.15185546875, 2.30859375, 2.46533203125, 2.6220703125, 2.77880859375, 2.935546875, 3.09228515625, 3.2490234375, 3.40576171875, 3.5625, 3.71923828125, 3.8759765625, 4.03271484375, 4.189453125, 4.34619140625, 4.5029296875, 4.65966796875, 4.81640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 12.0, 9.0, 11.0, 17.0, 13.0, 20.0, 23.0, 24.0, 25.0, 24.0, 35.0, 21.0, 45.0, 50.0, 39.0, 39.0, 33.0, 34.0, 35.0, 50.0, 38.0, 32.0, 33.0, 36.0, 42.0, 31.0, 25.0, 28.0, 18.0, 16.0, 26.0, 16.0, 19.0, 10.0, 10.0, 11.0, 10.0, 6.0, 8.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.2265625, -2.15716552734375, -2.0877685546875, -2.01837158203125, -1.948974609375, -1.87957763671875, -1.8101806640625, -1.74078369140625, -1.67138671875, -1.60198974609375, -1.5325927734375, -1.46319580078125, -1.393798828125, -1.32440185546875, -1.2550048828125, -1.18560791015625, -1.1162109375, -1.04681396484375, -0.9774169921875, -0.90802001953125, -0.838623046875, -0.76922607421875, -0.6998291015625, -0.63043212890625, -0.56103515625, -0.49163818359375, -0.4222412109375, -0.35284423828125, -0.283447265625, -0.21405029296875, -0.1446533203125, -0.07525634765625, -0.005859375, 0.06353759765625, 0.1329345703125, 0.20233154296875, 0.271728515625, 0.34112548828125, 0.4105224609375, 0.47991943359375, 0.54931640625, 0.61871337890625, 0.6881103515625, 0.75750732421875, 0.826904296875, 0.89630126953125, 0.9656982421875, 1.03509521484375, 1.1044921875, 1.17388916015625, 1.2432861328125, 1.31268310546875, 1.382080078125, 1.45147705078125, 1.5208740234375, 1.59027099609375, 1.65966796875, 1.72906494140625, 1.7984619140625, 1.86785888671875, 1.937255859375, 2.00665283203125, 2.0760498046875, 2.14544677734375, 2.21484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 16.0, 21.0, 24.0, 37.0, 56.0, 60.0, 93.0, 102.0, 151.0, 217.0, 297.0, 417.0, 564.0, 875.0, 1434.0, 2401.0, 4345.0, 9820.0, 27215.0, 92287.0, 327317.0, 398942.0, 122451.0, 34484.0, 12239.0, 5112.0, 2649.0, 1553.0, 1041.0, 629.0, 484.0, 328.0, 255.0, 173.0, 114.0, 98.0, 78.0, 48.0, 32.0, 19.0, 21.0, 13.0, 9.0, 10.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.1640625, -3.065521240234375, -2.96697998046875, -2.868438720703125, -2.7698974609375, -2.671356201171875, -2.57281494140625, -2.474273681640625, -2.375732421875, -2.277191162109375, -2.17864990234375, -2.080108642578125, -1.9815673828125, -1.883026123046875, -1.78448486328125, -1.685943603515625, -1.58740234375, -1.488861083984375, -1.39031982421875, -1.291778564453125, -1.1932373046875, -1.094696044921875, -0.99615478515625, -0.897613525390625, -0.799072265625, -0.700531005859375, -0.60198974609375, -0.503448486328125, -0.4049072265625, -0.306365966796875, -0.20782470703125, -0.109283447265625, -0.0107421875, 0.087799072265625, 0.18634033203125, 0.284881591796875, 0.3834228515625, 0.481964111328125, 0.58050537109375, 0.679046630859375, 0.777587890625, 0.876129150390625, 0.97467041015625, 1.073211669921875, 1.1717529296875, 1.270294189453125, 1.36883544921875, 1.467376708984375, 1.56591796875, 1.664459228515625, 1.76300048828125, 1.861541748046875, 1.9600830078125, 2.058624267578125, 2.15716552734375, 2.255706787109375, 2.354248046875, 2.452789306640625, 2.55133056640625, 2.649871826171875, 2.7484130859375, 2.846954345703125, 2.94549560546875, 3.044036865234375, 3.142578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 14.0, 35.0, 36.0, 48.0, 65.0, 92.0, 117.0, 135.0, 124.0, 95.0, 71.0, 44.0, 31.0, 25.0, 21.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014281272888183594, -0.00013865530490875244, -0.00013449788093566895, -0.00013034045696258545, -0.00012618303298950195, -0.00012202560901641846, -0.00011786818504333496, -0.00011371076107025146, -0.00010955333709716797, -0.00010539591312408447, -0.00010123848915100098, -9.708106517791748e-05, -9.292364120483398e-05, -8.876621723175049e-05, -8.460879325866699e-05, -8.04513692855835e-05, -7.62939453125e-05, -7.21365213394165e-05, -6.797909736633301e-05, -6.382167339324951e-05, -5.9664249420166016e-05, -5.550682544708252e-05, -5.1349401473999023e-05, -4.719197750091553e-05, -4.303455352783203e-05, -3.8877129554748535e-05, -3.471970558166504e-05, -3.056228160858154e-05, -2.6404857635498047e-05, -2.224743366241455e-05, -1.8090009689331055e-05, -1.3932585716247559e-05, -9.775161743164062e-06, -5.617737770080566e-06, -1.4603137969970703e-06, 2.6971101760864258e-06, 6.854534149169922e-06, 1.1011958122253418e-05, 1.5169382095336914e-05, 1.932680606842041e-05, 2.3484230041503906e-05, 2.7641654014587402e-05, 3.17990779876709e-05, 3.5956501960754395e-05, 4.011392593383789e-05, 4.427134990692139e-05, 4.842877388000488e-05, 5.258619785308838e-05, 5.6743621826171875e-05, 6.090104579925537e-05, 6.505846977233887e-05, 6.921589374542236e-05, 7.337331771850586e-05, 7.753074169158936e-05, 8.168816566467285e-05, 8.584558963775635e-05, 9.000301361083984e-05, 9.416043758392334e-05, 9.831786155700684e-05, 0.00010247528553009033, 0.00010663270950317383, 0.00011079013347625732, 0.00011494755744934082, 0.00011910498142242432, 0.0001232624053955078]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 13.0, 20.0, 17.0, 23.0, 42.0, 61.0, 88.0, 150.0, 220.0, 293.0, 459.0, 724.0, 1050.0, 1718.0, 2976.0, 6416.0, 17414.0, 60659.0, 216050.0, 422717.0, 222656.0, 62230.0, 18080.0, 6459.0, 3046.0, 1755.0, 1093.0, 718.0, 489.0, 290.0, 205.0, 151.0, 101.0, 55.0, 35.0, 33.0, 20.0, 6.0, 13.0, 3.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0859375, -2.99652099609375, -2.9071044921875, -2.81768798828125, -2.728271484375, -2.63885498046875, -2.5494384765625, -2.46002197265625, -2.37060546875, -2.28118896484375, -2.1917724609375, -2.10235595703125, -2.012939453125, -1.92352294921875, -1.8341064453125, -1.74468994140625, -1.6552734375, -1.56585693359375, -1.4764404296875, -1.38702392578125, -1.297607421875, -1.20819091796875, -1.1187744140625, -1.02935791015625, -0.93994140625, -0.85052490234375, -0.7611083984375, -0.67169189453125, -0.582275390625, -0.49285888671875, -0.4034423828125, -0.31402587890625, -0.224609375, -0.13519287109375, -0.0457763671875, 0.04364013671875, 0.133056640625, 0.22247314453125, 0.3118896484375, 0.40130615234375, 0.49072265625, 0.58013916015625, 0.6695556640625, 0.75897216796875, 0.848388671875, 0.93780517578125, 1.0272216796875, 1.11663818359375, 1.2060546875, 1.29547119140625, 1.3848876953125, 1.47430419921875, 1.563720703125, 1.65313720703125, 1.7425537109375, 1.83197021484375, 1.92138671875, 2.01080322265625, 2.1002197265625, 2.18963623046875, 2.279052734375, 2.36846923828125, 2.4578857421875, 2.54730224609375, 2.63671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 7.0, 6.0, 10.0, 21.0, 16.0, 34.0, 53.0, 47.0, 46.0, 69.0, 82.0, 99.0, 92.0, 75.0, 63.0, 75.0, 47.0, 40.0, 29.0, 24.0, 19.0, 14.0, 7.0, 9.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.537109375, -0.519195556640625, -0.50128173828125, -0.483367919921875, -0.4654541015625, -0.447540283203125, -0.42962646484375, -0.411712646484375, -0.393798828125, -0.375885009765625, -0.35797119140625, -0.340057373046875, -0.3221435546875, -0.304229736328125, -0.28631591796875, -0.268402099609375, -0.25048828125, -0.232574462890625, -0.21466064453125, -0.196746826171875, -0.1788330078125, -0.160919189453125, -0.14300537109375, -0.125091552734375, -0.107177734375, -0.089263916015625, -0.07135009765625, -0.053436279296875, -0.0355224609375, -0.017608642578125, 0.00030517578125, 0.018218994140625, 0.0361328125, 0.054046630859375, 0.07196044921875, 0.089874267578125, 0.1077880859375, 0.125701904296875, 0.14361572265625, 0.161529541015625, 0.179443359375, 0.197357177734375, 0.21527099609375, 0.233184814453125, 0.2510986328125, 0.269012451171875, 0.28692626953125, 0.304840087890625, 0.32275390625, 0.340667724609375, 0.35858154296875, 0.376495361328125, 0.3944091796875, 0.412322998046875, 0.43023681640625, 0.448150634765625, 0.466064453125, 0.483978271484375, 0.50189208984375, 0.519805908203125, 0.5377197265625, 0.555633544921875, 0.57354736328125, 0.591461181640625, 0.609375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 19.0, 17.0, 27.0, 32.0, 36.0, 50.0, 53.0, 68.0, 84.0, 77.0, 84.0, 85.0, 71.0, 45.0, 57.0, 45.0, 32.0, 21.0, 21.0, 13.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.466853141784668, -11.204253196716309, -10.941654205322266, -10.679054260253906, -10.416454315185547, -10.153854370117188, -9.891255378723145, -9.628655433654785, -9.366056442260742, -9.103456497192383, -8.84085750579834, -8.57825756072998, -8.315657615661621, -8.053058624267578, -7.790458679199219, -7.527858734130859, -7.2652587890625, -7.002659320831299, -6.7400593757629395, -6.477459907531738, -6.214859962463379, -5.952260494232178, -5.689661026000977, -5.427061080932617, -5.164461612701416, -4.901862144470215, -4.6392621994018555, -4.376662731170654, -4.114063262939453, -3.8514633178710938, -3.5888638496398926, -3.3262641429901123, -3.0636649131774902, -2.80106520652771, -2.5384654998779297, -2.2758660316467285, -2.0132663249969482, -1.750666618347168, -1.4880670309066772, -1.2254674434661865, -0.9628677368164062, -0.7002680897712708, -0.43766844272613525, -0.17506879568099976, 0.08753085136413574, 0.350130558013916, 0.6127301454544067, 0.8753297328948975, 1.1379294395446777, 1.400529146194458, 1.6631287336349487, 1.9257283210754395, 2.1883280277252197, 2.450927734375, 2.713527202606201, 2.9761269092559814, 3.2387266159057617, 3.501326322555542, 3.7639260292053223, 4.026525497436523, 4.289125442504883, 4.551724910736084, 4.814324378967285, 5.0769243240356445, 5.339523792266846]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 6.0, 11.0, 7.0, 10.0, 9.0, 18.0, 16.0, 9.0, 19.0, 22.0, 23.0, 24.0, 34.0, 17.0, 30.0, 46.0, 38.0, 37.0, 27.0, 32.0, 40.0, 36.0, 34.0, 40.0, 37.0, 34.0, 35.0, 30.0, 34.0, 27.0, 22.0, 28.0, 20.0, 24.0, 27.0, 13.0, 15.0, 7.0, 9.0, 13.0, 7.0, 8.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0], "bins": [-3.6605007648468018, -3.561526298522949, -3.4625518321990967, -3.363577365875244, -3.2646028995513916, -3.165628433227539, -3.0666542053222656, -2.967679500579834, -2.8687052726745605, -2.769730806350708, -2.6707563400268555, -2.571781873703003, -2.4728074073791504, -2.373832941055298, -2.2748584747314453, -2.175884246826172, -2.0769095420837402, -1.9779350757598877, -1.8789606094360352, -1.7799861431121826, -1.68101167678833, -1.5820372104644775, -1.4830628633499146, -1.384088397026062, -1.2851139307022095, -1.186139464378357, -1.0871649980545044, -0.9881905913352966, -0.8892161250114441, -0.7902416586875916, -0.6912672519683838, -0.5922927856445312, -0.4933185577392578, -0.3943440914154053, -0.2953696548938751, -0.19639521837234497, -0.09742075204849243, 0.0015537142753601074, 0.10052812099456787, 0.1995025873184204, 0.29847705364227295, 0.3974515199661255, 0.49642595648765564, 0.5954003930091858, 0.6943748593330383, 0.7933493256568909, 0.8923237323760986, 0.9912981986999512, 1.0902726650238037, 1.1892471313476562, 1.2882215976715088, 1.3871960639953613, 1.4861705303192139, 1.5851449966430664, 1.6841193437576294, 1.783093810081482, 1.8820682764053345, 1.981042742729187, 2.08001708984375, 2.1789915561676025, 2.277966022491455, 2.3769404888153076, 2.47591495513916, 2.5748894214630127, 2.6738638877868652]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 10.0, 9.0, 15.0, 20.0, 41.0, 70.0, 89.0, 150.0, 205.0, 336.0, 542.0, 804.0, 1235.0, 1962.0, 2972.0, 4838.0, 7735.0, 12120.0, 19637.0, 30766.0, 47737.0, 72049.0, 102205.0, 131174.0, 145811.0, 136303.0, 107896.0, 77880.0, 52051.0, 33947.0, 21338.0, 13611.0, 8305.0, 5409.0, 3276.0, 2182.0, 1372.0, 853.0, 549.0, 373.0, 241.0, 145.0, 108.0, 55.0, 44.0, 28.0, 19.0, 18.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.134765625, -3.041473388671875, -2.94818115234375, -2.854888916015625, -2.7615966796875, -2.668304443359375, -2.57501220703125, -2.481719970703125, -2.388427734375, -2.295135498046875, -2.20184326171875, -2.108551025390625, -2.0152587890625, -1.921966552734375, -1.82867431640625, -1.735382080078125, -1.64208984375, -1.548797607421875, -1.45550537109375, -1.362213134765625, -1.2689208984375, -1.175628662109375, -1.08233642578125, -0.989044189453125, -0.895751953125, -0.802459716796875, -0.70916748046875, -0.615875244140625, -0.5225830078125, -0.429290771484375, -0.33599853515625, -0.242706298828125, -0.1494140625, -0.056121826171875, 0.03717041015625, 0.130462646484375, 0.2237548828125, 0.317047119140625, 0.41033935546875, 0.503631591796875, 0.596923828125, 0.690216064453125, 0.78350830078125, 0.876800537109375, 0.9700927734375, 1.063385009765625, 1.15667724609375, 1.249969482421875, 1.34326171875, 1.436553955078125, 1.52984619140625, 1.623138427734375, 1.7164306640625, 1.809722900390625, 1.90301513671875, 1.996307373046875, 2.089599609375, 2.182891845703125, 2.27618408203125, 2.369476318359375, 2.4627685546875, 2.556060791015625, 2.64935302734375, 2.742645263671875, 2.8359375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 8.0, 6.0, 10.0, 9.0, 18.0, 18.0, 12.0, 16.0, 24.0, 19.0, 25.0, 30.0, 34.0, 36.0, 32.0, 38.0, 52.0, 38.0, 41.0, 42.0, 37.0, 32.0, 40.0, 39.0, 39.0, 29.0, 35.0, 21.0, 30.0, 26.0, 32.0, 18.0, 24.0, 18.0, 13.0, 14.0, 10.0, 9.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.03125, -3.91534423828125, -3.7994384765625, -3.68353271484375, -3.567626953125, -3.45172119140625, -3.3358154296875, -3.21990966796875, -3.10400390625, -2.98809814453125, -2.8721923828125, -2.75628662109375, -2.640380859375, -2.52447509765625, -2.4085693359375, -2.29266357421875, -2.1767578125, -2.06085205078125, -1.9449462890625, -1.82904052734375, -1.713134765625, -1.59722900390625, -1.4813232421875, -1.36541748046875, -1.24951171875, -1.13360595703125, -1.0177001953125, -0.90179443359375, -0.785888671875, -0.66998291015625, -0.5540771484375, -0.43817138671875, -0.322265625, -0.20635986328125, -0.0904541015625, 0.02545166015625, 0.141357421875, 0.25726318359375, 0.3731689453125, 0.48907470703125, 0.60498046875, 0.72088623046875, 0.8367919921875, 0.95269775390625, 1.068603515625, 1.18450927734375, 1.3004150390625, 1.41632080078125, 1.5322265625, 1.64813232421875, 1.7640380859375, 1.87994384765625, 1.995849609375, 2.11175537109375, 2.2276611328125, 2.34356689453125, 2.45947265625, 2.57537841796875, 2.6912841796875, 2.80718994140625, 2.923095703125, 3.03900146484375, 3.1549072265625, 3.27081298828125, 3.38671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 6.0, 3.0, 12.0, 18.0, 19.0, 26.0, 61.0, 83.0, 98.0, 124.0, 254.0, 381.0, 624.0, 931.0, 1703.0, 2685.0, 4604.0, 8325.0, 14751.0, 26124.0, 46965.0, 80250.0, 126115.0, 168825.0, 179383.0, 147230.0, 99417.0, 60173.0, 34397.0, 19537.0, 10708.0, 5989.0, 3427.0, 2055.0, 1190.0, 730.0, 439.0, 311.0, 197.0, 131.0, 102.0, 50.0, 44.0, 22.0, 12.0, 7.0, 12.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.62890625, -3.50885009765625, -3.3887939453125, -3.26873779296875, -3.148681640625, -3.02862548828125, -2.9085693359375, -2.78851318359375, -2.66845703125, -2.54840087890625, -2.4283447265625, -2.30828857421875, -2.188232421875, -2.06817626953125, -1.9481201171875, -1.82806396484375, -1.7080078125, -1.58795166015625, -1.4678955078125, -1.34783935546875, -1.227783203125, -1.10772705078125, -0.9876708984375, -0.86761474609375, -0.74755859375, -0.62750244140625, -0.5074462890625, -0.38739013671875, -0.267333984375, -0.14727783203125, -0.0272216796875, 0.09283447265625, 0.212890625, 0.33294677734375, 0.4530029296875, 0.57305908203125, 0.693115234375, 0.81317138671875, 0.9332275390625, 1.05328369140625, 1.17333984375, 1.29339599609375, 1.4134521484375, 1.53350830078125, 1.653564453125, 1.77362060546875, 1.8936767578125, 2.01373291015625, 2.1337890625, 2.25384521484375, 2.3739013671875, 2.49395751953125, 2.614013671875, 2.73406982421875, 2.8541259765625, 2.97418212890625, 3.09423828125, 3.21429443359375, 3.3343505859375, 3.45440673828125, 3.574462890625, 3.69451904296875, 3.8145751953125, 3.93463134765625, 4.0546875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 9.0, 13.0, 19.0, 23.0, 11.0, 16.0, 27.0, 25.0, 33.0, 31.0, 29.0, 47.0, 30.0, 42.0, 41.0, 38.0, 40.0, 43.0, 34.0, 40.0, 36.0, 31.0, 35.0, 41.0, 26.0, 23.0, 38.0, 21.0, 20.0, 15.0, 17.0, 20.0, 17.0, 13.0, 6.0, 7.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.248046875, -2.1796875, -2.111328125, -2.04296875, -1.974609375, -1.90625, -1.837890625, -1.76953125, -1.701171875, -1.6328125, -1.564453125, -1.49609375, -1.427734375, -1.359375, -1.291015625, -1.22265625, -1.154296875, -1.0859375, -1.017578125, -0.94921875, -0.880859375, -0.8125, -0.744140625, -0.67578125, -0.607421875, -0.5390625, -0.470703125, -0.40234375, -0.333984375, -0.265625, -0.197265625, -0.12890625, -0.060546875, 0.0078125, 0.076171875, 0.14453125, 0.212890625, 0.28125, 0.349609375, 0.41796875, 0.486328125, 0.5546875, 0.623046875, 0.69140625, 0.759765625, 0.828125, 0.896484375, 0.96484375, 1.033203125, 1.1015625, 1.169921875, 1.23828125, 1.306640625, 1.375, 1.443359375, 1.51171875, 1.580078125, 1.6484375, 1.716796875, 1.78515625, 1.853515625, 1.921875, 1.990234375, 2.05859375, 2.126953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 14.0, 16.0, 20.0, 36.0, 53.0, 80.0, 85.0, 153.0, 244.0, 365.0, 548.0, 853.0, 1293.0, 1971.0, 3140.0, 5256.0, 8743.0, 14745.0, 26099.0, 45603.0, 80069.0, 132419.0, 186168.0, 192067.0, 142289.0, 87667.0, 49740.0, 28145.0, 15954.0, 9478.0, 5704.0, 3476.0, 2151.0, 1326.0, 886.0, 550.0, 372.0, 253.0, 167.0, 108.0, 82.0, 59.0, 35.0, 23.0, 20.0, 10.0, 3.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.01953125, -1.956573486328125, -1.89361572265625, -1.830657958984375, -1.7677001953125, -1.704742431640625, -1.64178466796875, -1.578826904296875, -1.515869140625, -1.452911376953125, -1.38995361328125, -1.326995849609375, -1.2640380859375, -1.201080322265625, -1.13812255859375, -1.075164794921875, -1.01220703125, -0.949249267578125, -0.88629150390625, -0.823333740234375, -0.7603759765625, -0.697418212890625, -0.63446044921875, -0.571502685546875, -0.508544921875, -0.445587158203125, -0.38262939453125, -0.319671630859375, -0.2567138671875, -0.193756103515625, -0.13079833984375, -0.067840576171875, -0.0048828125, 0.058074951171875, 0.12103271484375, 0.183990478515625, 0.2469482421875, 0.309906005859375, 0.37286376953125, 0.435821533203125, 0.498779296875, 0.561737060546875, 0.62469482421875, 0.687652587890625, 0.7506103515625, 0.813568115234375, 0.87652587890625, 0.939483642578125, 1.00244140625, 1.065399169921875, 1.12835693359375, 1.191314697265625, 1.2542724609375, 1.317230224609375, 1.38018798828125, 1.443145751953125, 1.506103515625, 1.569061279296875, 1.63201904296875, 1.694976806640625, 1.7579345703125, 1.820892333984375, 1.88385009765625, 1.946807861328125, 2.009765625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 11.0, 6.0, 12.0, 21.0, 15.0, 20.0, 15.0, 35.0, 25.0, 33.0, 46.0, 62.0, 59.0, 73.0, 56.0, 70.0, 66.0, 57.0, 54.0, 36.0, 39.0, 30.0, 29.0, 20.0, 20.0, 13.0, 8.0, 10.0, 4.0, 4.0, 6.0, 4.0, 1.0, 5.0, 0.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015461444854736328, -0.00014940090477466583, -0.00014418736100196838, -0.00013897381722927094, -0.00013376027345657349, -0.00012854672968387604, -0.0001233331859111786, -0.00011811964213848114, -0.00011290609836578369, -0.00010769255459308624, -0.0001024790108203888, -9.726546704769135e-05, -9.20519232749939e-05, -8.683837950229645e-05, -8.1624835729599e-05, -7.641129195690155e-05, -7.11977481842041e-05, -6.598420441150665e-05, -6.0770660638809204e-05, -5.5557116866111755e-05, -5.034357309341431e-05, -4.513002932071686e-05, -3.991648554801941e-05, -3.470294177532196e-05, -2.9489398002624512e-05, -2.4275854229927063e-05, -1.9062310457229614e-05, -1.3848766684532166e-05, -8.635222911834717e-06, -3.421679139137268e-06, 1.7918646335601807e-06, 7.005408406257629e-06, 1.2218952178955078e-05, 1.7432495951652527e-05, 2.2646039724349976e-05, 2.7859583497047424e-05, 3.307312726974487e-05, 3.828667104244232e-05, 4.350021481513977e-05, 4.871375858783722e-05, 5.392730236053467e-05, 5.914084613323212e-05, 6.435438990592957e-05, 6.956793367862701e-05, 7.478147745132446e-05, 7.999502122402191e-05, 8.520856499671936e-05, 9.042210876941681e-05, 9.563565254211426e-05, 0.0001008491963148117, 0.00010606274008750916, 0.0001112762838602066, 0.00011648982763290405, 0.0001217033714056015, 0.00012691691517829895, 0.0001321304589509964, 0.00013734400272369385, 0.0001425575464963913, 0.00014777109026908875, 0.0001529846340417862, 0.00015819817781448364, 0.0001634117215871811, 0.00016862526535987854, 0.000173838809132576, 0.00017905235290527344]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 10.0, 15.0, 25.0, 43.0, 54.0, 78.0, 143.0, 183.0, 289.0, 476.0, 656.0, 942.0, 1556.0, 2350.0, 3634.0, 5619.0, 9003.0, 14003.0, 23070.0, 37773.0, 61837.0, 96545.0, 139649.0, 168504.0, 157702.0, 118754.0, 78360.0, 48307.0, 29741.0, 17999.0, 11352.0, 6998.0, 4576.0, 2754.0, 1883.0, 1205.0, 806.0, 514.0, 388.0, 222.0, 173.0, 116.0, 84.0, 54.0, 26.0, 25.0, 19.0, 8.0, 4.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8056640625, -1.7505340576171875, -1.695404052734375, -1.6402740478515625, -1.58514404296875, -1.5300140380859375, -1.474884033203125, -1.4197540283203125, -1.3646240234375, -1.3094940185546875, -1.254364013671875, -1.1992340087890625, -1.14410400390625, -1.0889739990234375, -1.033843994140625, -0.9787139892578125, -0.923583984375, -0.8684539794921875, -0.813323974609375, -0.7581939697265625, -0.70306396484375, -0.6479339599609375, -0.592803955078125, -0.5376739501953125, -0.4825439453125, -0.4274139404296875, -0.372283935546875, -0.3171539306640625, -0.26202392578125, -0.2068939208984375, -0.151763916015625, -0.0966339111328125, -0.04150390625, 0.0136260986328125, 0.068756103515625, 0.1238861083984375, 0.17901611328125, 0.2341461181640625, 0.289276123046875, 0.3444061279296875, 0.3995361328125, 0.4546661376953125, 0.509796142578125, 0.5649261474609375, 0.62005615234375, 0.6751861572265625, 0.730316162109375, 0.7854461669921875, 0.840576171875, 0.8957061767578125, 0.950836181640625, 1.0059661865234375, 1.06109619140625, 1.1162261962890625, 1.171356201171875, 1.2264862060546875, 1.2816162109375, 1.3367462158203125, 1.391876220703125, 1.4470062255859375, 1.50213623046875, 1.5572662353515625, 1.612396240234375, 1.6675262451171875, 1.72265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 3.0, 7.0, 8.0, 4.0, 12.0, 13.0, 22.0, 13.0, 24.0, 21.0, 25.0, 29.0, 40.0, 39.0, 59.0, 40.0, 50.0, 54.0, 59.0, 55.0, 38.0, 45.0, 44.0, 52.0, 40.0, 35.0, 31.0, 26.0, 18.0, 11.0, 18.0, 7.0, 10.0, 7.0, 3.0, 7.0, 0.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54296875, -0.5252151489257812, -0.5074615478515625, -0.48970794677734375, -0.471954345703125, -0.45420074462890625, -0.4364471435546875, -0.41869354248046875, -0.40093994140625, -0.38318634033203125, -0.3654327392578125, -0.34767913818359375, -0.329925537109375, -0.31217193603515625, -0.2944183349609375, -0.27666473388671875, -0.2589111328125, -0.24115753173828125, -0.2234039306640625, -0.20565032958984375, -0.187896728515625, -0.17014312744140625, -0.1523895263671875, -0.13463592529296875, -0.11688232421875, -0.09912872314453125, -0.0813751220703125, -0.06362152099609375, -0.045867919921875, -0.02811431884765625, -0.0103607177734375, 0.00739288330078125, 0.025146484375, 0.04290008544921875, 0.0606536865234375, 0.07840728759765625, 0.096160888671875, 0.11391448974609375, 0.1316680908203125, 0.14942169189453125, 0.16717529296875, 0.18492889404296875, 0.2026824951171875, 0.22043609619140625, 0.238189697265625, 0.25594329833984375, 0.2736968994140625, 0.29145050048828125, 0.3092041015625, 0.32695770263671875, 0.3447113037109375, 0.36246490478515625, 0.380218505859375, 0.39797210693359375, 0.4157257080078125, 0.43347930908203125, 0.45123291015625, 0.46898651123046875, 0.4867401123046875, 0.5044937133789062, 0.522247314453125, 0.5400009155273438, 0.5577545166015625, 0.5755081176757812, 0.59326171875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 5.0, 10.0, 10.0, 14.0, 17.0, 24.0, 34.0, 45.0, 53.0, 55.0, 71.0, 69.0, 92.0, 76.0, 89.0, 56.0, 61.0, 44.0, 51.0, 38.0, 22.0, 18.0, 7.0, 8.0, 4.0, 8.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0], "bins": [-11.977826118469238, -11.709940910339355, -11.442055702209473, -11.17417049407959, -10.906285285949707, -10.638400077819824, -10.370514869689941, -10.102629661560059, -9.834744453430176, -9.566859245300293, -9.29897403717041, -9.031088829040527, -8.763203620910645, -8.495318412780762, -8.227433204650879, -7.959547996520996, -7.691662788391113, -7.4237775802612305, -7.155892372131348, -6.888007164001465, -6.620121955871582, -6.352236747741699, -6.084351539611816, -5.816466331481934, -5.548581123352051, -5.280695915222168, -5.012810707092285, -4.744925498962402, -4.4770402908325195, -4.209155082702637, -3.941269874572754, -3.673384666442871, -3.40549898147583, -3.1376137733459473, -2.8697285652160645, -2.6018433570861816, -2.333958148956299, -2.066072940826416, -1.7981877326965332, -1.5303025245666504, -1.2624173164367676, -0.9945321083068848, -0.726646900177002, -0.45876169204711914, -0.19087648391723633, 0.07700872421264648, 0.3448939323425293, 0.6127791404724121, 0.8806643486022949, 1.1485495567321777, 1.4164347648620605, 1.6843199729919434, 1.9522051811218262, 2.220090389251709, 2.487975597381592, 2.7558608055114746, 3.0237460136413574, 3.2916312217712402, 3.559516429901123, 3.827401638031006, 4.095286846160889, 4.3631720542907715, 4.631057262420654, 4.898942470550537, 5.16682767868042]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 5.0, 4.0, 3.0, 7.0, 7.0, 9.0, 11.0, 11.0, 9.0, 17.0, 22.0, 13.0, 22.0, 28.0, 20.0, 31.0, 30.0, 36.0, 38.0, 41.0, 38.0, 33.0, 35.0, 32.0, 33.0, 35.0, 40.0, 39.0, 37.0, 41.0, 31.0, 23.0, 28.0, 25.0, 24.0, 21.0, 25.0, 17.0, 12.0, 11.0, 10.0, 13.0, 12.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.248361110687256, -3.1510603427886963, -3.0537595748901367, -2.956458806991577, -2.8591580390930176, -2.761857032775879, -2.6645562648773193, -2.5672554969787598, -2.4699547290802, -2.3726539611816406, -2.275353193283081, -2.1780524253845215, -2.080751419067383, -1.9834507703781128, -1.8861498832702637, -1.788849115371704, -1.6915483474731445, -1.594247579574585, -1.4969468116760254, -1.3996459245681763, -1.3023451566696167, -1.2050443887710571, -1.107743501663208, -1.0104427337646484, -0.9131419658660889, -0.8158411979675293, -0.718540370464325, -0.6212395429611206, -0.523938775062561, -0.4266379773616791, -0.3293371796607971, -0.23203635215759277, -0.1347355842590332, -0.037434786558151245, 0.05986601114273071, 0.15716680884361267, 0.25446760654449463, 0.3517684042453766, 0.44906920194625854, 0.5463700294494629, 0.6436707973480225, 0.740971565246582, 0.8382723927497864, 0.9355732202529907, 1.0328739881515503, 1.1301747560501099, 1.227475643157959, 1.3247764110565186, 1.4220771789550781, 1.5193779468536377, 1.6166787147521973, 1.7139796018600464, 1.811280369758606, 1.9085811376571655, 2.0058820247650146, 2.103182792663574, 2.200483560562134, 2.2977843284606934, 2.395085096359253, 2.4923858642578125, 2.589686870574951, 2.6869876384735107, 2.7842884063720703, 2.88158917427063, 2.9788899421691895]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 15.0, 12.0, 20.0, 36.0, 56.0, 79.0, 112.0, 177.0, 240.0, 410.0, 651.0, 936.0, 1416.0, 2296.0, 3555.0, 5917.0, 9694.0, 16779.0, 31459.0, 62304.0, 138526.0, 351733.0, 897125.0, 1328063.0, 790685.0, 306923.0, 123185.0, 55775.0, 28404.0, 15143.0, 8743.0, 5183.0, 3133.0, 1970.0, 1197.0, 833.0, 551.0, 324.0, 226.0, 141.0, 102.0, 54.0, 37.0, 24.0, 12.0, 7.0, 6.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.23046875, -6.038330078125, -5.84619140625, -5.654052734375, -5.4619140625, -5.269775390625, -5.07763671875, -4.885498046875, -4.693359375, -4.501220703125, -4.30908203125, -4.116943359375, -3.9248046875, -3.732666015625, -3.54052734375, -3.348388671875, -3.15625, -2.964111328125, -2.77197265625, -2.579833984375, -2.3876953125, -2.195556640625, -2.00341796875, -1.811279296875, -1.619140625, -1.427001953125, -1.23486328125, -1.042724609375, -0.8505859375, -0.658447265625, -0.46630859375, -0.274169921875, -0.08203125, 0.110107421875, 0.30224609375, 0.494384765625, 0.6865234375, 0.878662109375, 1.07080078125, 1.262939453125, 1.455078125, 1.647216796875, 1.83935546875, 2.031494140625, 2.2236328125, 2.415771484375, 2.60791015625, 2.800048828125, 2.9921875, 3.184326171875, 3.37646484375, 3.568603515625, 3.7607421875, 3.952880859375, 4.14501953125, 4.337158203125, 4.529296875, 4.721435546875, 4.91357421875, 5.105712890625, 5.2978515625, 5.489990234375, 5.68212890625, 5.874267578125, 6.06640625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 4.0, 6.0, 10.0, 9.0, 9.0, 16.0, 23.0, 23.0, 19.0, 34.0, 30.0, 30.0, 34.0, 32.0, 40.0, 40.0, 36.0, 50.0, 45.0, 37.0, 44.0, 47.0, 39.0, 29.0, 31.0, 25.0, 33.0, 31.0, 26.0, 25.0, 17.0, 21.0, 21.0, 15.0, 13.0, 10.0, 5.0, 6.0, 5.0, 0.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-2.873046875, -2.79534912109375, -2.7176513671875, -2.63995361328125, -2.562255859375, -2.48455810546875, -2.4068603515625, -2.32916259765625, -2.25146484375, -2.17376708984375, -2.0960693359375, -2.01837158203125, -1.940673828125, -1.86297607421875, -1.7852783203125, -1.70758056640625, -1.6298828125, -1.55218505859375, -1.4744873046875, -1.39678955078125, -1.319091796875, -1.24139404296875, -1.1636962890625, -1.08599853515625, -1.00830078125, -0.93060302734375, -0.8529052734375, -0.77520751953125, -0.697509765625, -0.61981201171875, -0.5421142578125, -0.46441650390625, -0.38671875, -0.30902099609375, -0.2313232421875, -0.15362548828125, -0.075927734375, 0.00177001953125, 0.0794677734375, 0.15716552734375, 0.23486328125, 0.31256103515625, 0.3902587890625, 0.46795654296875, 0.545654296875, 0.62335205078125, 0.7010498046875, 0.77874755859375, 0.8564453125, 0.93414306640625, 1.0118408203125, 1.08953857421875, 1.167236328125, 1.24493408203125, 1.3226318359375, 1.40032958984375, 1.47802734375, 1.55572509765625, 1.6334228515625, 1.71112060546875, 1.788818359375, 1.86651611328125, 1.9442138671875, 2.02191162109375, 2.099609375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 9.0, 9.0, 9.0, 19.0, 25.0, 43.0, 48.0, 86.0, 108.0, 182.0, 278.0, 412.0, 652.0, 1140.0, 1884.0, 3304.0, 6004.0, 11249.0, 21944.0, 45933.0, 101393.0, 246739.0, 643707.0, 1357316.0, 1039397.0, 411963.0, 162183.0, 69929.0, 32781.0, 16270.0, 8441.0, 4640.0, 2492.0, 1407.0, 865.0, 495.0, 315.0, 213.0, 112.0, 74.0, 72.0, 51.0, 23.0, 21.0, 15.0, 3.0, 14.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.9010009765625, -6.669189453125, -6.4373779296875, -6.20556640625, -5.9737548828125, -5.741943359375, -5.5101318359375, -5.2783203125, -5.0465087890625, -4.814697265625, -4.5828857421875, -4.35107421875, -4.1192626953125, -3.887451171875, -3.6556396484375, -3.423828125, -3.1920166015625, -2.960205078125, -2.7283935546875, -2.49658203125, -2.2647705078125, -2.032958984375, -1.8011474609375, -1.5693359375, -1.3375244140625, -1.105712890625, -0.8739013671875, -0.64208984375, -0.4102783203125, -0.178466796875, 0.0533447265625, 0.28515625, 0.5169677734375, 0.748779296875, 0.9805908203125, 1.21240234375, 1.4442138671875, 1.676025390625, 1.9078369140625, 2.1396484375, 2.3714599609375, 2.603271484375, 2.8350830078125, 3.06689453125, 3.2987060546875, 3.530517578125, 3.7623291015625, 3.994140625, 4.2259521484375, 4.457763671875, 4.6895751953125, 4.92138671875, 5.1531982421875, 5.385009765625, 5.6168212890625, 5.8486328125, 6.0804443359375, 6.312255859375, 6.5440673828125, 6.77587890625, 7.0076904296875, 7.239501953125, 7.4713134765625, 7.703125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 4.0, 5.0, 11.0, 18.0, 20.0, 27.0, 36.0, 47.0, 63.0, 67.0, 97.0, 118.0, 149.0, 172.0, 233.0, 264.0, 333.0, 308.0, 358.0, 289.0, 328.0, 242.0, 191.0, 143.0, 127.0, 77.0, 80.0, 60.0, 46.0, 37.0, 26.0, 21.0, 13.0, 11.0, 11.0, 11.0, 5.0, 7.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8330078125, -1.774169921875, -1.71533203125, -1.656494140625, -1.59765625, -1.538818359375, -1.47998046875, -1.421142578125, -1.3623046875, -1.303466796875, -1.24462890625, -1.185791015625, -1.126953125, -1.068115234375, -1.00927734375, -0.950439453125, -0.8916015625, -0.832763671875, -0.77392578125, -0.715087890625, -0.65625, -0.597412109375, -0.53857421875, -0.479736328125, -0.4208984375, -0.362060546875, -0.30322265625, -0.244384765625, -0.185546875, -0.126708984375, -0.06787109375, -0.009033203125, 0.0498046875, 0.108642578125, 0.16748046875, 0.226318359375, 0.28515625, 0.343994140625, 0.40283203125, 0.461669921875, 0.5205078125, 0.579345703125, 0.63818359375, 0.697021484375, 0.755859375, 0.814697265625, 0.87353515625, 0.932373046875, 0.9912109375, 1.050048828125, 1.10888671875, 1.167724609375, 1.2265625, 1.285400390625, 1.34423828125, 1.403076171875, 1.4619140625, 1.520751953125, 1.57958984375, 1.638427734375, 1.697265625, 1.756103515625, 1.81494140625, 1.873779296875, 1.9326171875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 23.0, 31.0, 43.0, 59.0, 79.0, 94.0, 99.0, 109.0, 98.0, 91.0, 73.0, 52.0, 32.0, 33.0, 19.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-16.24724769592285, -15.90961742401123, -15.571986198425293, -15.234355926513672, -14.89672565460205, -14.55909538269043, -14.221464157104492, -13.883833885192871, -13.54620361328125, -13.208573341369629, -12.870942115783691, -12.53331184387207, -12.19568157196045, -11.858051300048828, -11.52042007446289, -11.18278980255127, -10.845159530639648, -10.507529258728027, -10.16989803314209, -9.832267761230469, -9.494637489318848, -9.157007217407227, -8.819375991821289, -8.481745719909668, -8.14411449432373, -7.806483745574951, -7.46885347366333, -7.131222724914551, -6.79359245300293, -6.45596170425415, -6.118330955505371, -5.78070068359375, -5.443070411682129, -5.10543966293335, -4.7678093910217285, -4.430178642272949, -4.092548370361328, -3.754917621612549, -3.4172871112823486, -3.0796566009521484, -2.7420260906219482, -2.404395580291748, -2.066765069961548, -1.729134440422058, -1.391503930091858, -1.0538734197616577, -0.716242790222168, -0.3786122798919678, -0.04098176956176758, 0.296648770570755, 0.6342793107032776, 0.9719098806381226, 1.3095403909683228, 1.647170901298523, 1.9848015308380127, 2.322432041168213, 2.660062551498413, 2.9976930618286133, 3.3353235721588135, 3.6729540824890137, 4.010584831237793, 4.348215103149414, 4.685845851898193, 5.023476600646973, 5.361106872558594]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 18.0, 5.0, 11.0, 14.0, 18.0, 14.0, 21.0, 23.0, 32.0, 23.0, 30.0, 31.0, 46.0, 39.0, 40.0, 43.0, 49.0, 31.0, 36.0, 42.0, 47.0, 43.0, 43.0, 38.0, 43.0, 29.0, 29.0, 21.0, 22.0, 25.0, 18.0, 11.0, 9.0, 14.0, 9.0, 7.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.53413724899292, -3.4264910221099854, -3.318844795227051, -3.211198329925537, -3.1035521030426025, -2.995905876159668, -2.8882596492767334, -2.780613422393799, -2.672966957092285, -2.5653207302093506, -2.457674503326416, -2.3500280380249023, -2.2423818111419678, -2.134735584259033, -2.0270893573760986, -1.919443130493164, -1.8117969036102295, -1.704150676727295, -1.5965043306350708, -1.4888581037521362, -1.381211757659912, -1.2735655307769775, -1.165919303894043, -1.0582730770111084, -0.9506267309188843, -0.8429804444313049, -0.7353341579437256, -0.627687931060791, -0.5200416445732117, -0.4123953580856323, -0.30474913120269775, -0.1971028447151184, -0.08945631980895996, 0.01818995177745819, 0.12583622336387634, 0.2334824800491333, 0.34112876653671265, 0.448775053024292, 0.5564212799072266, 0.6640675663948059, 0.7717138528823853, 0.8793601393699646, 0.987006425857544, 1.0946526527404785, 1.202298879623413, 1.3099452257156372, 1.4175914525985718, 1.525237798690796, 1.6328840255737305, 1.740530252456665, 1.8481765985488892, 1.9558228254318237, 2.063469171524048, 2.1711153984069824, 2.278761625289917, 2.3864078521728516, 2.4940543174743652, 2.6017005443573, 2.7093467712402344, 2.816993236541748, 2.9246394634246826, 3.032285690307617, 3.1399319171905518, 3.2475781440734863, 3.355224370956421]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 6.0, 11.0, 7.0, 18.0, 17.0, 33.0, 28.0, 49.0, 62.0, 94.0, 110.0, 170.0, 229.0, 368.0, 555.0, 844.0, 1390.0, 2547.0, 4944.0, 11641.0, 31167.0, 93130.0, 265344.0, 368857.0, 174081.0, 56532.0, 19768.0, 7764.0, 3635.0, 1929.0, 1061.0, 672.0, 449.0, 291.0, 203.0, 159.0, 127.0, 71.0, 41.0, 38.0, 28.0, 27.0, 11.0, 12.0, 6.0, 8.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.15625, -4.9859619140625, -4.815673828125, -4.6453857421875, -4.47509765625, -4.3048095703125, -4.134521484375, -3.9642333984375, -3.7939453125, -3.6236572265625, -3.453369140625, -3.2830810546875, -3.11279296875, -2.9425048828125, -2.772216796875, -2.6019287109375, -2.431640625, -2.2613525390625, -2.091064453125, -1.9207763671875, -1.75048828125, -1.5802001953125, -1.409912109375, -1.2396240234375, -1.0693359375, -0.8990478515625, -0.728759765625, -0.5584716796875, -0.38818359375, -0.2178955078125, -0.047607421875, 0.1226806640625, 0.29296875, 0.4632568359375, 0.633544921875, 0.8038330078125, 0.97412109375, 1.1444091796875, 1.314697265625, 1.4849853515625, 1.6552734375, 1.8255615234375, 1.995849609375, 2.1661376953125, 2.33642578125, 2.5067138671875, 2.677001953125, 2.8472900390625, 3.017578125, 3.1878662109375, 3.358154296875, 3.5284423828125, 3.69873046875, 3.8690185546875, 4.039306640625, 4.2095947265625, 4.3798828125, 4.5501708984375, 4.720458984375, 4.8907470703125, 5.06103515625, 5.2313232421875, 5.401611328125, 5.5718994140625, 5.7421875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 2.0, 6.0, 15.0, 7.0, 15.0, 16.0, 24.0, 15.0, 31.0, 26.0, 29.0, 37.0, 41.0, 49.0, 49.0, 39.0, 50.0, 43.0, 34.0, 47.0, 52.0, 43.0, 35.0, 44.0, 33.0, 25.0, 33.0, 18.0, 25.0, 17.0, 21.0, 19.0, 16.0, 4.0, 8.0, 5.0, 5.0, 8.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.56463623046875, -3.4417724609375, -3.31890869140625, -3.196044921875, -3.07318115234375, -2.9503173828125, -2.82745361328125, -2.70458984375, -2.58172607421875, -2.4588623046875, -2.33599853515625, -2.213134765625, -2.09027099609375, -1.9674072265625, -1.84454345703125, -1.7216796875, -1.59881591796875, -1.4759521484375, -1.35308837890625, -1.230224609375, -1.10736083984375, -0.9844970703125, -0.86163330078125, -0.73876953125, -0.61590576171875, -0.4930419921875, -0.37017822265625, -0.247314453125, -0.12445068359375, -0.0015869140625, 0.12127685546875, 0.244140625, 0.36700439453125, 0.4898681640625, 0.61273193359375, 0.735595703125, 0.85845947265625, 0.9813232421875, 1.10418701171875, 1.22705078125, 1.34991455078125, 1.4727783203125, 1.59564208984375, 1.718505859375, 1.84136962890625, 1.9642333984375, 2.08709716796875, 2.2099609375, 2.33282470703125, 2.4556884765625, 2.57855224609375, 2.701416015625, 2.82427978515625, 2.9471435546875, 3.07000732421875, 3.19287109375, 3.31573486328125, 3.4385986328125, 3.56146240234375, 3.684326171875, 3.80718994140625, 3.9300537109375, 4.05291748046875, 4.17578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 7.0, 18.0, 14.0, 20.0, 29.0, 71.0, 71.0, 123.0, 164.0, 271.0, 411.0, 709.0, 1210.0, 2190.0, 4886.0, 12545.0, 37951.0, 141016.0, 420679.0, 301290.0, 84436.0, 24547.0, 8181.0, 3448.0, 1696.0, 906.0, 573.0, 367.0, 238.0, 143.0, 109.0, 81.0, 44.0, 27.0, 20.0, 11.0, 10.0, 7.0, 3.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.4517822265625, -6.227783203125, -6.0037841796875, -5.77978515625, -5.5557861328125, -5.331787109375, -5.1077880859375, -4.8837890625, -4.6597900390625, -4.435791015625, -4.2117919921875, -3.98779296875, -3.7637939453125, -3.539794921875, -3.3157958984375, -3.091796875, -2.8677978515625, -2.643798828125, -2.4197998046875, -2.19580078125, -1.9718017578125, -1.747802734375, -1.5238037109375, -1.2998046875, -1.0758056640625, -0.851806640625, -0.6278076171875, -0.40380859375, -0.1798095703125, 0.044189453125, 0.2681884765625, 0.4921875, 0.7161865234375, 0.940185546875, 1.1641845703125, 1.38818359375, 1.6121826171875, 1.836181640625, 2.0601806640625, 2.2841796875, 2.5081787109375, 2.732177734375, 2.9561767578125, 3.18017578125, 3.4041748046875, 3.628173828125, 3.8521728515625, 4.076171875, 4.3001708984375, 4.524169921875, 4.7481689453125, 4.97216796875, 5.1961669921875, 5.420166015625, 5.6441650390625, 5.8681640625, 6.0921630859375, 6.316162109375, 6.5401611328125, 6.76416015625, 6.9881591796875, 7.212158203125, 7.4361572265625, 7.66015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 10.0, 11.0, 15.0, 17.0, 20.0, 28.0, 18.0, 28.0, 28.0, 41.0, 31.0, 33.0, 50.0, 38.0, 48.0, 50.0, 52.0, 38.0, 48.0, 28.0, 46.0, 33.0, 26.0, 38.0, 24.0, 37.0, 20.0, 26.0, 22.0, 9.0, 16.0, 9.0, 9.0, 6.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.204193115234375, -2.13299560546875, -2.061798095703125, -1.9906005859375, -1.919403076171875, -1.84820556640625, -1.777008056640625, -1.705810546875, -1.634613037109375, -1.56341552734375, -1.492218017578125, -1.4210205078125, -1.349822998046875, -1.27862548828125, -1.207427978515625, -1.13623046875, -1.065032958984375, -0.99383544921875, -0.922637939453125, -0.8514404296875, -0.780242919921875, -0.70904541015625, -0.637847900390625, -0.566650390625, -0.495452880859375, -0.42425537109375, -0.353057861328125, -0.2818603515625, -0.210662841796875, -0.13946533203125, -0.068267822265625, 0.0029296875, 0.074127197265625, 0.14532470703125, 0.216522216796875, 0.2877197265625, 0.358917236328125, 0.43011474609375, 0.501312255859375, 0.572509765625, 0.643707275390625, 0.71490478515625, 0.786102294921875, 0.8572998046875, 0.928497314453125, 0.99969482421875, 1.070892333984375, 1.14208984375, 1.213287353515625, 1.28448486328125, 1.355682373046875, 1.4268798828125, 1.498077392578125, 1.56927490234375, 1.640472412109375, 1.711669921875, 1.782867431640625, 1.85406494140625, 1.925262451171875, 1.9964599609375, 2.067657470703125, 2.13885498046875, 2.210052490234375, 2.28125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 9.0, 10.0, 17.0, 22.0, 38.0, 54.0, 81.0, 96.0, 149.0, 186.0, 294.0, 483.0, 658.0, 1117.0, 1764.0, 2720.0, 4537.0, 7839.0, 13872.0, 26914.0, 56676.0, 123716.0, 259729.0, 278054.0, 139667.0, 62689.0, 30155.0, 15363.0, 8589.0, 4815.0, 3002.0, 1855.0, 1124.0, 699.0, 523.0, 320.0, 221.0, 144.0, 100.0, 71.0, 57.0, 31.0, 24.0, 22.0, 15.0, 11.0, 6.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.805206298828125, -1.74517822265625, -1.685150146484375, -1.6251220703125, -1.565093994140625, -1.50506591796875, -1.445037841796875, -1.385009765625, -1.324981689453125, -1.26495361328125, -1.204925537109375, -1.1448974609375, -1.084869384765625, -1.02484130859375, -0.964813232421875, -0.90478515625, -0.844757080078125, -0.78472900390625, -0.724700927734375, -0.6646728515625, -0.604644775390625, -0.54461669921875, -0.484588623046875, -0.424560546875, -0.364532470703125, -0.30450439453125, -0.244476318359375, -0.1844482421875, -0.124420166015625, -0.06439208984375, -0.004364013671875, 0.0556640625, 0.115692138671875, 0.17572021484375, 0.235748291015625, 0.2957763671875, 0.355804443359375, 0.41583251953125, 0.475860595703125, 0.535888671875, 0.595916748046875, 0.65594482421875, 0.715972900390625, 0.7760009765625, 0.836029052734375, 0.89605712890625, 0.956085205078125, 1.01611328125, 1.076141357421875, 1.13616943359375, 1.196197509765625, 1.2562255859375, 1.316253662109375, 1.37628173828125, 1.436309814453125, 1.496337890625, 1.556365966796875, 1.61639404296875, 1.676422119140625, 1.7364501953125, 1.796478271484375, 1.85650634765625, 1.916534423828125, 1.9765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 9.0, 13.0, 22.0, 12.0, 44.0, 51.0, 85.0, 126.0, 125.0, 138.0, 109.0, 80.0, 52.0, 34.0, 18.0, 16.0, 13.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014209747314453125, -0.00013664178550243378, -0.0001311860978603363, -0.00012573041021823883, -0.00012027472257614136, -0.00011481903493404388, -0.00010936334729194641, -0.00010390765964984894, -9.845197200775146e-05, -9.299628436565399e-05, -8.754059672355652e-05, -8.208490908145905e-05, -7.662922143936157e-05, -7.11735337972641e-05, -6.571784615516663e-05, -6.026215851306915e-05, -5.480647087097168e-05, -4.9350783228874207e-05, -4.3895095586776733e-05, -3.843940794467926e-05, -3.298372030258179e-05, -2.7528032660484314e-05, -2.207234501838684e-05, -1.6616657376289368e-05, -1.1160969734191895e-05, -5.705282092094421e-06, -2.4959444999694824e-07, 5.206093192100525e-06, 1.0661780834197998e-05, 1.611746847629547e-05, 2.1573156118392944e-05, 2.7028843760490417e-05, 3.248453140258789e-05, 3.7940219044685364e-05, 4.339590668678284e-05, 4.885159432888031e-05, 5.430728197097778e-05, 5.9762969613075256e-05, 6.521865725517273e-05, 7.06743448972702e-05, 7.613003253936768e-05, 8.158572018146515e-05, 8.704140782356262e-05, 9.24970954656601e-05, 9.795278310775757e-05, 0.00010340847074985504, 0.00010886415839195251, 0.00011431984603404999, 0.00011977553367614746, 0.00012523122131824493, 0.0001306869089603424, 0.00013614259660243988, 0.00014159828424453735, 0.00014705397188663483, 0.0001525096595287323, 0.00015796534717082977, 0.00016342103481292725, 0.00016887672245502472, 0.0001743324100971222, 0.00017978809773921967, 0.00018524378538131714, 0.0001906994730234146, 0.00019615516066551208, 0.00020161084830760956, 0.00020706653594970703]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 10.0, 14.0, 17.0, 23.0, 42.0, 53.0, 93.0, 126.0, 162.0, 280.0, 354.0, 616.0, 925.0, 1400.0, 2241.0, 3558.0, 6031.0, 10549.0, 18927.0, 35148.0, 69503.0, 136819.0, 228302.0, 232155.0, 143547.0, 73611.0, 36735.0, 19548.0, 10920.0, 6429.0, 3826.0, 2369.0, 1449.0, 926.0, 650.0, 385.0, 246.0, 190.0, 111.0, 82.0, 56.0, 37.0, 33.0, 18.0, 13.0, 8.0, 3.0, 1.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.65625, -1.6075897216796875, -1.558929443359375, -1.5102691650390625, -1.46160888671875, -1.4129486083984375, -1.364288330078125, -1.3156280517578125, -1.2669677734375, -1.2183074951171875, -1.169647216796875, -1.1209869384765625, -1.07232666015625, -1.0236663818359375, -0.975006103515625, -0.9263458251953125, -0.877685546875, -0.8290252685546875, -0.780364990234375, -0.7317047119140625, -0.68304443359375, -0.6343841552734375, -0.585723876953125, -0.5370635986328125, -0.4884033203125, -0.4397430419921875, -0.391082763671875, -0.3424224853515625, -0.29376220703125, -0.2451019287109375, -0.196441650390625, -0.1477813720703125, -0.09912109375, -0.0504608154296875, -0.001800537109375, 0.0468597412109375, 0.09552001953125, 0.1441802978515625, 0.192840576171875, 0.2415008544921875, 0.2901611328125, 0.3388214111328125, 0.387481689453125, 0.4361419677734375, 0.48480224609375, 0.5334625244140625, 0.582122802734375, 0.6307830810546875, 0.679443359375, 0.7281036376953125, 0.776763916015625, 0.8254241943359375, 0.87408447265625, 0.9227447509765625, 0.971405029296875, 1.0200653076171875, 1.0687255859375, 1.1173858642578125, 1.166046142578125, 1.2147064208984375, 1.26336669921875, 1.3120269775390625, 1.360687255859375, 1.4093475341796875, 1.4580078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 10.0, 10.0, 10.0, 11.0, 20.0, 21.0, 31.0, 53.0, 43.0, 83.0, 78.0, 108.0, 123.0, 89.0, 74.0, 65.0, 48.0, 40.0, 34.0, 16.0, 19.0, 2.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63525390625, -0.6155776977539062, -0.5959014892578125, -0.5762252807617188, -0.556549072265625, -0.5368728637695312, -0.5171966552734375, -0.49752044677734375, -0.47784423828125, -0.45816802978515625, -0.4384918212890625, -0.41881561279296875, -0.399139404296875, -0.37946319580078125, -0.3597869873046875, -0.34011077880859375, -0.3204345703125, -0.30075836181640625, -0.2810821533203125, -0.26140594482421875, -0.241729736328125, -0.22205352783203125, -0.2023773193359375, -0.18270111083984375, -0.16302490234375, -0.14334869384765625, -0.1236724853515625, -0.10399627685546875, -0.084320068359375, -0.06464385986328125, -0.0449676513671875, -0.02529144287109375, -0.005615234375, 0.01406097412109375, 0.0337371826171875, 0.05341339111328125, 0.073089599609375, 0.09276580810546875, 0.1124420166015625, 0.13211822509765625, 0.15179443359375, 0.17147064208984375, 0.1911468505859375, 0.21082305908203125, 0.230499267578125, 0.25017547607421875, 0.2698516845703125, 0.28952789306640625, 0.3092041015625, 0.32888031005859375, 0.3485565185546875, 0.36823272705078125, 0.387908935546875, 0.40758514404296875, 0.4272613525390625, 0.44693756103515625, 0.46661376953125, 0.48628997802734375, 0.5059661865234375, 0.5256423950195312, 0.545318603515625, 0.5649948120117188, 0.5846710205078125, 0.6043472290039062, 0.6240234375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 11.0, 16.0, 25.0, 30.0, 43.0, 67.0, 75.0, 87.0, 103.0, 113.0, 90.0, 101.0, 66.0, 47.0, 23.0, 29.0, 21.0, 14.0, 8.0, 6.0, 6.0, 4.0, 0.0, 2.0], "bins": [-15.971409797668457, -15.644852638244629, -15.318296432495117, -14.991739273071289, -14.665182113647461, -14.338624954223633, -14.012068748474121, -13.685511589050293, -13.358954429626465, -13.032397270202637, -12.705841064453125, -12.379283905029297, -12.052726745605469, -11.72616958618164, -11.399613380432129, -11.0730562210083, -10.746500015258789, -10.419942855834961, -10.09338665008545, -9.766829490661621, -9.440272331237793, -9.113715171813965, -8.787158966064453, -8.460601806640625, -8.134044647216797, -7.807487964630127, -7.480930805206299, -7.154374122619629, -6.827816963195801, -6.501260280609131, -6.174703598022461, -5.848146438598633, -5.5215888023376465, -5.195032119750977, -4.868474960327148, -4.5419182777404785, -4.21536111831665, -3.8888044357299805, -3.5622475147247314, -3.2356905937194824, -2.9091336727142334, -2.5825767517089844, -2.2560198307037354, -1.9294630289077759, -1.6029061079025269, -1.2763491868972778, -0.9497923851013184, -0.6232354640960693, -0.2966785430908203, 0.029878348112106323, 0.35643523931503296, 0.6829921007156372, 1.0095490217208862, 1.3361059427261353, 1.6626627445220947, 1.9892196655273438, 2.3157765865325928, 2.642333507537842, 2.968890428543091, 3.29544734954834, 3.6220040321350098, 3.948561191558838, 4.275117874145508, 4.601675033569336, 4.928231716156006]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 10.0, 12.0, 7.0, 15.0, 19.0, 14.0, 24.0, 24.0, 27.0, 25.0, 24.0, 43.0, 42.0, 37.0, 42.0, 51.0, 42.0, 29.0, 36.0, 44.0, 40.0, 57.0, 31.0, 45.0, 38.0, 33.0, 20.0, 22.0, 24.0, 24.0, 19.0, 9.0, 11.0, 14.0, 8.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.4932479858398438, -3.386782169342041, -3.2803165912628174, -3.1738507747650146, -3.067385196685791, -2.9609193801879883, -2.8544535636901855, -2.747987747192383, -2.641522169113159, -2.5350563526153564, -2.428590774536133, -2.32212495803833, -2.2156591415405273, -2.1091935634613037, -2.002727746963501, -1.8962620496749878, -1.7897963523864746, -1.6833306550979614, -1.5768649578094482, -1.4703991413116455, -1.3639334440231323, -1.2574677467346191, -1.1510019302368164, -1.0445362329483032, -0.93807053565979, -0.8316048383712769, -0.7251390814781189, -0.6186733245849609, -0.5122076272964478, -0.40574193000793457, -0.2992761731147766, -0.19281041622161865, -0.08634471893310547, 0.020121008157730103, 0.12658673524856567, 0.23305246233940125, 0.3395181894302368, 0.44598388671875, 0.552449643611908, 0.6589154005050659, 0.7653810977935791, 0.8718467950820923, 0.9783125519752502, 1.0847783088684082, 1.1912440061569214, 1.2977097034454346, 1.4041755199432373, 1.5106412172317505, 1.6171069145202637, 1.7235726118087769, 1.83003830909729, 1.9365041255950928, 2.0429697036743164, 2.149435520172119, 2.255901336669922, 2.3623671531677246, 2.4688327312469482, 2.575298547744751, 2.6817641258239746, 2.7882299423217773, 2.89469575881958, 3.0011613368988037, 3.1076271533966064, 3.21409273147583, 3.320558547973633]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 7.0, 7.0, 13.0, 11.0, 25.0, 31.0, 42.0, 70.0, 93.0, 139.0, 266.0, 414.0, 741.0, 1412.0, 2700.0, 5752.0, 12439.0, 27864.0, 64168.0, 137252.0, 235085.0, 251486.0, 163850.0, 79615.0, 35376.0, 15490.0, 7007.0, 3343.0, 1711.0, 881.0, 516.0, 301.0, 174.0, 98.0, 58.0, 38.0, 26.0, 23.0, 10.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.77557373046875, -4.6058349609375, -4.43609619140625, -4.266357421875, -4.09661865234375, -3.9268798828125, -3.75714111328125, -3.58740234375, -3.41766357421875, -3.2479248046875, -3.07818603515625, -2.908447265625, -2.73870849609375, -2.5689697265625, -2.39923095703125, -2.2294921875, -2.05975341796875, -1.8900146484375, -1.72027587890625, -1.550537109375, -1.38079833984375, -1.2110595703125, -1.04132080078125, -0.87158203125, -0.70184326171875, -0.5321044921875, -0.36236572265625, -0.192626953125, -0.02288818359375, 0.1468505859375, 0.31658935546875, 0.486328125, 0.65606689453125, 0.8258056640625, 0.99554443359375, 1.165283203125, 1.33502197265625, 1.5047607421875, 1.67449951171875, 1.84423828125, 2.01397705078125, 2.1837158203125, 2.35345458984375, 2.523193359375, 2.69293212890625, 2.8626708984375, 3.03240966796875, 3.2021484375, 3.37188720703125, 3.5416259765625, 3.71136474609375, 3.881103515625, 4.05084228515625, 4.2205810546875, 4.39031982421875, 4.56005859375, 4.72979736328125, 4.8995361328125, 5.06927490234375, 5.239013671875, 5.40875244140625, 5.5784912109375, 5.74822998046875, 5.91796875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 10.0, 15.0, 18.0, 17.0, 16.0, 16.0, 19.0, 24.0, 24.0, 30.0, 38.0, 46.0, 34.0, 45.0, 49.0, 39.0, 47.0, 36.0, 49.0, 44.0, 32.0, 42.0, 39.0, 37.0, 30.0, 27.0, 20.0, 27.0, 24.0, 22.0, 10.0, 16.0, 12.0, 10.0, 7.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.861328125, -3.745452880859375, -3.62957763671875, -3.513702392578125, -3.3978271484375, -3.281951904296875, -3.16607666015625, -3.050201416015625, -2.934326171875, -2.818450927734375, -2.70257568359375, -2.586700439453125, -2.4708251953125, -2.354949951171875, -2.23907470703125, -2.123199462890625, -2.00732421875, -1.891448974609375, -1.77557373046875, -1.659698486328125, -1.5438232421875, -1.427947998046875, -1.31207275390625, -1.196197509765625, -1.080322265625, -0.964447021484375, -0.84857177734375, -0.732696533203125, -0.6168212890625, -0.500946044921875, -0.38507080078125, -0.269195556640625, -0.1533203125, -0.037445068359375, 0.07843017578125, 0.194305419921875, 0.3101806640625, 0.426055908203125, 0.54193115234375, 0.657806396484375, 0.773681640625, 0.889556884765625, 1.00543212890625, 1.121307373046875, 1.2371826171875, 1.353057861328125, 1.46893310546875, 1.584808349609375, 1.70068359375, 1.816558837890625, 1.93243408203125, 2.048309326171875, 2.1641845703125, 2.280059814453125, 2.39593505859375, 2.511810302734375, 2.627685546875, 2.743560791015625, 2.85943603515625, 2.975311279296875, 3.0911865234375, 3.207061767578125, 3.32293701171875, 3.438812255859375, 3.5546875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 9.0, 10.0, 18.0, 37.0, 37.0, 54.0, 78.0, 106.0, 161.0, 210.0, 355.0, 509.0, 890.0, 1511.0, 2751.0, 5429.0, 10957.0, 23266.0, 50585.0, 105487.0, 189042.0, 241459.0, 197092.0, 113818.0, 54941.0, 25144.0, 11865.0, 5656.0, 2907.0, 1569.0, 936.0, 548.0, 334.0, 257.0, 167.0, 106.0, 62.0, 54.0, 31.0, 35.0, 12.0, 14.0, 16.0, 13.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.66253662109375, -4.5047607421875, -4.34698486328125, -4.189208984375, -4.03143310546875, -3.8736572265625, -3.71588134765625, -3.55810546875, -3.40032958984375, -3.2425537109375, -3.08477783203125, -2.927001953125, -2.76922607421875, -2.6114501953125, -2.45367431640625, -2.2958984375, -2.13812255859375, -1.9803466796875, -1.82257080078125, -1.664794921875, -1.50701904296875, -1.3492431640625, -1.19146728515625, -1.03369140625, -0.87591552734375, -0.7181396484375, -0.56036376953125, -0.402587890625, -0.24481201171875, -0.0870361328125, 0.07073974609375, 0.228515625, 0.38629150390625, 0.5440673828125, 0.70184326171875, 0.859619140625, 1.01739501953125, 1.1751708984375, 1.33294677734375, 1.49072265625, 1.64849853515625, 1.8062744140625, 1.96405029296875, 2.121826171875, 2.27960205078125, 2.4373779296875, 2.59515380859375, 2.7529296875, 2.91070556640625, 3.0684814453125, 3.22625732421875, 3.384033203125, 3.54180908203125, 3.6995849609375, 3.85736083984375, 4.01513671875, 4.17291259765625, 4.3306884765625, 4.48846435546875, 4.646240234375, 4.80401611328125, 4.9617919921875, 5.11956787109375, 5.27734375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 7.0, 7.0, 8.0, 5.0, 14.0, 12.0, 14.0, 14.0, 14.0, 27.0, 25.0, 25.0, 18.0, 42.0, 35.0, 47.0, 34.0, 55.0, 44.0, 42.0, 36.0, 55.0, 42.0, 39.0, 35.0, 48.0, 33.0, 33.0, 31.0, 21.0, 25.0, 21.0, 23.0, 15.0, 14.0, 7.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.05645751953125, -1.9879150390625, -1.91937255859375, -1.850830078125, -1.78228759765625, -1.7137451171875, -1.64520263671875, -1.57666015625, -1.50811767578125, -1.4395751953125, -1.37103271484375, -1.302490234375, -1.23394775390625, -1.1654052734375, -1.09686279296875, -1.0283203125, -0.95977783203125, -0.8912353515625, -0.82269287109375, -0.754150390625, -0.68560791015625, -0.6170654296875, -0.54852294921875, -0.47998046875, -0.41143798828125, -0.3428955078125, -0.27435302734375, -0.205810546875, -0.13726806640625, -0.0687255859375, -0.00018310546875, 0.068359375, 0.13690185546875, 0.2054443359375, 0.27398681640625, 0.342529296875, 0.41107177734375, 0.4796142578125, 0.54815673828125, 0.61669921875, 0.68524169921875, 0.7537841796875, 0.82232666015625, 0.890869140625, 0.95941162109375, 1.0279541015625, 1.09649658203125, 1.1650390625, 1.23358154296875, 1.3021240234375, 1.37066650390625, 1.439208984375, 1.50775146484375, 1.5762939453125, 1.64483642578125, 1.71337890625, 1.78192138671875, 1.8504638671875, 1.91900634765625, 1.987548828125, 2.05609130859375, 2.1246337890625, 2.19317626953125, 2.26171875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 6.0, 14.0, 18.0, 29.0, 34.0, 69.0, 100.0, 152.0, 207.0, 311.0, 424.0, 675.0, 1044.0, 1653.0, 2712.0, 4327.0, 7306.0, 13484.0, 26196.0, 52323.0, 105575.0, 189386.0, 242239.0, 187344.0, 103936.0, 51186.0, 25747.0, 13057.0, 7412.0, 4274.0, 2523.0, 1665.0, 1061.0, 741.0, 437.0, 320.0, 178.0, 133.0, 92.0, 58.0, 39.0, 24.0, 12.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.505859375, -2.433197021484375, -2.36053466796875, -2.287872314453125, -2.2152099609375, -2.142547607421875, -2.06988525390625, -1.997222900390625, -1.924560546875, -1.851898193359375, -1.77923583984375, -1.706573486328125, -1.6339111328125, -1.561248779296875, -1.48858642578125, -1.415924072265625, -1.34326171875, -1.270599365234375, -1.19793701171875, -1.125274658203125, -1.0526123046875, -0.979949951171875, -0.90728759765625, -0.834625244140625, -0.761962890625, -0.689300537109375, -0.61663818359375, -0.543975830078125, -0.4713134765625, -0.398651123046875, -0.32598876953125, -0.253326416015625, -0.1806640625, -0.108001708984375, -0.03533935546875, 0.037322998046875, 0.1099853515625, 0.182647705078125, 0.25531005859375, 0.327972412109375, 0.400634765625, 0.473297119140625, 0.54595947265625, 0.618621826171875, 0.6912841796875, 0.763946533203125, 0.83660888671875, 0.909271240234375, 0.98193359375, 1.054595947265625, 1.12725830078125, 1.199920654296875, 1.2725830078125, 1.345245361328125, 1.41790771484375, 1.490570068359375, 1.563232421875, 1.635894775390625, 1.70855712890625, 1.781219482421875, 1.8538818359375, 1.926544189453125, 1.99920654296875, 2.071868896484375, 2.14453125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 6.0, 1.0, 9.0, 8.0, 6.0, 20.0, 29.0, 21.0, 36.0, 42.0, 52.0, 73.0, 101.0, 99.0, 99.0, 87.0, 91.0, 55.0, 37.0, 37.0, 31.0, 14.0, 7.0, 12.0, 1.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024056434631347656, -0.00023252889513969421, -0.00022449344396591187, -0.00021645799279212952, -0.00020842254161834717, -0.00020038709044456482, -0.00019235163927078247, -0.00018431618809700012, -0.00017628073692321777, -0.00016824528574943542, -0.00016020983457565308, -0.00015217438340187073, -0.00014413893222808838, -0.00013610348105430603, -0.00012806802988052368, -0.00012003257870674133, -0.00011199712753295898, -0.00010396167635917664, -9.592622518539429e-05, -8.789077401161194e-05, -7.985532283782959e-05, -7.181987166404724e-05, -6.378442049026489e-05, -5.5748969316482544e-05, -4.7713518142700195e-05, -3.967806696891785e-05, -3.16426157951355e-05, -2.360716462135315e-05, -1.55717134475708e-05, -7.536262273788452e-06, 4.991888999938965e-07, 8.534640073776245e-06, 1.6570091247558594e-05, 2.4605542421340942e-05, 3.264099359512329e-05, 4.067644476890564e-05, 4.871189594268799e-05, 5.674734711647034e-05, 6.478279829025269e-05, 7.281824946403503e-05, 8.085370063781738e-05, 8.888915181159973e-05, 9.692460298538208e-05, 0.00010496005415916443, 0.00011299550533294678, 0.00012103095650672913, 0.00012906640768051147, 0.00013710185885429382, 0.00014513731002807617, 0.00015317276120185852, 0.00016120821237564087, 0.00016924366354942322, 0.00017727911472320557, 0.00018531456589698792, 0.00019335001707077026, 0.0002013854682445526, 0.00020942091941833496, 0.0002174563705921173, 0.00022549182176589966, 0.000233527272939682, 0.00024156272411346436, 0.0002495981752872467, 0.00025763362646102905, 0.0002656690776348114, 0.00027370452880859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 15.0, 23.0, 38.0, 42.0, 36.0, 73.0, 116.0, 144.0, 197.0, 279.0, 411.0, 547.0, 850.0, 1201.0, 1729.0, 2547.0, 3876.0, 6216.0, 9636.0, 15931.0, 26666.0, 45169.0, 74752.0, 117525.0, 160158.0, 175088.0, 146717.0, 100379.0, 62192.0, 36948.0, 21926.0, 13171.0, 8191.0, 5151.0, 3300.0, 2216.0, 1552.0, 1079.0, 664.0, 495.0, 372.0, 261.0, 209.0, 143.0, 101.0, 62.0, 40.0, 36.0, 21.0, 17.0, 16.0, 6.0, 4.0, 7.0, 3.0, 4.0], "bins": [-1.7197265625, -1.6681060791015625, -1.616485595703125, -1.5648651123046875, -1.51324462890625, -1.4616241455078125, -1.410003662109375, -1.3583831787109375, -1.3067626953125, -1.2551422119140625, -1.203521728515625, -1.1519012451171875, -1.10028076171875, -1.0486602783203125, -0.997039794921875, -0.9454193115234375, -0.893798828125, -0.8421783447265625, -0.790557861328125, -0.7389373779296875, -0.68731689453125, -0.6356964111328125, -0.584075927734375, -0.5324554443359375, -0.4808349609375, -0.4292144775390625, -0.377593994140625, -0.3259735107421875, -0.27435302734375, -0.2227325439453125, -0.171112060546875, -0.1194915771484375, -0.06787109375, -0.0162506103515625, 0.035369873046875, 0.0869903564453125, 0.13861083984375, 0.1902313232421875, 0.241851806640625, 0.2934722900390625, 0.3450927734375, 0.3967132568359375, 0.448333740234375, 0.4999542236328125, 0.55157470703125, 0.6031951904296875, 0.654815673828125, 0.7064361572265625, 0.758056640625, 0.8096771240234375, 0.861297607421875, 0.9129180908203125, 0.96453857421875, 1.0161590576171875, 1.067779541015625, 1.1194000244140625, 1.1710205078125, 1.2226409912109375, 1.274261474609375, 1.3258819580078125, 1.37750244140625, 1.4291229248046875, 1.480743408203125, 1.5323638916015625, 1.583984375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 10.0, 5.0, 13.0, 14.0, 13.0, 19.0, 23.0, 36.0, 33.0, 48.0, 44.0, 51.0, 50.0, 57.0, 68.0, 62.0, 71.0, 65.0, 44.0, 41.0, 36.0, 31.0, 35.0, 23.0, 17.0, 21.0, 12.0, 11.0, 10.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.548828125, -0.5321578979492188, -0.5154876708984375, -0.49881744384765625, -0.482147216796875, -0.46547698974609375, -0.4488067626953125, -0.43213653564453125, -0.41546630859375, -0.39879608154296875, -0.3821258544921875, -0.36545562744140625, -0.348785400390625, -0.33211517333984375, -0.3154449462890625, -0.29877471923828125, -0.2821044921875, -0.26543426513671875, -0.2487640380859375, -0.23209381103515625, -0.215423583984375, -0.19875335693359375, -0.1820831298828125, -0.16541290283203125, -0.14874267578125, -0.13207244873046875, -0.1154022216796875, -0.09873199462890625, -0.082061767578125, -0.06539154052734375, -0.0487213134765625, -0.03205108642578125, -0.015380859375, 0.00128936767578125, 0.0179595947265625, 0.03462982177734375, 0.051300048828125, 0.06797027587890625, 0.0846405029296875, 0.10131072998046875, 0.11798095703125, 0.13465118408203125, 0.1513214111328125, 0.16799163818359375, 0.184661865234375, 0.20133209228515625, 0.2180023193359375, 0.23467254638671875, 0.2513427734375, 0.26801300048828125, 0.2846832275390625, 0.30135345458984375, 0.318023681640625, 0.33469390869140625, 0.3513641357421875, 0.36803436279296875, 0.38470458984375, 0.40137481689453125, 0.4180450439453125, 0.43471527099609375, 0.451385498046875, 0.46805572509765625, 0.4847259521484375, 0.5013961791992188, 0.51806640625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 7.0, 14.0, 10.0, 21.0, 32.0, 44.0, 53.0, 62.0, 103.0, 99.0, 121.0, 104.0, 89.0, 65.0, 59.0, 30.0, 35.0, 18.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0], "bins": [-16.5013484954834, -16.165313720703125, -15.829277038574219, -15.493241310119629, -15.157205581665039, -14.82116985321045, -14.48513412475586, -14.149099349975586, -13.81306266784668, -13.47702693939209, -13.1409912109375, -12.80495548248291, -12.46891975402832, -12.13288402557373, -11.79684829711914, -11.460813522338867, -11.124777793884277, -10.788742065429688, -10.452706336975098, -10.116670608520508, -9.780634880065918, -9.444599151611328, -9.108564376831055, -8.772527694702148, -8.436492919921875, -8.100457191467285, -7.764421463012695, -7.4283857345581055, -7.092350006103516, -6.756314277648926, -6.420279026031494, -6.084243297576904, -5.74820613861084, -5.41217041015625, -5.07613468170166, -4.74009895324707, -4.4040632247924805, -4.068027496337891, -3.731992244720459, -3.395956516265869, -3.0599207878112793, -2.7238850593566895, -2.3878493309020996, -2.051813840866089, -1.715778112411499, -1.3797423839569092, -1.0437068939208984, -0.7076711654663086, -0.37163543701171875, -0.03559976816177368, 0.3004359006881714, 0.6364715099334717, 0.9725072383880615, 1.3085429668426514, 1.644578456878662, 1.980614185333252, 2.316649913787842, 2.6526856422424316, 2.9887213706970215, 3.3247568607330322, 3.660792589187622, 3.996828317642212, 4.332863807678223, 4.6688995361328125, 5.004935264587402]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 6.0, 4.0, 11.0, 6.0, 9.0, 17.0, 17.0, 29.0, 26.0, 21.0, 29.0, 39.0, 35.0, 27.0, 37.0, 50.0, 51.0, 46.0, 37.0, 45.0, 48.0, 34.0, 59.0, 37.0, 27.0, 30.0, 24.0, 28.0, 38.0, 23.0, 18.0, 16.0, 14.0, 9.0, 15.0, 6.0, 5.0, 8.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.512770891189575, -3.4048044681549072, -3.2968382835388184, -3.1888718605041504, -3.0809054374694824, -2.9729392528533936, -2.8649728298187256, -2.7570066452026367, -2.6490402221679688, -2.541073799133301, -2.433107614517212, -2.325141191482544, -2.217174768447876, -2.109208583831787, -2.001242160797119, -1.8932758569717407, -1.7853094339370728, -1.6773431301116943, -1.5693767070770264, -1.461410403251648, -1.3534440994262695, -1.2454776763916016, -1.1375113725662231, -1.0295450687408447, -0.9215787053108215, -0.8136123418807983, -0.7056460380554199, -0.5976796746253967, -0.4897133409976959, -0.3817470073699951, -0.2737806439399719, -0.1658143401145935, -0.05784797668457031, 0.05011836439371109, 0.1580847054719925, 0.2660510540008545, 0.3740173876285553, 0.4819837212562561, 0.5899500846862793, 0.6979163885116577, 0.8058827519416809, 0.9138491153717041, 1.0218154191970825, 1.129781723022461, 1.237748146057129, 1.3457144498825073, 1.4536807537078857, 1.5616471767425537, 1.6696134805679321, 1.7775797843933105, 1.8855462074279785, 1.993512511253357, 2.1014788150787354, 2.2094452381134033, 2.317411422729492, 2.42537784576416, 2.533344268798828, 2.641310691833496, 2.749276876449585, 2.857243299484253, 2.965209722518921, 3.0731759071350098, 3.1811423301696777, 3.2891087532043457, 3.3970749378204346]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 6.0, 11.0, 12.0, 13.0, 24.0, 37.0, 45.0, 57.0, 106.0, 146.0, 237.0, 360.0, 532.0, 854.0, 1361.0, 2371.0, 4033.0, 7270.0, 13569.0, 27120.0, 59095.0, 144953.0, 402818.0, 1122442.0, 1422214.0, 615033.0, 210433.0, 82244.0, 36885.0, 17809.0, 9403.0, 5183.0, 2924.0, 1723.0, 1074.0, 671.0, 392.0, 275.0, 164.0, 107.0, 80.0, 60.0, 40.0, 30.0, 17.0, 20.0, 14.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.12109375, -6.89990234375, -6.6787109375, -6.45751953125, -6.236328125, -6.01513671875, -5.7939453125, -5.57275390625, -5.3515625, -5.13037109375, -4.9091796875, -4.68798828125, -4.466796875, -4.24560546875, -4.0244140625, -3.80322265625, -3.58203125, -3.36083984375, -3.1396484375, -2.91845703125, -2.697265625, -2.47607421875, -2.2548828125, -2.03369140625, -1.8125, -1.59130859375, -1.3701171875, -1.14892578125, -0.927734375, -0.70654296875, -0.4853515625, -0.26416015625, -0.04296875, 0.17822265625, 0.3994140625, 0.62060546875, 0.841796875, 1.06298828125, 1.2841796875, 1.50537109375, 1.7265625, 1.94775390625, 2.1689453125, 2.39013671875, 2.611328125, 2.83251953125, 3.0537109375, 3.27490234375, 3.49609375, 3.71728515625, 3.9384765625, 4.15966796875, 4.380859375, 4.60205078125, 4.8232421875, 5.04443359375, 5.265625, 5.48681640625, 5.7080078125, 5.92919921875, 6.150390625, 6.37158203125, 6.5927734375, 6.81396484375, 7.03515625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 14.0, 15.0, 9.0, 17.0, 28.0, 34.0, 40.0, 43.0, 40.0, 40.0, 44.0, 47.0, 54.0, 48.0, 46.0, 48.0, 49.0, 44.0, 40.0, 40.0, 38.0, 44.0, 33.0, 25.0, 25.0, 15.0, 12.0, 10.0, 7.0, 9.0, 5.0, 8.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.538330078125, -2.44775390625, -2.357177734375, -2.2666015625, -2.176025390625, -2.08544921875, -1.994873046875, -1.904296875, -1.813720703125, -1.72314453125, -1.632568359375, -1.5419921875, -1.451416015625, -1.36083984375, -1.270263671875, -1.1796875, -1.089111328125, -0.99853515625, -0.907958984375, -0.8173828125, -0.726806640625, -0.63623046875, -0.545654296875, -0.455078125, -0.364501953125, -0.27392578125, -0.183349609375, -0.0927734375, -0.002197265625, 0.08837890625, 0.178955078125, 0.26953125, 0.360107421875, 0.45068359375, 0.541259765625, 0.6318359375, 0.722412109375, 0.81298828125, 0.903564453125, 0.994140625, 1.084716796875, 1.17529296875, 1.265869140625, 1.3564453125, 1.447021484375, 1.53759765625, 1.628173828125, 1.71875, 1.809326171875, 1.89990234375, 1.990478515625, 2.0810546875, 2.171630859375, 2.26220703125, 2.352783203125, 2.443359375, 2.533935546875, 2.62451171875, 2.715087890625, 2.8056640625, 2.896240234375, 2.98681640625, 3.077392578125, 3.16796875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 8.0, 10.0, 21.0, 17.0, 31.0, 36.0, 36.0, 70.0, 99.0, 142.0, 192.0, 271.0, 380.0, 598.0, 901.0, 1374.0, 2027.0, 3173.0, 4972.0, 7792.0, 12632.0, 21437.0, 37443.0, 68044.0, 127793.0, 254104.0, 514208.0, 944363.0, 1008026.0, 575753.0, 285919.0, 143820.0, 75438.0, 41324.0, 24209.0, 14016.0, 8482.0, 5315.0, 3394.0, 2091.0, 1442.0, 958.0, 576.0, 425.0, 290.0, 213.0, 133.0, 82.0, 55.0, 46.0, 32.0, 26.0, 19.0, 6.0, 8.0, 10.0, 3.0, 7.0, 3.0, 3.0, 1.0], "bins": [-5.3046875, -5.134033203125, -4.96337890625, -4.792724609375, -4.6220703125, -4.451416015625, -4.28076171875, -4.110107421875, -3.939453125, -3.768798828125, -3.59814453125, -3.427490234375, -3.2568359375, -3.086181640625, -2.91552734375, -2.744873046875, -2.57421875, -2.403564453125, -2.23291015625, -2.062255859375, -1.8916015625, -1.720947265625, -1.55029296875, -1.379638671875, -1.208984375, -1.038330078125, -0.86767578125, -0.697021484375, -0.5263671875, -0.355712890625, -0.18505859375, -0.014404296875, 0.15625, 0.326904296875, 0.49755859375, 0.668212890625, 0.8388671875, 1.009521484375, 1.18017578125, 1.350830078125, 1.521484375, 1.692138671875, 1.86279296875, 2.033447265625, 2.2041015625, 2.374755859375, 2.54541015625, 2.716064453125, 2.88671875, 3.057373046875, 3.22802734375, 3.398681640625, 3.5693359375, 3.739990234375, 3.91064453125, 4.081298828125, 4.251953125, 4.422607421875, 4.59326171875, 4.763916015625, 4.9345703125, 5.105224609375, 5.27587890625, 5.446533203125, 5.6171875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 3.0, 7.0, 11.0, 14.0, 15.0, 17.0, 21.0, 39.0, 34.0, 46.0, 79.0, 90.0, 128.0, 123.0, 175.0, 239.0, 279.0, 265.0, 294.0, 317.0, 331.0, 276.0, 252.0, 217.0, 178.0, 130.0, 116.0, 84.0, 52.0, 53.0, 33.0, 28.0, 24.0, 26.0, 13.0, 12.0, 10.0, 11.0, 8.0, 5.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.633148193359375, -1.57781982421875, -1.522491455078125, -1.4671630859375, -1.411834716796875, -1.35650634765625, -1.301177978515625, -1.245849609375, -1.190521240234375, -1.13519287109375, -1.079864501953125, -1.0245361328125, -0.969207763671875, -0.91387939453125, -0.858551025390625, -0.80322265625, -0.747894287109375, -0.69256591796875, -0.637237548828125, -0.5819091796875, -0.526580810546875, -0.47125244140625, -0.415924072265625, -0.360595703125, -0.305267333984375, -0.24993896484375, -0.194610595703125, -0.1392822265625, -0.083953857421875, -0.02862548828125, 0.026702880859375, 0.08203125, 0.137359619140625, 0.19268798828125, 0.248016357421875, 0.3033447265625, 0.358673095703125, 0.41400146484375, 0.469329833984375, 0.524658203125, 0.579986572265625, 0.63531494140625, 0.690643310546875, 0.7459716796875, 0.801300048828125, 0.85662841796875, 0.911956787109375, 0.96728515625, 1.022613525390625, 1.07794189453125, 1.133270263671875, 1.1885986328125, 1.243927001953125, 1.29925537109375, 1.354583740234375, 1.409912109375, 1.465240478515625, 1.52056884765625, 1.575897216796875, 1.6312255859375, 1.686553955078125, 1.74188232421875, 1.797210693359375, 1.8525390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 8.0, 9.0, 16.0, 22.0, 24.0, 23.0, 36.0, 61.0, 66.0, 86.0, 84.0, 83.0, 96.0, 94.0, 62.0, 60.0, 40.0, 37.0, 26.0, 15.0, 11.0, 16.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-13.311237335205078, -13.022732734680176, -12.73422908782959, -12.445724487304688, -12.157219886779785, -11.8687162399292, -11.580211639404297, -11.291707992553711, -11.003203392028809, -10.714698791503906, -10.42619514465332, -10.137690544128418, -9.849185943603516, -9.56068229675293, -9.272177696228027, -8.983673095703125, -8.695169448852539, -8.406664848327637, -8.11816120147705, -7.829656600952148, -7.541152477264404, -7.25264835357666, -6.964143753051758, -6.675639629364014, -6.387134552001953, -6.098630428314209, -5.810125827789307, -5.5216217041015625, -5.233117580413818, -4.944613456726074, -4.656108856201172, -4.367604732513428, -4.079100608825684, -3.7905962467193604, -3.502092123031616, -3.213587760925293, -2.925083637237549, -2.6365792751312256, -2.3480749130249023, -2.059570789337158, -1.771066427230835, -1.4825621843338013, -1.1940579414367676, -0.9055535793304443, -0.6170493364334106, -0.32854509353637695, -0.04004073143005371, 0.24846339225769043, 0.5369677543640137, 0.8254719972610474, 1.113976240158081, 1.4024806022644043, 1.690984845161438, 1.9794890880584717, 2.267993450164795, 2.556497573852539, 2.8450019359588623, 3.1335062980651855, 3.4220104217529297, 3.710514783859253, 3.999019145965576, 4.28752326965332, 4.576027870178223, 4.864531517028809, 5.153036117553711]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 13.0, 12.0, 13.0, 20.0, 21.0, 27.0, 27.0, 25.0, 27.0, 31.0, 30.0, 31.0, 43.0, 53.0, 42.0, 40.0, 53.0, 42.0, 44.0, 39.0, 31.0, 40.0, 37.0, 42.0, 39.0, 32.0, 17.0, 18.0, 21.0, 14.0, 15.0, 11.0, 8.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.712069272994995, -3.6039493083953857, -3.4958291053771973, -3.387709140777588, -3.2795891761779785, -3.17146897315979, -3.0633490085601807, -2.955228805541992, -2.847108840942383, -2.7389888763427734, -2.630868673324585, -2.5227487087249756, -2.414628505706787, -2.3065085411071777, -2.1983885765075684, -2.090268611907959, -1.9821484088897705, -1.8740283250808716, -1.7659082412719727, -1.6577882766723633, -1.5496681928634644, -1.4415481090545654, -1.333428144454956, -1.2253080606460571, -1.1171879768371582, -1.0090678930282593, -0.9009478688240051, -0.792827844619751, -0.684707760810852, -0.5765876770019531, -0.468467652797699, -0.3603476285934448, -0.2522275447845459, -0.14410749077796936, -0.03598743677139282, 0.07213261723518372, 0.18025267124176025, 0.2883727550506592, 0.39649277925491333, 0.5046128034591675, 0.6127328872680664, 0.7208529710769653, 0.8289729952812195, 0.9370930194854736, 1.0452131032943726, 1.1533331871032715, 1.2614531517028809, 1.3695732355117798, 1.4776933193206787, 1.5858134031295776, 1.6939334869384766, 1.802053451538086, 1.9101735353469849, 2.018293619155884, 2.126413583755493, 2.2345337867736816, 2.342653751373291, 2.4507737159729004, 2.558893918991089, 2.6670138835906982, 2.7751340866088867, 2.883254051208496, 2.9913740158081055, 3.099493980407715, 3.2076141834259033]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 13.0, 24.0, 27.0, 64.0, 94.0, 140.0, 241.0, 353.0, 555.0, 888.0, 1451.0, 2428.0, 4078.0, 6713.0, 11546.0, 20003.0, 33070.0, 55845.0, 88426.0, 128453.0, 161271.0, 163959.0, 132331.0, 92205.0, 58109.0, 35324.0, 20744.0, 12261.0, 7190.0, 4268.0, 2595.0, 1507.0, 880.0, 556.0, 342.0, 201.0, 126.0, 98.0, 52.0, 37.0, 25.0, 17.0, 9.0, 12.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.9849395751953125, -1.923004150390625, -1.8610687255859375, -1.79913330078125, -1.7371978759765625, -1.675262451171875, -1.6133270263671875, -1.5513916015625, -1.4894561767578125, -1.427520751953125, -1.3655853271484375, -1.30364990234375, -1.2417144775390625, -1.179779052734375, -1.1178436279296875, -1.055908203125, -0.9939727783203125, -0.932037353515625, -0.8701019287109375, -0.80816650390625, -0.7462310791015625, -0.684295654296875, -0.6223602294921875, -0.5604248046875, -0.4984893798828125, -0.436553955078125, -0.3746185302734375, -0.31268310546875, -0.2507476806640625, -0.188812255859375, -0.1268768310546875, -0.06494140625, -0.0030059814453125, 0.058929443359375, 0.1208648681640625, 0.18280029296875, 0.2447357177734375, 0.306671142578125, 0.3686065673828125, 0.4305419921875, 0.4924774169921875, 0.554412841796875, 0.6163482666015625, 0.67828369140625, 0.7402191162109375, 0.802154541015625, 0.8640899658203125, 0.926025390625, 0.9879608154296875, 1.049896240234375, 1.1118316650390625, 1.17376708984375, 1.2357025146484375, 1.297637939453125, 1.3595733642578125, 1.4215087890625, 1.4834442138671875, 1.545379638671875, 1.6073150634765625, 1.66925048828125, 1.7311859130859375, 1.793121337890625, 1.8550567626953125, 1.9169921875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 9.0, 19.0, 14.0, 11.0, 19.0, 27.0, 26.0, 25.0, 32.0, 36.0, 38.0, 30.0, 47.0, 38.0, 38.0, 57.0, 42.0, 39.0, 51.0, 35.0, 29.0, 42.0, 34.0, 44.0, 25.0, 27.0, 23.0, 24.0, 17.0, 27.0, 17.0, 12.0, 7.0, 6.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.46234130859375, -3.3446044921875, -3.22686767578125, -3.109130859375, -2.99139404296875, -2.8736572265625, -2.75592041015625, -2.63818359375, -2.52044677734375, -2.4027099609375, -2.28497314453125, -2.167236328125, -2.04949951171875, -1.9317626953125, -1.81402587890625, -1.6962890625, -1.57855224609375, -1.4608154296875, -1.34307861328125, -1.225341796875, -1.10760498046875, -0.9898681640625, -0.87213134765625, -0.75439453125, -0.63665771484375, -0.5189208984375, -0.40118408203125, -0.283447265625, -0.16571044921875, -0.0479736328125, 0.06976318359375, 0.1875, 0.30523681640625, 0.4229736328125, 0.54071044921875, 0.658447265625, 0.77618408203125, 0.8939208984375, 1.01165771484375, 1.12939453125, 1.24713134765625, 1.3648681640625, 1.48260498046875, 1.600341796875, 1.71807861328125, 1.8358154296875, 1.95355224609375, 2.0712890625, 2.18902587890625, 2.3067626953125, 2.42449951171875, 2.542236328125, 2.65997314453125, 2.7777099609375, 2.89544677734375, 3.01318359375, 3.13092041015625, 3.2486572265625, 3.36639404296875, 3.484130859375, 3.60186767578125, 3.7196044921875, 3.83734130859375, 3.955078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 11.0, 20.0, 32.0, 35.0, 87.0, 96.0, 182.0, 309.0, 512.0, 842.0, 1567.0, 2506.0, 4311.0, 7670.0, 13648.0, 24449.0, 44108.0, 78955.0, 133882.0, 197727.0, 202849.0, 141843.0, 84922.0, 47713.0, 26111.0, 14774.0, 8193.0, 4600.0, 2641.0, 1642.0, 937.0, 553.0, 342.0, 170.0, 116.0, 68.0, 50.0, 32.0, 21.0, 9.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.876953125, -2.789947509765625, -2.70294189453125, -2.615936279296875, -2.5289306640625, -2.441925048828125, -2.35491943359375, -2.267913818359375, -2.180908203125, -2.093902587890625, -2.00689697265625, -1.919891357421875, -1.8328857421875, -1.745880126953125, -1.65887451171875, -1.571868896484375, -1.48486328125, -1.397857666015625, -1.31085205078125, -1.223846435546875, -1.1368408203125, -1.049835205078125, -0.96282958984375, -0.875823974609375, -0.788818359375, -0.701812744140625, -0.61480712890625, -0.527801513671875, -0.4407958984375, -0.353790283203125, -0.26678466796875, -0.179779052734375, -0.0927734375, -0.005767822265625, 0.08123779296875, 0.168243408203125, 0.2552490234375, 0.342254638671875, 0.42926025390625, 0.516265869140625, 0.603271484375, 0.690277099609375, 0.77728271484375, 0.864288330078125, 0.9512939453125, 1.038299560546875, 1.12530517578125, 1.212310791015625, 1.29931640625, 1.386322021484375, 1.47332763671875, 1.560333251953125, 1.6473388671875, 1.734344482421875, 1.82135009765625, 1.908355712890625, 1.995361328125, 2.082366943359375, 2.16937255859375, 2.256378173828125, 2.3433837890625, 2.430389404296875, 2.51739501953125, 2.604400634765625, 2.69140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 8.0, 6.0, 14.0, 8.0, 14.0, 24.0, 30.0, 22.0, 17.0, 32.0, 24.0, 32.0, 28.0, 36.0, 30.0, 28.0, 35.0, 38.0, 34.0, 44.0, 49.0, 33.0, 33.0, 26.0, 38.0, 37.0, 28.0, 25.0, 25.0, 24.0, 21.0, 18.0, 18.0, 16.0, 13.0, 15.0, 11.0, 13.0, 7.0, 8.0, 4.0, 7.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.009765625, -1.949462890625, -1.88916015625, -1.828857421875, -1.7685546875, -1.708251953125, -1.64794921875, -1.587646484375, -1.52734375, -1.467041015625, -1.40673828125, -1.346435546875, -1.2861328125, -1.225830078125, -1.16552734375, -1.105224609375, -1.044921875, -0.984619140625, -0.92431640625, -0.864013671875, -0.8037109375, -0.743408203125, -0.68310546875, -0.622802734375, -0.5625, -0.502197265625, -0.44189453125, -0.381591796875, -0.3212890625, -0.260986328125, -0.20068359375, -0.140380859375, -0.080078125, -0.019775390625, 0.04052734375, 0.100830078125, 0.1611328125, 0.221435546875, 0.28173828125, 0.342041015625, 0.40234375, 0.462646484375, 0.52294921875, 0.583251953125, 0.6435546875, 0.703857421875, 0.76416015625, 0.824462890625, 0.884765625, 0.945068359375, 1.00537109375, 1.065673828125, 1.1259765625, 1.186279296875, 1.24658203125, 1.306884765625, 1.3671875, 1.427490234375, 1.48779296875, 1.548095703125, 1.6083984375, 1.668701171875, 1.72900390625, 1.789306640625, 1.849609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 8.0, 11.0, 7.0, 22.0, 30.0, 52.0, 59.0, 60.0, 131.0, 168.0, 235.0, 378.0, 543.0, 727.0, 1133.0, 1729.0, 2656.0, 4113.0, 6410.0, 10462.0, 17062.0, 28824.0, 48409.0, 81886.0, 134337.0, 193476.0, 190073.0, 129230.0, 78244.0, 46217.0, 27506.0, 16461.0, 10002.0, 6312.0, 4039.0, 2452.0, 1645.0, 1110.0, 753.0, 494.0, 354.0, 232.0, 173.0, 100.0, 86.0, 44.0, 28.0, 30.0, 16.0, 10.0, 13.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.1396484375, -1.105072021484375, -1.07049560546875, -1.035919189453125, -1.0013427734375, -0.966766357421875, -0.93218994140625, -0.897613525390625, -0.863037109375, -0.828460693359375, -0.79388427734375, -0.759307861328125, -0.7247314453125, -0.690155029296875, -0.65557861328125, -0.621002197265625, -0.58642578125, -0.551849365234375, -0.51727294921875, -0.482696533203125, -0.4481201171875, -0.413543701171875, -0.37896728515625, -0.344390869140625, -0.309814453125, -0.275238037109375, -0.24066162109375, -0.206085205078125, -0.1715087890625, -0.136932373046875, -0.10235595703125, -0.067779541015625, -0.033203125, 0.001373291015625, 0.03594970703125, 0.070526123046875, 0.1051025390625, 0.139678955078125, 0.17425537109375, 0.208831787109375, 0.243408203125, 0.277984619140625, 0.31256103515625, 0.347137451171875, 0.3817138671875, 0.416290283203125, 0.45086669921875, 0.485443115234375, 0.52001953125, 0.554595947265625, 0.58917236328125, 0.623748779296875, 0.6583251953125, 0.692901611328125, 0.72747802734375, 0.762054443359375, 0.796630859375, 0.831207275390625, 0.86578369140625, 0.900360107421875, 0.9349365234375, 0.969512939453125, 1.00408935546875, 1.038665771484375, 1.0732421875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 16.0, 10.0, 13.0, 21.0, 21.0, 33.0, 36.0, 47.0, 52.0, 49.0, 79.0, 69.0, 64.0, 69.0, 78.0, 55.0, 50.0, 51.0, 31.0, 26.0, 19.0, 28.0, 16.0, 9.0, 10.0, 5.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.151199340820312e-05, -5.941465497016907e-05, -5.731731653213501e-05, -5.521997809410095e-05, -5.3122639656066895e-05, -5.102530121803284e-05, -4.892796277999878e-05, -4.683062434196472e-05, -4.4733285903930664e-05, -4.2635947465896606e-05, -4.053860902786255e-05, -3.844127058982849e-05, -3.6343932151794434e-05, -3.4246593713760376e-05, -3.214925527572632e-05, -3.005191683769226e-05, -2.7954578399658203e-05, -2.5857239961624146e-05, -2.3759901523590088e-05, -2.166256308555603e-05, -1.9565224647521973e-05, -1.7467886209487915e-05, -1.5370547771453857e-05, -1.32732093334198e-05, -1.1175870895385742e-05, -9.078532457351685e-06, -6.981194019317627e-06, -4.883855581283569e-06, -2.7865171432495117e-06, -6.891787052154541e-07, 1.4081597328186035e-06, 3.505498170852661e-06, 5.602836608886719e-06, 7.700175046920776e-06, 9.797513484954834e-06, 1.1894851922988892e-05, 1.399219036102295e-05, 1.6089528799057007e-05, 1.8186867237091064e-05, 2.0284205675125122e-05, 2.238154411315918e-05, 2.4478882551193237e-05, 2.6576220989227295e-05, 2.8673559427261353e-05, 3.077089786529541e-05, 3.286823630332947e-05, 3.4965574741363525e-05, 3.706291317939758e-05, 3.916025161743164e-05, 4.12575900554657e-05, 4.3354928493499756e-05, 4.5452266931533813e-05, 4.754960536956787e-05, 4.964694380760193e-05, 5.1744282245635986e-05, 5.3841620683670044e-05, 5.59389591217041e-05, 5.803629755973816e-05, 6.013363599777222e-05, 6.223097443580627e-05, 6.432831287384033e-05, 6.642565131187439e-05, 6.852298974990845e-05, 7.06203281879425e-05, 7.271766662597656e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 13.0, 14.0, 16.0, 30.0, 57.0, 71.0, 122.0, 182.0, 272.0, 475.0, 738.0, 1186.0, 1820.0, 3155.0, 5187.0, 8624.0, 14440.0, 24772.0, 42069.0, 70378.0, 111882.0, 156567.0, 176724.0, 153709.0, 108787.0, 67693.0, 40660.0, 23716.0, 14127.0, 8346.0, 4898.0, 2965.0, 1822.0, 1088.0, 682.0, 476.0, 270.0, 178.0, 127.0, 80.0, 34.0, 35.0, 14.0, 16.0, 16.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.0439453125, -1.0127487182617188, -0.9815521240234375, -0.9503555297851562, -0.919158935546875, -0.8879623413085938, -0.8567657470703125, -0.8255691528320312, -0.79437255859375, -0.7631759643554688, -0.7319793701171875, -0.7007827758789062, -0.669586181640625, -0.6383895874023438, -0.6071929931640625, -0.5759963989257812, -0.5447998046875, -0.5136032104492188, -0.4824066162109375, -0.45121002197265625, -0.420013427734375, -0.38881683349609375, -0.3576202392578125, -0.32642364501953125, -0.29522705078125, -0.26403045654296875, -0.2328338623046875, -0.20163726806640625, -0.170440673828125, -0.13924407958984375, -0.1080474853515625, -0.07685089111328125, -0.045654296875, -0.01445770263671875, 0.0167388916015625, 0.04793548583984375, 0.079132080078125, 0.11032867431640625, 0.1415252685546875, 0.17272186279296875, 0.20391845703125, 0.23511505126953125, 0.2663116455078125, 0.29750823974609375, 0.328704833984375, 0.35990142822265625, 0.3910980224609375, 0.42229461669921875, 0.4534912109375, 0.48468780517578125, 0.5158843994140625, 0.5470809936523438, 0.578277587890625, 0.6094741821289062, 0.6406707763671875, 0.6718673706054688, 0.70306396484375, 0.7342605590820312, 0.7654571533203125, 0.7966537475585938, 0.827850341796875, 0.8590469360351562, 0.8902435302734375, 0.9214401245117188, 0.95263671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 5.0, 9.0, 10.0, 19.0, 15.0, 14.0, 26.0, 22.0, 26.0, 24.0, 34.0, 44.0, 33.0, 52.0, 39.0, 33.0, 45.0, 47.0, 45.0, 55.0, 45.0, 33.0, 38.0, 52.0, 28.0, 23.0, 25.0, 22.0, 21.0, 16.0, 13.0, 8.0, 8.0, 11.0, 11.0, 7.0, 2.0, 4.0, 0.0, 4.0, 5.0, 1.0, 4.0, 4.0], "bins": [-0.301025390625, -0.2930259704589844, -0.28502655029296875, -0.2770271301269531, -0.2690277099609375, -0.2610282897949219, -0.25302886962890625, -0.24502944946289062, -0.237030029296875, -0.22903060913085938, -0.22103118896484375, -0.21303176879882812, -0.2050323486328125, -0.19703292846679688, -0.18903350830078125, -0.18103408813476562, -0.17303466796875, -0.16503524780273438, -0.15703582763671875, -0.14903640747070312, -0.1410369873046875, -0.13303756713867188, -0.12503814697265625, -0.11703872680664062, -0.109039306640625, -0.10103988647460938, -0.09304046630859375, -0.08504104614257812, -0.0770416259765625, -0.06904220581054688, -0.06104278564453125, -0.053043365478515625, -0.0450439453125, -0.037044525146484375, -0.02904510498046875, -0.021045684814453125, -0.0130462646484375, -0.005046844482421875, 0.00295257568359375, 0.010951995849609375, 0.018951416015625, 0.026950836181640625, 0.03495025634765625, 0.042949676513671875, 0.0509490966796875, 0.058948516845703125, 0.06694793701171875, 0.07494735717773438, 0.08294677734375, 0.09094619750976562, 0.09894561767578125, 0.10694503784179688, 0.1149444580078125, 0.12294387817382812, 0.13094329833984375, 0.13894271850585938, 0.146942138671875, 0.15494155883789062, 0.16294097900390625, 0.17094039916992188, 0.1789398193359375, 0.18693923950195312, 0.19493865966796875, 0.20293807983398438, 0.2109375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 10.0, 11.0, 16.0, 25.0, 23.0, 30.0, 52.0, 67.0, 68.0, 88.0, 94.0, 93.0, 97.0, 76.0, 64.0, 38.0, 48.0, 28.0, 18.0, 13.0, 12.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.480181694030762, -13.184569358825684, -12.888957023620605, -12.593343734741211, -12.297731399536133, -12.002119064331055, -11.706506729125977, -11.410894393920898, -11.11528205871582, -10.819669723510742, -10.524057388305664, -10.22844409942627, -9.932831764221191, -9.637219429016113, -9.341607093811035, -9.045994758605957, -8.750381469726562, -8.454769134521484, -8.159156799316406, -7.86354398727417, -7.567931175231934, -7.2723188400268555, -6.976706504821777, -6.681094169616699, -6.385481357574463, -6.089869022369385, -5.794256210327148, -5.49864387512207, -5.203031539916992, -4.907418727874756, -4.611806392669678, -4.316193580627441, -4.020580291748047, -3.7249677181243896, -3.4293551445007324, -3.1337428092956543, -2.838130235671997, -2.54251766204834, -2.2469053268432617, -1.9512927532196045, -1.6556801795959473, -1.36006760597229, -1.0644551515579224, -0.7688426375389099, -0.47323012351989746, -0.17761754989624023, 0.11799490451812744, 0.4136073589324951, 0.7092199325561523, 1.0048325061798096, 1.3004449605941772, 1.596057415008545, 1.8916699886322021, 2.1872825622558594, 2.4828948974609375, 2.7785074710845947, 3.074120044708252, 3.369732618331909, 3.6653451919555664, 3.9609575271606445, 4.256569862365723, 4.552182674407959, 4.847795009613037, 5.143407821655273, 5.439020156860352]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 3.0, 10.0, 11.0, 14.0, 11.0, 18.0, 15.0, 21.0, 30.0, 30.0, 20.0, 38.0, 27.0, 37.0, 40.0, 38.0, 48.0, 40.0, 55.0, 37.0, 45.0, 43.0, 33.0, 39.0, 34.0, 42.0, 36.0, 38.0, 23.0, 16.0, 20.0, 14.0, 22.0, 11.0, 13.0, 8.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.694929361343384, -3.5890119075775146, -3.4830944538116455, -3.3771772384643555, -3.2712597846984863, -3.165342330932617, -3.059424877166748, -2.953507423400879, -2.8475899696350098, -2.7416725158691406, -2.6357550621032715, -2.5298376083374023, -2.4239203929901123, -2.318002939224243, -2.212085485458374, -2.106168031692505, -2.000250816345215, -1.8943333625793457, -1.7884160280227661, -1.682498574256897, -1.5765811204910278, -1.4706637859344482, -1.364746332168579, -1.25882887840271, -1.1529114246368408, -1.0469939708709717, -0.9410765767097473, -0.835159182548523, -0.7292417287826538, -0.6233243346214294, -0.5174069404602051, -0.41148948669433594, -0.3055720329284668, -0.19965460896492004, -0.09373719990253448, 0.012180209159851074, 0.11809763312339783, 0.22401505708694458, 0.32993245124816895, 0.4358499050140381, 0.5417672991752625, 0.6476846933364868, 0.753602147102356, 0.8595195412635803, 0.9654369354248047, 1.0713543891906738, 1.177271842956543, 1.283189296722412, 1.3891066312789917, 1.4950240850448608, 1.6009414196014404, 1.7068588733673096, 1.8127763271331787, 1.9186937808990479, 2.024610996246338, 2.130528450012207, 2.236445903778076, 2.3423633575439453, 2.4482808113098145, 2.5541982650756836, 2.6601154804229736, 2.7660329341888428, 2.871950387954712, 2.977867841720581, 3.08378529548645]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 13.0, 26.0, 35.0, 43.0, 79.0, 156.0, 189.0, 336.0, 529.0, 854.0, 1511.0, 2539.0, 4221.0, 7151.0, 12325.0, 20584.0, 34839.0, 56570.0, 87769.0, 124462.0, 151877.0, 155933.0, 131961.0, 96067.0, 62815.0, 38732.0, 23442.0, 13597.0, 8117.0, 4768.0, 2877.0, 1606.0, 989.0, 587.0, 351.0, 205.0, 143.0, 92.0, 57.0, 40.0, 22.0, 12.0, 9.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.3828125, -3.286468505859375, -3.19012451171875, -3.093780517578125, -2.9974365234375, -2.901092529296875, -2.80474853515625, -2.708404541015625, -2.612060546875, -2.515716552734375, -2.41937255859375, -2.323028564453125, -2.2266845703125, -2.130340576171875, -2.03399658203125, -1.937652587890625, -1.84130859375, -1.744964599609375, -1.64862060546875, -1.552276611328125, -1.4559326171875, -1.359588623046875, -1.26324462890625, -1.166900634765625, -1.070556640625, -0.974212646484375, -0.87786865234375, -0.781524658203125, -0.6851806640625, -0.588836669921875, -0.49249267578125, -0.396148681640625, -0.2998046875, -0.203460693359375, -0.10711669921875, -0.010772705078125, 0.0855712890625, 0.181915283203125, 0.27825927734375, 0.374603271484375, 0.470947265625, 0.567291259765625, 0.66363525390625, 0.759979248046875, 0.8563232421875, 0.952667236328125, 1.04901123046875, 1.145355224609375, 1.24169921875, 1.338043212890625, 1.43438720703125, 1.530731201171875, 1.6270751953125, 1.723419189453125, 1.81976318359375, 1.916107177734375, 2.012451171875, 2.108795166015625, 2.20513916015625, 2.301483154296875, 2.3978271484375, 2.494171142578125, 2.59051513671875, 2.686859130859375, 2.783203125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 8.0, 9.0, 10.0, 7.0, 12.0, 14.0, 22.0, 19.0, 28.0, 15.0, 40.0, 32.0, 35.0, 30.0, 42.0, 41.0, 51.0, 46.0, 43.0, 53.0, 49.0, 46.0, 31.0, 40.0, 35.0, 38.0, 43.0, 25.0, 24.0, 21.0, 18.0, 16.0, 14.0, 17.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.37890625, -4.260101318359375, -4.14129638671875, -4.022491455078125, -3.9036865234375, -3.784881591796875, -3.66607666015625, -3.547271728515625, -3.428466796875, -3.309661865234375, -3.19085693359375, -3.072052001953125, -2.9532470703125, -2.834442138671875, -2.71563720703125, -2.596832275390625, -2.47802734375, -2.359222412109375, -2.24041748046875, -2.121612548828125, -2.0028076171875, -1.884002685546875, -1.76519775390625, -1.646392822265625, -1.527587890625, -1.408782958984375, -1.28997802734375, -1.171173095703125, -1.0523681640625, -0.933563232421875, -0.81475830078125, -0.695953369140625, -0.5771484375, -0.458343505859375, -0.33953857421875, -0.220733642578125, -0.1019287109375, 0.016876220703125, 0.13568115234375, 0.254486083984375, 0.373291015625, 0.492095947265625, 0.61090087890625, 0.729705810546875, 0.8485107421875, 0.967315673828125, 1.08612060546875, 1.204925537109375, 1.32373046875, 1.442535400390625, 1.56134033203125, 1.680145263671875, 1.7989501953125, 1.917755126953125, 2.03656005859375, 2.155364990234375, 2.274169921875, 2.392974853515625, 2.51177978515625, 2.630584716796875, 2.7493896484375, 2.868194580078125, 2.98699951171875, 3.105804443359375, 3.224609375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 12.0, 16.0, 28.0, 46.0, 79.0, 124.0, 183.0, 248.0, 388.0, 600.0, 839.0, 1302.0, 1947.0, 3113.0, 4703.0, 7106.0, 10879.0, 16573.0, 25233.0, 37377.0, 54470.0, 75801.0, 99057.0, 116973.0, 124759.0, 118748.0, 100438.0, 77252.0, 55899.0, 38738.0, 25799.0, 17174.0, 11225.0, 7477.0, 4774.0, 3078.0, 2037.0, 1368.0, 944.0, 591.0, 394.0, 294.0, 153.0, 121.0, 66.0, 41.0, 33.0, 20.0, 14.0, 7.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.462890625, -2.384796142578125, -2.30670166015625, -2.228607177734375, -2.1505126953125, -2.072418212890625, -1.99432373046875, -1.916229248046875, -1.838134765625, -1.760040283203125, -1.68194580078125, -1.603851318359375, -1.5257568359375, -1.447662353515625, -1.36956787109375, -1.291473388671875, -1.21337890625, -1.135284423828125, -1.05718994140625, -0.979095458984375, -0.9010009765625, -0.822906494140625, -0.74481201171875, -0.666717529296875, -0.588623046875, -0.510528564453125, -0.43243408203125, -0.354339599609375, -0.2762451171875, -0.198150634765625, -0.12005615234375, -0.041961669921875, 0.0361328125, 0.114227294921875, 0.19232177734375, 0.270416259765625, 0.3485107421875, 0.426605224609375, 0.50469970703125, 0.582794189453125, 0.660888671875, 0.738983154296875, 0.81707763671875, 0.895172119140625, 0.9732666015625, 1.051361083984375, 1.12945556640625, 1.207550048828125, 1.28564453125, 1.363739013671875, 1.44183349609375, 1.519927978515625, 1.5980224609375, 1.676116943359375, 1.75421142578125, 1.832305908203125, 1.910400390625, 1.988494873046875, 2.06658935546875, 2.144683837890625, 2.2227783203125, 2.300872802734375, 2.37896728515625, 2.457061767578125, 2.53515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 10.0, 8.0, 12.0, 22.0, 18.0, 9.0, 22.0, 32.0, 28.0, 14.0, 23.0, 26.0, 52.0, 39.0, 38.0, 41.0, 37.0, 47.0, 42.0, 42.0, 44.0, 41.0, 26.0, 26.0, 31.0, 33.0, 30.0, 27.0, 27.0, 20.0, 20.0, 14.0, 15.0, 15.0, 11.0, 12.0, 10.0, 6.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.9975433349609375, -1.934539794921875, -1.8715362548828125, -1.80853271484375, -1.7455291748046875, -1.682525634765625, -1.6195220947265625, -1.5565185546875, -1.4935150146484375, -1.430511474609375, -1.3675079345703125, -1.30450439453125, -1.2415008544921875, -1.178497314453125, -1.1154937744140625, -1.052490234375, -0.9894866943359375, -0.926483154296875, -0.8634796142578125, -0.80047607421875, -0.7374725341796875, -0.674468994140625, -0.6114654541015625, -0.5484619140625, -0.4854583740234375, -0.422454833984375, -0.3594512939453125, -0.29644775390625, -0.2334442138671875, -0.170440673828125, -0.1074371337890625, -0.04443359375, 0.0185699462890625, 0.081573486328125, 0.1445770263671875, 0.20758056640625, 0.2705841064453125, 0.333587646484375, 0.3965911865234375, 0.4595947265625, 0.5225982666015625, 0.585601806640625, 0.6486053466796875, 0.71160888671875, 0.7746124267578125, 0.837615966796875, 0.9006195068359375, 0.963623046875, 1.0266265869140625, 1.089630126953125, 1.1526336669921875, 1.21563720703125, 1.2786407470703125, 1.341644287109375, 1.4046478271484375, 1.4676513671875, 1.5306549072265625, 1.593658447265625, 1.6566619873046875, 1.71966552734375, 1.7826690673828125, 1.845672607421875, 1.9086761474609375, 1.9716796875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 15.0, 24.0, 27.0, 48.0, 92.0, 142.0, 205.0, 348.0, 573.0, 860.0, 1378.0, 2175.0, 3427.0, 5931.0, 9927.0, 16736.0, 28126.0, 47756.0, 78198.0, 120046.0, 158888.0, 171230.0, 143772.0, 100732.0, 63619.0, 38286.0, 22635.0, 13138.0, 7801.0, 4749.0, 2849.0, 1771.0, 1095.0, 685.0, 454.0, 296.0, 193.0, 115.0, 71.0, 47.0, 35.0, 19.0, 10.0, 9.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5107421875, -1.4666748046875, -1.422607421875, -1.3785400390625, -1.33447265625, -1.2904052734375, -1.246337890625, -1.2022705078125, -1.158203125, -1.1141357421875, -1.070068359375, -1.0260009765625, -0.98193359375, -0.9378662109375, -0.893798828125, -0.8497314453125, -0.8056640625, -0.7615966796875, -0.717529296875, -0.6734619140625, -0.62939453125, -0.5853271484375, -0.541259765625, -0.4971923828125, -0.453125, -0.4090576171875, -0.364990234375, -0.3209228515625, -0.27685546875, -0.2327880859375, -0.188720703125, -0.1446533203125, -0.1005859375, -0.0565185546875, -0.012451171875, 0.0316162109375, 0.07568359375, 0.1197509765625, 0.163818359375, 0.2078857421875, 0.251953125, 0.2960205078125, 0.340087890625, 0.3841552734375, 0.42822265625, 0.4722900390625, 0.516357421875, 0.5604248046875, 0.6044921875, 0.6485595703125, 0.692626953125, 0.7366943359375, 0.78076171875, 0.8248291015625, 0.868896484375, 0.9129638671875, 0.95703125, 1.0010986328125, 1.045166015625, 1.0892333984375, 1.13330078125, 1.1773681640625, 1.221435546875, 1.2655029296875, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 2.0, 10.0, 6.0, 14.0, 21.0, 21.0, 29.0, 35.0, 37.0, 45.0, 49.0, 51.0, 61.0, 56.0, 72.0, 58.0, 64.0, 59.0, 60.0, 46.0, 40.0, 35.0, 27.0, 18.0, 20.0, 12.0, 10.0, 10.0, 5.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001633167266845703, -0.0001587122678756714, -0.00015410780906677246, -0.00014950335025787354, -0.0001448988914489746, -0.00014029443264007568, -0.00013568997383117676, -0.00013108551502227783, -0.0001264810562133789, -0.00012187659740447998, -0.00011727213859558105, -0.00011266767978668213, -0.0001080632209777832, -0.00010345876216888428, -9.885430335998535e-05, -9.424984455108643e-05, -8.96453857421875e-05, -8.504092693328857e-05, -8.043646812438965e-05, -7.583200931549072e-05, -7.12275505065918e-05, -6.662309169769287e-05, -6.201863288879395e-05, -5.741417407989502e-05, -5.2809715270996094e-05, -4.820525646209717e-05, -4.360079765319824e-05, -3.8996338844299316e-05, -3.439188003540039e-05, -2.9787421226501465e-05, -2.518296241760254e-05, -2.0578503608703613e-05, -1.5974044799804688e-05, -1.1369585990905762e-05, -6.765127182006836e-06, -2.16066837310791e-06, 2.4437904357910156e-06, 7.048249244689941e-06, 1.1652708053588867e-05, 1.6257166862487793e-05, 2.086162567138672e-05, 2.5466084480285645e-05, 3.007054328918457e-05, 3.4675002098083496e-05, 3.927946090698242e-05, 4.388391971588135e-05, 4.8488378524780273e-05, 5.30928373336792e-05, 5.7697296142578125e-05, 6.230175495147705e-05, 6.690621376037598e-05, 7.15106725692749e-05, 7.611513137817383e-05, 8.071959018707275e-05, 8.532404899597168e-05, 8.99285078048706e-05, 9.453296661376953e-05, 9.913742542266846e-05, 0.00010374188423156738, 0.00010834634304046631, 0.00011295080184936523, 0.00011755526065826416, 0.00012215971946716309, 0.000126764178276062, 0.00013136863708496094]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 10.0, 21.0, 19.0, 26.0, 48.0, 69.0, 99.0, 179.0, 261.0, 492.0, 844.0, 1447.0, 2467.0, 4469.0, 7932.0, 14283.0, 26335.0, 47849.0, 83905.0, 135459.0, 183642.0, 187078.0, 143315.0, 91260.0, 52078.0, 29050.0, 15789.0, 8736.0, 4756.0, 2782.0, 1562.0, 881.0, 557.0, 287.0, 199.0, 114.0, 83.0, 51.0, 22.0, 22.0, 15.0, 14.0, 11.0, 8.0, 2.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.658203125, -1.6095428466796875, -1.560882568359375, -1.5122222900390625, -1.46356201171875, -1.4149017333984375, -1.366241455078125, -1.3175811767578125, -1.2689208984375, -1.2202606201171875, -1.171600341796875, -1.1229400634765625, -1.07427978515625, -1.0256195068359375, -0.976959228515625, -0.9282989501953125, -0.879638671875, -0.8309783935546875, -0.782318115234375, -0.7336578369140625, -0.68499755859375, -0.6363372802734375, -0.587677001953125, -0.5390167236328125, -0.4903564453125, -0.4416961669921875, -0.393035888671875, -0.3443756103515625, -0.29571533203125, -0.2470550537109375, -0.198394775390625, -0.1497344970703125, -0.10107421875, -0.0524139404296875, -0.003753662109375, 0.0449066162109375, 0.09356689453125, 0.1422271728515625, 0.190887451171875, 0.2395477294921875, 0.2882080078125, 0.3368682861328125, 0.385528564453125, 0.4341888427734375, 0.48284912109375, 0.5315093994140625, 0.580169677734375, 0.6288299560546875, 0.677490234375, 0.7261505126953125, 0.774810791015625, 0.8234710693359375, 0.87213134765625, 0.9207916259765625, 0.969451904296875, 1.0181121826171875, 1.0667724609375, 1.1154327392578125, 1.164093017578125, 1.2127532958984375, 1.26141357421875, 1.3100738525390625, 1.358734130859375, 1.4073944091796875, 1.4560546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 13.0, 9.0, 16.0, 17.0, 23.0, 31.0, 19.0, 29.0, 31.0, 54.0, 49.0, 45.0, 43.0, 51.0, 45.0, 45.0, 55.0, 50.0, 43.0, 40.0, 40.0, 37.0, 26.0, 29.0, 21.0, 28.0, 22.0, 12.0, 10.0, 12.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.38423919677734375, -0.3710174560546875, -0.35779571533203125, -0.344573974609375, -0.33135223388671875, -0.3181304931640625, -0.30490875244140625, -0.29168701171875, -0.27846527099609375, -0.2652435302734375, -0.25202178955078125, -0.238800048828125, -0.22557830810546875, -0.2123565673828125, -0.19913482666015625, -0.1859130859375, -0.17269134521484375, -0.1594696044921875, -0.14624786376953125, -0.133026123046875, -0.11980438232421875, -0.1065826416015625, -0.09336090087890625, -0.08013916015625, -0.06691741943359375, -0.0536956787109375, -0.04047393798828125, -0.027252197265625, -0.01403045654296875, -0.0008087158203125, 0.01241302490234375, 0.025634765625, 0.03885650634765625, 0.0520782470703125, 0.06529998779296875, 0.078521728515625, 0.09174346923828125, 0.1049652099609375, 0.11818695068359375, 0.13140869140625, 0.14463043212890625, 0.1578521728515625, 0.17107391357421875, 0.184295654296875, 0.19751739501953125, 0.2107391357421875, 0.22396087646484375, 0.2371826171875, 0.25040435791015625, 0.2636260986328125, 0.27684783935546875, 0.290069580078125, 0.30329132080078125, 0.3165130615234375, 0.32973480224609375, 0.34295654296875, 0.35617828369140625, 0.3694000244140625, 0.38262176513671875, 0.395843505859375, 0.40906524658203125, 0.4222869873046875, 0.43550872802734375, 0.44873046875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 12.0, 11.0, 25.0, 33.0, 33.0, 42.0, 55.0, 74.0, 79.0, 87.0, 91.0, 107.0, 87.0, 66.0, 41.0, 35.0, 40.0, 19.0, 16.0, 12.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-13.601099967956543, -13.304840087890625, -13.008581161499023, -12.712321281433105, -12.416061401367188, -12.119802474975586, -11.823542594909668, -11.52728271484375, -11.231023788452148, -10.93476390838623, -10.638504981994629, -10.342245101928711, -10.04598617553711, -9.749726295471191, -9.453466415405273, -9.157207489013672, -8.860947608947754, -8.564687728881836, -8.268428802490234, -7.972168922424316, -7.675909519195557, -7.379650115966797, -7.083390235900879, -6.787130832672119, -6.490871429443359, -6.1946120262146, -5.89835262298584, -5.602092742919922, -5.305833339691162, -5.009573936462402, -4.713314056396484, -4.417054653167725, -4.120794296264648, -3.8245348930358887, -3.52827525138855, -3.232015609741211, -2.935756206512451, -2.6394968032836914, -2.3432371616363525, -2.0469775199890137, -1.750718116760254, -1.4544585943222046, -1.1581990718841553, -0.861939549446106, -0.5656800270080566, -0.2694205045700073, 0.026839017868041992, 0.32309865951538086, 0.6193580627441406, 0.9156175851821899, 1.2118771076202393, 1.5081366300582886, 1.804396152496338, 2.1006555557250977, 2.3969151973724365, 2.6931748390197754, 2.989434242248535, 3.285693645477295, 3.581953287124634, 3.8782129287719727, 4.174472332000732, 4.470731735229492, 4.76699161529541, 5.06325101852417, 5.35951042175293]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 10.0, 14.0, 20.0, 21.0, 30.0, 30.0, 25.0, 32.0, 26.0, 33.0, 40.0, 44.0, 40.0, 36.0, 50.0, 54.0, 59.0, 54.0, 35.0, 53.0, 43.0, 42.0, 34.0, 30.0, 31.0, 26.0, 11.0, 16.0, 9.0, 11.0, 6.0, 8.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.361629009246826, -4.244543075561523, -4.1274566650390625, -4.01037073135376, -3.893284797668457, -3.776198625564575, -3.6591124534606934, -3.5420265197753906, -3.424940347671509, -3.307854175567627, -3.190768241882324, -3.0736820697784424, -2.9565958976745605, -2.839509963989258, -2.722423791885376, -2.605337619781494, -2.4882516860961914, -2.3711655139923096, -2.254079580307007, -2.136993408203125, -2.0199074745178223, -1.9028213024139404, -1.7857351303100586, -1.6686490774154663, -1.551563024520874, -1.4344769716262817, -1.3173909187316895, -1.2003047466278076, -1.0832186937332153, -0.966132640838623, -0.849046528339386, -0.7319604158401489, -0.6148743629455566, -0.49778828024864197, -0.3807021975517273, -0.2636161148548126, -0.14653003215789795, -0.029443979263305664, 0.0876421332359314, 0.20472824573516846, 0.32181429862976074, 0.4389003813266754, 0.5559864640235901, 0.6730725765228271, 0.7901586294174194, 0.9072446823120117, 1.0243308544158936, 1.1414169073104858, 1.2585029602050781, 1.3755890130996704, 1.4926750659942627, 1.6097612380981445, 1.7268472909927368, 1.843933343887329, 1.961019515991211, 2.0781054496765137, 2.1951916217803955, 2.3122777938842773, 2.42936372756958, 2.546449899673462, 2.6635360717773438, 2.7806220054626465, 2.8977081775665283, 3.01479434967041, 3.131880283355713]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 15.0, 13.0, 16.0, 29.0, 41.0, 49.0, 50.0, 92.0, 113.0, 222.0, 299.0, 445.0, 733.0, 1168.0, 2006.0, 3221.0, 5654.0, 10816.0, 20380.0, 42956.0, 101702.0, 281230.0, 863378.0, 1570182.0, 839419.0, 267896.0, 97368.0, 41311.0, 19769.0, 9995.0, 5636.0, 3166.0, 1766.0, 1080.0, 730.0, 465.0, 270.0, 197.0, 116.0, 76.0, 68.0, 40.0, 32.0, 19.0, 14.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 2.0, 4.0], "bins": [-7.8671875, -7.6390380859375, -7.410888671875, -7.1827392578125, -6.95458984375, -6.7264404296875, -6.498291015625, -6.2701416015625, -6.0419921875, -5.8138427734375, -5.585693359375, -5.3575439453125, -5.12939453125, -4.9012451171875, -4.673095703125, -4.4449462890625, -4.216796875, -3.9886474609375, -3.760498046875, -3.5323486328125, -3.30419921875, -3.0760498046875, -2.847900390625, -2.6197509765625, -2.3916015625, -2.1634521484375, -1.935302734375, -1.7071533203125, -1.47900390625, -1.2508544921875, -1.022705078125, -0.7945556640625, -0.56640625, -0.3382568359375, -0.110107421875, 0.1180419921875, 0.34619140625, 0.5743408203125, 0.802490234375, 1.0306396484375, 1.2587890625, 1.4869384765625, 1.715087890625, 1.9432373046875, 2.17138671875, 2.3995361328125, 2.627685546875, 2.8558349609375, 3.083984375, 3.3121337890625, 3.540283203125, 3.7684326171875, 3.99658203125, 4.2247314453125, 4.452880859375, 4.6810302734375, 4.9091796875, 5.1373291015625, 5.365478515625, 5.5936279296875, 5.82177734375, 6.0499267578125, 6.278076171875, 6.5062255859375, 6.734375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 3.0, 8.0, 9.0, 12.0, 18.0, 16.0, 17.0, 17.0, 31.0, 23.0, 38.0, 35.0, 37.0, 46.0, 31.0, 57.0, 44.0, 46.0, 42.0, 43.0, 52.0, 40.0, 41.0, 31.0, 40.0, 44.0, 28.0, 23.0, 20.0, 22.0, 15.0, 9.0, 13.0, 6.0, 6.0, 9.0, 8.0, 2.0, 8.0, 2.0, 3.0], "bins": [-3.458984375, -3.3746337890625, -3.290283203125, -3.2059326171875, -3.12158203125, -3.0372314453125, -2.952880859375, -2.8685302734375, -2.7841796875, -2.6998291015625, -2.615478515625, -2.5311279296875, -2.44677734375, -2.3624267578125, -2.278076171875, -2.1937255859375, -2.109375, -2.0250244140625, -1.940673828125, -1.8563232421875, -1.77197265625, -1.6876220703125, -1.603271484375, -1.5189208984375, -1.4345703125, -1.3502197265625, -1.265869140625, -1.1815185546875, -1.09716796875, -1.0128173828125, -0.928466796875, -0.8441162109375, -0.759765625, -0.6754150390625, -0.591064453125, -0.5067138671875, -0.42236328125, -0.3380126953125, -0.253662109375, -0.1693115234375, -0.0849609375, -0.0006103515625, 0.083740234375, 0.1680908203125, 0.25244140625, 0.3367919921875, 0.421142578125, 0.5054931640625, 0.58984375, 0.6741943359375, 0.758544921875, 0.8428955078125, 0.92724609375, 1.0115966796875, 1.095947265625, 1.1802978515625, 1.2646484375, 1.3489990234375, 1.433349609375, 1.5177001953125, 1.60205078125, 1.6864013671875, 1.770751953125, 1.8551025390625, 1.939453125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 9.0, 18.0, 35.0, 35.0, 85.0, 94.0, 157.0, 202.0, 360.0, 568.0, 905.0, 1489.0, 2313.0, 3727.0, 6302.0, 10371.0, 17859.0, 31956.0, 60561.0, 119291.0, 252675.0, 552885.0, 1064235.0, 1041923.0, 533769.0, 243963.0, 115686.0, 58350.0, 31262.0, 17245.0, 10099.0, 6010.0, 3711.0, 2347.0, 1396.0, 838.0, 536.0, 352.0, 248.0, 139.0, 93.0, 60.0, 42.0, 28.0, 20.0, 11.0, 8.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.91015625, -5.7193603515625, -5.528564453125, -5.3377685546875, -5.14697265625, -4.9561767578125, -4.765380859375, -4.5745849609375, -4.3837890625, -4.1929931640625, -4.002197265625, -3.8114013671875, -3.62060546875, -3.4298095703125, -3.239013671875, -3.0482177734375, -2.857421875, -2.6666259765625, -2.475830078125, -2.2850341796875, -2.09423828125, -1.9034423828125, -1.712646484375, -1.5218505859375, -1.3310546875, -1.1402587890625, -0.949462890625, -0.7586669921875, -0.56787109375, -0.3770751953125, -0.186279296875, 0.0045166015625, 0.1953125, 0.3861083984375, 0.576904296875, 0.7677001953125, 0.95849609375, 1.1492919921875, 1.340087890625, 1.5308837890625, 1.7216796875, 1.9124755859375, 2.103271484375, 2.2940673828125, 2.48486328125, 2.6756591796875, 2.866455078125, 3.0572509765625, 3.248046875, 3.4388427734375, 3.629638671875, 3.8204345703125, 4.01123046875, 4.2020263671875, 4.392822265625, 4.5836181640625, 4.7744140625, 4.9652099609375, 5.156005859375, 5.3468017578125, 5.53759765625, 5.7283935546875, 5.919189453125, 6.1099853515625, 6.30078125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 11.0, 8.0, 15.0, 23.0, 35.0, 46.0, 49.0, 55.0, 88.0, 106.0, 138.0, 193.0, 237.0, 280.0, 336.0, 385.0, 392.0, 339.0, 318.0, 239.0, 192.0, 148.0, 109.0, 93.0, 58.0, 46.0, 31.0, 28.0, 20.0, 14.0, 9.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8965301513671875, -1.831146240234375, -1.7657623291015625, -1.70037841796875, -1.6349945068359375, -1.569610595703125, -1.5042266845703125, -1.4388427734375, -1.3734588623046875, -1.308074951171875, -1.2426910400390625, -1.17730712890625, -1.1119232177734375, -1.046539306640625, -0.9811553955078125, -0.915771484375, -0.8503875732421875, -0.785003662109375, -0.7196197509765625, -0.65423583984375, -0.5888519287109375, -0.523468017578125, -0.4580841064453125, -0.3927001953125, -0.3273162841796875, -0.261932373046875, -0.1965484619140625, -0.13116455078125, -0.0657806396484375, -0.000396728515625, 0.0649871826171875, 0.13037109375, 0.1957550048828125, 0.261138916015625, 0.3265228271484375, 0.39190673828125, 0.4572906494140625, 0.522674560546875, 0.5880584716796875, 0.6534423828125, 0.7188262939453125, 0.784210205078125, 0.8495941162109375, 0.91497802734375, 0.9803619384765625, 1.045745849609375, 1.1111297607421875, 1.176513671875, 1.2418975830078125, 1.307281494140625, 1.3726654052734375, 1.43804931640625, 1.5034332275390625, 1.568817138671875, 1.6342010498046875, 1.6995849609375, 1.7649688720703125, 1.830352783203125, 1.8957366943359375, 1.96112060546875, 2.0265045166015625, 2.091888427734375, 2.1572723388671875, 2.22265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 9.0, 8.0, 6.0, 8.0, 22.0, 27.0, 34.0, 35.0, 65.0, 62.0, 101.0, 115.0, 118.0, 107.0, 85.0, 58.0, 47.0, 24.0, 25.0, 18.0, 11.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.51675796508789, -16.16375160217285, -15.810744285583496, -15.45773696899414, -15.104729652404785, -14.75172233581543, -14.39871597290039, -14.045708656311035, -13.69270133972168, -13.339694023132324, -12.986687660217285, -12.63368034362793, -12.280673027038574, -11.927665710449219, -11.57465934753418, -11.221652030944824, -10.868644714355469, -10.515637397766113, -10.162631034851074, -9.809623718261719, -9.456616401672363, -9.103609085083008, -8.750602722167969, -8.397595405578613, -8.044589042663574, -7.691582202911377, -7.3385748863220215, -6.985568046569824, -6.632560729980469, -6.2795538902282715, -5.926547050476074, -5.573539733886719, -5.220532417297363, -4.867525577545166, -4.5145182609558105, -4.161511421203613, -3.808504104614258, -3.4554972648620605, -3.102490186691284, -2.749483108520508, -2.3964760303497314, -2.043468952178955, -1.6904618740081787, -1.337454915046692, -0.9844478368759155, -0.6314407587051392, -0.27843379974365234, 0.07457327842712402, 0.4275803565979004, 0.7805874347686768, 1.1335945129394531, 1.48660147190094, 1.8396085500717163, 2.192615509033203, 2.5456225872039795, 2.898629665374756, 3.2516367435455322, 3.6046438217163086, 3.957650899887085, 4.310657978057861, 4.663664817810059, 5.016672134399414, 5.369678974151611, 5.722685813903809, 6.075693130493164]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 11.0, 16.0, 15.0, 15.0, 13.0, 20.0, 29.0, 21.0, 30.0, 18.0, 33.0, 35.0, 29.0, 32.0, 33.0, 41.0, 32.0, 39.0, 39.0, 34.0, 51.0, 44.0, 41.0, 45.0, 32.0, 32.0, 32.0, 24.0, 25.0, 17.0, 21.0, 14.0, 17.0, 16.0, 11.0, 17.0, 7.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3351566791534424, -3.2348620891571045, -3.1345677375793457, -3.034273147583008, -2.933978796005249, -2.833684206008911, -2.7333898544311523, -2.6330952644348145, -2.5328006744384766, -2.4325060844421387, -2.33221173286438, -2.231917142868042, -2.131622791290283, -2.0313282012939453, -1.931033730506897, -1.8307392597198486, -1.7304449081420898, -1.6301504373550415, -1.5298559665679932, -1.4295613765716553, -1.3292670249938965, -1.2289724349975586, -1.1286779642105103, -1.028383493423462, -0.9280890226364136, -0.8277945518493652, -0.7275000810623169, -0.6272055506706238, -0.5269110798835754, -0.4266166090965271, -0.326322078704834, -0.22602760791778564, -0.1257328987121582, -0.02543841302394867, 0.07485607266426086, 0.1751505732536316, 0.27544504404067993, 0.37573951482772827, 0.4760340452194214, 0.5763285160064697, 0.6766229867935181, 0.7769174575805664, 0.8772119283676147, 0.9775064587593079, 1.077800989151001, 1.1780953407287598, 1.2783899307250977, 1.378684401512146, 1.4789788722991943, 1.5792733430862427, 1.679567813873291, 1.779862403869629, 1.8801567554473877, 1.9804513454437256, 2.0807456970214844, 2.1810402870178223, 2.28133487701416, 2.381629467010498, 2.481923818588257, 2.5822184085845947, 2.6825127601623535, 2.7828073501586914, 2.8831019401550293, 2.983396291732788, 3.083690643310547]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 8.0, 12.0, 23.0, 31.0, 50.0, 109.0, 147.0, 262.0, 408.0, 773.0, 1273.0, 2444.0, 4289.0, 7693.0, 13997.0, 26017.0, 47732.0, 85928.0, 141485.0, 192018.0, 192486.0, 140728.0, 85264.0, 47643.0, 26013.0, 14175.0, 7729.0, 4264.0, 2352.0, 1322.0, 737.0, 432.0, 275.0, 153.0, 108.0, 52.0, 44.0, 24.0, 21.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.5546875, -2.481689453125, -2.40869140625, -2.335693359375, -2.2626953125, -2.189697265625, -2.11669921875, -2.043701171875, -1.970703125, -1.897705078125, -1.82470703125, -1.751708984375, -1.6787109375, -1.605712890625, -1.53271484375, -1.459716796875, -1.38671875, -1.313720703125, -1.24072265625, -1.167724609375, -1.0947265625, -1.021728515625, -0.94873046875, -0.875732421875, -0.802734375, -0.729736328125, -0.65673828125, -0.583740234375, -0.5107421875, -0.437744140625, -0.36474609375, -0.291748046875, -0.21875, -0.145751953125, -0.07275390625, 0.000244140625, 0.0732421875, 0.146240234375, 0.21923828125, 0.292236328125, 0.365234375, 0.438232421875, 0.51123046875, 0.584228515625, 0.6572265625, 0.730224609375, 0.80322265625, 0.876220703125, 0.94921875, 1.022216796875, 1.09521484375, 1.168212890625, 1.2412109375, 1.314208984375, 1.38720703125, 1.460205078125, 1.533203125, 1.606201171875, 1.67919921875, 1.752197265625, 1.8251953125, 1.898193359375, 1.97119140625, 2.044189453125, 2.1171875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 5.0, 12.0, 7.0, 8.0, 7.0, 10.0, 24.0, 15.0, 22.0, 16.0, 28.0, 26.0, 27.0, 22.0, 28.0, 32.0, 29.0, 33.0, 38.0, 30.0, 43.0, 35.0, 33.0, 35.0, 45.0, 40.0, 26.0, 43.0, 33.0, 40.0, 24.0, 21.0, 29.0, 11.0, 21.0, 23.0, 17.0, 12.0, 11.0, 9.0, 7.0, 6.0, 7.0, 9.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.30859375, -3.208160400390625, -3.10772705078125, -3.007293701171875, -2.9068603515625, -2.806427001953125, -2.70599365234375, -2.605560302734375, -2.505126953125, -2.404693603515625, -2.30426025390625, -2.203826904296875, -2.1033935546875, -2.002960205078125, -1.90252685546875, -1.802093505859375, -1.70166015625, -1.601226806640625, -1.50079345703125, -1.400360107421875, -1.2999267578125, -1.199493408203125, -1.09906005859375, -0.998626708984375, -0.898193359375, -0.797760009765625, -0.69732666015625, -0.596893310546875, -0.4964599609375, -0.396026611328125, -0.29559326171875, -0.195159912109375, -0.0947265625, 0.005706787109375, 0.10614013671875, 0.206573486328125, 0.3070068359375, 0.407440185546875, 0.50787353515625, 0.608306884765625, 0.708740234375, 0.809173583984375, 0.90960693359375, 1.010040283203125, 1.1104736328125, 1.210906982421875, 1.31134033203125, 1.411773681640625, 1.51220703125, 1.612640380859375, 1.71307373046875, 1.813507080078125, 1.9139404296875, 2.014373779296875, 2.11480712890625, 2.215240478515625, 2.315673828125, 2.416107177734375, 2.51654052734375, 2.616973876953125, 2.7174072265625, 2.817840576171875, 2.91827392578125, 3.018707275390625, 3.119140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 9.0, 19.0, 34.0, 27.0, 57.0, 74.0, 121.0, 213.0, 301.0, 453.0, 769.0, 1173.0, 1786.0, 2984.0, 4625.0, 7577.0, 12425.0, 19949.0, 32829.0, 53371.0, 85742.0, 130964.0, 174308.0, 172761.0, 128386.0, 83422.0, 51649.0, 31918.0, 19119.0, 11813.0, 7318.0, 4519.0, 2871.0, 1765.0, 1161.0, 769.0, 455.0, 289.0, 185.0, 122.0, 79.0, 44.0, 29.0, 31.0, 14.0, 7.0, 3.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.020111083984375, -1.95037841796875, -1.880645751953125, -1.8109130859375, -1.741180419921875, -1.67144775390625, -1.601715087890625, -1.531982421875, -1.462249755859375, -1.39251708984375, -1.322784423828125, -1.2530517578125, -1.183319091796875, -1.11358642578125, -1.043853759765625, -0.97412109375, -0.904388427734375, -0.83465576171875, -0.764923095703125, -0.6951904296875, -0.625457763671875, -0.55572509765625, -0.485992431640625, -0.416259765625, -0.346527099609375, -0.27679443359375, -0.207061767578125, -0.1373291015625, -0.067596435546875, 0.00213623046875, 0.071868896484375, 0.1416015625, 0.211334228515625, 0.28106689453125, 0.350799560546875, 0.4205322265625, 0.490264892578125, 0.55999755859375, 0.629730224609375, 0.699462890625, 0.769195556640625, 0.83892822265625, 0.908660888671875, 0.9783935546875, 1.048126220703125, 1.11785888671875, 1.187591552734375, 1.25732421875, 1.327056884765625, 1.39678955078125, 1.466522216796875, 1.5362548828125, 1.605987548828125, 1.67572021484375, 1.745452880859375, 1.815185546875, 1.884918212890625, 1.95465087890625, 2.024383544921875, 2.0941162109375, 2.163848876953125, 2.23358154296875, 2.303314208984375, 2.373046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 8.0, 7.0, 14.0, 10.0, 10.0, 6.0, 12.0, 12.0, 23.0, 21.0, 25.0, 25.0, 26.0, 30.0, 28.0, 39.0, 33.0, 34.0, 44.0, 48.0, 27.0, 35.0, 41.0, 38.0, 37.0, 39.0, 47.0, 35.0, 29.0, 27.0, 21.0, 24.0, 23.0, 16.0, 14.0, 19.0, 17.0, 15.0, 5.0, 6.0, 7.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.990234375, -1.931304931640625, -1.87237548828125, -1.813446044921875, -1.7545166015625, -1.695587158203125, -1.63665771484375, -1.577728271484375, -1.518798828125, -1.459869384765625, -1.40093994140625, -1.342010498046875, -1.2830810546875, -1.224151611328125, -1.16522216796875, -1.106292724609375, -1.04736328125, -0.988433837890625, -0.92950439453125, -0.870574951171875, -0.8116455078125, -0.752716064453125, -0.69378662109375, -0.634857177734375, -0.575927734375, -0.516998291015625, -0.45806884765625, -0.399139404296875, -0.3402099609375, -0.281280517578125, -0.22235107421875, -0.163421630859375, -0.1044921875, -0.045562744140625, 0.01336669921875, 0.072296142578125, 0.1312255859375, 0.190155029296875, 0.24908447265625, 0.308013916015625, 0.366943359375, 0.425872802734375, 0.48480224609375, 0.543731689453125, 0.6026611328125, 0.661590576171875, 0.72052001953125, 0.779449462890625, 0.83837890625, 0.897308349609375, 0.95623779296875, 1.015167236328125, 1.0740966796875, 1.133026123046875, 1.19195556640625, 1.250885009765625, 1.309814453125, 1.368743896484375, 1.42767333984375, 1.486602783203125, 1.5455322265625, 1.604461669921875, 1.66339111328125, 1.722320556640625, 1.78125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 13.0, 20.0, 22.0, 28.0, 56.0, 86.0, 94.0, 166.0, 221.0, 397.0, 650.0, 1221.0, 2019.0, 3674.0, 7293.0, 14174.0, 29187.0, 61636.0, 131734.0, 245086.0, 263779.0, 149585.0, 70906.0, 33098.0, 15871.0, 8007.0, 4234.0, 2160.0, 1196.0, 710.0, 414.0, 276.0, 166.0, 106.0, 77.0, 44.0, 41.0, 32.0, 16.0, 11.0, 10.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5849609375, -1.5370635986328125, -1.489166259765625, -1.4412689208984375, -1.39337158203125, -1.3454742431640625, -1.297576904296875, -1.2496795654296875, -1.2017822265625, -1.1538848876953125, -1.105987548828125, -1.0580902099609375, -1.01019287109375, -0.9622955322265625, -0.914398193359375, -0.8665008544921875, -0.818603515625, -0.7707061767578125, -0.722808837890625, -0.6749114990234375, -0.62701416015625, -0.5791168212890625, -0.531219482421875, -0.4833221435546875, -0.4354248046875, -0.3875274658203125, -0.339630126953125, -0.2917327880859375, -0.24383544921875, -0.1959381103515625, -0.148040771484375, -0.1001434326171875, -0.05224609375, -0.0043487548828125, 0.043548583984375, 0.0914459228515625, 0.13934326171875, 0.1872406005859375, 0.235137939453125, 0.2830352783203125, 0.3309326171875, 0.3788299560546875, 0.426727294921875, 0.4746246337890625, 0.52252197265625, 0.5704193115234375, 0.618316650390625, 0.6662139892578125, 0.714111328125, 0.7620086669921875, 0.809906005859375, 0.8578033447265625, 0.90570068359375, 0.9535980224609375, 1.001495361328125, 1.0493927001953125, 1.0972900390625, 1.1451873779296875, 1.193084716796875, 1.2409820556640625, 1.28887939453125, 1.3367767333984375, 1.384674072265625, 1.4325714111328125, 1.48046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 9.0, 7.0, 11.0, 11.0, 24.0, 19.0, 19.0, 22.0, 30.0, 41.0, 49.0, 43.0, 43.0, 56.0, 55.0, 55.0, 48.0, 59.0, 52.0, 47.0, 52.0, 47.0, 29.0, 34.0, 20.0, 17.0, 21.0, 14.0, 11.0, 9.0, 6.0, 7.0, 9.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.857778549194336e-05, -4.682503640651703e-05, -4.50722873210907e-05, -4.331953823566437e-05, -4.156678915023804e-05, -3.9814040064811707e-05, -3.8061290979385376e-05, -3.6308541893959045e-05, -3.4555792808532715e-05, -3.2803043723106384e-05, -3.1050294637680054e-05, -2.9297545552253723e-05, -2.7544796466827393e-05, -2.5792047381401062e-05, -2.403929829597473e-05, -2.22865492105484e-05, -2.053380012512207e-05, -1.878105103969574e-05, -1.702830195426941e-05, -1.527555286884308e-05, -1.3522803783416748e-05, -1.1770054697990417e-05, -1.0017305612564087e-05, -8.264556527137756e-06, -6.511807441711426e-06, -4.759058356285095e-06, -3.0063092708587646e-06, -1.253560185432434e-06, 4.991888999938965e-07, 2.251937985420227e-06, 4.004687070846558e-06, 5.757436156272888e-06, 7.510185241699219e-06, 9.26293432712555e-06, 1.101568341255188e-05, 1.276843249797821e-05, 1.4521181583404541e-05, 1.627393066883087e-05, 1.8026679754257202e-05, 1.9779428839683533e-05, 2.1532177925109863e-05, 2.3284927010536194e-05, 2.5037676095962524e-05, 2.6790425181388855e-05, 2.8543174266815186e-05, 3.0295923352241516e-05, 3.204867243766785e-05, 3.380142152309418e-05, 3.555417060852051e-05, 3.730691969394684e-05, 3.905966877937317e-05, 4.08124178647995e-05, 4.256516695022583e-05, 4.431791603565216e-05, 4.607066512107849e-05, 4.782341420650482e-05, 4.957616329193115e-05, 5.132891237735748e-05, 5.3081661462783813e-05, 5.4834410548210144e-05, 5.6587159633636475e-05, 5.8339908719062805e-05, 6.0092657804489136e-05, 6.184540688991547e-05, 6.35981559753418e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 16.0, 21.0, 37.0, 63.0, 70.0, 116.0, 207.0, 260.0, 397.0, 705.0, 1054.0, 1552.0, 2446.0, 3774.0, 5988.0, 9560.0, 15209.0, 24832.0, 38735.0, 60572.0, 89129.0, 121649.0, 145790.0, 145514.0, 122064.0, 90092.0, 61502.0, 39877.0, 25019.0, 15601.0, 9636.0, 6210.0, 3788.0, 2541.0, 1579.0, 1018.0, 683.0, 439.0, 276.0, 186.0, 116.0, 78.0, 60.0, 26.0, 21.0, 14.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.8828125, -0.8552398681640625, -0.827667236328125, -0.8000946044921875, -0.77252197265625, -0.7449493408203125, -0.717376708984375, -0.6898040771484375, -0.6622314453125, -0.6346588134765625, -0.607086181640625, -0.5795135498046875, -0.55194091796875, -0.5243682861328125, -0.496795654296875, -0.4692230224609375, -0.441650390625, -0.4140777587890625, -0.386505126953125, -0.3589324951171875, -0.33135986328125, -0.3037872314453125, -0.276214599609375, -0.2486419677734375, -0.2210693359375, -0.1934967041015625, -0.165924072265625, -0.1383514404296875, -0.11077880859375, -0.0832061767578125, -0.055633544921875, -0.0280609130859375, -0.00048828125, 0.0270843505859375, 0.054656982421875, 0.0822296142578125, 0.10980224609375, 0.1373748779296875, 0.164947509765625, 0.1925201416015625, 0.2200927734375, 0.2476654052734375, 0.275238037109375, 0.3028106689453125, 0.33038330078125, 0.3579559326171875, 0.385528564453125, 0.4131011962890625, 0.440673828125, 0.4682464599609375, 0.495819091796875, 0.5233917236328125, 0.55096435546875, 0.5785369873046875, 0.606109619140625, 0.6336822509765625, 0.6612548828125, 0.6888275146484375, 0.716400146484375, 0.7439727783203125, 0.77154541015625, 0.7991180419921875, 0.826690673828125, 0.8542633056640625, 0.8818359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 4.0, 2.0, 6.0, 10.0, 10.0, 10.0, 10.0, 19.0, 21.0, 29.0, 38.0, 36.0, 46.0, 55.0, 79.0, 48.0, 63.0, 49.0, 57.0, 61.0, 53.0, 47.0, 41.0, 32.0, 24.0, 23.0, 14.0, 18.0, 14.0, 16.0, 12.0, 7.0, 8.0, 6.0, 6.0, 6.0, 4.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.28974151611328125, -0.2806549072265625, -0.27156829833984375, -0.262481689453125, -0.25339508056640625, -0.2443084716796875, -0.23522186279296875, -0.22613525390625, -0.21704864501953125, -0.2079620361328125, -0.19887542724609375, -0.189788818359375, -0.18070220947265625, -0.1716156005859375, -0.16252899169921875, -0.1534423828125, -0.14435577392578125, -0.1352691650390625, -0.12618255615234375, -0.117095947265625, -0.10800933837890625, -0.0989227294921875, -0.08983612060546875, -0.08074951171875, -0.07166290283203125, -0.0625762939453125, -0.05348968505859375, -0.044403076171875, -0.03531646728515625, -0.0262298583984375, -0.01714324951171875, -0.008056640625, 0.00102996826171875, 0.0101165771484375, 0.01920318603515625, 0.028289794921875, 0.03737640380859375, 0.0464630126953125, 0.05554962158203125, 0.06463623046875, 0.07372283935546875, 0.0828094482421875, 0.09189605712890625, 0.100982666015625, 0.11006927490234375, 0.1191558837890625, 0.12824249267578125, 0.1373291015625, 0.14641571044921875, 0.1555023193359375, 0.16458892822265625, 0.173675537109375, 0.18276214599609375, 0.1918487548828125, 0.20093536376953125, 0.21002197265625, 0.21910858154296875, 0.2281951904296875, 0.23728179931640625, 0.246368408203125, 0.25545501708984375, 0.2645416259765625, 0.27362823486328125, 0.28271484375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 24.0, 43.0, 31.0, 40.0, 63.0, 66.0, 106.0, 109.0, 121.0, 94.0, 77.0, 58.0, 38.0, 33.0, 17.0, 21.0, 10.0, 3.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.761994361877441, -15.422834396362305, -15.083675384521484, -14.744515419006348, -14.405355453491211, -14.066195487976074, -13.727036476135254, -13.387876510620117, -13.04871654510498, -12.709556579589844, -12.370397567749023, -12.031237602233887, -11.69207763671875, -11.352917671203613, -11.013758659362793, -10.674598693847656, -10.335439682006836, -9.9962797164917, -9.657120704650879, -9.317960739135742, -8.978800773620605, -8.639640808105469, -8.300481796264648, -7.961321830749512, -7.622161865234375, -7.2830023765563965, -6.94384241104126, -6.604682922363281, -6.2655229568481445, -5.926363468170166, -5.5872039794921875, -5.248044013977051, -4.908884525299072, -4.569725036621094, -4.230565071105957, -3.8914055824279785, -3.552245616912842, -3.2130861282348633, -2.8739264011383057, -2.534766674041748, -2.1956069469451904, -1.8564472198486328, -1.5172874927520752, -1.1781278848648071, -0.8389681577682495, -0.4998084306716919, -0.16064882278442383, 0.1785109043121338, 0.5176706314086914, 0.856830358505249, 1.1959900856018066, 1.5351496934890747, 1.8743094205856323, 2.2134690284729004, 2.552628755569458, 2.8917884826660156, 3.2309482097625732, 3.570107936859131, 3.9092676639556885, 4.248427391052246, 4.587586879730225, 4.926746845245361, 5.26590633392334, 5.605066299438477, 5.944225788116455]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 15.0, 11.0, 14.0, 18.0, 15.0, 19.0, 28.0, 24.0, 26.0, 19.0, 32.0, 39.0, 25.0, 34.0, 35.0, 36.0, 31.0, 47.0, 34.0, 41.0, 46.0, 36.0, 43.0, 52.0, 27.0, 32.0, 25.0, 28.0, 22.0, 22.0, 15.0, 16.0, 19.0, 16.0, 15.0, 10.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2714529037475586, -3.1733615398406982, -3.075270175933838, -2.9771788120269775, -2.879087448120117, -2.780996084213257, -2.6829047203063965, -2.5848135948181152, -2.486721992492676, -2.3886306285858154, -2.290539264678955, -2.1924479007720947, -2.0943565368652344, -1.996265172958374, -1.8981739282608032, -1.8000825643539429, -1.701991319656372, -1.6038999557495117, -1.5058085918426514, -1.407717227935791, -1.3096258640289307, -1.2115345001220703, -1.1134432554244995, -1.0153518915176392, -0.9172605276107788, -0.8191691637039185, -0.7210777997970581, -0.6229864954948425, -0.5248951315879822, -0.4268037676811218, -0.32871246337890625, -0.2306210994720459, -0.13252949714660645, -0.03443814814090729, 0.06365320086479187, 0.16174453496932983, 0.2598358988761902, 0.35792726278305054, 0.4560185670852661, 0.5541099309921265, 0.6522012948989868, 0.7502926588058472, 0.8483840227127075, 0.9464753270149231, 1.0445666313171387, 1.142657995223999, 1.2407493591308594, 1.3388407230377197, 1.43693208694458, 1.5350234508514404, 1.6331148147583008, 1.7312061786651611, 1.8292975425720215, 1.9273889064788818, 2.025480270385742, 2.1235713958740234, 2.221662998199463, 2.3197543621063232, 2.4178457260131836, 2.515937089920044, 2.6140284538269043, 2.7121198177337646, 2.810211181640625, 2.9083023071289062, 3.0063936710357666]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 10.0, 14.0, 11.0, 28.0, 45.0, 71.0, 123.0, 185.0, 299.0, 558.0, 967.0, 1699.0, 3090.0, 5594.0, 10329.0, 18542.0, 33287.0, 58317.0, 96273.0, 141888.0, 174180.0, 169834.0, 130860.0, 86237.0, 51181.0, 28795.0, 16042.0, 8801.0, 4974.0, 2699.0, 1570.0, 856.0, 508.0, 281.0, 188.0, 79.0, 56.0, 36.0, 12.0, 19.0, 12.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.48870849609375, -3.3719482421875, -3.25518798828125, -3.138427734375, -3.02166748046875, -2.9049072265625, -2.78814697265625, -2.67138671875, -2.55462646484375, -2.4378662109375, -2.32110595703125, -2.204345703125, -2.08758544921875, -1.9708251953125, -1.85406494140625, -1.7373046875, -1.62054443359375, -1.5037841796875, -1.38702392578125, -1.270263671875, -1.15350341796875, -1.0367431640625, -0.91998291015625, -0.80322265625, -0.68646240234375, -0.5697021484375, -0.45294189453125, -0.336181640625, -0.21942138671875, -0.1026611328125, 0.01409912109375, 0.130859375, 0.24761962890625, 0.3643798828125, 0.48114013671875, 0.597900390625, 0.71466064453125, 0.8314208984375, 0.94818115234375, 1.06494140625, 1.18170166015625, 1.2984619140625, 1.41522216796875, 1.531982421875, 1.64874267578125, 1.7655029296875, 1.88226318359375, 1.9990234375, 2.11578369140625, 2.2325439453125, 2.34930419921875, 2.466064453125, 2.58282470703125, 2.6995849609375, 2.81634521484375, 2.93310546875, 3.04986572265625, 3.1666259765625, 3.28338623046875, 3.400146484375, 3.51690673828125, 3.6336669921875, 3.75042724609375, 3.8671875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 11.0, 10.0, 13.0, 18.0, 24.0, 25.0, 29.0, 24.0, 23.0, 31.0, 23.0, 29.0, 37.0, 44.0, 40.0, 35.0, 29.0, 31.0, 43.0, 44.0, 45.0, 42.0, 43.0, 47.0, 26.0, 22.0, 29.0, 26.0, 25.0, 18.0, 18.0, 10.0, 16.0, 12.0, 10.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.544403076171875, -3.43450927734375, -3.324615478515625, -3.2147216796875, -3.104827880859375, -2.99493408203125, -2.885040283203125, -2.775146484375, -2.665252685546875, -2.55535888671875, -2.445465087890625, -2.3355712890625, -2.225677490234375, -2.11578369140625, -2.005889892578125, -1.89599609375, -1.786102294921875, -1.67620849609375, -1.566314697265625, -1.4564208984375, -1.346527099609375, -1.23663330078125, -1.126739501953125, -1.016845703125, -0.906951904296875, -0.79705810546875, -0.687164306640625, -0.5772705078125, -0.467376708984375, -0.35748291015625, -0.247589111328125, -0.1376953125, -0.027801513671875, 0.08209228515625, 0.191986083984375, 0.3018798828125, 0.411773681640625, 0.52166748046875, 0.631561279296875, 0.741455078125, 0.851348876953125, 0.96124267578125, 1.071136474609375, 1.1810302734375, 1.290924072265625, 1.40081787109375, 1.510711669921875, 1.62060546875, 1.730499267578125, 1.84039306640625, 1.950286865234375, 2.0601806640625, 2.170074462890625, 2.27996826171875, 2.389862060546875, 2.499755859375, 2.609649658203125, 2.71954345703125, 2.829437255859375, 2.9393310546875, 3.049224853515625, 3.15911865234375, 3.269012451171875, 3.37890625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 19.0, 23.0, 34.0, 39.0, 76.0, 86.0, 147.0, 243.0, 436.0, 799.0, 1436.0, 2774.0, 5245.0, 10056.0, 19264.0, 36707.0, 68123.0, 117276.0, 172693.0, 198573.0, 167392.0, 110618.0, 63877.0, 34548.0, 18036.0, 9518.0, 4781.0, 2532.0, 1344.0, 737.0, 434.0, 253.0, 132.0, 106.0, 58.0, 46.0, 23.0, 16.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.21484375, -4.080810546875, -3.94677734375, -3.812744140625, -3.6787109375, -3.544677734375, -3.41064453125, -3.276611328125, -3.142578125, -3.008544921875, -2.87451171875, -2.740478515625, -2.6064453125, -2.472412109375, -2.33837890625, -2.204345703125, -2.0703125, -1.936279296875, -1.80224609375, -1.668212890625, -1.5341796875, -1.400146484375, -1.26611328125, -1.132080078125, -0.998046875, -0.864013671875, -0.72998046875, -0.595947265625, -0.4619140625, -0.327880859375, -0.19384765625, -0.059814453125, 0.07421875, 0.208251953125, 0.34228515625, 0.476318359375, 0.6103515625, 0.744384765625, 0.87841796875, 1.012451171875, 1.146484375, 1.280517578125, 1.41455078125, 1.548583984375, 1.6826171875, 1.816650390625, 1.95068359375, 2.084716796875, 2.21875, 2.352783203125, 2.48681640625, 2.620849609375, 2.7548828125, 2.888916015625, 3.02294921875, 3.156982421875, 3.291015625, 3.425048828125, 3.55908203125, 3.693115234375, 3.8271484375, 3.961181640625, 4.09521484375, 4.229248046875, 4.36328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 13.0, 11.0, 14.0, 14.0, 17.0, 15.0, 18.0, 12.0, 21.0, 17.0, 27.0, 22.0, 32.0, 28.0, 32.0, 31.0, 38.0, 43.0, 46.0, 29.0, 42.0, 44.0, 34.0, 29.0, 34.0, 40.0, 27.0, 26.0, 21.0, 29.0, 24.0, 19.0, 22.0, 24.0, 19.0, 12.0, 12.0, 9.0, 5.0, 9.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8515625, -1.79150390625, -1.7314453125, -1.67138671875, -1.611328125, -1.55126953125, -1.4912109375, -1.43115234375, -1.37109375, -1.31103515625, -1.2509765625, -1.19091796875, -1.130859375, -1.07080078125, -1.0107421875, -0.95068359375, -0.890625, -0.83056640625, -0.7705078125, -0.71044921875, -0.650390625, -0.59033203125, -0.5302734375, -0.47021484375, -0.41015625, -0.35009765625, -0.2900390625, -0.22998046875, -0.169921875, -0.10986328125, -0.0498046875, 0.01025390625, 0.0703125, 0.13037109375, 0.1904296875, 0.25048828125, 0.310546875, 0.37060546875, 0.4306640625, 0.49072265625, 0.55078125, 0.61083984375, 0.6708984375, 0.73095703125, 0.791015625, 0.85107421875, 0.9111328125, 0.97119140625, 1.03125, 1.09130859375, 1.1513671875, 1.21142578125, 1.271484375, 1.33154296875, 1.3916015625, 1.45166015625, 1.51171875, 1.57177734375, 1.6318359375, 1.69189453125, 1.751953125, 1.81201171875, 1.8720703125, 1.93212890625, 1.9921875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 9.0, 27.0, 21.0, 36.0, 48.0, 66.0, 92.0, 123.0, 200.0, 265.0, 381.0, 638.0, 1064.0, 1640.0, 3060.0, 5351.0, 10679.0, 21784.0, 45994.0, 98174.0, 186310.0, 252912.0, 203371.0, 111661.0, 53267.0, 24623.0, 11931.0, 6184.0, 3374.0, 1886.0, 1156.0, 778.0, 489.0, 279.0, 231.0, 133.0, 82.0, 73.0, 41.0, 33.0, 22.0, 24.0, 8.0, 10.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.4375, -2.367034912109375, -2.29656982421875, -2.226104736328125, -2.1556396484375, -2.085174560546875, -2.01470947265625, -1.944244384765625, -1.873779296875, -1.803314208984375, -1.73284912109375, -1.662384033203125, -1.5919189453125, -1.521453857421875, -1.45098876953125, -1.380523681640625, -1.31005859375, -1.239593505859375, -1.16912841796875, -1.098663330078125, -1.0281982421875, -0.957733154296875, -0.88726806640625, -0.816802978515625, -0.746337890625, -0.675872802734375, -0.60540771484375, -0.534942626953125, -0.4644775390625, -0.394012451171875, -0.32354736328125, -0.253082275390625, -0.1826171875, -0.112152099609375, -0.04168701171875, 0.028778076171875, 0.0992431640625, 0.169708251953125, 0.24017333984375, 0.310638427734375, 0.381103515625, 0.451568603515625, 0.52203369140625, 0.592498779296875, 0.6629638671875, 0.733428955078125, 0.80389404296875, 0.874359130859375, 0.94482421875, 1.015289306640625, 1.08575439453125, 1.156219482421875, 1.2266845703125, 1.297149658203125, 1.36761474609375, 1.438079833984375, 1.508544921875, 1.579010009765625, 1.64947509765625, 1.719940185546875, 1.7904052734375, 1.860870361328125, 1.93133544921875, 2.001800537109375, 2.072265625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 11.0, 9.0, 16.0, 24.0, 25.0, 27.0, 29.0, 43.0, 45.0, 62.0, 70.0, 58.0, 69.0, 76.0, 76.0, 69.0, 52.0, 44.0, 42.0, 32.0, 27.0, 22.0, 9.0, 15.0, 6.0, 6.0, 8.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015020370483398438, -0.00014432333409786224, -0.0001384429633617401, -0.00013256259262561798, -0.00012668222188949585, -0.00012080185115337372, -0.00011492148041725159, -0.00010904110968112946, -0.00010316073894500732, -9.728036820888519e-05, -9.139999747276306e-05, -8.551962673664093e-05, -7.96392560005188e-05, -7.375888526439667e-05, -6.787851452827454e-05, -6.19981437921524e-05, -5.6117773056030273e-05, -5.023740231990814e-05, -4.435703158378601e-05, -3.847666084766388e-05, -3.259629011154175e-05, -2.6715919375419617e-05, -2.0835548639297485e-05, -1.4955177903175354e-05, -9.074807167053223e-06, -3.1944364309310913e-06, 2.68593430519104e-06, 8.566305041313171e-06, 1.4446675777435303e-05, 2.0327046513557434e-05, 2.6207417249679565e-05, 3.20877879858017e-05, 3.796815872192383e-05, 4.384852945804596e-05, 4.972890019416809e-05, 5.560927093029022e-05, 6.148964166641235e-05, 6.737001240253448e-05, 7.325038313865662e-05, 7.913075387477875e-05, 8.501112461090088e-05, 9.089149534702301e-05, 9.677186608314514e-05, 0.00010265223681926727, 0.0001085326075553894, 0.00011441297829151154, 0.00012029334902763367, 0.0001261737197637558, 0.00013205409049987793, 0.00013793446123600006, 0.0001438148319721222, 0.00014969520270824432, 0.00015557557344436646, 0.00016145594418048859, 0.00016733631491661072, 0.00017321668565273285, 0.00017909705638885498, 0.0001849774271249771, 0.00019085779786109924, 0.00019673816859722137, 0.0002026185393333435, 0.00020849891006946564, 0.00021437928080558777, 0.0002202596515417099, 0.00022614002227783203]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 14.0, 25.0, 24.0, 37.0, 53.0, 88.0, 112.0, 150.0, 210.0, 306.0, 447.0, 676.0, 1008.0, 1543.0, 2480.0, 4061.0, 6585.0, 11231.0, 19460.0, 34195.0, 60789.0, 101152.0, 152154.0, 184638.0, 169267.0, 120976.0, 74575.0, 42931.0, 24184.0, 13873.0, 7993.0, 4791.0, 3014.0, 1909.0, 1167.0, 752.0, 496.0, 346.0, 226.0, 183.0, 120.0, 86.0, 68.0, 38.0, 36.0, 23.0, 21.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.6357421875, -1.5857086181640625, -1.535675048828125, -1.4856414794921875, -1.43560791015625, -1.3855743408203125, -1.335540771484375, -1.2855072021484375, -1.2354736328125, -1.1854400634765625, -1.135406494140625, -1.0853729248046875, -1.03533935546875, -0.9853057861328125, -0.935272216796875, -0.8852386474609375, -0.835205078125, -0.7851715087890625, -0.735137939453125, -0.6851043701171875, -0.63507080078125, -0.5850372314453125, -0.535003662109375, -0.4849700927734375, -0.4349365234375, -0.3849029541015625, -0.334869384765625, -0.2848358154296875, -0.23480224609375, -0.1847686767578125, -0.134735107421875, -0.0847015380859375, -0.03466796875, 0.0153656005859375, 0.065399169921875, 0.1154327392578125, 0.16546630859375, 0.2154998779296875, 0.265533447265625, 0.3155670166015625, 0.3656005859375, 0.4156341552734375, 0.465667724609375, 0.5157012939453125, 0.56573486328125, 0.6157684326171875, 0.665802001953125, 0.7158355712890625, 0.765869140625, 0.8159027099609375, 0.865936279296875, 0.9159698486328125, 0.96600341796875, 1.0160369873046875, 1.066070556640625, 1.1161041259765625, 1.1661376953125, 1.2161712646484375, 1.266204833984375, 1.3162384033203125, 1.36627197265625, 1.4163055419921875, 1.466339111328125, 1.5163726806640625, 1.56640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 7.0, 12.0, 17.0, 10.0, 24.0, 20.0, 19.0, 30.0, 37.0, 32.0, 37.0, 50.0, 49.0, 51.0, 70.0, 43.0, 57.0, 45.0, 51.0, 48.0, 52.0, 42.0, 29.0, 26.0, 31.0, 20.0, 24.0, 12.0, 11.0, 7.0, 5.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5104942321777344, -0.49608612060546875, -0.4816780090332031, -0.4672698974609375, -0.4528617858886719, -0.43845367431640625, -0.4240455627441406, -0.409637451171875, -0.3952293395996094, -0.38082122802734375, -0.3664131164550781, -0.3520050048828125, -0.3375968933105469, -0.32318878173828125, -0.3087806701660156, -0.29437255859375, -0.2799644470214844, -0.26555633544921875, -0.2511482238769531, -0.2367401123046875, -0.22233200073242188, -0.20792388916015625, -0.19351577758789062, -0.179107666015625, -0.16469955444335938, -0.15029144287109375, -0.13588333129882812, -0.1214752197265625, -0.10706710815429688, -0.09265899658203125, -0.07825088500976562, -0.0638427734375, -0.049434661865234375, -0.03502655029296875, -0.020618438720703125, -0.0062103271484375, 0.008197784423828125, 0.02260589599609375, 0.037014007568359375, 0.051422119140625, 0.06583023071289062, 0.08023834228515625, 0.09464645385742188, 0.1090545654296875, 0.12346267700195312, 0.13787078857421875, 0.15227890014648438, 0.16668701171875, 0.18109512329101562, 0.19550323486328125, 0.20991134643554688, 0.2243194580078125, 0.23872756958007812, 0.25313568115234375, 0.2675437927246094, 0.281951904296875, 0.2963600158691406, 0.31076812744140625, 0.3251762390136719, 0.3395843505859375, 0.3539924621582031, 0.36840057373046875, 0.3828086853027344, 0.397216796875]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 4.0, 5.0, 9.0, 13.0, 27.0, 35.0, 47.0, 45.0, 77.0, 78.0, 100.0, 110.0, 129.0, 80.0, 70.0, 55.0, 29.0, 29.0, 17.0, 8.0, 9.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.795585632324219, -15.452794075012207, -15.110002517700195, -14.767210006713867, -14.424418449401855, -14.081626892089844, -13.738835334777832, -13.39604377746582, -13.053252220153809, -12.710460662841797, -12.367669105529785, -12.024877548217773, -11.682085037231445, -11.339293479919434, -10.996501922607422, -10.65371036529541, -10.310918807983398, -9.968127250671387, -9.625335693359375, -9.282543182373047, -8.939751625061035, -8.596960067749023, -8.254168510437012, -7.911376953125, -7.568584442138672, -7.22579288482666, -6.88300085067749, -6.5402092933654785, -6.197417736053467, -5.854625701904297, -5.511834144592285, -5.169042587280273, -4.82625150680542, -4.483459949493408, -4.140667915344238, -3.7978763580322266, -3.455084800720215, -3.112293004989624, -2.769501209259033, -2.4267096519470215, -2.0839178562164307, -1.7411261796951294, -1.3983345031738281, -1.0555427074432373, -0.712751030921936, -0.36995935440063477, -0.027167558670043945, 0.3156239986419678, 0.6584157943725586, 1.0012074708938599, 1.3439991474151611, 1.686790943145752, 2.0295825004577637, 2.3723742961883545, 2.7151660919189453, 3.057957649230957, 3.400749444961548, 3.7435412406921387, 4.08633279800415, 4.42912483215332, 4.771916389465332, 5.114707946777344, 5.4574995040893555, 5.800291061401367, 6.143083095550537]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 10.0, 7.0, 11.0, 10.0, 11.0, 12.0, 15.0, 14.0, 19.0, 32.0, 28.0, 33.0, 25.0, 27.0, 29.0, 25.0, 39.0, 29.0, 33.0, 41.0, 45.0, 48.0, 45.0, 41.0, 36.0, 41.0, 32.0, 33.0, 33.0, 24.0, 23.0, 20.0, 23.0, 12.0, 14.0, 18.0, 7.0, 9.0, 15.0, 6.0, 10.0, 3.0, 8.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.327981472015381, -3.231311798095703, -3.1346421241760254, -3.0379726886749268, -2.941303014755249, -2.8446333408355713, -2.7479639053344727, -2.651294231414795, -2.554624557495117, -2.4579548835754395, -2.3612852096557617, -2.264615774154663, -2.1679461002349854, -2.0712764263153076, -1.9746068716049194, -1.8779373168945312, -1.7812676429748535, -1.6845979690551758, -1.5879284143447876, -1.4912588596343994, -1.3945891857147217, -1.297919511795044, -1.2012499570846558, -1.1045804023742676, -1.0079107284545898, -0.9112411141395569, -0.8145714998245239, -0.717901885509491, -0.621232271194458, -0.524562656879425, -0.4278930425643921, -0.33122342824935913, -0.23455405235290527, -0.13788443803787231, -0.041214823722839355, 0.055454790592193604, 0.15212440490722656, 0.24879401922225952, 0.3454636335372925, 0.44213324785232544, 0.5388028621673584, 0.6354724764823914, 0.7321420907974243, 0.8288117051124573, 0.9254813194274902, 1.022150993347168, 1.1188205480575562, 1.2154901027679443, 1.312159776687622, 1.4088294506072998, 1.505499005317688, 1.6021685600280762, 1.698838233947754, 1.7955079078674316, 1.8921774625778198, 1.988847017288208, 2.0855166912078857, 2.1821863651275635, 2.278855800628662, 2.37552547454834, 2.4721951484680176, 2.5688648223876953, 2.665534496307373, 2.7622039318084717, 2.8588736057281494]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 16.0, 25.0, 29.0, 54.0, 94.0, 116.0, 215.0, 252.0, 438.0, 733.0, 1049.0, 1792.0, 3020.0, 4981.0, 8764.0, 16216.0, 30579.0, 63105.0, 142093.0, 357360.0, 929564.0, 1371347.0, 755804.0, 280866.0, 113867.0, 52218.0, 25952.0, 14038.0, 7786.0, 4572.0, 2704.0, 1683.0, 1040.0, 693.0, 415.0, 279.0, 174.0, 109.0, 72.0, 48.0, 39.0, 16.0, 15.0, 4.0, 8.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.82421875, -6.6197509765625, -6.415283203125, -6.2108154296875, -6.00634765625, -5.8018798828125, -5.597412109375, -5.3929443359375, -5.1884765625, -4.9840087890625, -4.779541015625, -4.5750732421875, -4.37060546875, -4.1661376953125, -3.961669921875, -3.7572021484375, -3.552734375, -3.3482666015625, -3.143798828125, -2.9393310546875, -2.73486328125, -2.5303955078125, -2.325927734375, -2.1214599609375, -1.9169921875, -1.7125244140625, -1.508056640625, -1.3035888671875, -1.09912109375, -0.8946533203125, -0.690185546875, -0.4857177734375, -0.28125, -0.0767822265625, 0.127685546875, 0.3321533203125, 0.53662109375, 0.7410888671875, 0.945556640625, 1.1500244140625, 1.3544921875, 1.5589599609375, 1.763427734375, 1.9678955078125, 2.17236328125, 2.3768310546875, 2.581298828125, 2.7857666015625, 2.990234375, 3.1947021484375, 3.399169921875, 3.6036376953125, 3.80810546875, 4.0125732421875, 4.217041015625, 4.4215087890625, 4.6259765625, 4.8304443359375, 5.034912109375, 5.2393798828125, 5.44384765625, 5.6483154296875, 5.852783203125, 6.0572509765625, 6.26171875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 10.0, 15.0, 11.0, 10.0, 7.0, 23.0, 22.0, 39.0, 31.0, 27.0, 31.0, 24.0, 24.0, 31.0, 44.0, 43.0, 38.0, 55.0, 27.0, 50.0, 49.0, 48.0, 34.0, 34.0, 36.0, 28.0, 25.0, 27.0, 26.0, 15.0, 17.0, 13.0, 18.0, 7.0, 5.0, 9.0, 10.0, 9.0, 3.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.261138916015625, -2.18243408203125, -2.103729248046875, -2.0250244140625, -1.946319580078125, -1.86761474609375, -1.788909912109375, -1.710205078125, -1.631500244140625, -1.55279541015625, -1.474090576171875, -1.3953857421875, -1.316680908203125, -1.23797607421875, -1.159271240234375, -1.08056640625, -1.001861572265625, -0.92315673828125, -0.844451904296875, -0.7657470703125, -0.687042236328125, -0.60833740234375, -0.529632568359375, -0.450927734375, -0.372222900390625, -0.29351806640625, -0.214813232421875, -0.1361083984375, -0.057403564453125, 0.02130126953125, 0.100006103515625, 0.1787109375, 0.257415771484375, 0.33612060546875, 0.414825439453125, 0.4935302734375, 0.572235107421875, 0.65093994140625, 0.729644775390625, 0.808349609375, 0.887054443359375, 0.96575927734375, 1.044464111328125, 1.1231689453125, 1.201873779296875, 1.28057861328125, 1.359283447265625, 1.43798828125, 1.516693115234375, 1.59539794921875, 1.674102783203125, 1.7528076171875, 1.831512451171875, 1.91021728515625, 1.988922119140625, 2.067626953125, 2.146331787109375, 2.22503662109375, 2.303741455078125, 2.3824462890625, 2.461151123046875, 2.53985595703125, 2.618560791015625, 2.697265625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 17.0, 30.0, 39.0, 63.0, 65.0, 137.0, 217.0, 330.0, 521.0, 736.0, 1184.0, 1833.0, 2878.0, 4675.0, 7796.0, 13230.0, 23271.0, 42048.0, 81759.0, 166861.0, 356853.0, 759733.0, 1165215.0, 809641.0, 384403.0, 179110.0, 86918.0, 45059.0, 24545.0, 13730.0, 8173.0, 4798.0, 2995.0, 1932.0, 1160.0, 820.0, 474.0, 345.0, 256.0, 137.0, 105.0, 60.0, 42.0, 28.0, 16.0, 13.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.3289794921875, -6.134521484375, -5.9400634765625, -5.74560546875, -5.5511474609375, -5.356689453125, -5.1622314453125, -4.9677734375, -4.7733154296875, -4.578857421875, -4.3843994140625, -4.18994140625, -3.9954833984375, -3.801025390625, -3.6065673828125, -3.412109375, -3.2176513671875, -3.023193359375, -2.8287353515625, -2.63427734375, -2.4398193359375, -2.245361328125, -2.0509033203125, -1.8564453125, -1.6619873046875, -1.467529296875, -1.2730712890625, -1.07861328125, -0.8841552734375, -0.689697265625, -0.4952392578125, -0.30078125, -0.1063232421875, 0.088134765625, 0.2825927734375, 0.47705078125, 0.6715087890625, 0.865966796875, 1.0604248046875, 1.2548828125, 1.4493408203125, 1.643798828125, 1.8382568359375, 2.03271484375, 2.2271728515625, 2.421630859375, 2.6160888671875, 2.810546875, 3.0050048828125, 3.199462890625, 3.3939208984375, 3.58837890625, 3.7828369140625, 3.977294921875, 4.1717529296875, 4.3662109375, 4.5606689453125, 4.755126953125, 4.9495849609375, 5.14404296875, 5.3385009765625, 5.532958984375, 5.7274169921875, 5.921875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 2.0, 7.0, 10.0, 11.0, 18.0, 20.0, 31.0, 33.0, 46.0, 58.0, 74.0, 106.0, 97.0, 157.0, 195.0, 233.0, 261.0, 289.0, 286.0, 306.0, 344.0, 274.0, 250.0, 194.0, 172.0, 138.0, 87.0, 67.0, 55.0, 49.0, 42.0, 31.0, 28.0, 15.0, 13.0, 12.0, 5.0, 10.0, 8.0, 5.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.586395263671875, -1.53021240234375, -1.474029541015625, -1.4178466796875, -1.361663818359375, -1.30548095703125, -1.249298095703125, -1.193115234375, -1.136932373046875, -1.08074951171875, -1.024566650390625, -0.9683837890625, -0.912200927734375, -0.85601806640625, -0.799835205078125, -0.74365234375, -0.687469482421875, -0.63128662109375, -0.575103759765625, -0.5189208984375, -0.462738037109375, -0.40655517578125, -0.350372314453125, -0.294189453125, -0.238006591796875, -0.18182373046875, -0.125640869140625, -0.0694580078125, -0.013275146484375, 0.04290771484375, 0.099090576171875, 0.1552734375, 0.211456298828125, 0.26763916015625, 0.323822021484375, 0.3800048828125, 0.436187744140625, 0.49237060546875, 0.548553466796875, 0.604736328125, 0.660919189453125, 0.71710205078125, 0.773284912109375, 0.8294677734375, 0.885650634765625, 0.94183349609375, 0.998016357421875, 1.05419921875, 1.110382080078125, 1.16656494140625, 1.222747802734375, 1.2789306640625, 1.335113525390625, 1.39129638671875, 1.447479248046875, 1.503662109375, 1.559844970703125, 1.61602783203125, 1.672210693359375, 1.7283935546875, 1.784576416015625, 1.84075927734375, 1.896942138671875, 1.953125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 7.0, 15.0, 26.0, 22.0, 30.0, 49.0, 64.0, 62.0, 97.0, 116.0, 133.0, 105.0, 90.0, 56.0, 36.0, 20.0, 22.0, 16.0, 11.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.101999282836914, -13.726221084594727, -13.350443840026855, -12.974665641784668, -12.598888397216797, -12.22311019897461, -11.847332000732422, -11.471553802490234, -11.095776557922363, -10.719998359680176, -10.344221115112305, -9.968442916870117, -9.59266471862793, -9.216887474060059, -8.841109275817871, -8.46533203125, -8.089553833007812, -7.713776111602783, -7.337998390197754, -6.962220191955566, -6.586442470550537, -6.210664749145508, -5.83488655090332, -5.459108829498291, -5.083331108093262, -4.707553386688232, -4.331775665283203, -3.9559974670410156, -3.5802197456359863, -3.204442024230957, -2.8286640644073486, -2.4528861045837402, -2.077108383178711, -1.701330542564392, -1.3255527019500732, -0.9497748613357544, -0.5739970207214355, -0.1982191801071167, 0.17755866050720215, 0.5533366203308105, 0.9291143417358398, 1.3048921823501587, 1.6806700229644775, 2.056447982788086, 2.4322257041931152, 2.8080034255981445, 3.183781385421753, 3.5595593452453613, 3.9353370666503906, 4.31111478805542, 4.686892509460449, 5.062670707702637, 5.438448429107666, 5.814226150512695, 6.190004348754883, 6.565782070159912, 6.941559791564941, 7.317337512969971, 7.693115234375, 8.068893432617188, 8.444671630859375, 8.820448875427246, 9.196227073669434, 9.572004318237305, 9.947782516479492]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 11.0, 9.0, 16.0, 20.0, 15.0, 14.0, 19.0, 25.0, 20.0, 22.0, 26.0, 32.0, 46.0, 46.0, 39.0, 34.0, 47.0, 40.0, 44.0, 36.0, 46.0, 50.0, 35.0, 31.0, 31.0, 32.0, 26.0, 23.0, 19.0, 12.0, 12.0, 23.0, 18.0, 12.0, 11.0, 8.0, 13.0, 5.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.4018402099609375, -3.298731565475464, -3.1956229209899902, -3.0925140380859375, -2.989405393600464, -2.8862967491149902, -2.7831878662109375, -2.680079221725464, -2.5769705772399902, -2.4738619327545166, -2.370753288269043, -2.2676444053649902, -2.1645357608795166, -2.061427116394043, -1.9583183526992798, -1.8552095890045166, -1.752100944519043, -1.6489923000335693, -1.5458835363388062, -1.442774772644043, -1.3396661281585693, -1.2365574836730957, -1.1334487199783325, -1.0303399562835693, -0.9272313117980957, -0.8241226077079773, -0.7210139036178589, -0.6179051995277405, -0.5147964954376221, -0.41168779134750366, -0.30857908725738525, -0.20547038316726685, -0.10236191749572754, 0.0007467865943908691, 0.10385549068450928, 0.20696419477462769, 0.3100728988647461, 0.4131816029548645, 0.5162903070449829, 0.6193990111351013, 0.7225077152252197, 0.8256164193153381, 0.9287251234054565, 1.0318338871002197, 1.1349425315856934, 1.238051176071167, 1.3411599397659302, 1.4442687034606934, 1.547377347946167, 1.6504859924316406, 1.7535947561264038, 1.856703519821167, 1.9598121643066406, 2.0629208087921143, 2.166029453277588, 2.2691383361816406, 2.3722469806671143, 2.475355625152588, 2.5784645080566406, 2.6815731525421143, 2.784681797027588, 2.8877904415130615, 2.990899085998535, 3.094007968902588, 3.1971166133880615]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 19.0, 11.0, 11.0, 24.0, 42.0, 75.0, 82.0, 124.0, 205.0, 286.0, 422.0, 655.0, 998.0, 1609.0, 2759.0, 5683.0, 12671.0, 35532.0, 112483.0, 319738.0, 351549.0, 133306.0, 41429.0, 14897.0, 6152.0, 3036.0, 1659.0, 999.0, 648.0, 451.0, 293.0, 214.0, 145.0, 94.0, 54.0, 47.0, 33.0, 37.0, 15.0, 16.0, 6.0, 11.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.078125, -5.88861083984375, -5.6990966796875, -5.50958251953125, -5.320068359375, -5.13055419921875, -4.9410400390625, -4.75152587890625, -4.56201171875, -4.37249755859375, -4.1829833984375, -3.99346923828125, -3.803955078125, -3.61444091796875, -3.4249267578125, -3.23541259765625, -3.0458984375, -2.85638427734375, -2.6668701171875, -2.47735595703125, -2.287841796875, -2.09832763671875, -1.9088134765625, -1.71929931640625, -1.52978515625, -1.34027099609375, -1.1507568359375, -0.96124267578125, -0.771728515625, -0.58221435546875, -0.3927001953125, -0.20318603515625, -0.013671875, 0.17584228515625, 0.3653564453125, 0.55487060546875, 0.744384765625, 0.93389892578125, 1.1234130859375, 1.31292724609375, 1.50244140625, 1.69195556640625, 1.8814697265625, 2.07098388671875, 2.260498046875, 2.45001220703125, 2.6395263671875, 2.82904052734375, 3.0185546875, 3.20806884765625, 3.3975830078125, 3.58709716796875, 3.776611328125, 3.96612548828125, 4.1556396484375, 4.34515380859375, 4.53466796875, 4.72418212890625, 4.9136962890625, 5.10321044921875, 5.292724609375, 5.48223876953125, 5.6717529296875, 5.86126708984375, 6.05078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 1.0, 4.0, 4.0, 5.0, 8.0, 11.0, 6.0, 9.0, 10.0, 18.0, 27.0, 17.0, 31.0, 26.0, 35.0, 28.0, 31.0, 34.0, 35.0, 36.0, 42.0, 55.0, 46.0, 35.0, 48.0, 40.0, 39.0, 40.0, 28.0, 25.0, 26.0, 24.0, 25.0, 23.0, 20.0, 20.0, 16.0, 8.0, 17.0, 10.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.62109375, -3.507659912109375, -3.39422607421875, -3.280792236328125, -3.1673583984375, -3.053924560546875, -2.94049072265625, -2.827056884765625, -2.713623046875, -2.600189208984375, -2.48675537109375, -2.373321533203125, -2.2598876953125, -2.146453857421875, -2.03302001953125, -1.919586181640625, -1.80615234375, -1.692718505859375, -1.57928466796875, -1.465850830078125, -1.3524169921875, -1.238983154296875, -1.12554931640625, -1.012115478515625, -0.898681640625, -0.785247802734375, -0.67181396484375, -0.558380126953125, -0.4449462890625, -0.331512451171875, -0.21807861328125, -0.104644775390625, 0.0087890625, 0.122222900390625, 0.23565673828125, 0.349090576171875, 0.4625244140625, 0.575958251953125, 0.68939208984375, 0.802825927734375, 0.916259765625, 1.029693603515625, 1.14312744140625, 1.256561279296875, 1.3699951171875, 1.483428955078125, 1.59686279296875, 1.710296630859375, 1.82373046875, 1.937164306640625, 2.05059814453125, 2.164031982421875, 2.2774658203125, 2.390899658203125, 2.50433349609375, 2.617767333984375, 2.731201171875, 2.844635009765625, 2.95806884765625, 3.071502685546875, 3.1849365234375, 3.298370361328125, 3.41180419921875, 3.525238037109375, 3.638671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 4.0, 11.0, 8.0, 15.0, 12.0, 17.0, 30.0, 50.0, 50.0, 83.0, 101.0, 132.0, 169.0, 292.0, 429.0, 587.0, 838.0, 1340.0, 2138.0, 4410.0, 13175.0, 63857.0, 403338.0, 456575.0, 74806.0, 14596.0, 4877.0, 2238.0, 1370.0, 903.0, 599.0, 412.0, 292.0, 213.0, 151.0, 111.0, 80.0, 60.0, 42.0, 30.0, 22.0, 19.0, 18.0, 12.0, 9.0, 7.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-10.390625, -10.055908203125, -9.72119140625, -9.386474609375, -9.0517578125, -8.717041015625, -8.38232421875, -8.047607421875, -7.712890625, -7.378173828125, -7.04345703125, -6.708740234375, -6.3740234375, -6.039306640625, -5.70458984375, -5.369873046875, -5.03515625, -4.700439453125, -4.36572265625, -4.031005859375, -3.6962890625, -3.361572265625, -3.02685546875, -2.692138671875, -2.357421875, -2.022705078125, -1.68798828125, -1.353271484375, -1.0185546875, -0.683837890625, -0.34912109375, -0.014404296875, 0.3203125, 0.655029296875, 0.98974609375, 1.324462890625, 1.6591796875, 1.993896484375, 2.32861328125, 2.663330078125, 2.998046875, 3.332763671875, 3.66748046875, 4.002197265625, 4.3369140625, 4.671630859375, 5.00634765625, 5.341064453125, 5.67578125, 6.010498046875, 6.34521484375, 6.679931640625, 7.0146484375, 7.349365234375, 7.68408203125, 8.018798828125, 8.353515625, 8.688232421875, 9.02294921875, 9.357666015625, 9.6923828125, 10.027099609375, 10.36181640625, 10.696533203125, 11.03125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 7.0, 10.0, 7.0, 5.0, 13.0, 11.0, 17.0, 17.0, 23.0, 23.0, 13.0, 25.0, 24.0, 25.0, 34.0, 44.0, 37.0, 46.0, 53.0, 47.0, 35.0, 36.0, 38.0, 32.0, 37.0, 43.0, 34.0, 40.0, 23.0, 28.0, 29.0, 23.0, 14.0, 15.0, 19.0, 12.0, 9.0, 6.0, 11.0, 13.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.091796875, -2.026336669921875, -1.96087646484375, -1.895416259765625, -1.8299560546875, -1.764495849609375, -1.69903564453125, -1.633575439453125, -1.568115234375, -1.502655029296875, -1.43719482421875, -1.371734619140625, -1.3062744140625, -1.240814208984375, -1.17535400390625, -1.109893798828125, -1.04443359375, -0.978973388671875, -0.91351318359375, -0.848052978515625, -0.7825927734375, -0.717132568359375, -0.65167236328125, -0.586212158203125, -0.520751953125, -0.455291748046875, -0.38983154296875, -0.324371337890625, -0.2589111328125, -0.193450927734375, -0.12799072265625, -0.062530517578125, 0.0029296875, 0.068389892578125, 0.13385009765625, 0.199310302734375, 0.2647705078125, 0.330230712890625, 0.39569091796875, 0.461151123046875, 0.526611328125, 0.592071533203125, 0.65753173828125, 0.722991943359375, 0.7884521484375, 0.853912353515625, 0.91937255859375, 0.984832763671875, 1.05029296875, 1.115753173828125, 1.18121337890625, 1.246673583984375, 1.3121337890625, 1.377593994140625, 1.44305419921875, 1.508514404296875, 1.573974609375, 1.639434814453125, 1.70489501953125, 1.770355224609375, 1.8358154296875, 1.901275634765625, 1.96673583984375, 2.032196044921875, 2.09765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 8.0, 6.0, 6.0, 5.0, 10.0, 22.0, 30.0, 45.0, 62.0, 104.0, 143.0, 228.0, 318.0, 554.0, 821.0, 1460.0, 2509.0, 4699.0, 10547.0, 32031.0, 143147.0, 530062.0, 243936.0, 49725.0, 14506.0, 6136.0, 2959.0, 1731.0, 1048.0, 620.0, 377.0, 236.0, 164.0, 101.0, 79.0, 38.0, 26.0, 24.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4073486328125, -3.279541015625, -3.1517333984375, -3.02392578125, -2.8961181640625, -2.768310546875, -2.6405029296875, -2.5126953125, -2.3848876953125, -2.257080078125, -2.1292724609375, -2.00146484375, -1.8736572265625, -1.745849609375, -1.6180419921875, -1.490234375, -1.3624267578125, -1.234619140625, -1.1068115234375, -0.97900390625, -0.8511962890625, -0.723388671875, -0.5955810546875, -0.4677734375, -0.3399658203125, -0.212158203125, -0.0843505859375, 0.04345703125, 0.1712646484375, 0.299072265625, 0.4268798828125, 0.5546875, 0.6824951171875, 0.810302734375, 0.9381103515625, 1.06591796875, 1.1937255859375, 1.321533203125, 1.4493408203125, 1.5771484375, 1.7049560546875, 1.832763671875, 1.9605712890625, 2.08837890625, 2.2161865234375, 2.343994140625, 2.4718017578125, 2.599609375, 2.7274169921875, 2.855224609375, 2.9830322265625, 3.11083984375, 3.2386474609375, 3.366455078125, 3.4942626953125, 3.6220703125, 3.7498779296875, 3.877685546875, 4.0054931640625, 4.13330078125, 4.2611083984375, 4.388916015625, 4.5167236328125, 4.64453125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 9.0, 19.0, 31.0, 68.0, 100.0, 174.0, 199.0, 155.0, 100.0, 54.0, 29.0, 22.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014770030975341797, -0.00014081411063671112, -0.00013392791152000427, -0.00012704171240329742, -0.00012015551328659058, -0.00011326931416988373, -0.00010638311505317688, -9.949691593647003e-05, -9.261071681976318e-05, -8.572451770305634e-05, -7.883831858634949e-05, -7.195211946964264e-05, -6.506592035293579e-05, -5.817972123622894e-05, -5.1293522119522095e-05, -4.4407323002815247e-05, -3.75211238861084e-05, -3.063492476940155e-05, -2.3748725652694702e-05, -1.6862526535987854e-05, -9.976327419281006e-06, -3.0901283025741577e-06, 3.7960708141326904e-06, 1.0682269930839539e-05, 1.7568469047546387e-05, 2.4454668164253235e-05, 3.134086728096008e-05, 3.822706639766693e-05, 4.511326551437378e-05, 5.199946463108063e-05, 5.8885663747787476e-05, 6.577186286449432e-05, 7.265806198120117e-05, 7.954426109790802e-05, 8.643046021461487e-05, 9.331665933132172e-05, 0.00010020285844802856, 0.00010708905756473541, 0.00011397525668144226, 0.00012086145579814911, 0.00012774765491485596, 0.0001346338540315628, 0.00014152005314826965, 0.0001484062522649765, 0.00015529245138168335, 0.0001621786504983902, 0.00016906484961509705, 0.0001759510487318039, 0.00018283724784851074, 0.0001897234469652176, 0.00019660964608192444, 0.0002034958451986313, 0.00021038204431533813, 0.00021726824343204498, 0.00022415444254875183, 0.00023104064166545868, 0.00023792684078216553, 0.0002448130398988724, 0.0002516992390155792, 0.00025858543813228607, 0.0002654716372489929, 0.00027235783636569977, 0.0002792440354824066, 0.00028613023459911346, 0.0002930164337158203]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 15.0, 20.0, 19.0, 44.0, 74.0, 111.0, 125.0, 173.0, 233.0, 341.0, 434.0, 629.0, 871.0, 1222.0, 1640.0, 2257.0, 3433.0, 5900.0, 12124.0, 33001.0, 108060.0, 307665.0, 351398.0, 141473.0, 42978.0, 14975.0, 6715.0, 3740.0, 2480.0, 1778.0, 1252.0, 921.0, 689.0, 498.0, 371.0, 283.0, 180.0, 120.0, 84.0, 76.0, 46.0, 39.0, 14.0, 15.0, 9.0, 4.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.5546875, -2.4698486328125, -2.385009765625, -2.3001708984375, -2.21533203125, -2.1304931640625, -2.045654296875, -1.9608154296875, -1.8759765625, -1.7911376953125, -1.706298828125, -1.6214599609375, -1.53662109375, -1.4517822265625, -1.366943359375, -1.2821044921875, -1.197265625, -1.1124267578125, -1.027587890625, -0.9427490234375, -0.85791015625, -0.7730712890625, -0.688232421875, -0.6033935546875, -0.5185546875, -0.4337158203125, -0.348876953125, -0.2640380859375, -0.17919921875, -0.0943603515625, -0.009521484375, 0.0753173828125, 0.16015625, 0.2449951171875, 0.329833984375, 0.4146728515625, 0.49951171875, 0.5843505859375, 0.669189453125, 0.7540283203125, 0.8388671875, 0.9237060546875, 1.008544921875, 1.0933837890625, 1.17822265625, 1.2630615234375, 1.347900390625, 1.4327392578125, 1.517578125, 1.6024169921875, 1.687255859375, 1.7720947265625, 1.85693359375, 1.9417724609375, 2.026611328125, 2.1114501953125, 2.1962890625, 2.2811279296875, 2.365966796875, 2.4508056640625, 2.53564453125, 2.6204833984375, 2.705322265625, 2.7901611328125, 2.875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 6.0, 6.0, 14.0, 17.0, 28.0, 42.0, 62.0, 128.0, 163.0, 163.0, 118.0, 85.0, 66.0, 40.0, 15.0, 15.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9342193603515625, -0.906036376953125, -0.8778533935546875, -0.84967041015625, -0.8214874267578125, -0.793304443359375, -0.7651214599609375, -0.7369384765625, -0.7087554931640625, -0.680572509765625, -0.6523895263671875, -0.62420654296875, -0.5960235595703125, -0.567840576171875, -0.5396575927734375, -0.511474609375, -0.4832916259765625, -0.455108642578125, -0.4269256591796875, -0.39874267578125, -0.3705596923828125, -0.342376708984375, -0.3141937255859375, -0.2860107421875, -0.2578277587890625, -0.229644775390625, -0.2014617919921875, -0.17327880859375, -0.1450958251953125, -0.116912841796875, -0.0887298583984375, -0.060546875, -0.0323638916015625, -0.004180908203125, 0.0240020751953125, 0.05218505859375, 0.0803680419921875, 0.108551025390625, 0.1367340087890625, 0.1649169921875, 0.1930999755859375, 0.221282958984375, 0.2494659423828125, 0.27764892578125, 0.3058319091796875, 0.334014892578125, 0.3621978759765625, 0.390380859375, 0.4185638427734375, 0.446746826171875, 0.4749298095703125, 0.50311279296875, 0.5312957763671875, 0.559478759765625, 0.5876617431640625, 0.6158447265625, 0.6440277099609375, 0.672210693359375, 0.7003936767578125, 0.72857666015625, 0.7567596435546875, 0.784942626953125, 0.8131256103515625, 0.84130859375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 16.0, 16.0, 21.0, 25.0, 47.0, 56.0, 65.0, 79.0, 124.0, 114.0, 112.0, 82.0, 85.0, 44.0, 24.0, 23.0, 16.0, 18.0, 7.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.908937454223633, -13.542439460754395, -13.175941467285156, -12.809443473815918, -12.44294548034668, -12.076448440551758, -11.70995044708252, -11.343452453613281, -10.976954460144043, -10.610456466674805, -10.243958473205566, -9.877460479736328, -9.510963439941406, -9.144465446472168, -8.77796745300293, -8.411469459533691, -8.044971466064453, -7.678473472595215, -7.311975479125977, -6.9454779624938965, -6.578979969024658, -6.21248197555542, -5.84598445892334, -5.479486465454102, -5.112988471984863, -4.746490478515625, -4.379992485046387, -4.013494968414307, -3.6469969749450684, -3.28049898147583, -2.914001226425171, -2.5475034713745117, -2.1810054779052734, -1.8145076036453247, -1.448009729385376, -1.0815118551254272, -0.7150139808654785, -0.3485161066055298, 0.017981767654418945, 0.3844795227050781, 0.7509775161743164, 1.1174753904342651, 1.4839732646942139, 1.8504711389541626, 2.2169690132141113, 2.5834670066833496, 2.949964761734009, 3.316462516784668, 3.6829605102539062, 4.0494585037231445, 4.415956497192383, 4.782454013824463, 5.148952007293701, 5.5154500007629395, 5.8819475173950195, 6.248445510864258, 6.614943504333496, 6.981441497802734, 7.347939491271973, 7.714437007904053, 8.080934524536133, 8.447432518005371, 8.81393051147461, 9.180428504943848, 9.546926498413086]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 16.0, 15.0, 24.0, 15.0, 21.0, 16.0, 24.0, 26.0, 27.0, 37.0, 45.0, 43.0, 38.0, 37.0, 39.0, 46.0, 45.0, 41.0, 45.0, 50.0, 38.0, 28.0, 26.0, 40.0, 18.0, 20.0, 19.0, 16.0, 12.0, 21.0, 18.0, 12.0, 10.0, 11.0, 3.0, 7.0, 5.0, 8.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.3787872791290283, -3.276102066040039, -3.173417091369629, -3.0707318782806396, -2.9680469036102295, -2.8653616905212402, -2.76267671585083, -2.659991502761841, -2.5573062896728516, -2.4546210765838623, -2.351936101913452, -2.249250888824463, -2.1465659141540527, -2.0438807010650635, -1.9411956071853638, -1.838510513305664, -1.735825538635254, -1.6331404447555542, -1.5304553508758545, -1.4277701377868652, -1.325085163116455, -1.2223999500274658, -1.1197148561477661, -1.0170297622680664, -0.9143446683883667, -0.811659574508667, -0.7089744806289673, -0.6062893271446228, -0.5036042332649231, -0.4009191393852234, -0.2982339859008789, -0.1955488920211792, -0.09286355972290039, 0.00982154905796051, 0.11250665783882141, 0.2151917815208435, 0.3178768754005432, 0.4205619692802429, 0.5232471227645874, 0.6259322166442871, 0.7286173105239868, 0.8313024044036865, 0.9339874982833862, 1.036672592163086, 1.1393578052520752, 1.2420427799224854, 1.3447279930114746, 1.4474130868911743, 1.550098180770874, 1.6527832746505737, 1.7554683685302734, 1.8581535816192627, 1.9608385562896729, 2.063523769378662, 2.1662087440490723, 2.2688939571380615, 2.371579170227051, 2.47426438331604, 2.57694935798645, 2.6796345710754395, 2.7823195457458496, 2.885004758834839, 2.987689971923828, 3.0903749465942383, 3.1930599212646484]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 16.0, 18.0, 18.0, 45.0, 80.0, 104.0, 184.0, 313.0, 499.0, 977.0, 2166.0, 4796.0, 11960.0, 31953.0, 85951.0, 206862.0, 313321.0, 228329.0, 99760.0, 37080.0, 13875.0, 5466.0, 2323.0, 1062.0, 575.0, 292.0, 173.0, 122.0, 81.0, 43.0, 27.0, 20.0, 10.0, 13.0, 12.0, 9.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.61810302734375, -7.3768310546875, -7.13555908203125, -6.894287109375, -6.65301513671875, -6.4117431640625, -6.17047119140625, -5.92919921875, -5.68792724609375, -5.4466552734375, -5.20538330078125, -4.964111328125, -4.72283935546875, -4.4815673828125, -4.24029541015625, -3.9990234375, -3.75775146484375, -3.5164794921875, -3.27520751953125, -3.033935546875, -2.79266357421875, -2.5513916015625, -2.31011962890625, -2.06884765625, -1.82757568359375, -1.5863037109375, -1.34503173828125, -1.103759765625, -0.86248779296875, -0.6212158203125, -0.37994384765625, -0.138671875, 0.10260009765625, 0.3438720703125, 0.58514404296875, 0.826416015625, 1.06768798828125, 1.3089599609375, 1.55023193359375, 1.79150390625, 2.03277587890625, 2.2740478515625, 2.51531982421875, 2.756591796875, 2.99786376953125, 3.2391357421875, 3.48040771484375, 3.7216796875, 3.96295166015625, 4.2042236328125, 4.44549560546875, 4.686767578125, 4.92803955078125, 5.1693115234375, 5.41058349609375, 5.65185546875, 5.89312744140625, 6.1343994140625, 6.37567138671875, 6.616943359375, 6.85821533203125, 7.0994873046875, 7.34075927734375, 7.58203125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 0.0, 9.0, 6.0, 8.0, 8.0, 13.0, 20.0, 18.0, 19.0, 21.0, 23.0, 20.0, 27.0, 47.0, 29.0, 41.0, 44.0, 35.0, 47.0, 33.0, 35.0, 45.0, 40.0, 41.0, 43.0, 24.0, 38.0, 33.0, 27.0, 28.0, 27.0, 18.0, 21.0, 21.0, 12.0, 15.0, 16.0, 10.0, 4.0, 8.0, 3.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.666015625, -3.554962158203125, -3.44390869140625, -3.332855224609375, -3.2218017578125, -3.110748291015625, -2.99969482421875, -2.888641357421875, -2.777587890625, -2.666534423828125, -2.55548095703125, -2.444427490234375, -2.3333740234375, -2.222320556640625, -2.11126708984375, -2.000213623046875, -1.88916015625, -1.778106689453125, -1.66705322265625, -1.555999755859375, -1.4449462890625, -1.333892822265625, -1.22283935546875, -1.111785888671875, -1.000732421875, -0.889678955078125, -0.77862548828125, -0.667572021484375, -0.5565185546875, -0.445465087890625, -0.33441162109375, -0.223358154296875, -0.1123046875, -0.001251220703125, 0.10980224609375, 0.220855712890625, 0.3319091796875, 0.442962646484375, 0.55401611328125, 0.665069580078125, 0.776123046875, 0.887176513671875, 0.99822998046875, 1.109283447265625, 1.2203369140625, 1.331390380859375, 1.44244384765625, 1.553497314453125, 1.66455078125, 1.775604248046875, 1.88665771484375, 1.997711181640625, 2.1087646484375, 2.219818115234375, 2.33087158203125, 2.441925048828125, 2.552978515625, 2.664031982421875, 2.77508544921875, 2.886138916015625, 2.9971923828125, 3.108245849609375, 3.21929931640625, 3.330352783203125, 3.44140625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 19.0, 29.0, 42.0, 69.0, 98.0, 104.0, 171.0, 290.0, 392.0, 626.0, 1005.0, 1548.0, 2761.0, 4631.0, 8008.0, 14098.0, 25776.0, 45792.0, 80002.0, 128032.0, 175111.0, 185226.0, 147244.0, 96989.0, 56972.0, 31628.0, 17552.0, 10135.0, 5670.0, 3296.0, 1944.0, 1183.0, 730.0, 453.0, 297.0, 197.0, 141.0, 98.0, 59.0, 40.0, 24.0, 14.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.30560302734375, -4.1580810546875, -4.01055908203125, -3.863037109375, -3.71551513671875, -3.5679931640625, -3.42047119140625, -3.27294921875, -3.12542724609375, -2.9779052734375, -2.83038330078125, -2.682861328125, -2.53533935546875, -2.3878173828125, -2.24029541015625, -2.0927734375, -1.94525146484375, -1.7977294921875, -1.65020751953125, -1.502685546875, -1.35516357421875, -1.2076416015625, -1.06011962890625, -0.91259765625, -0.76507568359375, -0.6175537109375, -0.47003173828125, -0.322509765625, -0.17498779296875, -0.0274658203125, 0.12005615234375, 0.267578125, 0.41510009765625, 0.5626220703125, 0.71014404296875, 0.857666015625, 1.00518798828125, 1.1527099609375, 1.30023193359375, 1.44775390625, 1.59527587890625, 1.7427978515625, 1.89031982421875, 2.037841796875, 2.18536376953125, 2.3328857421875, 2.48040771484375, 2.6279296875, 2.77545166015625, 2.9229736328125, 3.07049560546875, 3.218017578125, 3.36553955078125, 3.5130615234375, 3.66058349609375, 3.80810546875, 3.95562744140625, 4.1031494140625, 4.25067138671875, 4.398193359375, 4.54571533203125, 4.6932373046875, 4.84075927734375, 4.98828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 10.0, 5.0, 6.0, 12.0, 6.0, 14.0, 9.0, 15.0, 20.0, 17.0, 16.0, 28.0, 23.0, 35.0, 27.0, 31.0, 36.0, 37.0, 50.0, 38.0, 33.0, 38.0, 39.0, 42.0, 35.0, 40.0, 34.0, 28.0, 32.0, 29.0, 34.0, 33.0, 22.0, 12.0, 19.0, 16.0, 10.0, 18.0, 9.0, 10.0, 6.0, 8.0, 3.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9427490234375, -1.879638671875, -1.8165283203125, -1.75341796875, -1.6903076171875, -1.627197265625, -1.5640869140625, -1.5009765625, -1.4378662109375, -1.374755859375, -1.3116455078125, -1.24853515625, -1.1854248046875, -1.122314453125, -1.0592041015625, -0.99609375, -0.9329833984375, -0.869873046875, -0.8067626953125, -0.74365234375, -0.6805419921875, -0.617431640625, -0.5543212890625, -0.4912109375, -0.4281005859375, -0.364990234375, -0.3018798828125, -0.23876953125, -0.1756591796875, -0.112548828125, -0.0494384765625, 0.013671875, 0.0767822265625, 0.139892578125, 0.2030029296875, 0.26611328125, 0.3292236328125, 0.392333984375, 0.4554443359375, 0.5185546875, 0.5816650390625, 0.644775390625, 0.7078857421875, 0.77099609375, 0.8341064453125, 0.897216796875, 0.9603271484375, 1.0234375, 1.0865478515625, 1.149658203125, 1.2127685546875, 1.27587890625, 1.3389892578125, 1.402099609375, 1.4652099609375, 1.5283203125, 1.5914306640625, 1.654541015625, 1.7176513671875, 1.78076171875, 1.8438720703125, 1.906982421875, 1.9700927734375, 2.033203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 13.0, 15.0, 32.0, 25.0, 55.0, 55.0, 120.0, 184.0, 248.0, 388.0, 550.0, 876.0, 1449.0, 2133.0, 3683.0, 6080.0, 10297.0, 17393.0, 30449.0, 52338.0, 88515.0, 137804.0, 179434.0, 177607.0, 132912.0, 84644.0, 50231.0, 29193.0, 16762.0, 9750.0, 5821.0, 3583.0, 2124.0, 1306.0, 847.0, 531.0, 370.0, 252.0, 151.0, 121.0, 74.0, 46.0, 20.0, 21.0, 13.0, 15.0, 9.0, 12.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8191680908203125, -1.760406494140625, -1.7016448974609375, -1.64288330078125, -1.5841217041015625, -1.525360107421875, -1.4665985107421875, -1.4078369140625, -1.3490753173828125, -1.290313720703125, -1.2315521240234375, -1.17279052734375, -1.1140289306640625, -1.055267333984375, -0.9965057373046875, -0.937744140625, -0.8789825439453125, -0.820220947265625, -0.7614593505859375, -0.70269775390625, -0.6439361572265625, -0.585174560546875, -0.5264129638671875, -0.4676513671875, -0.4088897705078125, -0.350128173828125, -0.2913665771484375, -0.23260498046875, -0.1738433837890625, -0.115081787109375, -0.0563201904296875, 0.00244140625, 0.0612030029296875, 0.119964599609375, 0.1787261962890625, 0.23748779296875, 0.2962493896484375, 0.355010986328125, 0.4137725830078125, 0.4725341796875, 0.5312957763671875, 0.590057373046875, 0.6488189697265625, 0.70758056640625, 0.7663421630859375, 0.825103759765625, 0.8838653564453125, 0.942626953125, 1.0013885498046875, 1.060150146484375, 1.1189117431640625, 1.17767333984375, 1.2364349365234375, 1.295196533203125, 1.3539581298828125, 1.4127197265625, 1.4714813232421875, 1.530242919921875, 1.5890045166015625, 1.64776611328125, 1.7065277099609375, 1.765289306640625, 1.8240509033203125, 1.8828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 5.0, 12.0, 18.0, 20.0, 16.0, 32.0, 44.0, 46.0, 58.0, 78.0, 84.0, 89.0, 90.0, 80.0, 78.0, 51.0, 48.0, 31.0, 25.0, 28.0, 10.0, 7.0, 9.0, 6.0, 7.0, 4.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031113624572753906, -0.00030315108597278595, -0.00029516592621803284, -0.0002871807664632797, -0.0002791956067085266, -0.0002712104469537735, -0.0002632252871990204, -0.0002552401274442673, -0.00024725496768951416, -0.00023926980793476105, -0.00023128464818000793, -0.00022329948842525482, -0.0002153143286705017, -0.0002073291689157486, -0.00019934400916099548, -0.00019135884940624237, -0.00018337368965148926, -0.00017538852989673615, -0.00016740337014198303, -0.00015941821038722992, -0.0001514330506324768, -0.0001434478908777237, -0.00013546273112297058, -0.00012747757136821747, -0.00011949241161346436, -0.00011150725185871124, -0.00010352209210395813, -9.553693234920502e-05, -8.75517725944519e-05, -7.956661283969879e-05, -7.158145308494568e-05, -6.359629333019257e-05, -5.561113357543945e-05, -4.762597382068634e-05, -3.964081406593323e-05, -3.1655654311180115e-05, -2.3670494556427002e-05, -1.568533480167389e-05, -7.700175046920776e-06, 2.849847078323364e-07, 8.27014446258545e-06, 1.6255304217338562e-05, 2.4240463972091675e-05, 3.222562372684479e-05, 4.02107834815979e-05, 4.819594323635101e-05, 5.6181102991104126e-05, 6.416626274585724e-05, 7.215142250061035e-05, 8.013658225536346e-05, 8.812174201011658e-05, 9.610690176486969e-05, 0.0001040920615196228, 0.00011207722127437592, 0.00012006238102912903, 0.00012804754078388214, 0.00013603270053863525, 0.00014401786029338837, 0.00015200302004814148, 0.0001599881798028946, 0.0001679733395576477, 0.00017595849931240082, 0.00018394365906715393, 0.00019192881882190704, 0.00019991397857666016]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 2.0, 7.0, 8.0, 3.0, 8.0, 18.0, 26.0, 48.0, 70.0, 95.0, 130.0, 219.0, 304.0, 482.0, 701.0, 1107.0, 1781.0, 3022.0, 5066.0, 8376.0, 15192.0, 26623.0, 48199.0, 87002.0, 142755.0, 194264.0, 190003.0, 136457.0, 81662.0, 45184.0, 25384.0, 13913.0, 8023.0, 4604.0, 2832.0, 1738.0, 1104.0, 751.0, 437.0, 329.0, 201.0, 136.0, 89.0, 64.0, 47.0, 41.0, 16.0, 12.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8515625, -1.78973388671875, -1.7279052734375, -1.66607666015625, -1.604248046875, -1.54241943359375, -1.4805908203125, -1.41876220703125, -1.35693359375, -1.29510498046875, -1.2332763671875, -1.17144775390625, -1.109619140625, -1.04779052734375, -0.9859619140625, -0.92413330078125, -0.8623046875, -0.80047607421875, -0.7386474609375, -0.67681884765625, -0.614990234375, -0.55316162109375, -0.4913330078125, -0.42950439453125, -0.36767578125, -0.30584716796875, -0.2440185546875, -0.18218994140625, -0.120361328125, -0.05853271484375, 0.0032958984375, 0.06512451171875, 0.126953125, 0.18878173828125, 0.2506103515625, 0.31243896484375, 0.374267578125, 0.43609619140625, 0.4979248046875, 0.55975341796875, 0.62158203125, 0.68341064453125, 0.7452392578125, 0.80706787109375, 0.868896484375, 0.93072509765625, 0.9925537109375, 1.05438232421875, 1.1162109375, 1.17803955078125, 1.2398681640625, 1.30169677734375, 1.363525390625, 1.42535400390625, 1.4871826171875, 1.54901123046875, 1.61083984375, 1.67266845703125, 1.7344970703125, 1.79632568359375, 1.858154296875, 1.91998291015625, 1.9818115234375, 2.04364013671875, 2.10546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 8.0, 9.0, 13.0, 13.0, 13.0, 14.0, 16.0, 24.0, 32.0, 32.0, 37.0, 30.0, 35.0, 52.0, 40.0, 41.0, 50.0, 48.0, 58.0, 57.0, 32.0, 44.0, 45.0, 35.0, 34.0, 28.0, 13.0, 23.0, 14.0, 11.0, 14.0, 14.0, 10.0, 5.0, 6.0, 4.0, 1.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.5068359375, -0.4926567077636719, -0.47847747802734375, -0.4642982482910156, -0.4501190185546875, -0.4359397888183594, -0.42176055908203125, -0.4075813293457031, -0.393402099609375, -0.3792228698730469, -0.36504364013671875, -0.3508644104003906, -0.3366851806640625, -0.3225059509277344, -0.30832672119140625, -0.2941474914550781, -0.27996826171875, -0.2657890319824219, -0.25160980224609375, -0.23743057250976562, -0.2232513427734375, -0.20907211303710938, -0.19489288330078125, -0.18071365356445312, -0.166534423828125, -0.15235519409179688, -0.13817596435546875, -0.12399673461914062, -0.1098175048828125, -0.09563827514648438, -0.08145904541015625, -0.06727981567382812, -0.0531005859375, -0.038921356201171875, -0.02474212646484375, -0.010562896728515625, 0.0036163330078125, 0.017795562744140625, 0.03197479248046875, 0.046154022216796875, 0.060333251953125, 0.07451248168945312, 0.08869171142578125, 0.10287094116210938, 0.1170501708984375, 0.13122940063476562, 0.14540863037109375, 0.15958786010742188, 0.17376708984375, 0.18794631958007812, 0.20212554931640625, 0.21630477905273438, 0.2304840087890625, 0.24466323852539062, 0.25884246826171875, 0.2730216979980469, 0.287200927734375, 0.3013801574707031, 0.31555938720703125, 0.3297386169433594, 0.3439178466796875, 0.3580970764160156, 0.37227630615234375, 0.3864555358886719, 0.400634765625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 4.0, 5.0, 7.0, 16.0, 16.0, 21.0, 21.0, 37.0, 49.0, 56.0, 75.0, 95.0, 124.0, 115.0, 103.0, 75.0, 62.0, 41.0, 23.0, 20.0, 16.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.230144500732422, -13.869439125061035, -13.508734703063965, -13.148029327392578, -12.787324905395508, -12.426619529724121, -12.065914154052734, -11.705209732055664, -11.344504356384277, -10.98379898071289, -10.62309455871582, -10.262389183044434, -9.901684761047363, -9.540979385375977, -9.180274963378906, -8.81956958770752, -8.458864212036133, -8.098158836364746, -7.737454414367676, -7.376749038696289, -7.0160441398620605, -6.655339241027832, -6.2946343421936035, -5.933929443359375, -5.573225021362305, -5.212520122528076, -4.851815223693848, -4.491109848022461, -4.130404949188232, -3.769700050354004, -3.4089951515197754, -3.0482900142669678, -2.68758487701416, -2.3268799781799316, -1.966174840927124, -1.6054699420928955, -1.2447649240493774, -0.8840599060058594, -0.5233550071716309, -0.16264986991882324, 0.19805502891540527, 0.5587600469589233, 0.9194650053977966, 1.28016996383667, 1.640874981880188, 2.001579999923706, 2.3622848987579346, 2.722990036010742, 3.0836949348449707, 3.444399833679199, 3.805104970932007, 4.165809631347656, 4.526515007019043, 4.8872199058532715, 5.2479248046875, 5.608630180358887, 5.969334602355957, 6.3300395011901855, 6.690744400024414, 7.051449775695801, 7.412154674530029, 7.772859573364258, 8.133563995361328, 8.494269371032715, 8.854974746704102]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 7.0, 6.0, 9.0, 11.0, 16.0, 15.0, 20.0, 25.0, 23.0, 19.0, 39.0, 36.0, 31.0, 41.0, 32.0, 39.0, 44.0, 41.0, 37.0, 48.0, 48.0, 46.0, 43.0, 39.0, 29.0, 25.0, 28.0, 28.0, 25.0, 25.0, 21.0, 18.0, 16.0, 11.0, 13.0, 7.0, 11.0, 7.0, 6.0, 7.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.568134069442749, -3.462757110595703, -3.3573801517486572, -3.2520031929016113, -3.1466259956359863, -3.0412490367889404, -2.9358720779418945, -2.8304951190948486, -2.7251181602478027, -2.619741201400757, -2.514364242553711, -2.408987045288086, -2.30361008644104, -2.198233127593994, -2.0928561687469482, -1.9874792098999023, -1.8821020126342773, -1.7767250537872314, -1.671347975730896, -1.56597101688385, -1.4605939388275146, -1.3552169799804688, -1.2498400211334229, -1.144463062286377, -1.0390859842300415, -0.9337089657783508, -0.8283319473266602, -0.7229549884796143, -0.6175779700279236, -0.5122009515762329, -0.406823992729187, -0.30144697427749634, -0.19607019424438477, -0.09069319069385529, 0.014683812856674194, 0.12006080150604248, 0.22543781995773315, 0.33081483840942383, 0.4361917972564697, 0.5415688157081604, 0.6469458341598511, 0.7523228526115417, 0.8576998710632324, 0.9630768299102783, 1.0684537887573242, 1.1738308668136597, 1.2792078256607056, 1.384584903717041, 1.489961862564087, 1.5953388214111328, 1.7007158994674683, 1.8060928583145142, 1.9114699363708496, 2.0168468952178955, 2.1222238540649414, 2.2276008129119873, 2.332977771759033, 2.438354730606079, 2.543731689453125, 2.64910888671875, 2.754485845565796, 2.859862804412842, 2.9652397632598877, 3.0706167221069336, 3.1759939193725586]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 3.0, 11.0, 9.0, 8.0, 23.0, 34.0, 59.0, 82.0, 115.0, 233.0, 316.0, 559.0, 1038.0, 1756.0, 3485.0, 6567.0, 13468.0, 29103.0, 68296.0, 184543.0, 588295.0, 1542454.0, 1181063.0, 363582.0, 119565.0, 47219.0, 21063.0, 10033.0, 5162.0, 2721.0, 1448.0, 793.0, 482.0, 260.0, 170.0, 88.0, 58.0, 48.0, 33.0, 14.0, 10.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.828125, -9.56109619140625, -9.2940673828125, -9.02703857421875, -8.760009765625, -8.49298095703125, -8.2259521484375, -7.95892333984375, -7.69189453125, -7.42486572265625, -7.1578369140625, -6.89080810546875, -6.623779296875, -6.35675048828125, -6.0897216796875, -5.82269287109375, -5.5556640625, -5.28863525390625, -5.0216064453125, -4.75457763671875, -4.487548828125, -4.22052001953125, -3.9534912109375, -3.68646240234375, -3.41943359375, -3.15240478515625, -2.8853759765625, -2.61834716796875, -2.351318359375, -2.08428955078125, -1.8172607421875, -1.55023193359375, -1.283203125, -1.01617431640625, -0.7491455078125, -0.48211669921875, -0.215087890625, 0.05194091796875, 0.3189697265625, 0.58599853515625, 0.85302734375, 1.12005615234375, 1.3870849609375, 1.65411376953125, 1.921142578125, 2.18817138671875, 2.4552001953125, 2.72222900390625, 2.9892578125, 3.25628662109375, 3.5233154296875, 3.79034423828125, 4.057373046875, 4.32440185546875, 4.5914306640625, 4.85845947265625, 5.12548828125, 5.39251708984375, 5.6595458984375, 5.92657470703125, 6.193603515625, 6.46063232421875, 6.7276611328125, 6.99468994140625, 7.26171875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 12.0, 10.0, 10.0, 6.0, 12.0, 17.0, 20.0, 24.0, 26.0, 28.0, 37.0, 24.0, 19.0, 45.0, 33.0, 34.0, 53.0, 52.0, 46.0, 48.0, 33.0, 34.0, 39.0, 32.0, 45.0, 33.0, 31.0, 25.0, 26.0, 33.0, 11.0, 22.0, 16.0, 11.0, 10.0, 10.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.830078125, -2.7470703125, -2.6640625, -2.5810546875, -2.498046875, -2.4150390625, -2.33203125, -2.2490234375, -2.166015625, -2.0830078125, -2.0, -1.9169921875, -1.833984375, -1.7509765625, -1.66796875, -1.5849609375, -1.501953125, -1.4189453125, -1.3359375, -1.2529296875, -1.169921875, -1.0869140625, -1.00390625, -0.9208984375, -0.837890625, -0.7548828125, -0.671875, -0.5888671875, -0.505859375, -0.4228515625, -0.33984375, -0.2568359375, -0.173828125, -0.0908203125, -0.0078125, 0.0751953125, 0.158203125, 0.2412109375, 0.32421875, 0.4072265625, 0.490234375, 0.5732421875, 0.65625, 0.7392578125, 0.822265625, 0.9052734375, 0.98828125, 1.0712890625, 1.154296875, 1.2373046875, 1.3203125, 1.4033203125, 1.486328125, 1.5693359375, 1.65234375, 1.7353515625, 1.818359375, 1.9013671875, 1.984375, 2.0673828125, 2.150390625, 2.2333984375, 2.31640625, 2.3994140625, 2.482421875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 17.0, 23.0, 38.0, 70.0, 79.0, 149.0, 176.0, 289.0, 455.0, 641.0, 938.0, 1443.0, 2120.0, 3450.0, 5529.0, 8960.0, 14977.0, 25365.0, 45688.0, 83755.0, 162684.0, 327882.0, 661097.0, 1070692.0, 861286.0, 446648.0, 218567.0, 111505.0, 58797.0, 32582.0, 18614.0, 11028.0, 6664.0, 4163.0, 2688.0, 1692.0, 1199.0, 777.0, 522.0, 344.0, 223.0, 128.0, 99.0, 93.0, 48.0, 28.0, 17.0, 14.0, 12.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.0859375, -5.89404296875, -5.7021484375, -5.51025390625, -5.318359375, -5.12646484375, -4.9345703125, -4.74267578125, -4.55078125, -4.35888671875, -4.1669921875, -3.97509765625, -3.783203125, -3.59130859375, -3.3994140625, -3.20751953125, -3.015625, -2.82373046875, -2.6318359375, -2.43994140625, -2.248046875, -2.05615234375, -1.8642578125, -1.67236328125, -1.48046875, -1.28857421875, -1.0966796875, -0.90478515625, -0.712890625, -0.52099609375, -0.3291015625, -0.13720703125, 0.0546875, 0.24658203125, 0.4384765625, 0.63037109375, 0.822265625, 1.01416015625, 1.2060546875, 1.39794921875, 1.58984375, 1.78173828125, 1.9736328125, 2.16552734375, 2.357421875, 2.54931640625, 2.7412109375, 2.93310546875, 3.125, 3.31689453125, 3.5087890625, 3.70068359375, 3.892578125, 4.08447265625, 4.2763671875, 4.46826171875, 4.66015625, 4.85205078125, 5.0439453125, 5.23583984375, 5.427734375, 5.61962890625, 5.8115234375, 6.00341796875, 6.1953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 5.0, 7.0, 17.0, 16.0, 18.0, 26.0, 48.0, 56.0, 75.0, 108.0, 112.0, 149.0, 204.0, 266.0, 296.0, 361.0, 385.0, 386.0, 334.0, 261.0, 224.0, 179.0, 120.0, 99.0, 81.0, 62.0, 42.0, 30.0, 23.0, 21.0, 13.0, 14.0, 5.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9697265625, -1.8986663818359375, -1.827606201171875, -1.7565460205078125, -1.68548583984375, -1.6144256591796875, -1.543365478515625, -1.4723052978515625, -1.4012451171875, -1.3301849365234375, -1.259124755859375, -1.1880645751953125, -1.11700439453125, -1.0459442138671875, -0.974884033203125, -0.9038238525390625, -0.832763671875, -0.7617034912109375, -0.690643310546875, -0.6195831298828125, -0.54852294921875, -0.4774627685546875, -0.406402587890625, -0.3353424072265625, -0.2642822265625, -0.1932220458984375, -0.122161865234375, -0.0511016845703125, 0.01995849609375, 0.0910186767578125, 0.162078857421875, 0.2331390380859375, 0.30419921875, 0.3752593994140625, 0.446319580078125, 0.5173797607421875, 0.58843994140625, 0.6595001220703125, 0.730560302734375, 0.8016204833984375, 0.8726806640625, 0.9437408447265625, 1.014801025390625, 1.0858612060546875, 1.15692138671875, 1.2279815673828125, 1.299041748046875, 1.3701019287109375, 1.441162109375, 1.5122222900390625, 1.583282470703125, 1.6543426513671875, 1.72540283203125, 1.7964630126953125, 1.867523193359375, 1.9385833740234375, 2.0096435546875, 2.0807037353515625, 2.151763916015625, 2.2228240966796875, 2.29388427734375, 2.3649444580078125, 2.436004638671875, 2.5070648193359375, 2.578125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 0.0, 7.0, 12.0, 11.0, 17.0, 16.0, 20.0, 42.0, 36.0, 52.0, 55.0, 73.0, 94.0, 93.0, 84.0, 86.0, 67.0, 59.0, 46.0, 38.0, 22.0, 22.0, 20.0, 8.0, 5.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.97739315032959, -10.66610336303711, -10.354814529418945, -10.043524742126465, -9.732234954833984, -9.42094612121582, -9.10965633392334, -8.79836654663086, -8.487077713012695, -8.175787925720215, -7.864498615264893, -7.55320930480957, -7.24191951751709, -6.930630207061768, -6.619340896606445, -6.308051109313965, -5.996761322021484, -5.685472011566162, -5.374182224273682, -5.062892913818359, -4.751603126525879, -4.440313816070557, -4.129024505615234, -3.817734956741333, -3.5064454078674316, -3.1951558589935303, -2.883866310119629, -2.5725769996643066, -2.2612874507904053, -1.949997901916504, -1.638708472251892, -1.3274190425872803, -1.0161304473876953, -0.7048409581184387, -0.39355146884918213, -0.08226197957992554, 0.22902750968933105, 0.5403170585632324, 0.8516064882278442, 1.162895917892456, 1.4741854667663574, 1.7854750156402588, 2.09676456451416, 2.4080538749694824, 2.719343423843384, 3.030632972717285, 3.3419222831726074, 3.653211832046509, 3.96450138092041, 4.275790691375732, 4.587080478668213, 4.898369789123535, 5.209659576416016, 5.520948886871338, 5.83223819732666, 6.143527984619141, 6.454817295074463, 6.766106605529785, 7.077396392822266, 7.388685703277588, 7.69997501373291, 8.01126480102539, 8.322554588317871, 8.633843421936035, 8.945133209228516]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 11.0, 13.0, 6.0, 18.0, 15.0, 30.0, 27.0, 32.0, 32.0, 36.0, 36.0, 35.0, 36.0, 38.0, 36.0, 36.0, 45.0, 48.0, 35.0, 36.0, 50.0, 35.0, 37.0, 28.0, 37.0, 24.0, 20.0, 28.0, 26.0, 14.0, 16.0, 10.0, 12.0, 10.0, 6.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7475574016571045, -3.6351704597473145, -3.5227832794189453, -3.4103963375091553, -3.2980093955993652, -3.185622215270996, -3.073235273361206, -2.960848331451416, -2.848461151123047, -2.736074209213257, -2.6236870288848877, -2.5113000869750977, -2.3989131450653076, -2.2865259647369385, -2.1741390228271484, -2.0617518424987793, -1.9493650197982788, -1.8369779586791992, -1.7245910167694092, -1.6122039556503296, -1.49981689453125, -1.38742995262146, -1.2750428915023804, -1.1626558303833008, -1.0502688884735107, -0.9378818869590759, -0.8254948258399963, -0.7131078243255615, -0.6007207632064819, -0.4883337616920471, -0.3759467601776123, -0.2635596990585327, -0.15117263793945312, -0.03878561407327652, 0.07360140979290009, 0.1859884262084961, 0.2983754575252533, 0.4107624888420105, 0.5231494903564453, 0.6355365514755249, 0.7479235529899597, 0.8603105545043945, 0.9726976156234741, 1.0850846767425537, 1.1974716186523438, 1.3098586797714233, 1.422245740890503, 1.534632682800293, 1.6470197439193726, 1.7594068050384521, 1.8717937469482422, 1.9841808080673218, 2.0965678691864014, 2.2089548110961914, 2.3213419914245605, 2.4337289333343506, 2.5461158752441406, 2.6585028171539307, 2.7708899974823, 2.88327693939209, 2.99566388130188, 3.108051061630249, 3.220438003540039, 3.332825183868408, 3.4452121257781982]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 10.0, 17.0, 28.0, 28.0, 41.0, 56.0, 105.0, 152.0, 218.0, 370.0, 632.0, 1127.0, 2162.0, 4173.0, 9078.0, 21074.0, 51938.0, 129165.0, 266679.0, 293260.0, 156473.0, 64576.0, 25832.0, 10858.0, 4887.0, 2421.0, 1264.0, 696.0, 430.0, 269.0, 173.0, 111.0, 71.0, 51.0, 42.0, 35.0, 14.0, 12.0, 6.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.713134765625, -4.57080078125, -4.428466796875, -4.2861328125, -4.143798828125, -4.00146484375, -3.859130859375, -3.716796875, -3.574462890625, -3.43212890625, -3.289794921875, -3.1474609375, -3.005126953125, -2.86279296875, -2.720458984375, -2.578125, -2.435791015625, -2.29345703125, -2.151123046875, -2.0087890625, -1.866455078125, -1.72412109375, -1.581787109375, -1.439453125, -1.297119140625, -1.15478515625, -1.012451171875, -0.8701171875, -0.727783203125, -0.58544921875, -0.443115234375, -0.30078125, -0.158447265625, -0.01611328125, 0.126220703125, 0.2685546875, 0.410888671875, 0.55322265625, 0.695556640625, 0.837890625, 0.980224609375, 1.12255859375, 1.264892578125, 1.4072265625, 1.549560546875, 1.69189453125, 1.834228515625, 1.9765625, 2.118896484375, 2.26123046875, 2.403564453125, 2.5458984375, 2.688232421875, 2.83056640625, 2.972900390625, 3.115234375, 3.257568359375, 3.39990234375, 3.542236328125, 3.6845703125, 3.826904296875, 3.96923828125, 4.111572265625, 4.25390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 17.0, 15.0, 16.0, 15.0, 22.0, 19.0, 28.0, 22.0, 35.0, 42.0, 35.0, 35.0, 35.0, 43.0, 44.0, 50.0, 41.0, 45.0, 36.0, 35.0, 44.0, 33.0, 31.0, 41.0, 25.0, 28.0, 24.0, 22.0, 23.0, 12.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.98114013671875, -3.8529052734375, -3.72467041015625, -3.596435546875, -3.46820068359375, -3.3399658203125, -3.21173095703125, -3.08349609375, -2.95526123046875, -2.8270263671875, -2.69879150390625, -2.570556640625, -2.44232177734375, -2.3140869140625, -2.18585205078125, -2.0576171875, -1.92938232421875, -1.8011474609375, -1.67291259765625, -1.544677734375, -1.41644287109375, -1.2882080078125, -1.15997314453125, -1.03173828125, -0.90350341796875, -0.7752685546875, -0.64703369140625, -0.518798828125, -0.39056396484375, -0.2623291015625, -0.13409423828125, -0.005859375, 0.12237548828125, 0.2506103515625, 0.37884521484375, 0.507080078125, 0.63531494140625, 0.7635498046875, 0.89178466796875, 1.02001953125, 1.14825439453125, 1.2764892578125, 1.40472412109375, 1.532958984375, 1.66119384765625, 1.7894287109375, 1.91766357421875, 2.0458984375, 2.17413330078125, 2.3023681640625, 2.43060302734375, 2.558837890625, 2.68707275390625, 2.8153076171875, 2.94354248046875, 3.07177734375, 3.20001220703125, 3.3282470703125, 3.45648193359375, 3.584716796875, 3.71295166015625, 3.8411865234375, 3.96942138671875, 4.09765625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 18.0, 22.0, 24.0, 37.0, 63.0, 63.0, 100.0, 143.0, 198.0, 272.0, 444.0, 680.0, 997.0, 1678.0, 2810.0, 4778.0, 9095.0, 17394.0, 35275.0, 72610.0, 146892.0, 248566.0, 236627.0, 134408.0, 66748.0, 32507.0, 16047.0, 8477.0, 4530.0, 2569.0, 1567.0, 917.0, 594.0, 429.0, 293.0, 185.0, 125.0, 100.0, 71.0, 52.0, 39.0, 23.0, 28.0, 9.0, 10.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.0, -3.874755859375, -3.74951171875, -3.624267578125, -3.4990234375, -3.373779296875, -3.24853515625, -3.123291015625, -2.998046875, -2.872802734375, -2.74755859375, -2.622314453125, -2.4970703125, -2.371826171875, -2.24658203125, -2.121337890625, -1.99609375, -1.870849609375, -1.74560546875, -1.620361328125, -1.4951171875, -1.369873046875, -1.24462890625, -1.119384765625, -0.994140625, -0.868896484375, -0.74365234375, -0.618408203125, -0.4931640625, -0.367919921875, -0.24267578125, -0.117431640625, 0.0078125, 0.133056640625, 0.25830078125, 0.383544921875, 0.5087890625, 0.634033203125, 0.75927734375, 0.884521484375, 1.009765625, 1.135009765625, 1.26025390625, 1.385498046875, 1.5107421875, 1.635986328125, 1.76123046875, 1.886474609375, 2.01171875, 2.136962890625, 2.26220703125, 2.387451171875, 2.5126953125, 2.637939453125, 2.76318359375, 2.888427734375, 3.013671875, 3.138916015625, 3.26416015625, 3.389404296875, 3.5146484375, 3.639892578125, 3.76513671875, 3.890380859375, 4.015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 12.0, 9.0, 10.0, 15.0, 23.0, 23.0, 29.0, 31.0, 25.0, 24.0, 22.0, 31.0, 45.0, 40.0, 41.0, 40.0, 49.0, 33.0, 51.0, 44.0, 44.0, 38.0, 36.0, 28.0, 31.0, 30.0, 20.0, 32.0, 27.0, 22.0, 13.0, 13.0, 11.0, 12.0, 13.0, 1.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9066925048828125, -1.833892822265625, -1.7610931396484375, -1.68829345703125, -1.6154937744140625, -1.542694091796875, -1.4698944091796875, -1.3970947265625, -1.3242950439453125, -1.251495361328125, -1.1786956787109375, -1.10589599609375, -1.0330963134765625, -0.960296630859375, -0.8874969482421875, -0.814697265625, -0.7418975830078125, -0.669097900390625, -0.5962982177734375, -0.52349853515625, -0.4506988525390625, -0.377899169921875, -0.3050994873046875, -0.2322998046875, -0.1595001220703125, -0.086700439453125, -0.0139007568359375, 0.05889892578125, 0.1316986083984375, 0.204498291015625, 0.2772979736328125, 0.35009765625, 0.4228973388671875, 0.495697021484375, 0.5684967041015625, 0.64129638671875, 0.7140960693359375, 0.786895751953125, 0.8596954345703125, 0.9324951171875, 1.0052947998046875, 1.078094482421875, 1.1508941650390625, 1.22369384765625, 1.2964935302734375, 1.369293212890625, 1.4420928955078125, 1.514892578125, 1.5876922607421875, 1.660491943359375, 1.7332916259765625, 1.80609130859375, 1.8788909912109375, 1.951690673828125, 2.0244903564453125, 2.0972900390625, 2.1700897216796875, 2.242889404296875, 2.3156890869140625, 2.38848876953125, 2.4612884521484375, 2.534088134765625, 2.6068878173828125, 2.6796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 12.0, 17.0, 16.0, 28.0, 46.0, 59.0, 75.0, 132.0, 171.0, 271.0, 352.0, 546.0, 795.0, 1271.0, 2047.0, 3299.0, 5585.0, 9786.0, 18455.0, 36346.0, 74646.0, 156431.0, 271863.0, 230667.0, 117760.0, 56039.0, 27531.0, 14359.0, 7896.0, 4467.0, 2655.0, 1682.0, 1045.0, 660.0, 469.0, 309.0, 214.0, 163.0, 101.0, 68.0, 53.0, 45.0, 27.0, 18.0, 15.0, 12.0, 8.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7601776123046875, -1.699066162109375, -1.6379547119140625, -1.57684326171875, -1.5157318115234375, -1.454620361328125, -1.3935089111328125, -1.3323974609375, -1.2712860107421875, -1.210174560546875, -1.1490631103515625, -1.08795166015625, -1.0268402099609375, -0.965728759765625, -0.9046173095703125, -0.843505859375, -0.7823944091796875, -0.721282958984375, -0.6601715087890625, -0.59906005859375, -0.5379486083984375, -0.476837158203125, -0.4157257080078125, -0.3546142578125, -0.2935028076171875, -0.232391357421875, -0.1712799072265625, -0.11016845703125, -0.0490570068359375, 0.012054443359375, 0.0731658935546875, 0.13427734375, 0.1953887939453125, 0.256500244140625, 0.3176116943359375, 0.37872314453125, 0.4398345947265625, 0.500946044921875, 0.5620574951171875, 0.6231689453125, 0.6842803955078125, 0.745391845703125, 0.8065032958984375, 0.86761474609375, 0.9287261962890625, 0.989837646484375, 1.0509490966796875, 1.112060546875, 1.1731719970703125, 1.234283447265625, 1.2953948974609375, 1.35650634765625, 1.4176177978515625, 1.478729248046875, 1.5398406982421875, 1.6009521484375, 1.6620635986328125, 1.723175048828125, 1.7842864990234375, 1.84539794921875, 1.9065093994140625, 1.967620849609375, 2.0287322998046875, 2.08984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 8.0, 22.0, 17.0, 22.0, 25.0, 28.0, 47.0, 50.0, 70.0, 62.0, 74.0, 91.0, 88.0, 72.0, 56.0, 54.0, 47.0, 34.0, 20.0, 22.0, 14.0, 18.0, 7.0, 3.0, 5.0, 8.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012350082397460938, -0.00012022629380226135, -0.00011695176362991333, -0.00011367723345756531, -0.00011040270328521729, -0.00010712817311286926, -0.00010385364294052124, -0.00010057911276817322, -9.73045825958252e-05, -9.403005242347717e-05, -9.075552225112915e-05, -8.748099207878113e-05, -8.42064619064331e-05, -8.093193173408508e-05, -7.765740156173706e-05, -7.438287138938904e-05, -7.110834121704102e-05, -6.783381104469299e-05, -6.455928087234497e-05, -6.128475069999695e-05, -5.8010220527648926e-05, -5.47356903553009e-05, -5.146116018295288e-05, -4.818663001060486e-05, -4.4912099838256836e-05, -4.1637569665908813e-05, -3.836303949356079e-05, -3.508850932121277e-05, -3.1813979148864746e-05, -2.8539448976516724e-05, -2.52649188041687e-05, -2.199038863182068e-05, -1.8715858459472656e-05, -1.5441328287124634e-05, -1.2166798114776611e-05, -8.892267942428589e-06, -5.617737770080566e-06, -2.343207597732544e-06, 9.313225746154785e-07, 4.205852746963501e-06, 7.4803829193115234e-06, 1.0754913091659546e-05, 1.4029443264007568e-05, 1.730397343635559e-05, 2.0578503608703613e-05, 2.3853033781051636e-05, 2.7127563953399658e-05, 3.040209412574768e-05, 3.36766242980957e-05, 3.6951154470443726e-05, 4.022568464279175e-05, 4.350021481513977e-05, 4.677474498748779e-05, 5.0049275159835815e-05, 5.332380533218384e-05, 5.659833550453186e-05, 5.987286567687988e-05, 6.31473958492279e-05, 6.642192602157593e-05, 6.969645619392395e-05, 7.297098636627197e-05, 7.624551653862e-05, 7.952004671096802e-05, 8.279457688331604e-05, 8.606910705566406e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 10.0, 13.0, 19.0, 25.0, 41.0, 80.0, 123.0, 168.0, 224.0, 381.0, 577.0, 900.0, 1442.0, 2655.0, 4607.0, 9008.0, 19278.0, 45429.0, 110682.0, 235172.0, 294712.0, 181672.0, 78491.0, 32730.0, 14067.0, 6838.0, 3654.0, 2133.0, 1285.0, 741.0, 508.0, 284.0, 194.0, 144.0, 77.0, 70.0, 45.0, 32.0, 22.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.7950439453125, -1.726806640625, -1.6585693359375, -1.59033203125, -1.5220947265625, -1.453857421875, -1.3856201171875, -1.3173828125, -1.2491455078125, -1.180908203125, -1.1126708984375, -1.04443359375, -0.9761962890625, -0.907958984375, -0.8397216796875, -0.771484375, -0.7032470703125, -0.635009765625, -0.5667724609375, -0.49853515625, -0.4302978515625, -0.362060546875, -0.2938232421875, -0.2255859375, -0.1573486328125, -0.089111328125, -0.0208740234375, 0.04736328125, 0.1156005859375, 0.183837890625, 0.2520751953125, 0.3203125, 0.3885498046875, 0.456787109375, 0.5250244140625, 0.59326171875, 0.6614990234375, 0.729736328125, 0.7979736328125, 0.8662109375, 0.9344482421875, 1.002685546875, 1.0709228515625, 1.13916015625, 1.2073974609375, 1.275634765625, 1.3438720703125, 1.412109375, 1.4803466796875, 1.548583984375, 1.6168212890625, 1.68505859375, 1.7532958984375, 1.821533203125, 1.8897705078125, 1.9580078125, 2.0262451171875, 2.094482421875, 2.1627197265625, 2.23095703125, 2.2991943359375, 2.367431640625, 2.4356689453125, 2.50390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 7.0, 13.0, 17.0, 15.0, 17.0, 23.0, 28.0, 30.0, 39.0, 46.0, 50.0, 64.0, 55.0, 73.0, 56.0, 63.0, 73.0, 64.0, 54.0, 34.0, 31.0, 27.0, 22.0, 20.0, 11.0, 11.0, 7.0, 10.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404541015625, -0.3915138244628906, -0.37848663330078125, -0.3654594421386719, -0.3524322509765625, -0.3394050598144531, -0.32637786865234375, -0.3133506774902344, -0.300323486328125, -0.2872962951660156, -0.27426910400390625, -0.2612419128417969, -0.2482147216796875, -0.23518753051757812, -0.22216033935546875, -0.20913314819335938, -0.19610595703125, -0.18307876586914062, -0.17005157470703125, -0.15702438354492188, -0.1439971923828125, -0.13097000122070312, -0.11794281005859375, -0.10491561889648438, -0.091888427734375, -0.07886123657226562, -0.06583404541015625, -0.052806854248046875, -0.0397796630859375, -0.026752471923828125, -0.01372528076171875, -0.000698089599609375, 0.0123291015625, 0.025356292724609375, 0.03838348388671875, 0.051410675048828125, 0.0644378662109375, 0.07746505737304688, 0.09049224853515625, 0.10351943969726562, 0.116546630859375, 0.12957382202148438, 0.14260101318359375, 0.15562820434570312, 0.1686553955078125, 0.18168258666992188, 0.19470977783203125, 0.20773696899414062, 0.22076416015625, 0.23379135131835938, 0.24681854248046875, 0.2598457336425781, 0.2728729248046875, 0.2859001159667969, 0.29892730712890625, 0.3119544982910156, 0.324981689453125, 0.3380088806152344, 0.35103607177734375, 0.3640632629394531, 0.3770904541015625, 0.3901176452636719, 0.40314483642578125, 0.4161720275878906, 0.42919921875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 9.0, 7.0, 9.0, 20.0, 22.0, 33.0, 36.0, 49.0, 57.0, 76.0, 83.0, 95.0, 87.0, 92.0, 68.0, 65.0, 54.0, 27.0, 32.0, 15.0, 28.0, 12.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.881915092468262, -10.567342758178711, -10.25277042388916, -9.938197135925293, -9.623624801635742, -9.309052467346191, -8.99448013305664, -8.67990779876709, -8.365335464477539, -8.050763130187988, -7.736190319061279, -7.4216179847717285, -7.1070451736450195, -6.792472839355469, -6.477900505065918, -6.163328170776367, -5.8487548828125, -5.534182548522949, -5.21960973739624, -4.9050374031066895, -4.5904645919799805, -4.27589225769043, -3.961319923400879, -3.646747350692749, -3.332174777984619, -3.0176022052764893, -2.7030296325683594, -2.3884572982788086, -2.0738847255706787, -1.7593121528625488, -1.4447396993637085, -1.1301672458648682, -0.8155937194824219, -0.5010212063789368, -0.18644869327545166, 0.12812381982803345, 0.44269633293151855, 0.7572689056396484, 1.0718413591384888, 1.386413812637329, 1.700986385345459, 2.015558958053589, 2.3301315307617188, 2.6447038650512695, 2.9592764377593994, 3.2738490104675293, 3.58842134475708, 3.90299391746521, 4.21756649017334, 4.532138824462891, 4.8467116355896, 5.16128396987915, 5.475856781005859, 5.79042911529541, 6.105001449584961, 6.419573783874512, 6.734146595001221, 7.0487189292907715, 7.3632917404174805, 7.677864074707031, 7.992436408996582, 8.307008743286133, 8.62158203125, 8.93615436553955, 9.250726699829102]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 11.0, 8.0, 11.0, 10.0, 12.0, 9.0, 24.0, 31.0, 25.0, 29.0, 31.0, 41.0, 36.0, 37.0, 37.0, 31.0, 40.0, 37.0, 42.0, 53.0, 32.0, 37.0, 44.0, 29.0, 39.0, 31.0, 29.0, 34.0, 21.0, 26.0, 23.0, 15.0, 13.0, 11.0, 12.0, 10.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.650895357131958, -3.541168689727783, -3.4314420223236084, -3.3217153549194336, -3.211988687515259, -3.102262020111084, -2.992535352706909, -2.8828086853027344, -2.7730820178985596, -2.6633553504943848, -2.55362868309021, -2.443902015686035, -2.3341753482818604, -2.2244486808776855, -2.1147220134735107, -2.004995346069336, -1.8952686786651611, -1.7855420112609863, -1.6758153438568115, -1.5660886764526367, -1.456362009048462, -1.346635341644287, -1.2369086742401123, -1.1271820068359375, -1.0174553394317627, -0.9077286720275879, -0.7980020046234131, -0.6882753372192383, -0.5785486698150635, -0.46882200241088867, -0.35909533500671387, -0.24936866760253906, -0.13964200019836426, -0.029915332794189453, 0.07981133460998535, 0.18953800201416016, 0.29926466941833496, 0.40899133682250977, 0.5187180042266846, 0.6284446716308594, 0.7381713390350342, 0.847898006439209, 0.9576246738433838, 1.0673513412475586, 1.1770780086517334, 1.2868046760559082, 1.396531343460083, 1.5062580108642578, 1.6159846782684326, 1.7257113456726074, 1.8354380130767822, 1.945164680480957, 2.054891347885132, 2.1646180152893066, 2.2743446826934814, 2.3840713500976562, 2.493798017501831, 2.603524684906006, 2.7132513523101807, 2.8229780197143555, 2.9327046871185303, 3.042431354522705, 3.15215802192688, 3.2618846893310547, 3.3716113567352295]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 13.0, 25.0, 28.0, 58.0, 76.0, 117.0, 176.0, 269.0, 387.0, 665.0, 1134.0, 1796.0, 3065.0, 5379.0, 9753.0, 18085.0, 34661.0, 65334.0, 118796.0, 184177.0, 211898.0, 168341.0, 103833.0, 55745.0, 29240.0, 15454.0, 8384.0, 4786.0, 2625.0, 1600.0, 967.0, 570.0, 361.0, 216.0, 184.0, 120.0, 70.0, 36.0, 40.0, 30.0, 15.0, 13.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.52734375, -6.33746337890625, -6.1475830078125, -5.95770263671875, -5.767822265625, -5.57794189453125, -5.3880615234375, -5.19818115234375, -5.00830078125, -4.81842041015625, -4.6285400390625, -4.43865966796875, -4.248779296875, -4.05889892578125, -3.8690185546875, -3.67913818359375, -3.4892578125, -3.29937744140625, -3.1094970703125, -2.91961669921875, -2.729736328125, -2.53985595703125, -2.3499755859375, -2.16009521484375, -1.97021484375, -1.78033447265625, -1.5904541015625, -1.40057373046875, -1.210693359375, -1.02081298828125, -0.8309326171875, -0.64105224609375, -0.451171875, -0.26129150390625, -0.0714111328125, 0.11846923828125, 0.308349609375, 0.49822998046875, 0.6881103515625, 0.87799072265625, 1.06787109375, 1.25775146484375, 1.4476318359375, 1.63751220703125, 1.827392578125, 2.01727294921875, 2.2071533203125, 2.39703369140625, 2.5869140625, 2.77679443359375, 2.9666748046875, 3.15655517578125, 3.346435546875, 3.53631591796875, 3.7261962890625, 3.91607666015625, 4.10595703125, 4.29583740234375, 4.4857177734375, 4.67559814453125, 4.865478515625, 5.05535888671875, 5.2452392578125, 5.43511962890625, 5.625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 2.0, 6.0, 9.0, 12.0, 9.0, 5.0, 10.0, 16.0, 16.0, 22.0, 25.0, 24.0, 27.0, 31.0, 21.0, 34.0, 36.0, 36.0, 38.0, 34.0, 44.0, 34.0, 29.0, 44.0, 31.0, 47.0, 37.0, 35.0, 33.0, 19.0, 33.0, 23.0, 23.0, 19.0, 18.0, 15.0, 16.0, 10.0, 9.0, 10.0, 6.0, 10.0, 5.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.703125, -3.59429931640625, -3.4854736328125, -3.37664794921875, -3.267822265625, -3.15899658203125, -3.0501708984375, -2.94134521484375, -2.83251953125, -2.72369384765625, -2.6148681640625, -2.50604248046875, -2.397216796875, -2.28839111328125, -2.1795654296875, -2.07073974609375, -1.9619140625, -1.85308837890625, -1.7442626953125, -1.63543701171875, -1.526611328125, -1.41778564453125, -1.3089599609375, -1.20013427734375, -1.09130859375, -0.98248291015625, -0.8736572265625, -0.76483154296875, -0.656005859375, -0.54718017578125, -0.4383544921875, -0.32952880859375, -0.220703125, -0.11187744140625, -0.0030517578125, 0.10577392578125, 0.214599609375, 0.32342529296875, 0.4322509765625, 0.54107666015625, 0.64990234375, 0.75872802734375, 0.8675537109375, 0.97637939453125, 1.085205078125, 1.19403076171875, 1.3028564453125, 1.41168212890625, 1.5205078125, 1.62933349609375, 1.7381591796875, 1.84698486328125, 1.955810546875, 2.06463623046875, 2.1734619140625, 2.28228759765625, 2.39111328125, 2.49993896484375, 2.6087646484375, 2.71759033203125, 2.826416015625, 2.93524169921875, 3.0440673828125, 3.15289306640625, 3.26171875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 6.0, 7.0, 7.0, 11.0, 12.0, 35.0, 22.0, 41.0, 62.0, 83.0, 169.0, 228.0, 384.0, 708.0, 1193.0, 2024.0, 3691.0, 6705.0, 12706.0, 24131.0, 45977.0, 85213.0, 141951.0, 192424.0, 194864.0, 145259.0, 88189.0, 48072.0, 25407.0, 12981.0, 7028.0, 3816.0, 2124.0, 1213.0, 698.0, 420.0, 239.0, 151.0, 100.0, 61.0, 52.0, 29.0, 18.0, 12.0, 7.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.0078125, -5.82025146484375, -5.6326904296875, -5.44512939453125, -5.257568359375, -5.07000732421875, -4.8824462890625, -4.69488525390625, -4.50732421875, -4.31976318359375, -4.1322021484375, -3.94464111328125, -3.757080078125, -3.56951904296875, -3.3819580078125, -3.19439697265625, -3.0068359375, -2.81927490234375, -2.6317138671875, -2.44415283203125, -2.256591796875, -2.06903076171875, -1.8814697265625, -1.69390869140625, -1.50634765625, -1.31878662109375, -1.1312255859375, -0.94366455078125, -0.756103515625, -0.56854248046875, -0.3809814453125, -0.19342041015625, -0.005859375, 0.18170166015625, 0.3692626953125, 0.55682373046875, 0.744384765625, 0.93194580078125, 1.1195068359375, 1.30706787109375, 1.49462890625, 1.68218994140625, 1.8697509765625, 2.05731201171875, 2.244873046875, 2.43243408203125, 2.6199951171875, 2.80755615234375, 2.9951171875, 3.18267822265625, 3.3702392578125, 3.55780029296875, 3.745361328125, 3.93292236328125, 4.1204833984375, 4.30804443359375, 4.49560546875, 4.68316650390625, 4.8707275390625, 5.05828857421875, 5.245849609375, 5.43341064453125, 5.6209716796875, 5.80853271484375, 5.99609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 7.0, 10.0, 8.0, 10.0, 15.0, 17.0, 14.0, 26.0, 37.0, 23.0, 31.0, 39.0, 42.0, 35.0, 45.0, 40.0, 57.0, 47.0, 40.0, 52.0, 47.0, 49.0, 39.0, 42.0, 28.0, 25.0, 27.0, 19.0, 24.0, 20.0, 17.0, 15.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6328125, -2.553680419921875, -2.47454833984375, -2.395416259765625, -2.3162841796875, -2.237152099609375, -2.15802001953125, -2.078887939453125, -1.999755859375, -1.920623779296875, -1.84149169921875, -1.762359619140625, -1.6832275390625, -1.604095458984375, -1.52496337890625, -1.445831298828125, -1.36669921875, -1.287567138671875, -1.20843505859375, -1.129302978515625, -1.0501708984375, -0.971038818359375, -0.89190673828125, -0.812774658203125, -0.733642578125, -0.654510498046875, -0.57537841796875, -0.496246337890625, -0.4171142578125, -0.337982177734375, -0.25885009765625, -0.179718017578125, -0.1005859375, -0.021453857421875, 0.05767822265625, 0.136810302734375, 0.2159423828125, 0.295074462890625, 0.37420654296875, 0.453338623046875, 0.532470703125, 0.611602783203125, 0.69073486328125, 0.769866943359375, 0.8489990234375, 0.928131103515625, 1.00726318359375, 1.086395263671875, 1.16552734375, 1.244659423828125, 1.32379150390625, 1.402923583984375, 1.4820556640625, 1.561187744140625, 1.64031982421875, 1.719451904296875, 1.798583984375, 1.877716064453125, 1.95684814453125, 2.035980224609375, 2.1151123046875, 2.194244384765625, 2.27337646484375, 2.352508544921875, 2.431640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 11.0, 19.0, 26.0, 35.0, 39.0, 70.0, 103.0, 175.0, 237.0, 376.0, 622.0, 894.0, 1536.0, 2449.0, 3710.0, 6020.0, 9949.0, 16590.0, 28698.0, 49650.0, 84404.0, 134556.0, 181993.0, 182640.0, 135569.0, 85288.0, 50206.0, 28886.0, 17128.0, 10133.0, 6132.0, 3859.0, 2361.0, 1525.0, 909.0, 611.0, 387.0, 277.0, 172.0, 102.0, 60.0, 50.0, 31.0, 17.0, 15.0, 11.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.671875, -2.588409423828125, -2.50494384765625, -2.421478271484375, -2.3380126953125, -2.254547119140625, -2.17108154296875, -2.087615966796875, -2.004150390625, -1.920684814453125, -1.83721923828125, -1.753753662109375, -1.6702880859375, -1.586822509765625, -1.50335693359375, -1.419891357421875, -1.33642578125, -1.252960205078125, -1.16949462890625, -1.086029052734375, -1.0025634765625, -0.919097900390625, -0.83563232421875, -0.752166748046875, -0.668701171875, -0.585235595703125, -0.50177001953125, -0.418304443359375, -0.3348388671875, -0.251373291015625, -0.16790771484375, -0.084442138671875, -0.0009765625, 0.082489013671875, 0.16595458984375, 0.249420166015625, 0.3328857421875, 0.416351318359375, 0.49981689453125, 0.583282470703125, 0.666748046875, 0.750213623046875, 0.83367919921875, 0.917144775390625, 1.0006103515625, 1.084075927734375, 1.16754150390625, 1.251007080078125, 1.33447265625, 1.417938232421875, 1.50140380859375, 1.584869384765625, 1.6683349609375, 1.751800537109375, 1.83526611328125, 1.918731689453125, 2.002197265625, 2.085662841796875, 2.16912841796875, 2.252593994140625, 2.3360595703125, 2.419525146484375, 2.50299072265625, 2.586456298828125, 2.669921875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 18.0, 17.0, 29.0, 35.0, 32.0, 58.0, 47.0, 62.0, 66.0, 67.0, 76.0, 83.0, 64.0, 56.0, 53.0, 42.0, 20.0, 30.0, 17.0, 14.0, 10.0, 9.0, 17.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.0004024505615234375, -0.00039162859320640564, -0.0003808066248893738, -0.0003699846565723419, -0.00035916268825531006, -0.0003483407199382782, -0.00033751875162124634, -0.0003266967833042145, -0.0003158748149871826, -0.00030505284667015076, -0.0002942308783531189, -0.00028340891003608704, -0.0002725869417190552, -0.0002617649734020233, -0.00025094300508499146, -0.0002401210367679596, -0.00022929906845092773, -0.00021847710013389587, -0.00020765513181686401, -0.00019683316349983215, -0.0001860111951828003, -0.00017518922686576843, -0.00016436725854873657, -0.0001535452902317047, -0.00014272332191467285, -0.000131901353597641, -0.00012107938528060913, -0.00011025741696357727, -9.943544864654541e-05, -8.861348032951355e-05, -7.779151201248169e-05, -6.696954369544983e-05, -5.614757537841797e-05, -4.532560706138611e-05, -3.450363874435425e-05, -2.3681670427322388e-05, -1.2859702110290527e-05, -2.037733793258667e-06, 8.784234523773193e-06, 1.9606202840805054e-05, 3.0428171157836914e-05, 4.1250139474868774e-05, 5.2072107791900635e-05, 6.28940761089325e-05, 7.371604442596436e-05, 8.453801274299622e-05, 9.535998106002808e-05, 0.00010618194937705994, 0.0001170039176940918, 0.00012782588601112366, 0.00013864785432815552, 0.00014946982264518738, 0.00016029179096221924, 0.0001711137592792511, 0.00018193572759628296, 0.00019275769591331482, 0.00020357966423034668, 0.00021440163254737854, 0.0002252236008644104, 0.00023604556918144226, 0.0002468675374984741, 0.000257689505815506, 0.00026851147413253784, 0.0002793334424495697, 0.00029015541076660156]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 7.0, 14.0, 15.0, 24.0, 27.0, 35.0, 58.0, 76.0, 79.0, 111.0, 152.0, 230.0, 311.0, 470.0, 729.0, 1156.0, 1699.0, 2753.0, 4398.0, 7269.0, 12256.0, 21314.0, 36587.0, 61967.0, 101222.0, 146394.0, 176023.0, 162473.0, 120441.0, 77193.0, 46312.0, 26897.0, 15906.0, 9003.0, 5451.0, 3377.0, 2087.0, 1288.0, 882.0, 534.0, 397.0, 264.0, 172.0, 126.0, 108.0, 69.0, 40.0, 38.0, 40.0, 26.0, 21.0, 10.0, 12.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.1015625, -2.03314208984375, -1.9647216796875, -1.89630126953125, -1.827880859375, -1.75946044921875, -1.6910400390625, -1.62261962890625, -1.55419921875, -1.48577880859375, -1.4173583984375, -1.34893798828125, -1.280517578125, -1.21209716796875, -1.1436767578125, -1.07525634765625, -1.0068359375, -0.93841552734375, -0.8699951171875, -0.80157470703125, -0.733154296875, -0.66473388671875, -0.5963134765625, -0.52789306640625, -0.45947265625, -0.39105224609375, -0.3226318359375, -0.25421142578125, -0.185791015625, -0.11737060546875, -0.0489501953125, 0.01947021484375, 0.087890625, 0.15631103515625, 0.2247314453125, 0.29315185546875, 0.361572265625, 0.42999267578125, 0.4984130859375, 0.56683349609375, 0.63525390625, 0.70367431640625, 0.7720947265625, 0.84051513671875, 0.908935546875, 0.97735595703125, 1.0457763671875, 1.11419677734375, 1.1826171875, 1.25103759765625, 1.3194580078125, 1.38787841796875, 1.456298828125, 1.52471923828125, 1.5931396484375, 1.66156005859375, 1.72998046875, 1.79840087890625, 1.8668212890625, 1.93524169921875, 2.003662109375, 2.07208251953125, 2.1405029296875, 2.20892333984375, 2.27734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 16.0, 9.0, 22.0, 27.0, 36.0, 37.0, 54.0, 59.0, 67.0, 74.0, 66.0, 64.0, 73.0, 70.0, 59.0, 54.0, 49.0, 26.0, 23.0, 27.0, 23.0, 9.0, 15.0, 12.0, 3.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0234375, -0.9976119995117188, -0.9717864990234375, -0.9459609985351562, -0.920135498046875, -0.8943099975585938, -0.8684844970703125, -0.8426589965820312, -0.81683349609375, -0.7910079956054688, -0.7651824951171875, -0.7393569946289062, -0.713531494140625, -0.6877059936523438, -0.6618804931640625, -0.6360549926757812, -0.6102294921875, -0.5844039916992188, -0.5585784912109375, -0.5327529907226562, -0.506927490234375, -0.48110198974609375, -0.4552764892578125, -0.42945098876953125, -0.40362548828125, -0.37779998779296875, -0.3519744873046875, -0.32614898681640625, -0.300323486328125, -0.27449798583984375, -0.2486724853515625, -0.22284698486328125, -0.197021484375, -0.17119598388671875, -0.1453704833984375, -0.11954498291015625, -0.093719482421875, -0.06789398193359375, -0.0420684814453125, -0.01624298095703125, 0.00958251953125, 0.03540802001953125, 0.0612335205078125, 0.08705902099609375, 0.112884521484375, 0.13871002197265625, 0.1645355224609375, 0.19036102294921875, 0.2161865234375, 0.24201202392578125, 0.2678375244140625, 0.29366302490234375, 0.319488525390625, 0.34531402587890625, 0.3711395263671875, 0.39696502685546875, 0.42279052734375, 0.44861602783203125, 0.4744415283203125, 0.5002670288085938, 0.526092529296875, 0.5519180297851562, 0.5777435302734375, 0.6035690307617188, 0.62939453125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 9.0, 2.0, 8.0, 14.0, 16.0, 20.0, 22.0, 27.0, 41.0, 63.0, 67.0, 65.0, 83.0, 79.0, 66.0, 99.0, 73.0, 66.0, 46.0, 33.0, 27.0, 26.0, 13.0, 16.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.698271751403809, -10.396517753601074, -10.094762802124023, -9.793008804321289, -9.491254806518555, -9.189499855041504, -8.88774585723877, -8.585990905761719, -8.284236907958984, -7.982482433319092, -7.680727958679199, -7.378973960876465, -7.077219486236572, -6.77546501159668, -6.473711013793945, -6.171956539154053, -5.87020206451416, -5.568447589874268, -5.266693115234375, -4.964939117431641, -4.663184642791748, -4.3614301681518555, -4.059676170349121, -3.7579216957092285, -3.456167221069336, -3.1544127464294434, -2.85265851020813, -2.5509042739868164, -2.249149799346924, -1.9473954439163208, -1.6456410884857178, -1.3438868522644043, -1.0421333312988281, -0.7403789758682251, -0.43862462043762207, -0.13687026500701904, 0.16488409042358398, 0.466638445854187, 0.76839280128479, 1.0701470375061035, 1.371901512145996, 1.6736558675765991, 1.9754102230072021, 2.2771644592285156, 2.578918933868408, 2.880673408508301, 3.1824276447296143, 3.4841818809509277, 3.7859363555908203, 4.087690830230713, 4.3894453048706055, 4.69119930267334, 4.992953777313232, 5.294708251953125, 5.596462249755859, 5.898216724395752, 6.1999711990356445, 6.501725673675537, 6.80348014831543, 7.105234146118164, 7.406988620758057, 7.708743095397949, 8.010497093200684, 8.312252044677734, 8.614006042480469]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 13.0, 8.0, 11.0, 12.0, 12.0, 18.0, 25.0, 22.0, 14.0, 22.0, 17.0, 25.0, 24.0, 41.0, 42.0, 52.0, 53.0, 43.0, 49.0, 43.0, 39.0, 32.0, 34.0, 42.0, 35.0, 47.0, 29.0, 24.0, 36.0, 30.0, 22.0, 11.0, 7.0, 15.0, 12.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4548962116241455, -3.342690944671631, -3.2304859161376953, -3.1182806491851807, -3.006075620651245, -2.8938703536987305, -2.781665325164795, -2.6694600582122803, -2.5572547912597656, -2.445049524307251, -2.3328444957733154, -2.220639228820801, -2.1084342002868652, -1.9962289333343506, -1.8840237855911255, -1.7718186378479004, -1.6596136093139648, -1.5474084615707397, -1.4352033138275146, -1.322998046875, -1.2107930183410645, -1.0985877513885498, -0.9863826036453247, -0.8741774559020996, -0.7619723081588745, -0.6497671604156494, -0.5375620126724243, -0.42535680532455444, -0.31315165758132935, -0.20094650983810425, -0.08874130249023438, 0.023463845252990723, 0.13566923141479492, 0.2478743940591812, 0.3600795567035675, 0.472284734249115, 0.5844898819923401, 0.6966950297355652, 0.8089002370834351, 0.9211053848266602, 1.0333105325698853, 1.1455156803131104, 1.2577208280563354, 1.3699259757995605, 1.4821312427520752, 1.5943362712860107, 1.7065415382385254, 1.8187466859817505, 1.9309518337249756, 2.0431571006774902, 2.155362129211426, 2.2675673961639404, 2.379772424697876, 2.4919776916503906, 2.604182720184326, 2.716387987136841, 2.8285932540893555, 2.94079852104187, 3.0530035495758057, 3.1652088165283203, 3.277413845062256, 3.3896191120147705, 3.501824378967285, 3.6140294075012207, 3.7262344360351562]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 14.0, 17.0, 21.0, 45.0, 66.0, 96.0, 159.0, 251.0, 421.0, 680.0, 1234.0, 2283.0, 4486.0, 9188.0, 20588.0, 52667.0, 154775.0, 545847.0, 1652830.0, 1243638.0, 337328.0, 100276.0, 36429.0, 15417.0, 7322.0, 3640.0, 1941.0, 1063.0, 621.0, 380.0, 196.0, 144.0, 66.0, 57.0, 26.0, 19.0, 12.0, 13.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.984375, -10.6689453125, -10.353515625, -10.0380859375, -9.72265625, -9.4072265625, -9.091796875, -8.7763671875, -8.4609375, -8.1455078125, -7.830078125, -7.5146484375, -7.19921875, -6.8837890625, -6.568359375, -6.2529296875, -5.9375, -5.6220703125, -5.306640625, -4.9912109375, -4.67578125, -4.3603515625, -4.044921875, -3.7294921875, -3.4140625, -3.0986328125, -2.783203125, -2.4677734375, -2.15234375, -1.8369140625, -1.521484375, -1.2060546875, -0.890625, -0.5751953125, -0.259765625, 0.0556640625, 0.37109375, 0.6865234375, 1.001953125, 1.3173828125, 1.6328125, 1.9482421875, 2.263671875, 2.5791015625, 2.89453125, 3.2099609375, 3.525390625, 3.8408203125, 4.15625, 4.4716796875, 4.787109375, 5.1025390625, 5.41796875, 5.7333984375, 6.048828125, 6.3642578125, 6.6796875, 6.9951171875, 7.310546875, 7.6259765625, 7.94140625, 8.2568359375, 8.572265625, 8.8876953125, 9.203125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 9.0, 16.0, 12.0, 14.0, 12.0, 19.0, 19.0, 20.0, 21.0, 21.0, 34.0, 37.0, 41.0, 38.0, 47.0, 35.0, 52.0, 34.0, 56.0, 51.0, 38.0, 36.0, 49.0, 25.0, 30.0, 30.0, 32.0, 26.0, 25.0, 12.0, 17.0, 6.0, 5.0, 14.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.91015625, -2.81756591796875, -2.7249755859375, -2.63238525390625, -2.539794921875, -2.44720458984375, -2.3546142578125, -2.26202392578125, -2.16943359375, -2.07684326171875, -1.9842529296875, -1.89166259765625, -1.799072265625, -1.70648193359375, -1.6138916015625, -1.52130126953125, -1.4287109375, -1.33612060546875, -1.2435302734375, -1.15093994140625, -1.058349609375, -0.96575927734375, -0.8731689453125, -0.78057861328125, -0.68798828125, -0.59539794921875, -0.5028076171875, -0.41021728515625, -0.317626953125, -0.22503662109375, -0.1324462890625, -0.03985595703125, 0.052734375, 0.14532470703125, 0.2379150390625, 0.33050537109375, 0.423095703125, 0.51568603515625, 0.6082763671875, 0.70086669921875, 0.79345703125, 0.88604736328125, 0.9786376953125, 1.07122802734375, 1.163818359375, 1.25640869140625, 1.3489990234375, 1.44158935546875, 1.5341796875, 1.62677001953125, 1.7193603515625, 1.81195068359375, 1.904541015625, 1.99713134765625, 2.0897216796875, 2.18231201171875, 2.27490234375, 2.36749267578125, 2.4600830078125, 2.55267333984375, 2.645263671875, 2.73785400390625, 2.8304443359375, 2.92303466796875, 3.015625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 10.0, 14.0, 19.0, 40.0, 43.0, 61.0, 111.0, 130.0, 258.0, 345.0, 549.0, 772.0, 1204.0, 1840.0, 3016.0, 4834.0, 8046.0, 13798.0, 24314.0, 44747.0, 84682.0, 167328.0, 347530.0, 720056.0, 1121666.0, 830137.0, 408773.0, 194800.0, 97412.0, 50884.0, 28193.0, 15469.0, 8964.0, 5363.0, 3212.0, 2073.0, 1254.0, 829.0, 511.0, 364.0, 212.0, 146.0, 91.0, 65.0, 48.0, 22.0, 18.0, 10.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-6.9296875, -6.7171630859375, -6.504638671875, -6.2921142578125, -6.07958984375, -5.8670654296875, -5.654541015625, -5.4420166015625, -5.2294921875, -5.0169677734375, -4.804443359375, -4.5919189453125, -4.37939453125, -4.1668701171875, -3.954345703125, -3.7418212890625, -3.529296875, -3.3167724609375, -3.104248046875, -2.8917236328125, -2.67919921875, -2.4666748046875, -2.254150390625, -2.0416259765625, -1.8291015625, -1.6165771484375, -1.404052734375, -1.1915283203125, -0.97900390625, -0.7664794921875, -0.553955078125, -0.3414306640625, -0.12890625, 0.0836181640625, 0.296142578125, 0.5086669921875, 0.72119140625, 0.9337158203125, 1.146240234375, 1.3587646484375, 1.5712890625, 1.7838134765625, 1.996337890625, 2.2088623046875, 2.42138671875, 2.6339111328125, 2.846435546875, 3.0589599609375, 3.271484375, 3.4840087890625, 3.696533203125, 3.9090576171875, 4.12158203125, 4.3341064453125, 4.546630859375, 4.7591552734375, 4.9716796875, 5.1842041015625, 5.396728515625, 5.6092529296875, 5.82177734375, 6.0343017578125, 6.246826171875, 6.4593505859375, 6.671875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 7.0, 16.0, 12.0, 17.0, 24.0, 39.0, 48.0, 57.0, 77.0, 100.0, 117.0, 151.0, 181.0, 257.0, 258.0, 297.0, 312.0, 328.0, 321.0, 295.0, 225.0, 213.0, 164.0, 129.0, 71.0, 73.0, 63.0, 44.0, 38.0, 22.0, 23.0, 11.0, 10.0, 14.0, 9.0, 6.0, 1.0, 7.0, 2.0, 10.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.240234375, -2.17242431640625, -2.1046142578125, -2.03680419921875, -1.968994140625, -1.90118408203125, -1.8333740234375, -1.76556396484375, -1.69775390625, -1.62994384765625, -1.5621337890625, -1.49432373046875, -1.426513671875, -1.35870361328125, -1.2908935546875, -1.22308349609375, -1.1552734375, -1.08746337890625, -1.0196533203125, -0.95184326171875, -0.884033203125, -0.81622314453125, -0.7484130859375, -0.68060302734375, -0.61279296875, -0.54498291015625, -0.4771728515625, -0.40936279296875, -0.341552734375, -0.27374267578125, -0.2059326171875, -0.13812255859375, -0.0703125, -0.00250244140625, 0.0653076171875, 0.13311767578125, 0.200927734375, 0.26873779296875, 0.3365478515625, 0.40435791015625, 0.47216796875, 0.53997802734375, 0.6077880859375, 0.67559814453125, 0.743408203125, 0.81121826171875, 0.8790283203125, 0.94683837890625, 1.0146484375, 1.08245849609375, 1.1502685546875, 1.21807861328125, 1.285888671875, 1.35369873046875, 1.4215087890625, 1.48931884765625, 1.55712890625, 1.62493896484375, 1.6927490234375, 1.76055908203125, 1.828369140625, 1.89617919921875, 1.9639892578125, 2.03179931640625, 2.099609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 2.0, 4.0, 9.0, 7.0, 10.0, 18.0, 17.0, 33.0, 32.0, 37.0, 45.0, 48.0, 70.0, 75.0, 64.0, 86.0, 69.0, 58.0, 65.0, 58.0, 40.0, 19.0, 33.0, 21.0, 8.0, 16.0, 9.0, 11.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.09686279296875, -9.814611434936523, -9.532360076904297, -9.25010871887207, -8.967857360839844, -8.685606002807617, -8.40335464477539, -8.121103286743164, -7.838851451873779, -7.556600093841553, -7.274348735809326, -6.9920973777771, -6.709845542907715, -6.427594184875488, -6.145342826843262, -5.863091468811035, -5.580840110778809, -5.298588752746582, -5.0163373947143555, -4.734086036682129, -4.451834678649902, -4.169583320617676, -3.887331485748291, -3.6050801277160645, -3.322828769683838, -3.0405774116516113, -2.7583260536193848, -2.476074457168579, -2.1938230991363525, -1.911571741104126, -1.6293202638626099, -1.3470687866210938, -1.0648174285888672, -0.7825660109519958, -0.5003145933151245, -0.21806317567825317, 0.06418824195861816, 0.3464395999908447, 0.6286910772323608, 0.910942554473877, 1.1931939125061035, 1.47544527053833, 1.7576967477798462, 2.0399482250213623, 2.322199583053589, 2.6044509410858154, 2.886702537536621, 3.1689538955688477, 3.451205253601074, 3.733456611633301, 4.015707969665527, 4.297959327697754, 4.5802106857299805, 4.862462043762207, 5.144713878631592, 5.426965236663818, 5.709216594696045, 5.9914679527282715, 6.273719310760498, 6.555970668792725, 6.838222503662109, 7.120473861694336, 7.4027252197265625, 7.684976577758789, 7.967227935791016]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 9.0, 3.0, 6.0, 15.0, 11.0, 17.0, 12.0, 19.0, 19.0, 29.0, 25.0, 30.0, 33.0, 31.0, 33.0, 39.0, 49.0, 39.0, 47.0, 37.0, 25.0, 27.0, 28.0, 30.0, 36.0, 34.0, 27.0, 33.0, 31.0, 22.0, 21.0, 25.0, 25.0, 17.0, 11.0, 13.0, 11.0, 9.0, 10.0, 9.0, 8.0, 1.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.54913330078125, -3.442233085632324, -3.3353331089019775, -3.2284328937530518, -3.121532678604126, -3.0146327018737793, -2.9077324867248535, -2.8008322715759277, -2.693932056427002, -2.587031841278076, -2.4801318645477295, -2.3732316493988037, -2.266331434249878, -2.1594314575195312, -2.0525312423706055, -1.9456310272216797, -1.838731050491333, -1.7318309545516968, -1.624930739402771, -1.5180306434631348, -1.411130428314209, -1.3042303323745728, -1.1973302364349365, -1.0904300212860107, -0.9835299253463745, -0.8766297698020935, -0.7697296142578125, -0.6628295183181763, -0.5559293627738953, -0.44902920722961426, -0.342129111289978, -0.23522895574569702, -0.12832880020141602, -0.021428659558296204, 0.08547148108482361, 0.19237160682678223, 0.29927176237106323, 0.40617191791534424, 0.5130720138549805, 0.6199721693992615, 0.7268723249435425, 0.8337724804878235, 0.9406726360321045, 1.0475727319717407, 1.154472827911377, 1.2613730430603027, 1.368273138999939, 1.4751732349395752, 1.582073450088501, 1.6889735460281372, 1.795873761177063, 1.9027738571166992, 2.009674072265625, 2.116574287414551, 2.2234742641448975, 2.3303744792938232, 2.43727445602417, 2.5441746711730957, 2.6510746479034424, 2.757974863052368, 2.864875078201294, 2.9717750549316406, 3.0786752700805664, 3.185575485229492, 3.292475700378418]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 9.0, 14.0, 13.0, 33.0, 43.0, 50.0, 78.0, 118.0, 167.0, 257.0, 395.0, 595.0, 884.0, 1445.0, 2536.0, 4963.0, 11020.0, 29728.0, 91461.0, 264497.0, 370764.0, 176477.0, 56954.0, 19289.0, 7579.0, 3687.0, 1998.0, 1224.0, 771.0, 511.0, 331.0, 230.0, 141.0, 95.0, 77.0, 35.0, 23.0, 25.0, 14.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.753662109375, -5.55029296875, -5.346923828125, -5.1435546875, -4.940185546875, -4.73681640625, -4.533447265625, -4.330078125, -4.126708984375, -3.92333984375, -3.719970703125, -3.5166015625, -3.313232421875, -3.10986328125, -2.906494140625, -2.703125, -2.499755859375, -2.29638671875, -2.093017578125, -1.8896484375, -1.686279296875, -1.48291015625, -1.279541015625, -1.076171875, -0.872802734375, -0.66943359375, -0.466064453125, -0.2626953125, -0.059326171875, 0.14404296875, 0.347412109375, 0.55078125, 0.754150390625, 0.95751953125, 1.160888671875, 1.3642578125, 1.567626953125, 1.77099609375, 1.974365234375, 2.177734375, 2.381103515625, 2.58447265625, 2.787841796875, 2.9912109375, 3.194580078125, 3.39794921875, 3.601318359375, 3.8046875, 4.008056640625, 4.21142578125, 4.414794921875, 4.6181640625, 4.821533203125, 5.02490234375, 5.228271484375, 5.431640625, 5.635009765625, 5.83837890625, 6.041748046875, 6.2451171875, 6.448486328125, 6.65185546875, 6.855224609375, 7.05859375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 4.0, 8.0, 9.0, 11.0, 8.0, 14.0, 9.0, 15.0, 23.0, 23.0, 23.0, 20.0, 25.0, 31.0, 31.0, 37.0, 36.0, 37.0, 40.0, 53.0, 33.0, 49.0, 40.0, 23.0, 44.0, 30.0, 35.0, 31.0, 24.0, 29.0, 39.0, 26.0, 20.0, 8.0, 16.0, 10.0, 9.0, 14.0, 12.0, 9.0, 6.0, 9.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.94921875, -3.8251953125, -3.701171875, -3.5771484375, -3.453125, -3.3291015625, -3.205078125, -3.0810546875, -2.95703125, -2.8330078125, -2.708984375, -2.5849609375, -2.4609375, -2.3369140625, -2.212890625, -2.0888671875, -1.96484375, -1.8408203125, -1.716796875, -1.5927734375, -1.46875, -1.3447265625, -1.220703125, -1.0966796875, -0.97265625, -0.8486328125, -0.724609375, -0.6005859375, -0.4765625, -0.3525390625, -0.228515625, -0.1044921875, 0.01953125, 0.1435546875, 0.267578125, 0.3916015625, 0.515625, 0.6396484375, 0.763671875, 0.8876953125, 1.01171875, 1.1357421875, 1.259765625, 1.3837890625, 1.5078125, 1.6318359375, 1.755859375, 1.8798828125, 2.00390625, 2.1279296875, 2.251953125, 2.3759765625, 2.5, 2.6240234375, 2.748046875, 2.8720703125, 2.99609375, 3.1201171875, 3.244140625, 3.3681640625, 3.4921875, 3.6162109375, 3.740234375, 3.8642578125, 3.98828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 6.0, 21.0, 23.0, 36.0, 44.0, 45.0, 73.0, 82.0, 131.0, 188.0, 237.0, 374.0, 508.0, 849.0, 1552.0, 3279.0, 8959.0, 38398.0, 252772.0, 582163.0, 125710.0, 21327.0, 5786.0, 2380.0, 1265.0, 744.0, 423.0, 312.0, 228.0, 160.0, 115.0, 87.0, 64.0, 45.0, 35.0, 40.0, 21.0, 9.0, 15.0, 9.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.34375, -10.9696044921875, -10.595458984375, -10.2213134765625, -9.84716796875, -9.4730224609375, -9.098876953125, -8.7247314453125, -8.3505859375, -7.9764404296875, -7.602294921875, -7.2281494140625, -6.85400390625, -6.4798583984375, -6.105712890625, -5.7315673828125, -5.357421875, -4.9832763671875, -4.609130859375, -4.2349853515625, -3.86083984375, -3.4866943359375, -3.112548828125, -2.7384033203125, -2.3642578125, -1.9901123046875, -1.615966796875, -1.2418212890625, -0.86767578125, -0.4935302734375, -0.119384765625, 0.2547607421875, 0.62890625, 1.0030517578125, 1.377197265625, 1.7513427734375, 2.12548828125, 2.4996337890625, 2.873779296875, 3.2479248046875, 3.6220703125, 3.9962158203125, 4.370361328125, 4.7445068359375, 5.11865234375, 5.4927978515625, 5.866943359375, 6.2410888671875, 6.615234375, 6.9893798828125, 7.363525390625, 7.7376708984375, 8.11181640625, 8.4859619140625, 8.860107421875, 9.2342529296875, 9.6083984375, 9.9825439453125, 10.356689453125, 10.7308349609375, 11.10498046875, 11.4791259765625, 11.853271484375, 12.2274169921875, 12.6015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 1.0, 8.0, 8.0, 7.0, 5.0, 12.0, 7.0, 13.0, 14.0, 17.0, 10.0, 21.0, 17.0, 22.0, 20.0, 37.0, 36.0, 26.0, 35.0, 37.0, 40.0, 32.0, 39.0, 38.0, 40.0, 42.0, 40.0, 38.0, 32.0, 37.0, 36.0, 29.0, 16.0, 22.0, 20.0, 22.0, 19.0, 20.0, 12.0, 7.0, 8.0, 12.0, 8.0, 8.0, 7.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.169921875, -2.0987548828125, -2.027587890625, -1.9564208984375, -1.88525390625, -1.8140869140625, -1.742919921875, -1.6717529296875, -1.6005859375, -1.5294189453125, -1.458251953125, -1.3870849609375, -1.31591796875, -1.2447509765625, -1.173583984375, -1.1024169921875, -1.03125, -0.9600830078125, -0.888916015625, -0.8177490234375, -0.74658203125, -0.6754150390625, -0.604248046875, -0.5330810546875, -0.4619140625, -0.3907470703125, -0.319580078125, -0.2484130859375, -0.17724609375, -0.1060791015625, -0.034912109375, 0.0362548828125, 0.107421875, 0.1785888671875, 0.249755859375, 0.3209228515625, 0.39208984375, 0.4632568359375, 0.534423828125, 0.6055908203125, 0.6767578125, 0.7479248046875, 0.819091796875, 0.8902587890625, 0.96142578125, 1.0325927734375, 1.103759765625, 1.1749267578125, 1.24609375, 1.3172607421875, 1.388427734375, 1.4595947265625, 1.53076171875, 1.6019287109375, 1.673095703125, 1.7442626953125, 1.8154296875, 1.8865966796875, 1.957763671875, 2.0289306640625, 2.10009765625, 2.1712646484375, 2.242431640625, 2.3135986328125, 2.384765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 14.0, 31.0, 11.0, 36.0, 46.0, 79.0, 98.0, 164.0, 243.0, 369.0, 543.0, 823.0, 1340.0, 2093.0, 3631.0, 7646.0, 28531.0, 283712.0, 626540.0, 68492.0, 11970.0, 4835.0, 2669.0, 1560.0, 1049.0, 680.0, 414.0, 284.0, 181.0, 125.0, 91.0, 75.0, 48.0, 37.0, 22.0, 24.0, 12.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.0546875, -6.82867431640625, -6.6026611328125, -6.37664794921875, -6.150634765625, -5.92462158203125, -5.6986083984375, -5.47259521484375, -5.24658203125, -5.02056884765625, -4.7945556640625, -4.56854248046875, -4.342529296875, -4.11651611328125, -3.8905029296875, -3.66448974609375, -3.4384765625, -3.21246337890625, -2.9864501953125, -2.76043701171875, -2.534423828125, -2.30841064453125, -2.0823974609375, -1.85638427734375, -1.63037109375, -1.40435791015625, -1.1783447265625, -0.95233154296875, -0.726318359375, -0.50030517578125, -0.2742919921875, -0.04827880859375, 0.177734375, 0.40374755859375, 0.6297607421875, 0.85577392578125, 1.081787109375, 1.30780029296875, 1.5338134765625, 1.75982666015625, 1.98583984375, 2.21185302734375, 2.4378662109375, 2.66387939453125, 2.889892578125, 3.11590576171875, 3.3419189453125, 3.56793212890625, 3.7939453125, 4.01995849609375, 4.2459716796875, 4.47198486328125, 4.697998046875, 4.92401123046875, 5.1500244140625, 5.37603759765625, 5.60205078125, 5.82806396484375, 6.0540771484375, 6.28009033203125, 6.506103515625, 6.73211669921875, 6.9581298828125, 7.18414306640625, 7.41015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 15.0, 18.0, 28.0, 47.0, 87.0, 127.0, 203.0, 180.0, 108.0, 77.0, 49.0, 16.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0002760887145996094, -0.0002685803920030594, -0.0002610720694065094, -0.0002535637468099594, -0.0002460554242134094, -0.00023854710161685944, -0.00023103877902030945, -0.00022353045642375946, -0.00021602213382720947, -0.00020851381123065948, -0.0002010054886341095, -0.0001934971660375595, -0.00018598884344100952, -0.00017848052084445953, -0.00017097219824790955, -0.00016346387565135956, -0.00015595555305480957, -0.00014844723045825958, -0.0001409389078617096, -0.0001334305852651596, -0.00012592226266860962, -0.00011841394007205963, -0.00011090561747550964, -0.00010339729487895966, -9.588897228240967e-05, -8.838064968585968e-05, -8.087232708930969e-05, -7.33640044927597e-05, -6.585568189620972e-05, -5.834735929965973e-05, -5.083903670310974e-05, -4.3330714106559753e-05, -3.5822391510009766e-05, -2.8314068913459778e-05, -2.080574631690979e-05, -1.3297423720359802e-05, -5.7891011238098145e-06, 1.7192214727401733e-06, 9.227544069290161e-06, 1.673586666584015e-05, 2.4244189262390137e-05, 3.1752511858940125e-05, 3.926083445549011e-05, 4.67691570520401e-05, 5.427747964859009e-05, 6.178580224514008e-05, 6.929412484169006e-05, 7.680244743824005e-05, 8.431077003479004e-05, 9.181909263134003e-05, 9.932741522789001e-05, 0.00010683573782444, 0.00011434406042098999, 0.00012185238301753998, 0.00012936070561408997, 0.00013686902821063995, 0.00014437735080718994, 0.00015188567340373993, 0.00015939399600028992, 0.0001669023185968399, 0.0001744106411933899, 0.00018191896378993988, 0.00018942728638648987, 0.00019693560898303986, 0.00020444393157958984]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 10.0, 10.0, 20.0, 20.0, 32.0, 44.0, 62.0, 87.0, 153.0, 154.0, 221.0, 371.0, 477.0, 675.0, 905.0, 1238.0, 1815.0, 2633.0, 3704.0, 6394.0, 14068.0, 46577.0, 197767.0, 460764.0, 222680.0, 52594.0, 15245.0, 6743.0, 3942.0, 2602.0, 1857.0, 1347.0, 959.0, 637.0, 481.0, 335.0, 286.0, 177.0, 136.0, 96.0, 78.0, 55.0, 33.0, 18.0, 13.0, 11.0, 5.0, 5.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-4.03515625, -3.911163330078125, -3.78717041015625, -3.663177490234375, -3.5391845703125, -3.415191650390625, -3.29119873046875, -3.167205810546875, -3.043212890625, -2.919219970703125, -2.79522705078125, -2.671234130859375, -2.5472412109375, -2.423248291015625, -2.29925537109375, -2.175262451171875, -2.05126953125, -1.927276611328125, -1.80328369140625, -1.679290771484375, -1.5552978515625, -1.431304931640625, -1.30731201171875, -1.183319091796875, -1.059326171875, -0.935333251953125, -0.81134033203125, -0.687347412109375, -0.5633544921875, -0.439361572265625, -0.31536865234375, -0.191375732421875, -0.0673828125, 0.056610107421875, 0.18060302734375, 0.304595947265625, 0.4285888671875, 0.552581787109375, 0.67657470703125, 0.800567626953125, 0.924560546875, 1.048553466796875, 1.17254638671875, 1.296539306640625, 1.4205322265625, 1.544525146484375, 1.66851806640625, 1.792510986328125, 1.91650390625, 2.040496826171875, 2.16448974609375, 2.288482666015625, 2.4124755859375, 2.536468505859375, 2.66046142578125, 2.784454345703125, 2.908447265625, 3.032440185546875, 3.15643310546875, 3.280426025390625, 3.4044189453125, 3.528411865234375, 3.65240478515625, 3.776397705078125, 3.900390625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 2.0, 14.0, 22.0, 74.0, 160.0, 227.0, 215.0, 147.0, 72.0, 23.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.76055908203125, -1.7017822265625, -1.64300537109375, -1.584228515625, -1.52545166015625, -1.4666748046875, -1.40789794921875, -1.34912109375, -1.29034423828125, -1.2315673828125, -1.17279052734375, -1.114013671875, -1.05523681640625, -0.9964599609375, -0.93768310546875, -0.87890625, -0.82012939453125, -0.7613525390625, -0.70257568359375, -0.643798828125, -0.58502197265625, -0.5262451171875, -0.46746826171875, -0.40869140625, -0.34991455078125, -0.2911376953125, -0.23236083984375, -0.173583984375, -0.11480712890625, -0.0560302734375, 0.00274658203125, 0.0615234375, 0.12030029296875, 0.1790771484375, 0.23785400390625, 0.296630859375, 0.35540771484375, 0.4141845703125, 0.47296142578125, 0.53173828125, 0.59051513671875, 0.6492919921875, 0.70806884765625, 0.766845703125, 0.82562255859375, 0.8843994140625, 0.94317626953125, 1.001953125, 1.06072998046875, 1.1195068359375, 1.17828369140625, 1.237060546875, 1.29583740234375, 1.3546142578125, 1.41339111328125, 1.47216796875, 1.53094482421875, 1.5897216796875, 1.64849853515625, 1.707275390625, 1.76605224609375, 1.8248291015625, 1.88360595703125, 1.9423828125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 5.0, 8.0, 1.0, 2.0, 10.0, 3.0, 12.0, 10.0, 13.0, 18.0, 28.0, 42.0, 35.0, 49.0, 46.0, 63.0, 75.0, 69.0, 84.0, 64.0, 60.0, 58.0, 57.0, 43.0, 24.0, 29.0, 22.0, 18.0, 15.0, 11.0, 7.0, 10.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.02247428894043, -9.74274730682373, -9.463020324707031, -9.183293342590332, -8.903566360473633, -8.623838424682617, -8.344111442565918, -8.064384460449219, -7.7846574783325195, -7.50493049621582, -7.225203514099121, -6.945476055145264, -6.6657490730285645, -6.386022090911865, -6.106294631958008, -5.826567649841309, -5.546840667724609, -5.26711368560791, -4.987386703491211, -4.7076592445373535, -4.427932262420654, -4.148205280303955, -3.8684780597686768, -3.5887508392333984, -3.309023857116699, -3.029296875, -2.7495696544647217, -2.4698424339294434, -2.190115451812744, -1.9103883504867554, -1.6306612491607666, -1.3509341478347778, -1.071207046508789, -0.7914799451828003, -0.5117528438568115, -0.23202574253082275, 0.047701358795166016, 0.3274284601211548, 0.6071555614471436, 0.8868826627731323, 1.166609764099121, 1.4463368654251099, 1.7260639667510986, 2.005791187286377, 2.285518169403076, 2.5652451515197754, 2.8449723720550537, 3.124699592590332, 3.4044265747070312, 3.6841535568237305, 3.963880777359009, 4.243607997894287, 4.523334980010986, 4.8030619621276855, 5.082789421081543, 5.362516403198242, 5.642243385314941, 5.921970367431641, 6.20169734954834, 6.481424808502197, 6.7611517906188965, 7.040878772735596, 7.320606231689453, 7.600333213806152, 7.880060195922852]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 11.0, 7.0, 2.0, 8.0, 7.0, 9.0, 9.0, 12.0, 11.0, 17.0, 16.0, 22.0, 27.0, 28.0, 22.0, 44.0, 27.0, 35.0, 39.0, 34.0, 40.0, 47.0, 37.0, 35.0, 31.0, 28.0, 32.0, 34.0, 30.0, 35.0, 26.0, 27.0, 30.0, 29.0, 22.0, 19.0, 18.0, 10.0, 13.0, 17.0, 11.0, 8.0, 8.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5768890380859375, -3.4689245223999023, -3.360960006713867, -3.252995491027832, -3.145030975341797, -3.0370664596557617, -2.9291017055511475, -2.8211371898651123, -2.713172674179077, -2.605208158493042, -2.497243642807007, -2.3892791271209717, -2.2813143730163574, -2.1733498573303223, -2.065385341644287, -1.957420825958252, -1.8494563102722168, -1.7414917945861816, -1.6335272789001465, -1.5255626440048218, -1.4175981283187866, -1.3096336126327515, -1.2016689777374268, -1.0937044620513916, -0.9857399463653564, -0.8777754306793213, -0.7698108553886414, -0.6618462800979614, -0.5538817644119263, -0.4459172487258911, -0.3379526734352112, -0.22998809814453125, -0.12202334403991699, -0.014058798551559448, 0.0939057469367981, 0.20187029242515564, 0.3098348379135132, 0.41779935359954834, 0.5257639288902283, 0.6337285041809082, 0.7416930198669434, 0.8496575355529785, 0.9576221108436584, 1.0655866861343384, 1.1735512018203735, 1.2815157175064087, 1.3894803524017334, 1.4974448680877686, 1.6054093837738037, 1.7133738994598389, 1.821338415145874, 1.9293030500411987, 2.0372676849365234, 2.1452322006225586, 2.2531967163085938, 2.361161231994629, 2.469125747680664, 2.577090263366699, 2.6850547790527344, 2.7930192947387695, 2.9009838104248047, 3.00894832611084, 3.116913080215454, 3.2248775959014893, 3.3328421115875244]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 7.0, 5.0, 11.0, 17.0, 22.0, 26.0, 39.0, 71.0, 104.0, 141.0, 231.0, 390.0, 579.0, 889.0, 1374.0, 2266.0, 3772.0, 6196.0, 10300.0, 17323.0, 29887.0, 51315.0, 86017.0, 131655.0, 172841.0, 175128.0, 137086.0, 89733.0, 53970.0, 31486.0, 18131.0, 10696.0, 6308.0, 3920.0, 2382.0, 1476.0, 1002.0, 574.0, 363.0, 251.0, 167.0, 135.0, 81.0, 62.0, 43.0, 25.0, 26.0, 13.0, 13.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.44140625, -5.26031494140625, -5.0792236328125, -4.89813232421875, -4.717041015625, -4.53594970703125, -4.3548583984375, -4.17376708984375, -3.99267578125, -3.81158447265625, -3.6304931640625, -3.44940185546875, -3.268310546875, -3.08721923828125, -2.9061279296875, -2.72503662109375, -2.5439453125, -2.36285400390625, -2.1817626953125, -2.00067138671875, -1.819580078125, -1.63848876953125, -1.4573974609375, -1.27630615234375, -1.09521484375, -0.91412353515625, -0.7330322265625, -0.55194091796875, -0.370849609375, -0.18975830078125, -0.0086669921875, 0.17242431640625, 0.353515625, 0.53460693359375, 0.7156982421875, 0.89678955078125, 1.077880859375, 1.25897216796875, 1.4400634765625, 1.62115478515625, 1.80224609375, 1.98333740234375, 2.1644287109375, 2.34552001953125, 2.526611328125, 2.70770263671875, 2.8887939453125, 3.06988525390625, 3.2509765625, 3.43206787109375, 3.6131591796875, 3.79425048828125, 3.975341796875, 4.15643310546875, 4.3375244140625, 4.51861572265625, 4.69970703125, 4.88079833984375, 5.0618896484375, 5.24298095703125, 5.424072265625, 5.60516357421875, 5.7862548828125, 5.96734619140625, 6.1484375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 17.0, 15.0, 12.0, 11.0, 14.0, 21.0, 14.0, 21.0, 30.0, 35.0, 36.0, 29.0, 41.0, 34.0, 34.0, 38.0, 36.0, 59.0, 36.0, 40.0, 42.0, 38.0, 41.0, 30.0, 30.0, 24.0, 26.0, 27.0, 11.0, 14.0, 19.0, 19.0, 15.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 7.0, 2.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.1484375, -4.02545166015625, -3.9024658203125, -3.77947998046875, -3.656494140625, -3.53350830078125, -3.4105224609375, -3.28753662109375, -3.16455078125, -3.04156494140625, -2.9185791015625, -2.79559326171875, -2.672607421875, -2.54962158203125, -2.4266357421875, -2.30364990234375, -2.1806640625, -2.05767822265625, -1.9346923828125, -1.81170654296875, -1.688720703125, -1.56573486328125, -1.4427490234375, -1.31976318359375, -1.19677734375, -1.07379150390625, -0.9508056640625, -0.82781982421875, -0.704833984375, -0.58184814453125, -0.4588623046875, -0.33587646484375, -0.212890625, -0.08990478515625, 0.0330810546875, 0.15606689453125, 0.279052734375, 0.40203857421875, 0.5250244140625, 0.64801025390625, 0.77099609375, 0.89398193359375, 1.0169677734375, 1.13995361328125, 1.262939453125, 1.38592529296875, 1.5089111328125, 1.63189697265625, 1.7548828125, 1.87786865234375, 2.0008544921875, 2.12384033203125, 2.246826171875, 2.36981201171875, 2.4927978515625, 2.61578369140625, 2.73876953125, 2.86175537109375, 2.9847412109375, 3.10772705078125, 3.230712890625, 3.35369873046875, 3.4766845703125, 3.59967041015625, 3.72265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 24.0, 24.0, 46.0, 72.0, 113.0, 137.0, 207.0, 355.0, 579.0, 865.0, 1432.0, 2137.0, 3528.0, 5557.0, 8525.0, 13504.0, 21222.0, 33384.0, 52190.0, 77359.0, 107766.0, 135119.0, 145221.0, 130850.0, 103096.0, 72093.0, 47768.0, 31245.0, 19829.0, 12573.0, 7812.0, 4996.0, 3276.0, 2033.0, 1281.0, 798.0, 548.0, 325.0, 222.0, 148.0, 86.0, 74.0, 49.0, 28.0, 17.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.15234375, -5.00262451171875, -4.8529052734375, -4.70318603515625, -4.553466796875, -4.40374755859375, -4.2540283203125, -4.10430908203125, -3.95458984375, -3.80487060546875, -3.6551513671875, -3.50543212890625, -3.355712890625, -3.20599365234375, -3.0562744140625, -2.90655517578125, -2.7568359375, -2.60711669921875, -2.4573974609375, -2.30767822265625, -2.157958984375, -2.00823974609375, -1.8585205078125, -1.70880126953125, -1.55908203125, -1.40936279296875, -1.2596435546875, -1.10992431640625, -0.960205078125, -0.81048583984375, -0.6607666015625, -0.51104736328125, -0.361328125, -0.21160888671875, -0.0618896484375, 0.08782958984375, 0.237548828125, 0.38726806640625, 0.5369873046875, 0.68670654296875, 0.83642578125, 0.98614501953125, 1.1358642578125, 1.28558349609375, 1.435302734375, 1.58502197265625, 1.7347412109375, 1.88446044921875, 2.0341796875, 2.18389892578125, 2.3336181640625, 2.48333740234375, 2.633056640625, 2.78277587890625, 2.9324951171875, 3.08221435546875, 3.23193359375, 3.38165283203125, 3.5313720703125, 3.68109130859375, 3.830810546875, 3.98052978515625, 4.1302490234375, 4.27996826171875, 4.4296875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 5.0, 7.0, 11.0, 13.0, 15.0, 6.0, 27.0, 21.0, 22.0, 28.0, 21.0, 54.0, 34.0, 46.0, 26.0, 33.0, 30.0, 33.0, 40.0, 50.0, 45.0, 34.0, 47.0, 41.0, 43.0, 36.0, 38.0, 28.0, 20.0, 28.0, 16.0, 14.0, 14.0, 12.0, 12.0, 9.0, 8.0, 7.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.690673828125, -2.60791015625, -2.525146484375, -2.4423828125, -2.359619140625, -2.27685546875, -2.194091796875, -2.111328125, -2.028564453125, -1.94580078125, -1.863037109375, -1.7802734375, -1.697509765625, -1.61474609375, -1.531982421875, -1.44921875, -1.366455078125, -1.28369140625, -1.200927734375, -1.1181640625, -1.035400390625, -0.95263671875, -0.869873046875, -0.787109375, -0.704345703125, -0.62158203125, -0.538818359375, -0.4560546875, -0.373291015625, -0.29052734375, -0.207763671875, -0.125, -0.042236328125, 0.04052734375, 0.123291015625, 0.2060546875, 0.288818359375, 0.37158203125, 0.454345703125, 0.537109375, 0.619873046875, 0.70263671875, 0.785400390625, 0.8681640625, 0.950927734375, 1.03369140625, 1.116455078125, 1.19921875, 1.281982421875, 1.36474609375, 1.447509765625, 1.5302734375, 1.613037109375, 1.69580078125, 1.778564453125, 1.861328125, 1.944091796875, 2.02685546875, 2.109619140625, 2.1923828125, 2.275146484375, 2.35791015625, 2.440673828125, 2.5234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 13.0, 32.0, 29.0, 50.0, 68.0, 126.0, 167.0, 240.0, 325.0, 533.0, 757.0, 1178.0, 1777.0, 2722.0, 4218.0, 6489.0, 10618.0, 17071.0, 28490.0, 49149.0, 83861.0, 136944.0, 186947.0, 184698.0, 132740.0, 80585.0, 46441.0, 27354.0, 16557.0, 10070.0, 6354.0, 4196.0, 2622.0, 1727.0, 1129.0, 711.0, 478.0, 364.0, 241.0, 146.0, 106.0, 75.0, 46.0, 33.0, 29.0, 16.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.648773193359375, -2.55731201171875, -2.465850830078125, -2.3743896484375, -2.282928466796875, -2.19146728515625, -2.100006103515625, -2.008544921875, -1.917083740234375, -1.82562255859375, -1.734161376953125, -1.6427001953125, -1.551239013671875, -1.45977783203125, -1.368316650390625, -1.27685546875, -1.185394287109375, -1.09393310546875, -1.002471923828125, -0.9110107421875, -0.819549560546875, -0.72808837890625, -0.636627197265625, -0.545166015625, -0.453704833984375, -0.36224365234375, -0.270782470703125, -0.1793212890625, -0.087860107421875, 0.00360107421875, 0.095062255859375, 0.1865234375, 0.277984619140625, 0.36944580078125, 0.460906982421875, 0.5523681640625, 0.643829345703125, 0.73529052734375, 0.826751708984375, 0.918212890625, 1.009674072265625, 1.10113525390625, 1.192596435546875, 1.2840576171875, 1.375518798828125, 1.46697998046875, 1.558441162109375, 1.64990234375, 1.741363525390625, 1.83282470703125, 1.924285888671875, 2.0157470703125, 2.107208251953125, 2.19866943359375, 2.290130615234375, 2.381591796875, 2.473052978515625, 2.56451416015625, 2.655975341796875, 2.7474365234375, 2.838897705078125, 2.93035888671875, 3.021820068359375, 3.11328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 6.0, 14.0, 15.0, 27.0, 28.0, 33.0, 35.0, 45.0, 67.0, 55.0, 90.0, 81.0, 94.0, 84.0, 52.0, 59.0, 46.0, 32.0, 23.0, 13.0, 10.0, 17.0, 9.0, 9.0, 8.0, 9.0, 2.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004417896270751953, -0.0004290565848350525, -0.00041632354259490967, -0.00040359050035476685, -0.000390857458114624, -0.0003781244158744812, -0.0003653913736343384, -0.00035265833139419556, -0.00033992528915405273, -0.0003271922469139099, -0.0003144592046737671, -0.00030172616243362427, -0.00028899312019348145, -0.0002762600779533386, -0.0002635270357131958, -0.000250793993473053, -0.00023806095123291016, -0.00022532790899276733, -0.0002125948667526245, -0.0001998618245124817, -0.00018712878227233887, -0.00017439574003219604, -0.00016166269779205322, -0.0001489296555519104, -0.00013619661331176758, -0.00012346357107162476, -0.00011073052883148193, -9.799748659133911e-05, -8.526444435119629e-05, -7.253140211105347e-05, -5.9798359870910645e-05, -4.706531763076782e-05, -3.4332275390625e-05, -2.1599233150482178e-05, -8.866190910339355e-06, 3.866851329803467e-06, 1.659989356994629e-05, 2.933293581008911e-05, 4.2065978050231934e-05, 5.4799020290374756e-05, 6.753206253051758e-05, 8.02651047706604e-05, 9.299814701080322e-05, 0.00010573118925094604, 0.00011846423149108887, 0.0001311972737312317, 0.0001439303159713745, 0.00015666335821151733, 0.00016939640045166016, 0.00018212944269180298, 0.0001948624849319458, 0.00020759552717208862, 0.00022032856941223145, 0.00023306161165237427, 0.0002457946538925171, 0.0002585276961326599, 0.00027126073837280273, 0.00028399378061294556, 0.0002967268228530884, 0.0003094598650932312, 0.000322192907333374, 0.00033492594957351685, 0.00034765899181365967, 0.0003603920340538025, 0.0003731250762939453]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 20.0, 28.0, 43.0, 66.0, 100.0, 129.0, 218.0, 327.0, 508.0, 797.0, 1275.0, 1953.0, 3260.0, 5245.0, 8893.0, 15100.0, 25387.0, 43762.0, 74170.0, 119281.0, 169340.0, 184334.0, 149630.0, 99361.0, 59879.0, 34525.0, 20423.0, 11874.0, 7185.0, 4263.0, 2574.0, 1626.0, 1052.0, 674.0, 405.0, 281.0, 193.0, 109.0, 94.0, 54.0, 34.0, 26.0, 24.0, 11.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.273162841796875, -2.19281005859375, -2.112457275390625, -2.0321044921875, -1.951751708984375, -1.87139892578125, -1.791046142578125, -1.710693359375, -1.630340576171875, -1.54998779296875, -1.469635009765625, -1.3892822265625, -1.308929443359375, -1.22857666015625, -1.148223876953125, -1.06787109375, -0.987518310546875, -0.90716552734375, -0.826812744140625, -0.7464599609375, -0.666107177734375, -0.58575439453125, -0.505401611328125, -0.425048828125, -0.344696044921875, -0.26434326171875, -0.183990478515625, -0.1036376953125, -0.023284912109375, 0.05706787109375, 0.137420654296875, 0.2177734375, 0.298126220703125, 0.37847900390625, 0.458831787109375, 0.5391845703125, 0.619537353515625, 0.69989013671875, 0.780242919921875, 0.860595703125, 0.940948486328125, 1.02130126953125, 1.101654052734375, 1.1820068359375, 1.262359619140625, 1.34271240234375, 1.423065185546875, 1.50341796875, 1.583770751953125, 1.66412353515625, 1.744476318359375, 1.8248291015625, 1.905181884765625, 1.98553466796875, 2.065887451171875, 2.146240234375, 2.226593017578125, 2.30694580078125, 2.387298583984375, 2.4676513671875, 2.548004150390625, 2.62835693359375, 2.708709716796875, 2.7890625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 0.0, 6.0, 2.0, 13.0, 7.0, 13.0, 12.0, 16.0, 11.0, 18.0, 25.0, 22.0, 26.0, 43.0, 47.0, 50.0, 60.0, 52.0, 46.0, 61.0, 52.0, 56.0, 36.0, 39.0, 53.0, 37.0, 35.0, 33.0, 27.0, 20.0, 10.0, 12.0, 11.0, 11.0, 9.0, 3.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.708984375, -0.6871337890625, -0.665283203125, -0.6434326171875, -0.62158203125, -0.5997314453125, -0.577880859375, -0.5560302734375, -0.5341796875, -0.5123291015625, -0.490478515625, -0.4686279296875, -0.44677734375, -0.4249267578125, -0.403076171875, -0.3812255859375, -0.359375, -0.3375244140625, -0.315673828125, -0.2938232421875, -0.27197265625, -0.2501220703125, -0.228271484375, -0.2064208984375, -0.1845703125, -0.1627197265625, -0.140869140625, -0.1190185546875, -0.09716796875, -0.0753173828125, -0.053466796875, -0.0316162109375, -0.009765625, 0.0120849609375, 0.033935546875, 0.0557861328125, 0.07763671875, 0.0994873046875, 0.121337890625, 0.1431884765625, 0.1650390625, 0.1868896484375, 0.208740234375, 0.2305908203125, 0.25244140625, 0.2742919921875, 0.296142578125, 0.3179931640625, 0.33984375, 0.3616943359375, 0.383544921875, 0.4053955078125, 0.42724609375, 0.4490966796875, 0.470947265625, 0.4927978515625, 0.5146484375, 0.5364990234375, 0.558349609375, 0.5802001953125, 0.60205078125, 0.6239013671875, 0.645751953125, 0.6676025390625, 0.689453125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 7.0, 5.0, 11.0, 13.0, 13.0, 15.0, 23.0, 30.0, 31.0, 59.0, 70.0, 69.0, 73.0, 59.0, 82.0, 60.0, 71.0, 56.0, 57.0, 43.0, 34.0, 20.0, 23.0, 12.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.548230171203613, -10.262133598327637, -9.97603702545166, -9.689939498901367, -9.40384292602539, -9.117746353149414, -8.831649780273438, -8.545553207397461, -8.259455680847168, -7.973359107971191, -7.687262058258057, -7.40116548538208, -7.115068435668945, -6.828971862792969, -6.542875289916992, -6.256778240203857, -5.970681667327881, -5.684585094451904, -5.3984880447387695, -5.112391471862793, -4.826294422149658, -4.540197849273682, -4.254100799560547, -3.9680042266845703, -3.6819074153900146, -3.395810604095459, -3.1097137928009033, -2.8236169815063477, -2.537520408630371, -2.2514233589172363, -1.9653267860412598, -1.679229974746704, -1.3931326866149902, -1.1070358753204346, -0.8209391236305237, -0.5348423719406128, -0.24874556064605713, 0.037351250648498535, 0.32344794273376465, 0.6095447540283203, 0.895641565322876, 1.1817383766174316, 1.4678351879119873, 1.7539318799972534, 2.0400285720825195, 2.3261256217956543, 2.612222194671631, 2.8983190059661865, 3.184415817260742, 3.470512628555298, 3.7566094398498535, 4.04270601272583, 4.328803062438965, 4.614899635314941, 4.900996208190918, 5.187093257904053, 5.4731903076171875, 5.759286880493164, 6.045383930206299, 6.331480503082275, 6.61757755279541, 6.903674125671387, 7.189770698547363, 7.475867748260498, 7.761964321136475]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 9.0, 1.0, 8.0, 10.0, 11.0, 10.0, 8.0, 12.0, 26.0, 18.0, 15.0, 17.0, 20.0, 27.0, 23.0, 28.0, 35.0, 33.0, 27.0, 39.0, 32.0, 39.0, 29.0, 26.0, 42.0, 29.0, 41.0, 34.0, 34.0, 25.0, 33.0, 36.0, 29.0, 22.0, 21.0, 10.0, 22.0, 15.0, 19.0, 14.0, 9.0, 15.0, 8.0, 10.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0], "bins": [-3.612844944000244, -3.507185459136963, -3.4015259742736816, -3.2958664894104004, -3.1902072429656982, -3.084547758102417, -2.9788882732391357, -2.8732287883758545, -2.7675695419311523, -2.661910057067871, -2.55625057220459, -2.4505910873413086, -2.3449318408966064, -2.239272356033325, -2.133612871170044, -2.0279533863067627, -1.9222939014434814, -1.8166344165802002, -1.7109750509262085, -1.6053155660629272, -1.4996562004089355, -1.3939967155456543, -1.288337230682373, -1.1826777458190918, -1.0770183801651, -0.9713589549064636, -0.8656995296478271, -0.7600400447845459, -0.6543806195259094, -0.548721194267273, -0.4430617094039917, -0.3374022841453552, -0.23174285888671875, -0.12608341872692108, -0.020423978567123413, 0.08523547649383545, 0.19089490175247192, 0.2965543270111084, 0.40221381187438965, 0.5078732371330261, 0.6135326623916626, 0.7191920876502991, 0.8248515129089355, 0.9305109977722168, 1.036170482635498, 1.1418298482894897, 1.247489333152771, 1.3531486988067627, 1.458808183670044, 1.5644676685333252, 1.670127034187317, 1.7757865190505981, 1.8814458847045898, 1.987105369567871, 2.0927648544311523, 2.1984243392944336, 2.304083824157715, 2.409743309020996, 2.5154027938842773, 2.6210622787475586, 2.7267215251922607, 2.832381010055542, 2.9380404949188232, 3.0436999797821045, 3.1493592262268066]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 8.0, 9.0, 13.0, 17.0, 15.0, 35.0, 56.0, 87.0, 135.0, 189.0, 346.0, 587.0, 903.0, 1527.0, 2818.0, 5441.0, 10466.0, 22355.0, 51959.0, 134702.0, 403988.0, 1168476.0, 1473538.0, 597299.0, 188543.0, 69401.0, 29731.0, 14287.0, 7199.0, 4025.0, 2246.0, 1381.0, 820.0, 568.0, 353.0, 236.0, 166.0, 110.0, 80.0, 54.0, 35.0, 20.0, 16.0, 9.0, 15.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.7734375, -9.4874267578125, -9.201416015625, -8.9154052734375, -8.62939453125, -8.3433837890625, -8.057373046875, -7.7713623046875, -7.4853515625, -7.1993408203125, -6.913330078125, -6.6273193359375, -6.34130859375, -6.0552978515625, -5.769287109375, -5.4832763671875, -5.197265625, -4.9112548828125, -4.625244140625, -4.3392333984375, -4.05322265625, -3.7672119140625, -3.481201171875, -3.1951904296875, -2.9091796875, -2.6231689453125, -2.337158203125, -2.0511474609375, -1.76513671875, -1.4791259765625, -1.193115234375, -0.9071044921875, -0.62109375, -0.3350830078125, -0.049072265625, 0.2369384765625, 0.52294921875, 0.8089599609375, 1.094970703125, 1.3809814453125, 1.6669921875, 1.9530029296875, 2.239013671875, 2.5250244140625, 2.81103515625, 3.0970458984375, 3.383056640625, 3.6690673828125, 3.955078125, 4.2410888671875, 4.527099609375, 4.8131103515625, 5.09912109375, 5.3851318359375, 5.671142578125, 5.9571533203125, 6.2431640625, 6.5291748046875, 6.815185546875, 7.1011962890625, 7.38720703125, 7.6732177734375, 7.959228515625, 8.2452392578125, 8.53125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 13.0, 11.0, 15.0, 17.0, 16.0, 13.0, 22.0, 22.0, 25.0, 34.0, 32.0, 35.0, 29.0, 47.0, 52.0, 40.0, 35.0, 52.0, 24.0, 39.0, 44.0, 43.0, 38.0, 36.0, 26.0, 25.0, 20.0, 23.0, 26.0, 16.0, 13.0, 20.0, 17.0, 13.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.142578125, -3.0423583984375, -2.942138671875, -2.8419189453125, -2.74169921875, -2.6414794921875, -2.541259765625, -2.4410400390625, -2.3408203125, -2.2406005859375, -2.140380859375, -2.0401611328125, -1.93994140625, -1.8397216796875, -1.739501953125, -1.6392822265625, -1.5390625, -1.4388427734375, -1.338623046875, -1.2384033203125, -1.13818359375, -1.0379638671875, -0.937744140625, -0.8375244140625, -0.7373046875, -0.6370849609375, -0.536865234375, -0.4366455078125, -0.33642578125, -0.2362060546875, -0.135986328125, -0.0357666015625, 0.064453125, 0.1646728515625, 0.264892578125, 0.3651123046875, 0.46533203125, 0.5655517578125, 0.665771484375, 0.7659912109375, 0.8662109375, 0.9664306640625, 1.066650390625, 1.1668701171875, 1.26708984375, 1.3673095703125, 1.467529296875, 1.5677490234375, 1.66796875, 1.7681884765625, 1.868408203125, 1.9686279296875, 2.06884765625, 2.1690673828125, 2.269287109375, 2.3695068359375, 2.4697265625, 2.5699462890625, 2.670166015625, 2.7703857421875, 2.87060546875, 2.9708251953125, 3.071044921875, 3.1712646484375, 3.271484375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 20.0, 25.0, 34.0, 53.0, 104.0, 163.0, 251.0, 434.0, 761.0, 1428.0, 2452.0, 4558.0, 8724.0, 17776.0, 38274.0, 89123.0, 226184.0, 631933.0, 1435009.0, 1076413.0, 397374.0, 147987.0, 60958.0, 26992.0, 12984.0, 6490.0, 3466.0, 1846.0, 1038.0, 568.0, 322.0, 198.0, 112.0, 65.0, 62.0, 36.0, 20.0, 10.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.546875, -10.22509765625, -9.9033203125, -9.58154296875, -9.259765625, -8.93798828125, -8.6162109375, -8.29443359375, -7.97265625, -7.65087890625, -7.3291015625, -7.00732421875, -6.685546875, -6.36376953125, -6.0419921875, -5.72021484375, -5.3984375, -5.07666015625, -4.7548828125, -4.43310546875, -4.111328125, -3.78955078125, -3.4677734375, -3.14599609375, -2.82421875, -2.50244140625, -2.1806640625, -1.85888671875, -1.537109375, -1.21533203125, -0.8935546875, -0.57177734375, -0.25, 0.07177734375, 0.3935546875, 0.71533203125, 1.037109375, 1.35888671875, 1.6806640625, 2.00244140625, 2.32421875, 2.64599609375, 2.9677734375, 3.28955078125, 3.611328125, 3.93310546875, 4.2548828125, 4.57666015625, 4.8984375, 5.22021484375, 5.5419921875, 5.86376953125, 6.185546875, 6.50732421875, 6.8291015625, 7.15087890625, 7.47265625, 7.79443359375, 8.1162109375, 8.43798828125, 8.759765625, 9.08154296875, 9.4033203125, 9.72509765625, 10.046875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 11.0, 14.0, 21.0, 32.0, 38.0, 53.0, 71.0, 96.0, 152.0, 176.0, 228.0, 325.0, 346.0, 384.0, 411.0, 390.0, 332.0, 277.0, 179.0, 158.0, 94.0, 68.0, 65.0, 33.0, 25.0, 26.0, 11.0, 9.0, 7.0, 8.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.470703125, -3.37457275390625, -3.2784423828125, -3.18231201171875, -3.086181640625, -2.99005126953125, -2.8939208984375, -2.79779052734375, -2.70166015625, -2.60552978515625, -2.5093994140625, -2.41326904296875, -2.317138671875, -2.22100830078125, -2.1248779296875, -2.02874755859375, -1.9326171875, -1.83648681640625, -1.7403564453125, -1.64422607421875, -1.548095703125, -1.45196533203125, -1.3558349609375, -1.25970458984375, -1.16357421875, -1.06744384765625, -0.9713134765625, -0.87518310546875, -0.779052734375, -0.68292236328125, -0.5867919921875, -0.49066162109375, -0.39453125, -0.29840087890625, -0.2022705078125, -0.10614013671875, -0.010009765625, 0.08612060546875, 0.1822509765625, 0.27838134765625, 0.37451171875, 0.47064208984375, 0.5667724609375, 0.66290283203125, 0.759033203125, 0.85516357421875, 0.9512939453125, 1.04742431640625, 1.1435546875, 1.23968505859375, 1.3358154296875, 1.43194580078125, 1.528076171875, 1.62420654296875, 1.7203369140625, 1.81646728515625, 1.91259765625, 2.00872802734375, 2.1048583984375, 2.20098876953125, 2.297119140625, 2.39324951171875, 2.4893798828125, 2.58551025390625, 2.681640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 6.0, 12.0, 10.0, 17.0, 11.0, 22.0, 23.0, 34.0, 37.0, 39.0, 50.0, 72.0, 65.0, 81.0, 85.0, 62.0, 62.0, 73.0, 54.0, 37.0, 27.0, 31.0, 23.0, 15.0, 17.0, 8.0, 4.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.038509368896484, -12.719670295715332, -12.400830268859863, -12.081991195678711, -11.763152122497559, -11.444313049316406, -11.125473022460938, -10.806633949279785, -10.487794876098633, -10.16895580291748, -9.850115776062012, -9.53127670288086, -9.212437629699707, -8.893598556518555, -8.574758529663086, -8.255919456481934, -7.937079429626465, -7.618239879608154, -7.299400806427002, -6.980561256408691, -6.661722183227539, -6.3428826332092285, -6.024043083190918, -5.705204010009766, -5.386364459991455, -5.0675249099731445, -4.748685836791992, -4.429846286773682, -4.111006736755371, -3.7921676635742188, -3.473328113555908, -3.1544888019561768, -2.8356499671936035, -2.516810655593872, -2.1979713439941406, -1.87913179397583, -1.5602924823760986, -1.2414531707763672, -0.9226137399673462, -0.6037743091583252, -0.28493499755859375, 0.03390437364578247, 0.3527437448501587, 0.6715831160545349, 0.9904224872589111, 1.3092617988586426, 1.6281012296676636, 1.9469406604766846, 2.265779972076416, 2.5846192836761475, 2.903458595275879, 3.2222981452941895, 3.541137456893921, 3.8599767684936523, 4.178816318511963, 4.497655868530273, 4.816494941711426, 5.135334491729736, 5.454173564910889, 5.773013114929199, 6.091852188110352, 6.410691738128662, 6.729531288146973, 7.048370361328125, 7.3672099113464355]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 4.0, 2.0, 5.0, 10.0, 10.0, 12.0, 19.0, 12.0, 21.0, 15.0, 20.0, 26.0, 25.0, 31.0, 29.0, 37.0, 35.0, 44.0, 40.0, 32.0, 41.0, 38.0, 45.0, 37.0, 37.0, 30.0, 28.0, 33.0, 34.0, 28.0, 34.0, 21.0, 27.0, 20.0, 17.0, 16.0, 11.0, 9.0, 8.0, 9.0, 11.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.489992618560791, -4.361401081085205, -4.232809543609619, -4.104218006134033, -3.9756264686584473, -3.8470349311828613, -3.7184433937072754, -3.5898518562316895, -3.4612603187561035, -3.3326687812805176, -3.2040772438049316, -3.0754857063293457, -2.9468941688537598, -2.818302631378174, -2.689711093902588, -2.561119556427002, -2.432528018951416, -2.30393648147583, -2.175344944000244, -2.046753406524658, -1.9181618690490723, -1.7895703315734863, -1.6609787940979004, -1.5323872566223145, -1.4037957191467285, -1.2752041816711426, -1.1466126441955566, -1.0180211067199707, -0.8894295692443848, -0.7608380317687988, -0.6322464942932129, -0.503654956817627, -0.3750631809234619, -0.24647164344787598, -0.11788010597229004, 0.010711431503295898, 0.13930296897888184, 0.2678945064544678, 0.3964860439300537, 0.5250775814056396, 0.6536691188812256, 0.7822606563568115, 0.9108521938323975, 1.0394437313079834, 1.1680352687835693, 1.2966268062591553, 1.4252183437347412, 1.5538098812103271, 1.682401418685913, 1.810992956161499, 1.939584493637085, 2.068176031112671, 2.196767568588257, 2.3253591060638428, 2.4539506435394287, 2.5825421810150146, 2.7111337184906006, 2.8397252559661865, 2.9683167934417725, 3.0969083309173584, 3.2254998683929443, 3.3540914058685303, 3.482682943344116, 3.611274480819702, 3.739866018295288]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 11.0, 17.0, 27.0, 28.0, 55.0, 83.0, 145.0, 220.0, 367.0, 546.0, 898.0, 1347.0, 2253.0, 3614.0, 5877.0, 9809.0, 16065.0, 26414.0, 42929.0, 68074.0, 103453.0, 142455.0, 163486.0, 149560.0, 111842.0, 74947.0, 47606.0, 29782.0, 18010.0, 11041.0, 6641.0, 4151.0, 2507.0, 1610.0, 990.0, 611.0, 385.0, 216.0, 168.0, 104.0, 74.0, 48.0, 24.0, 20.0, 10.0, 7.0, 10.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.74609375, -2.661895751953125, -2.57769775390625, -2.493499755859375, -2.4093017578125, -2.325103759765625, -2.24090576171875, -2.156707763671875, -2.072509765625, -1.988311767578125, -1.90411376953125, -1.819915771484375, -1.7357177734375, -1.651519775390625, -1.56732177734375, -1.483123779296875, -1.39892578125, -1.314727783203125, -1.23052978515625, -1.146331787109375, -1.0621337890625, -0.977935791015625, -0.89373779296875, -0.809539794921875, -0.725341796875, -0.641143798828125, -0.55694580078125, -0.472747802734375, -0.3885498046875, -0.304351806640625, -0.22015380859375, -0.135955810546875, -0.0517578125, 0.032440185546875, 0.11663818359375, 0.200836181640625, 0.2850341796875, 0.369232177734375, 0.45343017578125, 0.537628173828125, 0.621826171875, 0.706024169921875, 0.79022216796875, 0.874420166015625, 0.9586181640625, 1.042816162109375, 1.12701416015625, 1.211212158203125, 1.29541015625, 1.379608154296875, 1.46380615234375, 1.548004150390625, 1.6322021484375, 1.716400146484375, 1.80059814453125, 1.884796142578125, 1.968994140625, 2.053192138671875, 2.13739013671875, 2.221588134765625, 2.3057861328125, 2.389984130859375, 2.47418212890625, 2.558380126953125, 2.642578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 2.0, 8.0, 11.0, 10.0, 8.0, 20.0, 16.0, 16.0, 31.0, 24.0, 26.0, 32.0, 28.0, 30.0, 40.0, 33.0, 42.0, 35.0, 38.0, 38.0, 49.0, 43.0, 35.0, 37.0, 32.0, 31.0, 28.0, 24.0, 26.0, 28.0, 23.0, 16.0, 21.0, 18.0, 14.0, 22.0, 16.0, 6.0, 11.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.80859375, -4.6680908203125, -4.527587890625, -4.3870849609375, -4.24658203125, -4.1060791015625, -3.965576171875, -3.8250732421875, -3.6845703125, -3.5440673828125, -3.403564453125, -3.2630615234375, -3.12255859375, -2.9820556640625, -2.841552734375, -2.7010498046875, -2.560546875, -2.4200439453125, -2.279541015625, -2.1390380859375, -1.99853515625, -1.8580322265625, -1.717529296875, -1.5770263671875, -1.4365234375, -1.2960205078125, -1.155517578125, -1.0150146484375, -0.87451171875, -0.7340087890625, -0.593505859375, -0.4530029296875, -0.3125, -0.1719970703125, -0.031494140625, 0.1090087890625, 0.24951171875, 0.3900146484375, 0.530517578125, 0.6710205078125, 0.8115234375, 0.9520263671875, 1.092529296875, 1.2330322265625, 1.37353515625, 1.5140380859375, 1.654541015625, 1.7950439453125, 1.935546875, 2.0760498046875, 2.216552734375, 2.3570556640625, 2.49755859375, 2.6380615234375, 2.778564453125, 2.9190673828125, 3.0595703125, 3.2000732421875, 3.340576171875, 3.4810791015625, 3.62158203125, 3.7620849609375, 3.902587890625, 4.0430908203125, 4.18359375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 14.0, 16.0, 25.0, 41.0, 58.0, 86.0, 160.0, 216.0, 358.0, 567.0, 908.0, 1341.0, 2097.0, 3384.0, 5395.0, 8590.0, 13861.0, 22577.0, 37153.0, 59953.0, 96685.0, 147856.0, 187504.0, 164790.0, 112137.0, 69944.0, 43215.0, 26360.0, 16346.0, 9906.0, 6310.0, 3955.0, 2398.0, 1478.0, 1032.0, 604.0, 445.0, 277.0, 181.0, 137.0, 73.0, 55.0, 26.0, 18.0, 8.0, 4.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.838470458984375, -2.73944091796875, -2.640411376953125, -2.5413818359375, -2.442352294921875, -2.34332275390625, -2.244293212890625, -2.145263671875, -2.046234130859375, -1.94720458984375, -1.848175048828125, -1.7491455078125, -1.650115966796875, -1.55108642578125, -1.452056884765625, -1.35302734375, -1.253997802734375, -1.15496826171875, -1.055938720703125, -0.9569091796875, -0.857879638671875, -0.75885009765625, -0.659820556640625, -0.560791015625, -0.461761474609375, -0.36273193359375, -0.263702392578125, -0.1646728515625, -0.065643310546875, 0.03338623046875, 0.132415771484375, 0.2314453125, 0.330474853515625, 0.42950439453125, 0.528533935546875, 0.6275634765625, 0.726593017578125, 0.82562255859375, 0.924652099609375, 1.023681640625, 1.122711181640625, 1.22174072265625, 1.320770263671875, 1.4197998046875, 1.518829345703125, 1.61785888671875, 1.716888427734375, 1.81591796875, 1.914947509765625, 2.01397705078125, 2.113006591796875, 2.2120361328125, 2.311065673828125, 2.41009521484375, 2.509124755859375, 2.608154296875, 2.707183837890625, 2.80621337890625, 2.905242919921875, 3.0042724609375, 3.103302001953125, 3.20233154296875, 3.301361083984375, 3.400390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 8.0, 7.0, 12.0, 14.0, 14.0, 16.0, 17.0, 20.0, 21.0, 24.0, 39.0, 31.0, 48.0, 47.0, 49.0, 48.0, 52.0, 45.0, 56.0, 47.0, 49.0, 35.0, 42.0, 29.0, 29.0, 31.0, 27.0, 24.0, 20.0, 20.0, 12.0, 16.0, 9.0, 8.0, 9.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.998046875, -2.89984130859375, -2.8016357421875, -2.70343017578125, -2.605224609375, -2.50701904296875, -2.4088134765625, -2.31060791015625, -2.21240234375, -2.11419677734375, -2.0159912109375, -1.91778564453125, -1.819580078125, -1.72137451171875, -1.6231689453125, -1.52496337890625, -1.4267578125, -1.32855224609375, -1.2303466796875, -1.13214111328125, -1.033935546875, -0.93572998046875, -0.8375244140625, -0.73931884765625, -0.64111328125, -0.54290771484375, -0.4447021484375, -0.34649658203125, -0.248291015625, -0.15008544921875, -0.0518798828125, 0.04632568359375, 0.14453125, 0.24273681640625, 0.3409423828125, 0.43914794921875, 0.537353515625, 0.63555908203125, 0.7337646484375, 0.83197021484375, 0.93017578125, 1.02838134765625, 1.1265869140625, 1.22479248046875, 1.322998046875, 1.42120361328125, 1.5194091796875, 1.61761474609375, 1.7158203125, 1.81402587890625, 1.9122314453125, 2.01043701171875, 2.108642578125, 2.20684814453125, 2.3050537109375, 2.40325927734375, 2.50146484375, 2.59967041015625, 2.6978759765625, 2.79608154296875, 2.894287109375, 2.99249267578125, 3.0906982421875, 3.18890380859375, 3.287109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 13.0, 21.0, 28.0, 34.0, 54.0, 88.0, 126.0, 210.0, 291.0, 498.0, 751.0, 1207.0, 1921.0, 3271.0, 5646.0, 9838.0, 18314.0, 36136.0, 75453.0, 157695.0, 276580.0, 230198.0, 115740.0, 54769.0, 26979.0, 14195.0, 7379.0, 4345.0, 2515.0, 1557.0, 977.0, 611.0, 369.0, 259.0, 150.0, 109.0, 69.0, 50.0, 37.0, 15.0, 25.0, 7.0, 8.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.883392333984375, -1.81561279296875, -1.747833251953125, -1.6800537109375, -1.612274169921875, -1.54449462890625, -1.476715087890625, -1.408935546875, -1.341156005859375, -1.27337646484375, -1.205596923828125, -1.1378173828125, -1.070037841796875, -1.00225830078125, -0.934478759765625, -0.86669921875, -0.798919677734375, -0.73114013671875, -0.663360595703125, -0.5955810546875, -0.527801513671875, -0.46002197265625, -0.392242431640625, -0.324462890625, -0.256683349609375, -0.18890380859375, -0.121124267578125, -0.0533447265625, 0.014434814453125, 0.08221435546875, 0.149993896484375, 0.2177734375, 0.285552978515625, 0.35333251953125, 0.421112060546875, 0.4888916015625, 0.556671142578125, 0.62445068359375, 0.692230224609375, 0.760009765625, 0.827789306640625, 0.89556884765625, 0.963348388671875, 1.0311279296875, 1.098907470703125, 1.16668701171875, 1.234466552734375, 1.30224609375, 1.370025634765625, 1.43780517578125, 1.505584716796875, 1.5733642578125, 1.641143798828125, 1.70892333984375, 1.776702880859375, 1.844482421875, 1.912261962890625, 1.98004150390625, 2.047821044921875, 2.1156005859375, 2.183380126953125, 2.25115966796875, 2.318939208984375, 2.38671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 9.0, 17.0, 13.0, 22.0, 26.0, 45.0, 43.0, 62.0, 64.0, 79.0, 89.0, 84.0, 88.0, 72.0, 61.0, 59.0, 36.0, 27.0, 25.0, 15.0, 15.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.00013144686818122864, -0.00012771040201187134, -0.00012397393584251404, -0.00012023746967315674, -0.00011650100350379944, -0.00011276453733444214, -0.00010902807116508484, -0.00010529160499572754, -0.00010155513882637024, -9.781867265701294e-05, -9.408220648765564e-05, -9.034574031829834e-05, -8.660927414894104e-05, -8.287280797958374e-05, -7.913634181022644e-05, -7.539987564086914e-05, -7.166340947151184e-05, -6.792694330215454e-05, -6.419047713279724e-05, -6.045401096343994e-05, -5.671754479408264e-05, -5.298107862472534e-05, -4.924461245536804e-05, -4.550814628601074e-05, -4.177168011665344e-05, -3.803521394729614e-05, -3.429874777793884e-05, -3.056228160858154e-05, -2.6825815439224243e-05, -2.3089349269866943e-05, -1.9352883100509644e-05, -1.5616416931152344e-05, -1.1879950761795044e-05, -8.143484592437744e-06, -4.407018423080444e-06, -6.705522537231445e-07, 3.0659139156341553e-06, 6.802380084991455e-06, 1.0538846254348755e-05, 1.4275312423706055e-05, 1.8011778593063354e-05, 2.1748244762420654e-05, 2.5484710931777954e-05, 2.9221177101135254e-05, 3.2957643270492554e-05, 3.6694109439849854e-05, 4.043057560920715e-05, 4.416704177856445e-05, 4.790350794792175e-05, 5.163997411727905e-05, 5.537644028663635e-05, 5.911290645599365e-05, 6.284937262535095e-05, 6.658583879470825e-05, 7.032230496406555e-05, 7.405877113342285e-05, 7.779523730278015e-05, 8.153170347213745e-05, 8.526816964149475e-05, 8.900463581085205e-05, 9.274110198020935e-05, 9.647756814956665e-05, 0.00010021403431892395, 0.00010395050048828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 9.0, 18.0, 21.0, 25.0, 40.0, 63.0, 96.0, 129.0, 196.0, 270.0, 409.0, 664.0, 1035.0, 1520.0, 2564.0, 4085.0, 6591.0, 10849.0, 17641.0, 29810.0, 49855.0, 81558.0, 124626.0, 165253.0, 172013.0, 138372.0, 93880.0, 57888.0, 34945.0, 20960.0, 12527.0, 7669.0, 4716.0, 3029.0, 1832.0, 1117.0, 771.0, 482.0, 340.0, 235.0, 142.0, 83.0, 73.0, 63.0, 34.0, 24.0, 13.0, 9.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4287109375, -1.38427734375, -1.33984375, -1.29541015625, -1.2509765625, -1.20654296875, -1.162109375, -1.11767578125, -1.0732421875, -1.02880859375, -0.984375, -0.93994140625, -0.8955078125, -0.85107421875, -0.806640625, -0.76220703125, -0.7177734375, -0.67333984375, -0.62890625, -0.58447265625, -0.5400390625, -0.49560546875, -0.451171875, -0.40673828125, -0.3623046875, -0.31787109375, -0.2734375, -0.22900390625, -0.1845703125, -0.14013671875, -0.095703125, -0.05126953125, -0.0068359375, 0.03759765625, 0.08203125, 0.12646484375, 0.1708984375, 0.21533203125, 0.259765625, 0.30419921875, 0.3486328125, 0.39306640625, 0.4375, 0.48193359375, 0.5263671875, 0.57080078125, 0.615234375, 0.65966796875, 0.7041015625, 0.74853515625, 0.79296875, 0.83740234375, 0.8818359375, 0.92626953125, 0.970703125, 1.01513671875, 1.0595703125, 1.10400390625, 1.1484375, 1.19287109375, 1.2373046875, 1.28173828125, 1.326171875, 1.37060546875, 1.4150390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 6.0, 9.0, 8.0, 15.0, 17.0, 24.0, 30.0, 37.0, 31.0, 42.0, 42.0, 51.0, 50.0, 50.0, 46.0, 58.0, 59.0, 66.0, 52.0, 39.0, 43.0, 39.0, 24.0, 33.0, 13.0, 18.0, 15.0, 12.0, 15.0, 6.0, 11.0, 3.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4138031005859375, -0.400115966796875, -0.3864288330078125, -0.37274169921875, -0.3590545654296875, -0.345367431640625, -0.3316802978515625, -0.3179931640625, -0.3043060302734375, -0.290618896484375, -0.2769317626953125, -0.26324462890625, -0.2495574951171875, -0.235870361328125, -0.2221832275390625, -0.20849609375, -0.1948089599609375, -0.181121826171875, -0.1674346923828125, -0.15374755859375, -0.1400604248046875, -0.126373291015625, -0.1126861572265625, -0.0989990234375, -0.0853118896484375, -0.071624755859375, -0.0579376220703125, -0.04425048828125, -0.0305633544921875, -0.016876220703125, -0.0031890869140625, 0.010498046875, 0.0241851806640625, 0.037872314453125, 0.0515594482421875, 0.06524658203125, 0.0789337158203125, 0.092620849609375, 0.1063079833984375, 0.1199951171875, 0.1336822509765625, 0.147369384765625, 0.1610565185546875, 0.17474365234375, 0.1884307861328125, 0.202117919921875, 0.2158050537109375, 0.2294921875, 0.2431793212890625, 0.256866455078125, 0.2705535888671875, 0.28424072265625, 0.2979278564453125, 0.311614990234375, 0.3253021240234375, 0.3389892578125, 0.3526763916015625, 0.366363525390625, 0.3800506591796875, 0.39373779296875, 0.4074249267578125, 0.421112060546875, 0.4347991943359375, 0.448486328125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 10.0, 11.0, 18.0, 9.0, 17.0, 26.0, 32.0, 37.0, 36.0, 46.0, 72.0, 65.0, 77.0, 81.0, 56.0, 70.0, 63.0, 65.0, 41.0, 30.0, 34.0, 17.0, 21.0, 14.0, 9.0, 6.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.656728744506836, -12.348825454711914, -12.040922164916992, -11.73301887512207, -11.425115585327148, -11.11721134185791, -10.809308052062988, -10.501404762268066, -10.193501472473145, -9.885598182678223, -9.5776948928833, -9.269791603088379, -8.96188735961914, -8.653984069824219, -8.346080780029297, -8.038177490234375, -7.730274200439453, -7.422370910644531, -7.114467620849609, -6.806563854217529, -6.498660564422607, -6.1907572746276855, -5.8828535079956055, -5.574950218200684, -5.267046928405762, -4.95914363861084, -4.651240348815918, -4.343336582183838, -4.035433292388916, -3.727530002593994, -3.419626474380493, -3.111722946166992, -2.8038196563720703, -2.4959163665771484, -2.1880128383636475, -1.880109429359436, -1.5722060203552246, -1.2643026113510132, -0.9563992023468018, -0.6484956741333008, -0.3405923843383789, -0.03268897533416748, 0.27521443367004395, 0.5831178426742554, 0.8910212516784668, 1.1989246606826782, 1.5068280696868896, 1.8147315979003906, 2.1226348876953125, 2.4305381774902344, 2.7384417057037354, 3.0463452339172363, 3.354248523712158, 3.66215181350708, 3.970055341720581, 4.277958869934082, 4.585862159729004, 4.893765449523926, 5.201668739318848, 5.509572505950928, 5.81747579574585, 6.1253790855407715, 6.433282852172852, 6.741186141967773, 7.049089431762695]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 2.0, 9.0, 11.0, 7.0, 16.0, 11.0, 24.0, 13.0, 18.0, 23.0, 22.0, 26.0, 36.0, 28.0, 34.0, 39.0, 37.0, 32.0, 39.0, 37.0, 41.0, 42.0, 45.0, 29.0, 31.0, 34.0, 31.0, 22.0, 34.0, 37.0, 23.0, 22.0, 21.0, 17.0, 17.0, 12.0, 7.0, 9.0, 13.0, 7.0, 9.0, 10.0, 7.0, 3.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.384467124938965, -4.258650779724121, -4.132833957672119, -4.007017612457275, -3.8812012672424316, -3.755384683609009, -3.629568099975586, -3.503751754760742, -3.3779351711273193, -3.2521185874938965, -3.1263022422790527, -3.00048565864563, -2.874669075012207, -2.7488527297973633, -2.6230361461639404, -2.4972195625305176, -2.371403217315674, -2.245586633682251, -2.1197702884674072, -1.9939537048339844, -1.868137240409851, -1.7423207759857178, -1.616504192352295, -1.4906877279281616, -1.3648712635040283, -1.239054799079895, -1.1132383346557617, -0.9874217510223389, -0.8616052865982056, -0.7357888221740723, -0.6099722981452942, -0.4841557741165161, -0.3583395481109619, -0.23252305388450623, -0.10670655965805054, 0.01910993456840515, 0.14492642879486084, 0.27074289321899414, 0.3965594172477722, 0.5223759412765503, 0.6481924057006836, 0.7740088701248169, 0.899825394153595, 1.025641918182373, 1.1514583826065063, 1.2772748470306396, 1.4030914306640625, 1.5289078950881958, 1.654724359512329, 1.7805408239364624, 1.9063572883605957, 2.0321738719940186, 2.1579904556274414, 2.283806800842285, 2.409623384475708, 2.535439968109131, 2.6612563133239746, 2.7870728969573975, 2.912889242172241, 3.038705825805664, 3.164522171020508, 3.2903387546539307, 3.4161553382873535, 3.5419716835021973, 3.66778826713562]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 11.0, 15.0, 11.0, 21.0, 18.0, 22.0, 42.0, 69.0, 99.0, 127.0, 182.0, 274.0, 440.0, 730.0, 1149.0, 1832.0, 3218.0, 5539.0, 9712.0, 17707.0, 32747.0, 61296.0, 112500.0, 181892.0, 217543.0, 172442.0, 104329.0, 56317.0, 29875.0, 16401.0, 8879.0, 5155.0, 2995.0, 1785.0, 1137.0, 684.0, 434.0, 283.0, 191.0, 136.0, 98.0, 69.0, 38.0, 30.0, 16.0, 16.0, 20.0, 9.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0], "bins": [-7.48828125, -7.27081298828125, -7.0533447265625, -6.83587646484375, -6.618408203125, -6.40093994140625, -6.1834716796875, -5.96600341796875, -5.74853515625, -5.53106689453125, -5.3135986328125, -5.09613037109375, -4.878662109375, -4.66119384765625, -4.4437255859375, -4.22625732421875, -4.0087890625, -3.79132080078125, -3.5738525390625, -3.35638427734375, -3.138916015625, -2.92144775390625, -2.7039794921875, -2.48651123046875, -2.26904296875, -2.05157470703125, -1.8341064453125, -1.61663818359375, -1.399169921875, -1.18170166015625, -0.9642333984375, -0.74676513671875, -0.529296875, -0.31182861328125, -0.0943603515625, 0.12310791015625, 0.340576171875, 0.55804443359375, 0.7755126953125, 0.99298095703125, 1.21044921875, 1.42791748046875, 1.6453857421875, 1.86285400390625, 2.080322265625, 2.29779052734375, 2.5152587890625, 2.73272705078125, 2.9501953125, 3.16766357421875, 3.3851318359375, 3.60260009765625, 3.820068359375, 4.03753662109375, 4.2550048828125, 4.47247314453125, 4.68994140625, 4.90740966796875, 5.1248779296875, 5.34234619140625, 5.559814453125, 5.77728271484375, 5.9947509765625, 6.21221923828125, 6.4296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 2.0, 14.0, 10.0, 14.0, 5.0, 13.0, 16.0, 16.0, 16.0, 23.0, 20.0, 28.0, 34.0, 40.0, 25.0, 38.0, 48.0, 32.0, 38.0, 27.0, 41.0, 58.0, 45.0, 40.0, 29.0, 33.0, 27.0, 31.0, 25.0, 26.0, 26.0, 23.0, 18.0, 17.0, 12.0, 13.0, 10.0, 10.0, 10.0, 7.0, 4.0, 9.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-4.51953125, -4.38494873046875, -4.2503662109375, -4.11578369140625, -3.981201171875, -3.84661865234375, -3.7120361328125, -3.57745361328125, -3.44287109375, -3.30828857421875, -3.1737060546875, -3.03912353515625, -2.904541015625, -2.76995849609375, -2.6353759765625, -2.50079345703125, -2.3662109375, -2.23162841796875, -2.0970458984375, -1.96246337890625, -1.827880859375, -1.69329833984375, -1.5587158203125, -1.42413330078125, -1.28955078125, -1.15496826171875, -1.0203857421875, -0.88580322265625, -0.751220703125, -0.61663818359375, -0.4820556640625, -0.34747314453125, -0.212890625, -0.07830810546875, 0.0562744140625, 0.19085693359375, 0.325439453125, 0.46002197265625, 0.5946044921875, 0.72918701171875, 0.86376953125, 0.99835205078125, 1.1329345703125, 1.26751708984375, 1.402099609375, 1.53668212890625, 1.6712646484375, 1.80584716796875, 1.9404296875, 2.07501220703125, 2.2095947265625, 2.34417724609375, 2.478759765625, 2.61334228515625, 2.7479248046875, 2.88250732421875, 3.01708984375, 3.15167236328125, 3.2862548828125, 3.42083740234375, 3.555419921875, 3.69000244140625, 3.8245849609375, 3.95916748046875, 4.09375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 17.0, 20.0, 28.0, 54.0, 53.0, 101.0, 132.0, 203.0, 319.0, 407.0, 618.0, 943.0, 1450.0, 2221.0, 3636.0, 5480.0, 9202.0, 15529.0, 26537.0, 45928.0, 76792.0, 122350.0, 169987.0, 181741.0, 145271.0, 96411.0, 58185.0, 34263.0, 19837.0, 11582.0, 7046.0, 4319.0, 2644.0, 1729.0, 1093.0, 827.0, 514.0, 349.0, 206.0, 154.0, 113.0, 80.0, 61.0, 25.0, 30.0, 24.0, 8.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.49609375, -5.31427001953125, -5.1324462890625, -4.95062255859375, -4.768798828125, -4.58697509765625, -4.4051513671875, -4.22332763671875, -4.04150390625, -3.85968017578125, -3.6778564453125, -3.49603271484375, -3.314208984375, -3.13238525390625, -2.9505615234375, -2.76873779296875, -2.5869140625, -2.40509033203125, -2.2232666015625, -2.04144287109375, -1.859619140625, -1.67779541015625, -1.4959716796875, -1.31414794921875, -1.13232421875, -0.95050048828125, -0.7686767578125, -0.58685302734375, -0.405029296875, -0.22320556640625, -0.0413818359375, 0.14044189453125, 0.322265625, 0.50408935546875, 0.6859130859375, 0.86773681640625, 1.049560546875, 1.23138427734375, 1.4132080078125, 1.59503173828125, 1.77685546875, 1.95867919921875, 2.1405029296875, 2.32232666015625, 2.504150390625, 2.68597412109375, 2.8677978515625, 3.04962158203125, 3.2314453125, 3.41326904296875, 3.5950927734375, 3.77691650390625, 3.958740234375, 4.14056396484375, 4.3223876953125, 4.50421142578125, 4.68603515625, 4.86785888671875, 5.0496826171875, 5.23150634765625, 5.413330078125, 5.59515380859375, 5.7769775390625, 5.95880126953125, 6.140625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 6.0, 9.0, 7.0, 9.0, 16.0, 20.0, 23.0, 22.0, 25.0, 35.0, 26.0, 26.0, 37.0, 32.0, 35.0, 34.0, 29.0, 59.0, 40.0, 41.0, 34.0, 39.0, 34.0, 41.0, 28.0, 34.0, 29.0, 33.0, 29.0, 29.0, 18.0, 13.0, 10.0, 14.0, 10.0, 7.0, 10.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.34765625, -2.26690673828125, -2.1861572265625, -2.10540771484375, -2.024658203125, -1.94390869140625, -1.8631591796875, -1.78240966796875, -1.70166015625, -1.62091064453125, -1.5401611328125, -1.45941162109375, -1.378662109375, -1.29791259765625, -1.2171630859375, -1.13641357421875, -1.0556640625, -0.97491455078125, -0.8941650390625, -0.81341552734375, -0.732666015625, -0.65191650390625, -0.5711669921875, -0.49041748046875, -0.40966796875, -0.32891845703125, -0.2481689453125, -0.16741943359375, -0.086669921875, -0.00592041015625, 0.0748291015625, 0.15557861328125, 0.236328125, 0.31707763671875, 0.3978271484375, 0.47857666015625, 0.559326171875, 0.64007568359375, 0.7208251953125, 0.80157470703125, 0.88232421875, 0.96307373046875, 1.0438232421875, 1.12457275390625, 1.205322265625, 1.28607177734375, 1.3668212890625, 1.44757080078125, 1.5283203125, 1.60906982421875, 1.6898193359375, 1.77056884765625, 1.851318359375, 1.93206787109375, 2.0128173828125, 2.09356689453125, 2.17431640625, 2.25506591796875, 2.3358154296875, 2.41656494140625, 2.497314453125, 2.57806396484375, 2.6588134765625, 2.73956298828125, 2.8203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 12.0, 18.0, 16.0, 31.0, 31.0, 62.0, 104.0, 128.0, 180.0, 218.0, 335.0, 477.0, 713.0, 1105.0, 1482.0, 2263.0, 3413.0, 5010.0, 7714.0, 12043.0, 18731.0, 29897.0, 49589.0, 82370.0, 131998.0, 182262.0, 179995.0, 128458.0, 80063.0, 48022.0, 29280.0, 18070.0, 11425.0, 7586.0, 4986.0, 3438.0, 2168.0, 1538.0, 1006.0, 679.0, 459.0, 352.0, 249.0, 165.0, 115.0, 76.0, 62.0, 43.0, 24.0, 25.0, 21.0, 13.0, 6.0, 9.0, 8.0, 1.0, 3.0], "bins": [-2.8203125, -2.734771728515625, -2.64923095703125, -2.563690185546875, -2.4781494140625, -2.392608642578125, -2.30706787109375, -2.221527099609375, -2.135986328125, -2.050445556640625, -1.96490478515625, -1.879364013671875, -1.7938232421875, -1.708282470703125, -1.62274169921875, -1.537200927734375, -1.45166015625, -1.366119384765625, -1.28057861328125, -1.195037841796875, -1.1094970703125, -1.023956298828125, -0.93841552734375, -0.852874755859375, -0.767333984375, -0.681793212890625, -0.59625244140625, -0.510711669921875, -0.4251708984375, -0.339630126953125, -0.25408935546875, -0.168548583984375, -0.0830078125, 0.002532958984375, 0.08807373046875, 0.173614501953125, 0.2591552734375, 0.344696044921875, 0.43023681640625, 0.515777587890625, 0.601318359375, 0.686859130859375, 0.77239990234375, 0.857940673828125, 0.9434814453125, 1.029022216796875, 1.11456298828125, 1.200103759765625, 1.28564453125, 1.371185302734375, 1.45672607421875, 1.542266845703125, 1.6278076171875, 1.713348388671875, 1.79888916015625, 1.884429931640625, 1.969970703125, 2.055511474609375, 2.14105224609375, 2.226593017578125, 2.3121337890625, 2.397674560546875, 2.48321533203125, 2.568756103515625, 2.654296875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 18.0, 7.0, 12.0, 14.0, 35.0, 55.0, 72.0, 92.0, 133.0, 151.0, 131.0, 106.0, 44.0, 53.0, 22.0, 18.0, 12.0, 8.0, 4.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007038116455078125, -0.000684000551700592, -0.0006641894578933716, -0.0006443783640861511, -0.0006245672702789307, -0.0006047561764717102, -0.0005849450826644897, -0.0005651339888572693, -0.0005453228950500488, -0.0005255118012428284, -0.0005057007074356079, -0.00048588961362838745, -0.000466078519821167, -0.00044626742601394653, -0.0004264563322067261, -0.0004066452383995056, -0.00038683414459228516, -0.0003670230507850647, -0.00034721195697784424, -0.0003274008631706238, -0.0003075897693634033, -0.00028777867555618286, -0.0002679675817489624, -0.00024815648794174194, -0.00022834539413452148, -0.00020853430032730103, -0.00018872320652008057, -0.0001689121127128601, -0.00014910101890563965, -0.0001292899250984192, -0.00010947883129119873, -8.966773748397827e-05, -6.985664367675781e-05, -5.0045549869537354e-05, -3.0234456062316895e-05, -1.0423362255096436e-05, 9.387731552124023e-06, 2.9198825359344482e-05, 4.900991916656494e-05, 6.88210129737854e-05, 8.863210678100586e-05, 0.00010844320058822632, 0.00012825429439544678, 0.00014806538820266724, 0.0001678764820098877, 0.00018768757581710815, 0.0002074986696243286, 0.00022730976343154907, 0.00024712085723876953, 0.00026693195104599, 0.00028674304485321045, 0.0003065541386604309, 0.00032636523246765137, 0.0003461763262748718, 0.0003659874200820923, 0.00038579851388931274, 0.0004056096076965332, 0.00042542070150375366, 0.0004452317953109741, 0.0004650428891181946, 0.00048485398292541504, 0.0005046650767326355, 0.000524476170539856, 0.0005442872643470764, 0.0005640983581542969]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 11.0, 23.0, 38.0, 45.0, 77.0, 128.0, 220.0, 300.0, 488.0, 805.0, 1349.0, 2166.0, 3529.0, 5783.0, 9777.0, 16467.0, 28049.0, 48774.0, 84367.0, 137972.0, 190378.0, 187617.0, 134591.0, 81597.0, 47261.0, 27275.0, 15814.0, 9243.0, 5574.0, 3465.0, 2075.0, 1234.0, 780.0, 474.0, 319.0, 186.0, 87.0, 78.0, 50.0, 29.0, 19.0, 15.0, 10.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.39483642578125, -2.3092041015625, -2.22357177734375, -2.137939453125, -2.05230712890625, -1.9666748046875, -1.88104248046875, -1.79541015625, -1.70977783203125, -1.6241455078125, -1.53851318359375, -1.452880859375, -1.36724853515625, -1.2816162109375, -1.19598388671875, -1.1103515625, -1.02471923828125, -0.9390869140625, -0.85345458984375, -0.767822265625, -0.68218994140625, -0.5965576171875, -0.51092529296875, -0.42529296875, -0.33966064453125, -0.2540283203125, -0.16839599609375, -0.082763671875, 0.00286865234375, 0.0885009765625, 0.17413330078125, 0.259765625, 0.34539794921875, 0.4310302734375, 0.51666259765625, 0.602294921875, 0.68792724609375, 0.7735595703125, 0.85919189453125, 0.94482421875, 1.03045654296875, 1.1160888671875, 1.20172119140625, 1.287353515625, 1.37298583984375, 1.4586181640625, 1.54425048828125, 1.6298828125, 1.71551513671875, 1.8011474609375, 1.88677978515625, 1.972412109375, 2.05804443359375, 2.1436767578125, 2.22930908203125, 2.31494140625, 2.40057373046875, 2.4862060546875, 2.57183837890625, 2.657470703125, 2.74310302734375, 2.8287353515625, 2.91436767578125, 3.0]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 7.0, 11.0, 7.0, 12.0, 21.0, 22.0, 36.0, 32.0, 37.0, 40.0, 46.0, 63.0, 74.0, 91.0, 79.0, 74.0, 44.0, 48.0, 37.0, 40.0, 37.0, 30.0, 23.0, 18.0, 17.0, 15.0, 8.0, 5.0, 8.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.900390625, -0.869384765625, -0.83837890625, -0.807373046875, -0.7763671875, -0.745361328125, -0.71435546875, -0.683349609375, -0.65234375, -0.621337890625, -0.59033203125, -0.559326171875, -0.5283203125, -0.497314453125, -0.46630859375, -0.435302734375, -0.404296875, -0.373291015625, -0.34228515625, -0.311279296875, -0.2802734375, -0.249267578125, -0.21826171875, -0.187255859375, -0.15625, -0.125244140625, -0.09423828125, -0.063232421875, -0.0322265625, -0.001220703125, 0.02978515625, 0.060791015625, 0.091796875, 0.122802734375, 0.15380859375, 0.184814453125, 0.2158203125, 0.246826171875, 0.27783203125, 0.308837890625, 0.33984375, 0.370849609375, 0.40185546875, 0.432861328125, 0.4638671875, 0.494873046875, 0.52587890625, 0.556884765625, 0.587890625, 0.618896484375, 0.64990234375, 0.680908203125, 0.7119140625, 0.742919921875, 0.77392578125, 0.804931640625, 0.8359375, 0.866943359375, 0.89794921875, 0.928955078125, 0.9599609375, 0.990966796875, 1.02197265625, 1.052978515625, 1.083984375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 18.0, 10.0, 9.0, 14.0, 28.0, 39.0, 28.0, 37.0, 39.0, 65.0, 71.0, 69.0, 82.0, 74.0, 63.0, 65.0, 54.0, 52.0, 41.0, 25.0, 18.0, 17.0, 13.0, 15.0, 10.0, 5.0, 8.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.7656831741333, -10.46187686920166, -10.158071517944336, -9.854265213012695, -9.550458908081055, -9.24665355682373, -8.94284725189209, -8.639041900634766, -8.335235595703125, -8.031429290771484, -7.727623462677002, -7.4238176345825195, -7.120011806488037, -6.816205978393555, -6.512399673461914, -6.208593845367432, -5.904787540435791, -5.600981712341309, -5.297175407409668, -4.9933695793151855, -4.689563751220703, -4.3857574462890625, -4.08195161819458, -3.7781457901000977, -3.474339723587036, -3.1705336570739746, -2.866727828979492, -2.5629217624664307, -2.259115695953369, -1.9553098678588867, -1.6515038013458252, -1.3476979732513428, -1.0438919067382812, -0.7400859594345093, -0.43627995252609253, -0.13247394561767578, 0.1713320016860962, 0.47513794898986816, 0.7789440155029297, 1.082749843597412, 1.3865559101104736, 1.6903618574142456, 1.9941678047180176, 2.297973871231079, 2.6017799377441406, 2.905585765838623, 3.2093918323516846, 3.513197660446167, 3.8170037269592285, 4.120809555053711, 4.424615859985352, 4.728421688079834, 5.032227516174316, 5.336033821105957, 5.6398396492004395, 5.943645477294922, 6.2474517822265625, 6.551257610321045, 6.8550639152526855, 7.158869743347168, 7.46267557144165, 7.766481399536133, 8.070287704467773, 8.374094009399414, 8.677899360656738]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 7.0, 4.0, 5.0, 9.0, 6.0, 12.0, 13.0, 22.0, 18.0, 24.0, 21.0, 22.0, 15.0, 25.0, 23.0, 36.0, 31.0, 43.0, 35.0, 40.0, 35.0, 38.0, 44.0, 36.0, 36.0, 28.0, 55.0, 37.0, 29.0, 33.0, 27.0, 31.0, 25.0, 16.0, 21.0, 24.0, 14.0, 11.0, 12.0, 13.0, 9.0, 3.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.349158763885498, -4.21394157409668, -4.078723907470703, -3.9435067176818848, -3.8082895278930664, -3.673072099685669, -3.5378546714782715, -3.402637481689453, -3.2674200534820557, -3.132202625274658, -2.99698543548584, -2.8617680072784424, -2.726550579071045, -2.5913333892822266, -2.456115961074829, -2.3208985328674316, -2.1856813430786133, -2.050463914871216, -1.9152467250823975, -1.780029296875, -1.644811987876892, -1.5095946788787842, -1.3743772506713867, -1.2391599416732788, -1.103942632675171, -0.968725323677063, -0.8335079550743103, -0.6982905864715576, -0.5630732774734497, -0.4278559684753418, -0.2926385998725891, -0.15742123126983643, -0.02220439910888672, 0.11301293969154358, 0.24823027849197388, 0.3834476172924042, 0.5186649560928345, 0.6538822650909424, 0.7890996336936951, 0.9243170022964478, 1.0595343112945557, 1.1947516202926636, 1.3299689292907715, 1.465186357498169, 1.6004036664962769, 1.7356209754943848, 1.8708384037017822, 2.0060558319091797, 2.141273021697998, 2.2764904499053955, 2.411707639694214, 2.5469250679016113, 2.6821422576904297, 2.817359685897827, 2.9525771141052246, 3.087794303894043, 3.2230117321014404, 3.358229160308838, 3.4934463500976562, 3.6286637783050537, 3.763881206512451, 3.8990983963012695, 4.034315586090088, 4.1695332527160645, 4.304750442504883]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 13.0, 22.0, 28.0, 50.0, 72.0, 105.0, 121.0, 202.0, 337.0, 521.0, 879.0, 1443.0, 2490.0, 4282.0, 7928.0, 15558.0, 33908.0, 81267.0, 228561.0, 728995.0, 1550161.0, 1013859.0, 325197.0, 109554.0, 44286.0, 20467.0, 10206.0, 5425.0, 3163.0, 1871.0, 1117.0, 735.0, 464.0, 286.0, 197.0, 146.0, 99.0, 91.0, 42.0, 38.0, 22.0, 17.0, 14.0, 7.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.4453125, -10.1153564453125, -9.785400390625, -9.4554443359375, -9.12548828125, -8.7955322265625, -8.465576171875, -8.1356201171875, -7.8056640625, -7.4757080078125, -7.145751953125, -6.8157958984375, -6.48583984375, -6.1558837890625, -5.825927734375, -5.4959716796875, -5.166015625, -4.8360595703125, -4.506103515625, -4.1761474609375, -3.84619140625, -3.5162353515625, -3.186279296875, -2.8563232421875, -2.5263671875, -2.1964111328125, -1.866455078125, -1.5364990234375, -1.20654296875, -0.8765869140625, -0.546630859375, -0.2166748046875, 0.11328125, 0.4432373046875, 0.773193359375, 1.1031494140625, 1.43310546875, 1.7630615234375, 2.093017578125, 2.4229736328125, 2.7529296875, 3.0828857421875, 3.412841796875, 3.7427978515625, 4.07275390625, 4.4027099609375, 4.732666015625, 5.0626220703125, 5.392578125, 5.7225341796875, 6.052490234375, 6.3824462890625, 6.71240234375, 7.0423583984375, 7.372314453125, 7.7022705078125, 8.0322265625, 8.3621826171875, 8.692138671875, 9.0220947265625, 9.35205078125, 9.6820068359375, 10.011962890625, 10.3419189453125, 10.671875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 7.0, 4.0, 10.0, 7.0, 7.0, 11.0, 20.0, 12.0, 17.0, 28.0, 15.0, 32.0, 29.0, 27.0, 32.0, 38.0, 26.0, 36.0, 30.0, 40.0, 40.0, 41.0, 33.0, 52.0, 46.0, 37.0, 35.0, 23.0, 24.0, 33.0, 33.0, 26.0, 23.0, 13.0, 24.0, 22.0, 9.0, 13.0, 1.0, 10.0, 10.0, 7.0, 2.0, 5.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.04296875, -2.93548583984375, -2.8280029296875, -2.72052001953125, -2.613037109375, -2.50555419921875, -2.3980712890625, -2.29058837890625, -2.18310546875, -2.07562255859375, -1.9681396484375, -1.86065673828125, -1.753173828125, -1.64569091796875, -1.5382080078125, -1.43072509765625, -1.3232421875, -1.21575927734375, -1.1082763671875, -1.00079345703125, -0.893310546875, -0.78582763671875, -0.6783447265625, -0.57086181640625, -0.46337890625, -0.35589599609375, -0.2484130859375, -0.14093017578125, -0.033447265625, 0.07403564453125, 0.1815185546875, 0.28900146484375, 0.396484375, 0.50396728515625, 0.6114501953125, 0.71893310546875, 0.826416015625, 0.93389892578125, 1.0413818359375, 1.14886474609375, 1.25634765625, 1.36383056640625, 1.4713134765625, 1.57879638671875, 1.686279296875, 1.79376220703125, 1.9012451171875, 2.00872802734375, 2.1162109375, 2.22369384765625, 2.3311767578125, 2.43865966796875, 2.546142578125, 2.65362548828125, 2.7611083984375, 2.86859130859375, 2.97607421875, 3.08355712890625, 3.1910400390625, 3.29852294921875, 3.406005859375, 3.51348876953125, 3.6209716796875, 3.72845458984375, 3.8359375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 7.0, 10.0, 10.0, 15.0, 18.0, 38.0, 41.0, 86.0, 121.0, 223.0, 353.0, 601.0, 1019.0, 1739.0, 3123.0, 6080.0, 12285.0, 26432.0, 62563.0, 165223.0, 493509.0, 1354968.0, 1321622.0, 473941.0, 159240.0, 60519.0, 25646.0, 11702.0, 5966.0, 3082.0, 1656.0, 1001.0, 519.0, 326.0, 188.0, 147.0, 91.0, 50.0, 45.0, 30.0, 15.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.2750244140625, -10.885986328125, -10.4969482421875, -10.10791015625, -9.7188720703125, -9.329833984375, -8.9407958984375, -8.5517578125, -8.1627197265625, -7.773681640625, -7.3846435546875, -6.99560546875, -6.6065673828125, -6.217529296875, -5.8284912109375, -5.439453125, -5.0504150390625, -4.661376953125, -4.2723388671875, -3.88330078125, -3.4942626953125, -3.105224609375, -2.7161865234375, -2.3271484375, -1.9381103515625, -1.549072265625, -1.1600341796875, -0.77099609375, -0.3819580078125, 0.007080078125, 0.3961181640625, 0.78515625, 1.1741943359375, 1.563232421875, 1.9522705078125, 2.34130859375, 2.7303466796875, 3.119384765625, 3.5084228515625, 3.8974609375, 4.2864990234375, 4.675537109375, 5.0645751953125, 5.45361328125, 5.8426513671875, 6.231689453125, 6.6207275390625, 7.009765625, 7.3988037109375, 7.787841796875, 8.1768798828125, 8.56591796875, 8.9549560546875, 9.343994140625, 9.7330322265625, 10.1220703125, 10.5111083984375, 10.900146484375, 11.2891845703125, 11.67822265625, 12.0672607421875, 12.456298828125, 12.8453369140625, 13.234375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 8.0, 9.0, 17.0, 26.0, 33.0, 52.0, 66.0, 102.0, 150.0, 165.0, 212.0, 326.0, 372.0, 373.0, 401.0, 349.0, 298.0, 294.0, 218.0, 156.0, 105.0, 87.0, 60.0, 43.0, 31.0, 32.0, 11.0, 14.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.53125, -3.428070068359375, -3.32489013671875, -3.221710205078125, -3.1185302734375, -3.015350341796875, -2.91217041015625, -2.808990478515625, -2.705810546875, -2.602630615234375, -2.49945068359375, -2.396270751953125, -2.2930908203125, -2.189910888671875, -2.08673095703125, -1.983551025390625, -1.88037109375, -1.777191162109375, -1.67401123046875, -1.570831298828125, -1.4676513671875, -1.364471435546875, -1.26129150390625, -1.158111572265625, -1.054931640625, -0.951751708984375, -0.84857177734375, -0.745391845703125, -0.6422119140625, -0.539031982421875, -0.43585205078125, -0.332672119140625, -0.2294921875, -0.126312255859375, -0.02313232421875, 0.080047607421875, 0.1832275390625, 0.286407470703125, 0.38958740234375, 0.492767333984375, 0.595947265625, 0.699127197265625, 0.80230712890625, 0.905487060546875, 1.0086669921875, 1.111846923828125, 1.21502685546875, 1.318206787109375, 1.42138671875, 1.524566650390625, 1.62774658203125, 1.730926513671875, 1.8341064453125, 1.937286376953125, 2.04046630859375, 2.143646240234375, 2.246826171875, 2.350006103515625, 2.45318603515625, 2.556365966796875, 2.6595458984375, 2.762725830078125, 2.86590576171875, 2.969085693359375, 3.072265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 7.0, 6.0, 4.0, 7.0, 14.0, 11.0, 20.0, 23.0, 23.0, 28.0, 37.0, 46.0, 56.0, 62.0, 73.0, 72.0, 58.0, 61.0, 58.0, 51.0, 59.0, 44.0, 33.0, 27.0, 24.0, 19.0, 14.0, 9.0, 7.0, 13.0, 7.0, 4.0, 9.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-11.04246711730957, -10.743955612182617, -10.445443153381348, -10.146930694580078, -9.848419189453125, -9.549907684326172, -9.251395225524902, -8.952882766723633, -8.65437126159668, -8.355859756469727, -8.057347297668457, -7.758835315704346, -7.460323333740234, -7.161811351776123, -6.863299369812012, -6.5647873878479, -6.266275405883789, -5.967763423919678, -5.669251441955566, -5.370739459991455, -5.072227478027344, -4.773715496063232, -4.475203514099121, -4.17669153213501, -3.8781795501708984, -3.579667568206787, -3.281155586242676, -2.9826436042785645, -2.684131622314453, -2.385619640350342, -2.0871076583862305, -1.7885956764221191, -1.4900836944580078, -1.1915717124938965, -0.8930597305297852, -0.5945477485656738, -0.2960357666015625, 0.002476215362548828, 0.30098819732666016, 0.5995001792907715, 0.8980121612548828, 1.1965241432189941, 1.4950361251831055, 1.7935481071472168, 2.092060089111328, 2.3905720710754395, 2.689084053039551, 2.987596035003662, 3.2861080169677734, 3.5846199989318848, 3.883131980895996, 4.181643962860107, 4.480155944824219, 4.77866792678833, 5.077179908752441, 5.375691890716553, 5.674203872680664, 5.972715854644775, 6.271227836608887, 6.569739818572998, 6.868251800537109, 7.166763782501221, 7.465275764465332, 7.763787746429443, 8.062299728393555]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 7.0, 5.0, 5.0, 8.0, 17.0, 12.0, 16.0, 10.0, 21.0, 26.0, 28.0, 22.0, 27.0, 27.0, 25.0, 33.0, 31.0, 31.0, 45.0, 33.0, 49.0, 41.0, 34.0, 32.0, 30.0, 35.0, 37.0, 31.0, 31.0, 35.0, 22.0, 29.0, 26.0, 12.0, 19.0, 9.0, 7.0, 12.0, 14.0, 11.0, 11.0, 6.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.12053108215332, -3.9783573150634766, -3.836183786392212, -3.6940102577209473, -3.5518364906311035, -3.4096627235412598, -3.267489194869995, -3.1253156661987305, -2.9831418991088867, -2.840968132019043, -2.6987946033477783, -2.5566210746765137, -2.41444730758667, -2.272273540496826, -2.1301000118255615, -1.9879263639450073, -1.8457527160644531, -1.703579068183899, -1.5614054203033447, -1.4192317724227905, -1.2770581245422363, -1.1348844766616821, -0.9927108287811279, -0.8505371809005737, -0.7083635330200195, -0.5661898851394653, -0.42401623725891113, -0.28184258937835693, -0.13966894149780273, 0.002504706382751465, 0.14467835426330566, 0.28685200214385986, 0.42902517318725586, 0.5711988210678101, 0.7133724689483643, 0.8555461168289185, 0.9977197647094727, 1.1398934125900269, 1.282067060470581, 1.4242407083511353, 1.5664143562316895, 1.7085880041122437, 1.8507616519927979, 1.992935299873352, 2.1351089477539062, 2.27728271484375, 2.4194562435150146, 2.5616297721862793, 2.703803539276123, 2.845977306365967, 2.9881508350372314, 3.130324363708496, 3.27249813079834, 3.4146718978881836, 3.5568454265594482, 3.699018955230713, 3.8411927223205566, 3.9833664894104004, 4.125539779663086, 4.26771354675293, 4.409887313842773, 4.552061080932617, 4.694234848022461, 4.8364081382751465, 4.97858190536499]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 9.0, 7.0, 18.0, 24.0, 36.0, 53.0, 83.0, 89.0, 139.0, 192.0, 267.0, 380.0, 532.0, 758.0, 1022.0, 1411.0, 2089.0, 3173.0, 5040.0, 8890.0, 18373.0, 44581.0, 125231.0, 305888.0, 310496.0, 129825.0, 46363.0, 18870.0, 9142.0, 5138.0, 3155.0, 2136.0, 1454.0, 1000.0, 800.0, 534.0, 394.0, 293.0, 199.0, 141.0, 88.0, 86.0, 50.0, 35.0, 18.0, 17.0, 11.0, 9.0, 7.0, 4.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7572021484375, -7.498779296875, -7.2403564453125, -6.98193359375, -6.7235107421875, -6.465087890625, -6.2066650390625, -5.9482421875, -5.6898193359375, -5.431396484375, -5.1729736328125, -4.91455078125, -4.6561279296875, -4.397705078125, -4.1392822265625, -3.880859375, -3.6224365234375, -3.364013671875, -3.1055908203125, -2.84716796875, -2.5887451171875, -2.330322265625, -2.0718994140625, -1.8134765625, -1.5550537109375, -1.296630859375, -1.0382080078125, -0.77978515625, -0.5213623046875, -0.262939453125, -0.0045166015625, 0.25390625, 0.5123291015625, 0.770751953125, 1.0291748046875, 1.28759765625, 1.5460205078125, 1.804443359375, 2.0628662109375, 2.3212890625, 2.5797119140625, 2.838134765625, 3.0965576171875, 3.35498046875, 3.6134033203125, 3.871826171875, 4.1302490234375, 4.388671875, 4.6470947265625, 4.905517578125, 5.1639404296875, 5.42236328125, 5.6807861328125, 5.939208984375, 6.1976318359375, 6.4560546875, 6.7144775390625, 6.972900390625, 7.2313232421875, 7.48974609375, 7.7481689453125, 8.006591796875, 8.2650146484375, 8.5234375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 8.0, 8.0, 11.0, 17.0, 11.0, 23.0, 9.0, 19.0, 17.0, 20.0, 19.0, 29.0, 27.0, 36.0, 27.0, 38.0, 43.0, 31.0, 43.0, 34.0, 41.0, 36.0, 43.0, 39.0, 32.0, 38.0, 30.0, 32.0, 21.0, 20.0, 21.0, 21.0, 22.0, 18.0, 12.0, 13.0, 6.0, 14.0, 8.0, 8.0, 11.0, 8.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.46875, -4.31982421875, -4.1708984375, -4.02197265625, -3.873046875, -3.72412109375, -3.5751953125, -3.42626953125, -3.27734375, -3.12841796875, -2.9794921875, -2.83056640625, -2.681640625, -2.53271484375, -2.3837890625, -2.23486328125, -2.0859375, -1.93701171875, -1.7880859375, -1.63916015625, -1.490234375, -1.34130859375, -1.1923828125, -1.04345703125, -0.89453125, -0.74560546875, -0.5966796875, -0.44775390625, -0.298828125, -0.14990234375, -0.0009765625, 0.14794921875, 0.296875, 0.44580078125, 0.5947265625, 0.74365234375, 0.892578125, 1.04150390625, 1.1904296875, 1.33935546875, 1.48828125, 1.63720703125, 1.7861328125, 1.93505859375, 2.083984375, 2.23291015625, 2.3818359375, 2.53076171875, 2.6796875, 2.82861328125, 2.9775390625, 3.12646484375, 3.275390625, 3.42431640625, 3.5732421875, 3.72216796875, 3.87109375, 4.02001953125, 4.1689453125, 4.31787109375, 4.466796875, 4.61572265625, 4.7646484375, 4.91357421875, 5.0625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 5.0, 5.0, 1.0, 10.0, 5.0, 15.0, 16.0, 13.0, 25.0, 40.0, 41.0, 43.0, 84.0, 92.0, 152.0, 189.0, 214.0, 339.0, 502.0, 666.0, 1054.0, 1596.0, 2529.0, 4470.0, 9387.0, 27697.0, 142486.0, 592533.0, 204035.0, 35816.0, 11126.0, 4987.0, 2817.0, 1754.0, 1123.0, 757.0, 572.0, 352.0, 232.0, 200.0, 139.0, 98.0, 74.0, 54.0, 54.0, 46.0, 29.0, 19.0, 19.0, 14.0, 3.0, 9.0, 4.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.7109375, -15.1973876953125, -14.683837890625, -14.1702880859375, -13.65673828125, -13.1431884765625, -12.629638671875, -12.1160888671875, -11.6025390625, -11.0889892578125, -10.575439453125, -10.0618896484375, -9.54833984375, -9.0347900390625, -8.521240234375, -8.0076904296875, -7.494140625, -6.9805908203125, -6.467041015625, -5.9534912109375, -5.43994140625, -4.9263916015625, -4.412841796875, -3.8992919921875, -3.3857421875, -2.8721923828125, -2.358642578125, -1.8450927734375, -1.33154296875, -0.8179931640625, -0.304443359375, 0.2091064453125, 0.72265625, 1.2362060546875, 1.749755859375, 2.2633056640625, 2.77685546875, 3.2904052734375, 3.803955078125, 4.3175048828125, 4.8310546875, 5.3446044921875, 5.858154296875, 6.3717041015625, 6.88525390625, 7.3988037109375, 7.912353515625, 8.4259033203125, 8.939453125, 9.4530029296875, 9.966552734375, 10.4801025390625, 10.99365234375, 11.5072021484375, 12.020751953125, 12.5343017578125, 13.0478515625, 13.5614013671875, 14.074951171875, 14.5885009765625, 15.10205078125, 15.6156005859375, 16.129150390625, 16.6427001953125, 17.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 8.0, 13.0, 20.0, 21.0, 19.0, 24.0, 24.0, 34.0, 43.0, 41.0, 38.0, 37.0, 43.0, 42.0, 41.0, 63.0, 46.0, 50.0, 41.0, 44.0, 21.0, 26.0, 31.0, 28.0, 33.0, 28.0, 13.0, 17.0, 13.0, 15.0, 11.0, 8.0, 7.0, 8.0, 3.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.05029296875, -2.9404296875, -2.83056640625, -2.720703125, -2.61083984375, -2.5009765625, -2.39111328125, -2.28125, -2.17138671875, -2.0615234375, -1.95166015625, -1.841796875, -1.73193359375, -1.6220703125, -1.51220703125, -1.40234375, -1.29248046875, -1.1826171875, -1.07275390625, -0.962890625, -0.85302734375, -0.7431640625, -0.63330078125, -0.5234375, -0.41357421875, -0.3037109375, -0.19384765625, -0.083984375, 0.02587890625, 0.1357421875, 0.24560546875, 0.35546875, 0.46533203125, 0.5751953125, 0.68505859375, 0.794921875, 0.90478515625, 1.0146484375, 1.12451171875, 1.234375, 1.34423828125, 1.4541015625, 1.56396484375, 1.673828125, 1.78369140625, 1.8935546875, 2.00341796875, 2.11328125, 2.22314453125, 2.3330078125, 2.44287109375, 2.552734375, 2.66259765625, 2.7724609375, 2.88232421875, 2.9921875, 3.10205078125, 3.2119140625, 3.32177734375, 3.431640625, 3.54150390625, 3.6513671875, 3.76123046875, 3.87109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 20.0, 24.0, 27.0, 50.0, 66.0, 115.0, 143.0, 223.0, 368.0, 623.0, 945.0, 1765.0, 3283.0, 7119.0, 21467.0, 132031.0, 684311.0, 156224.0, 23970.0, 7701.0, 3448.0, 1857.0, 1013.0, 654.0, 402.0, 226.0, 153.0, 96.0, 71.0, 46.0, 37.0, 17.0, 9.0, 9.0, 12.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5843505859375, -8.293701171875, -8.0030517578125, -7.71240234375, -7.4217529296875, -7.131103515625, -6.8404541015625, -6.5498046875, -6.2591552734375, -5.968505859375, -5.6778564453125, -5.38720703125, -5.0965576171875, -4.805908203125, -4.5152587890625, -4.224609375, -3.9339599609375, -3.643310546875, -3.3526611328125, -3.06201171875, -2.7713623046875, -2.480712890625, -2.1900634765625, -1.8994140625, -1.6087646484375, -1.318115234375, -1.0274658203125, -0.73681640625, -0.4461669921875, -0.155517578125, 0.1351318359375, 0.42578125, 0.7164306640625, 1.007080078125, 1.2977294921875, 1.58837890625, 1.8790283203125, 2.169677734375, 2.4603271484375, 2.7509765625, 3.0416259765625, 3.332275390625, 3.6229248046875, 3.91357421875, 4.2042236328125, 4.494873046875, 4.7855224609375, 5.076171875, 5.3668212890625, 5.657470703125, 5.9481201171875, 6.23876953125, 6.5294189453125, 6.820068359375, 7.1107177734375, 7.4013671875, 7.6920166015625, 7.982666015625, 8.2733154296875, 8.56396484375, 8.8546142578125, 9.145263671875, 9.4359130859375, 9.7265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 7.0, 19.0, 33.0, 33.0, 96.0, 184.0, 197.0, 180.0, 100.0, 55.0, 24.0, 19.0, 11.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003955364227294922, -0.0003840737044811249, -0.00037261098623275757, -0.00036114826798439026, -0.00034968554973602295, -0.00033822283148765564, -0.00032676011323928833, -0.000315297394990921, -0.0003038346767425537, -0.0002923719584941864, -0.0002809092402458191, -0.0002694465219974518, -0.00025798380374908447, -0.00024652108550071716, -0.00023505836725234985, -0.00022359564900398254, -0.00021213293075561523, -0.00020067021250724792, -0.00018920749425888062, -0.0001777447760105133, -0.000166282057762146, -0.0001548193395137787, -0.00014335662126541138, -0.00013189390301704407, -0.00012043118476867676, -0.00010896846652030945, -9.750574827194214e-05, -8.604303002357483e-05, -7.458031177520752e-05, -6.311759352684021e-05, -5.16548752784729e-05, -4.019215703010559e-05, -2.872943878173828e-05, -1.726672053337097e-05, -5.804002285003662e-06, 5.6587159633636475e-06, 1.7121434211730957e-05, 2.8584152460098267e-05, 4.0046870708465576e-05, 5.1509588956832886e-05, 6.29723072052002e-05, 7.44350254535675e-05, 8.589774370193481e-05, 9.736046195030212e-05, 0.00010882318019866943, 0.00012028589844703674, 0.00013174861669540405, 0.00014321133494377136, 0.00015467405319213867, 0.00016613677144050598, 0.0001775994896888733, 0.0001890622079372406, 0.0002005249261856079, 0.00021198764443397522, 0.00022345036268234253, 0.00023491308093070984, 0.00024637579917907715, 0.00025783851742744446, 0.00026930123567581177, 0.0002807639539241791, 0.0002922266721725464, 0.0003036893904209137, 0.000315152108669281, 0.0003266148269176483, 0.0003380775451660156]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 8.0, 10.0, 23.0, 24.0, 26.0, 50.0, 76.0, 118.0, 136.0, 196.0, 242.0, 355.0, 520.0, 679.0, 989.0, 1353.0, 1937.0, 2724.0, 4121.0, 6652.0, 12024.0, 30582.0, 112937.0, 389828.0, 338368.0, 89586.0, 25482.0, 10583.0, 5998.0, 3940.0, 2586.0, 1783.0, 1318.0, 945.0, 686.0, 453.0, 336.0, 240.0, 171.0, 142.0, 94.0, 73.0, 58.0, 34.0, 25.0, 8.0, 11.0, 10.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.90838623046875, -4.7386474609375, -4.56890869140625, -4.399169921875, -4.22943115234375, -4.0596923828125, -3.88995361328125, -3.72021484375, -3.55047607421875, -3.3807373046875, -3.21099853515625, -3.041259765625, -2.87152099609375, -2.7017822265625, -2.53204345703125, -2.3623046875, -2.19256591796875, -2.0228271484375, -1.85308837890625, -1.683349609375, -1.51361083984375, -1.3438720703125, -1.17413330078125, -1.00439453125, -0.83465576171875, -0.6649169921875, -0.49517822265625, -0.325439453125, -0.15570068359375, 0.0140380859375, 0.18377685546875, 0.353515625, 0.52325439453125, 0.6929931640625, 0.86273193359375, 1.032470703125, 1.20220947265625, 1.3719482421875, 1.54168701171875, 1.71142578125, 1.88116455078125, 2.0509033203125, 2.22064208984375, 2.390380859375, 2.56011962890625, 2.7298583984375, 2.89959716796875, 3.0693359375, 3.23907470703125, 3.4088134765625, 3.57855224609375, 3.748291015625, 3.91802978515625, 4.0877685546875, 4.25750732421875, 4.42724609375, 4.59698486328125, 4.7667236328125, 4.93646240234375, 5.106201171875, 5.27593994140625, 5.4456787109375, 5.61541748046875, 5.78515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 8.0, 12.0, 34.0, 51.0, 98.0, 182.0, 218.0, 168.0, 109.0, 47.0, 26.0, 10.0, 5.0, 1.0, 8.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.470703125, -2.39874267578125, -2.3267822265625, -2.25482177734375, -2.182861328125, -2.11090087890625, -2.0389404296875, -1.96697998046875, -1.89501953125, -1.82305908203125, -1.7510986328125, -1.67913818359375, -1.607177734375, -1.53521728515625, -1.4632568359375, -1.39129638671875, -1.3193359375, -1.24737548828125, -1.1754150390625, -1.10345458984375, -1.031494140625, -0.95953369140625, -0.8875732421875, -0.81561279296875, -0.74365234375, -0.67169189453125, -0.5997314453125, -0.52777099609375, -0.455810546875, -0.38385009765625, -0.3118896484375, -0.23992919921875, -0.16796875, -0.09600830078125, -0.0240478515625, 0.04791259765625, 0.119873046875, 0.19183349609375, 0.2637939453125, 0.33575439453125, 0.40771484375, 0.47967529296875, 0.5516357421875, 0.62359619140625, 0.695556640625, 0.76751708984375, 0.8394775390625, 0.91143798828125, 0.9833984375, 1.05535888671875, 1.1273193359375, 1.19927978515625, 1.271240234375, 1.34320068359375, 1.4151611328125, 1.48712158203125, 1.55908203125, 1.63104248046875, 1.7030029296875, 1.77496337890625, 1.846923828125, 1.91888427734375, 1.9908447265625, 2.06280517578125, 2.134765625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 7.0, 9.0, 11.0, 11.0, 16.0, 21.0, 31.0, 35.0, 47.0, 33.0, 62.0, 72.0, 61.0, 65.0, 65.0, 62.0, 63.0, 51.0, 52.0, 43.0, 28.0, 31.0, 22.0, 16.0, 16.0, 13.0, 6.0, 11.0, 8.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.459746360778809, -11.157273292541504, -10.8548002243042, -10.552327156066895, -10.24985408782959, -9.947381019592285, -9.64490795135498, -9.34243392944336, -9.039960861206055, -8.73748779296875, -8.435014724731445, -8.13254165649414, -7.830068588256836, -7.527595520019531, -7.225121974945068, -6.922648906707764, -6.620176315307617, -6.3177032470703125, -6.015230178833008, -5.712757110595703, -5.410284042358398, -5.107810974121094, -4.805337429046631, -4.502864360809326, -4.2003912925720215, -3.897918224334717, -3.595445156097412, -3.2929718494415283, -2.9904987812042236, -2.688025712966919, -2.385552406311035, -2.0830793380737305, -1.7806062698364258, -1.478133201599121, -1.1756600141525269, -0.8731868863105774, -0.5707137584686279, -0.26824069023132324, 0.034232497215270996, 0.33670568466186523, 0.6391787528991699, 0.9416518807411194, 1.2441250085830688, 1.546598196029663, 1.8490712642669678, 2.1515443325042725, 2.4540176391601562, 2.756490707397461, 3.0589637756347656, 3.3614368438720703, 3.663909912109375, 3.966383218765259, 4.268856048583984, 4.571329116821289, 4.873802661895752, 5.176275730133057, 5.478748798370361, 5.781221866607666, 6.083694934844971, 6.386168003082275, 6.688641548156738, 6.991114616394043, 7.293587684631348, 7.596060752868652, 7.898533821105957]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 13.0, 10.0, 10.0, 16.0, 19.0, 22.0, 11.0, 20.0, 31.0, 20.0, 31.0, 28.0, 33.0, 34.0, 40.0, 35.0, 36.0, 41.0, 39.0, 37.0, 32.0, 38.0, 36.0, 35.0, 35.0, 29.0, 29.0, 27.0, 22.0, 28.0, 19.0, 4.0, 14.0, 17.0, 10.0, 12.0, 10.0, 6.0, 13.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.127529144287109, -3.9859135150909424, -3.8442978858947754, -3.7026822566986084, -3.5610666275024414, -3.4194507598876953, -3.2778351306915283, -3.1362195014953613, -2.9946038722991943, -2.8529882431030273, -2.7113726139068604, -2.5697569847106934, -2.4281411170959473, -2.2865257263183594, -2.1449098587036133, -2.0032942295074463, -1.8616786003112793, -1.7200629711151123, -1.5784473419189453, -1.4368315935134888, -1.2952159643173218, -1.1536003351211548, -1.0119845867156982, -0.8703689575195312, -0.7287533283233643, -0.5871376991271973, -0.4455220103263855, -0.3039063513278961, -0.16229069232940674, -0.020675063133239746, 0.12094062566757202, 0.2625563144683838, 0.4041719436645508, 0.5457875728607178, 0.6874032616615295, 0.8290189504623413, 0.9706345796585083, 1.1122502088546753, 1.2538659572601318, 1.3954815864562988, 1.5370972156524658, 1.6787128448486328, 1.8203284740447998, 1.9619442224502563, 2.103559970855713, 2.245175361633301, 2.386791229248047, 2.528406858444214, 2.670022487640381, 2.811638116836548, 2.953253746032715, 3.094869375228882, 3.236485004425049, 3.378100872039795, 3.519716501235962, 3.661332130432129, 3.802947759628296, 3.944563388824463, 4.086179256439209, 4.227794647216797, 4.369410514831543, 4.511025905609131, 4.652641773223877, 4.794257164001465, 4.935873031616211]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 7.0, 5.0, 5.0, 9.0, 15.0, 28.0, 34.0, 43.0, 68.0, 110.0, 153.0, 204.0, 324.0, 438.0, 688.0, 1030.0, 1446.0, 2189.0, 3354.0, 4971.0, 7623.0, 11518.0, 17342.0, 25651.0, 39182.0, 56587.0, 79743.0, 105166.0, 124651.0, 131070.0, 118931.0, 95638.0, 70821.0, 49390.0, 33494.0, 22409.0, 15019.0, 9668.0, 6517.0, 4328.0, 2851.0, 1927.0, 1265.0, 851.0, 599.0, 370.0, 263.0, 169.0, 127.0, 95.0, 59.0, 45.0, 26.0, 17.0, 11.0, 5.0, 9.0, 2.0, 2.0, 6.0, 3.0], "bins": [-3.70703125, -3.592315673828125, -3.47760009765625, -3.362884521484375, -3.2481689453125, -3.133453369140625, -3.01873779296875, -2.904022216796875, -2.789306640625, -2.674591064453125, -2.55987548828125, -2.445159912109375, -2.3304443359375, -2.215728759765625, -2.10101318359375, -1.986297607421875, -1.87158203125, -1.756866455078125, -1.64215087890625, -1.527435302734375, -1.4127197265625, -1.298004150390625, -1.18328857421875, -1.068572998046875, -0.953857421875, -0.839141845703125, -0.72442626953125, -0.609710693359375, -0.4949951171875, -0.380279541015625, -0.26556396484375, -0.150848388671875, -0.0361328125, 0.078582763671875, 0.19329833984375, 0.308013916015625, 0.4227294921875, 0.537445068359375, 0.65216064453125, 0.766876220703125, 0.881591796875, 0.996307373046875, 1.11102294921875, 1.225738525390625, 1.3404541015625, 1.455169677734375, 1.56988525390625, 1.684600830078125, 1.79931640625, 1.914031982421875, 2.02874755859375, 2.143463134765625, 2.2581787109375, 2.372894287109375, 2.48760986328125, 2.602325439453125, 2.717041015625, 2.831756591796875, 2.94647216796875, 3.061187744140625, 3.1759033203125, 3.290618896484375, 3.40533447265625, 3.520050048828125, 3.634765625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 6.0, 6.0, 5.0, 10.0, 10.0, 11.0, 6.0, 17.0, 15.0, 17.0, 18.0, 24.0, 24.0, 35.0, 29.0, 22.0, 25.0, 38.0, 31.0, 33.0, 35.0, 33.0, 42.0, 45.0, 39.0, 37.0, 30.0, 36.0, 33.0, 33.0, 30.0, 25.0, 30.0, 20.0, 21.0, 23.0, 14.0, 11.0, 10.0, 15.0, 15.0, 12.0, 4.0, 2.0, 6.0, 5.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.703125, -4.5562744140625, -4.409423828125, -4.2625732421875, -4.11572265625, -3.9688720703125, -3.822021484375, -3.6751708984375, -3.5283203125, -3.3814697265625, -3.234619140625, -3.0877685546875, -2.94091796875, -2.7940673828125, -2.647216796875, -2.5003662109375, -2.353515625, -2.2066650390625, -2.059814453125, -1.9129638671875, -1.76611328125, -1.6192626953125, -1.472412109375, -1.3255615234375, -1.1787109375, -1.0318603515625, -0.885009765625, -0.7381591796875, -0.59130859375, -0.4444580078125, -0.297607421875, -0.1507568359375, -0.00390625, 0.1429443359375, 0.289794921875, 0.4366455078125, 0.58349609375, 0.7303466796875, 0.877197265625, 1.0240478515625, 1.1708984375, 1.3177490234375, 1.464599609375, 1.6114501953125, 1.75830078125, 1.9051513671875, 2.052001953125, 2.1988525390625, 2.345703125, 2.4925537109375, 2.639404296875, 2.7862548828125, 2.93310546875, 3.0799560546875, 3.226806640625, 3.3736572265625, 3.5205078125, 3.6673583984375, 3.814208984375, 3.9610595703125, 4.10791015625, 4.2547607421875, 4.401611328125, 4.5484619140625, 4.6953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 15.0, 17.0, 19.0, 24.0, 38.0, 68.0, 104.0, 178.0, 249.0, 397.0, 636.0, 1032.0, 1641.0, 2582.0, 4343.0, 7181.0, 11866.0, 19511.0, 32107.0, 51225.0, 77341.0, 110496.0, 139200.0, 149424.0, 135652.0, 105425.0, 73314.0, 47862.0, 29982.0, 18180.0, 11211.0, 6717.0, 3943.0, 2491.0, 1477.0, 994.0, 588.0, 389.0, 233.0, 137.0, 91.0, 51.0, 35.0, 29.0, 25.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.07421875, -3.944580078125, -3.81494140625, -3.685302734375, -3.5556640625, -3.426025390625, -3.29638671875, -3.166748046875, -3.037109375, -2.907470703125, -2.77783203125, -2.648193359375, -2.5185546875, -2.388916015625, -2.25927734375, -2.129638671875, -2.0, -1.870361328125, -1.74072265625, -1.611083984375, -1.4814453125, -1.351806640625, -1.22216796875, -1.092529296875, -0.962890625, -0.833251953125, -0.70361328125, -0.573974609375, -0.4443359375, -0.314697265625, -0.18505859375, -0.055419921875, 0.07421875, 0.203857421875, 0.33349609375, 0.463134765625, 0.5927734375, 0.722412109375, 0.85205078125, 0.981689453125, 1.111328125, 1.240966796875, 1.37060546875, 1.500244140625, 1.6298828125, 1.759521484375, 1.88916015625, 2.018798828125, 2.1484375, 2.278076171875, 2.40771484375, 2.537353515625, 2.6669921875, 2.796630859375, 2.92626953125, 3.055908203125, 3.185546875, 3.315185546875, 3.44482421875, 3.574462890625, 3.7041015625, 3.833740234375, 3.96337890625, 4.093017578125, 4.22265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 10.0, 6.0, 7.0, 7.0, 6.0, 8.0, 14.0, 11.0, 16.0, 20.0, 19.0, 16.0, 26.0, 31.0, 25.0, 38.0, 43.0, 26.0, 37.0, 43.0, 35.0, 31.0, 45.0, 37.0, 39.0, 37.0, 44.0, 41.0, 27.0, 34.0, 27.0, 27.0, 23.0, 25.0, 16.0, 20.0, 18.0, 9.0, 13.0, 13.0, 5.0, 8.0, 2.0, 3.0, 8.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.81121826171875, -2.7181396484375, -2.62506103515625, -2.531982421875, -2.43890380859375, -2.3458251953125, -2.25274658203125, -2.15966796875, -2.06658935546875, -1.9735107421875, -1.88043212890625, -1.787353515625, -1.69427490234375, -1.6011962890625, -1.50811767578125, -1.4150390625, -1.32196044921875, -1.2288818359375, -1.13580322265625, -1.042724609375, -0.94964599609375, -0.8565673828125, -0.76348876953125, -0.67041015625, -0.57733154296875, -0.4842529296875, -0.39117431640625, -0.298095703125, -0.20501708984375, -0.1119384765625, -0.01885986328125, 0.07421875, 0.16729736328125, 0.2603759765625, 0.35345458984375, 0.446533203125, 0.53961181640625, 0.6326904296875, 0.72576904296875, 0.81884765625, 0.91192626953125, 1.0050048828125, 1.09808349609375, 1.191162109375, 1.28424072265625, 1.3773193359375, 1.47039794921875, 1.5634765625, 1.65655517578125, 1.7496337890625, 1.84271240234375, 1.935791015625, 2.02886962890625, 2.1219482421875, 2.21502685546875, 2.30810546875, 2.40118408203125, 2.4942626953125, 2.58734130859375, 2.680419921875, 2.77349853515625, 2.8665771484375, 2.95965576171875, 3.052734375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 7.0, 11.0, 30.0, 47.0, 52.0, 92.0, 111.0, 178.0, 249.0, 396.0, 575.0, 713.0, 1153.0, 1653.0, 2634.0, 3936.0, 6247.0, 9623.0, 15302.0, 24329.0, 37628.0, 59204.0, 87422.0, 120513.0, 145552.0, 146154.0, 123147.0, 91426.0, 60774.0, 39585.0, 25228.0, 15828.0, 9931.0, 6338.0, 4145.0, 2764.0, 1816.0, 1295.0, 770.0, 513.0, 363.0, 239.0, 186.0, 130.0, 73.0, 60.0, 36.0, 23.0, 18.0, 18.0, 10.0, 8.0, 4.0, 4.0, 6.0], "bins": [-1.8779296875, -1.8227691650390625, -1.767608642578125, -1.7124481201171875, -1.65728759765625, -1.6021270751953125, -1.546966552734375, -1.4918060302734375, -1.4366455078125, -1.3814849853515625, -1.326324462890625, -1.2711639404296875, -1.21600341796875, -1.1608428955078125, -1.105682373046875, -1.0505218505859375, -0.995361328125, -0.9402008056640625, -0.885040283203125, -0.8298797607421875, -0.77471923828125, -0.7195587158203125, -0.664398193359375, -0.6092376708984375, -0.5540771484375, -0.4989166259765625, -0.443756103515625, -0.3885955810546875, -0.33343505859375, -0.2782745361328125, -0.223114013671875, -0.1679534912109375, -0.11279296875, -0.0576324462890625, -0.002471923828125, 0.0526885986328125, 0.10784912109375, 0.1630096435546875, 0.218170166015625, 0.2733306884765625, 0.3284912109375, 0.3836517333984375, 0.438812255859375, 0.4939727783203125, 0.54913330078125, 0.6042938232421875, 0.659454345703125, 0.7146148681640625, 0.769775390625, 0.8249359130859375, 0.880096435546875, 0.9352569580078125, 0.99041748046875, 1.0455780029296875, 1.100738525390625, 1.1558990478515625, 1.2110595703125, 1.2662200927734375, 1.321380615234375, 1.3765411376953125, 1.43170166015625, 1.4868621826171875, 1.542022705078125, 1.5971832275390625, 1.65234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 4.0, 13.0, 16.0, 17.0, 20.0, 27.0, 38.0, 59.0, 43.0, 64.0, 60.0, 69.0, 59.0, 69.0, 72.0, 67.0, 63.0, 45.0, 31.0, 40.0, 24.0, 22.0, 14.0, 15.0, 4.0, 4.0, 7.0, 1.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002636909484863281, -0.0002558566629886627, -0.0002480223774909973, -0.0002401880919933319, -0.0002323538064956665, -0.0002245195209980011, -0.0002166852355003357, -0.0002088509500026703, -0.00020101666450500488, -0.00019318237900733948, -0.00018534809350967407, -0.00017751380801200867, -0.00016967952251434326, -0.00016184523701667786, -0.00015401095151901245, -0.00014617666602134705, -0.00013834238052368164, -0.00013050809502601624, -0.00012267380952835083, -0.00011483952403068542, -0.00010700523853302002, -9.917095303535461e-05, -9.133666753768921e-05, -8.35023820400238e-05, -7.56680965423584e-05, -6.783381104469299e-05, -5.999952554702759e-05, -5.216524004936218e-05, -4.433095455169678e-05, -3.649666905403137e-05, -2.8662383556365967e-05, -2.082809805870056e-05, -1.2993812561035156e-05, -5.159527063369751e-06, 2.6747584342956543e-06, 1.050904393196106e-05, 1.8343329429626465e-05, 2.617761492729187e-05, 3.4011900424957275e-05, 4.184618592262268e-05, 4.9680471420288086e-05, 5.751475691795349e-05, 6.53490424156189e-05, 7.31833279132843e-05, 8.101761341094971e-05, 8.885189890861511e-05, 9.668618440628052e-05, 0.00010452046990394592, 0.00011235475540161133, 0.00012018904089927673, 0.00012802332639694214, 0.00013585761189460754, 0.00014369189739227295, 0.00015152618288993835, 0.00015936046838760376, 0.00016719475388526917, 0.00017502903938293457, 0.00018286332488059998, 0.00019069761037826538, 0.00019853189587593079, 0.0002063661813735962, 0.0002142004668712616, 0.000222034752368927, 0.0002298690378665924, 0.0002377033233642578]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 5.0, 15.0, 22.0, 28.0, 48.0, 77.0, 110.0, 167.0, 247.0, 427.0, 686.0, 1109.0, 1801.0, 3073.0, 5190.0, 8687.0, 14677.0, 25126.0, 42016.0, 68137.0, 104042.0, 140922.0, 161970.0, 151190.0, 116499.0, 79629.0, 49198.0, 29907.0, 17594.0, 10302.0, 6296.0, 3647.0, 2201.0, 1321.0, 806.0, 546.0, 307.0, 165.0, 145.0, 68.0, 57.0, 39.0, 20.0, 12.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.046722412109375, -1.98406982421875, -1.921417236328125, -1.8587646484375, -1.796112060546875, -1.73345947265625, -1.670806884765625, -1.608154296875, -1.545501708984375, -1.48284912109375, -1.420196533203125, -1.3575439453125, -1.294891357421875, -1.23223876953125, -1.169586181640625, -1.10693359375, -1.044281005859375, -0.98162841796875, -0.918975830078125, -0.8563232421875, -0.793670654296875, -0.73101806640625, -0.668365478515625, -0.605712890625, -0.543060302734375, -0.48040771484375, -0.417755126953125, -0.3551025390625, -0.292449951171875, -0.22979736328125, -0.167144775390625, -0.1044921875, -0.041839599609375, 0.02081298828125, 0.083465576171875, 0.1461181640625, 0.208770751953125, 0.27142333984375, 0.334075927734375, 0.396728515625, 0.459381103515625, 0.52203369140625, 0.584686279296875, 0.6473388671875, 0.709991455078125, 0.77264404296875, 0.835296630859375, 0.89794921875, 0.960601806640625, 1.02325439453125, 1.085906982421875, 1.1485595703125, 1.211212158203125, 1.27386474609375, 1.336517333984375, 1.399169921875, 1.461822509765625, 1.52447509765625, 1.587127685546875, 1.6497802734375, 1.712432861328125, 1.77508544921875, 1.837738037109375, 1.900390625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 7.0, 10.0, 7.0, 10.0, 15.0, 17.0, 16.0, 29.0, 33.0, 28.0, 34.0, 48.0, 37.0, 48.0, 42.0, 56.0, 52.0, 44.0, 42.0, 52.0, 44.0, 27.0, 37.0, 45.0, 32.0, 38.0, 20.0, 18.0, 18.0, 20.0, 7.0, 13.0, 14.0, 6.0, 3.0, 5.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.6943359375, -0.6751480102539062, -0.6559600830078125, -0.6367721557617188, -0.617584228515625, -0.5983963012695312, -0.5792083740234375, -0.5600204467773438, -0.54083251953125, -0.5216445922851562, -0.5024566650390625, -0.48326873779296875, -0.464080810546875, -0.44489288330078125, -0.4257049560546875, -0.40651702880859375, -0.3873291015625, -0.36814117431640625, -0.3489532470703125, -0.32976531982421875, -0.310577392578125, -0.29138946533203125, -0.2722015380859375, -0.25301361083984375, -0.23382568359375, -0.21463775634765625, -0.1954498291015625, -0.17626190185546875, -0.157073974609375, -0.13788604736328125, -0.1186981201171875, -0.09951019287109375, -0.080322265625, -0.06113433837890625, -0.0419464111328125, -0.02275848388671875, -0.003570556640625, 0.01561737060546875, 0.0348052978515625, 0.05399322509765625, 0.07318115234375, 0.09236907958984375, 0.1115570068359375, 0.13074493408203125, 0.149932861328125, 0.16912078857421875, 0.1883087158203125, 0.20749664306640625, 0.2266845703125, 0.24587249755859375, 0.2650604248046875, 0.28424835205078125, 0.303436279296875, 0.32262420654296875, 0.3418121337890625, 0.36100006103515625, 0.38018798828125, 0.39937591552734375, 0.4185638427734375, 0.43775177001953125, 0.456939697265625, 0.47612762451171875, 0.4953155517578125, 0.5145034790039062, 0.53369140625]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 3.0, 10.0, 10.0, 11.0, 12.0, 14.0, 26.0, 20.0, 29.0, 38.0, 32.0, 63.0, 67.0, 60.0, 62.0, 67.0, 55.0, 56.0, 62.0, 71.0, 45.0, 27.0, 31.0, 26.0, 21.0, 16.0, 10.0, 10.0, 13.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.933524131774902, -10.64033031463623, -10.347137451171875, -10.053943634033203, -9.760749816894531, -9.46755599975586, -9.174363136291504, -8.881169319152832, -8.58797550201416, -8.294781684875488, -8.001588821411133, -7.708395004272461, -7.415201187133789, -7.122007846832275, -6.828814506530762, -6.53562068939209, -6.242427349090576, -5.9492340087890625, -5.656040191650391, -5.362846851348877, -5.069653034210205, -4.776459693908691, -4.4832658767700195, -4.190072536468506, -3.896878957748413, -3.6036853790283203, -3.3104918003082275, -3.0172982215881348, -2.724104881286621, -2.430911064147949, -2.1377177238464355, -1.8445241451263428, -1.5513310432434082, -1.2581374645233154, -0.9649439454078674, -0.6717504262924194, -0.37855684757232666, -0.08536326885223389, 0.20783019065856934, 0.5010237693786621, 0.7942173480987549, 1.0874109268188477, 1.3806045055389404, 1.6737979650497437, 1.9669915437698364, 2.2601852416992188, 2.5533785820007324, 2.846572160720825, 3.139765739440918, 3.4329593181610107, 3.7261528968811035, 4.019346237182617, 4.312540054321289, 4.605733394622803, 4.898926734924316, 5.192120552062988, 5.48531436920166, 5.778507709503174, 6.071701526641846, 6.364894866943359, 6.658088684082031, 6.951282024383545, 7.244475364685059, 7.5376691818237305, 7.830862522125244]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 3.0, 12.0, 3.0, 13.0, 11.0, 13.0, 8.0, 19.0, 17.0, 18.0, 24.0, 22.0, 30.0, 36.0, 34.0, 28.0, 35.0, 51.0, 38.0, 35.0, 29.0, 38.0, 42.0, 42.0, 41.0, 42.0, 40.0, 22.0, 36.0, 33.0, 29.0, 26.0, 22.0, 23.0, 18.0, 6.0, 8.0, 9.0, 9.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.408603191375732, -5.249632358551025, -5.09066104888916, -4.931690216064453, -4.772719383239746, -4.613748550415039, -4.454777717590332, -4.295806407928467, -4.13683557510376, -3.9778647422790527, -3.8188936710357666, -3.6599225997924805, -3.5009517669677734, -3.3419809341430664, -3.1830098628997803, -3.024038791656494, -2.865067958831787, -2.70609712600708, -2.547126054763794, -2.388154983520508, -2.229184150695801, -2.0702133178710938, -1.9112422466278076, -1.752271294593811, -1.5933003425598145, -1.4343293905258179, -1.2753584384918213, -1.1163874864578247, -0.9574165344238281, -0.7984455823898315, -0.639474630355835, -0.4805036783218384, -0.321533203125, -0.16256225109100342, -0.003591299057006836, 0.15537965297698975, 0.31435060501098633, 0.4733215570449829, 0.6322925090789795, 0.7912634611129761, 0.9502344131469727, 1.1092053651809692, 1.2681763172149658, 1.4271472692489624, 1.586118221282959, 1.7450891733169556, 1.9040601253509521, 2.0630311965942383, 2.2220020294189453, 2.3809728622436523, 2.5399439334869385, 2.6989150047302246, 2.8578858375549316, 3.0168566703796387, 3.175827741622925, 3.334798812866211, 3.493769645690918, 3.652740478515625, 3.811711549758911, 3.9706826210021973, 4.129653453826904, 4.288624286651611, 4.447595596313477, 4.606566429138184, 4.765537261962891]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 13.0, 18.0, 37.0, 33.0, 61.0, 116.0, 118.0, 189.0, 314.0, 563.0, 882.0, 1405.0, 2255.0, 3640.0, 6071.0, 10707.0, 19694.0, 39324.0, 90347.0, 246382.0, 751592.0, 1497428.0, 984171.0, 327544.0, 112261.0, 46598.0, 22578.0, 11909.0, 6853.0, 4117.0, 2552.0, 1548.0, 999.0, 678.0, 429.0, 274.0, 174.0, 106.0, 105.0, 53.0, 31.0, 22.0, 21.0, 17.0, 11.0, 16.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.1171875, -9.7637939453125, -9.410400390625, -9.0570068359375, -8.70361328125, -8.3502197265625, -7.996826171875, -7.6434326171875, -7.2900390625, -6.9366455078125, -6.583251953125, -6.2298583984375, -5.87646484375, -5.5230712890625, -5.169677734375, -4.8162841796875, -4.462890625, -4.1094970703125, -3.756103515625, -3.4027099609375, -3.04931640625, -2.6959228515625, -2.342529296875, -1.9891357421875, -1.6357421875, -1.2823486328125, -0.928955078125, -0.5755615234375, -0.22216796875, 0.1312255859375, 0.484619140625, 0.8380126953125, 1.19140625, 1.5447998046875, 1.898193359375, 2.2515869140625, 2.60498046875, 2.9583740234375, 3.311767578125, 3.6651611328125, 4.0185546875, 4.3719482421875, 4.725341796875, 5.0787353515625, 5.43212890625, 5.7855224609375, 6.138916015625, 6.4923095703125, 6.845703125, 7.1990966796875, 7.552490234375, 7.9058837890625, 8.25927734375, 8.6126708984375, 8.966064453125, 9.3194580078125, 9.6728515625, 10.0262451171875, 10.379638671875, 10.7330322265625, 11.08642578125, 11.4398193359375, 11.793212890625, 12.1466064453125, 12.5]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 3.0, 5.0, 9.0, 3.0, 12.0, 11.0, 12.0, 13.0, 14.0, 15.0, 15.0, 26.0, 25.0, 35.0, 25.0, 38.0, 35.0, 40.0, 34.0, 46.0, 47.0, 39.0, 42.0, 31.0, 49.0, 48.0, 31.0, 42.0, 30.0, 38.0, 24.0, 34.0, 24.0, 21.0, 13.0, 14.0, 11.0, 12.0, 8.0, 5.0, 11.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.26092529296875, -4.1273193359375, -3.99371337890625, -3.860107421875, -3.72650146484375, -3.5928955078125, -3.45928955078125, -3.32568359375, -3.19207763671875, -3.0584716796875, -2.92486572265625, -2.791259765625, -2.65765380859375, -2.5240478515625, -2.39044189453125, -2.2568359375, -2.12322998046875, -1.9896240234375, -1.85601806640625, -1.722412109375, -1.58880615234375, -1.4552001953125, -1.32159423828125, -1.18798828125, -1.05438232421875, -0.9207763671875, -0.78717041015625, -0.653564453125, -0.51995849609375, -0.3863525390625, -0.25274658203125, -0.119140625, 0.01446533203125, 0.1480712890625, 0.28167724609375, 0.415283203125, 0.54888916015625, 0.6824951171875, 0.81610107421875, 0.94970703125, 1.08331298828125, 1.2169189453125, 1.35052490234375, 1.484130859375, 1.61773681640625, 1.7513427734375, 1.88494873046875, 2.0185546875, 2.15216064453125, 2.2857666015625, 2.41937255859375, 2.552978515625, 2.68658447265625, 2.8201904296875, 2.95379638671875, 3.08740234375, 3.22100830078125, 3.3546142578125, 3.48822021484375, 3.621826171875, 3.75543212890625, 3.8890380859375, 4.02264404296875, 4.15625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 12.0, 10.0, 26.0, 27.0, 53.0, 74.0, 121.0, 185.0, 262.0, 461.0, 690.0, 1039.0, 1716.0, 2824.0, 4546.0, 8021.0, 13887.0, 25936.0, 51784.0, 108748.0, 246948.0, 591001.0, 1194175.0, 1066500.0, 483913.0, 203333.0, 91398.0, 44162.0, 22620.0, 12365.0, 6885.0, 4017.0, 2503.0, 1430.0, 938.0, 562.0, 390.0, 235.0, 161.0, 104.0, 72.0, 46.0, 38.0, 19.0, 21.0, 15.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8671875, -10.5263671875, -10.185546875, -9.8447265625, -9.50390625, -9.1630859375, -8.822265625, -8.4814453125, -8.140625, -7.7998046875, -7.458984375, -7.1181640625, -6.77734375, -6.4365234375, -6.095703125, -5.7548828125, -5.4140625, -5.0732421875, -4.732421875, -4.3916015625, -4.05078125, -3.7099609375, -3.369140625, -3.0283203125, -2.6875, -2.3466796875, -2.005859375, -1.6650390625, -1.32421875, -0.9833984375, -0.642578125, -0.3017578125, 0.0390625, 0.3798828125, 0.720703125, 1.0615234375, 1.40234375, 1.7431640625, 2.083984375, 2.4248046875, 2.765625, 3.1064453125, 3.447265625, 3.7880859375, 4.12890625, 4.4697265625, 4.810546875, 5.1513671875, 5.4921875, 5.8330078125, 6.173828125, 6.5146484375, 6.85546875, 7.1962890625, 7.537109375, 7.8779296875, 8.21875, 8.5595703125, 8.900390625, 9.2412109375, 9.58203125, 9.9228515625, 10.263671875, 10.6044921875, 10.9453125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 11.0, 15.0, 14.0, 24.0, 38.0, 28.0, 55.0, 60.0, 90.0, 127.0, 148.0, 206.0, 253.0, 313.0, 374.0, 400.0, 368.0, 345.0, 241.0, 213.0, 161.0, 130.0, 113.0, 91.0, 53.0, 41.0, 34.0, 25.0, 22.0, 14.0, 12.0, 12.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.930755615234375, -2.82049560546875, -2.710235595703125, -2.5999755859375, -2.489715576171875, -2.37945556640625, -2.269195556640625, -2.158935546875, -2.048675537109375, -1.93841552734375, -1.828155517578125, -1.7178955078125, -1.607635498046875, -1.49737548828125, -1.387115478515625, -1.27685546875, -1.166595458984375, -1.05633544921875, -0.946075439453125, -0.8358154296875, -0.725555419921875, -0.61529541015625, -0.505035400390625, -0.394775390625, -0.284515380859375, -0.17425537109375, -0.063995361328125, 0.0462646484375, 0.156524658203125, 0.26678466796875, 0.377044677734375, 0.4873046875, 0.597564697265625, 0.70782470703125, 0.818084716796875, 0.9283447265625, 1.038604736328125, 1.14886474609375, 1.259124755859375, 1.369384765625, 1.479644775390625, 1.58990478515625, 1.700164794921875, 1.8104248046875, 1.920684814453125, 2.03094482421875, 2.141204833984375, 2.25146484375, 2.361724853515625, 2.47198486328125, 2.582244873046875, 2.6925048828125, 2.802764892578125, 2.91302490234375, 3.023284912109375, 3.133544921875, 3.243804931640625, 3.35406494140625, 3.464324951171875, 3.5745849609375, 3.684844970703125, 3.79510498046875, 3.905364990234375, 4.015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 9.0, 8.0, 14.0, 11.0, 17.0, 19.0, 22.0, 19.0, 33.0, 25.0, 46.0, 48.0, 49.0, 73.0, 76.0, 70.0, 75.0, 58.0, 51.0, 36.0, 41.0, 38.0, 36.0, 27.0, 12.0, 13.0, 8.0, 12.0, 7.0, 8.0, 7.0, 1.0, 4.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.345856666564941, -10.03372859954834, -9.721600532531738, -9.409473419189453, -9.097345352172852, -8.78521728515625, -8.473089218139648, -8.160961151123047, -7.8488335609436035, -7.536705493927002, -7.224577903747559, -6.912449836730957, -6.6003217697143555, -6.288194179534912, -5.9760661125183105, -5.663938522338867, -5.351810455322266, -5.039682388305664, -4.727554798126221, -4.415426731109619, -4.103299140930176, -3.791171073913574, -3.4790430068969727, -3.16691517829895, -2.8547873497009277, -2.5426595211029053, -2.230531692504883, -1.9184036254882812, -1.6062757968902588, -1.2941479682922363, -0.9820200204849243, -0.6698920726776123, -0.35776424407958984, -0.04563635587692261, 0.26649153232574463, 0.5786194205284119, 0.8907473087310791, 1.2028751373291016, 1.5150030851364136, 1.8271310329437256, 2.139258861541748, 2.4513866901397705, 2.763514518737793, 3.0756425857543945, 3.387770414352417, 3.6998982429504395, 4.012026309967041, 4.324153900146484, 4.636281967163086, 4.9484100341796875, 5.260537624359131, 5.572665691375732, 5.884793281555176, 6.196921348571777, 6.509049415588379, 6.8211774826049805, 7.133305072784424, 7.445433139801025, 7.757560729980469, 8.06968879699707, 8.381816864013672, 8.693944931030273, 9.006072044372559, 9.31820011138916, 9.630328178405762]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 16.0, 10.0, 13.0, 18.0, 10.0, 17.0, 15.0, 13.0, 20.0, 26.0, 22.0, 32.0, 25.0, 34.0, 34.0, 28.0, 42.0, 40.0, 34.0, 45.0, 34.0, 48.0, 28.0, 48.0, 40.0, 35.0, 32.0, 30.0, 19.0, 21.0, 19.0, 21.0, 19.0, 16.0, 14.0, 12.0, 15.0, 8.0, 9.0, 8.0, 7.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.479977607727051, -5.306244373321533, -5.132511615753174, -4.958778381347656, -4.785045146942139, -4.611311912536621, -4.437579154968262, -4.263845920562744, -4.090112686157227, -3.916379690170288, -3.7426464557647705, -3.568913459777832, -3.3951802253723145, -3.221447229385376, -3.0477142333984375, -2.87398099899292, -2.7002482414245605, -2.526515245437622, -2.3527820110321045, -2.179049015045166, -2.0053157806396484, -1.83158278465271, -1.6578497886657715, -1.4841166734695435, -1.3103835582733154, -1.1366504430770874, -0.9629173874855042, -0.7891843318939209, -0.6154512166976929, -0.44171810150146484, -0.26798510551452637, -0.09425199031829834, 0.07948160171508789, 0.25321468710899353, 0.42694777250289917, 0.6006808280944824, 0.7744139432907104, 0.9481470584869385, 1.121880054473877, 1.295613169670105, 1.469346284866333, 1.643079400062561, 1.816812515258789, 1.9905455112457275, 2.164278507232666, 2.3380117416381836, 2.511744737625122, 2.6854777336120605, 2.859210968017578, 3.0329439640045166, 3.206677198410034, 3.3804101943969727, 3.5541434288024902, 3.7278764247894287, 3.901609420776367, 4.075342655181885, 4.249075889587402, 4.42280912399292, 4.596541881561279, 4.770275115966797, 4.9440083503723145, 5.117741584777832, 5.291474342346191, 5.465207576751709, 5.638940334320068]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 16.0, 15.0, 31.0, 42.0, 67.0, 120.0, 147.0, 259.0, 445.0, 738.0, 1150.0, 2044.0, 3514.0, 6123.0, 10372.0, 17987.0, 31081.0, 52445.0, 86317.0, 134149.0, 177135.0, 176225.0, 134019.0, 86701.0, 52809.0, 31274.0, 17988.0, 10578.0, 6063.0, 3568.0, 2057.0, 1225.0, 690.0, 448.0, 270.0, 190.0, 99.0, 58.0, 33.0, 19.0, 17.0, 14.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.046875, -3.9278564453125, -3.808837890625, -3.6898193359375, -3.57080078125, -3.4517822265625, -3.332763671875, -3.2137451171875, -3.0947265625, -2.9757080078125, -2.856689453125, -2.7376708984375, -2.61865234375, -2.4996337890625, -2.380615234375, -2.2615966796875, -2.142578125, -2.0235595703125, -1.904541015625, -1.7855224609375, -1.66650390625, -1.5474853515625, -1.428466796875, -1.3094482421875, -1.1904296875, -1.0714111328125, -0.952392578125, -0.8333740234375, -0.71435546875, -0.5953369140625, -0.476318359375, -0.3572998046875, -0.23828125, -0.1192626953125, -0.000244140625, 0.1187744140625, 0.23779296875, 0.3568115234375, 0.475830078125, 0.5948486328125, 0.7138671875, 0.8328857421875, 0.951904296875, 1.0709228515625, 1.18994140625, 1.3089599609375, 1.427978515625, 1.5469970703125, 1.666015625, 1.7850341796875, 1.904052734375, 2.0230712890625, 2.14208984375, 2.2611083984375, 2.380126953125, 2.4991455078125, 2.6181640625, 2.7371826171875, 2.856201171875, 2.9752197265625, 3.09423828125, 3.2132568359375, 3.332275390625, 3.4512939453125, 3.5703125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 11.0, 16.0, 12.0, 15.0, 11.0, 23.0, 11.0, 35.0, 25.0, 18.0, 43.0, 32.0, 24.0, 34.0, 34.0, 37.0, 43.0, 33.0, 52.0, 46.0, 44.0, 28.0, 36.0, 23.0, 34.0, 32.0, 23.0, 18.0, 24.0, 20.0, 26.0, 17.0, 11.0, 13.0, 11.0, 10.0, 10.0, 12.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.09979248046875, -4.9183349609375, -4.73687744140625, -4.555419921875, -4.37396240234375, -4.1925048828125, -4.01104736328125, -3.82958984375, -3.64813232421875, -3.4666748046875, -3.28521728515625, -3.103759765625, -2.92230224609375, -2.7408447265625, -2.55938720703125, -2.3779296875, -2.19647216796875, -2.0150146484375, -1.83355712890625, -1.652099609375, -1.47064208984375, -1.2891845703125, -1.10772705078125, -0.92626953125, -0.74481201171875, -0.5633544921875, -0.38189697265625, -0.200439453125, -0.01898193359375, 0.1624755859375, 0.34393310546875, 0.525390625, 0.70684814453125, 0.8883056640625, 1.06976318359375, 1.251220703125, 1.43267822265625, 1.6141357421875, 1.79559326171875, 1.97705078125, 2.15850830078125, 2.3399658203125, 2.52142333984375, 2.702880859375, 2.88433837890625, 3.0657958984375, 3.24725341796875, 3.4287109375, 3.61016845703125, 3.7916259765625, 3.97308349609375, 4.154541015625, 4.33599853515625, 4.5174560546875, 4.69891357421875, 4.88037109375, 5.06182861328125, 5.2432861328125, 5.42474365234375, 5.606201171875, 5.78765869140625, 5.9691162109375, 6.15057373046875, 6.33203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 11.0, 15.0, 21.0, 36.0, 38.0, 70.0, 112.0, 178.0, 265.0, 427.0, 604.0, 949.0, 1600.0, 2631.0, 4382.0, 7313.0, 12974.0, 23337.0, 41742.0, 77648.0, 137468.0, 209967.0, 210230.0, 139154.0, 78778.0, 42981.0, 23291.0, 13285.0, 7447.0, 4474.0, 2687.0, 1628.0, 1030.0, 626.0, 389.0, 249.0, 163.0, 112.0, 77.0, 42.0, 37.0, 29.0, 15.0, 10.0, 10.0, 8.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.78704833984375, -4.6326904296875, -4.47833251953125, -4.323974609375, -4.16961669921875, -4.0152587890625, -3.86090087890625, -3.70654296875, -3.55218505859375, -3.3978271484375, -3.24346923828125, -3.089111328125, -2.93475341796875, -2.7803955078125, -2.62603759765625, -2.4716796875, -2.31732177734375, -2.1629638671875, -2.00860595703125, -1.854248046875, -1.69989013671875, -1.5455322265625, -1.39117431640625, -1.23681640625, -1.08245849609375, -0.9281005859375, -0.77374267578125, -0.619384765625, -0.46502685546875, -0.3106689453125, -0.15631103515625, -0.001953125, 0.15240478515625, 0.3067626953125, 0.46112060546875, 0.615478515625, 0.76983642578125, 0.9241943359375, 1.07855224609375, 1.23291015625, 1.38726806640625, 1.5416259765625, 1.69598388671875, 1.850341796875, 2.00469970703125, 2.1590576171875, 2.31341552734375, 2.4677734375, 2.62213134765625, 2.7764892578125, 2.93084716796875, 3.085205078125, 3.23956298828125, 3.3939208984375, 3.54827880859375, 3.70263671875, 3.85699462890625, 4.0113525390625, 4.16571044921875, 4.320068359375, 4.47442626953125, 4.6287841796875, 4.78314208984375, 4.9375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 8.0, 12.0, 9.0, 10.0, 12.0, 22.0, 20.0, 22.0, 25.0, 31.0, 33.0, 36.0, 41.0, 45.0, 32.0, 42.0, 39.0, 40.0, 43.0, 47.0, 36.0, 46.0, 45.0, 46.0, 30.0, 36.0, 25.0, 18.0, 21.0, 25.0, 18.0, 9.0, 12.0, 8.0, 12.0, 4.0, 14.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.745025634765625, -3.62286376953125, -3.500701904296875, -3.3785400390625, -3.256378173828125, -3.13421630859375, -3.012054443359375, -2.889892578125, -2.767730712890625, -2.64556884765625, -2.523406982421875, -2.4012451171875, -2.279083251953125, -2.15692138671875, -2.034759521484375, -1.91259765625, -1.790435791015625, -1.66827392578125, -1.546112060546875, -1.4239501953125, -1.301788330078125, -1.17962646484375, -1.057464599609375, -0.935302734375, -0.813140869140625, -0.69097900390625, -0.568817138671875, -0.4466552734375, -0.324493408203125, -0.20233154296875, -0.080169677734375, 0.0419921875, 0.164154052734375, 0.28631591796875, 0.408477783203125, 0.5306396484375, 0.652801513671875, 0.77496337890625, 0.897125244140625, 1.019287109375, 1.141448974609375, 1.26361083984375, 1.385772705078125, 1.5079345703125, 1.630096435546875, 1.75225830078125, 1.874420166015625, 1.99658203125, 2.118743896484375, 2.24090576171875, 2.363067626953125, 2.4852294921875, 2.607391357421875, 2.72955322265625, 2.851715087890625, 2.973876953125, 3.096038818359375, 3.21820068359375, 3.340362548828125, 3.4625244140625, 3.584686279296875, 3.70684814453125, 3.829010009765625, 3.951171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 10.0, 20.0, 38.0, 49.0, 81.0, 89.0, 170.0, 227.0, 365.0, 559.0, 820.0, 1254.0, 1958.0, 3056.0, 4839.0, 7966.0, 13242.0, 22948.0, 40494.0, 73302.0, 129858.0, 204706.0, 213723.0, 141353.0, 80276.0, 44559.0, 25002.0, 14552.0, 8499.0, 5196.0, 3254.0, 2019.0, 1349.0, 869.0, 625.0, 380.0, 266.0, 184.0, 128.0, 87.0, 54.0, 39.0, 30.0, 15.0, 10.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.453125, -2.37896728515625, -2.3048095703125, -2.23065185546875, -2.156494140625, -2.08233642578125, -2.0081787109375, -1.93402099609375, -1.85986328125, -1.78570556640625, -1.7115478515625, -1.63739013671875, -1.563232421875, -1.48907470703125, -1.4149169921875, -1.34075927734375, -1.2666015625, -1.19244384765625, -1.1182861328125, -1.04412841796875, -0.969970703125, -0.89581298828125, -0.8216552734375, -0.74749755859375, -0.67333984375, -0.59918212890625, -0.5250244140625, -0.45086669921875, -0.376708984375, -0.30255126953125, -0.2283935546875, -0.15423583984375, -0.080078125, -0.00592041015625, 0.0682373046875, 0.14239501953125, 0.216552734375, 0.29071044921875, 0.3648681640625, 0.43902587890625, 0.51318359375, 0.58734130859375, 0.6614990234375, 0.73565673828125, 0.809814453125, 0.88397216796875, 0.9581298828125, 1.03228759765625, 1.1064453125, 1.18060302734375, 1.2547607421875, 1.32891845703125, 1.403076171875, 1.47723388671875, 1.5513916015625, 1.62554931640625, 1.69970703125, 1.77386474609375, 1.8480224609375, 1.92218017578125, 1.996337890625, 2.07049560546875, 2.1446533203125, 2.21881103515625, 2.29296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 13.0, 6.0, 17.0, 15.0, 24.0, 24.0, 21.0, 36.0, 50.0, 61.0, 85.0, 67.0, 73.0, 73.0, 79.0, 59.0, 57.0, 60.0, 33.0, 30.0, 25.0, 19.0, 11.0, 8.0, 10.0, 5.0, 5.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0001475811004638672, -0.0001432131975889206, -0.000138845294713974, -0.0001344773918390274, -0.0001301094889640808, -0.00012574158608913422, -0.00012137368321418762, -0.00011700578033924103, -0.00011263787746429443, -0.00010826997458934784, -0.00010390207171440125, -9.953416883945465e-05, -9.516626596450806e-05, -9.079836308956146e-05, -8.643046021461487e-05, -8.206255733966827e-05, -7.769465446472168e-05, -7.332675158977509e-05, -6.895884871482849e-05, -6.45909458398819e-05, -6.02230429649353e-05, -5.585514008998871e-05, -5.1487237215042114e-05, -4.711933434009552e-05, -4.2751431465148926e-05, -3.838352859020233e-05, -3.401562571525574e-05, -2.9647722840309143e-05, -2.527981996536255e-05, -2.0911917090415955e-05, -1.654401421546936e-05, -1.2176111340522766e-05, -7.808208465576172e-06, -3.4403055906295776e-06, 9.275972843170166e-07, 5.295500159263611e-06, 9.663403034210205e-06, 1.40313059091568e-05, 1.8399208784103394e-05, 2.2767111659049988e-05, 2.7135014533996582e-05, 3.1502917408943176e-05, 3.587082028388977e-05, 4.0238723158836365e-05, 4.460662603378296e-05, 4.897452890872955e-05, 5.334243178367615e-05, 5.771033465862274e-05, 6.207823753356934e-05, 6.644614040851593e-05, 7.081404328346252e-05, 7.518194615840912e-05, 7.954984903335571e-05, 8.391775190830231e-05, 8.82856547832489e-05, 9.26535576581955e-05, 9.702146053314209e-05, 0.00010138936340808868, 0.00010575726628303528, 0.00011012516915798187, 0.00011449307203292847, 0.00011886097490787506, 0.00012322887778282166, 0.00012759678065776825, 0.00013196468353271484]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 13.0, 23.0, 21.0, 32.0, 56.0, 69.0, 105.0, 157.0, 204.0, 345.0, 483.0, 763.0, 1212.0, 1733.0, 2771.0, 4331.0, 6666.0, 10490.0, 16912.0, 27407.0, 44394.0, 70788.0, 107968.0, 148045.0, 167108.0, 146026.0, 106197.0, 68996.0, 43177.0, 26685.0, 16377.0, 10436.0, 6620.0, 4003.0, 2713.0, 1826.0, 1124.0, 750.0, 490.0, 333.0, 217.0, 157.0, 118.0, 77.0, 47.0, 20.0, 22.0, 20.0, 10.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.982421875, -1.91943359375, -1.8564453125, -1.79345703125, -1.73046875, -1.66748046875, -1.6044921875, -1.54150390625, -1.478515625, -1.41552734375, -1.3525390625, -1.28955078125, -1.2265625, -1.16357421875, -1.1005859375, -1.03759765625, -0.974609375, -0.91162109375, -0.8486328125, -0.78564453125, -0.72265625, -0.65966796875, -0.5966796875, -0.53369140625, -0.470703125, -0.40771484375, -0.3447265625, -0.28173828125, -0.21875, -0.15576171875, -0.0927734375, -0.02978515625, 0.033203125, 0.09619140625, 0.1591796875, 0.22216796875, 0.28515625, 0.34814453125, 0.4111328125, 0.47412109375, 0.537109375, 0.60009765625, 0.6630859375, 0.72607421875, 0.7890625, 0.85205078125, 0.9150390625, 0.97802734375, 1.041015625, 1.10400390625, 1.1669921875, 1.22998046875, 1.29296875, 1.35595703125, 1.4189453125, 1.48193359375, 1.544921875, 1.60791015625, 1.6708984375, 1.73388671875, 1.796875, 1.85986328125, 1.9228515625, 1.98583984375, 2.048828125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 7.0, 8.0, 7.0, 6.0, 16.0, 16.0, 14.0, 18.0, 18.0, 34.0, 29.0, 28.0, 37.0, 52.0, 46.0, 49.0, 47.0, 55.0, 48.0, 41.0, 53.0, 41.0, 49.0, 30.0, 41.0, 29.0, 29.0, 21.0, 23.0, 14.0, 15.0, 15.0, 17.0, 5.0, 13.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6630859375, -0.6432113647460938, -0.6233367919921875, -0.6034622192382812, -0.583587646484375, -0.5637130737304688, -0.5438385009765625, -0.5239639282226562, -0.50408935546875, -0.48421478271484375, -0.4643402099609375, -0.44446563720703125, -0.424591064453125, -0.40471649169921875, -0.3848419189453125, -0.36496734619140625, -0.3450927734375, -0.32521820068359375, -0.3053436279296875, -0.28546905517578125, -0.265594482421875, -0.24571990966796875, -0.2258453369140625, -0.20597076416015625, -0.18609619140625, -0.16622161865234375, -0.1463470458984375, -0.12647247314453125, -0.106597900390625, -0.08672332763671875, -0.0668487548828125, -0.04697418212890625, -0.027099609375, -0.00722503662109375, 0.0126495361328125, 0.03252410888671875, 0.052398681640625, 0.07227325439453125, 0.0921478271484375, 0.11202239990234375, 0.13189697265625, 0.15177154541015625, 0.1716461181640625, 0.19152069091796875, 0.211395263671875, 0.23126983642578125, 0.2511444091796875, 0.27101898193359375, 0.2908935546875, 0.31076812744140625, 0.3306427001953125, 0.35051727294921875, 0.370391845703125, 0.39026641845703125, 0.4101409912109375, 0.43001556396484375, 0.44989013671875, 0.46976470947265625, 0.4896392822265625, 0.5095138549804688, 0.529388427734375, 0.5492630004882812, 0.5691375732421875, 0.5890121459960938, 0.60888671875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 4.0, 5.0, 6.0, 8.0, 8.0, 15.0, 13.0, 16.0, 23.0, 28.0, 28.0, 31.0, 43.0, 61.0, 48.0, 78.0, 77.0, 78.0, 71.0, 57.0, 47.0, 48.0, 38.0, 42.0, 30.0, 13.0, 9.0, 14.0, 10.0, 13.0, 8.0, 5.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.154535293579102, -10.825577735900879, -10.496620178222656, -10.16766357421875, -9.838706016540527, -9.509748458862305, -9.180790901184082, -8.85183334350586, -8.522875785827637, -8.193918228149414, -7.86496114730835, -7.536003589630127, -7.207046031951904, -6.87808895111084, -6.549131393432617, -6.2201738357543945, -5.89121675491333, -5.562259197235107, -5.233302116394043, -4.90434455871582, -4.575387001037598, -4.246429443359375, -3.9174723625183105, -3.588514804840088, -3.2595574855804443, -2.930600166320801, -2.601642608642578, -2.2726852893829346, -1.9437278509140015, -1.6147704124450684, -1.2858130931854248, -0.9568555355072021, -0.6278982162475586, -0.2989408075809479, 0.030016601085662842, 0.35897397994995117, 0.6879314184188843, 1.0168888568878174, 1.345846176147461, 1.6748037338256836, 2.003761053085327, 2.3327183723449707, 2.6616759300231934, 2.990633249282837, 3.3195905685424805, 3.648548126220703, 3.9775054454803467, 4.306463241577148, 4.635420322418213, 4.9643778800964355, 5.2933349609375, 5.622292518615723, 5.951250076293945, 6.280207633972168, 6.609164714813232, 6.938122272491455, 7.2670793533325195, 7.596036911010742, 7.924993991851807, 8.253952026367188, 8.582908630371094, 8.911866188049316, 9.240823745727539, 9.569781303405762, 9.898738861083984]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 5.0, 12.0, 13.0, 13.0, 15.0, 14.0, 12.0, 16.0, 14.0, 22.0, 22.0, 22.0, 23.0, 27.0, 36.0, 32.0, 32.0, 27.0, 48.0, 37.0, 31.0, 60.0, 38.0, 30.0, 39.0, 45.0, 41.0, 40.0, 23.0, 22.0, 24.0, 19.0, 21.0, 19.0, 22.0, 13.0, 13.0, 16.0, 10.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.661330223083496, -5.485322952270508, -5.3093156814575195, -5.133308410644531, -4.957301139831543, -4.781293869018555, -4.605286598205566, -4.429279327392578, -4.25327205657959, -4.077264785766602, -3.9012575149536133, -3.725250244140625, -3.5492429733276367, -3.3732357025146484, -3.19722843170166, -3.021221160888672, -2.8452138900756836, -2.6692066192626953, -2.493199348449707, -2.3171920776367188, -2.1411848068237305, -1.9651775360107422, -1.789170265197754, -1.6131629943847656, -1.4371557235717773, -1.261148452758789, -1.0851411819458008, -0.9091339111328125, -0.7331266403198242, -0.5571193695068359, -0.38111209869384766, -0.20510482788085938, -0.02909708023071289, 0.1469101905822754, 0.32291746139526367, 0.49892473220825195, 0.6749320030212402, 0.8509392738342285, 1.0269465446472168, 1.202953815460205, 1.3789610862731934, 1.5549683570861816, 1.73097562789917, 1.9069828987121582, 2.0829901695251465, 2.2589974403381348, 2.435004711151123, 2.6110119819641113, 2.7870192527770996, 2.963026523590088, 3.139033794403076, 3.3150410652160645, 3.4910483360290527, 3.667055606842041, 3.8430628776550293, 4.019070148468018, 4.195077419281006, 4.371084690093994, 4.547091960906982, 4.723099231719971, 4.899106502532959, 5.075113773345947, 5.2511210441589355, 5.427128314971924, 5.603135585784912]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 13.0, 20.0, 33.0, 42.0, 63.0, 110.0, 150.0, 257.0, 386.0, 612.0, 984.0, 1487.0, 2194.0, 3343.0, 5342.0, 8465.0, 13044.0, 20142.0, 30653.0, 46831.0, 69623.0, 97470.0, 126392.0, 142349.0, 134910.0, 108950.0, 78992.0, 54270.0, 35474.0, 23397.0, 15097.0, 9811.0, 6286.0, 4050.0, 2644.0, 1674.0, 1100.0, 667.0, 458.0, 266.0, 193.0, 118.0, 68.0, 53.0, 24.0, 12.0, 5.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.2578125, -4.1190185546875, -3.980224609375, -3.8414306640625, -3.70263671875, -3.5638427734375, -3.425048828125, -3.2862548828125, -3.1474609375, -3.0086669921875, -2.869873046875, -2.7310791015625, -2.59228515625, -2.4534912109375, -2.314697265625, -2.1759033203125, -2.037109375, -1.8983154296875, -1.759521484375, -1.6207275390625, -1.48193359375, -1.3431396484375, -1.204345703125, -1.0655517578125, -0.9267578125, -0.7879638671875, -0.649169921875, -0.5103759765625, -0.37158203125, -0.2327880859375, -0.093994140625, 0.0447998046875, 0.18359375, 0.3223876953125, 0.461181640625, 0.5999755859375, 0.73876953125, 0.8775634765625, 1.016357421875, 1.1551513671875, 1.2939453125, 1.4327392578125, 1.571533203125, 1.7103271484375, 1.84912109375, 1.9879150390625, 2.126708984375, 2.2655029296875, 2.404296875, 2.5430908203125, 2.681884765625, 2.8206787109375, 2.95947265625, 3.0982666015625, 3.237060546875, 3.3758544921875, 3.5146484375, 3.6534423828125, 3.792236328125, 3.9310302734375, 4.06982421875, 4.2086181640625, 4.347412109375, 4.4862060546875, 4.625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 9.0, 7.0, 8.0, 7.0, 10.0, 15.0, 8.0, 15.0, 23.0, 14.0, 19.0, 21.0, 19.0, 20.0, 37.0, 33.0, 31.0, 27.0, 33.0, 32.0, 40.0, 48.0, 34.0, 38.0, 33.0, 53.0, 31.0, 32.0, 36.0, 38.0, 23.0, 20.0, 15.0, 24.0, 23.0, 13.0, 15.0, 11.0, 14.0, 15.0, 7.0, 9.0, 6.0, 8.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.046875, -4.87652587890625, -4.7061767578125, -4.53582763671875, -4.365478515625, -4.19512939453125, -4.0247802734375, -3.85443115234375, -3.68408203125, -3.51373291015625, -3.3433837890625, -3.17303466796875, -3.002685546875, -2.83233642578125, -2.6619873046875, -2.49163818359375, -2.3212890625, -2.15093994140625, -1.9805908203125, -1.81024169921875, -1.639892578125, -1.46954345703125, -1.2991943359375, -1.12884521484375, -0.95849609375, -0.78814697265625, -0.6177978515625, -0.44744873046875, -0.277099609375, -0.10675048828125, 0.0635986328125, 0.23394775390625, 0.404296875, 0.57464599609375, 0.7449951171875, 0.91534423828125, 1.085693359375, 1.25604248046875, 1.4263916015625, 1.59674072265625, 1.76708984375, 1.93743896484375, 2.1077880859375, 2.27813720703125, 2.448486328125, 2.61883544921875, 2.7891845703125, 2.95953369140625, 3.1298828125, 3.30023193359375, 3.4705810546875, 3.64093017578125, 3.811279296875, 3.98162841796875, 4.1519775390625, 4.32232666015625, 4.49267578125, 4.66302490234375, 4.8333740234375, 5.00372314453125, 5.174072265625, 5.34442138671875, 5.5147705078125, 5.68511962890625, 5.85546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 12.0, 23.0, 38.0, 67.0, 89.0, 115.0, 231.0, 371.0, 531.0, 864.0, 1388.0, 2183.0, 3487.0, 5403.0, 8731.0, 13523.0, 21290.0, 32855.0, 49945.0, 74786.0, 103393.0, 131296.0, 143577.0, 132396.0, 104670.0, 73978.0, 50963.0, 33706.0, 21409.0, 13684.0, 8710.0, 5373.0, 3447.0, 2189.0, 1336.0, 893.0, 622.0, 346.0, 232.0, 151.0, 87.0, 65.0, 37.0, 19.0, 18.0, 11.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.45245361328125, -4.3111572265625, -4.16986083984375, -4.028564453125, -3.88726806640625, -3.7459716796875, -3.60467529296875, -3.46337890625, -3.32208251953125, -3.1807861328125, -3.03948974609375, -2.898193359375, -2.75689697265625, -2.6156005859375, -2.47430419921875, -2.3330078125, -2.19171142578125, -2.0504150390625, -1.90911865234375, -1.767822265625, -1.62652587890625, -1.4852294921875, -1.34393310546875, -1.20263671875, -1.06134033203125, -0.9200439453125, -0.77874755859375, -0.637451171875, -0.49615478515625, -0.3548583984375, -0.21356201171875, -0.072265625, 0.06903076171875, 0.2103271484375, 0.35162353515625, 0.492919921875, 0.63421630859375, 0.7755126953125, 0.91680908203125, 1.05810546875, 1.19940185546875, 1.3406982421875, 1.48199462890625, 1.623291015625, 1.76458740234375, 1.9058837890625, 2.04718017578125, 2.1884765625, 2.32977294921875, 2.4710693359375, 2.61236572265625, 2.753662109375, 2.89495849609375, 3.0362548828125, 3.17755126953125, 3.31884765625, 3.46014404296875, 3.6014404296875, 3.74273681640625, 3.884033203125, 4.02532958984375, 4.1666259765625, 4.30792236328125, 4.44921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 7.0, 6.0, 8.0, 9.0, 12.0, 12.0, 19.0, 13.0, 15.0, 21.0, 16.0, 29.0, 23.0, 20.0, 42.0, 31.0, 35.0, 33.0, 31.0, 43.0, 53.0, 31.0, 33.0, 38.0, 43.0, 27.0, 33.0, 31.0, 24.0, 27.0, 33.0, 23.0, 17.0, 20.0, 24.0, 19.0, 18.0, 12.0, 10.0, 8.0, 10.0, 9.0, 8.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.2421875, -3.137054443359375, -3.03192138671875, -2.926788330078125, -2.8216552734375, -2.716522216796875, -2.61138916015625, -2.506256103515625, -2.401123046875, -2.295989990234375, -2.19085693359375, -2.085723876953125, -1.9805908203125, -1.875457763671875, -1.77032470703125, -1.665191650390625, -1.56005859375, -1.454925537109375, -1.34979248046875, -1.244659423828125, -1.1395263671875, -1.034393310546875, -0.92926025390625, -0.824127197265625, -0.718994140625, -0.613861083984375, -0.50872802734375, -0.403594970703125, -0.2984619140625, -0.193328857421875, -0.08819580078125, 0.016937255859375, 0.1220703125, 0.227203369140625, 0.33233642578125, 0.437469482421875, 0.5426025390625, 0.647735595703125, 0.75286865234375, 0.858001708984375, 0.963134765625, 1.068267822265625, 1.17340087890625, 1.278533935546875, 1.3836669921875, 1.488800048828125, 1.59393310546875, 1.699066162109375, 1.80419921875, 1.909332275390625, 2.01446533203125, 2.119598388671875, 2.2247314453125, 2.329864501953125, 2.43499755859375, 2.540130615234375, 2.645263671875, 2.750396728515625, 2.85552978515625, 2.960662841796875, 3.0657958984375, 3.170928955078125, 3.27606201171875, 3.381195068359375, 3.486328125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 16.0, 27.0, 47.0, 35.0, 64.0, 83.0, 112.0, 182.0, 246.0, 391.0, 539.0, 835.0, 1368.0, 2175.0, 3511.0, 6294.0, 11263.0, 20364.0, 38186.0, 72501.0, 131440.0, 200931.0, 214501.0, 153695.0, 87559.0, 45847.0, 24414.0, 13142.0, 7338.0, 4280.0, 2547.0, 1617.0, 972.0, 625.0, 449.0, 275.0, 186.0, 132.0, 91.0, 54.0, 58.0, 41.0, 26.0, 24.0, 19.0, 10.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.968475341796875, -2.86663818359375, -2.764801025390625, -2.6629638671875, -2.561126708984375, -2.45928955078125, -2.357452392578125, -2.255615234375, -2.153778076171875, -2.05194091796875, -1.950103759765625, -1.8482666015625, -1.746429443359375, -1.64459228515625, -1.542755126953125, -1.44091796875, -1.339080810546875, -1.23724365234375, -1.135406494140625, -1.0335693359375, -0.931732177734375, -0.82989501953125, -0.728057861328125, -0.626220703125, -0.524383544921875, -0.42254638671875, -0.320709228515625, -0.2188720703125, -0.117034912109375, -0.01519775390625, 0.086639404296875, 0.1884765625, 0.290313720703125, 0.39215087890625, 0.493988037109375, 0.5958251953125, 0.697662353515625, 0.79949951171875, 0.901336669921875, 1.003173828125, 1.105010986328125, 1.20684814453125, 1.308685302734375, 1.4105224609375, 1.512359619140625, 1.61419677734375, 1.716033935546875, 1.81787109375, 1.919708251953125, 2.02154541015625, 2.123382568359375, 2.2252197265625, 2.327056884765625, 2.42889404296875, 2.530731201171875, 2.632568359375, 2.734405517578125, 2.83624267578125, 2.938079833984375, 3.0399169921875, 3.141754150390625, 3.24359130859375, 3.345428466796875, 3.447265625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 8.0, 4.0, 6.0, 13.0, 17.0, 23.0, 38.0, 60.0, 68.0, 70.0, 112.0, 103.0, 87.0, 89.0, 66.0, 49.0, 48.0, 33.0, 23.0, 22.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003898143768310547, -0.00037750229239463806, -0.00036519020795822144, -0.0003528781235218048, -0.0003405660390853882, -0.00032825395464897156, -0.00031594187021255493, -0.0003036297857761383, -0.0002913177013397217, -0.00027900561690330505, -0.00026669353246688843, -0.0002543814480304718, -0.00024206936359405518, -0.00022975727915763855, -0.00021744519472122192, -0.0002051331102848053, -0.00019282102584838867, -0.00018050894141197205, -0.00016819685697555542, -0.0001558847725391388, -0.00014357268810272217, -0.00013126060366630554, -0.00011894851922988892, -0.00010663643479347229, -9.432435035705566e-05, -8.201226592063904e-05, -6.970018148422241e-05, -5.7388097047805786e-05, -4.507601261138916e-05, -3.2763928174972534e-05, -2.0451843738555908e-05, -8.139759302139282e-06, 4.172325134277344e-06, 1.648440957069397e-05, 2.8796494007110596e-05, 4.110857844352722e-05, 5.342066287994385e-05, 6.573274731636047e-05, 7.80448317527771e-05, 9.035691618919373e-05, 0.00010266900062561035, 0.00011498108506202698, 0.0001272931694984436, 0.00013960525393486023, 0.00015191733837127686, 0.00016422942280769348, 0.0001765415072441101, 0.00018885359168052673, 0.00020116567611694336, 0.00021347776055335999, 0.0002257898449897766, 0.00023810192942619324, 0.00025041401386260986, 0.0002627260982990265, 0.0002750381827354431, 0.00028735026717185974, 0.00029966235160827637, 0.000311974436044693, 0.0003242865204811096, 0.00033659860491752625, 0.00034891068935394287, 0.0003612227737903595, 0.0003735348582267761, 0.00038584694266319275, 0.0003981590270996094]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 10.0, 14.0, 16.0, 20.0, 32.0, 50.0, 85.0, 107.0, 151.0, 264.0, 381.0, 683.0, 1155.0, 2018.0, 3522.0, 6627.0, 12635.0, 25277.0, 52854.0, 108263.0, 195558.0, 247764.0, 188146.0, 102492.0, 49739.0, 23909.0, 12146.0, 6366.0, 3471.0, 1915.0, 1078.0, 640.0, 447.0, 247.0, 159.0, 100.0, 66.0, 40.0, 36.0, 24.0, 9.0, 11.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.65234375, -3.5362548828125, -3.420166015625, -3.3040771484375, -3.18798828125, -3.0718994140625, -2.955810546875, -2.8397216796875, -2.7236328125, -2.6075439453125, -2.491455078125, -2.3753662109375, -2.25927734375, -2.1431884765625, -2.027099609375, -1.9110107421875, -1.794921875, -1.6788330078125, -1.562744140625, -1.4466552734375, -1.33056640625, -1.2144775390625, -1.098388671875, -0.9822998046875, -0.8662109375, -0.7501220703125, -0.634033203125, -0.5179443359375, -0.40185546875, -0.2857666015625, -0.169677734375, -0.0535888671875, 0.0625, 0.1785888671875, 0.294677734375, 0.4107666015625, 0.52685546875, 0.6429443359375, 0.759033203125, 0.8751220703125, 0.9912109375, 1.1072998046875, 1.223388671875, 1.3394775390625, 1.45556640625, 1.5716552734375, 1.687744140625, 1.8038330078125, 1.919921875, 2.0360107421875, 2.152099609375, 2.2681884765625, 2.38427734375, 2.5003662109375, 2.616455078125, 2.7325439453125, 2.8486328125, 2.9647216796875, 3.080810546875, 3.1968994140625, 3.31298828125, 3.4290771484375, 3.545166015625, 3.6612548828125, 3.77734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 6.0, 13.0, 19.0, 16.0, 19.0, 25.0, 24.0, 30.0, 33.0, 46.0, 40.0, 41.0, 72.0, 61.0, 46.0, 63.0, 50.0, 57.0, 46.0, 47.0, 44.0, 28.0, 31.0, 22.0, 22.0, 14.0, 14.0, 8.0, 13.0, 11.0, 7.0, 11.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.0771484375, -1.0475082397460938, -1.0178680419921875, -0.9882278442382812, -0.958587646484375, -0.9289474487304688, -0.8993072509765625, -0.8696670532226562, -0.84002685546875, -0.8103866577148438, -0.7807464599609375, -0.7511062622070312, -0.721466064453125, -0.6918258666992188, -0.6621856689453125, -0.6325454711914062, -0.6029052734375, -0.5732650756835938, -0.5436248779296875, -0.5139846801757812, -0.484344482421875, -0.45470428466796875, -0.4250640869140625, -0.39542388916015625, -0.36578369140625, -0.33614349365234375, -0.3065032958984375, -0.27686309814453125, -0.247222900390625, -0.21758270263671875, -0.1879425048828125, -0.15830230712890625, -0.128662109375, -0.09902191162109375, -0.0693817138671875, -0.03974151611328125, -0.010101318359375, 0.01953887939453125, 0.0491790771484375, 0.07881927490234375, 0.10845947265625, 0.13809967041015625, 0.1677398681640625, 0.19738006591796875, 0.227020263671875, 0.25666046142578125, 0.2863006591796875, 0.31594085693359375, 0.3455810546875, 0.37522125244140625, 0.4048614501953125, 0.43450164794921875, 0.464141845703125, 0.49378204345703125, 0.5234222412109375, 0.5530624389648438, 0.58270263671875, 0.6123428344726562, 0.6419830322265625, 0.6716232299804688, 0.701263427734375, 0.7309036254882812, 0.7605438232421875, 0.7901840209960938, 0.81982421875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 14.0, 9.0, 24.0, 18.0, 32.0, 27.0, 35.0, 58.0, 49.0, 62.0, 72.0, 82.0, 66.0, 61.0, 64.0, 61.0, 24.0, 44.0, 44.0, 25.0, 23.0, 5.0, 13.0, 7.0, 8.0, 9.0, 5.0, 9.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.37326717376709, -11.045008659362793, -10.716750144958496, -10.388492584228516, -10.060234069824219, -9.731975555419922, -9.403717041015625, -9.075458526611328, -8.747200012207031, -8.418941497802734, -8.090682983398438, -7.762424945831299, -7.43416690826416, -7.105908393859863, -6.777649879455566, -6.4493913650512695, -6.121133804321289, -5.792875289916992, -5.4646172523498535, -5.136358737945557, -4.808100700378418, -4.479842185974121, -4.151583671569824, -3.8233253955841064, -3.4950671195983887, -3.166808843612671, -2.838550567626953, -2.5102920532226562, -2.1820337772369385, -1.8537755012512207, -1.5255171060562134, -1.197258710861206, -0.8690013885498047, -0.5407430529594421, -0.2124847173690796, 0.11577361822128296, 0.4440319538116455, 0.7722902297973633, 1.1005486249923706, 1.428807020187378, 1.7570652961730957, 2.0853235721588135, 2.4135818481445312, 2.741840362548828, 3.070098638534546, 3.3983569145202637, 3.7266154289245605, 4.054873466491699, 4.383131980895996, 4.711390495300293, 5.039648532867432, 5.3679070472717285, 5.696165084838867, 6.024423599243164, 6.352682113647461, 6.680940628051758, 7.0091986656188965, 7.337457180023193, 7.665715217590332, 7.993973731994629, 8.322232246398926, 8.650489807128906, 8.978748321533203, 9.3070068359375, 9.635265350341797]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 10.0, 4.0, 8.0, 8.0, 10.0, 12.0, 9.0, 12.0, 12.0, 19.0, 20.0, 18.0, 15.0, 24.0, 30.0, 25.0, 37.0, 24.0, 35.0, 37.0, 40.0, 40.0, 40.0, 35.0, 35.0, 35.0, 42.0, 40.0, 41.0, 45.0, 21.0, 30.0, 24.0, 21.0, 26.0, 19.0, 11.0, 15.0, 12.0, 16.0, 7.0, 3.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.67939567565918, -5.50309419631958, -5.326793193817139, -5.150491714477539, -4.9741902351379395, -4.79788875579834, -4.621587753295898, -4.445286273956299, -4.268984794616699, -4.0926833152771, -3.916382074356079, -3.7400808334350586, -3.563779354095459, -3.3874781131744385, -3.211176872253418, -3.0348753929138184, -2.858574390411377, -2.6822731494903564, -2.505971670150757, -2.3296704292297363, -2.1533689498901367, -1.9770677089691162, -1.8007664680480957, -1.6244651079177856, -1.4481637477874756, -1.2718623876571655, -1.0955610275268555, -0.919259786605835, -0.7429584264755249, -0.5666570663452148, -0.39035582542419434, -0.21405446529388428, -0.03775310516357422, 0.13854822516441345, 0.3148495554924011, 0.4911508560180664, 0.6674522161483765, 0.8437535762786865, 1.020054817199707, 1.196356177330017, 1.3726575374603271, 1.5489588975906372, 1.7252602577209473, 1.9015614986419678, 2.0778627395629883, 2.254164218902588, 2.4304654598236084, 2.606766700744629, 2.7830681800842285, 2.959369421005249, 3.1356709003448486, 3.311972141265869, 3.4882736206054688, 3.6645748615264893, 3.8408761024475098, 4.017177581787109, 4.193478584289551, 4.36978006362915, 4.546081066131592, 4.722382545471191, 4.898684024810791, 5.074985504150391, 5.251286506652832, 5.427587985992432, 5.603889465332031]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 9.0, 11.0, 29.0, 42.0, 43.0, 76.0, 91.0, 150.0, 247.0, 369.0, 557.0, 819.0, 1304.0, 2036.0, 3098.0, 5045.0, 8459.0, 14896.0, 27026.0, 53871.0, 116996.0, 293198.0, 744650.0, 1292684.0, 949199.0, 387407.0, 149580.0, 65542.0, 32251.0, 17502.0, 10216.0, 6113.0, 3877.0, 2329.0, 1547.0, 1042.0, 695.0, 452.0, 277.0, 173.0, 131.0, 74.0, 55.0, 41.0, 23.0, 12.0, 12.0, 9.0, 2.0, 2.0, 4.0], "bins": [-12.625, -12.280517578125, -11.93603515625, -11.591552734375, -11.2470703125, -10.902587890625, -10.55810546875, -10.213623046875, -9.869140625, -9.524658203125, -9.18017578125, -8.835693359375, -8.4912109375, -8.146728515625, -7.80224609375, -7.457763671875, -7.11328125, -6.768798828125, -6.42431640625, -6.079833984375, -5.7353515625, -5.390869140625, -5.04638671875, -4.701904296875, -4.357421875, -4.012939453125, -3.66845703125, -3.323974609375, -2.9794921875, -2.635009765625, -2.29052734375, -1.946044921875, -1.6015625, -1.257080078125, -0.91259765625, -0.568115234375, -0.2236328125, 0.120849609375, 0.46533203125, 0.809814453125, 1.154296875, 1.498779296875, 1.84326171875, 2.187744140625, 2.5322265625, 2.876708984375, 3.22119140625, 3.565673828125, 3.91015625, 4.254638671875, 4.59912109375, 4.943603515625, 5.2880859375, 5.632568359375, 5.97705078125, 6.321533203125, 6.666015625, 7.010498046875, 7.35498046875, 7.699462890625, 8.0439453125, 8.388427734375, 8.73291015625, 9.077392578125, 9.421875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 17.0, 11.0, 14.0, 12.0, 27.0, 20.0, 20.0, 29.0, 25.0, 25.0, 29.0, 35.0, 28.0, 38.0, 35.0, 31.0, 53.0, 37.0, 43.0, 46.0, 33.0, 49.0, 28.0, 30.0, 33.0, 22.0, 27.0, 20.0, 23.0, 21.0, 19.0, 14.0, 16.0, 8.0, 8.0, 6.0, 9.0, 1.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.4765625, -4.3323974609375, -4.188232421875, -4.0440673828125, -3.89990234375, -3.7557373046875, -3.611572265625, -3.4674072265625, -3.3232421875, -3.1790771484375, -3.034912109375, -2.8907470703125, -2.74658203125, -2.6024169921875, -2.458251953125, -2.3140869140625, -2.169921875, -2.0257568359375, -1.881591796875, -1.7374267578125, -1.59326171875, -1.4490966796875, -1.304931640625, -1.1607666015625, -1.0166015625, -0.8724365234375, -0.728271484375, -0.5841064453125, -0.43994140625, -0.2957763671875, -0.151611328125, -0.0074462890625, 0.13671875, 0.2808837890625, 0.425048828125, 0.5692138671875, 0.71337890625, 0.8575439453125, 1.001708984375, 1.1458740234375, 1.2900390625, 1.4342041015625, 1.578369140625, 1.7225341796875, 1.86669921875, 2.0108642578125, 2.155029296875, 2.2991943359375, 2.443359375, 2.5875244140625, 2.731689453125, 2.8758544921875, 3.02001953125, 3.1641845703125, 3.308349609375, 3.4525146484375, 3.5966796875, 3.7408447265625, 3.885009765625, 4.0291748046875, 4.17333984375, 4.3175048828125, 4.461669921875, 4.6058349609375, 4.75]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 7.0, 12.0, 18.0, 27.0, 24.0, 35.0, 63.0, 89.0, 111.0, 187.0, 226.0, 381.0, 536.0, 829.0, 1264.0, 2028.0, 3029.0, 5076.0, 8529.0, 14741.0, 27617.0, 52366.0, 106600.0, 234118.0, 547070.0, 1110847.0, 1096581.0, 532716.0, 228337.0, 104277.0, 51657.0, 27303.0, 14966.0, 8713.0, 5055.0, 3149.0, 1998.0, 1243.0, 828.0, 520.0, 367.0, 222.0, 159.0, 115.0, 74.0, 54.0, 29.0, 32.0, 13.0, 13.0, 15.0, 6.0, 3.0, 4.0, 2.0, 3.0], "bins": [-13.296875, -12.9056396484375, -12.514404296875, -12.1231689453125, -11.73193359375, -11.3406982421875, -10.949462890625, -10.5582275390625, -10.1669921875, -9.7757568359375, -9.384521484375, -8.9932861328125, -8.60205078125, -8.2108154296875, -7.819580078125, -7.4283447265625, -7.037109375, -6.6458740234375, -6.254638671875, -5.8634033203125, -5.47216796875, -5.0809326171875, -4.689697265625, -4.2984619140625, -3.9072265625, -3.5159912109375, -3.124755859375, -2.7335205078125, -2.34228515625, -1.9510498046875, -1.559814453125, -1.1685791015625, -0.77734375, -0.3861083984375, 0.005126953125, 0.3963623046875, 0.78759765625, 1.1788330078125, 1.570068359375, 1.9613037109375, 2.3525390625, 2.7437744140625, 3.135009765625, 3.5262451171875, 3.91748046875, 4.3087158203125, 4.699951171875, 5.0911865234375, 5.482421875, 5.8736572265625, 6.264892578125, 6.6561279296875, 7.04736328125, 7.4385986328125, 7.829833984375, 8.2210693359375, 8.6123046875, 9.0035400390625, 9.394775390625, 9.7860107421875, 10.17724609375, 10.5684814453125, 10.959716796875, 11.3509521484375, 11.7421875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 13.0, 13.0, 19.0, 27.0, 20.0, 45.0, 26.0, 66.0, 90.0, 128.0, 128.0, 180.0, 218.0, 268.0, 327.0, 354.0, 349.0, 339.0, 302.0, 248.0, 198.0, 127.0, 124.0, 95.0, 79.0, 66.0, 42.0, 45.0, 34.0, 21.0, 21.0, 9.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.23828125, -4.11419677734375, -3.9901123046875, -3.86602783203125, -3.741943359375, -3.61785888671875, -3.4937744140625, -3.36968994140625, -3.24560546875, -3.12152099609375, -2.9974365234375, -2.87335205078125, -2.749267578125, -2.62518310546875, -2.5010986328125, -2.37701416015625, -2.2529296875, -2.12884521484375, -2.0047607421875, -1.88067626953125, -1.756591796875, -1.63250732421875, -1.5084228515625, -1.38433837890625, -1.26025390625, -1.13616943359375, -1.0120849609375, -0.88800048828125, -0.763916015625, -0.63983154296875, -0.5157470703125, -0.39166259765625, -0.267578125, -0.14349365234375, -0.0194091796875, 0.10467529296875, 0.228759765625, 0.35284423828125, 0.4769287109375, 0.60101318359375, 0.72509765625, 0.84918212890625, 0.9732666015625, 1.09735107421875, 1.221435546875, 1.34552001953125, 1.4696044921875, 1.59368896484375, 1.7177734375, 1.84185791015625, 1.9659423828125, 2.09002685546875, 2.214111328125, 2.33819580078125, 2.4622802734375, 2.58636474609375, 2.71044921875, 2.83453369140625, 2.9586181640625, 3.08270263671875, 3.206787109375, 3.33087158203125, 3.4549560546875, 3.57904052734375, 3.703125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 12.0, 6.0, 18.0, 15.0, 16.0, 17.0, 16.0, 26.0, 28.0, 31.0, 49.0, 55.0, 37.0, 62.0, 59.0, 37.0, 76.0, 60.0, 48.0, 47.0, 44.0, 44.0, 31.0, 26.0, 21.0, 20.0, 11.0, 21.0, 18.0, 9.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.486200332641602, -9.154423713684082, -8.822648048400879, -8.49087142944336, -8.159095764160156, -7.827319145202637, -7.495542526245117, -7.163766384124756, -6.8319902420043945, -6.500214099884033, -6.168437957763672, -5.836661338806152, -5.504885196685791, -5.17310905456543, -4.84133243560791, -4.509556293487549, -4.1777801513671875, -3.846004009246826, -3.5142276287078857, -3.1824512481689453, -2.850675106048584, -2.5188989639282227, -2.1871225833892822, -1.8553462028503418, -1.5235700607299805, -1.1917937994003296, -0.8600175380706787, -0.5282412767410278, -0.19646501541137695, 0.13531124591827393, 0.4670875072479248, 0.7988638877868652, 1.1306400299072266, 1.4624162912368774, 1.7941925525665283, 2.1259689331054688, 2.45774507522583, 2.7895212173461914, 3.121297597885132, 3.4530739784240723, 3.7848501205444336, 4.116626262664795, 4.448402404785156, 4.780179023742676, 5.111955165863037, 5.443731307983398, 5.775507926940918, 6.107284069061279, 6.439060211181641, 6.770836353302002, 7.102612495422363, 7.434389114379883, 7.766165256500244, 8.097941398620605, 8.429718017578125, 8.761493682861328, 9.093270301818848, 9.425046920776367, 9.75682258605957, 10.08859920501709, 10.42037582397461, 10.752151489257812, 11.083928108215332, 11.415704727172852, 11.747480392456055]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 10.0, 13.0, 14.0, 14.0, 16.0, 22.0, 17.0, 19.0, 32.0, 31.0, 33.0, 34.0, 26.0, 37.0, 29.0, 34.0, 39.0, 39.0, 47.0, 44.0, 46.0, 41.0, 47.0, 38.0, 36.0, 19.0, 28.0, 31.0, 30.0, 22.0, 16.0, 14.0, 14.0, 8.0, 12.0, 8.0, 7.0, 9.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.198548316955566, -6.969392776489258, -6.740237236022949, -6.511082172393799, -6.28192663192749, -6.052771091461182, -5.823616027832031, -5.594460487365723, -5.365304946899414, -5.1361494064331055, -4.906993865966797, -4.6778388023376465, -4.448683261871338, -4.219527721405029, -3.9903724193573, -3.7612171173095703, -3.5320615768432617, -3.302906036376953, -3.0737507343292236, -2.844595432281494, -2.6154398918151855, -2.386284351348877, -2.1571290493011475, -1.9279736280441284, -1.6988182067871094, -1.4696627855300903, -1.2405073642730713, -1.0113519430160522, -0.7821965217590332, -0.5530411005020142, -0.3238856792449951, -0.09473025798797607, 0.13442468643188477, 0.3635801076889038, 0.5927355289459229, 0.8218909502029419, 1.051046371459961, 1.28020179271698, 1.509357213973999, 1.738512635231018, 1.967668056488037, 2.1968235969543457, 2.425978899002075, 2.6551342010498047, 2.8842897415161133, 3.113445281982422, 3.3426005840301514, 3.571755886077881, 3.8009114265441895, 4.030066967010498, 4.259222030639648, 4.488377571105957, 4.717533111572266, 4.946688652038574, 5.175844192504883, 5.404999256134033, 5.634154796600342, 5.86331033706665, 6.092465400695801, 6.321620941162109, 6.550776481628418, 6.779932022094727, 7.009087562561035, 7.2382426261901855, 7.467398166656494]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 6.0, 21.0, 32.0, 32.0, 62.0, 68.0, 113.0, 208.0, 276.0, 434.0, 589.0, 1045.0, 1734.0, 2793.0, 4591.0, 8211.0, 14313.0, 25149.0, 44627.0, 77981.0, 127663.0, 179877.0, 190331.0, 147955.0, 93529.0, 54496.0, 30833.0, 17200.0, 9867.0, 5598.0, 3476.0, 1990.0, 1241.0, 793.0, 485.0, 299.0, 206.0, 124.0, 92.0, 63.0, 42.0, 36.0, 22.0, 22.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-5.2578125, -5.10833740234375, -4.9588623046875, -4.80938720703125, -4.659912109375, -4.51043701171875, -4.3609619140625, -4.21148681640625, -4.06201171875, -3.91253662109375, -3.7630615234375, -3.61358642578125, -3.464111328125, -3.31463623046875, -3.1651611328125, -3.01568603515625, -2.8662109375, -2.71673583984375, -2.5672607421875, -2.41778564453125, -2.268310546875, -2.11883544921875, -1.9693603515625, -1.81988525390625, -1.67041015625, -1.52093505859375, -1.3714599609375, -1.22198486328125, -1.072509765625, -0.92303466796875, -0.7735595703125, -0.62408447265625, -0.474609375, -0.32513427734375, -0.1756591796875, -0.02618408203125, 0.123291015625, 0.27276611328125, 0.4222412109375, 0.57171630859375, 0.72119140625, 0.87066650390625, 1.0201416015625, 1.16961669921875, 1.319091796875, 1.46856689453125, 1.6180419921875, 1.76751708984375, 1.9169921875, 2.06646728515625, 2.2159423828125, 2.36541748046875, 2.514892578125, 2.66436767578125, 2.8138427734375, 2.96331787109375, 3.11279296875, 3.26226806640625, 3.4117431640625, 3.56121826171875, 3.710693359375, 3.86016845703125, 4.0096435546875, 4.15911865234375, 4.30859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 5.0, 7.0, 26.0, 14.0, 10.0, 12.0, 12.0, 27.0, 27.0, 29.0, 26.0, 31.0, 37.0, 28.0, 35.0, 37.0, 39.0, 48.0, 53.0, 53.0, 50.0, 39.0, 42.0, 43.0, 36.0, 31.0, 29.0, 22.0, 27.0, 21.0, 14.0, 8.0, 13.0, 9.0, 11.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.1953125, -7.940185546875, -7.68505859375, -7.429931640625, -7.1748046875, -6.919677734375, -6.66455078125, -6.409423828125, -6.154296875, -5.899169921875, -5.64404296875, -5.388916015625, -5.1337890625, -4.878662109375, -4.62353515625, -4.368408203125, -4.11328125, -3.858154296875, -3.60302734375, -3.347900390625, -3.0927734375, -2.837646484375, -2.58251953125, -2.327392578125, -2.072265625, -1.817138671875, -1.56201171875, -1.306884765625, -1.0517578125, -0.796630859375, -0.54150390625, -0.286376953125, -0.03125, 0.223876953125, 0.47900390625, 0.734130859375, 0.9892578125, 1.244384765625, 1.49951171875, 1.754638671875, 2.009765625, 2.264892578125, 2.52001953125, 2.775146484375, 3.0302734375, 3.285400390625, 3.54052734375, 3.795654296875, 4.05078125, 4.305908203125, 4.56103515625, 4.816162109375, 5.0712890625, 5.326416015625, 5.58154296875, 5.836669921875, 6.091796875, 6.346923828125, 6.60205078125, 6.857177734375, 7.1123046875, 7.367431640625, 7.62255859375, 7.877685546875, 8.1328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 9.0, 20.0, 14.0, 17.0, 37.0, 39.0, 46.0, 56.0, 95.0, 123.0, 188.0, 261.0, 363.0, 572.0, 951.0, 1510.0, 2701.0, 4618.0, 8478.0, 16346.0, 31865.0, 65511.0, 131410.0, 231353.0, 248519.0, 149994.0, 75488.0, 36665.0, 18596.0, 9557.0, 5395.0, 2976.0, 1711.0, 1030.0, 645.0, 398.0, 252.0, 197.0, 149.0, 103.0, 60.0, 55.0, 37.0, 35.0, 29.0, 17.0, 12.0, 11.0, 11.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.15625, -6.933349609375, -6.71044921875, -6.487548828125, -6.2646484375, -6.041748046875, -5.81884765625, -5.595947265625, -5.373046875, -5.150146484375, -4.92724609375, -4.704345703125, -4.4814453125, -4.258544921875, -4.03564453125, -3.812744140625, -3.58984375, -3.366943359375, -3.14404296875, -2.921142578125, -2.6982421875, -2.475341796875, -2.25244140625, -2.029541015625, -1.806640625, -1.583740234375, -1.36083984375, -1.137939453125, -0.9150390625, -0.692138671875, -0.46923828125, -0.246337890625, -0.0234375, 0.199462890625, 0.42236328125, 0.645263671875, 0.8681640625, 1.091064453125, 1.31396484375, 1.536865234375, 1.759765625, 1.982666015625, 2.20556640625, 2.428466796875, 2.6513671875, 2.874267578125, 3.09716796875, 3.320068359375, 3.54296875, 3.765869140625, 3.98876953125, 4.211669921875, 4.4345703125, 4.657470703125, 4.88037109375, 5.103271484375, 5.326171875, 5.549072265625, 5.77197265625, 5.994873046875, 6.2177734375, 6.440673828125, 6.66357421875, 6.886474609375, 7.109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 4.0, 13.0, 16.0, 17.0, 17.0, 13.0, 18.0, 32.0, 18.0, 35.0, 14.0, 21.0, 25.0, 35.0, 42.0, 40.0, 35.0, 38.0, 35.0, 36.0, 39.0, 46.0, 36.0, 32.0, 34.0, 35.0, 27.0, 28.0, 25.0, 22.0, 23.0, 19.0, 20.0, 15.0, 11.0, 13.0, 7.0, 9.0, 6.0, 8.0, 6.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.6015625, -4.467315673828125, -4.33306884765625, -4.198822021484375, -4.0645751953125, -3.930328369140625, -3.79608154296875, -3.661834716796875, -3.527587890625, -3.393341064453125, -3.25909423828125, -3.124847412109375, -2.9906005859375, -2.856353759765625, -2.72210693359375, -2.587860107421875, -2.45361328125, -2.319366455078125, -2.18511962890625, -2.050872802734375, -1.9166259765625, -1.782379150390625, -1.64813232421875, -1.513885498046875, -1.379638671875, -1.245391845703125, -1.11114501953125, -0.976898193359375, -0.8426513671875, -0.708404541015625, -0.57415771484375, -0.439910888671875, -0.3056640625, -0.171417236328125, -0.03717041015625, 0.097076416015625, 0.2313232421875, 0.365570068359375, 0.49981689453125, 0.634063720703125, 0.768310546875, 0.902557373046875, 1.03680419921875, 1.171051025390625, 1.3052978515625, 1.439544677734375, 1.57379150390625, 1.708038330078125, 1.84228515625, 1.976531982421875, 2.11077880859375, 2.245025634765625, 2.3792724609375, 2.513519287109375, 2.64776611328125, 2.782012939453125, 2.916259765625, 3.050506591796875, 3.18475341796875, 3.319000244140625, 3.4532470703125, 3.587493896484375, 3.72174072265625, 3.855987548828125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 8.0, 8.0, 7.0, 9.0, 10.0, 17.0, 23.0, 44.0, 57.0, 78.0, 125.0, 177.0, 280.0, 427.0, 678.0, 1090.0, 1817.0, 3046.0, 5211.0, 9546.0, 16949.0, 32367.0, 62700.0, 122547.0, 220672.0, 248455.0, 153177.0, 79302.0, 40969.0, 21417.0, 11371.0, 6390.0, 3699.0, 2219.0, 1372.0, 839.0, 510.0, 319.0, 188.0, 139.0, 103.0, 60.0, 41.0, 21.0, 23.0, 18.0, 21.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.73046875, -3.621307373046875, -3.51214599609375, -3.402984619140625, -3.2938232421875, -3.184661865234375, -3.07550048828125, -2.966339111328125, -2.857177734375, -2.748016357421875, -2.63885498046875, -2.529693603515625, -2.4205322265625, -2.311370849609375, -2.20220947265625, -2.093048095703125, -1.98388671875, -1.874725341796875, -1.76556396484375, -1.656402587890625, -1.5472412109375, -1.438079833984375, -1.32891845703125, -1.219757080078125, -1.110595703125, -1.001434326171875, -0.89227294921875, -0.783111572265625, -0.6739501953125, -0.564788818359375, -0.45562744140625, -0.346466064453125, -0.2373046875, -0.128143310546875, -0.01898193359375, 0.090179443359375, 0.1993408203125, 0.308502197265625, 0.41766357421875, 0.526824951171875, 0.635986328125, 0.745147705078125, 0.85430908203125, 0.963470458984375, 1.0726318359375, 1.181793212890625, 1.29095458984375, 1.400115966796875, 1.50927734375, 1.618438720703125, 1.72760009765625, 1.836761474609375, 1.9459228515625, 2.055084228515625, 2.16424560546875, 2.273406982421875, 2.382568359375, 2.491729736328125, 2.60089111328125, 2.710052490234375, 2.8192138671875, 2.928375244140625, 3.03753662109375, 3.146697998046875, 3.255859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 8.0, 8.0, 10.0, 12.0, 16.0, 33.0, 35.0, 35.0, 44.0, 55.0, 52.0, 58.0, 65.0, 83.0, 73.0, 62.0, 56.0, 55.0, 44.0, 42.0, 30.0, 21.0, 20.0, 17.0, 10.0, 8.0, 11.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012493133544921875, -0.0001205839216709137, -0.00011623650789260864, -0.00011188909411430359, -0.00010754168033599854, -0.00010319426655769348, -9.884685277938843e-05, -9.449943900108337e-05, -9.015202522277832e-05, -8.580461144447327e-05, -8.145719766616821e-05, -7.710978388786316e-05, -7.27623701095581e-05, -6.841495633125305e-05, -6.4067542552948e-05, -5.9720128774642944e-05, -5.537271499633789e-05, -5.102530121803284e-05, -4.667788743972778e-05, -4.233047366142273e-05, -3.7983059883117676e-05, -3.363564610481262e-05, -2.928823232650757e-05, -2.4940818548202515e-05, -2.059340476989746e-05, -1.6245990991592407e-05, -1.1898577213287354e-05, -7.5511634349823e-06, -3.203749656677246e-06, 1.1436641216278076e-06, 5.491077899932861e-06, 9.838491678237915e-06, 1.4185905456542969e-05, 1.8533319234848022e-05, 2.2880733013153076e-05, 2.722814679145813e-05, 3.1575560569763184e-05, 3.592297434806824e-05, 4.027038812637329e-05, 4.4617801904678345e-05, 4.89652156829834e-05, 5.331262946128845e-05, 5.7660043239593506e-05, 6.200745701789856e-05, 6.635487079620361e-05, 7.070228457450867e-05, 7.504969835281372e-05, 7.939711213111877e-05, 8.374452590942383e-05, 8.809193968772888e-05, 9.243935346603394e-05, 9.678676724433899e-05, 0.00010113418102264404, 0.0001054815948009491, 0.00010982900857925415, 0.0001141764223575592, 0.00011852383613586426, 0.0001228712499141693, 0.00012721866369247437, 0.00013156607747077942, 0.00013591349124908447, 0.00014026090502738953, 0.00014460831880569458, 0.00014895573258399963, 0.0001533031463623047]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 19.0, 22.0, 35.0, 52.0, 77.0, 114.0, 159.0, 286.0, 486.0, 724.0, 1149.0, 1899.0, 3117.0, 5362.0, 9315.0, 16303.0, 29239.0, 51874.0, 90397.0, 145421.0, 193430.0, 184344.0, 131232.0, 79227.0, 45101.0, 25065.0, 14092.0, 8015.0, 4701.0, 2799.0, 1711.0, 1024.0, 626.0, 411.0, 269.0, 148.0, 90.0, 70.0, 44.0, 32.0, 27.0, 11.0, 8.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.337890625, -3.236358642578125, -3.13482666015625, -3.033294677734375, -2.9317626953125, -2.830230712890625, -2.72869873046875, -2.627166748046875, -2.525634765625, -2.424102783203125, -2.32257080078125, -2.221038818359375, -2.1195068359375, -2.017974853515625, -1.91644287109375, -1.814910888671875, -1.71337890625, -1.611846923828125, -1.51031494140625, -1.408782958984375, -1.3072509765625, -1.205718994140625, -1.10418701171875, -1.002655029296875, -0.901123046875, -0.799591064453125, -0.69805908203125, -0.596527099609375, -0.4949951171875, -0.393463134765625, -0.29193115234375, -0.190399169921875, -0.0888671875, 0.012664794921875, 0.11419677734375, 0.215728759765625, 0.3172607421875, 0.418792724609375, 0.52032470703125, 0.621856689453125, 0.723388671875, 0.824920654296875, 0.92645263671875, 1.027984619140625, 1.1295166015625, 1.231048583984375, 1.33258056640625, 1.434112548828125, 1.53564453125, 1.637176513671875, 1.73870849609375, 1.840240478515625, 1.9417724609375, 2.043304443359375, 2.14483642578125, 2.246368408203125, 2.347900390625, 2.449432373046875, 2.55096435546875, 2.652496337890625, 2.7540283203125, 2.855560302734375, 2.95709228515625, 3.058624267578125, 3.16015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 5.0, 8.0, 9.0, 8.0, 18.0, 20.0, 22.0, 25.0, 34.0, 37.0, 52.0, 64.0, 51.0, 72.0, 60.0, 67.0, 67.0, 55.0, 56.0, 47.0, 49.0, 32.0, 22.0, 31.0, 24.0, 16.0, 14.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.227447509765625, -1.19122314453125, -1.154998779296875, -1.1187744140625, -1.082550048828125, -1.04632568359375, -1.010101318359375, -0.973876953125, -0.937652587890625, -0.90142822265625, -0.865203857421875, -0.8289794921875, -0.792755126953125, -0.75653076171875, -0.720306396484375, -0.68408203125, -0.647857666015625, -0.61163330078125, -0.575408935546875, -0.5391845703125, -0.502960205078125, -0.46673583984375, -0.430511474609375, -0.394287109375, -0.358062744140625, -0.32183837890625, -0.285614013671875, -0.2493896484375, -0.213165283203125, -0.17694091796875, -0.140716552734375, -0.1044921875, -0.068267822265625, -0.03204345703125, 0.004180908203125, 0.0404052734375, 0.076629638671875, 0.11285400390625, 0.149078369140625, 0.185302734375, 0.221527099609375, 0.25775146484375, 0.293975830078125, 0.3302001953125, 0.366424560546875, 0.40264892578125, 0.438873291015625, 0.47509765625, 0.511322021484375, 0.54754638671875, 0.583770751953125, 0.6199951171875, 0.656219482421875, 0.69244384765625, 0.728668212890625, 0.764892578125, 0.801116943359375, 0.83734130859375, 0.873565673828125, 0.9097900390625, 0.946014404296875, 0.98223876953125, 1.018463134765625, 1.0546875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 9.0, 9.0, 21.0, 15.0, 15.0, 16.0, 28.0, 32.0, 28.0, 49.0, 38.0, 50.0, 55.0, 55.0, 48.0, 66.0, 57.0, 43.0, 45.0, 41.0, 40.0, 36.0, 28.0, 28.0, 24.0, 21.0, 14.0, 16.0, 5.0, 7.0, 6.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.05610179901123, -8.740498542785645, -8.424895286560059, -8.109292984008789, -7.793689727783203, -7.478086471557617, -7.162483215332031, -6.8468804359436035, -6.531277656555176, -6.21567440032959, -5.900071620941162, -5.584468364715576, -5.268865585327148, -4.9532623291015625, -4.637659072875977, -4.322056293487549, -4.006453037261963, -3.690850019454956, -3.375247001647949, -3.0596437454223633, -2.7440409660339355, -2.4284377098083496, -2.1128346920013428, -1.797231674194336, -1.481628656387329, -1.1660256385803223, -0.8504225611686707, -0.534819483757019, -0.2192164659500122, 0.09638655185699463, 0.411989688873291, 0.7275927066802979, 1.0431957244873047, 1.3587987422943115, 1.6744017601013184, 1.9900048971176147, 2.305607795715332, 2.621211051940918, 2.936814069747925, 3.2524170875549316, 3.5680201053619385, 3.8836231231689453, 4.199226379394531, 4.514829158782959, 4.830432415008545, 5.146035194396973, 5.461638450622559, 5.7772417068481445, 6.092844486236572, 6.408447742462158, 6.724050521850586, 7.039653778076172, 7.3552565574646, 7.6708598136901855, 7.986462593078613, 8.3020658493042, 8.617669105529785, 8.933272361755371, 9.248875617980957, 9.564477920532227, 9.880081176757812, 10.195684432983398, 10.511287689208984, 10.82689094543457, 11.14249324798584]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 13.0, 13.0, 16.0, 11.0, 14.0, 22.0, 16.0, 23.0, 29.0, 30.0, 33.0, 31.0, 33.0, 33.0, 31.0, 33.0, 43.0, 39.0, 41.0, 51.0, 49.0, 44.0, 35.0, 47.0, 29.0, 19.0, 30.0, 30.0, 36.0, 13.0, 23.0, 12.0, 16.0, 8.0, 11.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.210147380828857, -6.9790754318237305, -6.748003959655762, -6.516932487487793, -6.285860538482666, -6.054788589477539, -5.82371711730957, -5.592645645141602, -5.361573696136475, -5.130501747131348, -4.899430274963379, -4.66835880279541, -4.437286853790283, -4.206214904785156, -3.9751434326171875, -3.7440717220306396, -3.513000011444092, -3.281928300857544, -3.050856590270996, -2.8197848796844482, -2.5887131690979004, -2.3576414585113525, -2.1265697479248047, -1.8954980373382568, -1.664426326751709, -1.4333546161651611, -1.2022829055786133, -0.9712111949920654, -0.7401394844055176, -0.5090677738189697, -0.2779960632324219, -0.04692435264587402, 0.18414783477783203, 0.4152195453643799, 0.6462912559509277, 0.8773629665374756, 1.1084346771240234, 1.3395063877105713, 1.5705780982971191, 1.801649808883667, 2.032721519470215, 2.2637932300567627, 2.4948649406433105, 2.7259366512298584, 2.9570083618164062, 3.188080072402954, 3.419151782989502, 3.65022349357605, 3.8812952041625977, 4.112366676330566, 4.343438625335693, 4.57451057434082, 4.805582046508789, 5.036653518676758, 5.267725467681885, 5.498797416687012, 5.7298688888549805, 5.960940361022949, 6.192012310028076, 6.423084259033203, 6.654155731201172, 6.885227203369141, 7.116299152374268, 7.3473711013793945, 7.578442573547363]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 4.0, 3.0, 9.0, 24.0, 17.0, 36.0, 56.0, 105.0, 169.0, 330.0, 564.0, 1005.0, 2005.0, 3911.0, 7597.0, 15072.0, 31676.0, 64713.0, 127206.0, 206703.0, 232631.0, 169970.0, 93575.0, 46545.0, 22105.0, 10837.0, 5559.0, 2779.0, 1516.0, 806.0, 443.0, 244.0, 124.0, 99.0, 44.0, 31.0, 21.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.921875, -6.6583251953125, -6.394775390625, -6.1312255859375, -5.86767578125, -5.6041259765625, -5.340576171875, -5.0770263671875, -4.8134765625, -4.5499267578125, -4.286376953125, -4.0228271484375, -3.75927734375, -3.4957275390625, -3.232177734375, -2.9686279296875, -2.705078125, -2.4415283203125, -2.177978515625, -1.9144287109375, -1.65087890625, -1.3873291015625, -1.123779296875, -0.8602294921875, -0.5966796875, -0.3331298828125, -0.069580078125, 0.1939697265625, 0.45751953125, 0.7210693359375, 0.984619140625, 1.2481689453125, 1.51171875, 1.7752685546875, 2.038818359375, 2.3023681640625, 2.56591796875, 2.8294677734375, 3.093017578125, 3.3565673828125, 3.6201171875, 3.8836669921875, 4.147216796875, 4.4107666015625, 4.67431640625, 4.9378662109375, 5.201416015625, 5.4649658203125, 5.728515625, 5.9920654296875, 6.255615234375, 6.5191650390625, 6.78271484375, 7.0462646484375, 7.309814453125, 7.5733642578125, 7.8369140625, 8.1004638671875, 8.364013671875, 8.6275634765625, 8.89111328125, 9.1546630859375, 9.418212890625, 9.6817626953125, 9.9453125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 11.0, 7.0, 18.0, 17.0, 19.0, 24.0, 15.0, 31.0, 31.0, 18.0, 28.0, 36.0, 42.0, 36.0, 46.0, 38.0, 43.0, 53.0, 54.0, 48.0, 42.0, 37.0, 39.0, 30.0, 24.0, 24.0, 24.0, 27.0, 24.0, 24.0, 11.0, 16.0, 10.0, 10.0, 7.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.59765625, -7.34710693359375, -7.0965576171875, -6.84600830078125, -6.595458984375, -6.34490966796875, -6.0943603515625, -5.84381103515625, -5.59326171875, -5.34271240234375, -5.0921630859375, -4.84161376953125, -4.591064453125, -4.34051513671875, -4.0899658203125, -3.83941650390625, -3.5888671875, -3.33831787109375, -3.0877685546875, -2.83721923828125, -2.586669921875, -2.33612060546875, -2.0855712890625, -1.83502197265625, -1.58447265625, -1.33392333984375, -1.0833740234375, -0.83282470703125, -0.582275390625, -0.33172607421875, -0.0811767578125, 0.16937255859375, 0.419921875, 0.67047119140625, 0.9210205078125, 1.17156982421875, 1.422119140625, 1.67266845703125, 1.9232177734375, 2.17376708984375, 2.42431640625, 2.67486572265625, 2.9254150390625, 3.17596435546875, 3.426513671875, 3.67706298828125, 3.9276123046875, 4.17816162109375, 4.4287109375, 4.67926025390625, 4.9298095703125, 5.18035888671875, 5.430908203125, 5.68145751953125, 5.9320068359375, 6.18255615234375, 6.43310546875, 6.68365478515625, 6.9342041015625, 7.18475341796875, 7.435302734375, 7.68585205078125, 7.9364013671875, 8.18695068359375, 8.4375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 6.0, 13.0, 14.0, 22.0, 34.0, 44.0, 81.0, 98.0, 137.0, 231.0, 358.0, 560.0, 968.0, 1459.0, 2523.0, 4014.0, 6702.0, 11298.0, 19352.0, 33318.0, 56498.0, 92931.0, 138653.0, 174447.0, 169328.0, 129091.0, 83509.0, 50601.0, 29591.0, 17160.0, 10137.0, 6045.0, 3574.0, 2108.0, 1345.0, 802.0, 524.0, 319.0, 225.0, 144.0, 82.0, 58.0, 40.0, 27.0, 21.0, 11.0, 21.0, 11.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.7734375, -6.56103515625, -6.3486328125, -6.13623046875, -5.923828125, -5.71142578125, -5.4990234375, -5.28662109375, -5.07421875, -4.86181640625, -4.6494140625, -4.43701171875, -4.224609375, -4.01220703125, -3.7998046875, -3.58740234375, -3.375, -3.16259765625, -2.9501953125, -2.73779296875, -2.525390625, -2.31298828125, -2.1005859375, -1.88818359375, -1.67578125, -1.46337890625, -1.2509765625, -1.03857421875, -0.826171875, -0.61376953125, -0.4013671875, -0.18896484375, 0.0234375, 0.23583984375, 0.4482421875, 0.66064453125, 0.873046875, 1.08544921875, 1.2978515625, 1.51025390625, 1.72265625, 1.93505859375, 2.1474609375, 2.35986328125, 2.572265625, 2.78466796875, 2.9970703125, 3.20947265625, 3.421875, 3.63427734375, 3.8466796875, 4.05908203125, 4.271484375, 4.48388671875, 4.6962890625, 4.90869140625, 5.12109375, 5.33349609375, 5.5458984375, 5.75830078125, 5.970703125, 6.18310546875, 6.3955078125, 6.60791015625, 6.8203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 7.0, 2.0, 5.0, 6.0, 3.0, 9.0, 8.0, 14.0, 21.0, 16.0, 18.0, 23.0, 32.0, 26.0, 27.0, 39.0, 29.0, 53.0, 40.0, 33.0, 41.0, 39.0, 47.0, 38.0, 29.0, 39.0, 31.0, 23.0, 45.0, 30.0, 35.0, 31.0, 18.0, 16.0, 19.0, 19.0, 11.0, 10.0, 6.0, 15.0, 8.0, 12.0, 9.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.3956298828125, -4.252197265625, -4.1087646484375, -3.96533203125, -3.8218994140625, -3.678466796875, -3.5350341796875, -3.3916015625, -3.2481689453125, -3.104736328125, -2.9613037109375, -2.81787109375, -2.6744384765625, -2.531005859375, -2.3875732421875, -2.244140625, -2.1007080078125, -1.957275390625, -1.8138427734375, -1.67041015625, -1.5269775390625, -1.383544921875, -1.2401123046875, -1.0966796875, -0.9532470703125, -0.809814453125, -0.6663818359375, -0.52294921875, -0.3795166015625, -0.236083984375, -0.0926513671875, 0.05078125, 0.1942138671875, 0.337646484375, 0.4810791015625, 0.62451171875, 0.7679443359375, 0.911376953125, 1.0548095703125, 1.1982421875, 1.3416748046875, 1.485107421875, 1.6285400390625, 1.77197265625, 1.9154052734375, 2.058837890625, 2.2022705078125, 2.345703125, 2.4891357421875, 2.632568359375, 2.7760009765625, 2.91943359375, 3.0628662109375, 3.206298828125, 3.3497314453125, 3.4931640625, 3.6365966796875, 3.780029296875, 3.9234619140625, 4.06689453125, 4.2103271484375, 4.353759765625, 4.4971923828125, 4.640625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 4.0, 5.0, 7.0, 13.0, 12.0, 31.0, 26.0, 50.0, 60.0, 83.0, 113.0, 167.0, 258.0, 379.0, 548.0, 811.0, 1280.0, 1971.0, 3337.0, 5505.0, 9772.0, 19004.0, 38982.0, 87020.0, 191503.0, 286352.0, 210703.0, 99177.0, 43729.0, 20898.0, 10908.0, 6093.0, 3490.0, 2131.0, 1357.0, 944.0, 569.0, 387.0, 274.0, 168.0, 130.0, 85.0, 75.0, 55.0, 30.0, 21.0, 9.0, 13.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.1953125, -5.03582763671875, -4.8763427734375, -4.71685791015625, -4.557373046875, -4.39788818359375, -4.2384033203125, -4.07891845703125, -3.91943359375, -3.75994873046875, -3.6004638671875, -3.44097900390625, -3.281494140625, -3.12200927734375, -2.9625244140625, -2.80303955078125, -2.6435546875, -2.48406982421875, -2.3245849609375, -2.16510009765625, -2.005615234375, -1.84613037109375, -1.6866455078125, -1.52716064453125, -1.36767578125, -1.20819091796875, -1.0487060546875, -0.88922119140625, -0.729736328125, -0.57025146484375, -0.4107666015625, -0.25128173828125, -0.091796875, 0.06768798828125, 0.2271728515625, 0.38665771484375, 0.546142578125, 0.70562744140625, 0.8651123046875, 1.02459716796875, 1.18408203125, 1.34356689453125, 1.5030517578125, 1.66253662109375, 1.822021484375, 1.98150634765625, 2.1409912109375, 2.30047607421875, 2.4599609375, 2.61944580078125, 2.7789306640625, 2.93841552734375, 3.097900390625, 3.25738525390625, 3.4168701171875, 3.57635498046875, 3.73583984375, 3.89532470703125, 4.0548095703125, 4.21429443359375, 4.373779296875, 4.53326416015625, 4.6927490234375, 4.85223388671875, 5.01171875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 3.0, 2.0, 4.0, 8.0, 7.0, 7.0, 7.0, 12.0, 17.0, 22.0, 28.0, 36.0, 33.0, 47.0, 58.0, 61.0, 65.0, 70.0, 64.0, 59.0, 61.0, 57.0, 44.0, 37.0, 39.0, 31.0, 24.0, 19.0, 21.0, 11.0, 9.0, 1.0, 8.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0003387928009033203, -0.00032854825258255005, -0.0003183037042617798, -0.0003080591559410095, -0.00029781460762023926, -0.000287570059299469, -0.00027732551097869873, -0.00026708096265792847, -0.0002568364143371582, -0.00024659186601638794, -0.00023634731769561768, -0.0002261027693748474, -0.00021585822105407715, -0.00020561367273330688, -0.00019536912441253662, -0.00018512457609176636, -0.0001748800277709961, -0.00016463547945022583, -0.00015439093112945557, -0.0001441463828086853, -0.00013390183448791504, -0.00012365728616714478, -0.00011341273784637451, -0.00010316818952560425, -9.292364120483398e-05, -8.267909288406372e-05, -7.243454456329346e-05, -6.21899962425232e-05, -5.194544792175293e-05, -4.1700899600982666e-05, -3.14563512802124e-05, -2.121180295944214e-05, -1.0967254638671875e-05, -7.227063179016113e-07, 9.521842002868652e-06, 1.9766390323638916e-05, 3.001093864440918e-05, 4.025548696517944e-05, 5.050003528594971e-05, 6.074458360671997e-05, 7.098913192749023e-05, 8.12336802482605e-05, 9.147822856903076e-05, 0.00010172277688980103, 0.00011196732521057129, 0.00012221187353134155, 0.00013245642185211182, 0.00014270097017288208, 0.00015294551849365234, 0.0001631900668144226, 0.00017343461513519287, 0.00018367916345596313, 0.0001939237117767334, 0.00020416826009750366, 0.00021441280841827393, 0.0002246573567390442, 0.00023490190505981445, 0.0002451464533805847, 0.000255391001701355, 0.00026563555002212524, 0.0002758800983428955, 0.00028612464666366577, 0.00029636919498443604, 0.0003066137433052063, 0.00031685829162597656]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 8.0, 16.0, 22.0, 24.0, 36.0, 52.0, 81.0, 108.0, 163.0, 247.0, 301.0, 498.0, 723.0, 1080.0, 1798.0, 2714.0, 4536.0, 7689.0, 13659.0, 25332.0, 49265.0, 96965.0, 181538.0, 244365.0, 193236.0, 106384.0, 54132.0, 27323.0, 14729.0, 8386.0, 4750.0, 2976.0, 1783.0, 1236.0, 772.0, 541.0, 341.0, 208.0, 163.0, 106.0, 74.0, 69.0, 32.0, 19.0, 24.0, 13.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-4.61328125, -4.47161865234375, -4.3299560546875, -4.18829345703125, -4.046630859375, -3.90496826171875, -3.7633056640625, -3.62164306640625, -3.47998046875, -3.33831787109375, -3.1966552734375, -3.05499267578125, -2.913330078125, -2.77166748046875, -2.6300048828125, -2.48834228515625, -2.3466796875, -2.20501708984375, -2.0633544921875, -1.92169189453125, -1.780029296875, -1.63836669921875, -1.4967041015625, -1.35504150390625, -1.21337890625, -1.07171630859375, -0.9300537109375, -0.78839111328125, -0.646728515625, -0.50506591796875, -0.3634033203125, -0.22174072265625, -0.080078125, 0.06158447265625, 0.2032470703125, 0.34490966796875, 0.486572265625, 0.62823486328125, 0.7698974609375, 0.91156005859375, 1.05322265625, 1.19488525390625, 1.3365478515625, 1.47821044921875, 1.619873046875, 1.76153564453125, 1.9031982421875, 2.04486083984375, 2.1865234375, 2.32818603515625, 2.4698486328125, 2.61151123046875, 2.753173828125, 2.89483642578125, 3.0364990234375, 3.17816162109375, 3.31982421875, 3.46148681640625, 3.6031494140625, 3.74481201171875, 3.886474609375, 4.02813720703125, 4.1697998046875, 4.31146240234375, 4.453125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 8.0, 4.0, 8.0, 7.0, 9.0, 24.0, 17.0, 27.0, 17.0, 25.0, 33.0, 40.0, 45.0, 37.0, 70.0, 73.0, 64.0, 72.0, 68.0, 62.0, 68.0, 42.0, 33.0, 19.0, 28.0, 21.0, 14.0, 13.0, 7.0, 12.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.3202362060546875, -1.277191162109375, -1.2341461181640625, -1.19110107421875, -1.1480560302734375, -1.105010986328125, -1.0619659423828125, -1.0189208984375, -0.9758758544921875, -0.932830810546875, -0.8897857666015625, -0.84674072265625, -0.8036956787109375, -0.760650634765625, -0.7176055908203125, -0.674560546875, -0.6315155029296875, -0.588470458984375, -0.5454254150390625, -0.50238037109375, -0.4593353271484375, -0.416290283203125, -0.3732452392578125, -0.3302001953125, -0.2871551513671875, -0.244110107421875, -0.2010650634765625, -0.15802001953125, -0.1149749755859375, -0.071929931640625, -0.0288848876953125, 0.01416015625, 0.0572052001953125, 0.100250244140625, 0.1432952880859375, 0.18634033203125, 0.2293853759765625, 0.272430419921875, 0.3154754638671875, 0.3585205078125, 0.4015655517578125, 0.444610595703125, 0.4876556396484375, 0.53070068359375, 0.5737457275390625, 0.616790771484375, 0.6598358154296875, 0.702880859375, 0.7459259033203125, 0.788970947265625, 0.8320159912109375, 0.87506103515625, 0.9181060791015625, 0.961151123046875, 1.0041961669921875, 1.0472412109375, 1.0902862548828125, 1.133331298828125, 1.1763763427734375, 1.21942138671875, 1.2624664306640625, 1.305511474609375, 1.3485565185546875, 1.3916015625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 3.0, 0.0, 4.0, 9.0, 3.0, 11.0, 11.0, 10.0, 13.0, 15.0, 21.0, 23.0, 28.0, 25.0, 28.0, 34.0, 49.0, 50.0, 49.0, 65.0, 52.0, 56.0, 54.0, 42.0, 39.0, 50.0, 37.0, 29.0, 33.0, 34.0, 30.0, 19.0, 15.0, 9.0, 6.0, 9.0, 6.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.812718391418457, -8.497692108154297, -8.182665824890137, -7.867639541625977, -7.552613258361816, -7.237586975097656, -6.922560691833496, -6.607534408569336, -6.292508125305176, -5.977481842041016, -5.6624555587768555, -5.347429275512695, -5.032402992248535, -4.717376708984375, -4.402350425720215, -4.087324142456055, -3.7722978591918945, -3.4572715759277344, -3.142245292663574, -2.827219009399414, -2.512192726135254, -2.1971664428710938, -1.8821401596069336, -1.5671138763427734, -1.2520875930786133, -0.9370613098144531, -0.622035026550293, -0.3070087432861328, 0.008017539978027344, 0.3230438232421875, 0.6380701065063477, 0.9530963897705078, 1.2681236267089844, 1.5831499099731445, 1.8981761932373047, 2.213202476501465, 2.528228759765625, 2.843255043029785, 3.1582813262939453, 3.4733076095581055, 3.7883338928222656, 4.103360176086426, 4.418386459350586, 4.733412742614746, 5.048439025878906, 5.363465309143066, 5.678491592407227, 5.993517875671387, 6.308544158935547, 6.623570442199707, 6.938596725463867, 7.253623008728027, 7.5686492919921875, 7.883675575256348, 8.198701858520508, 8.513728141784668, 8.828754425048828, 9.143780708312988, 9.458806991577148, 9.773833274841309, 10.088859558105469, 10.403885841369629, 10.718912124633789, 11.03393840789795, 11.34896469116211]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 11.0, 10.0, 14.0, 23.0, 23.0, 18.0, 27.0, 28.0, 24.0, 31.0, 29.0, 48.0, 50.0, 52.0, 49.0, 42.0, 38.0, 39.0, 43.0, 43.0, 44.0, 41.0, 32.0, 31.0, 42.0, 24.0, 21.0, 23.0, 18.0, 20.0, 4.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.13933277130127, -7.876277923583984, -7.613223075866699, -7.350168704986572, -7.087113857269287, -6.824059009552002, -6.561004638671875, -6.29794979095459, -6.034894943237305, -5.7718400955200195, -5.508785247802734, -5.245730876922607, -4.982676029205322, -4.719621181488037, -4.45656681060791, -4.193511962890625, -3.93045711517334, -3.6674022674560547, -3.4043476581573486, -3.1412930488586426, -2.8782382011413574, -2.6151833534240723, -2.352128744125366, -2.08907413482666, -1.826019287109375, -1.5629645586013794, -1.2999098300933838, -1.0368551015853882, -0.7738003730773926, -0.510745644569397, -0.24769091606140137, 0.015363812446594238, 0.27841949462890625, 0.5414742231369019, 0.8045289516448975, 1.067583680152893, 1.3306384086608887, 1.5936931371688843, 1.8567478656768799, 2.119802474975586, 2.382857322692871, 2.6459121704101562, 2.9089667797088623, 3.1720213890075684, 3.4350762367248535, 3.6981310844421387, 3.9611856937408447, 4.224240303039551, 4.487295150756836, 4.750349998474121, 5.013404846191406, 5.276459217071533, 5.539514064788818, 5.8025689125061035, 6.0656232833862305, 6.328678131103516, 6.591732978820801, 6.854787826538086, 7.117842674255371, 7.380897045135498, 7.643951892852783, 7.907006740570068, 8.170061111450195, 8.43311595916748, 8.696170806884766]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 5.0, 10.0, 6.0, 7.0, 20.0, 22.0, 45.0, 62.0, 127.0, 151.0, 256.0, 434.0, 671.0, 1229.0, 2209.0, 4037.0, 7154.0, 13747.0, 27297.0, 59933.0, 151908.0, 448550.0, 1195962.0, 1364902.0, 584118.0, 188774.0, 72139.0, 32356.0, 16665.0, 8758.0, 5070.0, 2939.0, 1717.0, 1098.0, 668.0, 413.0, 285.0, 173.0, 123.0, 84.0, 57.0, 28.0, 19.0, 17.0, 9.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.015625, -15.531982421875, -15.04833984375, -14.564697265625, -14.0810546875, -13.597412109375, -13.11376953125, -12.630126953125, -12.146484375, -11.662841796875, -11.17919921875, -10.695556640625, -10.2119140625, -9.728271484375, -9.24462890625, -8.760986328125, -8.27734375, -7.793701171875, -7.31005859375, -6.826416015625, -6.3427734375, -5.859130859375, -5.37548828125, -4.891845703125, -4.408203125, -3.924560546875, -3.44091796875, -2.957275390625, -2.4736328125, -1.989990234375, -1.50634765625, -1.022705078125, -0.5390625, -0.055419921875, 0.42822265625, 0.911865234375, 1.3955078125, 1.879150390625, 2.36279296875, 2.846435546875, 3.330078125, 3.813720703125, 4.29736328125, 4.781005859375, 5.2646484375, 5.748291015625, 6.23193359375, 6.715576171875, 7.19921875, 7.682861328125, 8.16650390625, 8.650146484375, 9.1337890625, 9.617431640625, 10.10107421875, 10.584716796875, 11.068359375, 11.552001953125, 12.03564453125, 12.519287109375, 13.0029296875, 13.486572265625, 13.97021484375, 14.453857421875, 14.9375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 13.0, 23.0, 24.0, 21.0, 24.0, 29.0, 29.0, 44.0, 45.0, 54.0, 48.0, 39.0, 52.0, 45.0, 48.0, 53.0, 46.0, 43.0, 41.0, 46.0, 34.0, 30.0, 29.0, 12.0, 16.0, 18.0, 18.0, 9.0, 11.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.67578125, -7.42974853515625, -7.1837158203125, -6.93768310546875, -6.691650390625, -6.44561767578125, -6.1995849609375, -5.95355224609375, -5.70751953125, -5.46148681640625, -5.2154541015625, -4.96942138671875, -4.723388671875, -4.47735595703125, -4.2313232421875, -3.98529052734375, -3.7392578125, -3.49322509765625, -3.2471923828125, -3.00115966796875, -2.755126953125, -2.50909423828125, -2.2630615234375, -2.01702880859375, -1.77099609375, -1.52496337890625, -1.2789306640625, -1.03289794921875, -0.786865234375, -0.54083251953125, -0.2947998046875, -0.04876708984375, 0.197265625, 0.44329833984375, 0.6893310546875, 0.93536376953125, 1.181396484375, 1.42742919921875, 1.6734619140625, 1.91949462890625, 2.16552734375, 2.41156005859375, 2.6575927734375, 2.90362548828125, 3.149658203125, 3.39569091796875, 3.6417236328125, 3.88775634765625, 4.1337890625, 4.37982177734375, 4.6258544921875, 4.87188720703125, 5.117919921875, 5.36395263671875, 5.6099853515625, 5.85601806640625, 6.10205078125, 6.34808349609375, 6.5941162109375, 6.84014892578125, 7.086181640625, 7.33221435546875, 7.5782470703125, 7.82427978515625, 8.0703125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 13.0, 9.0, 18.0, 37.0, 57.0, 88.0, 101.0, 164.0, 244.0, 313.0, 475.0, 701.0, 1009.0, 1557.0, 2349.0, 3740.0, 5912.0, 10222.0, 17796.0, 32862.0, 63802.0, 133609.0, 297608.0, 690730.0, 1209598.0, 930700.0, 420163.0, 183667.0, 85985.0, 43592.0, 23552.0, 13200.0, 7715.0, 4711.0, 2772.0, 1792.0, 1126.0, 806.0, 468.0, 384.0, 199.0, 153.0, 92.0, 64.0, 52.0, 32.0, 18.0, 7.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -15.9498291015625, -15.462158203125, -14.9744873046875, -14.48681640625, -13.9991455078125, -13.511474609375, -13.0238037109375, -12.5361328125, -12.0484619140625, -11.560791015625, -11.0731201171875, -10.58544921875, -10.0977783203125, -9.610107421875, -9.1224365234375, -8.634765625, -8.1470947265625, -7.659423828125, -7.1717529296875, -6.68408203125, -6.1964111328125, -5.708740234375, -5.2210693359375, -4.7333984375, -4.2457275390625, -3.758056640625, -3.2703857421875, -2.78271484375, -2.2950439453125, -1.807373046875, -1.3197021484375, -0.83203125, -0.3443603515625, 0.143310546875, 0.6309814453125, 1.11865234375, 1.6063232421875, 2.093994140625, 2.5816650390625, 3.0693359375, 3.5570068359375, 4.044677734375, 4.5323486328125, 5.02001953125, 5.5076904296875, 5.995361328125, 6.4830322265625, 6.970703125, 7.4583740234375, 7.946044921875, 8.4337158203125, 8.92138671875, 9.4090576171875, 9.896728515625, 10.3843994140625, 10.8720703125, 11.3597412109375, 11.847412109375, 12.3350830078125, 12.82275390625, 13.3104248046875, 13.798095703125, 14.2857666015625, 14.7734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 10.0, 6.0, 8.0, 9.0, 9.0, 13.0, 17.0, 28.0, 22.0, 45.0, 57.0, 77.0, 100.0, 133.0, 157.0, 216.0, 230.0, 326.0, 328.0, 365.0, 351.0, 289.0, 275.0, 237.0, 183.0, 142.0, 85.0, 75.0, 74.0, 58.0, 41.0, 32.0, 22.0, 11.0, 16.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.39453125, -5.228759765625, -5.06298828125, -4.897216796875, -4.7314453125, -4.565673828125, -4.39990234375, -4.234130859375, -4.068359375, -3.902587890625, -3.73681640625, -3.571044921875, -3.4052734375, -3.239501953125, -3.07373046875, -2.907958984375, -2.7421875, -2.576416015625, -2.41064453125, -2.244873046875, -2.0791015625, -1.913330078125, -1.74755859375, -1.581787109375, -1.416015625, -1.250244140625, -1.08447265625, -0.918701171875, -0.7529296875, -0.587158203125, -0.42138671875, -0.255615234375, -0.08984375, 0.075927734375, 0.24169921875, 0.407470703125, 0.5732421875, 0.739013671875, 0.90478515625, 1.070556640625, 1.236328125, 1.402099609375, 1.56787109375, 1.733642578125, 1.8994140625, 2.065185546875, 2.23095703125, 2.396728515625, 2.5625, 2.728271484375, 2.89404296875, 3.059814453125, 3.2255859375, 3.391357421875, 3.55712890625, 3.722900390625, 3.888671875, 4.054443359375, 4.22021484375, 4.385986328125, 4.5517578125, 4.717529296875, 4.88330078125, 5.049072265625, 5.21484375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 11.0, 7.0, 15.0, 14.0, 16.0, 16.0, 23.0, 26.0, 36.0, 39.0, 43.0, 42.0, 51.0, 51.0, 64.0, 60.0, 58.0, 59.0, 57.0, 44.0, 38.0, 42.0, 34.0, 32.0, 21.0, 21.0, 9.0, 8.0, 7.0, 9.0, 9.0, 8.0, 2.0, 3.0, 0.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.505025863647461, -13.072253227233887, -12.639480590820312, -12.206708908081055, -11.77393627166748, -11.341163635253906, -10.908391952514648, -10.475619316101074, -10.0428466796875, -9.610074043273926, -9.177301406860352, -8.744529724121094, -8.31175708770752, -7.878984451293945, -7.446212291717529, -7.013440132141113, -6.580667495727539, -6.147894859313965, -5.715122699737549, -5.282350540161133, -4.849577903747559, -4.416805267333984, -3.9840331077575684, -3.5512607097625732, -3.118488311767578, -2.685715913772583, -2.252943515777588, -1.8201711177825928, -1.3873987197875977, -0.9546263217926025, -0.5218539237976074, -0.0890815258026123, 0.3436908721923828, 0.7764632701873779, 1.209235668182373, 1.6420080661773682, 2.0747804641723633, 2.5075528621673584, 2.9403252601623535, 3.3730976581573486, 3.8058700561523438, 4.238642692565918, 4.671414852142334, 5.10418701171875, 5.536959648132324, 5.969732284545898, 6.4025044441223145, 6.8352766036987305, 7.268049240112305, 7.700821876525879, 8.133594512939453, 8.566366195678711, 8.999138832092285, 9.43191146850586, 9.864683151245117, 10.297455787658691, 10.730228424072266, 11.16300106048584, 11.595773696899414, 12.028545379638672, 12.461318016052246, 12.89409065246582, 13.326862335205078, 13.759634971618652, 14.192407608032227]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 3.0, 5.0, 14.0, 13.0, 15.0, 15.0, 19.0, 17.0, 21.0, 27.0, 32.0, 30.0, 23.0, 32.0, 34.0, 35.0, 48.0, 29.0, 44.0, 42.0, 30.0, 31.0, 36.0, 38.0, 27.0, 33.0, 34.0, 32.0, 28.0, 23.0, 23.0, 11.0, 19.0, 19.0, 9.0, 23.0, 8.0, 5.0, 9.0, 5.0, 9.0, 5.0, 5.0, 6.0, 4.0, 0.0, 6.0, 4.0, 0.0, 2.0, 2.0], "bins": [-8.791692733764648, -8.5216064453125, -8.251520156860352, -7.981433868408203, -7.711347579956055, -7.441261291503906, -7.171175003051758, -6.901088714599609, -6.631002426147461, -6.3609161376953125, -6.090829849243164, -5.820743560791016, -5.550657272338867, -5.280570983886719, -5.01048469543457, -4.740398406982422, -4.470311641693115, -4.200225353240967, -3.9301390647888184, -3.66005277633667, -3.3899664878845215, -3.119880199432373, -2.8497936725616455, -2.579707384109497, -2.3096210956573486, -2.0395348072052, -1.7694485187530518, -1.4993621110916138, -1.2292758226394653, -0.9591895341873169, -0.6891031265258789, -0.41901683807373047, -0.14893054962158203, 0.1211557686328888, 0.3912420868873596, 0.6613284349441528, 0.9314147233963013, 1.2015010118484497, 1.4715874195098877, 1.7416737079620361, 2.0117599964141846, 2.281846284866333, 2.5519325733184814, 2.822019100189209, 3.0921053886413574, 3.362191677093506, 3.6322779655456543, 3.9023642539978027, 4.172450542449951, 4.4425368309021, 4.712623119354248, 4.9827094078063965, 5.252795696258545, 5.522881984710693, 5.79296875, 6.063055038452148, 6.333141326904297, 6.603227615356445, 6.873313903808594, 7.143400192260742, 7.413486480712891, 7.683572769165039, 7.9536590576171875, 8.223745346069336, 8.493831634521484]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 8.0, 6.0, 7.0, 21.0, 19.0, 26.0, 46.0, 69.0, 102.0, 189.0, 298.0, 438.0, 695.0, 1187.0, 1889.0, 3117.0, 5473.0, 9293.0, 16448.0, 29581.0, 53431.0, 96775.0, 158554.0, 206855.0, 185128.0, 121294.0, 69542.0, 38013.0, 21101.0, 11923.0, 6781.0, 4012.0, 2414.0, 1481.0, 831.0, 567.0, 283.0, 239.0, 156.0, 80.0, 62.0, 41.0, 33.0, 14.0, 12.0, 8.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.55987548828125, -6.3463134765625, -6.13275146484375, -5.919189453125, -5.70562744140625, -5.4920654296875, -5.27850341796875, -5.06494140625, -4.85137939453125, -4.6378173828125, -4.42425537109375, -4.210693359375, -3.99713134765625, -3.7835693359375, -3.57000732421875, -3.3564453125, -3.14288330078125, -2.9293212890625, -2.71575927734375, -2.502197265625, -2.28863525390625, -2.0750732421875, -1.86151123046875, -1.64794921875, -1.43438720703125, -1.2208251953125, -1.00726318359375, -0.793701171875, -0.58013916015625, -0.3665771484375, -0.15301513671875, 0.060546875, 0.27410888671875, 0.4876708984375, 0.70123291015625, 0.914794921875, 1.12835693359375, 1.3419189453125, 1.55548095703125, 1.76904296875, 1.98260498046875, 2.1961669921875, 2.40972900390625, 2.623291015625, 2.83685302734375, 3.0504150390625, 3.26397705078125, 3.4775390625, 3.69110107421875, 3.9046630859375, 4.11822509765625, 4.331787109375, 4.54534912109375, 4.7589111328125, 4.97247314453125, 5.18603515625, 5.39959716796875, 5.6131591796875, 5.82672119140625, 6.040283203125, 6.25384521484375, 6.4674072265625, 6.68096923828125, 6.89453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 13.0, 10.0, 15.0, 13.0, 13.0, 23.0, 14.0, 19.0, 31.0, 29.0, 38.0, 31.0, 37.0, 39.0, 45.0, 44.0, 41.0, 40.0, 33.0, 34.0, 27.0, 35.0, 38.0, 41.0, 35.0, 32.0, 20.0, 40.0, 20.0, 20.0, 11.0, 17.0, 11.0, 9.0, 10.0, 6.0, 9.0, 8.0, 9.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.71875, -9.4139404296875, -9.109130859375, -8.8043212890625, -8.49951171875, -8.1947021484375, -7.889892578125, -7.5850830078125, -7.2802734375, -6.9754638671875, -6.670654296875, -6.3658447265625, -6.06103515625, -5.7562255859375, -5.451416015625, -5.1466064453125, -4.841796875, -4.5369873046875, -4.232177734375, -3.9273681640625, -3.62255859375, -3.3177490234375, -3.012939453125, -2.7081298828125, -2.4033203125, -2.0985107421875, -1.793701171875, -1.4888916015625, -1.18408203125, -0.8792724609375, -0.574462890625, -0.2696533203125, 0.03515625, 0.3399658203125, 0.644775390625, 0.9495849609375, 1.25439453125, 1.5592041015625, 1.864013671875, 2.1688232421875, 2.4736328125, 2.7784423828125, 3.083251953125, 3.3880615234375, 3.69287109375, 3.9976806640625, 4.302490234375, 4.6072998046875, 4.912109375, 5.2169189453125, 5.521728515625, 5.8265380859375, 6.13134765625, 6.4361572265625, 6.740966796875, 7.0457763671875, 7.3505859375, 7.6553955078125, 7.960205078125, 8.2650146484375, 8.56982421875, 8.8746337890625, 9.179443359375, 9.4842529296875, 9.7890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 9.0, 6.0, 4.0, 6.0, 13.0, 12.0, 31.0, 32.0, 34.0, 48.0, 64.0, 96.0, 140.0, 181.0, 247.0, 379.0, 584.0, 964.0, 1577.0, 2516.0, 4678.0, 8228.0, 15501.0, 30273.0, 62328.0, 128811.0, 240660.0, 258420.0, 146871.0, 71727.0, 34804.0, 17473.0, 9197.0, 4988.0, 2943.0, 1603.0, 1016.0, 657.0, 402.0, 314.0, 206.0, 144.0, 90.0, 79.0, 54.0, 26.0, 30.0, 22.0, 22.0, 16.0, 16.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 4.0], "bins": [-10.40625, -10.091796875, -9.77734375, -9.462890625, -9.1484375, -8.833984375, -8.51953125, -8.205078125, -7.890625, -7.576171875, -7.26171875, -6.947265625, -6.6328125, -6.318359375, -6.00390625, -5.689453125, -5.375, -5.060546875, -4.74609375, -4.431640625, -4.1171875, -3.802734375, -3.48828125, -3.173828125, -2.859375, -2.544921875, -2.23046875, -1.916015625, -1.6015625, -1.287109375, -0.97265625, -0.658203125, -0.34375, -0.029296875, 0.28515625, 0.599609375, 0.9140625, 1.228515625, 1.54296875, 1.857421875, 2.171875, 2.486328125, 2.80078125, 3.115234375, 3.4296875, 3.744140625, 4.05859375, 4.373046875, 4.6875, 5.001953125, 5.31640625, 5.630859375, 5.9453125, 6.259765625, 6.57421875, 6.888671875, 7.203125, 7.517578125, 7.83203125, 8.146484375, 8.4609375, 8.775390625, 9.08984375, 9.404296875, 9.71875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 7.0, 12.0, 7.0, 12.0, 15.0, 21.0, 28.0, 26.0, 20.0, 31.0, 30.0, 39.0, 40.0, 35.0, 31.0, 40.0, 59.0, 42.0, 32.0, 30.0, 46.0, 46.0, 40.0, 46.0, 31.0, 36.0, 30.0, 26.0, 22.0, 15.0, 20.0, 15.0, 13.0, 12.0, 12.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59375, -6.38909912109375, -6.1844482421875, -5.97979736328125, -5.775146484375, -5.57049560546875, -5.3658447265625, -5.16119384765625, -4.95654296875, -4.75189208984375, -4.5472412109375, -4.34259033203125, -4.137939453125, -3.93328857421875, -3.7286376953125, -3.52398681640625, -3.3193359375, -3.11468505859375, -2.9100341796875, -2.70538330078125, -2.500732421875, -2.29608154296875, -2.0914306640625, -1.88677978515625, -1.68212890625, -1.47747802734375, -1.2728271484375, -1.06817626953125, -0.863525390625, -0.65887451171875, -0.4542236328125, -0.24957275390625, -0.044921875, 0.15972900390625, 0.3643798828125, 0.56903076171875, 0.773681640625, 0.97833251953125, 1.1829833984375, 1.38763427734375, 1.59228515625, 1.79693603515625, 2.0015869140625, 2.20623779296875, 2.410888671875, 2.61553955078125, 2.8201904296875, 3.02484130859375, 3.2294921875, 3.43414306640625, 3.6387939453125, 3.84344482421875, 4.048095703125, 4.25274658203125, 4.4573974609375, 4.66204833984375, 4.86669921875, 5.07135009765625, 5.2760009765625, 5.48065185546875, 5.685302734375, 5.88995361328125, 6.0946044921875, 6.29925537109375, 6.50390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 8.0, 7.0, 12.0, 12.0, 29.0, 34.0, 34.0, 55.0, 74.0, 91.0, 110.0, 176.0, 268.0, 346.0, 581.0, 950.0, 1629.0, 2787.0, 5104.0, 10293.0, 21673.0, 50364.0, 123416.0, 282383.0, 303397.0, 139513.0, 56412.0, 24291.0, 11143.0, 5544.0, 3018.0, 1694.0, 1034.0, 616.0, 429.0, 313.0, 190.0, 120.0, 97.0, 73.0, 52.0, 49.0, 27.0, 18.0, 11.0, 19.0, 12.0, 7.0, 6.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-6.6484375, -6.44110107421875, -6.2337646484375, -6.02642822265625, -5.819091796875, -5.61175537109375, -5.4044189453125, -5.19708251953125, -4.98974609375, -4.78240966796875, -4.5750732421875, -4.36773681640625, -4.160400390625, -3.95306396484375, -3.7457275390625, -3.53839111328125, -3.3310546875, -3.12371826171875, -2.9163818359375, -2.70904541015625, -2.501708984375, -2.29437255859375, -2.0870361328125, -1.87969970703125, -1.67236328125, -1.46502685546875, -1.2576904296875, -1.05035400390625, -0.843017578125, -0.63568115234375, -0.4283447265625, -0.22100830078125, -0.013671875, 0.19366455078125, 0.4010009765625, 0.60833740234375, 0.815673828125, 1.02301025390625, 1.2303466796875, 1.43768310546875, 1.64501953125, 1.85235595703125, 2.0596923828125, 2.26702880859375, 2.474365234375, 2.68170166015625, 2.8890380859375, 3.09637451171875, 3.3037109375, 3.51104736328125, 3.7183837890625, 3.92572021484375, 4.133056640625, 4.34039306640625, 4.5477294921875, 4.75506591796875, 4.96240234375, 5.16973876953125, 5.3770751953125, 5.58441162109375, 5.791748046875, 5.99908447265625, 6.2064208984375, 6.41375732421875, 6.62109375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 8.0, 7.0, 10.0, 14.0, 16.0, 18.0, 20.0, 28.0, 20.0, 23.0, 33.0, 41.0, 35.0, 48.0, 50.0, 56.0, 65.0, 51.0, 53.0, 49.0, 57.0, 48.0, 33.0, 34.0, 32.0, 22.0, 26.0, 23.0, 16.0, 9.0, 11.0, 8.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00017261505126953125, -0.00016780942678451538, -0.0001630038022994995, -0.00015819817781448364, -0.00015339255332946777, -0.0001485869288444519, -0.00014378130435943604, -0.00013897567987442017, -0.0001341700553894043, -0.00012936443090438843, -0.00012455880641937256, -0.00011975318193435669, -0.00011494755744934082, -0.00011014193296432495, -0.00010533630847930908, -0.00010053068399429321, -9.572505950927734e-05, -9.091943502426147e-05, -8.61138105392456e-05, -8.130818605422974e-05, -7.650256156921387e-05, -7.1696937084198e-05, -6.689131259918213e-05, -6.208568811416626e-05, -5.728006362915039e-05, -5.247443914413452e-05, -4.766881465911865e-05, -4.286319017410278e-05, -3.8057565689086914e-05, -3.3251941204071045e-05, -2.8446316719055176e-05, -2.3640692234039307e-05, -1.8835067749023438e-05, -1.4029443264007568e-05, -9.2238187789917e-06, -4.41819429397583e-06, 3.8743019104003906e-07, 5.193054676055908e-06, 9.998679161071777e-06, 1.4804303646087646e-05, 1.9609928131103516e-05, 2.4415552616119385e-05, 2.9221177101135254e-05, 3.402680158615112e-05, 3.883242607116699e-05, 4.363805055618286e-05, 4.844367504119873e-05, 5.32492995262146e-05, 5.805492401123047e-05, 6.286054849624634e-05, 6.766617298126221e-05, 7.247179746627808e-05, 7.727742195129395e-05, 8.208304643630981e-05, 8.688867092132568e-05, 9.169429540634155e-05, 9.649991989135742e-05, 0.00010130554437637329, 0.00010611116886138916, 0.00011091679334640503, 0.0001157224178314209, 0.00012052804231643677, 0.00012533366680145264, 0.0001301392912864685, 0.00013494491577148438]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 15.0, 14.0, 18.0, 19.0, 37.0, 51.0, 83.0, 115.0, 136.0, 248.0, 374.0, 619.0, 1010.0, 1706.0, 3085.0, 5742.0, 11783.0, 27077.0, 72871.0, 212819.0, 366810.0, 216069.0, 74723.0, 27765.0, 12125.0, 5713.0, 2972.0, 1647.0, 988.0, 692.0, 390.0, 249.0, 169.0, 125.0, 117.0, 55.0, 32.0, 14.0, 17.0, 18.0, 11.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.508544921875, -8.22021484375, -7.931884765625, -7.6435546875, -7.355224609375, -7.06689453125, -6.778564453125, -6.490234375, -6.201904296875, -5.91357421875, -5.625244140625, -5.3369140625, -5.048583984375, -4.76025390625, -4.471923828125, -4.18359375, -3.895263671875, -3.60693359375, -3.318603515625, -3.0302734375, -2.741943359375, -2.45361328125, -2.165283203125, -1.876953125, -1.588623046875, -1.30029296875, -1.011962890625, -0.7236328125, -0.435302734375, -0.14697265625, 0.141357421875, 0.4296875, 0.718017578125, 1.00634765625, 1.294677734375, 1.5830078125, 1.871337890625, 2.15966796875, 2.447998046875, 2.736328125, 3.024658203125, 3.31298828125, 3.601318359375, 3.8896484375, 4.177978515625, 4.46630859375, 4.754638671875, 5.04296875, 5.331298828125, 5.61962890625, 5.907958984375, 6.1962890625, 6.484619140625, 6.77294921875, 7.061279296875, 7.349609375, 7.637939453125, 7.92626953125, 8.214599609375, 8.5029296875, 8.791259765625, 9.07958984375, 9.367919921875, 9.65625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 13.0, 9.0, 21.0, 19.0, 27.0, 57.0, 57.0, 80.0, 114.0, 118.0, 124.0, 94.0, 72.0, 52.0, 30.0, 34.0, 24.0, 11.0, 6.0, 10.0, 5.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.9014892578125, -2.812744140625, -2.7239990234375, -2.63525390625, -2.5465087890625, -2.457763671875, -2.3690185546875, -2.2802734375, -2.1915283203125, -2.102783203125, -2.0140380859375, -1.92529296875, -1.8365478515625, -1.747802734375, -1.6590576171875, -1.5703125, -1.4815673828125, -1.392822265625, -1.3040771484375, -1.21533203125, -1.1265869140625, -1.037841796875, -0.9490966796875, -0.8603515625, -0.7716064453125, -0.682861328125, -0.5941162109375, -0.50537109375, -0.4166259765625, -0.327880859375, -0.2391357421875, -0.150390625, -0.0616455078125, 0.027099609375, 0.1158447265625, 0.20458984375, 0.2933349609375, 0.382080078125, 0.4708251953125, 0.5595703125, 0.6483154296875, 0.737060546875, 0.8258056640625, 0.91455078125, 1.0032958984375, 1.092041015625, 1.1807861328125, 1.26953125, 1.3582763671875, 1.447021484375, 1.5357666015625, 1.62451171875, 1.7132568359375, 1.802001953125, 1.8907470703125, 1.9794921875, 2.0682373046875, 2.156982421875, 2.2457275390625, 2.33447265625, 2.4232177734375, 2.511962890625, 2.6007080078125, 2.689453125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 5.0, 4.0, 11.0, 5.0, 16.0, 13.0, 15.0, 18.0, 25.0, 25.0, 31.0, 37.0, 45.0, 44.0, 50.0, 49.0, 57.0, 70.0, 67.0, 63.0, 51.0, 50.0, 38.0, 44.0, 27.0, 22.0, 24.0, 14.0, 12.0, 10.0, 7.0, 10.0, 10.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.514822006225586, -13.080727577209473, -12.64663314819336, -12.212539672851562, -11.77844524383545, -11.344350814819336, -10.910256385803223, -10.47616195678711, -10.042068481445312, -9.6079740524292, -9.173879623413086, -8.739786148071289, -8.305691719055176, -7.8715972900390625, -7.437502861022949, -7.003408432006836, -6.569314002990723, -6.135219573974609, -5.701125621795654, -5.267031192779541, -4.832937240600586, -4.398842811584473, -3.9647483825683594, -3.530654191970825, -3.096560001373291, -2.662465810775757, -2.2283716201782227, -1.7942771911621094, -1.3601830005645752, -0.926088809967041, -0.49199438095092773, -0.057900190353393555, 0.3761940002441406, 0.8102882504463196, 1.2443825006484985, 1.6784768104553223, 2.1125710010528564, 2.5466651916503906, 2.980759620666504, 3.414853811264038, 3.8489480018615723, 4.2830424308776855, 4.717136383056641, 5.151230812072754, 5.585325241088867, 6.019419193267822, 6.4535136222839355, 6.887607574462891, 7.321702003479004, 7.755796432495117, 8.18989086151123, 8.623985290527344, 9.05807876586914, 9.492173194885254, 9.926267623901367, 10.36036205291748, 10.794456481933594, 11.228550910949707, 11.66264533996582, 12.096738815307617, 12.53083324432373, 12.964927673339844, 13.399022102355957, 13.83311653137207, 14.267210006713867]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 8.0, 5.0, 11.0, 10.0, 14.0, 13.0, 15.0, 16.0, 25.0, 20.0, 35.0, 20.0, 27.0, 42.0, 36.0, 25.0, 35.0, 33.0, 50.0, 42.0, 40.0, 40.0, 32.0, 38.0, 31.0, 41.0, 29.0, 34.0, 38.0, 23.0, 13.0, 18.0, 16.0, 22.0, 14.0, 13.0, 14.0, 8.0, 7.0, 9.0, 4.0, 4.0, 4.0, 9.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.146806716918945, -8.863174438476562, -8.579541206359863, -8.295907974243164, -8.012275695800781, -7.72864294052124, -7.445010185241699, -7.161377429962158, -6.877744674682617, -6.594111919403076, -6.310479164123535, -6.026846408843994, -5.743213653564453, -5.459580898284912, -5.175948143005371, -4.89231538772583, -4.608682632446289, -4.325049877166748, -4.041417121887207, -3.757784366607666, -3.474151611328125, -3.190518856048584, -2.906886100769043, -2.623253345489502, -2.339620590209961, -2.05598783493042, -1.772355079650879, -1.488722324371338, -1.2050895690917969, -0.9214568138122559, -0.6378240585327148, -0.35419130325317383, -0.0705575942993164, 0.2130751609802246, 0.4967079162597656, 0.7803406715393066, 1.0639734268188477, 1.3476061820983887, 1.6312389373779297, 1.9148716926574707, 2.1985044479370117, 2.4821372032165527, 2.7657699584960938, 3.0494027137756348, 3.333035469055176, 3.616668224334717, 3.900300979614258, 4.183933734893799, 4.46756649017334, 4.751199245452881, 5.034832000732422, 5.318464756011963, 5.602097511291504, 5.885730266571045, 6.169363021850586, 6.452995777130127, 6.736628532409668, 7.020261287689209, 7.30389404296875, 7.587526798248291, 7.871159553527832, 8.154792785644531, 8.438425064086914, 8.722057342529297, 9.005690574645996]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 15.0, 15.0, 25.0, 43.0, 65.0, 87.0, 127.0, 173.0, 274.0, 410.0, 624.0, 974.0, 1459.0, 2191.0, 3377.0, 5238.0, 7843.0, 12107.0, 19007.0, 28643.0, 43483.0, 64706.0, 92470.0, 120543.0, 139617.0, 136293.0, 113941.0, 84257.0, 58649.0, 38938.0, 25488.0, 16544.0, 10798.0, 7031.0, 4468.0, 2899.0, 1918.0, 1294.0, 847.0, 569.0, 381.0, 252.0, 164.0, 112.0, 69.0, 42.0, 29.0, 21.0, 14.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.25286865234375, -5.0643310546875, -4.87579345703125, -4.687255859375, -4.49871826171875, -4.3101806640625, -4.12164306640625, -3.93310546875, -3.74456787109375, -3.5560302734375, -3.36749267578125, -3.178955078125, -2.99041748046875, -2.8018798828125, -2.61334228515625, -2.4248046875, -2.23626708984375, -2.0477294921875, -1.85919189453125, -1.670654296875, -1.48211669921875, -1.2935791015625, -1.10504150390625, -0.91650390625, -0.72796630859375, -0.5394287109375, -0.35089111328125, -0.162353515625, 0.02618408203125, 0.2147216796875, 0.40325927734375, 0.591796875, 0.78033447265625, 0.9688720703125, 1.15740966796875, 1.345947265625, 1.53448486328125, 1.7230224609375, 1.91156005859375, 2.10009765625, 2.28863525390625, 2.4771728515625, 2.66571044921875, 2.854248046875, 3.04278564453125, 3.2313232421875, 3.41986083984375, 3.6083984375, 3.79693603515625, 3.9854736328125, 4.17401123046875, 4.362548828125, 4.55108642578125, 4.7396240234375, 4.92816162109375, 5.11669921875, 5.30523681640625, 5.4937744140625, 5.68231201171875, 5.870849609375, 6.05938720703125, 6.2479248046875, 6.43646240234375, 6.625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 5.0, 10.0, 10.0, 11.0, 19.0, 20.0, 19.0, 26.0, 30.0, 30.0, 30.0, 35.0, 41.0, 36.0, 32.0, 58.0, 40.0, 34.0, 40.0, 46.0, 44.0, 37.0, 29.0, 40.0, 31.0, 29.0, 26.0, 18.0, 23.0, 16.0, 17.0, 22.0, 13.0, 11.0, 6.0, 6.0, 9.0, 9.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.03125, -9.7147216796875, -9.398193359375, -9.0816650390625, -8.76513671875, -8.4486083984375, -8.132080078125, -7.8155517578125, -7.4990234375, -7.1824951171875, -6.865966796875, -6.5494384765625, -6.23291015625, -5.9163818359375, -5.599853515625, -5.2833251953125, -4.966796875, -4.6502685546875, -4.333740234375, -4.0172119140625, -3.70068359375, -3.3841552734375, -3.067626953125, -2.7510986328125, -2.4345703125, -2.1180419921875, -1.801513671875, -1.4849853515625, -1.16845703125, -0.8519287109375, -0.535400390625, -0.2188720703125, 0.09765625, 0.4141845703125, 0.730712890625, 1.0472412109375, 1.36376953125, 1.6802978515625, 1.996826171875, 2.3133544921875, 2.6298828125, 2.9464111328125, 3.262939453125, 3.5794677734375, 3.89599609375, 4.2125244140625, 4.529052734375, 4.8455810546875, 5.162109375, 5.4786376953125, 5.795166015625, 6.1116943359375, 6.42822265625, 6.7447509765625, 7.061279296875, 7.3778076171875, 7.6943359375, 8.0108642578125, 8.327392578125, 8.6439208984375, 8.96044921875, 9.2769775390625, 9.593505859375, 9.9100341796875, 10.2265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 13.0, 17.0, 25.0, 38.0, 75.0, 132.0, 191.0, 381.0, 597.0, 1033.0, 1862.0, 3121.0, 5561.0, 9568.0, 17015.0, 30269.0, 53946.0, 92723.0, 147744.0, 190629.0, 180388.0, 130309.0, 79685.0, 45023.0, 24971.0, 14168.0, 8144.0, 4516.0, 2615.0, 1521.0, 906.0, 563.0, 324.0, 191.0, 110.0, 67.0, 33.0, 26.0, 16.0, 10.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-9.9609375, -9.6666259765625, -9.372314453125, -9.0780029296875, -8.78369140625, -8.4893798828125, -8.195068359375, -7.9007568359375, -7.6064453125, -7.3121337890625, -7.017822265625, -6.7235107421875, -6.42919921875, -6.1348876953125, -5.840576171875, -5.5462646484375, -5.251953125, -4.9576416015625, -4.663330078125, -4.3690185546875, -4.07470703125, -3.7803955078125, -3.486083984375, -3.1917724609375, -2.8974609375, -2.6031494140625, -2.308837890625, -2.0145263671875, -1.72021484375, -1.4259033203125, -1.131591796875, -0.8372802734375, -0.54296875, -0.2486572265625, 0.045654296875, 0.3399658203125, 0.63427734375, 0.9285888671875, 1.222900390625, 1.5172119140625, 1.8115234375, 2.1058349609375, 2.400146484375, 2.6944580078125, 2.98876953125, 3.2830810546875, 3.577392578125, 3.8717041015625, 4.166015625, 4.4603271484375, 4.754638671875, 5.0489501953125, 5.34326171875, 5.6375732421875, 5.931884765625, 6.2261962890625, 6.5205078125, 6.8148193359375, 7.109130859375, 7.4034423828125, 7.69775390625, 7.9920654296875, 8.286376953125, 8.5806884765625, 8.875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 4.0, 8.0, 7.0, 9.0, 15.0, 9.0, 12.0, 15.0, 25.0, 18.0, 25.0, 29.0, 35.0, 28.0, 26.0, 38.0, 36.0, 40.0, 36.0, 44.0, 34.0, 28.0, 33.0, 44.0, 22.0, 26.0, 35.0, 32.0, 31.0, 31.0, 30.0, 25.0, 16.0, 15.0, 16.0, 16.0, 26.0, 13.0, 10.0, 9.0, 6.0, 5.0, 10.0, 3.0, 6.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.95703125, -5.76678466796875, -5.5765380859375, -5.38629150390625, -5.196044921875, -5.00579833984375, -4.8155517578125, -4.62530517578125, -4.43505859375, -4.24481201171875, -4.0545654296875, -3.86431884765625, -3.674072265625, -3.48382568359375, -3.2935791015625, -3.10333251953125, -2.9130859375, -2.72283935546875, -2.5325927734375, -2.34234619140625, -2.152099609375, -1.96185302734375, -1.7716064453125, -1.58135986328125, -1.39111328125, -1.20086669921875, -1.0106201171875, -0.82037353515625, -0.630126953125, -0.43988037109375, -0.2496337890625, -0.05938720703125, 0.130859375, 0.32110595703125, 0.5113525390625, 0.70159912109375, 0.891845703125, 1.08209228515625, 1.2723388671875, 1.46258544921875, 1.65283203125, 1.84307861328125, 2.0333251953125, 2.22357177734375, 2.413818359375, 2.60406494140625, 2.7943115234375, 2.98455810546875, 3.1748046875, 3.36505126953125, 3.5552978515625, 3.74554443359375, 3.935791015625, 4.12603759765625, 4.3162841796875, 4.50653076171875, 4.69677734375, 4.88702392578125, 5.0772705078125, 5.26751708984375, 5.457763671875, 5.64801025390625, 5.8382568359375, 6.02850341796875, 6.21875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 18.0, 25.0, 42.0, 47.0, 72.0, 114.0, 153.0, 247.0, 311.0, 526.0, 772.0, 1265.0, 2185.0, 3851.0, 7373.0, 15542.0, 36164.0, 101053.0, 269714.0, 348051.0, 160152.0, 55947.0, 22346.0, 10221.0, 5146.0, 2789.0, 1598.0, 995.0, 609.0, 391.0, 250.0, 185.0, 120.0, 87.0, 56.0, 30.0, 36.0, 25.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.182373046875, -7.91162109375, -7.640869140625, -7.3701171875, -7.099365234375, -6.82861328125, -6.557861328125, -6.287109375, -6.016357421875, -5.74560546875, -5.474853515625, -5.2041015625, -4.933349609375, -4.66259765625, -4.391845703125, -4.12109375, -3.850341796875, -3.57958984375, -3.308837890625, -3.0380859375, -2.767333984375, -2.49658203125, -2.225830078125, -1.955078125, -1.684326171875, -1.41357421875, -1.142822265625, -0.8720703125, -0.601318359375, -0.33056640625, -0.059814453125, 0.2109375, 0.481689453125, 0.75244140625, 1.023193359375, 1.2939453125, 1.564697265625, 1.83544921875, 2.106201171875, 2.376953125, 2.647705078125, 2.91845703125, 3.189208984375, 3.4599609375, 3.730712890625, 4.00146484375, 4.272216796875, 4.54296875, 4.813720703125, 5.08447265625, 5.355224609375, 5.6259765625, 5.896728515625, 6.16748046875, 6.438232421875, 6.708984375, 6.979736328125, 7.25048828125, 7.521240234375, 7.7919921875, 8.062744140625, 8.33349609375, 8.604248046875, 8.875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 17.0, 12.0, 21.0, 25.0, 34.0, 50.0, 90.0, 118.0, 124.0, 115.0, 116.0, 88.0, 49.0, 32.0, 30.0, 16.0, 16.0, 11.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007653236389160156, -0.0007405653595924377, -0.0007158070802688599, -0.000691048800945282, -0.0006662905216217041, -0.0006415322422981262, -0.0006167739629745483, -0.0005920156836509705, -0.0005672574043273926, -0.0005424991250038147, -0.0005177408456802368, -0.0004929825663566589, -0.00046822428703308105, -0.0004434660077095032, -0.0004187077283859253, -0.0003939494490623474, -0.00036919116973876953, -0.00034443289041519165, -0.00031967461109161377, -0.0002949163317680359, -0.000270158052444458, -0.0002453997731208801, -0.00022064149379730225, -0.00019588321447372437, -0.00017112493515014648, -0.0001463666558265686, -0.00012160837650299072, -9.685009717941284e-05, -7.209181785583496e-05, -4.733353853225708e-05, -2.25752592086792e-05, 2.1830201148986816e-06, 2.6941299438476562e-05, 5.169957876205444e-05, 7.645785808563232e-05, 0.0001012161374092102, 0.00012597441673278809, 0.00015073269605636597, 0.00017549097537994385, 0.00020024925470352173, 0.0002250075340270996, 0.0002497658133506775, 0.00027452409267425537, 0.00029928237199783325, 0.00032404065132141113, 0.000348798930644989, 0.0003735572099685669, 0.0003983154892921448, 0.00042307376861572266, 0.00044783204793930054, 0.0004725903272628784, 0.0004973486065864563, 0.0005221068859100342, 0.0005468651652336121, 0.0005716234445571899, 0.0005963817238807678, 0.0006211400032043457, 0.0006458982825279236, 0.0006706565618515015, 0.0006954148411750793, 0.0007201731204986572, 0.0007449313998222351, 0.000769689679145813, 0.0007944479584693909, 0.0008192062377929688]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 18.0, 26.0, 31.0, 60.0, 94.0, 125.0, 206.0, 298.0, 395.0, 679.0, 1077.0, 1760.0, 3181.0, 6028.0, 12517.0, 29267.0, 75806.0, 202995.0, 351994.0, 219326.0, 82774.0, 31636.0, 13526.0, 6441.0, 3226.0, 1924.0, 1114.0, 670.0, 451.0, 302.0, 190.0, 119.0, 79.0, 65.0, 41.0, 31.0, 13.0, 19.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.390625, -9.1187744140625, -8.846923828125, -8.5750732421875, -8.30322265625, -8.0313720703125, -7.759521484375, -7.4876708984375, -7.2158203125, -6.9439697265625, -6.672119140625, -6.4002685546875, -6.12841796875, -5.8565673828125, -5.584716796875, -5.3128662109375, -5.041015625, -4.7691650390625, -4.497314453125, -4.2254638671875, -3.95361328125, -3.6817626953125, -3.409912109375, -3.1380615234375, -2.8662109375, -2.5943603515625, -2.322509765625, -2.0506591796875, -1.77880859375, -1.5069580078125, -1.235107421875, -0.9632568359375, -0.69140625, -0.4195556640625, -0.147705078125, 0.1241455078125, 0.39599609375, 0.6678466796875, 0.939697265625, 1.2115478515625, 1.4833984375, 1.7552490234375, 2.027099609375, 2.2989501953125, 2.57080078125, 2.8426513671875, 3.114501953125, 3.3863525390625, 3.658203125, 3.9300537109375, 4.201904296875, 4.4737548828125, 4.74560546875, 5.0174560546875, 5.289306640625, 5.5611572265625, 5.8330078125, 6.1048583984375, 6.376708984375, 6.6485595703125, 6.92041015625, 7.1922607421875, 7.464111328125, 7.7359619140625, 8.0078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 9.0, 9.0, 10.0, 18.0, 19.0, 18.0, 32.0, 37.0, 41.0, 67.0, 50.0, 72.0, 73.0, 78.0, 75.0, 67.0, 61.0, 41.0, 47.0, 40.0, 23.0, 21.0, 18.0, 9.0, 10.0, 11.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.462890625, -2.398406982421875, -2.33392333984375, -2.269439697265625, -2.2049560546875, -2.140472412109375, -2.07598876953125, -2.011505126953125, -1.947021484375, -1.882537841796875, -1.81805419921875, -1.753570556640625, -1.6890869140625, -1.624603271484375, -1.56011962890625, -1.495635986328125, -1.43115234375, -1.366668701171875, -1.30218505859375, -1.237701416015625, -1.1732177734375, -1.108734130859375, -1.04425048828125, -0.979766845703125, -0.915283203125, -0.850799560546875, -0.78631591796875, -0.721832275390625, -0.6573486328125, -0.592864990234375, -0.52838134765625, -0.463897705078125, -0.3994140625, -0.334930419921875, -0.27044677734375, -0.205963134765625, -0.1414794921875, -0.076995849609375, -0.01251220703125, 0.051971435546875, 0.116455078125, 0.180938720703125, 0.24542236328125, 0.309906005859375, 0.3743896484375, 0.438873291015625, 0.50335693359375, 0.567840576171875, 0.63232421875, 0.696807861328125, 0.76129150390625, 0.825775146484375, 0.8902587890625, 0.954742431640625, 1.01922607421875, 1.083709716796875, 1.148193359375, 1.212677001953125, 1.27716064453125, 1.341644287109375, 1.4061279296875, 1.470611572265625, 1.53509521484375, 1.599578857421875, 1.6640625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 2.0, 5.0, 6.0, 10.0, 10.0, 12.0, 16.0, 16.0, 22.0, 21.0, 32.0, 37.0, 34.0, 47.0, 51.0, 52.0, 52.0, 65.0, 63.0, 78.0, 44.0, 54.0, 41.0, 41.0, 25.0, 26.0, 26.0, 27.0, 14.0, 16.0, 7.0, 8.0, 7.0, 8.0, 3.0, 2.0, 0.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.086257934570312, -12.643107414245605, -12.199956893920898, -11.756806373596191, -11.313655853271484, -10.870505332946777, -10.42735481262207, -9.984204292297363, -9.541053771972656, -9.09790325164795, -8.654752731323242, -8.211602210998535, -7.768451690673828, -7.325301170349121, -6.882150650024414, -6.439000129699707, -5.995849609375, -5.552699089050293, -5.109548568725586, -4.666398048400879, -4.223247528076172, -3.780097007751465, -3.336946487426758, -2.893795967102051, -2.4506454467773438, -2.0074949264526367, -1.5643444061279297, -1.1211938858032227, -0.6780433654785156, -0.2348928451538086, 0.20825767517089844, 0.6514081954956055, 1.094557762145996, 1.5377082824707031, 1.9808588027954102, 2.424009323120117, 2.867159843444824, 3.3103103637695312, 3.7534608840942383, 4.196611404418945, 4.639761924743652, 5.082912445068359, 5.526062965393066, 5.969213485717773, 6.4123640060424805, 6.8555145263671875, 7.2986650466918945, 7.741815567016602, 8.184966087341309, 8.628116607666016, 9.071267127990723, 9.51441764831543, 9.957568168640137, 10.400718688964844, 10.84386920928955, 11.287019729614258, 11.730170249938965, 12.173320770263672, 12.616471290588379, 13.059621810913086, 13.502772331237793, 13.9459228515625, 14.389073371887207, 14.832223892211914, 15.275374412536621]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 9.0, 3.0, 7.0, 21.0, 15.0, 25.0, 19.0, 24.0, 25.0, 41.0, 29.0, 41.0, 32.0, 55.0, 45.0, 49.0, 32.0, 39.0, 51.0, 50.0, 35.0, 43.0, 48.0, 33.0, 43.0, 24.0, 32.0, 13.0, 19.0, 15.0, 12.0, 12.0, 8.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.65682315826416, -12.281082153320312, -11.905341148376465, -11.529600143432617, -11.153858184814453, -10.778117179870605, -10.402376174926758, -10.02663516998291, -9.650894165039062, -9.275153160095215, -8.899412155151367, -8.523670196533203, -8.147929191589355, -7.772188186645508, -7.39644718170166, -7.0207061767578125, -6.644964218139648, -6.269223213195801, -5.893481731414795, -5.517740726470947, -5.141999244689941, -4.766258239746094, -4.390517234802246, -4.014776229858398, -3.6390347480773926, -3.263293504714966, -2.887552261352539, -2.5118112564086914, -2.1360700130462646, -1.760328769683838, -1.3845877647399902, -1.0088465213775635, -0.6331043243408203, -0.25736314058303833, 0.11837804317474365, 0.49411916732788086, 0.8698604106903076, 1.2456016540527344, 1.621342658996582, 1.9970839023590088, 2.3728251457214355, 2.7485663890838623, 3.124307632446289, 3.5000486373901367, 3.8757898807525635, 4.25153112411499, 4.627272129058838, 5.003013610839844, 5.378754615783691, 5.754495620727539, 6.130237102508545, 6.505978107452393, 6.881719589233398, 7.257460594177246, 7.633201599121094, 8.008942604064941, 8.384683609008789, 8.760424613952637, 9.136165618896484, 9.511907577514648, 9.887648582458496, 10.263389587402344, 10.639130592346191, 11.014871597290039, 11.390613555908203]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 7.0, 20.0, 13.0, 26.0, 35.0, 69.0, 75.0, 108.0, 156.0, 223.0, 359.0, 501.0, 733.0, 1151.0, 1707.0, 2626.0, 4039.0, 6490.0, 10663.0, 18439.0, 33750.0, 66281.0, 143043.0, 334182.0, 749652.0, 1158185.0, 897343.0, 420239.0, 174362.0, 78084.0, 38573.0, 20735.0, 11954.0, 7218.0, 4491.0, 2901.0, 1890.0, 1270.0, 839.0, 524.0, 416.0, 275.0, 191.0, 137.0, 93.0, 70.0, 48.0, 32.0, 21.0, 15.0, 3.0, 6.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.5703125, -13.0963134765625, -12.622314453125, -12.1483154296875, -11.67431640625, -11.2003173828125, -10.726318359375, -10.2523193359375, -9.7783203125, -9.3043212890625, -8.830322265625, -8.3563232421875, -7.88232421875, -7.4083251953125, -6.934326171875, -6.4603271484375, -5.986328125, -5.5123291015625, -5.038330078125, -4.5643310546875, -4.09033203125, -3.6163330078125, -3.142333984375, -2.6683349609375, -2.1943359375, -1.7203369140625, -1.246337890625, -0.7723388671875, -0.29833984375, 0.1756591796875, 0.649658203125, 1.1236572265625, 1.59765625, 2.0716552734375, 2.545654296875, 3.0196533203125, 3.49365234375, 3.9676513671875, 4.441650390625, 4.9156494140625, 5.3896484375, 5.8636474609375, 6.337646484375, 6.8116455078125, 7.28564453125, 7.7596435546875, 8.233642578125, 8.7076416015625, 9.181640625, 9.6556396484375, 10.129638671875, 10.6036376953125, 11.07763671875, 11.5516357421875, 12.025634765625, 12.4996337890625, 12.9736328125, 13.4476318359375, 13.921630859375, 14.3956298828125, 14.86962890625, 15.3436279296875, 15.817626953125, 16.2916259765625, 16.765625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 9.0, 6.0, 9.0, 11.0, 13.0, 10.0, 19.0, 21.0, 24.0, 25.0, 27.0, 28.0, 41.0, 39.0, 39.0, 49.0, 55.0, 51.0, 33.0, 50.0, 45.0, 40.0, 42.0, 55.0, 40.0, 34.0, 37.0, 25.0, 28.0, 13.0, 23.0, 14.0, 4.0, 8.0, 9.0, 12.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.6796875, -11.3319091796875, -10.984130859375, -10.6363525390625, -10.28857421875, -9.9407958984375, -9.593017578125, -9.2452392578125, -8.8974609375, -8.5496826171875, -8.201904296875, -7.8541259765625, -7.50634765625, -7.1585693359375, -6.810791015625, -6.4630126953125, -6.115234375, -5.7674560546875, -5.419677734375, -5.0718994140625, -4.72412109375, -4.3763427734375, -4.028564453125, -3.6807861328125, -3.3330078125, -2.9852294921875, -2.637451171875, -2.2896728515625, -1.94189453125, -1.5941162109375, -1.246337890625, -0.8985595703125, -0.55078125, -0.2030029296875, 0.144775390625, 0.4925537109375, 0.84033203125, 1.1881103515625, 1.535888671875, 1.8836669921875, 2.2314453125, 2.5792236328125, 2.927001953125, 3.2747802734375, 3.62255859375, 3.9703369140625, 4.318115234375, 4.6658935546875, 5.013671875, 5.3614501953125, 5.709228515625, 6.0570068359375, 6.40478515625, 6.7525634765625, 7.100341796875, 7.4481201171875, 7.7958984375, 8.1436767578125, 8.491455078125, 8.8392333984375, 9.18701171875, 9.5347900390625, 9.882568359375, 10.2303466796875, 10.578125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 16.0, 15.0, 31.0, 35.0, 67.0, 98.0, 127.0, 165.0, 269.0, 403.0, 614.0, 953.0, 1457.0, 2453.0, 4071.0, 7080.0, 12801.0, 23705.0, 46657.0, 94696.0, 204468.0, 465855.0, 993135.0, 1173884.0, 632060.0, 276198.0, 124382.0, 60476.0, 30525.0, 16015.0, 8810.0, 5020.0, 2877.0, 1744.0, 1088.0, 692.0, 463.0, 285.0, 195.0, 123.0, 87.0, 57.0, 37.0, 32.0, 16.0, 13.0, 12.0, 3.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-21.890625, -21.23095703125, -20.5712890625, -19.91162109375, -19.251953125, -18.59228515625, -17.9326171875, -17.27294921875, -16.61328125, -15.95361328125, -15.2939453125, -14.63427734375, -13.974609375, -13.31494140625, -12.6552734375, -11.99560546875, -11.3359375, -10.67626953125, -10.0166015625, -9.35693359375, -8.697265625, -8.03759765625, -7.3779296875, -6.71826171875, -6.05859375, -5.39892578125, -4.7392578125, -4.07958984375, -3.419921875, -2.76025390625, -2.1005859375, -1.44091796875, -0.78125, -0.12158203125, 0.5380859375, 1.19775390625, 1.857421875, 2.51708984375, 3.1767578125, 3.83642578125, 4.49609375, 5.15576171875, 5.8154296875, 6.47509765625, 7.134765625, 7.79443359375, 8.4541015625, 9.11376953125, 9.7734375, 10.43310546875, 11.0927734375, 11.75244140625, 12.412109375, 13.07177734375, 13.7314453125, 14.39111328125, 15.05078125, 15.71044921875, 16.3701171875, 17.02978515625, 17.689453125, 18.34912109375, 19.0087890625, 19.66845703125, 20.328125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 4.0, 11.0, 6.0, 9.0, 18.0, 25.0, 29.0, 34.0, 62.0, 54.0, 80.0, 130.0, 135.0, 223.0, 239.0, 279.0, 346.0, 405.0, 393.0, 306.0, 313.0, 202.0, 198.0, 127.0, 119.0, 77.0, 70.0, 50.0, 40.0, 22.0, 16.0, 19.0, 10.0, 3.0, 5.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.61297607421875, -7.3743896484375, -7.13580322265625, -6.897216796875, -6.65863037109375, -6.4200439453125, -6.18145751953125, -5.94287109375, -5.70428466796875, -5.4656982421875, -5.22711181640625, -4.988525390625, -4.74993896484375, -4.5113525390625, -4.27276611328125, -4.0341796875, -3.79559326171875, -3.5570068359375, -3.31842041015625, -3.079833984375, -2.84124755859375, -2.6026611328125, -2.36407470703125, -2.12548828125, -1.88690185546875, -1.6483154296875, -1.40972900390625, -1.171142578125, -0.93255615234375, -0.6939697265625, -0.45538330078125, -0.216796875, 0.02178955078125, 0.2603759765625, 0.49896240234375, 0.737548828125, 0.97613525390625, 1.2147216796875, 1.45330810546875, 1.69189453125, 1.93048095703125, 2.1690673828125, 2.40765380859375, 2.646240234375, 2.88482666015625, 3.1234130859375, 3.36199951171875, 3.6005859375, 3.83917236328125, 4.0777587890625, 4.31634521484375, 4.554931640625, 4.79351806640625, 5.0321044921875, 5.27069091796875, 5.50927734375, 5.74786376953125, 5.9864501953125, 6.22503662109375, 6.463623046875, 6.70220947265625, 6.9407958984375, 7.17938232421875, 7.41796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 4.0, 4.0, 8.0, 8.0, 9.0, 15.0, 20.0, 37.0, 24.0, 33.0, 48.0, 50.0, 57.0, 65.0, 74.0, 75.0, 72.0, 56.0, 49.0, 48.0, 41.0, 39.0, 26.0, 28.0, 21.0, 12.0, 12.0, 8.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.54970359802246, -18.924062728881836, -18.29842185974121, -17.672780990600586, -17.04714012145996, -16.421499252319336, -15.795857429504395, -15.17021656036377, -14.544575691223145, -13.91893482208252, -13.293293952941895, -12.66765308380127, -12.042011260986328, -11.416370391845703, -10.790729522705078, -10.165088653564453, -9.539447784423828, -8.913806915283203, -8.288166046142578, -7.662524700164795, -7.03688383102417, -6.411242961883545, -5.785601615905762, -5.159960746765137, -4.534319877624512, -3.9086790084838867, -3.2830379009246826, -2.6573967933654785, -2.0317559242248535, -1.4061150550842285, -0.7804739475250244, -0.1548328399658203, 0.4708080291748047, 1.0964490175247192, 1.7220900058746338, 2.347731113433838, 2.973371982574463, 3.599012851715088, 4.224654197692871, 4.850295066833496, 5.475935935974121, 6.101576805114746, 6.727217674255371, 7.352859020233154, 7.978499889373779, 8.604141235351562, 9.229782104492188, 9.855422973632812, 10.481063842773438, 11.106704711914062, 11.732345581054688, 12.357986450195312, 12.983627319335938, 13.609268188476562, 14.234910011291504, 14.860550880432129, 15.486191749572754, 16.111833572387695, 16.73747444152832, 17.363115310668945, 17.98875617980957, 18.614397048950195, 19.24003791809082, 19.865678787231445, 20.49131965637207]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 4.0, 13.0, 10.0, 16.0, 16.0, 12.0, 22.0, 24.0, 22.0, 21.0, 16.0, 26.0, 33.0, 33.0, 45.0, 34.0, 42.0, 49.0, 41.0, 35.0, 41.0, 39.0, 36.0, 36.0, 34.0, 43.0, 32.0, 30.0, 27.0, 21.0, 19.0, 17.0, 16.0, 13.0, 15.0, 12.0, 12.0, 3.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-14.454890251159668, -14.022396087646484, -13.589900970458984, -13.1574068069458, -12.724912643432617, -12.292417526245117, -11.859923362731934, -11.42742919921875, -10.99493408203125, -10.562439918518066, -10.129944801330566, -9.697450637817383, -9.264955520629883, -8.8324613571167, -8.399967193603516, -7.967472553253174, -7.534977912902832, -7.10248327255249, -6.669988632202148, -6.237494468688965, -5.804999828338623, -5.372505187988281, -4.940011024475098, -4.507516384124756, -4.075021743774414, -3.6425271034240723, -3.2100327014923096, -2.777538299560547, -2.345043659210205, -1.9125490188598633, -1.4800546169281006, -1.047560214996338, -0.6150665283203125, -0.18257200717926025, 0.249922513961792, 0.6824170351028442, 1.1149115562438965, 1.5474061965942383, 1.979900598526001, 2.4123950004577637, 2.8448896408081055, 3.2773842811584473, 3.70987868309021, 4.142373085021973, 4.5748677253723145, 5.007362365722656, 5.43985652923584, 5.872351169586182, 6.304845809936523, 6.737340450286865, 7.169835090637207, 7.602329254150391, 8.03482437133789, 8.467318534851074, 8.899812698364258, 9.332307815551758, 9.764801979064941, 10.197296142578125, 10.629791259765625, 11.062285423278809, 11.494779586791992, 11.927274703979492, 12.359768867492676, 12.79226303100586, 13.22475814819336]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 14.0, 17.0, 18.0, 46.0, 67.0, 82.0, 126.0, 209.0, 276.0, 460.0, 667.0, 967.0, 1505.0, 2176.0, 3413.0, 5318.0, 8133.0, 12668.0, 20426.0, 32313.0, 51070.0, 79372.0, 115531.0, 151552.0, 159634.0, 134614.0, 95601.0, 62899.0, 39889.0, 25028.0, 15755.0, 10040.0, 6515.0, 4104.0, 2782.0, 1742.0, 1168.0, 721.0, 509.0, 375.0, 240.0, 173.0, 110.0, 66.0, 56.0, 40.0, 21.0, 13.0, 12.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0], "bins": [-7.52734375, -7.30084228515625, -7.0743408203125, -6.84783935546875, -6.621337890625, -6.39483642578125, -6.1683349609375, -5.94183349609375, -5.71533203125, -5.48883056640625, -5.2623291015625, -5.03582763671875, -4.809326171875, -4.58282470703125, -4.3563232421875, -4.12982177734375, -3.9033203125, -3.67681884765625, -3.4503173828125, -3.22381591796875, -2.997314453125, -2.77081298828125, -2.5443115234375, -2.31781005859375, -2.09130859375, -1.86480712890625, -1.6383056640625, -1.41180419921875, -1.185302734375, -0.95880126953125, -0.7322998046875, -0.50579833984375, -0.279296875, -0.05279541015625, 0.1737060546875, 0.40020751953125, 0.626708984375, 0.85321044921875, 1.0797119140625, 1.30621337890625, 1.53271484375, 1.75921630859375, 1.9857177734375, 2.21221923828125, 2.438720703125, 2.66522216796875, 2.8917236328125, 3.11822509765625, 3.3447265625, 3.57122802734375, 3.7977294921875, 4.02423095703125, 4.250732421875, 4.47723388671875, 4.7037353515625, 4.93023681640625, 5.15673828125, 5.38323974609375, 5.6097412109375, 5.83624267578125, 6.062744140625, 6.28924560546875, 6.5157470703125, 6.74224853515625, 6.96875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 16.0, 15.0, 18.0, 12.0, 23.0, 18.0, 19.0, 23.0, 34.0, 28.0, 43.0, 40.0, 39.0, 52.0, 48.0, 49.0, 43.0, 38.0, 50.0, 37.0, 35.0, 42.0, 47.0, 35.0, 27.0, 16.0, 15.0, 17.0, 15.0, 15.0, 9.0, 11.0, 7.0, 6.0, 5.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.03125, -15.5465087890625, -15.061767578125, -14.5770263671875, -14.09228515625, -13.6075439453125, -13.122802734375, -12.6380615234375, -12.1533203125, -11.6685791015625, -11.183837890625, -10.6990966796875, -10.21435546875, -9.7296142578125, -9.244873046875, -8.7601318359375, -8.275390625, -7.7906494140625, -7.305908203125, -6.8211669921875, -6.33642578125, -5.8516845703125, -5.366943359375, -4.8822021484375, -4.3974609375, -3.9127197265625, -3.427978515625, -2.9432373046875, -2.45849609375, -1.9737548828125, -1.489013671875, -1.0042724609375, -0.51953125, -0.0347900390625, 0.449951171875, 0.9346923828125, 1.41943359375, 1.9041748046875, 2.388916015625, 2.8736572265625, 3.3583984375, 3.8431396484375, 4.327880859375, 4.8126220703125, 5.29736328125, 5.7821044921875, 6.266845703125, 6.7515869140625, 7.236328125, 7.7210693359375, 8.205810546875, 8.6905517578125, 9.17529296875, 9.6600341796875, 10.144775390625, 10.6295166015625, 11.1142578125, 11.5989990234375, 12.083740234375, 12.5684814453125, 13.05322265625, 13.5379638671875, 14.022705078125, 14.5074462890625, 14.9921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 9.0, 11.0, 14.0, 25.0, 33.0, 46.0, 47.0, 77.0, 144.0, 182.0, 312.0, 425.0, 675.0, 1106.0, 1707.0, 2828.0, 4599.0, 7883.0, 13275.0, 23857.0, 42759.0, 80434.0, 144145.0, 220783.0, 210084.0, 130665.0, 71851.0, 39051.0, 21249.0, 12129.0, 7078.0, 4140.0, 2500.0, 1509.0, 1022.0, 635.0, 422.0, 274.0, 159.0, 134.0, 74.0, 61.0, 44.0, 21.0, 18.0, 19.0, 6.0, 12.0, 4.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.6365966796875, -10.281005859375, -9.9254150390625, -9.56982421875, -9.2142333984375, -8.858642578125, -8.5030517578125, -8.1474609375, -7.7918701171875, -7.436279296875, -7.0806884765625, -6.72509765625, -6.3695068359375, -6.013916015625, -5.6583251953125, -5.302734375, -4.9471435546875, -4.591552734375, -4.2359619140625, -3.88037109375, -3.5247802734375, -3.169189453125, -2.8135986328125, -2.4580078125, -2.1024169921875, -1.746826171875, -1.3912353515625, -1.03564453125, -0.6800537109375, -0.324462890625, 0.0311279296875, 0.38671875, 0.7423095703125, 1.097900390625, 1.4534912109375, 1.80908203125, 2.1646728515625, 2.520263671875, 2.8758544921875, 3.2314453125, 3.5870361328125, 3.942626953125, 4.2982177734375, 4.65380859375, 5.0093994140625, 5.364990234375, 5.7205810546875, 6.076171875, 6.4317626953125, 6.787353515625, 7.1429443359375, 7.49853515625, 7.8541259765625, 8.209716796875, 8.5653076171875, 8.9208984375, 9.2764892578125, 9.632080078125, 9.9876708984375, 10.34326171875, 10.6988525390625, 11.054443359375, 11.4100341796875, 11.765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 9.0, 16.0, 8.0, 15.0, 19.0, 19.0, 30.0, 18.0, 26.0, 25.0, 39.0, 33.0, 41.0, 34.0, 55.0, 37.0, 43.0, 34.0, 36.0, 41.0, 35.0, 34.0, 22.0, 38.0, 35.0, 26.0, 28.0, 26.0, 19.0, 23.0, 22.0, 12.0, 8.0, 12.0, 4.0, 15.0, 6.0, 5.0, 5.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.96875, -8.69921875, -8.4296875, -8.16015625, -7.890625, -7.62109375, -7.3515625, -7.08203125, -6.8125, -6.54296875, -6.2734375, -6.00390625, -5.734375, -5.46484375, -5.1953125, -4.92578125, -4.65625, -4.38671875, -4.1171875, -3.84765625, -3.578125, -3.30859375, -3.0390625, -2.76953125, -2.5, -2.23046875, -1.9609375, -1.69140625, -1.421875, -1.15234375, -0.8828125, -0.61328125, -0.34375, -0.07421875, 0.1953125, 0.46484375, 0.734375, 1.00390625, 1.2734375, 1.54296875, 1.8125, 2.08203125, 2.3515625, 2.62109375, 2.890625, 3.16015625, 3.4296875, 3.69921875, 3.96875, 4.23828125, 4.5078125, 4.77734375, 5.046875, 5.31640625, 5.5859375, 5.85546875, 6.125, 6.39453125, 6.6640625, 6.93359375, 7.203125, 7.47265625, 7.7421875, 8.01171875, 8.28125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 13.0, 17.0, 33.0, 34.0, 59.0, 66.0, 104.0, 146.0, 257.0, 340.0, 451.0, 678.0, 1037.0, 1600.0, 2529.0, 4036.0, 6971.0, 12043.0, 21767.0, 40679.0, 78992.0, 150446.0, 243885.0, 217658.0, 123784.0, 63770.0, 33556.0, 17646.0, 10176.0, 5809.0, 3540.0, 2174.0, 1406.0, 876.0, 639.0, 388.0, 265.0, 207.0, 134.0, 107.0, 60.0, 54.0, 30.0, 22.0, 13.0, 16.0, 5.0, 12.0, 3.0, 6.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.953125, -6.74139404296875, -6.5296630859375, -6.31793212890625, -6.106201171875, -5.89447021484375, -5.6827392578125, -5.47100830078125, -5.25927734375, -5.04754638671875, -4.8358154296875, -4.62408447265625, -4.412353515625, -4.20062255859375, -3.9888916015625, -3.77716064453125, -3.5654296875, -3.35369873046875, -3.1419677734375, -2.93023681640625, -2.718505859375, -2.50677490234375, -2.2950439453125, -2.08331298828125, -1.87158203125, -1.65985107421875, -1.4481201171875, -1.23638916015625, -1.024658203125, -0.81292724609375, -0.6011962890625, -0.38946533203125, -0.177734375, 0.03399658203125, 0.2457275390625, 0.45745849609375, 0.669189453125, 0.88092041015625, 1.0926513671875, 1.30438232421875, 1.51611328125, 1.72784423828125, 1.9395751953125, 2.15130615234375, 2.363037109375, 2.57476806640625, 2.7864990234375, 2.99822998046875, 3.2099609375, 3.42169189453125, 3.6334228515625, 3.84515380859375, 4.056884765625, 4.26861572265625, 4.4803466796875, 4.69207763671875, 4.90380859375, 5.11553955078125, 5.3272705078125, 5.53900146484375, 5.750732421875, 5.96246337890625, 6.1741943359375, 6.38592529296875, 6.59765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 5.0, 4.0, 11.0, 17.0, 7.0, 10.0, 17.0, 24.0, 33.0, 32.0, 33.0, 37.0, 50.0, 54.0, 44.0, 59.0, 60.0, 56.0, 59.0, 61.0, 47.0, 45.0, 40.0, 34.0, 19.0, 19.0, 20.0, 10.0, 15.0, 14.0, 13.0, 7.0, 7.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0002243518829345703, -0.00021751224994659424, -0.00021067261695861816, -0.0002038329839706421, -0.00019699335098266602, -0.00019015371799468994, -0.00018331408500671387, -0.0001764744520187378, -0.00016963481903076172, -0.00016279518604278564, -0.00015595555305480957, -0.0001491159200668335, -0.00014227628707885742, -0.00013543665409088135, -0.00012859702110290527, -0.0001217573881149292, -0.00011491775512695312, -0.00010807812213897705, -0.00010123848915100098, -9.43988561630249e-05, -8.755922317504883e-05, -8.071959018707275e-05, -7.387995719909668e-05, -6.70403242111206e-05, -6.020069122314453e-05, -5.336105823516846e-05, -4.652142524719238e-05, -3.968179225921631e-05, -3.2842159271240234e-05, -2.600252628326416e-05, -1.9162893295288086e-05, -1.2323260307312012e-05, -5.4836273193359375e-06, 1.3560056686401367e-06, 8.195638656616211e-06, 1.5035271644592285e-05, 2.187490463256836e-05, 2.8714537620544434e-05, 3.555417060852051e-05, 4.239380359649658e-05, 4.9233436584472656e-05, 5.607306957244873e-05, 6.29127025604248e-05, 6.975233554840088e-05, 7.659196853637695e-05, 8.343160152435303e-05, 9.02712345123291e-05, 9.711086750030518e-05, 0.00010395050048828125, 0.00011079013347625732, 0.0001176297664642334, 0.00012446939945220947, 0.00013130903244018555, 0.00013814866542816162, 0.0001449882984161377, 0.00015182793140411377, 0.00015866756439208984, 0.00016550719738006592, 0.000172346830368042, 0.00017918646335601807, 0.00018602609634399414, 0.00019286572933197021, 0.0001997053623199463, 0.00020654499530792236, 0.00021338462829589844]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 15.0, 9.0, 11.0, 34.0, 46.0, 75.0, 116.0, 223.0, 334.0, 650.0, 1080.0, 1917.0, 3294.0, 5566.0, 10149.0, 19165.0, 37444.0, 74901.0, 148175.0, 237738.0, 228995.0, 136605.0, 68599.0, 34107.0, 17607.0, 9359.0, 5094.0, 3046.0, 1697.0, 1034.0, 580.0, 374.0, 185.0, 123.0, 81.0, 41.0, 31.0, 24.0, 10.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8291015625, -7.548828125, -7.2685546875, -6.98828125, -6.7080078125, -6.427734375, -6.1474609375, -5.8671875, -5.5869140625, -5.306640625, -5.0263671875, -4.74609375, -4.4658203125, -4.185546875, -3.9052734375, -3.625, -3.3447265625, -3.064453125, -2.7841796875, -2.50390625, -2.2236328125, -1.943359375, -1.6630859375, -1.3828125, -1.1025390625, -0.822265625, -0.5419921875, -0.26171875, 0.0185546875, 0.298828125, 0.5791015625, 0.859375, 1.1396484375, 1.419921875, 1.7001953125, 1.98046875, 2.2607421875, 2.541015625, 2.8212890625, 3.1015625, 3.3818359375, 3.662109375, 3.9423828125, 4.22265625, 4.5029296875, 4.783203125, 5.0634765625, 5.34375, 5.6240234375, 5.904296875, 6.1845703125, 6.46484375, 6.7451171875, 7.025390625, 7.3056640625, 7.5859375, 7.8662109375, 8.146484375, 8.4267578125, 8.70703125, 8.9873046875, 9.267578125, 9.5478515625, 9.828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 11.0, 18.0, 19.0, 19.0, 26.0, 36.0, 37.0, 47.0, 62.0, 50.0, 61.0, 62.0, 60.0, 61.0, 64.0, 54.0, 44.0, 42.0, 36.0, 25.0, 29.0, 15.0, 20.0, 17.0, 15.0, 9.0, 9.0, 12.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -1.98846435546875, -1.9085693359375, -1.82867431640625, -1.748779296875, -1.66888427734375, -1.5889892578125, -1.50909423828125, -1.42919921875, -1.34930419921875, -1.2694091796875, -1.18951416015625, -1.109619140625, -1.02972412109375, -0.9498291015625, -0.86993408203125, -0.7900390625, -0.71014404296875, -0.6302490234375, -0.55035400390625, -0.470458984375, -0.39056396484375, -0.3106689453125, -0.23077392578125, -0.15087890625, -0.07098388671875, 0.0089111328125, 0.08880615234375, 0.168701171875, 0.24859619140625, 0.3284912109375, 0.40838623046875, 0.48828125, 0.56817626953125, 0.6480712890625, 0.72796630859375, 0.807861328125, 0.88775634765625, 0.9676513671875, 1.04754638671875, 1.12744140625, 1.20733642578125, 1.2872314453125, 1.36712646484375, 1.447021484375, 1.52691650390625, 1.6068115234375, 1.68670654296875, 1.7666015625, 1.84649658203125, 1.9263916015625, 2.00628662109375, 2.086181640625, 2.16607666015625, 2.2459716796875, 2.32586669921875, 2.40576171875, 2.48565673828125, 2.5655517578125, 2.64544677734375, 2.725341796875, 2.80523681640625, 2.8851318359375, 2.96502685546875, 3.044921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 5.0, 5.0, 7.0, 9.0, 11.0, 18.0, 21.0, 23.0, 30.0, 41.0, 39.0, 50.0, 53.0, 70.0, 69.0, 78.0, 71.0, 62.0, 45.0, 51.0, 37.0, 38.0, 27.0, 33.0, 20.0, 11.0, 11.0, 8.0, 8.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.962488174438477, -18.337907791137695, -17.713327407836914, -17.088748931884766, -16.464168548583984, -15.839588165283203, -15.215007781982422, -14.590428352355957, -13.965848922729492, -13.341268539428711, -12.716689109802246, -12.092108726501465, -11.467529296875, -10.842948913574219, -10.218368530273438, -9.593789100646973, -8.969208717346191, -8.34462833404541, -7.720048904418945, -7.095468521118164, -6.470889091491699, -5.846308708190918, -5.221728801727295, -4.597148895263672, -3.972568988800049, -3.347989082336426, -2.7234091758728027, -2.0988290309906006, -1.4742491245269775, -0.8496692180633545, -0.22508907318115234, 0.3994908332824707, 1.0240707397460938, 1.6486506462097168, 2.27323055267334, 2.897810697555542, 3.522390604019165, 4.146970748901367, 4.77155065536499, 5.396130561828613, 6.020710468292236, 6.645290374755859, 7.269870281219482, 7.8944501876831055, 8.519030570983887, 9.143610000610352, 9.768190383911133, 10.392770767211914, 11.017350196838379, 11.64193058013916, 12.266510009765625, 12.891090393066406, 13.515669822692871, 14.140250205993652, 14.764829635620117, 15.389410018920898, 16.01399040222168, 16.63857078552246, 17.263151168823242, 17.88772964477539, 18.512310028076172, 19.136890411376953, 19.761470794677734, 20.386051177978516, 21.010629653930664]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 3.0, 4.0, 4.0, 10.0, 14.0, 21.0, 11.0, 10.0, 25.0, 19.0, 22.0, 26.0, 19.0, 30.0, 35.0, 37.0, 35.0, 41.0, 42.0, 43.0, 45.0, 41.0, 41.0, 39.0, 41.0, 41.0, 32.0, 33.0, 44.0, 27.0, 21.0, 16.0, 19.0, 15.0, 17.0, 13.0, 11.0, 7.0, 13.0, 8.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.69821548461914, -14.253523826599121, -13.808832168579102, -13.364140510559082, -12.919448852539062, -12.47475814819336, -12.03006649017334, -11.58537483215332, -11.1406831741333, -10.695991516113281, -10.251299858093262, -9.806608200073242, -9.361917495727539, -8.917224884033203, -8.4725341796875, -8.02784252166748, -7.583150863647461, -7.138459205627441, -6.693767547607422, -6.2490763664245605, -5.804384708404541, -5.3596930503845215, -4.91500186920166, -4.470310211181641, -4.025618553161621, -3.5809268951416016, -3.136235475540161, -2.6915440559387207, -2.246852397918701, -1.8021607398986816, -1.3574693202972412, -0.9127779006958008, -0.46808624267578125, -0.02339470386505127, 0.4212968349456787, 0.8659883737564087, 1.3106799125671387, 1.7553715705871582, 2.2000629901885986, 2.644754409790039, 3.0894460678100586, 3.534137725830078, 3.9788291454315186, 4.423520565032959, 4.8682122230529785, 5.312903881072998, 5.757595062255859, 6.202286720275879, 6.646978378295898, 7.091670036315918, 7.5363616943359375, 7.981052875518799, 8.425745010375977, 8.87043571472168, 9.3151273727417, 9.759819030761719, 10.204510688781738, 10.649202346801758, 11.093894004821777, 11.538585662841797, 11.9832763671875, 12.427968978881836, 12.872659683227539, 13.317351341247559, 13.762042999267578]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 13.0, 17.0, 19.0, 27.0, 48.0, 56.0, 106.0, 135.0, 178.0, 314.0, 480.0, 746.0, 1161.0, 2018.0, 3659.0, 6816.0, 14140.0, 30482.0, 68437.0, 151969.0, 262596.0, 251308.0, 136856.0, 61753.0, 27493.0, 12817.0, 6577.0, 3393.0, 1933.0, 1105.0, 598.0, 431.0, 286.0, 186.0, 110.0, 70.0, 66.0, 36.0, 38.0, 23.0, 15.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.646728515625, -15.10595703125, -14.565185546875, -14.0244140625, -13.483642578125, -12.94287109375, -12.402099609375, -11.861328125, -11.320556640625, -10.77978515625, -10.239013671875, -9.6982421875, -9.157470703125, -8.61669921875, -8.075927734375, -7.53515625, -6.994384765625, -6.45361328125, -5.912841796875, -5.3720703125, -4.831298828125, -4.29052734375, -3.749755859375, -3.208984375, -2.668212890625, -2.12744140625, -1.586669921875, -1.0458984375, -0.505126953125, 0.03564453125, 0.576416015625, 1.1171875, 1.657958984375, 2.19873046875, 2.739501953125, 3.2802734375, 3.821044921875, 4.36181640625, 4.902587890625, 5.443359375, 5.984130859375, 6.52490234375, 7.065673828125, 7.6064453125, 8.147216796875, 8.68798828125, 9.228759765625, 9.76953125, 10.310302734375, 10.85107421875, 11.391845703125, 11.9326171875, 12.473388671875, 13.01416015625, 13.554931640625, 14.095703125, 14.636474609375, 15.17724609375, 15.718017578125, 16.2587890625, 16.799560546875, 17.34033203125, 17.881103515625, 18.421875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 4.0, 17.0, 11.0, 18.0, 17.0, 14.0, 19.0, 18.0, 32.0, 33.0, 33.0, 44.0, 64.0, 48.0, 51.0, 52.0, 48.0, 41.0, 46.0, 47.0, 40.0, 48.0, 35.0, 39.0, 36.0, 16.0, 15.0, 23.0, 13.0, 17.0, 6.0, 4.0, 12.0, 9.0, 3.0, 4.0, 3.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.126708984375, -16.59716796875, -16.067626953125, -15.5380859375, -15.008544921875, -14.47900390625, -13.949462890625, -13.419921875, -12.890380859375, -12.36083984375, -11.831298828125, -11.3017578125, -10.772216796875, -10.24267578125, -9.713134765625, -9.18359375, -8.654052734375, -8.12451171875, -7.594970703125, -7.0654296875, -6.535888671875, -6.00634765625, -5.476806640625, -4.947265625, -4.417724609375, -3.88818359375, -3.358642578125, -2.8291015625, -2.299560546875, -1.77001953125, -1.240478515625, -0.7109375, -0.181396484375, 0.34814453125, 0.877685546875, 1.4072265625, 1.936767578125, 2.46630859375, 2.995849609375, 3.525390625, 4.054931640625, 4.58447265625, 5.114013671875, 5.6435546875, 6.173095703125, 6.70263671875, 7.232177734375, 7.76171875, 8.291259765625, 8.82080078125, 9.350341796875, 9.8798828125, 10.409423828125, 10.93896484375, 11.468505859375, 11.998046875, 12.527587890625, 13.05712890625, 13.586669921875, 14.1162109375, 14.645751953125, 15.17529296875, 15.704833984375, 16.234375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 10.0, 8.0, 13.0, 17.0, 21.0, 41.0, 47.0, 53.0, 90.0, 127.0, 220.0, 277.0, 380.0, 624.0, 903.0, 1403.0, 2253.0, 3641.0, 6101.0, 10755.0, 19021.0, 35761.0, 71014.0, 136522.0, 219324.0, 226600.0, 147096.0, 77666.0, 39164.0, 20789.0, 11413.0, 6471.0, 3862.0, 2360.0, 1510.0, 1013.0, 615.0, 418.0, 274.0, 217.0, 137.0, 81.0, 70.0, 48.0, 40.0, 16.0, 20.0, 10.0, 9.0, 10.0, 8.0, 3.0, 4.0, 3.0, 3.0], "bins": [-18.828125, -18.275390625, -17.72265625, -17.169921875, -16.6171875, -16.064453125, -15.51171875, -14.958984375, -14.40625, -13.853515625, -13.30078125, -12.748046875, -12.1953125, -11.642578125, -11.08984375, -10.537109375, -9.984375, -9.431640625, -8.87890625, -8.326171875, -7.7734375, -7.220703125, -6.66796875, -6.115234375, -5.5625, -5.009765625, -4.45703125, -3.904296875, -3.3515625, -2.798828125, -2.24609375, -1.693359375, -1.140625, -0.587890625, -0.03515625, 0.517578125, 1.0703125, 1.623046875, 2.17578125, 2.728515625, 3.28125, 3.833984375, 4.38671875, 4.939453125, 5.4921875, 6.044921875, 6.59765625, 7.150390625, 7.703125, 8.255859375, 8.80859375, 9.361328125, 9.9140625, 10.466796875, 11.01953125, 11.572265625, 12.125, 12.677734375, 13.23046875, 13.783203125, 14.3359375, 14.888671875, 15.44140625, 15.994140625, 16.546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 7.0, 11.0, 8.0, 9.0, 8.0, 11.0, 13.0, 21.0, 22.0, 25.0, 24.0, 26.0, 25.0, 31.0, 32.0, 41.0, 31.0, 30.0, 35.0, 29.0, 34.0, 45.0, 39.0, 44.0, 30.0, 38.0, 36.0, 37.0, 34.0, 25.0, 23.0, 32.0, 24.0, 19.0, 13.0, 10.0, 16.0, 13.0, 7.0, 6.0, 7.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.0390625, -9.7431640625, -9.447265625, -9.1513671875, -8.85546875, -8.5595703125, -8.263671875, -7.9677734375, -7.671875, -7.3759765625, -7.080078125, -6.7841796875, -6.48828125, -6.1923828125, -5.896484375, -5.6005859375, -5.3046875, -5.0087890625, -4.712890625, -4.4169921875, -4.12109375, -3.8251953125, -3.529296875, -3.2333984375, -2.9375, -2.6416015625, -2.345703125, -2.0498046875, -1.75390625, -1.4580078125, -1.162109375, -0.8662109375, -0.5703125, -0.2744140625, 0.021484375, 0.3173828125, 0.61328125, 0.9091796875, 1.205078125, 1.5009765625, 1.796875, 2.0927734375, 2.388671875, 2.6845703125, 2.98046875, 3.2763671875, 3.572265625, 3.8681640625, 4.1640625, 4.4599609375, 4.755859375, 5.0517578125, 5.34765625, 5.6435546875, 5.939453125, 6.2353515625, 6.53125, 6.8271484375, 7.123046875, 7.4189453125, 7.71484375, 8.0107421875, 8.306640625, 8.6025390625, 8.8984375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 14.0, 25.0, 20.0, 47.0, 61.0, 90.0, 114.0, 181.0, 235.0, 396.0, 596.0, 937.0, 1483.0, 2326.0, 3754.0, 6389.0, 10913.0, 19380.0, 37119.0, 76333.0, 157989.0, 261921.0, 226403.0, 118904.0, 56606.0, 28750.0, 15186.0, 8611.0, 4996.0, 3120.0, 2035.0, 1229.0, 814.0, 524.0, 355.0, 255.0, 156.0, 96.0, 54.0, 40.0, 28.0, 22.0, 12.0, 11.0, 5.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5234375, -10.1925048828125, -9.861572265625, -9.5306396484375, -9.19970703125, -8.8687744140625, -8.537841796875, -8.2069091796875, -7.8759765625, -7.5450439453125, -7.214111328125, -6.8831787109375, -6.55224609375, -6.2213134765625, -5.890380859375, -5.5594482421875, -5.228515625, -4.8975830078125, -4.566650390625, -4.2357177734375, -3.90478515625, -3.5738525390625, -3.242919921875, -2.9119873046875, -2.5810546875, -2.2501220703125, -1.919189453125, -1.5882568359375, -1.25732421875, -0.9263916015625, -0.595458984375, -0.2645263671875, 0.06640625, 0.3973388671875, 0.728271484375, 1.0592041015625, 1.39013671875, 1.7210693359375, 2.052001953125, 2.3829345703125, 2.7138671875, 3.0447998046875, 3.375732421875, 3.7066650390625, 4.03759765625, 4.3685302734375, 4.699462890625, 5.0303955078125, 5.361328125, 5.6922607421875, 6.023193359375, 6.3541259765625, 6.68505859375, 7.0159912109375, 7.346923828125, 7.6778564453125, 8.0087890625, 8.3397216796875, 8.670654296875, 9.0015869140625, 9.33251953125, 9.6634521484375, 9.994384765625, 10.3253173828125, 10.65625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 8.0, 10.0, 14.0, 14.0, 21.0, 17.0, 33.0, 35.0, 37.0, 79.0, 73.0, 111.0, 93.0, 94.0, 80.0, 54.0, 52.0, 36.0, 29.0, 18.0, 14.0, 15.0, 14.0, 8.0, 6.0, 6.0, 1.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.0012760162353515625, -0.0012428909540176392, -0.0012097656726837158, -0.0011766403913497925, -0.0011435151100158691, -0.0011103898286819458, -0.0010772645473480225, -0.0010441392660140991, -0.0010110139846801758, -0.0009778887033462524, -0.0009447634220123291, -0.0009116381406784058, -0.0008785128593444824, -0.0008453875780105591, -0.0008122622966766357, -0.0007791370153427124, -0.0007460117340087891, -0.0007128864526748657, -0.0006797611713409424, -0.000646635890007019, -0.0006135106086730957, -0.0005803853273391724, -0.000547260046005249, -0.0005141347646713257, -0.00048100948333740234, -0.000447884202003479, -0.00041475892066955566, -0.0003816336393356323, -0.000348508358001709, -0.00031538307666778564, -0.0002822577953338623, -0.00024913251399993896, -0.00021600723266601562, -0.00018288195133209229, -0.00014975666999816895, -0.0001166313886642456, -8.350610733032227e-05, -5.0380825996398926e-05, -1.7255544662475586e-05, 1.5869736671447754e-05, 4.8995018005371094e-05, 8.212029933929443e-05, 0.00011524558067321777, 0.0001483708620071411, 0.00018149614334106445, 0.0002146214246749878, 0.00024774670600891113, 0.00028087198734283447, 0.0003139972686767578, 0.00034712255001068115, 0.0003802478313446045, 0.00041337311267852783, 0.00044649839401245117, 0.0004796236753463745, 0.0005127489566802979, 0.0005458742380142212, 0.0005789995193481445, 0.0006121248006820679, 0.0006452500820159912, 0.0006783753633499146, 0.0007115006446838379, 0.0007446259260177612, 0.0007777512073516846, 0.0008108764886856079, 0.0008440017700195312]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 11.0, 11.0, 16.0, 25.0, 43.0, 50.0, 149.0, 192.0, 375.0, 676.0, 1346.0, 2469.0, 5059.0, 10371.0, 23639.0, 56381.0, 143660.0, 312854.0, 283986.0, 121088.0, 47484.0, 20201.0, 9307.0, 4442.0, 2234.0, 1090.0, 586.0, 336.0, 178.0, 93.0, 60.0, 54.0, 27.0, 17.0, 10.0, 8.0, 7.0, 9.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.5804443359375, -12.145263671875, -11.7100830078125, -11.27490234375, -10.8397216796875, -10.404541015625, -9.9693603515625, -9.5341796875, -9.0989990234375, -8.663818359375, -8.2286376953125, -7.79345703125, -7.3582763671875, -6.923095703125, -6.4879150390625, -6.052734375, -5.6175537109375, -5.182373046875, -4.7471923828125, -4.31201171875, -3.8768310546875, -3.441650390625, -3.0064697265625, -2.5712890625, -2.1361083984375, -1.700927734375, -1.2657470703125, -0.83056640625, -0.3953857421875, 0.039794921875, 0.4749755859375, 0.91015625, 1.3453369140625, 1.780517578125, 2.2156982421875, 2.65087890625, 3.0860595703125, 3.521240234375, 3.9564208984375, 4.3916015625, 4.8267822265625, 5.261962890625, 5.6971435546875, 6.13232421875, 6.5675048828125, 7.002685546875, 7.4378662109375, 7.873046875, 8.3082275390625, 8.743408203125, 9.1785888671875, 9.61376953125, 10.0489501953125, 10.484130859375, 10.9193115234375, 11.3544921875, 11.7896728515625, 12.224853515625, 12.6600341796875, 13.09521484375, 13.5303955078125, 13.965576171875, 14.4007568359375, 14.8359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 9.0, 14.0, 9.0, 23.0, 20.0, 25.0, 30.0, 33.0, 35.0, 50.0, 58.0, 55.0, 56.0, 50.0, 55.0, 38.0, 53.0, 51.0, 38.0, 47.0, 41.0, 33.0, 27.0, 23.0, 20.0, 11.0, 13.0, 19.0, 8.0, 5.0, 11.0, 3.0, 3.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.05078125, -1.979644775390625, -1.90850830078125, -1.837371826171875, -1.7662353515625, -1.695098876953125, -1.62396240234375, -1.552825927734375, -1.481689453125, -1.410552978515625, -1.33941650390625, -1.268280029296875, -1.1971435546875, -1.126007080078125, -1.05487060546875, -0.983734130859375, -0.91259765625, -0.841461181640625, -0.77032470703125, -0.699188232421875, -0.6280517578125, -0.556915283203125, -0.48577880859375, -0.414642333984375, -0.343505859375, -0.272369384765625, -0.20123291015625, -0.130096435546875, -0.0589599609375, 0.012176513671875, 0.08331298828125, 0.154449462890625, 0.2255859375, 0.296722412109375, 0.36785888671875, 0.438995361328125, 0.5101318359375, 0.581268310546875, 0.65240478515625, 0.723541259765625, 0.794677734375, 0.865814208984375, 0.93695068359375, 1.008087158203125, 1.0792236328125, 1.150360107421875, 1.22149658203125, 1.292633056640625, 1.36376953125, 1.434906005859375, 1.50604248046875, 1.577178955078125, 1.6483154296875, 1.719451904296875, 1.79058837890625, 1.861724853515625, 1.932861328125, 2.003997802734375, 2.07513427734375, 2.146270751953125, 2.2174072265625, 2.288543701171875, 2.35968017578125, 2.430816650390625, 2.501953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 14.0, 5.0, 18.0, 14.0, 11.0, 15.0, 29.0, 29.0, 37.0, 39.0, 67.0, 69.0, 65.0, 59.0, 56.0, 51.0, 58.0, 50.0, 47.0, 40.0, 37.0, 39.0, 26.0, 19.0, 17.0, 11.0, 7.0, 11.0, 5.0, 8.0, 6.0, 3.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.010011672973633, -18.402679443359375, -17.795345306396484, -17.188013076782227, -16.58068084716797, -15.973347663879395, -15.36601448059082, -14.758682250976562, -14.151349067687988, -13.544015884399414, -12.936683654785156, -12.329350471496582, -11.722017288208008, -11.11468505859375, -10.507351875305176, -9.900018692016602, -9.292686462402344, -8.68535327911377, -8.078021049499512, -7.4706878662109375, -6.8633551597595215, -6.2560224533081055, -5.648689270019531, -5.041356563568115, -4.434023857116699, -3.826691150665283, -3.219358205795288, -2.612025260925293, -2.004692554473877, -1.397359848022461, -0.7900269031524658, -0.1826939582824707, 0.4246368408203125, 1.031969666481018, 1.6393024921417236, 2.2466354370117188, 2.8539681434631348, 3.461300849914551, 4.068634033203125, 4.675966739654541, 5.283299446105957, 5.890632152557373, 6.497964859008789, 7.105298042297363, 7.712630748748779, 8.319963455200195, 8.92729663848877, 9.534629821777344, 10.141962051391602, 10.749295234680176, 11.356627464294434, 11.963960647583008, 12.571292877197266, 13.17862606048584, 13.785959243774414, 14.393291473388672, 15.000624656677246, 15.60795783996582, 16.215290069580078, 16.822622299194336, 17.429956436157227, 18.037288665771484, 18.644620895385742, 19.251955032348633, 19.85928726196289]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 10.0, 8.0, 18.0, 19.0, 20.0, 12.0, 21.0, 20.0, 30.0, 25.0, 23.0, 35.0, 46.0, 50.0, 41.0, 40.0, 49.0, 50.0, 49.0, 41.0, 36.0, 43.0, 37.0, 36.0, 36.0, 28.0, 25.0, 22.0, 23.0, 17.0, 18.0, 14.0, 11.0, 11.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.90999984741211, -18.345932006835938, -17.7818660736084, -17.217798233032227, -16.653732299804688, -16.089664459228516, -15.525596618652344, -14.961529731750488, -14.397462844848633, -13.833395957946777, -13.269329071044922, -12.70526123046875, -12.141194343566895, -11.577127456665039, -11.013059616088867, -10.448992729187012, -9.884925842285156, -9.3208589553833, -8.756792068481445, -8.192724227905273, -7.628657341003418, -7.0645904541015625, -6.500523090362549, -5.936455726623535, -5.37238883972168, -4.808321952819824, -4.2442545890808105, -3.680187463760376, -3.1161203384399414, -2.552053213119507, -1.9879860877990723, -1.4239189624786377, -0.8598537445068359, -0.29578661918640137, 0.2682805061340332, 0.8323476314544678, 1.3964147567749023, 1.960481882095337, 2.5245490074157715, 3.088616132736206, 3.6526832580566406, 4.216750144958496, 4.78081750869751, 5.344884872436523, 5.908951759338379, 6.473018646240234, 7.037086009979248, 7.601153373718262, 8.165220260620117, 8.729287147521973, 9.293354034423828, 9.857421875, 10.421488761901855, 10.985555648803711, 11.549623489379883, 12.113690376281738, 12.677757263183594, 13.24182415008545, 13.805891036987305, 14.369958877563477, 14.934025764465332, 15.498092651367188, 16.06216049194336, 16.6262264251709, 17.19029426574707]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 12.0, 20.0, 19.0, 36.0, 65.0, 90.0, 110.0, 217.0, 297.0, 529.0, 855.0, 1286.0, 2330.0, 4130.0, 7473.0, 14364.0, 29628.0, 67494.0, 178879.0, 511646.0, 1194216.0, 1266170.0, 570786.0, 199934.0, 75704.0, 33069.0, 15899.0, 8128.0, 4505.0, 2550.0, 1509.0, 872.0, 553.0, 339.0, 214.0, 121.0, 85.0, 52.0, 25.0, 20.0, 16.0, 4.0, 8.0, 7.0, 3.0, 9.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.3125, -27.5048828125, -26.697265625, -25.8896484375, -25.08203125, -24.2744140625, -23.466796875, -22.6591796875, -21.8515625, -21.0439453125, -20.236328125, -19.4287109375, -18.62109375, -17.8134765625, -17.005859375, -16.1982421875, -15.390625, -14.5830078125, -13.775390625, -12.9677734375, -12.16015625, -11.3525390625, -10.544921875, -9.7373046875, -8.9296875, -8.1220703125, -7.314453125, -6.5068359375, -5.69921875, -4.8916015625, -4.083984375, -3.2763671875, -2.46875, -1.6611328125, -0.853515625, -0.0458984375, 0.76171875, 1.5693359375, 2.376953125, 3.1845703125, 3.9921875, 4.7998046875, 5.607421875, 6.4150390625, 7.22265625, 8.0302734375, 8.837890625, 9.6455078125, 10.453125, 11.2607421875, 12.068359375, 12.8759765625, 13.68359375, 14.4912109375, 15.298828125, 16.1064453125, 16.9140625, 17.7216796875, 18.529296875, 19.3369140625, 20.14453125, 20.9521484375, 21.759765625, 22.5673828125, 23.375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 5.0, 11.0, 11.0, 15.0, 17.0, 15.0, 9.0, 21.0, 17.0, 26.0, 23.0, 29.0, 31.0, 42.0, 54.0, 44.0, 38.0, 46.0, 49.0, 36.0, 29.0, 44.0, 44.0, 40.0, 40.0, 29.0, 28.0, 29.0, 28.0, 21.0, 19.0, 15.0, 14.0, 11.0, 14.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.171875, -16.653076171875, -16.13427734375, -15.615478515625, -15.0966796875, -14.577880859375, -14.05908203125, -13.540283203125, -13.021484375, -12.502685546875, -11.98388671875, -11.465087890625, -10.9462890625, -10.427490234375, -9.90869140625, -9.389892578125, -8.87109375, -8.352294921875, -7.83349609375, -7.314697265625, -6.7958984375, -6.277099609375, -5.75830078125, -5.239501953125, -4.720703125, -4.201904296875, -3.68310546875, -3.164306640625, -2.6455078125, -2.126708984375, -1.60791015625, -1.089111328125, -0.5703125, -0.051513671875, 0.46728515625, 0.986083984375, 1.5048828125, 2.023681640625, 2.54248046875, 3.061279296875, 3.580078125, 4.098876953125, 4.61767578125, 5.136474609375, 5.6552734375, 6.174072265625, 6.69287109375, 7.211669921875, 7.73046875, 8.249267578125, 8.76806640625, 9.286865234375, 9.8056640625, 10.324462890625, 10.84326171875, 11.362060546875, 11.880859375, 12.399658203125, 12.91845703125, 13.437255859375, 13.9560546875, 14.474853515625, 14.99365234375, 15.512451171875, 16.03125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 11.0, 14.0, 6.0, 19.0, 35.0, 37.0, 61.0, 97.0, 121.0, 190.0, 283.0, 432.0, 634.0, 1035.0, 1638.0, 2463.0, 4036.0, 6465.0, 10369.0, 17493.0, 29766.0, 52881.0, 98563.0, 189743.0, 380010.0, 738514.0, 1056046.0, 769899.0, 398419.0, 198999.0, 103164.0, 55308.0, 30888.0, 18199.0, 10549.0, 6546.0, 4070.0, 2562.0, 1657.0, 1008.0, 691.0, 425.0, 314.0, 184.0, 133.0, 110.0, 71.0, 44.0, 21.0, 19.0, 9.0, 12.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0], "bins": [-26.171875, -25.367431640625, -24.56298828125, -23.758544921875, -22.9541015625, -22.149658203125, -21.34521484375, -20.540771484375, -19.736328125, -18.931884765625, -18.12744140625, -17.322998046875, -16.5185546875, -15.714111328125, -14.90966796875, -14.105224609375, -13.30078125, -12.496337890625, -11.69189453125, -10.887451171875, -10.0830078125, -9.278564453125, -8.47412109375, -7.669677734375, -6.865234375, -6.060791015625, -5.25634765625, -4.451904296875, -3.6474609375, -2.843017578125, -2.03857421875, -1.234130859375, -0.4296875, 0.374755859375, 1.17919921875, 1.983642578125, 2.7880859375, 3.592529296875, 4.39697265625, 5.201416015625, 6.005859375, 6.810302734375, 7.61474609375, 8.419189453125, 9.2236328125, 10.028076171875, 10.83251953125, 11.636962890625, 12.44140625, 13.245849609375, 14.05029296875, 14.854736328125, 15.6591796875, 16.463623046875, 17.26806640625, 18.072509765625, 18.876953125, 19.681396484375, 20.48583984375, 21.290283203125, 22.0947265625, 22.899169921875, 23.70361328125, 24.508056640625, 25.3125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 9.0, 12.0, 17.0, 18.0, 37.0, 34.0, 45.0, 54.0, 64.0, 87.0, 98.0, 149.0, 163.0, 217.0, 215.0, 235.0, 314.0, 311.0, 287.0, 307.0, 248.0, 215.0, 182.0, 141.0, 136.0, 96.0, 86.0, 59.0, 48.0, 32.0, 33.0, 23.0, 15.0, 10.0, 13.0, 9.0, 8.0, 10.0, 6.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-10.5, -10.2086181640625, -9.917236328125, -9.6258544921875, -9.33447265625, -9.0430908203125, -8.751708984375, -8.4603271484375, -8.1689453125, -7.8775634765625, -7.586181640625, -7.2947998046875, -7.00341796875, -6.7120361328125, -6.420654296875, -6.1292724609375, -5.837890625, -5.5465087890625, -5.255126953125, -4.9637451171875, -4.67236328125, -4.3809814453125, -4.089599609375, -3.7982177734375, -3.5068359375, -3.2154541015625, -2.924072265625, -2.6326904296875, -2.34130859375, -2.0499267578125, -1.758544921875, -1.4671630859375, -1.17578125, -0.8843994140625, -0.593017578125, -0.3016357421875, -0.01025390625, 0.2811279296875, 0.572509765625, 0.8638916015625, 1.1552734375, 1.4466552734375, 1.738037109375, 2.0294189453125, 2.32080078125, 2.6121826171875, 2.903564453125, 3.1949462890625, 3.486328125, 3.7777099609375, 4.069091796875, 4.3604736328125, 4.65185546875, 4.9432373046875, 5.234619140625, 5.5260009765625, 5.8173828125, 6.1087646484375, 6.400146484375, 6.6915283203125, 6.98291015625, 7.2742919921875, 7.565673828125, 7.8570556640625, 8.1484375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 3.0, 7.0, 9.0, 7.0, 11.0, 25.0, 15.0, 20.0, 30.0, 36.0, 36.0, 56.0, 80.0, 61.0, 68.0, 72.0, 64.0, 77.0, 52.0, 52.0, 36.0, 35.0, 32.0, 31.0, 14.0, 15.0, 9.0, 8.0, 10.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.50762176513672, -31.463815689086914, -30.420007705688477, -29.376201629638672, -28.332393646240234, -27.28858757019043, -26.244781494140625, -25.200973510742188, -24.157167434692383, -23.113361358642578, -22.06955337524414, -21.025747299194336, -19.98194122314453, -18.938133239746094, -17.89432716369629, -16.850521087646484, -15.806713104248047, -14.762906074523926, -13.719099044799805, -12.67529296875, -11.631485939025879, -10.587678909301758, -9.543872833251953, -8.500065803527832, -7.456258773803711, -6.41245174407959, -5.368645191192627, -4.324838638305664, -3.281031608581543, -2.237224578857422, -1.193418025970459, -0.1496114730834961, 0.8941993713378906, 1.9380061626434326, 2.9818129539489746, 4.0256195068359375, 5.069426536560059, 6.11323356628418, 7.157040119171143, 8.200846672058105, 9.244653701782227, 10.288460731506348, 11.332267761230469, 12.376073837280273, 13.419880867004395, 14.463687896728516, 15.50749397277832, 16.551300048828125, 17.595108032226562, 18.638914108276367, 19.682722091674805, 20.72652816772461, 21.770336151123047, 22.81414222717285, 23.857948303222656, 24.901756286621094, 25.9455623626709, 26.989368438720703, 28.03317642211914, 29.076982498168945, 30.12078857421875, 31.164596557617188, 32.208404541015625, 33.2522087097168, 34.296016693115234]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 5.0, 17.0, 17.0, 19.0, 21.0, 20.0, 16.0, 21.0, 23.0, 38.0, 32.0, 36.0, 44.0, 42.0, 46.0, 49.0, 48.0, 41.0, 38.0, 37.0, 40.0, 38.0, 41.0, 26.0, 41.0, 30.0, 16.0, 32.0, 18.0, 22.0, 16.0, 10.0, 8.0, 5.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.939693450927734, -24.156044006347656, -23.372394561767578, -22.5887451171875, -21.805095672607422, -21.02144432067871, -20.237794876098633, -19.454145431518555, -18.670495986938477, -17.8868465423584, -17.10319709777832, -16.319547653198242, -15.535897254943848, -14.75224781036377, -13.968597412109375, -13.184947967529297, -12.401298522949219, -11.61764907836914, -10.833999633789062, -10.050349235534668, -9.26669979095459, -8.483050346374512, -7.699400424957275, -6.915750503540039, -6.132101058959961, -5.348451614379883, -4.5648016929626465, -3.7811520099639893, -2.997502326965332, -2.213852643966675, -1.4302029609680176, -0.6465530395507812, 0.13709640502929688, 0.9207460880279541, 1.7043957710266113, 2.4880454540252686, 3.271695137023926, 4.055344581604004, 4.83899450302124, 5.622644424438477, 6.406293869018555, 7.189943313598633, 7.973593235015869, 8.757243156433105, 9.540892601013184, 10.324542045593262, 11.108192443847656, 11.891841888427734, 12.675491333007812, 13.45914077758789, 14.242790222167969, 15.026440620422363, 15.810090065002441, 16.593740463256836, 17.377389907836914, 18.161039352416992, 18.94468879699707, 19.72833824157715, 20.511987686157227, 21.295637130737305, 22.079288482666016, 22.862937927246094, 23.646587371826172, 24.43023681640625, 25.213886260986328]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 9.0, 13.0, 13.0, 12.0, 23.0, 42.0, 56.0, 78.0, 128.0, 202.0, 276.0, 441.0, 613.0, 1028.0, 1613.0, 2652.0, 4136.0, 6612.0, 10984.0, 18313.0, 30577.0, 51825.0, 87858.0, 139209.0, 186864.0, 179607.0, 128482.0, 79708.0, 46687.0, 27668.0, 16726.0, 9925.0, 6046.0, 3600.0, 2278.0, 1521.0, 923.0, 610.0, 389.0, 260.0, 177.0, 130.0, 99.0, 55.0, 29.0, 27.0, 15.0, 6.0, 3.0, 11.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4296875, -11.059814453125, -10.68994140625, -10.320068359375, -9.9501953125, -9.580322265625, -9.21044921875, -8.840576171875, -8.470703125, -8.100830078125, -7.73095703125, -7.361083984375, -6.9912109375, -6.621337890625, -6.25146484375, -5.881591796875, -5.51171875, -5.141845703125, -4.77197265625, -4.402099609375, -4.0322265625, -3.662353515625, -3.29248046875, -2.922607421875, -2.552734375, -2.182861328125, -1.81298828125, -1.443115234375, -1.0732421875, -0.703369140625, -0.33349609375, 0.036376953125, 0.40625, 0.776123046875, 1.14599609375, 1.515869140625, 1.8857421875, 2.255615234375, 2.62548828125, 2.995361328125, 3.365234375, 3.735107421875, 4.10498046875, 4.474853515625, 4.8447265625, 5.214599609375, 5.58447265625, 5.954345703125, 6.32421875, 6.694091796875, 7.06396484375, 7.433837890625, 7.8037109375, 8.173583984375, 8.54345703125, 8.913330078125, 9.283203125, 9.653076171875, 10.02294921875, 10.392822265625, 10.7626953125, 11.132568359375, 11.50244140625, 11.872314453125, 12.2421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 11.0, 8.0, 11.0, 17.0, 20.0, 13.0, 27.0, 26.0, 35.0, 34.0, 39.0, 38.0, 43.0, 46.0, 51.0, 64.0, 43.0, 46.0, 42.0, 42.0, 45.0, 43.0, 37.0, 31.0, 30.0, 17.0, 33.0, 23.0, 17.0, 12.0, 10.0, 8.0, 1.0, 5.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.125, -28.220458984375, -27.31591796875, -26.411376953125, -25.5068359375, -24.602294921875, -23.69775390625, -22.793212890625, -21.888671875, -20.984130859375, -20.07958984375, -19.175048828125, -18.2705078125, -17.365966796875, -16.46142578125, -15.556884765625, -14.65234375, -13.747802734375, -12.84326171875, -11.938720703125, -11.0341796875, -10.129638671875, -9.22509765625, -8.320556640625, -7.416015625, -6.511474609375, -5.60693359375, -4.702392578125, -3.7978515625, -2.893310546875, -1.98876953125, -1.084228515625, -0.1796875, 0.724853515625, 1.62939453125, 2.533935546875, 3.4384765625, 4.343017578125, 5.24755859375, 6.152099609375, 7.056640625, 7.961181640625, 8.86572265625, 9.770263671875, 10.6748046875, 11.579345703125, 12.48388671875, 13.388427734375, 14.29296875, 15.197509765625, 16.10205078125, 17.006591796875, 17.9111328125, 18.815673828125, 19.72021484375, 20.624755859375, 21.529296875, 22.433837890625, 23.33837890625, 24.242919921875, 25.1474609375, 26.052001953125, 26.95654296875, 27.861083984375, 28.765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 9.0, 15.0, 7.0, 16.0, 32.0, 22.0, 60.0, 95.0, 128.0, 217.0, 308.0, 481.0, 684.0, 1146.0, 1839.0, 2800.0, 4432.0, 7055.0, 11607.0, 18797.0, 30932.0, 52191.0, 86029.0, 138033.0, 190299.0, 181350.0, 123964.0, 77087.0, 46241.0, 27820.0, 16875.0, 10348.0, 6460.0, 3979.0, 2537.0, 1662.0, 1004.0, 708.0, 464.0, 277.0, 199.0, 122.0, 88.0, 46.0, 43.0, 13.0, 11.0, 7.0, 9.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.40625, -11.976806640625, -11.54736328125, -11.117919921875, -10.6884765625, -10.259033203125, -9.82958984375, -9.400146484375, -8.970703125, -8.541259765625, -8.11181640625, -7.682373046875, -7.2529296875, -6.823486328125, -6.39404296875, -5.964599609375, -5.53515625, -5.105712890625, -4.67626953125, -4.246826171875, -3.8173828125, -3.387939453125, -2.95849609375, -2.529052734375, -2.099609375, -1.670166015625, -1.24072265625, -0.811279296875, -0.3818359375, 0.047607421875, 0.47705078125, 0.906494140625, 1.3359375, 1.765380859375, 2.19482421875, 2.624267578125, 3.0537109375, 3.483154296875, 3.91259765625, 4.342041015625, 4.771484375, 5.200927734375, 5.63037109375, 6.059814453125, 6.4892578125, 6.918701171875, 7.34814453125, 7.777587890625, 8.20703125, 8.636474609375, 9.06591796875, 9.495361328125, 9.9248046875, 10.354248046875, 10.78369140625, 11.213134765625, 11.642578125, 12.072021484375, 12.50146484375, 12.930908203125, 13.3603515625, 13.789794921875, 14.21923828125, 14.648681640625, 15.078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 9.0, 7.0, 8.0, 15.0, 13.0, 10.0, 14.0, 22.0, 16.0, 23.0, 18.0, 35.0, 43.0, 29.0, 35.0, 32.0, 39.0, 49.0, 35.0, 44.0, 31.0, 39.0, 35.0, 44.0, 41.0, 28.0, 30.0, 32.0, 20.0, 33.0, 18.0, 19.0, 17.0, 14.0, 17.0, 10.0, 6.0, 11.0, 9.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.45703125, -12.03125, -11.60546875, -11.1796875, -10.75390625, -10.328125, -9.90234375, -9.4765625, -9.05078125, -8.625, -8.19921875, -7.7734375, -7.34765625, -6.921875, -6.49609375, -6.0703125, -5.64453125, -5.21875, -4.79296875, -4.3671875, -3.94140625, -3.515625, -3.08984375, -2.6640625, -2.23828125, -1.8125, -1.38671875, -0.9609375, -0.53515625, -0.109375, 0.31640625, 0.7421875, 1.16796875, 1.59375, 2.01953125, 2.4453125, 2.87109375, 3.296875, 3.72265625, 4.1484375, 4.57421875, 5.0, 5.42578125, 5.8515625, 6.27734375, 6.703125, 7.12890625, 7.5546875, 7.98046875, 8.40625, 8.83203125, 9.2578125, 9.68359375, 10.109375, 10.53515625, 10.9609375, 11.38671875, 11.8125, 12.23828125, 12.6640625, 13.08984375, 13.515625, 13.94140625, 14.3671875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 12.0, 12.0, 21.0, 25.0, 34.0, 50.0, 61.0, 94.0, 183.0, 241.0, 347.0, 491.0, 816.0, 1286.0, 1961.0, 3228.0, 5137.0, 8720.0, 14963.0, 25925.0, 45220.0, 82037.0, 144422.0, 218299.0, 202728.0, 126528.0, 70935.0, 39343.0, 22209.0, 12907.0, 7579.0, 4533.0, 2961.0, 1847.0, 1140.0, 740.0, 514.0, 299.0, 221.0, 176.0, 100.0, 63.0, 51.0, 29.0, 21.0, 22.0, 9.0, 0.0, 9.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.9547119140625, -6.721923828125, -6.4891357421875, -6.25634765625, -6.0235595703125, -5.790771484375, -5.5579833984375, -5.3251953125, -5.0924072265625, -4.859619140625, -4.6268310546875, -4.39404296875, -4.1612548828125, -3.928466796875, -3.6956787109375, -3.462890625, -3.2301025390625, -2.997314453125, -2.7645263671875, -2.53173828125, -2.2989501953125, -2.066162109375, -1.8333740234375, -1.6005859375, -1.3677978515625, -1.135009765625, -0.9022216796875, -0.66943359375, -0.4366455078125, -0.203857421875, 0.0289306640625, 0.26171875, 0.4945068359375, 0.727294921875, 0.9600830078125, 1.19287109375, 1.4256591796875, 1.658447265625, 1.8912353515625, 2.1240234375, 2.3568115234375, 2.589599609375, 2.8223876953125, 3.05517578125, 3.2879638671875, 3.520751953125, 3.7535400390625, 3.986328125, 4.2191162109375, 4.451904296875, 4.6846923828125, 4.91748046875, 5.1502685546875, 5.383056640625, 5.6158447265625, 5.8486328125, 6.0814208984375, 6.314208984375, 6.5469970703125, 6.77978515625, 7.0125732421875, 7.245361328125, 7.4781494140625, 7.7109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 5.0, 8.0, 7.0, 11.0, 9.0, 9.0, 16.0, 17.0, 17.0, 20.0, 26.0, 28.0, 37.0, 35.0, 48.0, 46.0, 45.0, 46.0, 60.0, 60.0, 44.0, 57.0, 35.0, 48.0, 41.0, 20.0, 24.0, 29.0, 31.0, 19.0, 19.0, 21.0, 16.0, 9.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00023603439331054688, -0.0002270713448524475, -0.00021810829639434814, -0.00020914524793624878, -0.00020018219947814941, -0.00019121915102005005, -0.00018225610256195068, -0.00017329305410385132, -0.00016433000564575195, -0.0001553669571876526, -0.00014640390872955322, -0.00013744086027145386, -0.0001284778118133545, -0.00011951476335525513, -0.00011055171489715576, -0.0001015886664390564, -9.262561798095703e-05, -8.366256952285767e-05, -7.46995210647583e-05, -6.573647260665894e-05, -5.677342414855957e-05, -4.7810375690460205e-05, -3.884732723236084e-05, -2.9884278774261475e-05, -2.092123031616211e-05, -1.1958181858062744e-05, -2.995133399963379e-06, 5.967915058135986e-06, 1.4930963516235352e-05, 2.3894011974334717e-05, 3.285706043243408e-05, 4.182010889053345e-05, 5.078315734863281e-05, 5.974620580673218e-05, 6.870925426483154e-05, 7.767230272293091e-05, 8.663535118103027e-05, 9.559839963912964e-05, 0.000104561448097229, 0.00011352449655532837, 0.00012248754501342773, 0.0001314505934715271, 0.00014041364192962646, 0.00014937669038772583, 0.0001583397388458252, 0.00016730278730392456, 0.00017626583576202393, 0.0001852288842201233, 0.00019419193267822266, 0.00020315498113632202, 0.0002121180295944214, 0.00022108107805252075, 0.00023004412651062012, 0.00023900717496871948, 0.00024797022342681885, 0.0002569332718849182, 0.0002658963203430176, 0.00027485936880111694, 0.0002838224172592163, 0.0002927854657173157, 0.00030174851417541504, 0.0003107115626335144, 0.00031967461109161377, 0.00032863765954971313, 0.0003376007080078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 14.0, 12.0, 18.0, 26.0, 20.0, 35.0, 47.0, 73.0, 89.0, 133.0, 190.0, 259.0, 391.0, 599.0, 966.0, 1513.0, 2695.0, 4784.0, 8878.0, 17392.0, 33713.0, 66818.0, 127241.0, 211496.0, 233087.0, 160009.0, 86267.0, 43468.0, 22223.0, 11331.0, 6016.0, 3265.0, 2003.0, 1206.0, 697.0, 487.0, 312.0, 236.0, 152.0, 114.0, 69.0, 51.0, 39.0, 38.0, 26.0, 15.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.8359375, -9.5303955078125, -9.224853515625, -8.9193115234375, -8.61376953125, -8.3082275390625, -8.002685546875, -7.6971435546875, -7.3916015625, -7.0860595703125, -6.780517578125, -6.4749755859375, -6.16943359375, -5.8638916015625, -5.558349609375, -5.2528076171875, -4.947265625, -4.6417236328125, -4.336181640625, -4.0306396484375, -3.72509765625, -3.4195556640625, -3.114013671875, -2.8084716796875, -2.5029296875, -2.1973876953125, -1.891845703125, -1.5863037109375, -1.28076171875, -0.9752197265625, -0.669677734375, -0.3641357421875, -0.05859375, 0.2469482421875, 0.552490234375, 0.8580322265625, 1.16357421875, 1.4691162109375, 1.774658203125, 2.0802001953125, 2.3857421875, 2.6912841796875, 2.996826171875, 3.3023681640625, 3.60791015625, 3.9134521484375, 4.218994140625, 4.5245361328125, 4.830078125, 5.1356201171875, 5.441162109375, 5.7467041015625, 6.05224609375, 6.3577880859375, 6.663330078125, 6.9688720703125, 7.2744140625, 7.5799560546875, 7.885498046875, 8.1910400390625, 8.49658203125, 8.8021240234375, 9.107666015625, 9.4132080078125, 9.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 8.0, 15.0, 8.0, 19.0, 22.0, 19.0, 31.0, 33.0, 52.0, 66.0, 57.0, 80.0, 72.0, 62.0, 86.0, 62.0, 69.0, 57.0, 36.0, 43.0, 23.0, 19.0, 17.0, 11.0, 7.0, 3.0, 3.0, 4.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.923828125, -3.800445556640625, -3.67706298828125, -3.553680419921875, -3.4302978515625, -3.306915283203125, -3.18353271484375, -3.060150146484375, -2.936767578125, -2.813385009765625, -2.69000244140625, -2.566619873046875, -2.4432373046875, -2.319854736328125, -2.19647216796875, -2.073089599609375, -1.94970703125, -1.826324462890625, -1.70294189453125, -1.579559326171875, -1.4561767578125, -1.332794189453125, -1.20941162109375, -1.086029052734375, -0.962646484375, -0.839263916015625, -0.71588134765625, -0.592498779296875, -0.4691162109375, -0.345733642578125, -0.22235107421875, -0.098968505859375, 0.0244140625, 0.147796630859375, 0.27117919921875, 0.394561767578125, 0.5179443359375, 0.641326904296875, 0.76470947265625, 0.888092041015625, 1.011474609375, 1.134857177734375, 1.25823974609375, 1.381622314453125, 1.5050048828125, 1.628387451171875, 1.75177001953125, 1.875152587890625, 1.99853515625, 2.121917724609375, 2.24530029296875, 2.368682861328125, 2.4920654296875, 2.615447998046875, 2.73883056640625, 2.862213134765625, 2.985595703125, 3.108978271484375, 3.23236083984375, 3.355743408203125, 3.4791259765625, 3.602508544921875, 3.72589111328125, 3.849273681640625, 3.97265625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 6.0, 7.0, 8.0, 5.0, 13.0, 18.0, 24.0, 17.0, 28.0, 30.0, 34.0, 58.0, 66.0, 70.0, 68.0, 74.0, 68.0, 75.0, 46.0, 43.0, 47.0, 38.0, 33.0, 30.0, 20.0, 14.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 0.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.53426742553711, -30.496740341186523, -29.459213256835938, -28.421688079833984, -27.3841609954834, -26.346633911132812, -25.309106826782227, -24.27157974243164, -23.234054565429688, -22.1965274810791, -21.159000396728516, -20.121475219726562, -19.083948135375977, -18.04642105102539, -17.008893966674805, -15.971366882324219, -14.933839797973633, -13.896312713623047, -12.858786582946777, -11.821259498596191, -10.783733367919922, -9.746206283569336, -8.70867919921875, -7.671152591705322, -6.6336259841918945, -5.596099376678467, -4.558572769165039, -3.521045684814453, -2.4835190773010254, -1.4459924697875977, -0.4084653854370117, 0.629061222076416, 1.6665878295898438, 2.7041144371032715, 3.7416412830352783, 4.779168128967285, 5.816694736480713, 6.854221343994141, 7.891748428344727, 8.929275512695312, 9.966801643371582, 11.004328727722168, 12.041854858398438, 13.079381942749023, 14.11690902709961, 15.154435157775879, 16.19196319580078, 17.229488372802734, 18.26701545715332, 19.304542541503906, 20.342069625854492, 21.379596710205078, 22.41712188720703, 23.454648971557617, 24.492176055908203, 25.52970314025879, 26.567230224609375, 27.60475730895996, 28.642284393310547, 29.6798095703125, 30.717336654663086, 31.754863739013672, 32.792388916015625, 33.829917907714844, 34.8674430847168]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 6.0, 10.0, 17.0, 12.0, 19.0, 22.0, 17.0, 22.0, 24.0, 31.0, 34.0, 32.0, 48.0, 36.0, 48.0, 45.0, 47.0, 43.0, 50.0, 37.0, 25.0, 54.0, 40.0, 29.0, 33.0, 34.0, 30.0, 23.0, 21.0, 19.0, 20.0, 13.0, 8.0, 6.0, 6.0, 1.0, 6.0, 8.0, 5.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.265186309814453, -25.455320358276367, -24.64545249938965, -23.835586547851562, -23.025718688964844, -22.215852737426758, -21.405986785888672, -20.596118927001953, -19.786251068115234, -18.97638511657715, -18.16651725769043, -17.356651306152344, -16.546783447265625, -15.736917495727539, -14.927050590515137, -14.117183685302734, -13.307317733764648, -12.497450828552246, -11.687583923339844, -10.877717971801758, -10.067850112915039, -9.257984161376953, -8.44811725616455, -7.638250350952148, -6.828383445739746, -6.018516540527344, -5.208649635314941, -4.398783206939697, -3.588916301727295, -2.7790493965148926, -1.9691829681396484, -1.159316062927246, -0.34944725036621094, 0.46041953563690186, 1.2702863216400146, 2.080152988433838, 2.8900198936462402, 3.6998867988586426, 4.509753227233887, 5.319620132446289, 6.129487037658691, 6.939353942871094, 7.749220848083496, 8.559087753295898, 9.368953704833984, 10.178821563720703, 10.988687515258789, 11.798554420471191, 12.608421325683594, 13.418288230895996, 14.228155136108398, 15.038021087646484, 15.847888946533203, 16.65775489807129, 17.467620849609375, 18.277488708496094, 19.087356567382812, 19.8972225189209, 20.707090377807617, 21.516956329345703, 22.326824188232422, 23.136690139770508, 23.946556091308594, 24.756423950195312, 25.5662899017334]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 6.0, 14.0, 17.0, 46.0, 75.0, 82.0, 123.0, 155.0, 265.0, 383.0, 542.0, 783.0, 1200.0, 1807.0, 2804.0, 4257.0, 6522.0, 10252.0, 16132.0, 25962.0, 42001.0, 66221.0, 99806.0, 137473.0, 159742.0, 148430.0, 114410.0, 76260.0, 48794.0, 30474.0, 19125.0, 12002.0, 7686.0, 4975.0, 3219.0, 2188.0, 1404.0, 950.0, 614.0, 445.0, 281.0, 184.0, 139.0, 95.0, 62.0, 45.0, 30.0, 19.0, 17.0, 6.0, 12.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.28125, -12.8482666015625, -12.415283203125, -11.9822998046875, -11.54931640625, -11.1163330078125, -10.683349609375, -10.2503662109375, -9.8173828125, -9.3843994140625, -8.951416015625, -8.5184326171875, -8.08544921875, -7.6524658203125, -7.219482421875, -6.7864990234375, -6.353515625, -5.9205322265625, -5.487548828125, -5.0545654296875, -4.62158203125, -4.1885986328125, -3.755615234375, -3.3226318359375, -2.8896484375, -2.4566650390625, -2.023681640625, -1.5906982421875, -1.15771484375, -0.7247314453125, -0.291748046875, 0.1412353515625, 0.57421875, 1.0072021484375, 1.440185546875, 1.8731689453125, 2.30615234375, 2.7391357421875, 3.172119140625, 3.6051025390625, 4.0380859375, 4.4710693359375, 4.904052734375, 5.3370361328125, 5.77001953125, 6.2030029296875, 6.635986328125, 7.0689697265625, 7.501953125, 7.9349365234375, 8.367919921875, 8.8009033203125, 9.23388671875, 9.6668701171875, 10.099853515625, 10.5328369140625, 10.9658203125, 11.3988037109375, 11.831787109375, 12.2647705078125, 12.69775390625, 13.1307373046875, 13.563720703125, 13.9967041015625, 14.4296875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 1.0, 11.0, 9.0, 18.0, 12.0, 24.0, 14.0, 20.0, 10.0, 25.0, 31.0, 37.0, 32.0, 37.0, 32.0, 47.0, 51.0, 34.0, 42.0, 45.0, 53.0, 35.0, 38.0, 51.0, 39.0, 23.0, 39.0, 34.0, 25.0, 16.0, 23.0, 19.0, 16.0, 10.0, 10.0, 4.0, 0.0, 4.0, 0.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.609375, -25.796142578125, -24.98291015625, -24.169677734375, -23.3564453125, -22.543212890625, -21.72998046875, -20.916748046875, -20.103515625, -19.290283203125, -18.47705078125, -17.663818359375, -16.8505859375, -16.037353515625, -15.22412109375, -14.410888671875, -13.59765625, -12.784423828125, -11.97119140625, -11.157958984375, -10.3447265625, -9.531494140625, -8.71826171875, -7.905029296875, -7.091796875, -6.278564453125, -5.46533203125, -4.652099609375, -3.8388671875, -3.025634765625, -2.21240234375, -1.399169921875, -0.5859375, 0.227294921875, 1.04052734375, 1.853759765625, 2.6669921875, 3.480224609375, 4.29345703125, 5.106689453125, 5.919921875, 6.733154296875, 7.54638671875, 8.359619140625, 9.1728515625, 9.986083984375, 10.79931640625, 11.612548828125, 12.42578125, 13.239013671875, 14.05224609375, 14.865478515625, 15.6787109375, 16.491943359375, 17.30517578125, 18.118408203125, 18.931640625, 19.744873046875, 20.55810546875, 21.371337890625, 22.1845703125, 22.997802734375, 23.81103515625, 24.624267578125, 25.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 15.0, 17.0, 32.0, 38.0, 65.0, 85.0, 162.0, 210.0, 321.0, 452.0, 736.0, 1086.0, 1661.0, 2532.0, 3972.0, 6493.0, 10435.0, 17102.0, 30064.0, 52919.0, 94874.0, 169773.0, 233563.0, 181432.0, 102643.0, 57358.0, 31881.0, 18644.0, 11256.0, 6724.0, 4260.0, 2658.0, 1699.0, 1129.0, 760.0, 532.0, 307.0, 224.0, 119.0, 116.0, 74.0, 38.0, 24.0, 24.0, 12.0, 8.0, 12.0, 5.0, 0.0, 4.0, 1.0, 1.0], "bins": [-36.53125, -35.474365234375, -34.41748046875, -33.360595703125, -32.3037109375, -31.246826171875, -30.18994140625, -29.133056640625, -28.076171875, -27.019287109375, -25.96240234375, -24.905517578125, -23.8486328125, -22.791748046875, -21.73486328125, -20.677978515625, -19.62109375, -18.564208984375, -17.50732421875, -16.450439453125, -15.3935546875, -14.336669921875, -13.27978515625, -12.222900390625, -11.166015625, -10.109130859375, -9.05224609375, -7.995361328125, -6.9384765625, -5.881591796875, -4.82470703125, -3.767822265625, -2.7109375, -1.654052734375, -0.59716796875, 0.459716796875, 1.5166015625, 2.573486328125, 3.63037109375, 4.687255859375, 5.744140625, 6.801025390625, 7.85791015625, 8.914794921875, 9.9716796875, 11.028564453125, 12.08544921875, 13.142333984375, 14.19921875, 15.256103515625, 16.31298828125, 17.369873046875, 18.4267578125, 19.483642578125, 20.54052734375, 21.597412109375, 22.654296875, 23.711181640625, 24.76806640625, 25.824951171875, 26.8818359375, 27.938720703125, 28.99560546875, 30.052490234375, 31.109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 5.0, 12.0, 7.0, 12.0, 10.0, 14.0, 20.0, 27.0, 20.0, 28.0, 29.0, 28.0, 28.0, 33.0, 34.0, 40.0, 45.0, 40.0, 49.0, 44.0, 36.0, 28.0, 33.0, 36.0, 35.0, 23.0, 30.0, 36.0, 18.0, 31.0, 27.0, 24.0, 15.0, 20.0, 13.0, 14.0, 11.0, 4.0, 9.0, 8.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8125, -15.275146484375, -14.73779296875, -14.200439453125, -13.6630859375, -13.125732421875, -12.58837890625, -12.051025390625, -11.513671875, -10.976318359375, -10.43896484375, -9.901611328125, -9.3642578125, -8.826904296875, -8.28955078125, -7.752197265625, -7.21484375, -6.677490234375, -6.14013671875, -5.602783203125, -5.0654296875, -4.528076171875, -3.99072265625, -3.453369140625, -2.916015625, -2.378662109375, -1.84130859375, -1.303955078125, -0.7666015625, -0.229248046875, 0.30810546875, 0.845458984375, 1.3828125, 1.920166015625, 2.45751953125, 2.994873046875, 3.5322265625, 4.069580078125, 4.60693359375, 5.144287109375, 5.681640625, 6.218994140625, 6.75634765625, 7.293701171875, 7.8310546875, 8.368408203125, 8.90576171875, 9.443115234375, 9.98046875, 10.517822265625, 11.05517578125, 11.592529296875, 12.1298828125, 12.667236328125, 13.20458984375, 13.741943359375, 14.279296875, 14.816650390625, 15.35400390625, 15.891357421875, 16.4287109375, 16.966064453125, 17.50341796875, 18.040771484375, 18.578125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 13.0, 13.0, 16.0, 28.0, 32.0, 48.0, 67.0, 95.0, 137.0, 163.0, 229.0, 362.0, 514.0, 688.0, 1064.0, 1703.0, 2686.0, 4555.0, 8108.0, 14859.0, 28900.0, 57057.0, 114363.0, 202018.0, 242986.0, 174850.0, 93367.0, 46312.0, 23369.0, 12244.0, 6769.0, 3881.0, 2431.0, 1460.0, 992.0, 647.0, 466.0, 314.0, 213.0, 162.0, 106.0, 89.0, 56.0, 27.0, 31.0, 19.0, 12.0, 13.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3515625, -13.8453369140625, -13.339111328125, -12.8328857421875, -12.32666015625, -11.8204345703125, -11.314208984375, -10.8079833984375, -10.3017578125, -9.7955322265625, -9.289306640625, -8.7830810546875, -8.27685546875, -7.7706298828125, -7.264404296875, -6.7581787109375, -6.251953125, -5.7457275390625, -5.239501953125, -4.7332763671875, -4.22705078125, -3.7208251953125, -3.214599609375, -2.7083740234375, -2.2021484375, -1.6959228515625, -1.189697265625, -0.6834716796875, -0.17724609375, 0.3289794921875, 0.835205078125, 1.3414306640625, 1.84765625, 2.3538818359375, 2.860107421875, 3.3663330078125, 3.87255859375, 4.3787841796875, 4.885009765625, 5.3912353515625, 5.8974609375, 6.4036865234375, 6.909912109375, 7.4161376953125, 7.92236328125, 8.4285888671875, 8.934814453125, 9.4410400390625, 9.947265625, 10.4534912109375, 10.959716796875, 11.4659423828125, 11.97216796875, 12.4783935546875, 12.984619140625, 13.4908447265625, 13.9970703125, 14.5032958984375, 15.009521484375, 15.5157470703125, 16.02197265625, 16.5281982421875, 17.034423828125, 17.5406494140625, 18.046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 6.0, 7.0, 5.0, 17.0, 25.0, 24.0, 14.0, 25.0, 38.0, 59.0, 62.0, 54.0, 72.0, 78.0, 65.0, 71.0, 57.0, 54.0, 51.0, 37.0, 37.0, 31.0, 15.0, 18.0, 18.0, 15.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0013484954833984375, -0.001299530267715454, -0.0012505650520324707, -0.0012015998363494873, -0.001152634620666504, -0.0011036694049835205, -0.0010547041893005371, -0.0010057389736175537, -0.0009567737579345703, -0.0009078085422515869, -0.0008588433265686035, -0.0008098781108856201, -0.0007609128952026367, -0.0007119476795196533, -0.0006629824638366699, -0.0006140172481536865, -0.0005650520324707031, -0.0005160868167877197, -0.00046712160110473633, -0.00041815638542175293, -0.00036919116973876953, -0.00032022595405578613, -0.00027126073837280273, -0.00022229552268981934, -0.00017333030700683594, -0.00012436509132385254, -7.539987564086914e-05, -2.6434659957885742e-05, 2.2530555725097656e-05, 7.149577140808105e-05, 0.00012046098709106445, 0.00016942620277404785, 0.00021839141845703125, 0.00026735663414001465, 0.00031632184982299805, 0.00036528706550598145, 0.00041425228118896484, 0.00046321749687194824, 0.0005121827125549316, 0.000561147928237915, 0.0006101131439208984, 0.0006590783596038818, 0.0007080435752868652, 0.0007570087909698486, 0.000805974006652832, 0.0008549392223358154, 0.0009039044380187988, 0.0009528696537017822, 0.0010018348693847656, 0.001050800085067749, 0.0010997653007507324, 0.0011487305164337158, 0.0011976957321166992, 0.0012466609477996826, 0.001295626163482666, 0.0013445913791656494, 0.0013935565948486328, 0.0014425218105316162, 0.0014914870262145996, 0.001540452241897583, 0.0015894174575805664, 0.0016383826732635498, 0.0016873478889465332, 0.0017363131046295166, 0.0017852783203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 13.0, 12.0, 15.0, 23.0, 35.0, 59.0, 45.0, 86.0, 96.0, 121.0, 170.0, 239.0, 327.0, 506.0, 718.0, 1110.0, 1778.0, 3141.0, 5592.0, 10346.0, 20496.0, 44722.0, 99143.0, 200609.0, 277222.0, 197100.0, 96468.0, 43878.0, 20377.0, 10379.0, 5390.0, 3022.0, 1774.0, 1159.0, 713.0, 421.0, 313.0, 256.0, 156.0, 113.0, 105.0, 78.0, 59.0, 36.0, 46.0, 22.0, 16.0, 10.0, 16.0, 10.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.6416015625, -16.095703125, -15.5498046875, -15.00390625, -14.4580078125, -13.912109375, -13.3662109375, -12.8203125, -12.2744140625, -11.728515625, -11.1826171875, -10.63671875, -10.0908203125, -9.544921875, -8.9990234375, -8.453125, -7.9072265625, -7.361328125, -6.8154296875, -6.26953125, -5.7236328125, -5.177734375, -4.6318359375, -4.0859375, -3.5400390625, -2.994140625, -2.4482421875, -1.90234375, -1.3564453125, -0.810546875, -0.2646484375, 0.28125, 0.8271484375, 1.373046875, 1.9189453125, 2.46484375, 3.0107421875, 3.556640625, 4.1025390625, 4.6484375, 5.1943359375, 5.740234375, 6.2861328125, 6.83203125, 7.3779296875, 7.923828125, 8.4697265625, 9.015625, 9.5615234375, 10.107421875, 10.6533203125, 11.19921875, 11.7451171875, 12.291015625, 12.8369140625, 13.3828125, 13.9287109375, 14.474609375, 15.0205078125, 15.56640625, 16.1123046875, 16.658203125, 17.2041015625, 17.75]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 9.0, 15.0, 19.0, 16.0, 23.0, 42.0, 49.0, 51.0, 66.0, 68.0, 101.0, 85.0, 83.0, 60.0, 75.0, 58.0, 48.0, 32.0, 27.0, 19.0, 12.0, 11.0, 10.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.65460205078125, -4.5006103515625, -4.34661865234375, -4.192626953125, -4.03863525390625, -3.8846435546875, -3.73065185546875, -3.57666015625, -3.42266845703125, -3.2686767578125, -3.11468505859375, -2.960693359375, -2.80670166015625, -2.6527099609375, -2.49871826171875, -2.3447265625, -2.19073486328125, -2.0367431640625, -1.88275146484375, -1.728759765625, -1.57476806640625, -1.4207763671875, -1.26678466796875, -1.11279296875, -0.95880126953125, -0.8048095703125, -0.65081787109375, -0.496826171875, -0.34283447265625, -0.1888427734375, -0.03485107421875, 0.119140625, 0.27313232421875, 0.4271240234375, 0.58111572265625, 0.735107421875, 0.88909912109375, 1.0430908203125, 1.19708251953125, 1.35107421875, 1.50506591796875, 1.6590576171875, 1.81304931640625, 1.967041015625, 2.12103271484375, 2.2750244140625, 2.42901611328125, 2.5830078125, 2.73699951171875, 2.8909912109375, 3.04498291015625, 3.198974609375, 3.35296630859375, 3.5069580078125, 3.66094970703125, 3.81494140625, 3.96893310546875, 4.1229248046875, 4.27691650390625, 4.430908203125, 4.58489990234375, 4.7388916015625, 4.89288330078125, 5.046875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 9.0, 1.0, 8.0, 5.0, 9.0, 22.0, 26.0, 30.0, 34.0, 44.0, 50.0, 58.0, 72.0, 66.0, 75.0, 79.0, 71.0, 46.0, 50.0, 52.0, 36.0, 29.0, 30.0, 15.0, 18.0, 14.0, 12.0, 6.0, 7.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.58736038208008, -31.37037467956543, -30.15338897705078, -28.936403274536133, -27.719417572021484, -26.50243377685547, -25.28544807434082, -24.068462371826172, -22.851476669311523, -21.634490966796875, -20.417505264282227, -19.200519561767578, -17.983535766601562, -16.76654815673828, -15.549564361572266, -14.332578659057617, -13.115592956542969, -11.89860725402832, -10.681621551513672, -9.46463680267334, -8.247651100158691, -7.030665397644043, -5.813680171966553, -4.5966949462890625, -3.379709243774414, -2.1627237796783447, -0.9457383155822754, 0.27124714851379395, 1.4882326126098633, 2.7052183151245117, 3.922203540802002, 5.139188766479492, 6.356174468994141, 7.573160171508789, 8.790145874023438, 10.00713062286377, 11.224116325378418, 12.441102027893066, 13.658086776733398, 14.875072479248047, 16.092058181762695, 17.309043884277344, 18.526029586791992, 19.74301528930664, 20.959999084472656, 22.176986694335938, 23.393970489501953, 24.6109561920166, 25.82794189453125, 27.0449275970459, 28.261913299560547, 29.478899002075195, 30.695884704589844, 31.91286849975586, 33.12985610961914, 34.346839904785156, 35.56382751464844, 36.78081130981445, 37.997798919677734, 39.21478271484375, 40.43177032470703, 41.64875411987305, 42.86574172973633, 44.082725524902344, 45.29970932006836]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 6.0, 12.0, 13.0, 17.0, 19.0, 25.0, 31.0, 24.0, 35.0, 38.0, 29.0, 35.0, 30.0, 40.0, 49.0, 48.0, 46.0, 46.0, 46.0, 39.0, 45.0, 30.0, 30.0, 30.0, 41.0, 35.0, 28.0, 21.0, 21.0, 16.0, 6.0, 9.0, 14.0, 8.0, 5.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.42322540283203, -31.32977867126465, -30.236331939697266, -29.142885208129883, -28.0494384765625, -26.955991744995117, -25.862545013427734, -24.76909828186035, -23.67565155029297, -22.582204818725586, -21.488758087158203, -20.39531135559082, -19.301864624023438, -18.208417892456055, -17.114971160888672, -16.02152442932129, -14.928077697753906, -13.834630966186523, -12.74118423461914, -11.647737503051758, -10.554290771484375, -9.460844039916992, -8.36739730834961, -7.273950576782227, -6.180503845214844, -5.087057113647461, -3.993610382080078, -2.9001636505126953, -1.8067169189453125, -0.7132701873779297, 0.3801765441894531, 1.473623275756836, 2.567066192626953, 3.660512924194336, 4.753959655761719, 5.847406387329102, 6.940853118896484, 8.034299850463867, 9.12774658203125, 10.221193313598633, 11.314640045166016, 12.408086776733398, 13.501533508300781, 14.594980239868164, 15.688426971435547, 16.78187370300293, 17.875320434570312, 18.968767166137695, 20.062213897705078, 21.15566062927246, 22.249107360839844, 23.342554092407227, 24.43600082397461, 25.529447555541992, 26.622894287109375, 27.716341018676758, 28.80978775024414, 29.903234481811523, 30.996681213378906, 32.090126037597656, 33.18357467651367, 34.27702331542969, 35.37046813964844, 36.46391296386719, 37.5573616027832]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 6.0, 9.0, 4.0, 19.0, 12.0, 17.0, 23.0, 37.0, 36.0, 47.0, 72.0, 71.0, 100.0, 101.0, 127.0, 166.0, 187.0, 262.0, 372.0, 714.0, 1443.0, 3717.0, 493522.0, 16476.0, 3085.0, 1301.0, 646.0, 382.0, 273.0, 211.0, 161.0, 138.0, 104.0, 93.0, 66.0, 53.0, 56.0, 32.0, 27.0, 22.0, 13.0, 10.0, 10.0, 11.0, 3.0, 5.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-404.01214599609375, -390.50897216796875, -377.00579833984375, -363.5026550292969, -349.9994812011719, -336.4963073730469, -322.9931640625, -309.489990234375, -295.98681640625, -282.483642578125, -268.98046875, -255.47732543945312, -241.97415161132812, -228.47097778320312, -214.9678192138672, -201.46466064453125, -187.96148681640625, -174.45831298828125, -160.9551544189453, -147.45199584960938, -133.94882202148438, -120.4456558227539, -106.94248962402344, -93.43932342529297, -79.9361572265625, -66.43299102783203, -52.92982482910156, -39.426658630371094, -25.923492431640625, -12.420326232910156, 1.0828399658203125, 14.586006164550781, 28.089141845703125, 41.592308044433594, 55.09547424316406, 68.59864044189453, 82.101806640625, 95.60497283935547, 109.10813903808594, 122.6113052368164, 136.11447143554688, 149.61764526367188, 163.1208038330078, 176.62396240234375, 190.12713623046875, 203.63031005859375, 217.1334686279297, 230.63662719726562, 244.13980102539062, 257.6429748535156, 271.1461181640625, 284.6492919921875, 298.1524658203125, 311.6556396484375, 325.1588134765625, 338.6619567871094, 352.1651306152344, 365.6683044433594, 379.17144775390625, 392.67462158203125, 406.17779541015625, 419.68096923828125, 433.18414306640625, 446.6872863769531, 460.1904602050781]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 5.0, 12.0, 18.0, 10.0, 19.0, 24.0, 33.0, 28.0, 34.0, 29.0, 34.0, 38.0, 33.0, 37.0, 45.0, 56.0, 1067.0, 51.0, 49.0, 33.0, 39.0, 42.0, 24.0, 29.0, 43.0, 32.0, 32.0, 18.0, 22.0, 14.0, 6.0, 10.0, 12.0, 10.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1043.31787109375, -1008.0817260742188, -972.8455810546875, -937.6094360351562, -902.373291015625, -867.1371459960938, -831.9010009765625, -796.664794921875, -761.4287109375, -726.1925659179688, -690.9564208984375, -655.7202758789062, -620.484130859375, -585.2479858398438, -550.0118408203125, -514.775634765625, -479.53948974609375, -444.3033447265625, -409.06719970703125, -373.8310546875, -338.59490966796875, -303.3587646484375, -268.1225891113281, -232.88644409179688, -197.65029907226562, -162.41415405273438, -127.1780014038086, -91.94184875488281, -56.70570373535156, -21.469558715820312, 13.7666015625, 49.00274658203125, 84.2388916015625, 119.47503662109375, 154.711181640625, 189.9473419189453, 225.18348693847656, 260.41961669921875, 295.6557922363281, 330.8919372558594, 366.1280822753906, 401.3642272949219, 436.6003723144531, 471.8365478515625, 507.07269287109375, 542.308837890625, 577.5449829101562, 612.7811279296875, 648.0172729492188, 683.25341796875, 718.4895629882812, 753.7257080078125, 788.9618530273438, 824.197998046875, 859.4342041015625, 894.6702880859375, 929.906494140625, 965.1426391601562, 1000.3787841796875, 1035.614990234375, 1070.85107421875, 1106.0872802734375, 1141.3233642578125, 1176.5595703125, 1211.795654296875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 8.0, 12.0, 17.0, 18.0, 19.0, 42.0, 42.0, 64.0, 96.0, 113.0, 185.0, 243.0, 339.0, 493.0, 678.0, 884.0, 1184.0, 1562.0, 2085.0, 3210.0, 9003.0, 31201316.0, 15442.0, 8018.0, 6085.0, 1687.0, 635.0, 489.0, 165.0, 96.0, 62.0, 50.0, 41.0, 35.0, 17.0, 16.0, 8.0, 6.0, 13.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1371.5205078125, -1338.51171875, -1305.5029296875, -1272.4942626953125, -1239.4854736328125, -1206.4766845703125, -1173.4678955078125, -1140.4591064453125, -1107.450439453125, -1074.441650390625, -1041.432861328125, -1008.4241333007812, -975.4154052734375, -942.4066162109375, -909.3978271484375, -876.3890380859375, -843.3802490234375, -810.3714599609375, -777.3627319335938, -744.3539428710938, -711.34521484375, -678.33642578125, -645.32763671875, -612.31884765625, -579.3101196289062, -546.3013305664062, -513.2926025390625, -480.2838134765625, -447.2750549316406, -414.26629638671875, -381.25750732421875, -348.2487487792969, -315.239990234375, -282.2312316894531, -249.2224578857422, -216.21368408203125, -183.20492553710938, -150.1961669921875, -117.18739318847656, -84.17861938476562, -51.16986083984375, -18.161094665527344, 14.847671508789062, 47.85643768310547, 80.86520385742188, 113.87396240234375, 146.8827362060547, 179.89151000976562, 212.9002685546875, 245.90902709960938, 278.91778564453125, 311.92657470703125, 344.9353332519531, 377.944091796875, 410.952880859375, 443.9616394042969, 476.97039794921875, 509.9791564941406, 542.9879150390625, 575.9967041015625, 609.0054931640625, 642.0142211914062, 675.0230102539062, 708.03173828125, 741.04052734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 13.0, 9.0, 7.0, 20.0, 31.0, 29.0, 75.0, 109.0, 234.0, 426.0, 772.0, 1685.0, 3703.0, 8947.0, 23004.0, 63762.0, 200705.0, 726139.0, 3053758.0, 1639213.0, 387557.0, 115909.0, 39638.0, 14573.0, 6070.0, 2545.0, 1189.0, 550.0, 278.0, 199.0, 101.0, 69.0, 41.0, 16.0, 14.0, 15.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.1875, -86.6865234375, -83.185546875, -79.6845703125, -76.18359375, -72.6826171875, -69.181640625, -65.6806640625, -62.1796875, -58.6787109375, -55.177734375, -51.6767578125, -48.17578125, -44.6748046875, -41.173828125, -37.6728515625, -34.171875, -30.6708984375, -27.169921875, -23.6689453125, -20.16796875, -16.6669921875, -13.166015625, -9.6650390625, -6.1640625, -2.6630859375, 0.837890625, 4.3388671875, 7.83984375, 11.3408203125, 14.841796875, 18.3427734375, 21.84375, 25.3447265625, 28.845703125, 32.3466796875, 35.84765625, 39.3486328125, 42.849609375, 46.3505859375, 49.8515625, 53.3525390625, 56.853515625, 60.3544921875, 63.85546875, 67.3564453125, 70.857421875, 74.3583984375, 77.859375, 81.3603515625, 84.861328125, 88.3623046875, 91.86328125, 95.3642578125, 98.865234375, 102.3662109375, 105.8671875, 109.3681640625, 112.869140625, 116.3701171875, 119.87109375, 123.3720703125, 126.873046875, 130.3740234375, 133.875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 4.0, 7.0, 8.0, 15.0, 24.0, 29.0, 20.0, 35.0, 38.0, 56.0, 66.0, 92.0, 95.0, 132.0, 176.0, 191.0, 189.0, 148.0, 132.0, 120.0, 101.0, 62.0, 46.0, 51.0, 31.0, 23.0, 28.0, 19.0, 15.0, 13.0, 6.0, 9.0, 3.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.369873046875, -22.56787109375, -21.765869140625, -20.9638671875, -20.161865234375, -19.35986328125, -18.557861328125, -17.755859375, -16.953857421875, -16.15185546875, -15.349853515625, -14.5478515625, -13.745849609375, -12.94384765625, -12.141845703125, -11.33984375, -10.537841796875, -9.73583984375, -8.933837890625, -8.1318359375, -7.329833984375, -6.52783203125, -5.725830078125, -4.923828125, -4.121826171875, -3.31982421875, -2.517822265625, -1.7158203125, -0.913818359375, -0.11181640625, 0.690185546875, 1.4921875, 2.294189453125, 3.09619140625, 3.898193359375, 4.7001953125, 5.502197265625, 6.30419921875, 7.106201171875, 7.908203125, 8.710205078125, 9.51220703125, 10.314208984375, 11.1162109375, 11.918212890625, 12.72021484375, 13.522216796875, 14.32421875, 15.126220703125, 15.92822265625, 16.730224609375, 17.5322265625, 18.334228515625, 19.13623046875, 19.938232421875, 20.740234375, 21.542236328125, 22.34423828125, 23.146240234375, 23.9482421875, 24.750244140625, 25.55224609375, 26.354248046875, 27.15625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 7.0, 8.0, 6.0, 12.0, 24.0, 44.0, 52.0, 78.0, 138.0, 191.0, 320.0, 464.0, 753.0, 1340.0, 2004.0, 3222.0, 5019.0, 8261.0, 13129.0, 21224.0, 34615.0, 56763.0, 92063.0, 149966.0, 248307.0, 432166.0, 867601.0, 1720361.0, 1244374.0, 582665.0, 318611.0, 188738.0, 114555.0, 70511.0, 43978.0, 26800.0, 16232.0, 10026.0, 6263.0, 3926.0, 2403.0, 1514.0, 985.0, 642.0, 394.0, 257.0, 164.0, 93.0, 73.0, 43.0, 24.0, 17.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.296875, -24.4736328125, -23.650390625, -22.8271484375, -22.00390625, -21.1806640625, -20.357421875, -19.5341796875, -18.7109375, -17.8876953125, -17.064453125, -16.2412109375, -15.41796875, -14.5947265625, -13.771484375, -12.9482421875, -12.125, -11.3017578125, -10.478515625, -9.6552734375, -8.83203125, -8.0087890625, -7.185546875, -6.3623046875, -5.5390625, -4.7158203125, -3.892578125, -3.0693359375, -2.24609375, -1.4228515625, -0.599609375, 0.2236328125, 1.046875, 1.8701171875, 2.693359375, 3.5166015625, 4.33984375, 5.1630859375, 5.986328125, 6.8095703125, 7.6328125, 8.4560546875, 9.279296875, 10.1025390625, 10.92578125, 11.7490234375, 12.572265625, 13.3955078125, 14.21875, 15.0419921875, 15.865234375, 16.6884765625, 17.51171875, 18.3349609375, 19.158203125, 19.9814453125, 20.8046875, 21.6279296875, 22.451171875, 23.2744140625, 24.09765625, 24.9208984375, 25.744140625, 26.5673828125, 27.390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 5.0, 11.0, 7.0, 5.0, 10.0, 15.0, 24.0, 19.0, 31.0, 31.0, 30.0, 61.0, 62.0, 80.0, 96.0, 153.0, 201.0, 213.0, 223.0, 159.0, 119.0, 95.0, 68.0, 49.0, 43.0, 34.0, 32.0, 14.0, 20.0, 17.0, 18.0, 18.0, 10.0, 11.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.484375, -30.496337890625, -29.50830078125, -28.520263671875, -27.5322265625, -26.544189453125, -25.55615234375, -24.568115234375, -23.580078125, -22.592041015625, -21.60400390625, -20.615966796875, -19.6279296875, -18.639892578125, -17.65185546875, -16.663818359375, -15.67578125, -14.687744140625, -13.69970703125, -12.711669921875, -11.7236328125, -10.735595703125, -9.74755859375, -8.759521484375, -7.771484375, -6.783447265625, -5.79541015625, -4.807373046875, -3.8193359375, -2.831298828125, -1.84326171875, -0.855224609375, 0.1328125, 1.120849609375, 2.10888671875, 3.096923828125, 4.0849609375, 5.072998046875, 6.06103515625, 7.049072265625, 8.037109375, 9.025146484375, 10.01318359375, 11.001220703125, 11.9892578125, 12.977294921875, 13.96533203125, 14.953369140625, 15.94140625, 16.929443359375, 17.91748046875, 18.905517578125, 19.8935546875, 20.881591796875, 21.86962890625, 22.857666015625, 23.845703125, 24.833740234375, 25.82177734375, 26.809814453125, 27.7978515625, 28.785888671875, 29.77392578125, 30.761962890625, 31.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 19.0, 23.0, 31.0, 50.0, 90.0, 88.0, 160.0, 222.0, 412.0, 571.0, 964.0, 1767.0, 3330.0, 6068.0, 13239.0, 28929.0, 71104.0, 308014.0, 5654121.0, 120422.0, 43559.0, 19016.0, 9193.0, 4389.0, 2221.0, 1335.0, 852.0, 499.0, 270.0, 161.0, 95.0, 62.0, 44.0, 38.0, 22.0, 9.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-96.25, -92.841796875, -89.43359375, -86.025390625, -82.6171875, -79.208984375, -75.80078125, -72.392578125, -68.984375, -65.576171875, -62.16796875, -58.759765625, -55.3515625, -51.943359375, -48.53515625, -45.126953125, -41.71875, -38.310546875, -34.90234375, -31.494140625, -28.0859375, -24.677734375, -21.26953125, -17.861328125, -14.453125, -11.044921875, -7.63671875, -4.228515625, -0.8203125, 2.587890625, 5.99609375, 9.404296875, 12.8125, 16.220703125, 19.62890625, 23.037109375, 26.4453125, 29.853515625, 33.26171875, 36.669921875, 40.078125, 43.486328125, 46.89453125, 50.302734375, 53.7109375, 57.119140625, 60.52734375, 63.935546875, 67.34375, 70.751953125, 74.16015625, 77.568359375, 80.9765625, 84.384765625, 87.79296875, 91.201171875, 94.609375, 98.017578125, 101.42578125, 104.833984375, 108.2421875, 111.650390625, 115.05859375, 118.466796875, 121.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 16.0, 15.0, 20.0, 13.0, 19.0, 29.0, 40.0, 47.0, 52.0, 74.0, 126.0, 280.0, 480.0, 290.0, 137.0, 79.0, 59.0, 40.0, 43.0, 35.0, 21.0, 27.0, 12.0, 9.0, 18.0, 7.0, 8.0, 6.0, 4.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.6875, -61.462890625, -59.23828125, -57.013671875, -54.7890625, -52.564453125, -50.33984375, -48.115234375, -45.890625, -43.666015625, -41.44140625, -39.216796875, -36.9921875, -34.767578125, -32.54296875, -30.318359375, -28.09375, -25.869140625, -23.64453125, -21.419921875, -19.1953125, -16.970703125, -14.74609375, -12.521484375, -10.296875, -8.072265625, -5.84765625, -3.623046875, -1.3984375, 0.826171875, 3.05078125, 5.275390625, 7.5, 9.724609375, 11.94921875, 14.173828125, 16.3984375, 18.623046875, 20.84765625, 23.072265625, 25.296875, 27.521484375, 29.74609375, 31.970703125, 34.1953125, 36.419921875, 38.64453125, 40.869140625, 43.09375, 45.318359375, 47.54296875, 49.767578125, 51.9921875, 54.216796875, 56.44140625, 58.666015625, 60.890625, 63.115234375, 65.33984375, 67.564453125, 69.7890625, 72.013671875, 74.23828125, 76.462890625, 78.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 7.0, 8.0, 5.0, 5.0, 9.0, 14.0, 21.0, 32.0, 25.0, 35.0, 47.0, 69.0, 118.0, 208.0, 113.0, 71.0, 47.0, 38.0, 22.0, 30.0, 17.0, 19.0, 8.0, 8.0, 9.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2328.625, -2272.683349609375, -2216.741943359375, -2160.80029296875, -2104.858642578125, -2048.917236328125, -1992.9755859375, -1937.033935546875, -1881.0924072265625, -1825.15087890625, -1769.209228515625, -1713.2677001953125, -1657.326171875, -1601.384521484375, -1545.4429931640625, -1489.50146484375, -1433.559814453125, -1377.6182861328125, -1321.6766357421875, -1265.735107421875, -1209.7935791015625, -1153.8519287109375, -1097.910400390625, -1041.96875, -986.02734375, -930.0857543945312, -874.1442260742188, -818.20263671875, -762.2610473632812, -706.3194580078125, -650.3779296875, -594.4363403320312, -538.4947509765625, -482.5531921386719, -426.6116027832031, -370.6700439453125, -314.72845458984375, -258.7868957519531, -202.8453369140625, -146.90374755859375, -90.96218872070312, -35.0206184387207, 20.92095184326172, 76.86251831054688, 132.80409240722656, 188.74566650390625, 244.68722534179688, 300.6288146972656, 356.57037353515625, 412.5119323730469, 468.4535217285156, 524.3950805664062, 580.336669921875, 636.2781982421875, 692.2197875976562, 748.161376953125, 804.1029052734375, 860.0444946289062, 915.9860229492188, 971.9276123046875, 1027.869140625, 1083.810791015625, 1139.7523193359375, 1195.69384765625, 1251.635498046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 8.0, 8.0, 8.0, 14.0, 10.0, 17.0, 13.0, 18.0, 17.0, 22.0, 19.0, 24.0, 32.0, 45.0, 85.0, 137.0, 135.0, 67.0, 45.0, 26.0, 33.0, 28.0, 16.0, 14.0, 19.0, 17.0, 7.0, 17.0, 13.0, 12.0, 11.0, 12.0, 4.0, 3.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1619.1690673828125, -1568.353759765625, -1517.53857421875, -1466.723388671875, -1415.9080810546875, -1365.0927734375, -1314.277587890625, -1263.46240234375, -1212.6470947265625, -1161.831787109375, -1111.0166015625, -1060.201416015625, -1009.3861083984375, -958.5708618164062, -907.755615234375, -856.9403686523438, -806.1251220703125, -755.3098754882812, -704.49462890625, -653.6793823242188, -602.8641357421875, -552.0488891601562, -501.233642578125, -450.41839599609375, -399.6031494140625, -348.78790283203125, -297.97265625, -247.15740966796875, -196.3421630859375, -145.52691650390625, -94.711669921875, -43.89642333984375, 6.9188232421875, 57.73406982421875, 108.54931640625, 159.36456298828125, 210.1798095703125, 260.99505615234375, 311.810302734375, 362.62554931640625, 413.4407958984375, 464.25604248046875, 515.0712890625, 565.8865356445312, 616.7017822265625, 667.5170288085938, 718.332275390625, 769.1475219726562, 819.9627685546875, 870.7780151367188, 921.59326171875, 972.4085083007812, 1023.2237548828125, 1074.0390625, 1124.854248046875, 1175.66943359375, 1226.4847412109375, 1277.300048828125, 1328.115234375, 1378.930419921875, 1429.7457275390625, 1480.56103515625, 1531.376220703125, 1582.19140625, 1633.0067138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 5.0, 7.0, 20.0, 25.0, 39.0, 34.0, 78.0, 78.0, 106.0, 177.0, 246.0, 354.0, 511.0, 707.0, 1070.0, 1549.0, 2381.0, 3852.0, 6641.0, 12263.0, 25934.0, 65140.0, 236079.0, 2929813.0, 701064.0, 123147.0, 41711.0, 18442.0, 9344.0, 5062.0, 3001.0, 1877.0, 1201.0, 811.0, 503.0, 355.0, 203.0, 137.0, 110.0, 69.0, 37.0, 29.0, 27.0, 7.0, 10.0, 6.0, 6.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-17.5625, -17.057373046875, -16.55224609375, -16.047119140625, -15.5419921875, -15.036865234375, -14.53173828125, -14.026611328125, -13.521484375, -13.016357421875, -12.51123046875, -12.006103515625, -11.5009765625, -10.995849609375, -10.49072265625, -9.985595703125, -9.48046875, -8.975341796875, -8.47021484375, -7.965087890625, -7.4599609375, -6.954833984375, -6.44970703125, -5.944580078125, -5.439453125, -4.934326171875, -4.42919921875, -3.924072265625, -3.4189453125, -2.913818359375, -2.40869140625, -1.903564453125, -1.3984375, -0.893310546875, -0.38818359375, 0.116943359375, 0.6220703125, 1.127197265625, 1.63232421875, 2.137451171875, 2.642578125, 3.147705078125, 3.65283203125, 4.157958984375, 4.6630859375, 5.168212890625, 5.67333984375, 6.178466796875, 6.68359375, 7.188720703125, 7.69384765625, 8.198974609375, 8.7041015625, 9.209228515625, 9.71435546875, 10.219482421875, 10.724609375, 11.229736328125, 11.73486328125, 12.239990234375, 12.7451171875, 13.250244140625, 13.75537109375, 14.260498046875, 14.765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 13.0, 16.0, 21.0, 41.0, 44.0, 61.0, 97.0, 150.0, 176.0, 97.0, 74.0, 57.0, 21.0, 28.0, 19.0, 11.0, 9.0, 5.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.7829742431640625, -1.729034423828125, -1.6750946044921875, -1.62115478515625, -1.5672149658203125, -1.513275146484375, -1.4593353271484375, -1.4053955078125, -1.3514556884765625, -1.297515869140625, -1.2435760498046875, -1.18963623046875, -1.1356964111328125, -1.081756591796875, -1.0278167724609375, -0.973876953125, -0.9199371337890625, -0.865997314453125, -0.8120574951171875, -0.75811767578125, -0.7041778564453125, -0.650238037109375, -0.5962982177734375, -0.5423583984375, -0.4884185791015625, -0.434478759765625, -0.3805389404296875, -0.32659912109375, -0.2726593017578125, -0.218719482421875, -0.1647796630859375, -0.11083984375, -0.0569000244140625, -0.002960205078125, 0.0509796142578125, 0.10491943359375, 0.1588592529296875, 0.212799072265625, 0.2667388916015625, 0.3206787109375, 0.3746185302734375, 0.428558349609375, 0.4824981689453125, 0.53643798828125, 0.5903778076171875, 0.644317626953125, 0.6982574462890625, 0.752197265625, 0.8061370849609375, 0.860076904296875, 0.9140167236328125, 0.96795654296875, 1.0218963623046875, 1.075836181640625, 1.1297760009765625, 1.1837158203125, 1.2376556396484375, 1.291595458984375, 1.3455352783203125, 1.39947509765625, 1.4534149169921875, 1.507354736328125, 1.5612945556640625, 1.615234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 14.0, 13.0, 26.0, 44.0, 48.0, 97.0, 138.0, 215.0, 343.0, 621.0, 1085.0, 2132.0, 4519.0, 10977.0, 31461.0, 105320.0, 438597.0, 2344403.0, 972435.0, 198463.0, 52880.0, 17168.0, 6699.0, 3009.0, 1451.0, 807.0, 482.0, 256.0, 199.0, 110.0, 72.0, 60.0, 35.0, 29.0, 19.0, 7.0, 15.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.328125, -17.784912109375, -17.24169921875, -16.698486328125, -16.1552734375, -15.612060546875, -15.06884765625, -14.525634765625, -13.982421875, -13.439208984375, -12.89599609375, -12.352783203125, -11.8095703125, -11.266357421875, -10.72314453125, -10.179931640625, -9.63671875, -9.093505859375, -8.55029296875, -8.007080078125, -7.4638671875, -6.920654296875, -6.37744140625, -5.834228515625, -5.291015625, -4.747802734375, -4.20458984375, -3.661376953125, -3.1181640625, -2.574951171875, -2.03173828125, -1.488525390625, -0.9453125, -0.402099609375, 0.14111328125, 0.684326171875, 1.2275390625, 1.770751953125, 2.31396484375, 2.857177734375, 3.400390625, 3.943603515625, 4.48681640625, 5.030029296875, 5.5732421875, 6.116455078125, 6.65966796875, 7.202880859375, 7.74609375, 8.289306640625, 8.83251953125, 9.375732421875, 9.9189453125, 10.462158203125, 11.00537109375, 11.548583984375, 12.091796875, 12.635009765625, 13.17822265625, 13.721435546875, 14.2646484375, 14.807861328125, 15.35107421875, 15.894287109375, 16.4375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 12.0, 10.0, 15.0, 15.0, 25.0, 28.0, 39.0, 45.0, 53.0, 78.0, 84.0, 103.0, 152.0, 201.0, 226.0, 350.0, 538.0, 614.0, 371.0, 257.0, 194.0, 141.0, 120.0, 85.0, 73.0, 51.0, 47.0, 37.0, 29.0, 18.0, 17.0, 8.0, 9.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.9371337890625, -3.792236328125, -3.6473388671875, -3.50244140625, -3.3575439453125, -3.212646484375, -3.0677490234375, -2.9228515625, -2.7779541015625, -2.633056640625, -2.4881591796875, -2.34326171875, -2.1983642578125, -2.053466796875, -1.9085693359375, -1.763671875, -1.6187744140625, -1.473876953125, -1.3289794921875, -1.18408203125, -1.0391845703125, -0.894287109375, -0.7493896484375, -0.6044921875, -0.4595947265625, -0.314697265625, -0.1697998046875, -0.02490234375, 0.1199951171875, 0.264892578125, 0.4097900390625, 0.5546875, 0.6995849609375, 0.844482421875, 0.9893798828125, 1.13427734375, 1.2791748046875, 1.424072265625, 1.5689697265625, 1.7138671875, 1.8587646484375, 2.003662109375, 2.1485595703125, 2.29345703125, 2.4383544921875, 2.583251953125, 2.7281494140625, 2.873046875, 3.0179443359375, 3.162841796875, 3.3077392578125, 3.45263671875, 3.5975341796875, 3.742431640625, 3.8873291015625, 4.0322265625, 4.1771240234375, 4.322021484375, 4.4669189453125, 4.61181640625, 4.7567138671875, 4.901611328125, 5.0465087890625, 5.19140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 5.0, 10.0, 15.0, 19.0, 24.0, 45.0, 80.0, 108.0, 173.0, 163.0, 126.0, 92.0, 45.0, 30.0, 16.0, 11.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.42622375488281, -55.24839782714844, -53.07057189941406, -50.89274978637695, -48.71492385864258, -46.5370979309082, -44.359275817871094, -42.18144989013672, -40.003623962402344, -37.82579803466797, -35.647972106933594, -33.470149993896484, -31.29232406616211, -29.114498138427734, -26.936674118041992, -24.75885009765625, -22.581024169921875, -20.4031982421875, -18.225374221801758, -16.047550201416016, -13.86972427368164, -11.691899299621582, -9.514074325561523, -7.336249351501465, -5.158424377441406, -2.9805994033813477, -0.8027744293212891, 1.3750505447387695, 3.552875518798828, 5.730700492858887, 7.908525466918945, 10.086350440979004, 12.264175415039062, 14.442000389099121, 16.61982536315918, 18.797649383544922, 20.975475311279297, 23.153301239013672, 25.331125259399414, 27.508949279785156, 29.68677520751953, 31.864601135253906, 34.04242706298828, 36.22024917602539, 38.398075103759766, 40.57590103149414, 42.75372314453125, 44.931549072265625, 47.109375, 49.287200927734375, 51.46502685546875, 53.64284896850586, 55.820674896240234, 57.99850082397461, 60.17632293701172, 62.354148864746094, 64.53197479248047, 66.70980072021484, 68.88762664794922, 71.0654525756836, 73.24327087402344, 75.42109680175781, 77.59892272949219, 79.77674865722656, 81.95457458496094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 21.0, 8.0, 10.0, 23.0, 13.0, 37.0, 31.0, 32.0, 35.0, 42.0, 28.0, 45.0, 39.0, 52.0, 54.0, 62.0, 62.0, 52.0, 43.0, 25.0, 45.0, 38.0, 23.0, 25.0, 29.0, 21.0, 25.0, 17.0, 14.0, 7.0, 5.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.19241714477539, -30.18705940246582, -29.18170166015625, -28.17634391784668, -27.17098617553711, -26.165630340576172, -25.1602725982666, -24.15491485595703, -23.14955711364746, -22.14419937133789, -21.13884162902832, -20.13348388671875, -19.128128051757812, -18.12276840209961, -17.117412567138672, -16.1120548248291, -15.106697082519531, -14.101339340209961, -13.09598159790039, -12.090624809265137, -11.085267066955566, -10.079909324645996, -9.074552536010742, -8.069194793701172, -7.063837051391602, -6.058479309082031, -5.053122043609619, -4.047764778137207, -3.0424070358276367, -2.0370492935180664, -1.0316920280456543, -0.026334762573242188, 0.9790267944335938, 1.984384298324585, 2.989741802215576, 3.9950993061065674, 5.000456809997559, 6.005814552307129, 7.011171817779541, 8.016529083251953, 9.021886825561523, 10.027244567871094, 11.032602310180664, 12.037959098815918, 13.043316841125488, 14.048674583435059, 15.054031372070312, 16.059389114379883, 17.064746856689453, 18.070104598999023, 19.075462341308594, 20.080820083618164, 21.086177825927734, 22.091533660888672, 23.096891403198242, 24.102249145507812, 25.107606887817383, 26.112964630126953, 27.118322372436523, 28.123680114746094, 29.12903594970703, 30.134395599365234, 31.139751434326172, 32.145111083984375, 33.15046691894531]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 10.0, 12.0, 11.0, 21.0, 25.0, 47.0, 59.0, 80.0, 140.0, 228.0, 275.0, 408.0, 633.0, 1043.0, 1718.0, 3112.0, 5529.0, 11378.0, 25982.0, 71632.0, 276606.0, 461411.0, 117017.0, 38520.0, 15531.0, 7439.0, 3851.0, 2249.0, 1268.0, 845.0, 472.0, 289.0, 214.0, 154.0, 92.0, 55.0, 47.0, 53.0, 18.0, 16.0, 15.0, 10.0, 7.0, 8.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.58349609375, -9.2763671875, -8.96923828125, -8.662109375, -8.35498046875, -8.0478515625, -7.74072265625, -7.43359375, -7.12646484375, -6.8193359375, -6.51220703125, -6.205078125, -5.89794921875, -5.5908203125, -5.28369140625, -4.9765625, -4.66943359375, -4.3623046875, -4.05517578125, -3.748046875, -3.44091796875, -3.1337890625, -2.82666015625, -2.51953125, -2.21240234375, -1.9052734375, -1.59814453125, -1.291015625, -0.98388671875, -0.6767578125, -0.36962890625, -0.0625, 0.24462890625, 0.5517578125, 0.85888671875, 1.166015625, 1.47314453125, 1.7802734375, 2.08740234375, 2.39453125, 2.70166015625, 3.0087890625, 3.31591796875, 3.623046875, 3.93017578125, 4.2373046875, 4.54443359375, 4.8515625, 5.15869140625, 5.4658203125, 5.77294921875, 6.080078125, 6.38720703125, 6.6943359375, 7.00146484375, 7.30859375, 7.61572265625, 7.9228515625, 8.22998046875, 8.537109375, 8.84423828125, 9.1513671875, 9.45849609375, 9.765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 10.0, 10.0, 10.0, 14.0, 26.0, 36.0, 37.0, 63.0, 70.0, 84.0, 112.0, 84.0, 86.0, 74.0, 68.0, 54.0, 42.0, 30.0, 18.0, 16.0, 15.0, 10.0, 3.0, 9.0, 0.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.76739501953125, -1.7027587890625, -1.63812255859375, -1.573486328125, -1.50885009765625, -1.4442138671875, -1.37957763671875, -1.31494140625, -1.25030517578125, -1.1856689453125, -1.12103271484375, -1.056396484375, -0.99176025390625, -0.9271240234375, -0.86248779296875, -0.7978515625, -0.73321533203125, -0.6685791015625, -0.60394287109375, -0.539306640625, -0.47467041015625, -0.4100341796875, -0.34539794921875, -0.28076171875, -0.21612548828125, -0.1514892578125, -0.08685302734375, -0.022216796875, 0.04241943359375, 0.1070556640625, 0.17169189453125, 0.236328125, 0.30096435546875, 0.3656005859375, 0.43023681640625, 0.494873046875, 0.55950927734375, 0.6241455078125, 0.68878173828125, 0.75341796875, 0.81805419921875, 0.8826904296875, 0.94732666015625, 1.011962890625, 1.07659912109375, 1.1412353515625, 1.20587158203125, 1.2705078125, 1.33514404296875, 1.3997802734375, 1.46441650390625, 1.529052734375, 1.59368896484375, 1.6583251953125, 1.72296142578125, 1.78759765625, 1.85223388671875, 1.9168701171875, 1.98150634765625, 2.046142578125, 2.11077880859375, 2.1754150390625, 2.24005126953125, 2.3046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 4.0, 4.0, 5.0, 8.0, 17.0, 23.0, 20.0, 37.0, 59.0, 57.0, 85.0, 112.0, 144.0, 229.0, 303.0, 442.0, 713.0, 1075.0, 1694.0, 2705.0, 4583.0, 7969.0, 14973.0, 30149.0, 67757.0, 177061.0, 389585.0, 201773.0, 75674.0, 33261.0, 16278.0, 8875.0, 4912.0, 2779.0, 1787.0, 1120.0, 642.0, 483.0, 335.0, 239.0, 168.0, 99.0, 101.0, 58.0, 40.0, 21.0, 25.0, 27.0, 11.0, 7.0, 8.0, 4.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.46875, -6.24993896484375, -6.0311279296875, -5.81231689453125, -5.593505859375, -5.37469482421875, -5.1558837890625, -4.93707275390625, -4.71826171875, -4.49945068359375, -4.2806396484375, -4.06182861328125, -3.843017578125, -3.62420654296875, -3.4053955078125, -3.18658447265625, -2.9677734375, -2.74896240234375, -2.5301513671875, -2.31134033203125, -2.092529296875, -1.87371826171875, -1.6549072265625, -1.43609619140625, -1.21728515625, -0.99847412109375, -0.7796630859375, -0.56085205078125, -0.342041015625, -0.12322998046875, 0.0955810546875, 0.31439208984375, 0.533203125, 0.75201416015625, 0.9708251953125, 1.18963623046875, 1.408447265625, 1.62725830078125, 1.8460693359375, 2.06488037109375, 2.28369140625, 2.50250244140625, 2.7213134765625, 2.94012451171875, 3.158935546875, 3.37774658203125, 3.5965576171875, 3.81536865234375, 4.0341796875, 4.25299072265625, 4.4718017578125, 4.69061279296875, 4.909423828125, 5.12823486328125, 5.3470458984375, 5.56585693359375, 5.78466796875, 6.00347900390625, 6.2222900390625, 6.44110107421875, 6.659912109375, 6.87872314453125, 7.0975341796875, 7.31634521484375, 7.53515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 0.0, 6.0, 3.0, 8.0, 6.0, 11.0, 9.0, 11.0, 13.0, 11.0, 14.0, 14.0, 25.0, 22.0, 30.0, 42.0, 28.0, 27.0, 25.0, 34.0, 24.0, 33.0, 47.0, 36.0, 33.0, 48.0, 41.0, 34.0, 37.0, 30.0, 29.0, 22.0, 33.0, 28.0, 28.0, 19.0, 17.0, 25.0, 16.0, 12.0, 11.0, 7.0, 9.0, 13.0, 6.0, 5.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0], "bins": [-7.91796875, -7.69134521484375, -7.4647216796875, -7.23809814453125, -7.011474609375, -6.78485107421875, -6.5582275390625, -6.33160400390625, -6.10498046875, -5.87835693359375, -5.6517333984375, -5.42510986328125, -5.198486328125, -4.97186279296875, -4.7452392578125, -4.51861572265625, -4.2919921875, -4.06536865234375, -3.8387451171875, -3.61212158203125, -3.385498046875, -3.15887451171875, -2.9322509765625, -2.70562744140625, -2.47900390625, -2.25238037109375, -2.0257568359375, -1.79913330078125, -1.572509765625, -1.34588623046875, -1.1192626953125, -0.89263916015625, -0.666015625, -0.43939208984375, -0.2127685546875, 0.01385498046875, 0.240478515625, 0.46710205078125, 0.6937255859375, 0.92034912109375, 1.14697265625, 1.37359619140625, 1.6002197265625, 1.82684326171875, 2.053466796875, 2.28009033203125, 2.5067138671875, 2.73333740234375, 2.9599609375, 3.18658447265625, 3.4132080078125, 3.63983154296875, 3.866455078125, 4.09307861328125, 4.3197021484375, 4.54632568359375, 4.77294921875, 4.99957275390625, 5.2261962890625, 5.45281982421875, 5.679443359375, 5.90606689453125, 6.1326904296875, 6.35931396484375, 6.5859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 6.0, 3.0, 6.0, 10.0, 15.0, 28.0, 31.0, 58.0, 61.0, 88.0, 167.0, 292.0, 463.0, 1048.0, 2095.0, 5136.0, 14398.0, 54598.0, 312991.0, 521729.0, 99501.0, 22681.0, 7328.0, 2980.0, 1318.0, 654.0, 327.0, 201.0, 107.0, 63.0, 54.0, 39.0, 27.0, 20.0, 9.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.44921875, -7.2247314453125, -7.000244140625, -6.7757568359375, -6.55126953125, -6.3267822265625, -6.102294921875, -5.8778076171875, -5.6533203125, -5.4288330078125, -5.204345703125, -4.9798583984375, -4.75537109375, -4.5308837890625, -4.306396484375, -4.0819091796875, -3.857421875, -3.6329345703125, -3.408447265625, -3.1839599609375, -2.95947265625, -2.7349853515625, -2.510498046875, -2.2860107421875, -2.0615234375, -1.8370361328125, -1.612548828125, -1.3880615234375, -1.16357421875, -0.9390869140625, -0.714599609375, -0.4901123046875, -0.265625, -0.0411376953125, 0.183349609375, 0.4078369140625, 0.63232421875, 0.8568115234375, 1.081298828125, 1.3057861328125, 1.5302734375, 1.7547607421875, 1.979248046875, 2.2037353515625, 2.42822265625, 2.6527099609375, 2.877197265625, 3.1016845703125, 3.326171875, 3.5506591796875, 3.775146484375, 3.9996337890625, 4.22412109375, 4.4486083984375, 4.673095703125, 4.8975830078125, 5.1220703125, 5.3465576171875, 5.571044921875, 5.7955322265625, 6.02001953125, 6.2445068359375, 6.468994140625, 6.6934814453125, 6.91796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 12.0, 19.0, 23.0, 38.0, 55.0, 64.0, 80.0, 75.0, 92.0, 108.0, 85.0, 81.0, 54.0, 43.0, 33.0, 30.0, 32.0, 16.0, 7.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022423267364501953, -0.00021628104150295258, -0.00020832940936088562, -0.00020037777721881866, -0.0001924261450767517, -0.00018447451293468475, -0.0001765228807926178, -0.00016857124865055084, -0.0001606196165084839, -0.00015266798436641693, -0.00014471635222434998, -0.00013676472008228302, -0.00012881308794021606, -0.00012086145579814911, -0.00011290982365608215, -0.0001049581915140152, -9.700655937194824e-05, -8.905492722988129e-05, -8.110329508781433e-05, -7.315166294574738e-05, -6.520003080368042e-05, -5.7248398661613464e-05, -4.929676651954651e-05, -4.134513437747955e-05, -3.33935022354126e-05, -2.5441870093345642e-05, -1.7490237951278687e-05, -9.538605809211731e-06, -1.5869736671447754e-06, 6.36465847492218e-06, 1.4316290616989136e-05, 2.226792275905609e-05, 3.0219554901123047e-05, 3.817118704319e-05, 4.612281918525696e-05, 5.4074451327323914e-05, 6.202608346939087e-05, 6.997771561145782e-05, 7.792934775352478e-05, 8.588097989559174e-05, 9.383261203765869e-05, 0.00010178424417972565, 0.0001097358763217926, 0.00011768750846385956, 0.00012563914060592651, 0.00013359077274799347, 0.00014154240489006042, 0.00014949403703212738, 0.00015744566917419434, 0.0001653973013162613, 0.00017334893345832825, 0.0001813005656003952, 0.00018925219774246216, 0.00019720382988452911, 0.00020515546202659607, 0.00021310709416866302, 0.00022105872631072998, 0.00022901035845279694, 0.0002369619905948639, 0.00024491362273693085, 0.0002528652548789978, 0.00026081688702106476, 0.0002687685191631317, 0.00027672015130519867, 0.0002846717834472656]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 10.0, 24.0, 25.0, 48.0, 57.0, 121.0, 147.0, 229.0, 365.0, 532.0, 987.0, 1644.0, 3209.0, 6415.0, 13728.0, 33311.0, 93881.0, 286383.0, 383614.0, 140831.0, 46946.0, 18566.0, 8256.0, 4147.0, 2099.0, 1189.0, 671.0, 397.0, 236.0, 162.0, 110.0, 75.0, 40.0, 28.0, 23.0, 12.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.45855712890625, -4.3155517578125, -4.17254638671875, -4.029541015625, -3.88653564453125, -3.7435302734375, -3.60052490234375, -3.45751953125, -3.31451416015625, -3.1715087890625, -3.02850341796875, -2.885498046875, -2.74249267578125, -2.5994873046875, -2.45648193359375, -2.3134765625, -2.17047119140625, -2.0274658203125, -1.88446044921875, -1.741455078125, -1.59844970703125, -1.4554443359375, -1.31243896484375, -1.16943359375, -1.02642822265625, -0.8834228515625, -0.74041748046875, -0.597412109375, -0.45440673828125, -0.3114013671875, -0.16839599609375, -0.025390625, 0.11761474609375, 0.2606201171875, 0.40362548828125, 0.546630859375, 0.68963623046875, 0.8326416015625, 0.97564697265625, 1.11865234375, 1.26165771484375, 1.4046630859375, 1.54766845703125, 1.690673828125, 1.83367919921875, 1.9766845703125, 2.11968994140625, 2.2626953125, 2.40570068359375, 2.5487060546875, 2.69171142578125, 2.834716796875, 2.97772216796875, 3.1207275390625, 3.26373291015625, 3.40673828125, 3.54974365234375, 3.6927490234375, 3.83575439453125, 3.978759765625, 4.12176513671875, 4.2647705078125, 4.40777587890625, 4.55078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 3.0, 5.0, 6.0, 10.0, 12.0, 20.0, 19.0, 31.0, 30.0, 30.0, 43.0, 39.0, 49.0, 60.0, 49.0, 60.0, 63.0, 65.0, 54.0, 50.0, 42.0, 46.0, 39.0, 30.0, 27.0, 23.0, 13.0, 22.0, 13.0, 9.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.895782470703125, -2.78570556640625, -2.675628662109375, -2.5655517578125, -2.455474853515625, -2.34539794921875, -2.235321044921875, -2.125244140625, -2.015167236328125, -1.90509033203125, -1.795013427734375, -1.6849365234375, -1.574859619140625, -1.46478271484375, -1.354705810546875, -1.24462890625, -1.134552001953125, -1.02447509765625, -0.914398193359375, -0.8043212890625, -0.694244384765625, -0.58416748046875, -0.474090576171875, -0.364013671875, -0.253936767578125, -0.14385986328125, -0.033782958984375, 0.0762939453125, 0.186370849609375, 0.29644775390625, 0.406524658203125, 0.5166015625, 0.626678466796875, 0.73675537109375, 0.846832275390625, 0.9569091796875, 1.066986083984375, 1.17706298828125, 1.287139892578125, 1.397216796875, 1.507293701171875, 1.61737060546875, 1.727447509765625, 1.8375244140625, 1.947601318359375, 2.05767822265625, 2.167755126953125, 2.27783203125, 2.387908935546875, 2.49798583984375, 2.608062744140625, 2.7181396484375, 2.828216552734375, 2.93829345703125, 3.048370361328125, 3.158447265625, 3.268524169921875, 3.37860107421875, 3.488677978515625, 3.5987548828125, 3.708831787109375, 3.81890869140625, 3.928985595703125, 4.0390625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 25.0, 80.0, 148.0, 236.0, 219.0, 110.0, 51.0, 35.0, 22.0, 13.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.54007720947266, -60.87861633300781, -57.21715545654297, -53.555694580078125, -49.89423370361328, -46.23277282714844, -42.571311950683594, -38.90985107421875, -35.248390197753906, -31.586929321289062, -27.92546844482422, -24.264007568359375, -20.60254669189453, -16.941085815429688, -13.279624938964844, -9.6181640625, -5.956703186035156, -2.2952423095703125, 1.3662185668945312, 5.027679443359375, 8.689140319824219, 12.350601196289062, 16.012062072753906, 19.67352294921875, 23.334983825683594, 26.996444702148438, 30.65790557861328, 34.319366455078125, 37.98082733154297, 41.64228820800781, 45.303749084472656, 48.9652099609375, 52.62666320800781, 56.288124084472656, 59.9495849609375, 63.611045837402344, 67.27250671386719, 70.93396759033203, 74.59542846679688, 78.25688934326172, 81.91835021972656, 85.5798110961914, 89.24127197265625, 92.9027328491211, 96.56419372558594, 100.22565460205078, 103.88711547851562, 107.54857635498047, 111.21003723144531, 114.87149810791016, 118.532958984375, 122.19441986083984, 125.85588073730469, 129.517333984375, 133.17880249023438, 136.84027099609375, 140.50172424316406, 144.16317749023438, 147.82464599609375, 151.48611450195312, 155.14756774902344, 158.80902099609375, 162.47048950195312, 166.1319580078125, 169.7934112548828]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 6.0, 16.0, 13.0, 24.0, 57.0, 73.0, 118.0, 158.0, 152.0, 117.0, 96.0, 38.0, 34.0, 16.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 7.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.6510467529297, -145.63816833496094, -140.62530517578125, -135.6124267578125, -130.5995635986328, -125.58668518066406, -120.57381439208984, -115.56094360351562, -110.5480728149414, -105.53520202636719, -100.52233123779297, -95.50946044921875, -90.49658203125, -85.48371887207031, -80.47084045410156, -75.45796966552734, -70.44509887695312, -65.4322280883789, -60.41935729980469, -55.4064826965332, -50.393611907958984, -45.380741119384766, -40.36786651611328, -35.35499572753906, -30.342124938964844, -25.329254150390625, -20.316381454467773, -15.303509712219238, -10.290637969970703, -5.277767181396484, -0.2648944854736328, 4.747978210449219, 9.760833740234375, 14.77370548248291, 19.786577224731445, 24.799449920654297, 29.812320709228516, 34.825191497802734, 39.83806610107422, 44.85093688964844, 49.863807678222656, 54.876678466796875, 59.889549255371094, 64.90242004394531, 69.91529846191406, 74.92816162109375, 79.9410400390625, 84.95391082763672, 89.96678161621094, 94.97965240478516, 99.99252319335938, 105.0053939819336, 110.01826477050781, 115.03114318847656, 120.04401397705078, 125.056884765625, 130.06976318359375, 135.0826416015625, 140.0955047607422, 145.10838317871094, 150.12124633789062, 155.13412475585938, 160.14698791503906, 165.1598663330078, 170.1727294921875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 10.0, 7.0, 13.0, 13.0, 19.0, 18.0, 45.0, 48.0, 78.0, 118.0, 160.0, 264.0, 466.0, 796.0, 1350.0, 2708.0, 6093.0, 15899.0, 56108.0, 471244.0, 3477828.0, 117590.0, 26413.0, 9147.0, 3760.0, 1825.0, 944.0, 467.0, 271.0, 192.0, 114.0, 79.0, 57.0, 35.0, 18.0, 21.0, 14.0, 12.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.1875, -30.1884765625, -29.189453125, -28.1904296875, -27.19140625, -26.1923828125, -25.193359375, -24.1943359375, -23.1953125, -22.1962890625, -21.197265625, -20.1982421875, -19.19921875, -18.2001953125, -17.201171875, -16.2021484375, -15.203125, -14.2041015625, -13.205078125, -12.2060546875, -11.20703125, -10.2080078125, -9.208984375, -8.2099609375, -7.2109375, -6.2119140625, -5.212890625, -4.2138671875, -3.21484375, -2.2158203125, -1.216796875, -0.2177734375, 0.78125, 1.7802734375, 2.779296875, 3.7783203125, 4.77734375, 5.7763671875, 6.775390625, 7.7744140625, 8.7734375, 9.7724609375, 10.771484375, 11.7705078125, 12.76953125, 13.7685546875, 14.767578125, 15.7666015625, 16.765625, 17.7646484375, 18.763671875, 19.7626953125, 20.76171875, 21.7607421875, 22.759765625, 23.7587890625, 24.7578125, 25.7568359375, 26.755859375, 27.7548828125, 28.75390625, 29.7529296875, 30.751953125, 31.7509765625, 32.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 10.0, 3.0, 8.0, 15.0, 18.0, 26.0, 40.0, 54.0, 65.0, 79.0, 103.0, 84.0, 102.0, 78.0, 75.0, 59.0, 39.0, 31.0, 31.0, 20.0, 19.0, 8.0, 7.0, 5.0, 4.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.139251708984375, -2.06756591796875, -1.995880126953125, -1.9241943359375, -1.852508544921875, -1.78082275390625, -1.709136962890625, -1.637451171875, -1.565765380859375, -1.49407958984375, -1.422393798828125, -1.3507080078125, -1.279022216796875, -1.20733642578125, -1.135650634765625, -1.06396484375, -0.992279052734375, -0.92059326171875, -0.848907470703125, -0.7772216796875, -0.705535888671875, -0.63385009765625, -0.562164306640625, -0.490478515625, -0.418792724609375, -0.34710693359375, -0.275421142578125, -0.2037353515625, -0.132049560546875, -0.06036376953125, 0.011322021484375, 0.0830078125, 0.154693603515625, 0.22637939453125, 0.298065185546875, 0.3697509765625, 0.441436767578125, 0.51312255859375, 0.584808349609375, 0.656494140625, 0.728179931640625, 0.79986572265625, 0.871551513671875, 0.9432373046875, 1.014923095703125, 1.08660888671875, 1.158294677734375, 1.22998046875, 1.301666259765625, 1.37335205078125, 1.445037841796875, 1.5167236328125, 1.588409423828125, 1.66009521484375, 1.731781005859375, 1.803466796875, 1.875152587890625, 1.94683837890625, 2.018524169921875, 2.0902099609375, 2.161895751953125, 2.23358154296875, 2.305267333984375, 2.376953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 19.0, 22.0, 31.0, 49.0, 61.0, 104.0, 180.0, 286.0, 581.0, 1125.0, 2374.0, 5587.0, 15007.0, 50451.0, 254989.0, 3187679.0, 556573.0, 83745.0, 21907.0, 7410.0, 3076.0, 1384.0, 706.0, 342.0, 188.0, 122.0, 84.0, 41.0, 33.0, 27.0, 20.0, 14.0, 6.0, 12.0, 8.0, 0.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.4375, -31.474365234375, -30.51123046875, -29.548095703125, -28.5849609375, -27.621826171875, -26.65869140625, -25.695556640625, -24.732421875, -23.769287109375, -22.80615234375, -21.843017578125, -20.8798828125, -19.916748046875, -18.95361328125, -17.990478515625, -17.02734375, -16.064208984375, -15.10107421875, -14.137939453125, -13.1748046875, -12.211669921875, -11.24853515625, -10.285400390625, -9.322265625, -8.359130859375, -7.39599609375, -6.432861328125, -5.4697265625, -4.506591796875, -3.54345703125, -2.580322265625, -1.6171875, -0.654052734375, 0.30908203125, 1.272216796875, 2.2353515625, 3.198486328125, 4.16162109375, 5.124755859375, 6.087890625, 7.051025390625, 8.01416015625, 8.977294921875, 9.9404296875, 10.903564453125, 11.86669921875, 12.829833984375, 13.79296875, 14.756103515625, 15.71923828125, 16.682373046875, 17.6455078125, 18.608642578125, 19.57177734375, 20.534912109375, 21.498046875, 22.461181640625, 23.42431640625, 24.387451171875, 25.3505859375, 26.313720703125, 27.27685546875, 28.239990234375, 29.203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 6.0, 5.0, 13.0, 14.0, 28.0, 35.0, 34.0, 56.0, 101.0, 153.0, 274.0, 754.0, 1588.0, 429.0, 223.0, 123.0, 78.0, 39.0, 36.0, 25.0, 12.0, 11.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.937103271484375, -6.76483154296875, -6.592559814453125, -6.4202880859375, -6.248016357421875, -6.07574462890625, -5.903472900390625, -5.731201171875, -5.558929443359375, -5.38665771484375, -5.214385986328125, -5.0421142578125, -4.869842529296875, -4.69757080078125, -4.525299072265625, -4.35302734375, -4.180755615234375, -4.00848388671875, -3.836212158203125, -3.6639404296875, -3.491668701171875, -3.31939697265625, -3.147125244140625, -2.974853515625, -2.802581787109375, -2.63031005859375, -2.458038330078125, -2.2857666015625, -2.113494873046875, -1.94122314453125, -1.768951416015625, -1.5966796875, -1.424407958984375, -1.25213623046875, -1.079864501953125, -0.9075927734375, -0.735321044921875, -0.56304931640625, -0.390777587890625, -0.218505859375, -0.046234130859375, 0.12603759765625, 0.298309326171875, 0.4705810546875, 0.642852783203125, 0.81512451171875, 0.987396240234375, 1.15966796875, 1.331939697265625, 1.50421142578125, 1.676483154296875, 1.8487548828125, 2.021026611328125, 2.19329833984375, 2.365570068359375, 2.537841796875, 2.710113525390625, 2.88238525390625, 3.054656982421875, 3.2269287109375, 3.399200439453125, 3.57147216796875, 3.743743896484375, 3.916015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 15.0, 15.0, 27.0, 50.0, 82.0, 130.0, 175.0, 188.0, 155.0, 76.0, 41.0, 12.0, 14.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.660587310791016, -58.139892578125, -56.61920166015625, -55.098506927490234, -53.57781219482422, -52.05712127685547, -50.53642654418945, -49.01573181152344, -47.49504089355469, -45.97434616088867, -44.45365524291992, -42.932960510253906, -41.412269592285156, -39.89157485961914, -38.370880126953125, -36.850189208984375, -35.32949447631836, -33.808799743652344, -32.288108825683594, -30.767414093017578, -29.246721267700195, -27.726028442382812, -26.205333709716797, -24.684640884399414, -23.16394805908203, -21.64325523376465, -20.122562408447266, -18.60186767578125, -17.081174850463867, -15.560482025146484, -14.039788246154785, -12.519094467163086, -10.998405456542969, -9.477712631225586, -7.957018852233887, -6.436325550079346, -4.915632247924805, -3.3949389457702637, -1.8742456436157227, -0.35355186462402344, 1.1671409606933594, 2.6878342628479004, 4.208527565002441, 5.729220867156982, 7.249914169311523, 8.770606994628906, 10.291300773620605, 11.811994552612305, 13.332687377929688, 14.85338020324707, 16.374073028564453, 17.89476776123047, 19.41546058654785, 20.936153411865234, 22.45684814453125, 23.977540969848633, 25.498233795166016, 27.0189266204834, 28.53961944580078, 30.060314178466797, 31.58100700378418, 33.10169982910156, 34.62239456176758, 36.143089294433594, 37.663780212402344]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 10.0, 6.0, 9.0, 10.0, 11.0, 20.0, 20.0, 31.0, 35.0, 27.0, 32.0, 32.0, 36.0, 44.0, 50.0, 51.0, 38.0, 51.0, 56.0, 54.0, 38.0, 40.0, 29.0, 34.0, 27.0, 35.0, 26.0, 16.0, 26.0, 14.0, 16.0, 14.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-18.467355728149414, -17.914037704467773, -17.360721588134766, -16.807403564453125, -16.254085540771484, -15.700767517089844, -15.14745044708252, -14.594133377075195, -14.040815353393555, -13.487497329711914, -12.93418025970459, -12.380863189697266, -11.827545166015625, -11.274227142333984, -10.72091007232666, -10.167593002319336, -9.614274978637695, -9.060956954956055, -8.50763988494873, -7.954322338104248, -7.401004791259766, -6.847687244415283, -6.294369697570801, -5.741052150726318, -5.187734603881836, -4.6344170570373535, -4.081099510192871, -3.5277819633483887, -2.9744644165039062, -2.421146869659424, -1.8678293228149414, -1.314511775970459, -0.7611923217773438, -0.20787477493286133, 0.3454427719116211, 0.8987603187561035, 1.452077865600586, 2.0053954124450684, 2.558712959289551, 3.112030506134033, 3.6653480529785156, 4.218665599822998, 4.7719831466674805, 5.325300693511963, 5.878618240356445, 6.431935787200928, 6.98525333404541, 7.538570880889893, 8.091888427734375, 8.645206451416016, 9.19852352142334, 9.751840591430664, 10.305158615112305, 10.858476638793945, 11.41179370880127, 11.965110778808594, 12.518428802490234, 13.071746826171875, 13.6250638961792, 14.178380966186523, 14.731698989868164, 15.285017013549805, 15.838334083557129, 16.391651153564453, 16.944969177246094]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 13.0, 21.0, 30.0, 37.0, 69.0, 117.0, 214.0, 342.0, 581.0, 992.0, 1794.0, 3718.0, 7377.0, 16585.0, 43383.0, 143941.0, 489449.0, 234747.0, 63120.0, 22464.0, 9783.0, 4570.0, 2190.0, 1226.0, 705.0, 403.0, 250.0, 132.0, 85.0, 60.0, 49.0, 32.0, 14.0, 15.0, 5.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.4505615234375, -11.924560546875, -11.3985595703125, -10.87255859375, -10.3465576171875, -9.820556640625, -9.2945556640625, -8.7685546875, -8.2425537109375, -7.716552734375, -7.1905517578125, -6.66455078125, -6.1385498046875, -5.612548828125, -5.0865478515625, -4.560546875, -4.0345458984375, -3.508544921875, -2.9825439453125, -2.45654296875, -1.9305419921875, -1.404541015625, -0.8785400390625, -0.3525390625, 0.1734619140625, 0.699462890625, 1.2254638671875, 1.75146484375, 2.2774658203125, 2.803466796875, 3.3294677734375, 3.85546875, 4.3814697265625, 4.907470703125, 5.4334716796875, 5.95947265625, 6.4854736328125, 7.011474609375, 7.5374755859375, 8.0634765625, 8.5894775390625, 9.115478515625, 9.6414794921875, 10.16748046875, 10.6934814453125, 11.219482421875, 11.7454833984375, 12.271484375, 12.7974853515625, 13.323486328125, 13.8494873046875, 14.37548828125, 14.9014892578125, 15.427490234375, 15.9534912109375, 16.4794921875, 17.0054931640625, 17.531494140625, 18.0574951171875, 18.58349609375, 19.1094970703125, 19.635498046875, 20.1614990234375, 20.6875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 10.0, 13.0, 28.0, 19.0, 25.0, 45.0, 33.0, 47.0, 46.0, 62.0, 69.0, 65.0, 60.0, 62.0, 59.0, 58.0, 51.0, 48.0, 43.0, 23.0, 18.0, 20.0, 14.0, 13.0, 9.0, 12.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.0162353515625, -1.960205078125, -1.9041748046875, -1.84814453125, -1.7921142578125, -1.736083984375, -1.6800537109375, -1.6240234375, -1.5679931640625, -1.511962890625, -1.4559326171875, -1.39990234375, -1.3438720703125, -1.287841796875, -1.2318115234375, -1.17578125, -1.1197509765625, -1.063720703125, -1.0076904296875, -0.95166015625, -0.8956298828125, -0.839599609375, -0.7835693359375, -0.7275390625, -0.6715087890625, -0.615478515625, -0.5594482421875, -0.50341796875, -0.4473876953125, -0.391357421875, -0.3353271484375, -0.279296875, -0.2232666015625, -0.167236328125, -0.1112060546875, -0.05517578125, 0.0008544921875, 0.056884765625, 0.1129150390625, 0.1689453125, 0.2249755859375, 0.281005859375, 0.3370361328125, 0.39306640625, 0.4490966796875, 0.505126953125, 0.5611572265625, 0.6171875, 0.6732177734375, 0.729248046875, 0.7852783203125, 0.84130859375, 0.8973388671875, 0.953369140625, 1.0093994140625, 1.0654296875, 1.1214599609375, 1.177490234375, 1.2335205078125, 1.28955078125, 1.3455810546875, 1.401611328125, 1.4576416015625, 1.513671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 14.0, 11.0, 18.0, 21.0, 30.0, 43.0, 80.0, 87.0, 146.0, 221.0, 365.0, 600.0, 924.0, 1488.0, 2620.0, 4918.0, 10007.0, 22181.0, 59369.0, 202276.0, 455043.0, 189213.0, 57022.0, 21353.0, 9437.0, 4638.0, 2537.0, 1553.0, 844.0, 515.0, 351.0, 218.0, 138.0, 78.0, 57.0, 47.0, 25.0, 15.0, 11.0, 13.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.53125, -12.1568603515625, -11.782470703125, -11.4080810546875, -11.03369140625, -10.6593017578125, -10.284912109375, -9.9105224609375, -9.5361328125, -9.1617431640625, -8.787353515625, -8.4129638671875, -8.03857421875, -7.6641845703125, -7.289794921875, -6.9154052734375, -6.541015625, -6.1666259765625, -5.792236328125, -5.4178466796875, -5.04345703125, -4.6690673828125, -4.294677734375, -3.9202880859375, -3.5458984375, -3.1715087890625, -2.797119140625, -2.4227294921875, -2.04833984375, -1.6739501953125, -1.299560546875, -0.9251708984375, -0.55078125, -0.1763916015625, 0.197998046875, 0.5723876953125, 0.94677734375, 1.3211669921875, 1.695556640625, 2.0699462890625, 2.4443359375, 2.8187255859375, 3.193115234375, 3.5675048828125, 3.94189453125, 4.3162841796875, 4.690673828125, 5.0650634765625, 5.439453125, 5.8138427734375, 6.188232421875, 6.5626220703125, 6.93701171875, 7.3114013671875, 7.685791015625, 8.0601806640625, 8.4345703125, 8.8089599609375, 9.183349609375, 9.5577392578125, 9.93212890625, 10.3065185546875, 10.680908203125, 11.0552978515625, 11.4296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 4.0, 1.0, 6.0, 7.0, 14.0, 16.0, 14.0, 22.0, 30.0, 48.0, 41.0, 45.0, 40.0, 53.0, 54.0, 51.0, 66.0, 56.0, 55.0, 63.0, 54.0, 53.0, 46.0, 26.0, 21.0, 24.0, 20.0, 18.0, 17.0, 9.0, 9.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.1328125, -9.862548828125, -9.59228515625, -9.322021484375, -9.0517578125, -8.781494140625, -8.51123046875, -8.240966796875, -7.970703125, -7.700439453125, -7.43017578125, -7.159912109375, -6.8896484375, -6.619384765625, -6.34912109375, -6.078857421875, -5.80859375, -5.538330078125, -5.26806640625, -4.997802734375, -4.7275390625, -4.457275390625, -4.18701171875, -3.916748046875, -3.646484375, -3.376220703125, -3.10595703125, -2.835693359375, -2.5654296875, -2.295166015625, -2.02490234375, -1.754638671875, -1.484375, -1.214111328125, -0.94384765625, -0.673583984375, -0.4033203125, -0.133056640625, 0.13720703125, 0.407470703125, 0.677734375, 0.947998046875, 1.21826171875, 1.488525390625, 1.7587890625, 2.029052734375, 2.29931640625, 2.569580078125, 2.83984375, 3.110107421875, 3.38037109375, 3.650634765625, 3.9208984375, 4.191162109375, 4.46142578125, 4.731689453125, 5.001953125, 5.272216796875, 5.54248046875, 5.812744140625, 6.0830078125, 6.353271484375, 6.62353515625, 6.893798828125, 7.1640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 8.0, 14.0, 23.0, 37.0, 60.0, 86.0, 123.0, 217.0, 377.0, 711.0, 1263.0, 2367.0, 4990.0, 11385.0, 27607.0, 74068.0, 196933.0, 352563.0, 229610.0, 88357.0, 32985.0, 13117.0, 5726.0, 2712.0, 1402.0, 754.0, 422.0, 252.0, 157.0, 70.0, 53.0, 30.0, 23.0, 14.0, 13.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -7.01629638671875, -6.7708740234375, -6.52545166015625, -6.280029296875, -6.03460693359375, -5.7891845703125, -5.54376220703125, -5.29833984375, -5.05291748046875, -4.8074951171875, -4.56207275390625, -4.316650390625, -4.07122802734375, -3.8258056640625, -3.58038330078125, -3.3349609375, -3.08953857421875, -2.8441162109375, -2.59869384765625, -2.353271484375, -2.10784912109375, -1.8624267578125, -1.61700439453125, -1.37158203125, -1.12615966796875, -0.8807373046875, -0.63531494140625, -0.389892578125, -0.14447021484375, 0.1009521484375, 0.34637451171875, 0.591796875, 0.83721923828125, 1.0826416015625, 1.32806396484375, 1.573486328125, 1.81890869140625, 2.0643310546875, 2.30975341796875, 2.55517578125, 2.80059814453125, 3.0460205078125, 3.29144287109375, 3.536865234375, 3.78228759765625, 4.0277099609375, 4.27313232421875, 4.5185546875, 4.76397705078125, 5.0093994140625, 5.25482177734375, 5.500244140625, 5.74566650390625, 5.9910888671875, 6.23651123046875, 6.48193359375, 6.72735595703125, 6.9727783203125, 7.21820068359375, 7.463623046875, 7.70904541015625, 7.9544677734375, 8.19989013671875, 8.4453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 6.0, 11.0, 21.0, 74.0, 198.0, 309.0, 205.0, 80.0, 30.0, 18.0, 6.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.0011673569679260254, -0.0011216402053833008, -0.0010759234428405762, -0.0010302066802978516, -0.000984489917755127, -0.0009387731552124023, -0.0008930563926696777, -0.0008473396301269531, -0.0008016228675842285, -0.0007559061050415039, -0.0007101893424987793, -0.0006644725799560547, -0.0006187558174133301, -0.0005730390548706055, -0.0005273222923278809, -0.00048160552978515625, -0.00043588876724243164, -0.00039017200469970703, -0.0003444552421569824, -0.0002987384796142578, -0.0002530217170715332, -0.0002073049545288086, -0.00016158819198608398, -0.00011587142944335938, -7.015466690063477e-05, -2.4437904357910156e-05, 2.1278858184814453e-05, 6.699562072753906e-05, 0.00011271238327026367, 0.00015842914581298828, 0.0002041459083557129, 0.0002498626708984375, 0.0002955794334411621, 0.0003412961959838867, 0.00038701295852661133, 0.00043272972106933594, 0.00047844648361206055, 0.0005241632461547852, 0.0005698800086975098, 0.0006155967712402344, 0.000661313533782959, 0.0007070302963256836, 0.0007527470588684082, 0.0007984638214111328, 0.0008441805839538574, 0.000889897346496582, 0.0009356141090393066, 0.0009813308715820312, 0.0010270476341247559, 0.0010727643966674805, 0.001118481159210205, 0.0011641979217529297, 0.0012099146842956543, 0.001255631446838379, 0.0013013482093811035, 0.0013470649719238281, 0.0013927817344665527, 0.0014384984970092773, 0.001484215259552002, 0.0015299320220947266, 0.0015756487846374512, 0.0016213655471801758, 0.0016670823097229004, 0.001712799072265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 12.0, 13.0, 20.0, 31.0, 51.0, 87.0, 120.0, 205.0, 284.0, 461.0, 766.0, 1247.0, 2154.0, 3804.0, 6874.0, 12385.0, 23831.0, 45650.0, 89813.0, 165758.0, 239203.0, 205694.0, 119685.0, 61897.0, 31526.0, 16363.0, 9000.0, 4815.0, 2716.0, 1636.0, 898.0, 618.0, 313.0, 204.0, 141.0, 88.0, 76.0, 47.0, 27.0, 8.0, 12.0, 12.0, 7.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.0396728515625, -5.860595703125, -5.6815185546875, -5.50244140625, -5.3233642578125, -5.144287109375, -4.9652099609375, -4.7861328125, -4.6070556640625, -4.427978515625, -4.2489013671875, -4.06982421875, -3.8907470703125, -3.711669921875, -3.5325927734375, -3.353515625, -3.1744384765625, -2.995361328125, -2.8162841796875, -2.63720703125, -2.4581298828125, -2.279052734375, -2.0999755859375, -1.9208984375, -1.7418212890625, -1.562744140625, -1.3836669921875, -1.20458984375, -1.0255126953125, -0.846435546875, -0.6673583984375, -0.48828125, -0.3092041015625, -0.130126953125, 0.0489501953125, 0.22802734375, 0.4071044921875, 0.586181640625, 0.7652587890625, 0.9443359375, 1.1234130859375, 1.302490234375, 1.4815673828125, 1.66064453125, 1.8397216796875, 2.018798828125, 2.1978759765625, 2.376953125, 2.5560302734375, 2.735107421875, 2.9141845703125, 3.09326171875, 3.2723388671875, 3.451416015625, 3.6304931640625, 3.8095703125, 3.9886474609375, 4.167724609375, 4.3468017578125, 4.52587890625, 4.7049560546875, 4.884033203125, 5.0631103515625, 5.2421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 6.0, 9.0, 12.0, 15.0, 18.0, 24.0, 22.0, 23.0, 30.0, 30.0, 38.0, 34.0, 39.0, 48.0, 51.0, 62.0, 57.0, 47.0, 50.0, 30.0, 57.0, 42.0, 34.0, 32.0, 24.0, 21.0, 20.0, 23.0, 12.0, 8.0, 12.0, 12.0, 9.0, 10.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.21588134765625, -3.1036376953125, -2.99139404296875, -2.879150390625, -2.76690673828125, -2.6546630859375, -2.54241943359375, -2.43017578125, -2.31793212890625, -2.2056884765625, -2.09344482421875, -1.981201171875, -1.86895751953125, -1.7567138671875, -1.64447021484375, -1.5322265625, -1.41998291015625, -1.3077392578125, -1.19549560546875, -1.083251953125, -0.97100830078125, -0.8587646484375, -0.74652099609375, -0.63427734375, -0.52203369140625, -0.4097900390625, -0.29754638671875, -0.185302734375, -0.07305908203125, 0.0391845703125, 0.15142822265625, 0.263671875, 0.37591552734375, 0.4881591796875, 0.60040283203125, 0.712646484375, 0.82489013671875, 0.9371337890625, 1.04937744140625, 1.16162109375, 1.27386474609375, 1.3861083984375, 1.49835205078125, 1.610595703125, 1.72283935546875, 1.8350830078125, 1.94732666015625, 2.0595703125, 2.17181396484375, 2.2840576171875, 2.39630126953125, 2.508544921875, 2.62078857421875, 2.7330322265625, 2.84527587890625, 2.95751953125, 3.06976318359375, 3.1820068359375, 3.29425048828125, 3.406494140625, 3.51873779296875, 3.6309814453125, 3.74322509765625, 3.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 9.0, 10.0, 19.0, 40.0, 74.0, 132.0, 177.0, 184.0, 162.0, 83.0, 46.0, 39.0, 13.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.42327117919922, -79.64752197265625, -75.87176513671875, -72.09601593017578, -68.32025909423828, -64.54450988769531, -60.76875686645508, -56.993003845214844, -53.21725082397461, -49.441497802734375, -45.66574478149414, -41.889991760253906, -38.11424255371094, -34.33848571777344, -30.56273651123047, -26.786983489990234, -23.01123046875, -19.235477447509766, -15.459725379943848, -11.68397331237793, -7.908220291137695, -4.132467269897461, -0.3567161560058594, 3.419036865234375, 7.194789886474609, 10.970542907714844, 14.746294975280762, 18.52204704284668, 22.297800064086914, 26.07355308532715, 29.84930419921875, 33.625057220458984, 37.40080261230469, 41.17655563354492, 44.952308654785156, 48.728057861328125, 52.503814697265625, 56.279563903808594, 60.05531692504883, 63.83106994628906, 67.60682678222656, 71.38257598876953, 75.15833282470703, 78.93408203125, 82.7098388671875, 86.48558807373047, 90.26133728027344, 94.03709411621094, 97.8128433227539, 101.58859252929688, 105.36434936523438, 109.14009857177734, 112.91585540771484, 116.69160461425781, 120.46736145019531, 124.24311065673828, 128.01885986328125, 131.79461669921875, 135.5703582763672, 139.3461151123047, 143.1218719482422, 146.8976287841797, 150.67337036132812, 154.44912719726562, 158.22488403320312]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 3.0, 7.0, 7.0, 7.0, 11.0, 13.0, 12.0, 8.0, 17.0, 30.0, 28.0, 22.0, 39.0, 46.0, 49.0, 48.0, 62.0, 51.0, 58.0, 48.0, 72.0, 53.0, 43.0, 38.0, 48.0, 39.0, 23.0, 16.0, 28.0, 17.0, 6.0, 7.0, 4.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.52190399169922, -38.87868118286133, -37.23545837402344, -35.59223556518555, -33.949012756347656, -32.305789947509766, -30.662567138671875, -29.019344329833984, -27.376121520996094, -25.732898712158203, -24.089675903320312, -22.446453094482422, -20.80323028564453, -19.16000747680664, -17.51678466796875, -15.873560905456543, -14.230337142944336, -12.587114334106445, -10.943891525268555, -9.300668716430664, -7.657445430755615, -6.014222145080566, -4.370999336242676, -2.727776527404785, -1.0845537185668945, 0.5586692094802856, 2.201892137527466, 3.8451151847839355, 5.488337993621826, 7.131561279296875, 8.774784088134766, 10.418006896972656, 12.061229705810547, 13.704452514648438, 15.347675323486328, 16.99089813232422, 18.63412094116211, 20.27734375, 21.92056655883789, 23.56378936767578, 25.207012176513672, 26.850234985351562, 28.493457794189453, 30.136680603027344, 31.779903411865234, 33.423126220703125, 35.066349029541016, 36.709571838378906, 38.35279846191406, 39.99602127075195, 41.639244079589844, 43.282466888427734, 44.925689697265625, 46.568912506103516, 48.212135314941406, 49.8553581237793, 51.49858093261719, 53.14180374145508, 54.78502655029297, 56.42824935913086, 58.07147216796875, 59.71469497680664, 61.35791778564453, 63.00114059448242, 64.64436340332031]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 4.0, 6.0, 10.0, 14.0, 18.0, 20.0, 31.0, 46.0, 75.0, 108.0, 142.0, 199.0, 329.0, 458.0, 800.0, 1232.0, 2023.0, 3800.0, 6735.0, 13480.0, 29224.0, 81754.0, 488442.0, 3310888.0, 166854.0, 46612.0, 19180.0, 9536.0, 4914.0, 2913.0, 1668.0, 957.0, 652.0, 382.0, 263.0, 153.0, 111.0, 84.0, 52.0, 35.0, 26.0, 12.0, 17.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.21826171875, -32.1552734375, -31.09228515625, -30.029296875, -28.96630859375, -27.9033203125, -26.84033203125, -25.77734375, -24.71435546875, -23.6513671875, -22.58837890625, -21.525390625, -20.46240234375, -19.3994140625, -18.33642578125, -17.2734375, -16.21044921875, -15.1474609375, -14.08447265625, -13.021484375, -11.95849609375, -10.8955078125, -9.83251953125, -8.76953125, -7.70654296875, -6.6435546875, -5.58056640625, -4.517578125, -3.45458984375, -2.3916015625, -1.32861328125, -0.265625, 0.79736328125, 1.8603515625, 2.92333984375, 3.986328125, 5.04931640625, 6.1123046875, 7.17529296875, 8.23828125, 9.30126953125, 10.3642578125, 11.42724609375, 12.490234375, 13.55322265625, 14.6162109375, 15.67919921875, 16.7421875, 17.80517578125, 18.8681640625, 19.93115234375, 20.994140625, 22.05712890625, 23.1201171875, 24.18310546875, 25.24609375, 26.30908203125, 27.3720703125, 28.43505859375, 29.498046875, 30.56103515625, 31.6240234375, 32.68701171875, 33.75]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 13.0, 19.0, 14.0, 28.0, 30.0, 29.0, 38.0, 47.0, 47.0, 45.0, 44.0, 54.0, 68.0, 62.0, 54.0, 52.0, 49.0, 53.0, 38.0, 33.0, 27.0, 19.0, 26.0, 20.0, 20.0, 10.0, 16.0, 6.0, 3.0, 8.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8251953125, -1.77301025390625, -1.7208251953125, -1.66864013671875, -1.616455078125, -1.56427001953125, -1.5120849609375, -1.45989990234375, -1.40771484375, -1.35552978515625, -1.3033447265625, -1.25115966796875, -1.198974609375, -1.14678955078125, -1.0946044921875, -1.04241943359375, -0.990234375, -0.93804931640625, -0.8858642578125, -0.83367919921875, -0.781494140625, -0.72930908203125, -0.6771240234375, -0.62493896484375, -0.57275390625, -0.52056884765625, -0.4683837890625, -0.41619873046875, -0.364013671875, -0.31182861328125, -0.2596435546875, -0.20745849609375, -0.1552734375, -0.10308837890625, -0.0509033203125, 0.00128173828125, 0.053466796875, 0.10565185546875, 0.1578369140625, 0.21002197265625, 0.26220703125, 0.31439208984375, 0.3665771484375, 0.41876220703125, 0.470947265625, 0.52313232421875, 0.5753173828125, 0.62750244140625, 0.6796875, 0.73187255859375, 0.7840576171875, 0.83624267578125, 0.888427734375, 0.94061279296875, 0.9927978515625, 1.04498291015625, 1.09716796875, 1.14935302734375, 1.2015380859375, 1.25372314453125, 1.305908203125, 1.35809326171875, 1.4102783203125, 1.46246337890625, 1.5146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 12.0, 22.0, 34.0, 44.0, 63.0, 139.0, 197.0, 445.0, 1306.0, 7954.0, 182478.0, 3928227.0, 67171.0, 4383.0, 892.0, 369.0, 205.0, 111.0, 84.0, 44.0, 33.0, 19.0, 11.0, 11.0, 10.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.875, -111.212890625, -107.55078125, -103.888671875, -100.2265625, -96.564453125, -92.90234375, -89.240234375, -85.578125, -81.916015625, -78.25390625, -74.591796875, -70.9296875, -67.267578125, -63.60546875, -59.943359375, -56.28125, -52.619140625, -48.95703125, -45.294921875, -41.6328125, -37.970703125, -34.30859375, -30.646484375, -26.984375, -23.322265625, -19.66015625, -15.998046875, -12.3359375, -8.673828125, -5.01171875, -1.349609375, 2.3125, 5.974609375, 9.63671875, 13.298828125, 16.9609375, 20.623046875, 24.28515625, 27.947265625, 31.609375, 35.271484375, 38.93359375, 42.595703125, 46.2578125, 49.919921875, 53.58203125, 57.244140625, 60.90625, 64.568359375, 68.23046875, 71.892578125, 75.5546875, 79.216796875, 82.87890625, 86.541015625, 90.203125, 93.865234375, 97.52734375, 101.189453125, 104.8515625, 108.513671875, 112.17578125, 115.837890625, 119.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 7.0, 11.0, 14.0, 27.0, 37.0, 43.0, 66.0, 102.0, 150.0, 266.0, 588.0, 1662.0, 514.0, 205.0, 120.0, 81.0, 51.0, 41.0, 31.0, 18.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.94140625, -6.7203369140625, -6.499267578125, -6.2781982421875, -6.05712890625, -5.8360595703125, -5.614990234375, -5.3939208984375, -5.1728515625, -4.9517822265625, -4.730712890625, -4.5096435546875, -4.28857421875, -4.0675048828125, -3.846435546875, -3.6253662109375, -3.404296875, -3.1832275390625, -2.962158203125, -2.7410888671875, -2.52001953125, -2.2989501953125, -2.077880859375, -1.8568115234375, -1.6357421875, -1.4146728515625, -1.193603515625, -0.9725341796875, -0.75146484375, -0.5303955078125, -0.309326171875, -0.0882568359375, 0.1328125, 0.3538818359375, 0.574951171875, 0.7960205078125, 1.01708984375, 1.2381591796875, 1.459228515625, 1.6802978515625, 1.9013671875, 2.1224365234375, 2.343505859375, 2.5645751953125, 2.78564453125, 3.0067138671875, 3.227783203125, 3.4488525390625, 3.669921875, 3.8909912109375, 4.112060546875, 4.3331298828125, 4.55419921875, 4.7752685546875, 4.996337890625, 5.2174072265625, 5.4384765625, 5.6595458984375, 5.880615234375, 6.1016845703125, 6.32275390625, 6.5438232421875, 6.764892578125, 6.9859619140625, 7.20703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 8.0, 19.0, 43.0, 90.0, 188.0, 234.0, 200.0, 124.0, 46.0, 22.0, 9.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.22520446777344, -51.134368896484375, -48.04352951049805, -44.952693939208984, -41.861854553222656, -38.771018981933594, -35.68018341064453, -32.5893440246582, -29.498506546020508, -26.407669067382812, -23.316831588745117, -20.225994110107422, -17.13515853881836, -14.044320106506348, -10.953483581542969, -7.862646102905273, -4.771808624267578, -1.680971384048462, 1.4098658561706543, 4.500702857971191, 7.591540336608887, 10.682377815246582, 13.773214340209961, 16.864051818847656, 19.95488929748535, 23.045726776123047, 26.136564254760742, 29.227401733398438, 32.3182373046875, 35.40907669067383, 38.49991226196289, 41.59075164794922, 44.68158721923828, 47.772422790527344, 50.86326217651367, 53.954097747802734, 57.04493713378906, 60.135772705078125, 63.22660827636719, 66.31744384765625, 69.40828704833984, 72.4991226196289, 75.58995819091797, 78.68080139160156, 81.77163696289062, 84.86247253417969, 87.95330810546875, 91.04414367675781, 94.13497924804688, 97.22581481933594, 100.316650390625, 103.4074935913086, 106.49832916259766, 109.58916473388672, 112.68000030517578, 115.77084350585938, 118.86167907714844, 121.9525146484375, 125.04335021972656, 128.13418579101562, 131.2250213623047, 134.3158721923828, 137.40670776367188, 140.49754333496094, 143.58837890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 9.0, 10.0, 17.0, 4.0, 17.0, 23.0, 22.0, 30.0, 24.0, 14.0, 26.0, 38.0, 35.0, 41.0, 44.0, 39.0, 31.0, 41.0, 47.0, 46.0, 43.0, 36.0, 50.0, 25.0, 28.0, 39.0, 27.0, 24.0, 21.0, 24.0, 11.0, 13.0, 12.0, 10.0, 14.0, 3.0, 7.0, 10.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.066146850585938, -22.335039138793945, -21.603933334350586, -20.872825622558594, -20.1417179107666, -19.41061019897461, -18.67950439453125, -17.948396682739258, -17.217288970947266, -16.486181259155273, -15.755074501037598, -15.023967742919922, -14.29286003112793, -13.561753273010254, -12.830646514892578, -12.099538803100586, -11.36843204498291, -10.637325286865234, -9.906217575073242, -9.175110816955566, -8.444003105163574, -7.712896347045898, -6.9817891120910645, -6.2506818771362305, -5.5195746421813965, -4.7884674072265625, -4.0573601722717285, -3.3262531757354736, -2.5951459407806396, -1.8640387058258057, -1.1329317092895508, -0.4018244743347168, 0.3292827606201172, 1.0603899955749512, 1.7914971113204956, 2.52260422706604, 3.253711462020874, 3.984818696975708, 4.715925693511963, 5.447032928466797, 6.178140163421631, 6.909247398376465, 7.640354633331299, 8.371461868286133, 9.102568626403809, 9.8336763381958, 10.564783096313477, 11.295890808105469, 12.026997566223145, 12.75810432434082, 13.489212036132812, 14.220318794250488, 14.95142650604248, 15.682533264160156, 16.41364097595215, 17.14474868774414, 17.8758544921875, 18.606962203979492, 19.33806800842285, 20.069175720214844, 20.800283432006836, 21.531391143798828, 22.262496948242188, 22.99360466003418, 23.724712371826172]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 17.0, 20.0, 37.0, 67.0, 104.0, 142.0, 224.0, 350.0, 594.0, 1084.0, 1725.0, 2996.0, 5154.0, 8856.0, 15782.0, 28929.0, 53930.0, 96805.0, 162865.0, 218943.0, 187057.0, 117063.0, 65204.0, 35829.0, 19462.0, 10729.0, 5910.0, 3506.0, 2036.0, 1219.0, 742.0, 445.0, 262.0, 171.0, 110.0, 74.0, 43.0, 21.0, 10.0, 11.0, 5.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.197021484375, -14.74560546875, -14.294189453125, -13.8427734375, -13.391357421875, -12.93994140625, -12.488525390625, -12.037109375, -11.585693359375, -11.13427734375, -10.682861328125, -10.2314453125, -9.780029296875, -9.32861328125, -8.877197265625, -8.42578125, -7.974365234375, -7.52294921875, -7.071533203125, -6.6201171875, -6.168701171875, -5.71728515625, -5.265869140625, -4.814453125, -4.363037109375, -3.91162109375, -3.460205078125, -3.0087890625, -2.557373046875, -2.10595703125, -1.654541015625, -1.203125, -0.751708984375, -0.30029296875, 0.151123046875, 0.6025390625, 1.053955078125, 1.50537109375, 1.956787109375, 2.408203125, 2.859619140625, 3.31103515625, 3.762451171875, 4.2138671875, 4.665283203125, 5.11669921875, 5.568115234375, 6.01953125, 6.470947265625, 6.92236328125, 7.373779296875, 7.8251953125, 8.276611328125, 8.72802734375, 9.179443359375, 9.630859375, 10.082275390625, 10.53369140625, 10.985107421875, 11.4365234375, 11.887939453125, 12.33935546875, 12.790771484375, 13.2421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 2.0, 1.0, 7.0, 7.0, 3.0, 10.0, 14.0, 9.0, 18.0, 18.0, 14.0, 24.0, 15.0, 29.0, 32.0, 30.0, 49.0, 54.0, 34.0, 41.0, 43.0, 44.0, 47.0, 42.0, 45.0, 43.0, 29.0, 35.0, 32.0, 38.0, 25.0, 20.0, 15.0, 17.0, 17.0, 17.0, 10.0, 19.0, 6.0, 15.0, 2.0, 4.0, 12.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5400390625, -1.492034912109375, -1.44403076171875, -1.396026611328125, -1.3480224609375, -1.300018310546875, -1.25201416015625, -1.204010009765625, -1.156005859375, -1.108001708984375, -1.05999755859375, -1.011993408203125, -0.9639892578125, -0.915985107421875, -0.86798095703125, -0.819976806640625, -0.77197265625, -0.723968505859375, -0.67596435546875, -0.627960205078125, -0.5799560546875, -0.531951904296875, -0.48394775390625, -0.435943603515625, -0.387939453125, -0.339935302734375, -0.29193115234375, -0.243927001953125, -0.1959228515625, -0.147918701171875, -0.09991455078125, -0.051910400390625, -0.00390625, 0.044097900390625, 0.09210205078125, 0.140106201171875, 0.1881103515625, 0.236114501953125, 0.28411865234375, 0.332122802734375, 0.380126953125, 0.428131103515625, 0.47613525390625, 0.524139404296875, 0.5721435546875, 0.620147705078125, 0.66815185546875, 0.716156005859375, 0.76416015625, 0.812164306640625, 0.86016845703125, 0.908172607421875, 0.9561767578125, 1.004180908203125, 1.05218505859375, 1.100189208984375, 1.148193359375, 1.196197509765625, 1.24420166015625, 1.292205810546875, 1.3402099609375, 1.388214111328125, 1.43621826171875, 1.484222412109375, 1.5322265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 13.0, 9.0, 25.0, 26.0, 31.0, 52.0, 78.0, 108.0, 190.0, 325.0, 514.0, 807.0, 1641.0, 3499.0, 8495.0, 24167.0, 75261.0, 232823.0, 403234.0, 199656.0, 63270.0, 20281.0, 7342.0, 3080.0, 1541.0, 810.0, 479.0, 313.0, 173.0, 107.0, 70.0, 45.0, 35.0, 17.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.6875, -30.710205078125, -29.73291015625, -28.755615234375, -27.7783203125, -26.801025390625, -25.82373046875, -24.846435546875, -23.869140625, -22.891845703125, -21.91455078125, -20.937255859375, -19.9599609375, -18.982666015625, -18.00537109375, -17.028076171875, -16.05078125, -15.073486328125, -14.09619140625, -13.118896484375, -12.1416015625, -11.164306640625, -10.18701171875, -9.209716796875, -8.232421875, -7.255126953125, -6.27783203125, -5.300537109375, -4.3232421875, -3.345947265625, -2.36865234375, -1.391357421875, -0.4140625, 0.563232421875, 1.54052734375, 2.517822265625, 3.4951171875, 4.472412109375, 5.44970703125, 6.427001953125, 7.404296875, 8.381591796875, 9.35888671875, 10.336181640625, 11.3134765625, 12.290771484375, 13.26806640625, 14.245361328125, 15.22265625, 16.199951171875, 17.17724609375, 18.154541015625, 19.1318359375, 20.109130859375, 21.08642578125, 22.063720703125, 23.041015625, 24.018310546875, 24.99560546875, 25.972900390625, 26.9501953125, 27.927490234375, 28.90478515625, 29.882080078125, 30.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 11.0, 18.0, 20.0, 27.0, 38.0, 49.0, 46.0, 59.0, 70.0, 82.0, 65.0, 85.0, 64.0, 68.0, 55.0, 55.0, 40.0, 40.0, 27.0, 22.0, 18.0, 14.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.18701171875, -17.5615234375, -16.93603515625, -16.310546875, -15.68505859375, -15.0595703125, -14.43408203125, -13.80859375, -13.18310546875, -12.5576171875, -11.93212890625, -11.306640625, -10.68115234375, -10.0556640625, -9.43017578125, -8.8046875, -8.17919921875, -7.5537109375, -6.92822265625, -6.302734375, -5.67724609375, -5.0517578125, -4.42626953125, -3.80078125, -3.17529296875, -2.5498046875, -1.92431640625, -1.298828125, -0.67333984375, -0.0478515625, 0.57763671875, 1.203125, 1.82861328125, 2.4541015625, 3.07958984375, 3.705078125, 4.33056640625, 4.9560546875, 5.58154296875, 6.20703125, 6.83251953125, 7.4580078125, 8.08349609375, 8.708984375, 9.33447265625, 9.9599609375, 10.58544921875, 11.2109375, 11.83642578125, 12.4619140625, 13.08740234375, 13.712890625, 14.33837890625, 14.9638671875, 15.58935546875, 16.21484375, 16.84033203125, 17.4658203125, 18.09130859375, 18.716796875, 19.34228515625, 19.9677734375, 20.59326171875, 21.21875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 14.0, 12.0, 20.0, 16.0, 38.0, 33.0, 83.0, 124.0, 187.0, 278.0, 491.0, 859.0, 1856.0, 3937.0, 9444.0, 25298.0, 74021.0, 218931.0, 379034.0, 217448.0, 74145.0, 25079.0, 9184.0, 3871.0, 1800.0, 949.0, 524.0, 290.0, 205.0, 119.0, 71.0, 59.0, 42.0, 35.0, 11.0, 12.0, 5.0, 6.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.12744140625, -15.5986328125, -15.06982421875, -14.541015625, -14.01220703125, -13.4833984375, -12.95458984375, -12.42578125, -11.89697265625, -11.3681640625, -10.83935546875, -10.310546875, -9.78173828125, -9.2529296875, -8.72412109375, -8.1953125, -7.66650390625, -7.1376953125, -6.60888671875, -6.080078125, -5.55126953125, -5.0224609375, -4.49365234375, -3.96484375, -3.43603515625, -2.9072265625, -2.37841796875, -1.849609375, -1.32080078125, -0.7919921875, -0.26318359375, 0.265625, 0.79443359375, 1.3232421875, 1.85205078125, 2.380859375, 2.90966796875, 3.4384765625, 3.96728515625, 4.49609375, 5.02490234375, 5.5537109375, 6.08251953125, 6.611328125, 7.14013671875, 7.6689453125, 8.19775390625, 8.7265625, 9.25537109375, 9.7841796875, 10.31298828125, 10.841796875, 11.37060546875, 11.8994140625, 12.42822265625, 12.95703125, 13.48583984375, 14.0146484375, 14.54345703125, 15.072265625, 15.60107421875, 16.1298828125, 16.65869140625, 17.1875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 8.0, 10.0, 34.0, 40.0, 39.0, 72.0, 102.0, 152.0, 120.0, 122.0, 84.0, 64.0, 43.0, 35.0, 14.0, 21.0, 11.0, 8.0, 7.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004604339599609375, -0.004487335681915283, -0.004370331764221191, -0.0042533278465271, -0.004136323928833008, -0.004019320011138916, -0.0039023160934448242, -0.0037853121757507324, -0.0036683082580566406, -0.003551304340362549, -0.003434300422668457, -0.0033172965049743652, -0.0032002925872802734, -0.0030832886695861816, -0.00296628475189209, -0.002849280834197998, -0.0027322769165039062, -0.0026152729988098145, -0.0024982690811157227, -0.002381265163421631, -0.002264261245727539, -0.0021472573280334473, -0.0020302534103393555, -0.0019132494926452637, -0.0017962455749511719, -0.00167924165725708, -0.0015622377395629883, -0.0014452338218688965, -0.0013282299041748047, -0.0012112259864807129, -0.001094222068786621, -0.0009772181510925293, -0.0008602142333984375, -0.0007432103157043457, -0.0006262063980102539, -0.0005092024803161621, -0.0003921985626220703, -0.0002751946449279785, -0.00015819072723388672, -4.118680953979492e-05, 7.581710815429688e-05, 0.00019282102584838867, 0.00030982494354248047, 0.00042682886123657227, 0.0005438327789306641, 0.0006608366966247559, 0.0007778406143188477, 0.0008948445320129395, 0.0010118484497070312, 0.001128852367401123, 0.0012458562850952148, 0.0013628602027893066, 0.0014798641204833984, 0.0015968680381774902, 0.001713871955871582, 0.0018308758735656738, 0.0019478797912597656, 0.0020648837089538574, 0.0021818876266479492, 0.002298891544342041, 0.002415895462036133, 0.0025328993797302246, 0.0026499032974243164, 0.002766907215118408, 0.0028839111328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 13.0, 18.0, 34.0, 23.0, 49.0, 72.0, 86.0, 123.0, 176.0, 247.0, 344.0, 531.0, 767.0, 1283.0, 2135.0, 3608.0, 6810.0, 13818.0, 28667.0, 63754.0, 139317.0, 249084.0, 257339.0, 149538.0, 68744.0, 30492.0, 14445.0, 7050.0, 3876.0, 2145.0, 1290.0, 828.0, 579.0, 383.0, 260.0, 194.0, 104.0, 87.0, 74.0, 36.0, 34.0, 19.0, 13.0, 17.0, 11.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.0234375, -9.6898193359375, -9.356201171875, -9.0225830078125, -8.68896484375, -8.3553466796875, -8.021728515625, -7.6881103515625, -7.3544921875, -7.0208740234375, -6.687255859375, -6.3536376953125, -6.02001953125, -5.6864013671875, -5.352783203125, -5.0191650390625, -4.685546875, -4.3519287109375, -4.018310546875, -3.6846923828125, -3.35107421875, -3.0174560546875, -2.683837890625, -2.3502197265625, -2.0166015625, -1.6829833984375, -1.349365234375, -1.0157470703125, -0.68212890625, -0.3485107421875, -0.014892578125, 0.3187255859375, 0.65234375, 0.9859619140625, 1.319580078125, 1.6531982421875, 1.98681640625, 2.3204345703125, 2.654052734375, 2.9876708984375, 3.3212890625, 3.6549072265625, 3.988525390625, 4.3221435546875, 4.65576171875, 4.9893798828125, 5.322998046875, 5.6566162109375, 5.990234375, 6.3238525390625, 6.657470703125, 6.9910888671875, 7.32470703125, 7.6583251953125, 7.991943359375, 8.3255615234375, 8.6591796875, 8.9927978515625, 9.326416015625, 9.6600341796875, 9.99365234375, 10.3272705078125, 10.660888671875, 10.9945068359375, 11.328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 4.0, 7.0, 13.0, 5.0, 14.0, 18.0, 21.0, 14.0, 24.0, 18.0, 18.0, 28.0, 46.0, 30.0, 41.0, 50.0, 45.0, 41.0, 51.0, 65.0, 38.0, 56.0, 47.0, 39.0, 45.0, 31.0, 31.0, 16.0, 21.0, 23.0, 17.0, 13.0, 8.0, 15.0, 2.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8521728515625, -4.669189453125, -4.4862060546875, -4.30322265625, -4.1202392578125, -3.937255859375, -3.7542724609375, -3.5712890625, -3.3883056640625, -3.205322265625, -3.0223388671875, -2.83935546875, -2.6563720703125, -2.473388671875, -2.2904052734375, -2.107421875, -1.9244384765625, -1.741455078125, -1.5584716796875, -1.37548828125, -1.1925048828125, -1.009521484375, -0.8265380859375, -0.6435546875, -0.4605712890625, -0.277587890625, -0.0946044921875, 0.08837890625, 0.2713623046875, 0.454345703125, 0.6373291015625, 0.8203125, 1.0032958984375, 1.186279296875, 1.3692626953125, 1.55224609375, 1.7352294921875, 1.918212890625, 2.1011962890625, 2.2841796875, 2.4671630859375, 2.650146484375, 2.8331298828125, 3.01611328125, 3.1990966796875, 3.382080078125, 3.5650634765625, 3.748046875, 3.9310302734375, 4.114013671875, 4.2969970703125, 4.47998046875, 4.6629638671875, 4.845947265625, 5.0289306640625, 5.2119140625, 5.3948974609375, 5.577880859375, 5.7608642578125, 5.94384765625, 6.1268310546875, 6.309814453125, 6.4927978515625, 6.67578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 11.0, 27.0, 69.0, 144.0, 272.0, 259.0, 138.0, 54.0, 18.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.16729736328125, -414.5718994140625, -401.97650146484375, -389.381103515625, -376.7857360839844, -364.1903381347656, -351.5949401855469, -338.9995422363281, -326.4041748046875, -313.80877685546875, -301.21337890625, -288.61798095703125, -276.0226135253906, -263.4272155761719, -250.83181762695312, -238.23641967773438, -225.64102172851562, -213.04562377929688, -200.4502410888672, -187.85484313964844, -175.25946044921875, -162.6640625, -150.06866455078125, -137.4732666015625, -124.87788391113281, -112.2824935913086, -99.68710327148438, -87.09170532226562, -74.4963150024414, -61.90092468261719, -49.30552673339844, -36.71013641357422, -24.11474609375, -11.519353866577148, 1.0760383605957031, 13.671432495117188, 26.266822814941406, 38.862213134765625, 51.457611083984375, 64.0530014038086, 76.64839172363281, 89.24378204345703, 101.83917236328125, 114.4345703125, 127.02996063232422, 139.62535095214844, 152.2207489013672, 164.81613159179688, 177.41152954101562, 190.00692749023438, 202.60231018066406, 215.1977081298828, 227.7930908203125, 240.38848876953125, 252.98388671875, 265.57928466796875, 278.1746826171875, 290.77008056640625, 303.365478515625, 315.96087646484375, 328.5562438964844, 341.1516418457031, 353.7470397949219, 366.3424377441406, 378.93780517578125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 13.0, 13.0, 16.0, 25.0, 21.0, 44.0, 45.0, 49.0, 54.0, 64.0, 58.0, 65.0, 64.0, 69.0, 66.0, 47.0, 51.0, 41.0, 44.0, 26.0, 32.0, 22.0, 20.0, 16.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.555908203125, -130.48863220214844, -126.42134857177734, -122.35407257080078, -118.28678894042969, -114.21951293945312, -110.15223693847656, -106.0849609375, -102.0176773071289, -97.95040130615234, -93.88311767578125, -89.81584167480469, -85.74856567382812, -81.68128204345703, -77.61400604248047, -73.54672241210938, -69.47944641113281, -65.41217041015625, -61.344886779785156, -57.277610778808594, -53.210330963134766, -49.14305114746094, -45.075775146484375, -41.00849533081055, -36.94121551513672, -32.87393569946289, -28.806657791137695, -24.7393798828125, -20.672100067138672, -16.604820251464844, -12.537542343139648, -8.470264434814453, -4.4029998779296875, -0.3357210159301758, 3.731557846069336, 7.798836708068848, 11.86611557006836, 15.933395385742188, 20.000673294067383, 24.067951202392578, 28.135231018066406, 32.202510833740234, 36.26979064941406, 40.337066650390625, 44.40434646606445, 48.47162628173828, 52.538902282714844, 56.60618209838867, 60.6734619140625, 64.74073791503906, 68.80802154541016, 72.87529754638672, 76.94258117675781, 81.00985717773438, 85.07713317871094, 89.1444091796875, 93.2116928100586, 97.27896881103516, 101.34625244140625, 105.41352844238281, 109.48080444335938, 113.54808807373047, 117.61536407470703, 121.68264770507812, 125.74992370605469]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 10.0, 12.0, 32.0, 47.0, 99.0, 180.0, 481.0, 1439.0, 6955.0, 76253.0, 3970709.0, 127289.0, 8815.0, 1250.0, 348.0, 139.0, 62.0, 51.0, 36.0, 25.0, 13.0, 13.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5, -131.72265625, -126.9453125, -122.16796875, -117.390625, -112.61328125, -107.8359375, -103.05859375, -98.28125, -93.50390625, -88.7265625, -83.94921875, -79.171875, -74.39453125, -69.6171875, -64.83984375, -60.0625, -55.28515625, -50.5078125, -45.73046875, -40.953125, -36.17578125, -31.3984375, -26.62109375, -21.84375, -17.06640625, -12.2890625, -7.51171875, -2.734375, 2.04296875, 6.8203125, 11.59765625, 16.375, 21.15234375, 25.9296875, 30.70703125, 35.484375, 40.26171875, 45.0390625, 49.81640625, 54.59375, 59.37109375, 64.1484375, 68.92578125, 73.703125, 78.48046875, 83.2578125, 88.03515625, 92.8125, 97.58984375, 102.3671875, 107.14453125, 111.921875, 116.69921875, 121.4765625, 126.25390625, 131.03125, 135.80859375, 140.5859375, 145.36328125, 150.140625, 154.91796875, 159.6953125, 164.47265625, 169.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 12.0, 25.0, 37.0, 40.0, 44.0, 68.0, 77.0, 87.0, 96.0, 85.0, 82.0, 63.0, 62.0, 48.0, 40.0, 33.0, 30.0, 18.0, 14.0, 8.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.67657470703125, -3.5445556640625, -3.41253662109375, -3.280517578125, -3.14849853515625, -3.0164794921875, -2.88446044921875, -2.75244140625, -2.62042236328125, -2.4884033203125, -2.35638427734375, -2.224365234375, -2.09234619140625, -1.9603271484375, -1.82830810546875, -1.6962890625, -1.56427001953125, -1.4322509765625, -1.30023193359375, -1.168212890625, -1.03619384765625, -0.9041748046875, -0.77215576171875, -0.64013671875, -0.50811767578125, -0.3760986328125, -0.24407958984375, -0.112060546875, 0.01995849609375, 0.1519775390625, 0.28399658203125, 0.416015625, 0.54803466796875, 0.6800537109375, 0.81207275390625, 0.944091796875, 1.07611083984375, 1.2081298828125, 1.34014892578125, 1.47216796875, 1.60418701171875, 1.7362060546875, 1.86822509765625, 2.000244140625, 2.13226318359375, 2.2642822265625, 2.39630126953125, 2.5283203125, 2.66033935546875, 2.7923583984375, 2.92437744140625, 3.056396484375, 3.18841552734375, 3.3204345703125, 3.45245361328125, 3.58447265625, 3.71649169921875, 3.8485107421875, 3.98052978515625, 4.112548828125, 4.24456787109375, 4.3765869140625, 4.50860595703125, 4.640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 13.0, 9.0, 11.0, 12.0, 16.0, 23.0, 20.0, 25.0, 28.0, 36.0, 49.0, 136.0, 552.0, 4381.0, 67460.0, 3744152.0, 361376.0, 14098.0, 1282.0, 222.0, 66.0, 38.0, 55.0, 31.0, 32.0, 29.0, 27.0, 26.0, 15.0, 18.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.75, -152.103515625, -147.45703125, -142.810546875, -138.1640625, -133.517578125, -128.87109375, -124.224609375, -119.578125, -114.931640625, -110.28515625, -105.638671875, -100.9921875, -96.345703125, -91.69921875, -87.052734375, -82.40625, -77.759765625, -73.11328125, -68.466796875, -63.8203125, -59.173828125, -54.52734375, -49.880859375, -45.234375, -40.587890625, -35.94140625, -31.294921875, -26.6484375, -22.001953125, -17.35546875, -12.708984375, -8.0625, -3.416015625, 1.23046875, 5.876953125, 10.5234375, 15.169921875, 19.81640625, 24.462890625, 29.109375, 33.755859375, 38.40234375, 43.048828125, 47.6953125, 52.341796875, 56.98828125, 61.634765625, 66.28125, 70.927734375, 75.57421875, 80.220703125, 84.8671875, 89.513671875, 94.16015625, 98.806640625, 103.453125, 108.099609375, 112.74609375, 117.392578125, 122.0390625, 126.685546875, 131.33203125, 135.978515625, 140.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 12.0, 23.0, 56.0, 64.0, 132.0, 212.0, 574.0, 2013.0, 523.0, 209.0, 110.0, 43.0, 44.0, 31.0, 12.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.736083984375, -9.14404296875, -8.552001953125, -7.9599609375, -7.367919921875, -6.77587890625, -6.183837890625, -5.591796875, -4.999755859375, -4.40771484375, -3.815673828125, -3.2236328125, -2.631591796875, -2.03955078125, -1.447509765625, -0.85546875, -0.263427734375, 0.32861328125, 0.920654296875, 1.5126953125, 2.104736328125, 2.69677734375, 3.288818359375, 3.880859375, 4.472900390625, 5.06494140625, 5.656982421875, 6.2490234375, 6.841064453125, 7.43310546875, 8.025146484375, 8.6171875, 9.209228515625, 9.80126953125, 10.393310546875, 10.9853515625, 11.577392578125, 12.16943359375, 12.761474609375, 13.353515625, 13.945556640625, 14.53759765625, 15.129638671875, 15.7216796875, 16.313720703125, 16.90576171875, 17.497802734375, 18.08984375, 18.681884765625, 19.27392578125, 19.865966796875, 20.4580078125, 21.050048828125, 21.64208984375, 22.234130859375, 22.826171875, 23.418212890625, 24.01025390625, 24.602294921875, 25.1943359375, 25.786376953125, 26.37841796875, 26.970458984375, 27.5625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 13.0, 20.0, 29.0, 47.0, 100.0, 117.0, 142.0, 151.0, 113.0, 76.0, 59.0, 41.0, 29.0, 15.0, 15.0, 7.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.46695709228516, -120.31245422363281, -117.15795135498047, -114.00344848632812, -110.84893798828125, -107.6944351196289, -104.53993225097656, -101.38542938232422, -98.23092651367188, -95.07642364501953, -91.92192077636719, -88.76741790771484, -85.6129150390625, -82.45840454101562, -79.30390167236328, -76.14939880371094, -72.9948959350586, -69.84039306640625, -66.6858901977539, -63.5313835144043, -60.37688064575195, -57.22237777709961, -54.06787109375, -50.913368225097656, -47.75886535644531, -44.60436248779297, -41.449859619140625, -38.295352935791016, -35.14085006713867, -31.986347198486328, -28.83184242248535, -25.677337646484375, -22.5228271484375, -19.368324279785156, -16.21381950378418, -13.05931568145752, -9.90481185913086, -6.750308036804199, -3.595804214477539, -0.4412994384765625, 2.7132034301757812, 5.867707252502441, 9.022211074829102, 12.176714897155762, 15.331218719482422, 18.485721588134766, 21.640226364135742, 24.79473114013672, 27.949234008789062, 31.103736877441406, 34.25823974609375, 37.41274642944336, 40.5672492980957, 43.72175216674805, 46.876258850097656, 50.03076171875, 53.185264587402344, 56.33976745605469, 59.49427032470703, 62.64877700805664, 65.80328369140625, 68.9577865600586, 72.11228942871094, 75.26679229736328, 78.42129516601562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 9.0, 5.0, 8.0, 9.0, 9.0, 5.0, 10.0, 15.0, 16.0, 19.0, 28.0, 19.0, 23.0, 34.0, 37.0, 44.0, 42.0, 45.0, 42.0, 47.0, 55.0, 28.0, 53.0, 51.0, 48.0, 39.0, 28.0, 39.0, 30.0, 33.0, 28.0, 20.0, 22.0, 16.0, 12.0, 9.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.714412689208984, -34.186805725097656, -32.659202575683594, -31.131595611572266, -29.603988647460938, -28.07638168334961, -26.548776626586914, -25.02117156982422, -23.49356460571289, -21.965957641601562, -20.438352584838867, -18.910747528076172, -17.383140563964844, -15.855534553527832, -14.32792854309082, -12.800322532653809, -11.272716522216797, -9.745110511779785, -8.217504501342773, -6.689898490905762, -5.16229248046875, -3.6346864700317383, -2.1070804595947266, -0.5794744491577148, 0.9481315612792969, 2.4757375717163086, 4.00334358215332, 5.530949592590332, 7.058555603027344, 8.586161613464355, 10.113767623901367, 11.641373634338379, 13.168983459472656, 14.696589469909668, 16.22419548034668, 17.751800537109375, 19.279407501220703, 20.80701446533203, 22.334619522094727, 23.862224578857422, 25.38983154296875, 26.917438507080078, 28.445043563842773, 29.97264862060547, 31.500255584716797, 33.027862548828125, 34.55546569824219, 36.083072662353516, 37.610679626464844, 39.13828659057617, 40.6658935546875, 42.19349670410156, 43.72110366821289, 45.24871063232422, 46.77631378173828, 48.30392074584961, 49.83152770996094, 51.359134674072266, 52.886741638183594, 54.414344787597656, 55.941951751708984, 57.46955871582031, 58.997161865234375, 60.5247688293457, 62.05237579345703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 7.0, 11.0, 14.0, 20.0, 21.0, 38.0, 54.0, 73.0, 133.0, 198.0, 350.0, 598.0, 1120.0, 2281.0, 6813.0, 26029.0, 115669.0, 412450.0, 358553.0, 92721.0, 21259.0, 5575.0, 2135.0, 976.0, 535.0, 354.0, 214.0, 129.0, 97.0, 40.0, 31.0, 17.0, 14.0, 9.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.59375, -36.24755859375, -34.9013671875, -33.55517578125, -32.208984375, -30.86279296875, -29.5166015625, -28.17041015625, -26.82421875, -25.47802734375, -24.1318359375, -22.78564453125, -21.439453125, -20.09326171875, -18.7470703125, -17.40087890625, -16.0546875, -14.70849609375, -13.3623046875, -12.01611328125, -10.669921875, -9.32373046875, -7.9775390625, -6.63134765625, -5.28515625, -3.93896484375, -2.5927734375, -1.24658203125, 0.099609375, 1.44580078125, 2.7919921875, 4.13818359375, 5.484375, 6.83056640625, 8.1767578125, 9.52294921875, 10.869140625, 12.21533203125, 13.5615234375, 14.90771484375, 16.25390625, 17.60009765625, 18.9462890625, 20.29248046875, 21.638671875, 22.98486328125, 24.3310546875, 25.67724609375, 27.0234375, 28.36962890625, 29.7158203125, 31.06201171875, 32.408203125, 33.75439453125, 35.1005859375, 36.44677734375, 37.79296875, 39.13916015625, 40.4853515625, 41.83154296875, 43.177734375, 44.52392578125, 45.8701171875, 47.21630859375, 48.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 13.0, 14.0, 39.0, 51.0, 38.0, 61.0, 82.0, 95.0, 102.0, 99.0, 100.0, 85.0, 71.0, 49.0, 33.0, 20.0, 20.0, 7.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.4727783203125, -4.285400390625, -4.0980224609375, -3.91064453125, -3.7232666015625, -3.535888671875, -3.3485107421875, -3.1611328125, -2.9737548828125, -2.786376953125, -2.5989990234375, -2.41162109375, -2.2242431640625, -2.036865234375, -1.8494873046875, -1.662109375, -1.4747314453125, -1.287353515625, -1.0999755859375, -0.91259765625, -0.7252197265625, -0.537841796875, -0.3504638671875, -0.1630859375, 0.0242919921875, 0.211669921875, 0.3990478515625, 0.58642578125, 0.7738037109375, 0.961181640625, 1.1485595703125, 1.3359375, 1.5233154296875, 1.710693359375, 1.8980712890625, 2.08544921875, 2.2728271484375, 2.460205078125, 2.6475830078125, 2.8349609375, 3.0223388671875, 3.209716796875, 3.3970947265625, 3.58447265625, 3.7718505859375, 3.959228515625, 4.1466064453125, 4.333984375, 4.5213623046875, 4.708740234375, 4.8961181640625, 5.08349609375, 5.2708740234375, 5.458251953125, 5.6456298828125, 5.8330078125, 6.0203857421875, 6.207763671875, 6.3951416015625, 6.58251953125, 6.7698974609375, 6.957275390625, 7.1446533203125, 7.33203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 2.0, 9.0, 3.0, 12.0, 15.0, 22.0, 29.0, 44.0, 67.0, 98.0, 139.0, 209.0, 291.0, 502.0, 790.0, 1401.0, 2626.0, 5472.0, 14019.0, 39389.0, 117435.0, 314786.0, 343478.0, 134266.0, 44846.0, 15603.0, 6251.0, 2835.0, 1519.0, 850.0, 532.0, 324.0, 220.0, 145.0, 101.0, 79.0, 42.0, 33.0, 28.0, 18.0, 5.0, 4.0, 1.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-32.21875, -31.2138671875, -30.208984375, -29.2041015625, -28.19921875, -27.1943359375, -26.189453125, -25.1845703125, -24.1796875, -23.1748046875, -22.169921875, -21.1650390625, -20.16015625, -19.1552734375, -18.150390625, -17.1455078125, -16.140625, -15.1357421875, -14.130859375, -13.1259765625, -12.12109375, -11.1162109375, -10.111328125, -9.1064453125, -8.1015625, -7.0966796875, -6.091796875, -5.0869140625, -4.08203125, -3.0771484375, -2.072265625, -1.0673828125, -0.0625, 0.9423828125, 1.947265625, 2.9521484375, 3.95703125, 4.9619140625, 5.966796875, 6.9716796875, 7.9765625, 8.9814453125, 9.986328125, 10.9912109375, 11.99609375, 13.0009765625, 14.005859375, 15.0107421875, 16.015625, 17.0205078125, 18.025390625, 19.0302734375, 20.03515625, 21.0400390625, 22.044921875, 23.0498046875, 24.0546875, 25.0595703125, 26.064453125, 27.0693359375, 28.07421875, 29.0791015625, 30.083984375, 31.0888671875, 32.09375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 9.0, 13.0, 17.0, 12.0, 24.0, 23.0, 25.0, 31.0, 40.0, 30.0, 49.0, 46.0, 54.0, 53.0, 60.0, 51.0, 60.0, 57.0, 47.0, 50.0, 45.0, 36.0, 22.0, 32.0, 13.0, 25.0, 17.0, 14.0, 9.0, 6.0, 13.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.0625, -23.43017578125, -22.7978515625, -22.16552734375, -21.533203125, -20.90087890625, -20.2685546875, -19.63623046875, -19.00390625, -18.37158203125, -17.7392578125, -17.10693359375, -16.474609375, -15.84228515625, -15.2099609375, -14.57763671875, -13.9453125, -13.31298828125, -12.6806640625, -12.04833984375, -11.416015625, -10.78369140625, -10.1513671875, -9.51904296875, -8.88671875, -8.25439453125, -7.6220703125, -6.98974609375, -6.357421875, -5.72509765625, -5.0927734375, -4.46044921875, -3.828125, -3.19580078125, -2.5634765625, -1.93115234375, -1.298828125, -0.66650390625, -0.0341796875, 0.59814453125, 1.23046875, 1.86279296875, 2.4951171875, 3.12744140625, 3.759765625, 4.39208984375, 5.0244140625, 5.65673828125, 6.2890625, 6.92138671875, 7.5537109375, 8.18603515625, 8.818359375, 9.45068359375, 10.0830078125, 10.71533203125, 11.34765625, 11.97998046875, 12.6123046875, 13.24462890625, 13.876953125, 14.50927734375, 15.1416015625, 15.77392578125, 16.40625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 9.0, 18.0, 17.0, 44.0, 64.0, 72.0, 122.0, 207.0, 321.0, 640.0, 1251.0, 2720.0, 7366.0, 23512.0, 89251.0, 322218.0, 411540.0, 137128.0, 34826.0, 10267.0, 3602.0, 1506.0, 786.0, 399.0, 217.0, 132.0, 91.0, 56.0, 36.0, 35.0, 19.0, 17.0, 13.0, 13.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.424072265625, -15.87939453125, -15.334716796875, -14.7900390625, -14.245361328125, -13.70068359375, -13.156005859375, -12.611328125, -12.066650390625, -11.52197265625, -10.977294921875, -10.4326171875, -9.887939453125, -9.34326171875, -8.798583984375, -8.25390625, -7.709228515625, -7.16455078125, -6.619873046875, -6.0751953125, -5.530517578125, -4.98583984375, -4.441162109375, -3.896484375, -3.351806640625, -2.80712890625, -2.262451171875, -1.7177734375, -1.173095703125, -0.62841796875, -0.083740234375, 0.4609375, 1.005615234375, 1.55029296875, 2.094970703125, 2.6396484375, 3.184326171875, 3.72900390625, 4.273681640625, 4.818359375, 5.363037109375, 5.90771484375, 6.452392578125, 6.9970703125, 7.541748046875, 8.08642578125, 8.631103515625, 9.17578125, 9.720458984375, 10.26513671875, 10.809814453125, 11.3544921875, 11.899169921875, 12.44384765625, 12.988525390625, 13.533203125, 14.077880859375, 14.62255859375, 15.167236328125, 15.7119140625, 16.256591796875, 16.80126953125, 17.345947265625, 17.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 8.0, 4.0, 10.0, 16.0, 18.0, 14.0, 13.0, 35.0, 33.0, 40.0, 39.0, 52.0, 46.0, 67.0, 59.0, 86.0, 78.0, 82.0, 50.0, 41.0, 39.0, 31.0, 25.0, 17.0, 10.0, 15.0, 12.0, 7.0, 11.0, 4.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0020580291748046875, -0.001995474100112915, -0.0019329190254211426, -0.0018703639507293701, -0.0018078088760375977, -0.0017452538013458252, -0.0016826987266540527, -0.0016201436519622803, -0.0015575885772705078, -0.0014950335025787354, -0.0014324784278869629, -0.0013699233531951904, -0.001307368278503418, -0.0012448132038116455, -0.001182258129119873, -0.0011197030544281006, -0.0010571479797363281, -0.0009945929050445557, -0.0009320378303527832, -0.0008694827556610107, -0.0008069276809692383, -0.0007443726062774658, -0.0006818175315856934, -0.0006192624568939209, -0.0005567073822021484, -0.000494152307510376, -0.0004315972328186035, -0.00036904215812683105, -0.0003064870834350586, -0.00024393200874328613, -0.00018137693405151367, -0.00011882185935974121, -5.626678466796875e-05, 6.288290023803711e-06, 6.884336471557617e-05, 0.00013139843940734863, 0.0001939535140991211, 0.00025650858879089355, 0.000319063663482666, 0.0003816187381744385, 0.00044417381286621094, 0.0005067288875579834, 0.0005692839622497559, 0.0006318390369415283, 0.0006943941116333008, 0.0007569491863250732, 0.0008195042610168457, 0.0008820593357086182, 0.0009446144104003906, 0.001007169485092163, 0.0010697245597839355, 0.001132279634475708, 0.0011948347091674805, 0.001257389783859253, 0.0013199448585510254, 0.0013824999332427979, 0.0014450550079345703, 0.0015076100826263428, 0.0015701651573181152, 0.0016327202320098877, 0.0016952753067016602, 0.0017578303813934326, 0.001820385456085205, 0.0018829405307769775, 0.00194549560546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 10.0, 11.0, 20.0, 24.0, 41.0, 58.0, 85.0, 136.0, 208.0, 352.0, 687.0, 1147.0, 2331.0, 5052.0, 13489.0, 47413.0, 200489.0, 464920.0, 231066.0, 54722.0, 15231.0, 5555.0, 2452.0, 1274.0, 674.0, 427.0, 239.0, 137.0, 81.0, 52.0, 44.0, 27.0, 31.0, 6.0, 9.0, 13.0, 3.0, 3.0, 5.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.515625, -15.956787109375, -15.39794921875, -14.839111328125, -14.2802734375, -13.721435546875, -13.16259765625, -12.603759765625, -12.044921875, -11.486083984375, -10.92724609375, -10.368408203125, -9.8095703125, -9.250732421875, -8.69189453125, -8.133056640625, -7.57421875, -7.015380859375, -6.45654296875, -5.897705078125, -5.3388671875, -4.780029296875, -4.22119140625, -3.662353515625, -3.103515625, -2.544677734375, -1.98583984375, -1.427001953125, -0.8681640625, -0.309326171875, 0.24951171875, 0.808349609375, 1.3671875, 1.926025390625, 2.48486328125, 3.043701171875, 3.6025390625, 4.161376953125, 4.72021484375, 5.279052734375, 5.837890625, 6.396728515625, 6.95556640625, 7.514404296875, 8.0732421875, 8.632080078125, 9.19091796875, 9.749755859375, 10.30859375, 10.867431640625, 11.42626953125, 11.985107421875, 12.5439453125, 13.102783203125, 13.66162109375, 14.220458984375, 14.779296875, 15.338134765625, 15.89697265625, 16.455810546875, 17.0146484375, 17.573486328125, 18.13232421875, 18.691162109375, 19.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 8.0, 9.0, 5.0, 9.0, 19.0, 14.0, 31.0, 48.0, 60.0, 59.0, 68.0, 59.0, 78.0, 92.0, 70.0, 71.0, 65.0, 55.0, 45.0, 35.0, 28.0, 14.0, 17.0, 12.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.786376953125, -8.48681640625, -8.187255859375, -7.8876953125, -7.588134765625, -7.28857421875, -6.989013671875, -6.689453125, -6.389892578125, -6.09033203125, -5.790771484375, -5.4912109375, -5.191650390625, -4.89208984375, -4.592529296875, -4.29296875, -3.993408203125, -3.69384765625, -3.394287109375, -3.0947265625, -2.795166015625, -2.49560546875, -2.196044921875, -1.896484375, -1.596923828125, -1.29736328125, -0.997802734375, -0.6982421875, -0.398681640625, -0.09912109375, 0.200439453125, 0.5, 0.799560546875, 1.09912109375, 1.398681640625, 1.6982421875, 1.997802734375, 2.29736328125, 2.596923828125, 2.896484375, 3.196044921875, 3.49560546875, 3.795166015625, 4.0947265625, 4.394287109375, 4.69384765625, 4.993408203125, 5.29296875, 5.592529296875, 5.89208984375, 6.191650390625, 6.4912109375, 6.790771484375, 7.09033203125, 7.389892578125, 7.689453125, 7.989013671875, 8.28857421875, 8.588134765625, 8.8876953125, 9.187255859375, 9.48681640625, 9.786376953125, 10.0859375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 10.0, 12.0, 27.0, 55.0, 107.0, 162.0, 210.0, 193.0, 111.0, 56.0, 34.0, 17.0, 5.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.885498046875, -176.25062561035156, -165.61575317382812, -154.9808807373047, -144.34600830078125, -133.7111358642578, -123.07625579833984, -112.4413833618164, -101.80651092529297, -91.17163848876953, -80.5367660522461, -69.90188598632812, -59.26701736450195, -48.632144927978516, -37.99726867675781, -27.362396240234375, -16.727523803710938, -6.092650413513184, 4.54222297668457, 15.17709732055664, 25.811969757080078, 36.446842193603516, 47.08171844482422, 57.716590881347656, 68.3514633178711, 78.98633575439453, 89.62120819091797, 100.25608825683594, 110.89096069335938, 121.52583312988281, 132.16070556640625, 142.7955780029297, 153.43045043945312, 164.06532287597656, 174.7001953125, 185.33506774902344, 195.96994018554688, 206.6048126220703, 217.23968505859375, 227.87457275390625, 238.50942993164062, 249.14430236816406, 259.7791748046875, 270.4140625, 281.0489196777344, 291.6838073730469, 302.31866455078125, 312.95355224609375, 323.58843994140625, 334.22332763671875, 344.8581848144531, 355.4930725097656, 366.1279296875, 376.7628173828125, 387.3976745605469, 398.0325622558594, 408.66741943359375, 419.30230712890625, 429.9371643066406, 440.5720520019531, 451.2069091796875, 461.841796875, 472.4766540527344, 483.1115417480469, 493.74639892578125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 17.0, 3.0, 29.0, 20.0, 29.0, 34.0, 39.0, 45.0, 44.0, 48.0, 59.0, 53.0, 49.0, 55.0, 54.0, 54.0, 41.0, 57.0, 39.0, 41.0, 33.0, 16.0, 28.0, 18.0, 15.0, 12.0, 13.0, 12.0, 2.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-119.51838684082031, -115.35527038574219, -111.19215393066406, -107.0290298461914, -102.86591339111328, -98.70279693603516, -94.5396728515625, -90.37655639648438, -86.21343994140625, -82.05032348632812, -77.88720703125, -73.72408294677734, -69.56096649169922, -65.3978500366211, -61.2347297668457, -57.07160949707031, -52.90849304199219, -48.74537658691406, -44.58225631713867, -40.41913604736328, -36.256019592285156, -32.09290313720703, -27.92978286743164, -23.766664505004883, -19.603546142578125, -15.440427780151367, -11.27730941772461, -7.114191055297852, -2.9510726928710938, 1.212045669555664, 5.375164031982422, 9.53828239440918, 13.701416015625, 17.864534378051758, 22.027652740478516, 26.190771102905273, 30.35388946533203, 34.517005920410156, 38.68012619018555, 42.84324645996094, 47.00636291503906, 51.16947937011719, 55.33259963989258, 59.49571990966797, 63.658836364746094, 67.82195281982422, 71.98507690429688, 76.148193359375, 80.31130981445312, 84.47442626953125, 88.63754272460938, 92.80066680908203, 96.96378326416016, 101.12689971923828, 105.29002380371094, 109.45314025878906, 113.61625671386719, 117.77937316894531, 121.94248962402344, 126.1056137084961, 130.26873779296875, 134.43185424804688, 138.594970703125, 142.75808715820312, 146.92120361328125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 11.0, 24.0, 23.0, 46.0, 52.0, 110.0, 203.0, 428.0, 1064.0, 3593.0, 15309.0, 137801.0, 3907742.0, 108975.0, 13411.0, 3329.0, 1153.0, 449.0, 225.0, 123.0, 74.0, 38.0, 22.0, 25.0, 9.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.0625, -81.96484375, -78.8671875, -75.76953125, -72.671875, -69.57421875, -66.4765625, -63.37890625, -60.28125, -57.18359375, -54.0859375, -50.98828125, -47.890625, -44.79296875, -41.6953125, -38.59765625, -35.5, -32.40234375, -29.3046875, -26.20703125, -23.109375, -20.01171875, -16.9140625, -13.81640625, -10.71875, -7.62109375, -4.5234375, -1.42578125, 1.671875, 4.76953125, 7.8671875, 10.96484375, 14.0625, 17.16015625, 20.2578125, 23.35546875, 26.453125, 29.55078125, 32.6484375, 35.74609375, 38.84375, 41.94140625, 45.0390625, 48.13671875, 51.234375, 54.33203125, 57.4296875, 60.52734375, 63.625, 66.72265625, 69.8203125, 72.91796875, 76.015625, 79.11328125, 82.2109375, 85.30859375, 88.40625, 91.50390625, 94.6015625, 97.69921875, 100.796875, 103.89453125, 106.9921875, 110.08984375, 113.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 5.0, 8.0, 7.0, 15.0, 17.0, 25.0, 30.0, 36.0, 51.0, 55.0, 65.0, 69.0, 72.0, 77.0, 72.0, 75.0, 65.0, 61.0, 43.0, 28.0, 22.0, 23.0, 24.0, 16.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.3175048828125, -4.166259765625, -4.0150146484375, -3.86376953125, -3.7125244140625, -3.561279296875, -3.4100341796875, -3.2587890625, -3.1075439453125, -2.956298828125, -2.8050537109375, -2.65380859375, -2.5025634765625, -2.351318359375, -2.2000732421875, -2.048828125, -1.8975830078125, -1.746337890625, -1.5950927734375, -1.44384765625, -1.2926025390625, -1.141357421875, -0.9901123046875, -0.8388671875, -0.6876220703125, -0.536376953125, -0.3851318359375, -0.23388671875, -0.0826416015625, 0.068603515625, 0.2198486328125, 0.37109375, 0.5223388671875, 0.673583984375, 0.8248291015625, 0.97607421875, 1.1273193359375, 1.278564453125, 1.4298095703125, 1.5810546875, 1.7322998046875, 1.883544921875, 2.0347900390625, 2.18603515625, 2.3372802734375, 2.488525390625, 2.6397705078125, 2.791015625, 2.9422607421875, 3.093505859375, 3.2447509765625, 3.39599609375, 3.5472412109375, 3.698486328125, 3.8497314453125, 4.0009765625, 4.1522216796875, 4.303466796875, 4.4547119140625, 4.60595703125, 4.7572021484375, 4.908447265625, 5.0596923828125, 5.2109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 14.0, 19.0, 37.0, 54.0, 103.0, 172.0, 329.0, 457.0, 883.0, 1630.0, 3178.0, 6516.0, 15089.0, 38031.0, 113521.0, 530275.0, 3046151.0, 305567.0, 80771.0, 28791.0, 11805.0, 5391.0, 2699.0, 1250.0, 661.0, 330.0, 214.0, 133.0, 74.0, 48.0, 35.0, 31.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -35.87158203125, -34.6494140625, -33.42724609375, -32.205078125, -30.98291015625, -29.7607421875, -28.53857421875, -27.31640625, -26.09423828125, -24.8720703125, -23.64990234375, -22.427734375, -21.20556640625, -19.9833984375, -18.76123046875, -17.5390625, -16.31689453125, -15.0947265625, -13.87255859375, -12.650390625, -11.42822265625, -10.2060546875, -8.98388671875, -7.76171875, -6.53955078125, -5.3173828125, -4.09521484375, -2.873046875, -1.65087890625, -0.4287109375, 0.79345703125, 2.015625, 3.23779296875, 4.4599609375, 5.68212890625, 6.904296875, 8.12646484375, 9.3486328125, 10.57080078125, 11.79296875, 13.01513671875, 14.2373046875, 15.45947265625, 16.681640625, 17.90380859375, 19.1259765625, 20.34814453125, 21.5703125, 22.79248046875, 24.0146484375, 25.23681640625, 26.458984375, 27.68115234375, 28.9033203125, 30.12548828125, 31.34765625, 32.56982421875, 33.7919921875, 35.01416015625, 36.236328125, 37.45849609375, 38.6806640625, 39.90283203125, 41.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 4.0, 6.0, 4.0, 5.0, 12.0, 8.0, 14.0, 17.0, 9.0, 26.0, 23.0, 47.0, 63.0, 70.0, 105.0, 164.0, 265.0, 536.0, 1418.0, 467.0, 234.0, 154.0, 89.0, 70.0, 61.0, 43.0, 28.0, 30.0, 26.0, 16.0, 10.0, 8.0, 13.0, 2.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.768310546875, -8.49755859375, -8.226806640625, -7.9560546875, -7.685302734375, -7.41455078125, -7.143798828125, -6.873046875, -6.602294921875, -6.33154296875, -6.060791015625, -5.7900390625, -5.519287109375, -5.24853515625, -4.977783203125, -4.70703125, -4.436279296875, -4.16552734375, -3.894775390625, -3.6240234375, -3.353271484375, -3.08251953125, -2.811767578125, -2.541015625, -2.270263671875, -1.99951171875, -1.728759765625, -1.4580078125, -1.187255859375, -0.91650390625, -0.645751953125, -0.375, -0.104248046875, 0.16650390625, 0.437255859375, 0.7080078125, 0.978759765625, 1.24951171875, 1.520263671875, 1.791015625, 2.061767578125, 2.33251953125, 2.603271484375, 2.8740234375, 3.144775390625, 3.41552734375, 3.686279296875, 3.95703125, 4.227783203125, 4.49853515625, 4.769287109375, 5.0400390625, 5.310791015625, 5.58154296875, 5.852294921875, 6.123046875, 6.393798828125, 6.66455078125, 6.935302734375, 7.2060546875, 7.476806640625, 7.74755859375, 8.018310546875, 8.2890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 22.0, 60.0, 135.0, 209.0, 264.0, 170.0, 84.0, 34.0, 16.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.54171752929688, -81.52543640136719, -76.50914764404297, -71.49285888671875, -66.47657775878906, -61.46029281616211, -56.444007873535156, -51.4277229309082, -46.41143798828125, -41.3951530456543, -36.378868103027344, -31.36258316040039, -26.346298217773438, -21.330013275146484, -16.31372833251953, -11.297443389892578, -6.281158447265625, -1.2648735046386719, 3.7514114379882812, 8.767696380615234, 13.783981323242188, 18.80026626586914, 23.816551208496094, 28.832836151123047, 33.84912109375, 38.86540603637695, 43.881690979003906, 48.89797592163086, 53.91426086425781, 58.930545806884766, 63.94683074951172, 68.96311950683594, 73.97940063476562, 78.99568176269531, 84.01197052001953, 89.02825927734375, 94.04454040527344, 99.06082153320312, 104.07711029052734, 109.09339904785156, 114.10968017578125, 119.12596130371094, 124.14225006103516, 129.15853881835938, 134.17481994628906, 139.19110107421875, 144.2073974609375, 149.2236785888672, 154.23995971679688, 159.25624084472656, 164.27252197265625, 169.288818359375, 174.3050994873047, 179.32138061523438, 184.33767700195312, 189.3539581298828, 194.3702392578125, 199.3865203857422, 204.40280151367188, 209.41909790039062, 214.4353790283203, 219.45166015625, 224.46795654296875, 229.48423767089844, 234.50051879882812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 14.0, 19.0, 20.0, 25.0, 32.0, 48.0, 60.0, 50.0, 68.0, 92.0, 65.0, 79.0, 76.0, 65.0, 59.0, 43.0, 33.0, 44.0, 27.0, 23.0, 23.0, 13.0, 9.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.23870849609375, -65.3755874633789, -63.51247024536133, -61.649349212646484, -59.786231994628906, -57.92311096191406, -56.05998992919922, -54.19687271118164, -52.33375549316406, -50.47063446044922, -48.60751724243164, -46.7443962097168, -44.88127899169922, -43.018157958984375, -41.15503692626953, -39.29191970825195, -37.42879867553711, -35.565677642822266, -33.70256042480469, -31.839439392089844, -29.976322174072266, -28.113201141357422, -26.25008201599121, -24.386962890625, -22.52384376525879, -20.660724639892578, -18.797605514526367, -16.934486389160156, -15.071366310119629, -13.208247184753418, -11.34512710571289, -9.48200798034668, -7.618892669677734, -5.755773544311523, -3.8926539421081543, -2.029534339904785, -0.16641521453857422, 1.6967039108276367, 3.559823989868164, 5.422943115234375, 7.286062240600586, 9.149181365966797, 11.012300491333008, 12.875420570373535, 14.738539695739746, 16.60165786743164, 18.464778900146484, 20.327898025512695, 22.191017150878906, 24.054136276245117, 25.917255401611328, 27.780376434326172, 29.64349365234375, 31.506614685058594, 33.36973571777344, 35.232852935791016, 37.095970153808594, 38.95909118652344, 40.822208404541016, 42.68532943725586, 44.54844665527344, 46.41156768798828, 48.274688720703125, 50.1378059387207, 52.00092697143555]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 13.0, 13.0, 15.0, 17.0, 26.0, 37.0, 38.0, 58.0, 82.0, 104.0, 135.0, 181.0, 243.0, 344.0, 564.0, 914.0, 1489.0, 2695.0, 5072.0, 10056.0, 21461.0, 46913.0, 101321.0, 199707.0, 286178.0, 190358.0, 96027.0, 43877.0, 19955.0, 9427.0, 4618.0, 2572.0, 1363.0, 829.0, 538.0, 378.0, 228.0, 170.0, 139.0, 102.0, 76.0, 46.0, 47.0, 38.0, 26.0, 13.0, 9.0, 18.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0], "bins": [-20.5, -19.868408203125, -19.23681640625, -18.605224609375, -17.9736328125, -17.342041015625, -16.71044921875, -16.078857421875, -15.447265625, -14.815673828125, -14.18408203125, -13.552490234375, -12.9208984375, -12.289306640625, -11.65771484375, -11.026123046875, -10.39453125, -9.762939453125, -9.13134765625, -8.499755859375, -7.8681640625, -7.236572265625, -6.60498046875, -5.973388671875, -5.341796875, -4.710205078125, -4.07861328125, -3.447021484375, -2.8154296875, -2.183837890625, -1.55224609375, -0.920654296875, -0.2890625, 0.342529296875, 0.97412109375, 1.605712890625, 2.2373046875, 2.868896484375, 3.50048828125, 4.132080078125, 4.763671875, 5.395263671875, 6.02685546875, 6.658447265625, 7.2900390625, 7.921630859375, 8.55322265625, 9.184814453125, 9.81640625, 10.447998046875, 11.07958984375, 11.711181640625, 12.3427734375, 12.974365234375, 13.60595703125, 14.237548828125, 14.869140625, 15.500732421875, 16.13232421875, 16.763916015625, 17.3955078125, 18.027099609375, 18.65869140625, 19.290283203125, 19.921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 15.0, 28.0, 27.0, 43.0, 42.0, 55.0, 67.0, 70.0, 74.0, 96.0, 72.0, 64.0, 70.0, 59.0, 35.0, 36.0, 38.0, 21.0, 23.0, 14.0, 18.0, 4.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -5.0279541015625, -4.864501953125, -4.7010498046875, -4.53759765625, -4.3741455078125, -4.210693359375, -4.0472412109375, -3.8837890625, -3.7203369140625, -3.556884765625, -3.3934326171875, -3.22998046875, -3.0665283203125, -2.903076171875, -2.7396240234375, -2.576171875, -2.4127197265625, -2.249267578125, -2.0858154296875, -1.92236328125, -1.7589111328125, -1.595458984375, -1.4320068359375, -1.2685546875, -1.1051025390625, -0.941650390625, -0.7781982421875, -0.61474609375, -0.4512939453125, -0.287841796875, -0.1243896484375, 0.0390625, 0.2025146484375, 0.365966796875, 0.5294189453125, 0.69287109375, 0.8563232421875, 1.019775390625, 1.1832275390625, 1.3466796875, 1.5101318359375, 1.673583984375, 1.8370361328125, 2.00048828125, 2.1639404296875, 2.327392578125, 2.4908447265625, 2.654296875, 2.8177490234375, 2.981201171875, 3.1446533203125, 3.30810546875, 3.4715576171875, 3.635009765625, 3.7984619140625, 3.9619140625, 4.1253662109375, 4.288818359375, 4.4522705078125, 4.61572265625, 4.7791748046875, 4.942626953125, 5.1060791015625, 5.26953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 8.0, 13.0, 29.0, 34.0, 57.0, 60.0, 113.0, 135.0, 197.0, 253.0, 416.0, 601.0, 896.0, 1613.0, 2972.0, 6121.0, 13124.0, 30050.0, 71331.0, 158260.0, 279541.0, 249938.0, 129447.0, 56811.0, 24427.0, 10730.0, 4966.0, 2461.0, 1387.0, 832.0, 528.0, 368.0, 244.0, 156.0, 109.0, 77.0, 65.0, 47.0, 42.0, 21.0, 17.0, 13.0, 10.0, 7.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.765625, -18.1767578125, -17.587890625, -16.9990234375, -16.41015625, -15.8212890625, -15.232421875, -14.6435546875, -14.0546875, -13.4658203125, -12.876953125, -12.2880859375, -11.69921875, -11.1103515625, -10.521484375, -9.9326171875, -9.34375, -8.7548828125, -8.166015625, -7.5771484375, -6.98828125, -6.3994140625, -5.810546875, -5.2216796875, -4.6328125, -4.0439453125, -3.455078125, -2.8662109375, -2.27734375, -1.6884765625, -1.099609375, -0.5107421875, 0.078125, 0.6669921875, 1.255859375, 1.8447265625, 2.43359375, 3.0224609375, 3.611328125, 4.2001953125, 4.7890625, 5.3779296875, 5.966796875, 6.5556640625, 7.14453125, 7.7333984375, 8.322265625, 8.9111328125, 9.5, 10.0888671875, 10.677734375, 11.2666015625, 11.85546875, 12.4443359375, 13.033203125, 13.6220703125, 14.2109375, 14.7998046875, 15.388671875, 15.9775390625, 16.56640625, 17.1552734375, 17.744140625, 18.3330078125, 18.921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 7.0, 22.0, 17.0, 24.0, 16.0, 22.0, 22.0, 35.0, 38.0, 46.0, 45.0, 45.0, 40.0, 50.0, 41.0, 49.0, 58.0, 44.0, 46.0, 29.0, 38.0, 33.0, 32.0, 30.0, 33.0, 24.0, 19.0, 14.0, 20.0, 7.0, 15.0, 4.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -14.99658203125, -14.4619140625, -13.92724609375, -13.392578125, -12.85791015625, -12.3232421875, -11.78857421875, -11.25390625, -10.71923828125, -10.1845703125, -9.64990234375, -9.115234375, -8.58056640625, -8.0458984375, -7.51123046875, -6.9765625, -6.44189453125, -5.9072265625, -5.37255859375, -4.837890625, -4.30322265625, -3.7685546875, -3.23388671875, -2.69921875, -2.16455078125, -1.6298828125, -1.09521484375, -0.560546875, -0.02587890625, 0.5087890625, 1.04345703125, 1.578125, 2.11279296875, 2.6474609375, 3.18212890625, 3.716796875, 4.25146484375, 4.7861328125, 5.32080078125, 5.85546875, 6.39013671875, 6.9248046875, 7.45947265625, 7.994140625, 8.52880859375, 9.0634765625, 9.59814453125, 10.1328125, 10.66748046875, 11.2021484375, 11.73681640625, 12.271484375, 12.80615234375, 13.3408203125, 13.87548828125, 14.41015625, 14.94482421875, 15.4794921875, 16.01416015625, 16.548828125, 17.08349609375, 17.6181640625, 18.15283203125, 18.6875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 6.0, 7.0, 15.0, 21.0, 40.0, 57.0, 67.0, 107.0, 245.0, 458.0, 1163.0, 2909.0, 9510.0, 47438.0, 350587.0, 528351.0, 85903.0, 14736.0, 4054.0, 1526.0, 629.0, 327.0, 157.0, 69.0, 48.0, 32.0, 26.0, 12.0, 7.0, 10.0, 7.0, 11.0, 6.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.482666015625, -16.90283203125, -16.322998046875, -15.7431640625, -15.163330078125, -14.58349609375, -14.003662109375, -13.423828125, -12.843994140625, -12.26416015625, -11.684326171875, -11.1044921875, -10.524658203125, -9.94482421875, -9.364990234375, -8.78515625, -8.205322265625, -7.62548828125, -7.045654296875, -6.4658203125, -5.885986328125, -5.30615234375, -4.726318359375, -4.146484375, -3.566650390625, -2.98681640625, -2.406982421875, -1.8271484375, -1.247314453125, -0.66748046875, -0.087646484375, 0.4921875, 1.072021484375, 1.65185546875, 2.231689453125, 2.8115234375, 3.391357421875, 3.97119140625, 4.551025390625, 5.130859375, 5.710693359375, 6.29052734375, 6.870361328125, 7.4501953125, 8.030029296875, 8.60986328125, 9.189697265625, 9.76953125, 10.349365234375, 10.92919921875, 11.509033203125, 12.0888671875, 12.668701171875, 13.24853515625, 13.828369140625, 14.408203125, 14.988037109375, 15.56787109375, 16.147705078125, 16.7275390625, 17.307373046875, 17.88720703125, 18.467041015625, 19.046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 11.0, 4.0, 9.0, 13.0, 13.0, 21.0, 28.0, 44.0, 49.0, 51.0, 63.0, 79.0, 107.0, 103.0, 73.0, 63.0, 54.0, 39.0, 32.0, 29.0, 18.0, 14.0, 16.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0017108917236328125, -0.0016517043113708496, -0.0015925168991088867, -0.0015333294868469238, -0.001474142074584961, -0.001414954662322998, -0.0013557672500610352, -0.0012965798377990723, -0.0012373924255371094, -0.0011782050132751465, -0.0011190176010131836, -0.0010598301887512207, -0.0010006427764892578, -0.0009414553642272949, -0.000882267951965332, -0.0008230805397033691, -0.0007638931274414062, -0.0007047057151794434, -0.0006455183029174805, -0.0005863308906555176, -0.0005271434783935547, -0.0004679560661315918, -0.0004087686538696289, -0.000349581241607666, -0.0002903938293457031, -0.00023120641708374023, -0.00017201900482177734, -0.00011283159255981445, -5.364418029785156e-05, 5.543231964111328e-06, 6.473064422607422e-05, 0.0001239180564880371, 0.00018310546875, 0.0002422928810119629, 0.0003014802932739258, 0.00036066770553588867, 0.00041985511779785156, 0.00047904253005981445, 0.0005382299423217773, 0.0005974173545837402, 0.0006566047668457031, 0.000715792179107666, 0.0007749795913696289, 0.0008341670036315918, 0.0008933544158935547, 0.0009525418281555176, 0.0010117292404174805, 0.0010709166526794434, 0.0011301040649414062, 0.0011892914772033691, 0.001248478889465332, 0.001307666301727295, 0.0013668537139892578, 0.0014260411262512207, 0.0014852285385131836, 0.0015444159507751465, 0.0016036033630371094, 0.0016627907752990723, 0.0017219781875610352, 0.001781165599822998, 0.001840353012084961, 0.0018995404243469238, 0.0019587278366088867, 0.0020179152488708496, 0.0020771026611328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 15.0, 6.0, 20.0, 21.0, 23.0, 36.0, 36.0, 64.0, 104.0, 149.0, 235.0, 427.0, 806.0, 1484.0, 2888.0, 6755.0, 18289.0, 63914.0, 266934.0, 466526.0, 158107.0, 39449.0, 12386.0, 4857.0, 2191.0, 1178.0, 635.0, 357.0, 218.0, 122.0, 102.0, 60.0, 40.0, 24.0, 13.0, 16.0, 7.0, 14.0, 6.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.1632080078125, -11.748291015625, -11.3333740234375, -10.91845703125, -10.5035400390625, -10.088623046875, -9.6737060546875, -9.2587890625, -8.8438720703125, -8.428955078125, -8.0140380859375, -7.59912109375, -7.1842041015625, -6.769287109375, -6.3543701171875, -5.939453125, -5.5245361328125, -5.109619140625, -4.6947021484375, -4.27978515625, -3.8648681640625, -3.449951171875, -3.0350341796875, -2.6201171875, -2.2052001953125, -1.790283203125, -1.3753662109375, -0.96044921875, -0.5455322265625, -0.130615234375, 0.2843017578125, 0.69921875, 1.1141357421875, 1.529052734375, 1.9439697265625, 2.35888671875, 2.7738037109375, 3.188720703125, 3.6036376953125, 4.0185546875, 4.4334716796875, 4.848388671875, 5.2633056640625, 5.67822265625, 6.0931396484375, 6.508056640625, 6.9229736328125, 7.337890625, 7.7528076171875, 8.167724609375, 8.5826416015625, 8.99755859375, 9.4124755859375, 9.827392578125, 10.2423095703125, 10.6572265625, 11.0721435546875, 11.487060546875, 11.9019775390625, 12.31689453125, 12.7318115234375, 13.146728515625, 13.5616455078125, 13.9765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 14.0, 22.0, 18.0, 33.0, 29.0, 41.0, 41.0, 65.0, 60.0, 69.0, 60.0, 78.0, 79.0, 63.0, 58.0, 41.0, 34.0, 36.0, 27.0, 19.0, 21.0, 9.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.73828125, -6.49761962890625, -6.2569580078125, -6.01629638671875, -5.775634765625, -5.53497314453125, -5.2943115234375, -5.05364990234375, -4.81298828125, -4.57232666015625, -4.3316650390625, -4.09100341796875, -3.850341796875, -3.60968017578125, -3.3690185546875, -3.12835693359375, -2.8876953125, -2.64703369140625, -2.4063720703125, -2.16571044921875, -1.925048828125, -1.68438720703125, -1.4437255859375, -1.20306396484375, -0.96240234375, -0.72174072265625, -0.4810791015625, -0.24041748046875, 0.000244140625, 0.24090576171875, 0.4815673828125, 0.72222900390625, 0.962890625, 1.20355224609375, 1.4442138671875, 1.68487548828125, 1.925537109375, 2.16619873046875, 2.4068603515625, 2.64752197265625, 2.88818359375, 3.12884521484375, 3.3695068359375, 3.61016845703125, 3.850830078125, 4.09149169921875, 4.3321533203125, 4.57281494140625, 4.8134765625, 5.05413818359375, 5.2947998046875, 5.53546142578125, 5.776123046875, 6.01678466796875, 6.2574462890625, 6.49810791015625, 6.73876953125, 6.97943115234375, 7.2200927734375, 7.46075439453125, 7.701416015625, 7.94207763671875, 8.1827392578125, 8.42340087890625, 8.6640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 12.0, 10.0, 10.0, 18.0, 43.0, 43.0, 70.0, 84.0, 84.0, 103.0, 102.0, 91.0, 92.0, 64.0, 44.0, 30.0, 29.0, 20.0, 12.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.47711181640625, -120.33177947998047, -116.18644714355469, -112.0411148071289, -107.89578247070312, -103.75045776367188, -99.6051254272461, -95.45979309082031, -91.31446075439453, -87.16912841796875, -83.02379608154297, -78.87846374511719, -74.73313903808594, -70.58779907226562, -66.44247436523438, -62.297142028808594, -58.15180969238281, -54.00647735595703, -49.86114501953125, -45.715816497802734, -41.57048416137695, -37.42515182495117, -33.279823303222656, -29.134490966796875, -24.989158630371094, -20.843826293945312, -16.698495864868164, -12.5531644821167, -8.407833099365234, -4.262500762939453, -0.11717033386230469, 4.028160095214844, 8.173477172851562, 12.318808555603027, 16.464139938354492, 20.60947036743164, 24.754802703857422, 28.900135040283203, 33.04546356201172, 37.1907958984375, 41.33612823486328, 45.48146057128906, 49.626792907714844, 53.77212142944336, 57.91745376586914, 62.06278610229492, 66.20811462402344, 70.35344696044922, 74.498779296875, 78.64411163330078, 82.78944396972656, 86.93477630615234, 91.08010864257812, 95.22543334960938, 99.37076568603516, 103.51609802246094, 107.66143035888672, 111.8067626953125, 115.95209503173828, 120.09742736816406, 124.24275207519531, 128.38809204101562, 132.53341674804688, 136.67874145507812, 140.82408142089844]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 5.0, 3.0, 14.0, 13.0, 14.0, 9.0, 16.0, 31.0, 30.0, 21.0, 34.0, 37.0, 37.0, 42.0, 48.0, 51.0, 51.0, 58.0, 42.0, 53.0, 40.0, 41.0, 45.0, 34.0, 31.0, 37.0, 28.0, 13.0, 21.0, 24.0, 15.0, 6.0, 12.0, 10.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-94.22860717773438, -90.94551849365234, -87.66242980957031, -84.37934875488281, -81.09626007080078, -77.81317138671875, -74.53008270263672, -71.24699401855469, -67.96390533447266, -64.68081665039062, -61.39773178100586, -58.11464309692383, -54.8315544128418, -51.54846954345703, -48.265380859375, -44.98229217529297, -41.6992073059082, -38.41611862182617, -35.133033752441406, -31.849945068359375, -28.566856384277344, -25.283769607543945, -22.000682830810547, -18.717594146728516, -15.434507369995117, -12.151419639587402, -8.868331909179688, -5.585245132446289, -2.302157402038574, 0.9809303283691406, 4.264017105102539, 7.54710578918457, 10.830192565917969, 14.113280296325684, 17.3963680267334, 20.679454803466797, 23.962543487548828, 27.245630264282227, 30.528717041015625, 33.811805725097656, 37.09489440917969, 40.37798309326172, 43.661067962646484, 46.944156646728516, 50.22724533081055, 53.51033020019531, 56.793418884277344, 60.076507568359375, 63.35959243774414, 66.6426773071289, 69.92576599121094, 73.20885467529297, 76.491943359375, 79.77503204345703, 83.05812072753906, 86.34120178222656, 89.6242904663086, 92.90737915039062, 96.19046783447266, 99.47355651855469, 102.75663757324219, 106.03972625732422, 109.32281494140625, 112.60590362548828, 115.88899230957031]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 11.0, 10.0, 4.0, 13.0, 19.0, 42.0, 33.0, 60.0, 99.0, 143.0, 213.0, 314.0, 585.0, 1115.0, 2302.0, 5548.0, 16638.0, 71620.0, 3475166.0, 552518.0, 46316.0, 12308.0, 4650.0, 2044.0, 1076.0, 540.0, 305.0, 190.0, 121.0, 85.0, 53.0, 30.0, 23.0, 21.0, 11.0, 11.0, 17.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.6318359375, -37.138671875, -35.6455078125, -34.15234375, -32.6591796875, -31.166015625, -29.6728515625, -28.1796875, -26.6865234375, -25.193359375, -23.7001953125, -22.20703125, -20.7138671875, -19.220703125, -17.7275390625, -16.234375, -14.7412109375, -13.248046875, -11.7548828125, -10.26171875, -8.7685546875, -7.275390625, -5.7822265625, -4.2890625, -2.7958984375, -1.302734375, 0.1904296875, 1.68359375, 3.1767578125, 4.669921875, 6.1630859375, 7.65625, 9.1494140625, 10.642578125, 12.1357421875, 13.62890625, 15.1220703125, 16.615234375, 18.1083984375, 19.6015625, 21.0947265625, 22.587890625, 24.0810546875, 25.57421875, 27.0673828125, 28.560546875, 30.0537109375, 31.546875, 33.0400390625, 34.533203125, 36.0263671875, 37.51953125, 39.0126953125, 40.505859375, 41.9990234375, 43.4921875, 44.9853515625, 46.478515625, 47.9716796875, 49.46484375, 50.9580078125, 52.451171875, 53.9443359375, 55.4375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 1.0, 9.0, 9.0, 11.0, 17.0, 20.0, 27.0, 44.0, 56.0, 60.0, 73.0, 90.0, 62.0, 70.0, 77.0, 69.0, 51.0, 45.0, 44.0, 45.0, 29.0, 15.0, 21.0, 11.0, 12.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.8773193359375, -4.711669921875, -4.5460205078125, -4.38037109375, -4.2147216796875, -4.049072265625, -3.8834228515625, -3.7177734375, -3.5521240234375, -3.386474609375, -3.2208251953125, -3.05517578125, -2.8895263671875, -2.723876953125, -2.5582275390625, -2.392578125, -2.2269287109375, -2.061279296875, -1.8956298828125, -1.72998046875, -1.5643310546875, -1.398681640625, -1.2330322265625, -1.0673828125, -0.9017333984375, -0.736083984375, -0.5704345703125, -0.40478515625, -0.2391357421875, -0.073486328125, 0.0921630859375, 0.2578125, 0.4234619140625, 0.589111328125, 0.7547607421875, 0.92041015625, 1.0860595703125, 1.251708984375, 1.4173583984375, 1.5830078125, 1.7486572265625, 1.914306640625, 2.0799560546875, 2.24560546875, 2.4112548828125, 2.576904296875, 2.7425537109375, 2.908203125, 3.0738525390625, 3.239501953125, 3.4051513671875, 3.57080078125, 3.7364501953125, 3.902099609375, 4.0677490234375, 4.2333984375, 4.3990478515625, 4.564697265625, 4.7303466796875, 4.89599609375, 5.0616455078125, 5.227294921875, 5.3929443359375, 5.55859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 0.0, 2.0, 7.0, 11.0, 23.0, 30.0, 33.0, 44.0, 61.0, 107.0, 176.0, 339.0, 506.0, 863.0, 1643.0, 3231.0, 6451.0, 14048.0, 34225.0, 100022.0, 471700.0, 3146935.0, 288502.0, 74990.0, 27364.0, 11418.0, 5328.0, 2717.0, 1436.0, 788.0, 477.0, 250.0, 162.0, 132.0, 78.0, 59.0, 42.0, 20.0, 20.0, 11.0, 7.0, 6.0, 7.0, 7.0, 4.0, 2.0, 0.0, 1.0], "bins": [-30.984375, -30.1552734375, -29.326171875, -28.4970703125, -27.66796875, -26.8388671875, -26.009765625, -25.1806640625, -24.3515625, -23.5224609375, -22.693359375, -21.8642578125, -21.03515625, -20.2060546875, -19.376953125, -18.5478515625, -17.71875, -16.8896484375, -16.060546875, -15.2314453125, -14.40234375, -13.5732421875, -12.744140625, -11.9150390625, -11.0859375, -10.2568359375, -9.427734375, -8.5986328125, -7.76953125, -6.9404296875, -6.111328125, -5.2822265625, -4.453125, -3.6240234375, -2.794921875, -1.9658203125, -1.13671875, -0.3076171875, 0.521484375, 1.3505859375, 2.1796875, 3.0087890625, 3.837890625, 4.6669921875, 5.49609375, 6.3251953125, 7.154296875, 7.9833984375, 8.8125, 9.6416015625, 10.470703125, 11.2998046875, 12.12890625, 12.9580078125, 13.787109375, 14.6162109375, 15.4453125, 16.2744140625, 17.103515625, 17.9326171875, 18.76171875, 19.5908203125, 20.419921875, 21.2490234375, 22.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 10.0, 12.0, 20.0, 24.0, 39.0, 37.0, 88.0, 112.0, 185.0, 315.0, 1382.0, 978.0, 301.0, 174.0, 110.0, 68.0, 54.0, 25.0, 20.0, 22.0, 17.0, 11.0, 11.0, 7.0, 4.0, 9.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.05596923828125, -6.8033447265625, -6.55072021484375, -6.298095703125, -6.04547119140625, -5.7928466796875, -5.54022216796875, -5.28759765625, -5.03497314453125, -4.7823486328125, -4.52972412109375, -4.277099609375, -4.02447509765625, -3.7718505859375, -3.51922607421875, -3.2666015625, -3.01397705078125, -2.7613525390625, -2.50872802734375, -2.256103515625, -2.00347900390625, -1.7508544921875, -1.49822998046875, -1.24560546875, -0.99298095703125, -0.7403564453125, -0.48773193359375, -0.235107421875, 0.01751708984375, 0.2701416015625, 0.52276611328125, 0.775390625, 1.02801513671875, 1.2806396484375, 1.53326416015625, 1.785888671875, 2.03851318359375, 2.2911376953125, 2.54376220703125, 2.79638671875, 3.04901123046875, 3.3016357421875, 3.55426025390625, 3.806884765625, 4.05950927734375, 4.3121337890625, 4.56475830078125, 4.8173828125, 5.07000732421875, 5.3226318359375, 5.57525634765625, 5.827880859375, 6.08050537109375, 6.3331298828125, 6.58575439453125, 6.83837890625, 7.09100341796875, 7.3436279296875, 7.59625244140625, 7.848876953125, 8.10150146484375, 8.3541259765625, 8.60675048828125, 8.859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 5.0, 28.0, 28.0, 56.0, 76.0, 112.0, 109.0, 115.0, 128.0, 96.0, 85.0, 59.0, 27.0, 24.0, 12.0, 10.0, 10.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.83511734008789, -33.99361038208008, -32.152103424072266, -30.31059455871582, -28.469085693359375, -26.627578735351562, -24.78607177734375, -22.944564819335938, -21.103055953979492, -19.26154899597168, -17.420040130615234, -15.578533172607422, -13.737025260925293, -11.895517349243164, -10.054010391235352, -8.212502479553223, -6.370994567871094, -4.529486656188965, -2.687979221343994, -0.8464717864990234, 0.9950361251831055, 2.8365440368652344, 4.678050994873047, 6.519558906555176, 8.361066818237305, 10.202574729919434, 12.044082641601562, 13.885589599609375, 15.727097511291504, 17.568605422973633, 19.410112380981445, 21.25162124633789, 23.09313201904297, 24.93463897705078, 26.776147842407227, 28.61765480041504, 30.459163665771484, 32.3006706237793, 34.14217758178711, 35.98368453979492, 37.8251953125, 39.66670227050781, 41.508209228515625, 43.34971618652344, 45.191226959228516, 47.03273391723633, 48.87424087524414, 50.71574783325195, 52.557254791259766, 54.39876174926758, 56.24026870727539, 58.08177947998047, 59.92328643798828, 61.764793395996094, 63.606300354003906, 65.44780731201172, 67.28931427001953, 69.13082122802734, 70.97232818603516, 72.81383514404297, 74.65534210205078, 76.49685668945312, 78.33836364746094, 80.17987060546875, 82.02137756347656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 10.0, 6.0, 14.0, 6.0, 14.0, 11.0, 15.0, 16.0, 36.0, 38.0, 43.0, 39.0, 34.0, 58.0, 38.0, 41.0, 45.0, 53.0, 53.0, 54.0, 44.0, 59.0, 38.0, 35.0, 31.0, 37.0, 20.0, 18.0, 12.0, 22.0, 19.0, 8.0, 8.0, 3.0, 10.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.840904235839844, -35.8980598449707, -34.95521926879883, -34.01237487792969, -33.06953430175781, -32.12668991088867, -31.183849334716797, -30.241004943847656, -29.29816436767578, -28.355321884155273, -27.412479400634766, -26.469636917114258, -25.52679443359375, -24.583951950073242, -23.641109466552734, -22.698265075683594, -21.755422592163086, -20.812580108642578, -19.86973762512207, -18.926895141601562, -17.984052658081055, -17.041210174560547, -16.098365783691406, -15.155524253845215, -14.212681770324707, -13.2698392868042, -12.326996803283691, -11.384153366088867, -10.44131088256836, -9.498468399047852, -8.555625915527344, -7.612783432006836, -6.669939041137695, -5.7270965576171875, -4.78425407409668, -3.8414111137390137, -2.898568630218506, -1.955726146697998, -1.012883186340332, -0.07004070281982422, 0.8728017807006836, 1.815644383430481, 2.7584869861602783, 3.7013297080993652, 4.644172191619873, 5.587014675140381, 6.529857635498047, 7.472700119018555, 8.415542602539062, 9.35838508605957, 10.301227569580078, 11.244070053100586, 12.186912536621094, 13.129755020141602, 14.072598457336426, 15.015440940856934, 15.958283424377441, 16.901126861572266, 17.843969345092773, 18.78681182861328, 19.72965431213379, 20.672496795654297, 21.615339279174805, 22.558181762695312, 23.50102424621582]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 2.0, 8.0, 8.0, 11.0, 19.0, 22.0, 30.0, 51.0, 59.0, 92.0, 135.0, 223.0, 317.0, 487.0, 751.0, 1401.0, 2471.0, 4996.0, 10674.0, 24586.0, 58850.0, 141440.0, 300591.0, 280009.0, 127075.0, 52382.0, 22069.0, 9457.0, 4658.0, 2252.0, 1287.0, 731.0, 468.0, 286.0, 205.0, 132.0, 92.0, 69.0, 47.0, 32.0, 24.0, 13.0, 15.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.180419921875, -22.45458984375, -21.728759765625, -21.0029296875, -20.277099609375, -19.55126953125, -18.825439453125, -18.099609375, -17.373779296875, -16.64794921875, -15.922119140625, -15.1962890625, -14.470458984375, -13.74462890625, -13.018798828125, -12.29296875, -11.567138671875, -10.84130859375, -10.115478515625, -9.3896484375, -8.663818359375, -7.93798828125, -7.212158203125, -6.486328125, -5.760498046875, -5.03466796875, -4.308837890625, -3.5830078125, -2.857177734375, -2.13134765625, -1.405517578125, -0.6796875, 0.046142578125, 0.77197265625, 1.497802734375, 2.2236328125, 2.949462890625, 3.67529296875, 4.401123046875, 5.126953125, 5.852783203125, 6.57861328125, 7.304443359375, 8.0302734375, 8.756103515625, 9.48193359375, 10.207763671875, 10.93359375, 11.659423828125, 12.38525390625, 13.111083984375, 13.8369140625, 14.562744140625, 15.28857421875, 16.014404296875, 16.740234375, 17.466064453125, 18.19189453125, 18.917724609375, 19.6435546875, 20.369384765625, 21.09521484375, 21.821044921875, 22.546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 12.0, 17.0, 17.0, 24.0, 40.0, 21.0, 59.0, 61.0, 70.0, 81.0, 75.0, 54.0, 68.0, 55.0, 67.0, 51.0, 44.0, 33.0, 31.0, 31.0, 14.0, 14.0, 15.0, 12.0, 10.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1328125, -4.9700927734375, -4.807373046875, -4.6446533203125, -4.48193359375, -4.3192138671875, -4.156494140625, -3.9937744140625, -3.8310546875, -3.6683349609375, -3.505615234375, -3.3428955078125, -3.18017578125, -3.0174560546875, -2.854736328125, -2.6920166015625, -2.529296875, -2.3665771484375, -2.203857421875, -2.0411376953125, -1.87841796875, -1.7156982421875, -1.552978515625, -1.3902587890625, -1.2275390625, -1.0648193359375, -0.902099609375, -0.7393798828125, -0.57666015625, -0.4139404296875, -0.251220703125, -0.0885009765625, 0.07421875, 0.2369384765625, 0.399658203125, 0.5623779296875, 0.72509765625, 0.8878173828125, 1.050537109375, 1.2132568359375, 1.3759765625, 1.5386962890625, 1.701416015625, 1.8641357421875, 2.02685546875, 2.1895751953125, 2.352294921875, 2.5150146484375, 2.677734375, 2.8404541015625, 3.003173828125, 3.1658935546875, 3.32861328125, 3.4913330078125, 3.654052734375, 3.8167724609375, 3.9794921875, 4.1422119140625, 4.304931640625, 4.4676513671875, 4.63037109375, 4.7930908203125, 4.955810546875, 5.1185302734375, 5.28125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 14.0, 22.0, 18.0, 38.0, 53.0, 72.0, 96.0, 141.0, 198.0, 318.0, 469.0, 789.0, 1337.0, 2389.0, 4856.0, 10308.0, 24429.0, 61241.0, 147093.0, 304224.0, 273295.0, 126709.0, 51149.0, 20719.0, 9015.0, 4173.0, 2103.0, 1197.0, 699.0, 442.0, 307.0, 187.0, 143.0, 95.0, 62.0, 42.0, 31.0, 20.0, 24.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.735107421875, -17.14208984375, -16.549072265625, -15.9560546875, -15.363037109375, -14.77001953125, -14.177001953125, -13.583984375, -12.990966796875, -12.39794921875, -11.804931640625, -11.2119140625, -10.618896484375, -10.02587890625, -9.432861328125, -8.83984375, -8.246826171875, -7.65380859375, -7.060791015625, -6.4677734375, -5.874755859375, -5.28173828125, -4.688720703125, -4.095703125, -3.502685546875, -2.90966796875, -2.316650390625, -1.7236328125, -1.130615234375, -0.53759765625, 0.055419921875, 0.6484375, 1.241455078125, 1.83447265625, 2.427490234375, 3.0205078125, 3.613525390625, 4.20654296875, 4.799560546875, 5.392578125, 5.985595703125, 6.57861328125, 7.171630859375, 7.7646484375, 8.357666015625, 8.95068359375, 9.543701171875, 10.13671875, 10.729736328125, 11.32275390625, 11.915771484375, 12.5087890625, 13.101806640625, 13.69482421875, 14.287841796875, 14.880859375, 15.473876953125, 16.06689453125, 16.659912109375, 17.2529296875, 17.845947265625, 18.43896484375, 19.031982421875, 19.625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 7.0, 7.0, 11.0, 9.0, 9.0, 14.0, 15.0, 19.0, 19.0, 22.0, 37.0, 32.0, 26.0, 27.0, 36.0, 29.0, 43.0, 39.0, 43.0, 50.0, 51.0, 38.0, 41.0, 45.0, 38.0, 42.0, 38.0, 28.0, 28.0, 24.0, 14.0, 22.0, 11.0, 18.0, 18.0, 8.0, 2.0, 7.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-16.421875, -15.94873046875, -15.4755859375, -15.00244140625, -14.529296875, -14.05615234375, -13.5830078125, -13.10986328125, -12.63671875, -12.16357421875, -11.6904296875, -11.21728515625, -10.744140625, -10.27099609375, -9.7978515625, -9.32470703125, -8.8515625, -8.37841796875, -7.9052734375, -7.43212890625, -6.958984375, -6.48583984375, -6.0126953125, -5.53955078125, -5.06640625, -4.59326171875, -4.1201171875, -3.64697265625, -3.173828125, -2.70068359375, -2.2275390625, -1.75439453125, -1.28125, -0.80810546875, -0.3349609375, 0.13818359375, 0.611328125, 1.08447265625, 1.5576171875, 2.03076171875, 2.50390625, 2.97705078125, 3.4501953125, 3.92333984375, 4.396484375, 4.86962890625, 5.3427734375, 5.81591796875, 6.2890625, 6.76220703125, 7.2353515625, 7.70849609375, 8.181640625, 8.65478515625, 9.1279296875, 9.60107421875, 10.07421875, 10.54736328125, 11.0205078125, 11.49365234375, 11.966796875, 12.43994140625, 12.9130859375, 13.38623046875, 13.859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 3.0, 4.0, 9.0, 17.0, 18.0, 38.0, 44.0, 58.0, 99.0, 204.0, 298.0, 467.0, 810.0, 1376.0, 3029.0, 8293.0, 31383.0, 198509.0, 629443.0, 137775.0, 24161.0, 6653.0, 2695.0, 1303.0, 767.0, 460.0, 224.0, 137.0, 86.0, 64.0, 42.0, 23.0, 26.0, 6.0, 11.0, 4.0, 3.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.15625, -15.625, -15.09375, -14.5625, -14.03125, -13.5, -12.96875, -12.4375, -11.90625, -11.375, -10.84375, -10.3125, -9.78125, -9.25, -8.71875, -8.1875, -7.65625, -7.125, -6.59375, -6.0625, -5.53125, -5.0, -4.46875, -3.9375, -3.40625, -2.875, -2.34375, -1.8125, -1.28125, -0.75, -0.21875, 0.3125, 0.84375, 1.375, 1.90625, 2.4375, 2.96875, 3.5, 4.03125, 4.5625, 5.09375, 5.625, 6.15625, 6.6875, 7.21875, 7.75, 8.28125, 8.8125, 9.34375, 9.875, 10.40625, 10.9375, 11.46875, 12.0, 12.53125, 13.0625, 13.59375, 14.125, 14.65625, 15.1875, 15.71875, 16.25, 16.78125, 17.3125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 13.0, 9.0, 14.0, 18.0, 28.0, 43.0, 68.0, 105.0, 191.0, 180.0, 117.0, 67.0, 41.0, 29.0, 21.0, 10.0, 12.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0033512115478515625, -0.003243178129196167, -0.0031351447105407715, -0.003027111291885376, -0.0029190778732299805, -0.002811044454574585, -0.0027030110359191895, -0.002594977617263794, -0.0024869441986083984, -0.002378910779953003, -0.0022708773612976074, -0.002162843942642212, -0.0020548105239868164, -0.001946777105331421, -0.0018387436866760254, -0.0017307102680206299, -0.0016226768493652344, -0.0015146434307098389, -0.0014066100120544434, -0.0012985765933990479, -0.0011905431747436523, -0.0010825097560882568, -0.0009744763374328613, -0.0008664429187774658, -0.0007584095001220703, -0.0006503760814666748, -0.0005423426628112793, -0.0004343092441558838, -0.0003262758255004883, -0.00021824240684509277, -0.00011020898818969727, -2.175569534301758e-06, 0.00010585784912109375, 0.00021389126777648926, 0.00032192468643188477, 0.0004299581050872803, 0.0005379915237426758, 0.0006460249423980713, 0.0007540583610534668, 0.0008620917797088623, 0.0009701251983642578, 0.0010781586170196533, 0.0011861920356750488, 0.0012942254543304443, 0.0014022588729858398, 0.0015102922916412354, 0.0016183257102966309, 0.0017263591289520264, 0.0018343925476074219, 0.0019424259662628174, 0.002050459384918213, 0.0021584928035736084, 0.002266526222229004, 0.0023745596408843994, 0.002482593059539795, 0.0025906264781951904, 0.002698659896850586, 0.0028066933155059814, 0.002914726734161377, 0.0030227601528167725, 0.003130793571472168, 0.0032388269901275635, 0.003346860408782959, 0.0034548938274383545, 0.00356292724609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 7.0, 10.0, 12.0, 22.0, 31.0, 44.0, 62.0, 118.0, 150.0, 282.0, 396.0, 669.0, 1213.0, 2298.0, 5171.0, 15093.0, 64844.0, 435639.0, 432483.0, 64470.0, 15022.0, 5200.0, 2343.0, 1173.0, 665.0, 399.0, 261.0, 154.0, 95.0, 54.0, 49.0, 25.0, 25.0, 15.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.703125, -15.196533203125, -14.68994140625, -14.183349609375, -13.6767578125, -13.170166015625, -12.66357421875, -12.156982421875, -11.650390625, -11.143798828125, -10.63720703125, -10.130615234375, -9.6240234375, -9.117431640625, -8.61083984375, -8.104248046875, -7.59765625, -7.091064453125, -6.58447265625, -6.077880859375, -5.5712890625, -5.064697265625, -4.55810546875, -4.051513671875, -3.544921875, -3.038330078125, -2.53173828125, -2.025146484375, -1.5185546875, -1.011962890625, -0.50537109375, 0.001220703125, 0.5078125, 1.014404296875, 1.52099609375, 2.027587890625, 2.5341796875, 3.040771484375, 3.54736328125, 4.053955078125, 4.560546875, 5.067138671875, 5.57373046875, 6.080322265625, 6.5869140625, 7.093505859375, 7.60009765625, 8.106689453125, 8.61328125, 9.119873046875, 9.62646484375, 10.133056640625, 10.6396484375, 11.146240234375, 11.65283203125, 12.159423828125, 12.666015625, 13.172607421875, 13.67919921875, 14.185791015625, 14.6923828125, 15.198974609375, 15.70556640625, 16.212158203125, 16.71875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 13.0, 23.0, 38.0, 52.0, 76.0, 101.0, 124.0, 136.0, 136.0, 85.0, 65.0, 43.0, 29.0, 20.0, 11.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -13.079345703125, -12.69775390625, -12.316162109375, -11.9345703125, -11.552978515625, -11.17138671875, -10.789794921875, -10.408203125, -10.026611328125, -9.64501953125, -9.263427734375, -8.8818359375, -8.500244140625, -8.11865234375, -7.737060546875, -7.35546875, -6.973876953125, -6.59228515625, -6.210693359375, -5.8291015625, -5.447509765625, -5.06591796875, -4.684326171875, -4.302734375, -3.921142578125, -3.53955078125, -3.157958984375, -2.7763671875, -2.394775390625, -2.01318359375, -1.631591796875, -1.25, -0.868408203125, -0.48681640625, -0.105224609375, 0.2763671875, 0.657958984375, 1.03955078125, 1.421142578125, 1.802734375, 2.184326171875, 2.56591796875, 2.947509765625, 3.3291015625, 3.710693359375, 4.09228515625, 4.473876953125, 4.85546875, 5.237060546875, 5.61865234375, 6.000244140625, 6.3818359375, 6.763427734375, 7.14501953125, 7.526611328125, 7.908203125, 8.289794921875, 8.67138671875, 9.052978515625, 9.4345703125, 9.816162109375, 10.19775390625, 10.579345703125, 10.9609375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 12.0, 11.0, 23.0, 28.0, 45.0, 66.0, 92.0, 123.0, 119.0, 131.0, 107.0, 81.0, 51.0, 42.0, 26.0, 16.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.13973999023438, -192.74169921875, -187.34364318847656, -181.9456024169922, -176.5475616455078, -171.14952087402344, -165.75146484375, -160.35342407226562, -154.95538330078125, -149.55734252929688, -144.15928649902344, -138.76124572753906, -133.3632049560547, -127.96515655517578, -122.56710815429688, -117.1690673828125, -111.7710189819336, -106.37297058105469, -100.97492980957031, -95.5768814086914, -90.17884063720703, -84.78079223632812, -79.38275146484375, -73.98470306396484, -68.58665466308594, -63.1886100769043, -57.790565490722656, -52.39251708984375, -46.994476318359375, -41.59642791748047, -36.19838333129883, -30.800338745117188, -25.402297973632812, -20.004253387451172, -14.606207847595215, -9.208162307739258, -3.810117721557617, 1.5879268646240234, 6.985973358154297, 12.384017944335938, 17.782062530517578, 23.18010711669922, 28.57815170288086, 33.9761962890625, 39.374244689941406, 44.77228546142578, 50.17033386230469, 55.56837844848633, 60.96642303466797, 66.36447143554688, 71.76251220703125, 77.16056060791016, 82.55860137939453, 87.95664978027344, 93.35469055175781, 98.75273895263672, 104.15078735351562, 109.54883575439453, 114.9468765258789, 120.34492492675781, 125.74296569824219, 131.14100646972656, 136.5390625, 141.93710327148438, 147.33514404296875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 8.0, 21.0, 7.0, 16.0, 13.0, 35.0, 33.0, 37.0, 22.0, 34.0, 38.0, 52.0, 43.0, 56.0, 53.0, 65.0, 45.0, 59.0, 42.0, 47.0, 45.0, 35.0, 23.0, 29.0, 9.0, 23.0, 13.0, 12.0, 7.0, 14.0, 8.0, 5.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.4470443725586, -98.230712890625, -95.0143814086914, -91.79804992675781, -88.58171081542969, -85.3653793334961, -82.1490478515625, -78.9327163696289, -75.71638488769531, -72.50005340576172, -69.28372192382812, -66.0673828125, -62.851051330566406, -59.63471984863281, -56.41838836669922, -53.202056884765625, -49.9857177734375, -46.769386291503906, -43.55305099487305, -40.33671951293945, -37.120384216308594, -33.904052734375, -30.687721252441406, -27.47138786315918, -24.255054473876953, -21.038721084594727, -17.8223876953125, -14.606056213378906, -11.38972282409668, -8.173389434814453, -4.957057952880859, -1.7407245635986328, 1.475616455078125, 4.691949367523193, 7.908282279968262, 11.124614715576172, 14.340948104858398, 17.557281494140625, 20.77361297607422, 23.989946365356445, 27.206279754638672, 30.4226131439209, 33.638946533203125, 36.85527801513672, 40.07160949707031, 43.28794479370117, 46.504276275634766, 49.720611572265625, 52.93694305419922, 56.15327453613281, 59.36960983276367, 62.585941314697266, 65.80227661132812, 69.01860809326172, 72.23493957519531, 75.4512710571289, 78.6676025390625, 81.8839340209961, 85.10026550292969, 88.31660461425781, 91.5329360961914, 94.749267578125, 97.9655990600586, 101.18193054199219, 104.39826965332031]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 10.0, 4.0, 10.0, 13.0, 12.0, 14.0, 18.0, 29.0, 37.0, 44.0, 63.0, 93.0, 129.0, 221.0, 299.0, 435.0, 660.0, 1148.0, 2045.0, 3834.0, 7857.0, 17940.0, 47756.0, 173206.0, 3038014.0, 733124.0, 105489.0, 33577.0, 13795.0, 6339.0, 3333.0, 1795.0, 1047.0, 666.0, 421.0, 267.0, 182.0, 130.0, 59.0, 46.0, 35.0, 23.0, 21.0, 10.0, 14.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.84375, -28.90625, -27.96875, -27.03125, -26.09375, -25.15625, -24.21875, -23.28125, -22.34375, -21.40625, -20.46875, -19.53125, -18.59375, -17.65625, -16.71875, -15.78125, -14.84375, -13.90625, -12.96875, -12.03125, -11.09375, -10.15625, -9.21875, -8.28125, -7.34375, -6.40625, -5.46875, -4.53125, -3.59375, -2.65625, -1.71875, -0.78125, 0.15625, 1.09375, 2.03125, 2.96875, 3.90625, 4.84375, 5.78125, 6.71875, 7.65625, 8.59375, 9.53125, 10.46875, 11.40625, 12.34375, 13.28125, 14.21875, 15.15625, 16.09375, 17.03125, 17.96875, 18.90625, 19.84375, 20.78125, 21.71875, 22.65625, 23.59375, 24.53125, 25.46875, 26.40625, 27.34375, 28.28125, 29.21875, 30.15625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 9.0, 10.0, 21.0, 22.0, 17.0, 47.0, 42.0, 47.0, 69.0, 76.0, 89.0, 69.0, 59.0, 71.0, 76.0, 53.0, 54.0, 32.0, 29.0, 29.0, 14.0, 19.0, 20.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5859375, -5.416748046875, -5.24755859375, -5.078369140625, -4.9091796875, -4.739990234375, -4.57080078125, -4.401611328125, -4.232421875, -4.063232421875, -3.89404296875, -3.724853515625, -3.5556640625, -3.386474609375, -3.21728515625, -3.048095703125, -2.87890625, -2.709716796875, -2.54052734375, -2.371337890625, -2.2021484375, -2.032958984375, -1.86376953125, -1.694580078125, -1.525390625, -1.356201171875, -1.18701171875, -1.017822265625, -0.8486328125, -0.679443359375, -0.51025390625, -0.341064453125, -0.171875, -0.002685546875, 0.16650390625, 0.335693359375, 0.5048828125, 0.674072265625, 0.84326171875, 1.012451171875, 1.181640625, 1.350830078125, 1.52001953125, 1.689208984375, 1.8583984375, 2.027587890625, 2.19677734375, 2.365966796875, 2.53515625, 2.704345703125, 2.87353515625, 3.042724609375, 3.2119140625, 3.381103515625, 3.55029296875, 3.719482421875, 3.888671875, 4.057861328125, 4.22705078125, 4.396240234375, 4.5654296875, 4.734619140625, 4.90380859375, 5.072998046875, 5.2421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 12.0, 16.0, 21.0, 20.0, 44.0, 40.0, 75.0, 76.0, 133.0, 170.0, 278.0, 428.0, 653.0, 1124.0, 1963.0, 3839.0, 8004.0, 21220.0, 76875.0, 461134.0, 3209685.0, 318436.0, 59836.0, 16731.0, 6383.0, 3042.0, 1562.0, 922.0, 522.0, 315.0, 224.0, 132.0, 80.0, 78.0, 53.0, 41.0, 29.0, 23.0, 8.0, 13.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-32.59375, -31.55615234375, -30.5185546875, -29.48095703125, -28.443359375, -27.40576171875, -26.3681640625, -25.33056640625, -24.29296875, -23.25537109375, -22.2177734375, -21.18017578125, -20.142578125, -19.10498046875, -18.0673828125, -17.02978515625, -15.9921875, -14.95458984375, -13.9169921875, -12.87939453125, -11.841796875, -10.80419921875, -9.7666015625, -8.72900390625, -7.69140625, -6.65380859375, -5.6162109375, -4.57861328125, -3.541015625, -2.50341796875, -1.4658203125, -0.42822265625, 0.609375, 1.64697265625, 2.6845703125, 3.72216796875, 4.759765625, 5.79736328125, 6.8349609375, 7.87255859375, 8.91015625, 9.94775390625, 10.9853515625, 12.02294921875, 13.060546875, 14.09814453125, 15.1357421875, 16.17333984375, 17.2109375, 18.24853515625, 19.2861328125, 20.32373046875, 21.361328125, 22.39892578125, 23.4365234375, 24.47412109375, 25.51171875, 26.54931640625, 27.5869140625, 28.62451171875, 29.662109375, 30.69970703125, 31.7373046875, 32.77490234375, 33.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 10.0, 1.0, 7.0, 10.0, 15.0, 13.0, 22.0, 35.0, 52.0, 75.0, 130.0, 221.0, 406.0, 1390.0, 780.0, 355.0, 199.0, 120.0, 82.0, 50.0, 27.0, 15.0, 20.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -16.0599365234375, -15.635498046875, -15.2110595703125, -14.78662109375, -14.3621826171875, -13.937744140625, -13.5133056640625, -13.0888671875, -12.6644287109375, -12.239990234375, -11.8155517578125, -11.39111328125, -10.9666748046875, -10.542236328125, -10.1177978515625, -9.693359375, -9.2689208984375, -8.844482421875, -8.4200439453125, -7.99560546875, -7.5711669921875, -7.146728515625, -6.7222900390625, -6.2978515625, -5.8734130859375, -5.448974609375, -5.0245361328125, -4.60009765625, -4.1756591796875, -3.751220703125, -3.3267822265625, -2.90234375, -2.4779052734375, -2.053466796875, -1.6290283203125, -1.20458984375, -0.7801513671875, -0.355712890625, 0.0687255859375, 0.4931640625, 0.9176025390625, 1.342041015625, 1.7664794921875, 2.19091796875, 2.6153564453125, 3.039794921875, 3.4642333984375, 3.888671875, 4.3131103515625, 4.737548828125, 5.1619873046875, 5.58642578125, 6.0108642578125, 6.435302734375, 6.8597412109375, 7.2841796875, 7.7086181640625, 8.133056640625, 8.5574951171875, 8.98193359375, 9.4063720703125, 9.830810546875, 10.2552490234375, 10.6796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 30.0, 48.0, 106.0, 160.0, 213.0, 205.0, 117.0, 63.0, 22.0, 11.0, 4.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.431396484375, -203.17308044433594, -197.9147491455078, -192.65643310546875, -187.3981170654297, -182.13978576660156, -176.8814697265625, -171.62313842773438, -166.3648223876953, -161.10650634765625, -155.84817504882812, -150.58985900878906, -145.33154296875, -140.07321166992188, -134.8148956298828, -129.55657958984375, -124.29825592041016, -119.03993225097656, -113.7816162109375, -108.5232925415039, -103.26496887207031, -98.00665283203125, -92.74832916259766, -87.49000549316406, -82.231689453125, -76.9733657836914, -71.71504974365234, -66.45672607421875, -61.198402404785156, -55.94008255004883, -50.6817626953125, -45.423439025878906, -40.16511535644531, -34.906795501708984, -29.64847183227539, -24.390151977539062, -19.1318302154541, -13.87350845336914, -8.615188598632812, -3.3568649291992188, 1.9014549255371094, 7.159776210784912, 12.418097496032715, 17.67641830444336, 22.93474006652832, 28.19306182861328, 33.45138168334961, 38.7097053527832, 43.96802520751953, 49.22634506225586, 54.48466873168945, 59.74298858642578, 65.00131225585938, 70.25962829589844, 75.51795196533203, 80.77627563476562, 86.03459167480469, 91.29291534423828, 96.55123138427734, 101.80955505371094, 107.06787872314453, 112.32620239257812, 117.58451843261719, 122.84284210205078, 128.10116577148438]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 11.0, 8.0, 22.0, 31.0, 20.0, 39.0, 33.0, 69.0, 49.0, 57.0, 79.0, 68.0, 78.0, 76.0, 55.0, 64.0, 48.0, 42.0, 33.0, 29.0, 24.0, 18.0, 12.0, 14.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.65126037597656, -60.55528259277344, -58.45930480957031, -56.36332702636719, -54.26734924316406, -52.17137145996094, -50.07539749145508, -47.97941970825195, -45.88344192504883, -43.7874641418457, -41.69148635864258, -39.59550857543945, -37.499534606933594, -35.40355682373047, -33.307579040527344, -31.21160125732422, -29.115623474121094, -27.01964569091797, -24.923667907714844, -22.82769203186035, -20.731714248657227, -18.6357364654541, -16.53976058959961, -14.443782806396484, -12.34780502319336, -10.251827239990234, -8.155850410461426, -6.059873104095459, -3.963895797729492, -1.8679180145263672, 0.2280588150024414, 2.32403564453125, 4.420013427734375, 6.515990734100342, 8.611968040466309, 10.707944869995117, 12.803922653198242, 14.899900436401367, 16.99587631225586, 19.091854095458984, 21.18783187866211, 23.283809661865234, 25.37978744506836, 27.47576332092285, 29.571741104125977, 31.6677188873291, 33.763694763183594, 35.85967254638672, 37.955650329589844, 40.05162811279297, 42.147605895996094, 44.24358367919922, 46.339561462402344, 48.43553924560547, 50.53151321411133, 52.62749099731445, 54.72346878051758, 56.8194465637207, 58.91542434692383, 61.01140213012695, 63.10737609863281, 65.20335388183594, 67.29933166503906, 69.39530944824219, 71.49128723144531]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 9.0, 20.0, 24.0, 28.0, 42.0, 71.0, 94.0, 142.0, 251.0, 344.0, 655.0, 1171.0, 2523.0, 7051.0, 24578.0, 111913.0, 524481.0, 293358.0, 59086.0, 14142.0, 4418.0, 1783.0, 953.0, 499.0, 280.0, 208.0, 120.0, 81.0, 67.0, 41.0, 30.0, 19.0, 16.0, 8.0, 6.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-48.28125, -46.8525390625, -45.423828125, -43.9951171875, -42.56640625, -41.1376953125, -39.708984375, -38.2802734375, -36.8515625, -35.4228515625, -33.994140625, -32.5654296875, -31.13671875, -29.7080078125, -28.279296875, -26.8505859375, -25.421875, -23.9931640625, -22.564453125, -21.1357421875, -19.70703125, -18.2783203125, -16.849609375, -15.4208984375, -13.9921875, -12.5634765625, -11.134765625, -9.7060546875, -8.27734375, -6.8486328125, -5.419921875, -3.9912109375, -2.5625, -1.1337890625, 0.294921875, 1.7236328125, 3.15234375, 4.5810546875, 6.009765625, 7.4384765625, 8.8671875, 10.2958984375, 11.724609375, 13.1533203125, 14.58203125, 16.0107421875, 17.439453125, 18.8681640625, 20.296875, 21.7255859375, 23.154296875, 24.5830078125, 26.01171875, 27.4404296875, 28.869140625, 30.2978515625, 31.7265625, 33.1552734375, 34.583984375, 36.0126953125, 37.44140625, 38.8701171875, 40.298828125, 41.7275390625, 43.15625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 11.0, 15.0, 26.0, 40.0, 49.0, 57.0, 100.0, 87.0, 82.0, 96.0, 92.0, 83.0, 71.0, 46.0, 42.0, 30.0, 24.0, 14.0, 15.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.47125244140625, -6.2510986328125, -6.03094482421875, -5.810791015625, -5.59063720703125, -5.3704833984375, -5.15032958984375, -4.93017578125, -4.71002197265625, -4.4898681640625, -4.26971435546875, -4.049560546875, -3.82940673828125, -3.6092529296875, -3.38909912109375, -3.1689453125, -2.94879150390625, -2.7286376953125, -2.50848388671875, -2.288330078125, -2.06817626953125, -1.8480224609375, -1.62786865234375, -1.40771484375, -1.18756103515625, -0.9674072265625, -0.74725341796875, -0.527099609375, -0.30694580078125, -0.0867919921875, 0.13336181640625, 0.353515625, 0.57366943359375, 0.7938232421875, 1.01397705078125, 1.234130859375, 1.45428466796875, 1.6744384765625, 1.89459228515625, 2.11474609375, 2.33489990234375, 2.5550537109375, 2.77520751953125, 2.995361328125, 3.21551513671875, 3.4356689453125, 3.65582275390625, 3.8759765625, 4.09613037109375, 4.3162841796875, 4.53643798828125, 4.756591796875, 4.97674560546875, 5.1968994140625, 5.41705322265625, 5.63720703125, 5.85736083984375, 6.0775146484375, 6.29766845703125, 6.517822265625, 6.73797607421875, 6.9581298828125, 7.17828369140625, 7.3984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 7.0, 11.0, 10.0, 12.0, 32.0, 38.0, 48.0, 67.0, 104.0, 185.0, 300.0, 424.0, 651.0, 1159.0, 2022.0, 3847.0, 7384.0, 15230.0, 32365.0, 69815.0, 153651.0, 302494.0, 245451.0, 113301.0, 51742.0, 23988.0, 11410.0, 5582.0, 2917.0, 1582.0, 1010.0, 598.0, 354.0, 241.0, 161.0, 124.0, 68.0, 54.0, 35.0, 35.0, 18.0, 8.0, 9.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.71875, -15.2396240234375, -14.760498046875, -14.2813720703125, -13.80224609375, -13.3231201171875, -12.843994140625, -12.3648681640625, -11.8857421875, -11.4066162109375, -10.927490234375, -10.4483642578125, -9.96923828125, -9.4901123046875, -9.010986328125, -8.5318603515625, -8.052734375, -7.5736083984375, -7.094482421875, -6.6153564453125, -6.13623046875, -5.6571044921875, -5.177978515625, -4.6988525390625, -4.2197265625, -3.7406005859375, -3.261474609375, -2.7823486328125, -2.30322265625, -1.8240966796875, -1.344970703125, -0.8658447265625, -0.38671875, 0.0924072265625, 0.571533203125, 1.0506591796875, 1.52978515625, 2.0089111328125, 2.488037109375, 2.9671630859375, 3.4462890625, 3.9254150390625, 4.404541015625, 4.8836669921875, 5.36279296875, 5.8419189453125, 6.321044921875, 6.8001708984375, 7.279296875, 7.7584228515625, 8.237548828125, 8.7166748046875, 9.19580078125, 9.6749267578125, 10.154052734375, 10.6331787109375, 11.1123046875, 11.5914306640625, 12.070556640625, 12.5496826171875, 13.02880859375, 13.5079345703125, 13.987060546875, 14.4661865234375, 14.9453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 4.0, 8.0, 6.0, 10.0, 11.0, 9.0, 12.0, 16.0, 21.0, 21.0, 22.0, 21.0, 38.0, 33.0, 34.0, 30.0, 48.0, 43.0, 43.0, 43.0, 51.0, 50.0, 37.0, 40.0, 38.0, 41.0, 41.0, 34.0, 25.0, 32.0, 20.0, 21.0, 11.0, 15.0, 13.0, 14.0, 7.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.06201171875, -13.6083984375, -13.15478515625, -12.701171875, -12.24755859375, -11.7939453125, -11.34033203125, -10.88671875, -10.43310546875, -9.9794921875, -9.52587890625, -9.072265625, -8.61865234375, -8.1650390625, -7.71142578125, -7.2578125, -6.80419921875, -6.3505859375, -5.89697265625, -5.443359375, -4.98974609375, -4.5361328125, -4.08251953125, -3.62890625, -3.17529296875, -2.7216796875, -2.26806640625, -1.814453125, -1.36083984375, -0.9072265625, -0.45361328125, 0.0, 0.45361328125, 0.9072265625, 1.36083984375, 1.814453125, 2.26806640625, 2.7216796875, 3.17529296875, 3.62890625, 4.08251953125, 4.5361328125, 4.98974609375, 5.443359375, 5.89697265625, 6.3505859375, 6.80419921875, 7.2578125, 7.71142578125, 8.1650390625, 8.61865234375, 9.072265625, 9.52587890625, 9.9794921875, 10.43310546875, 10.88671875, 11.34033203125, 11.7939453125, 12.24755859375, 12.701171875, 13.15478515625, 13.6083984375, 14.06201171875, 14.515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 14.0, 10.0, 24.0, 48.0, 65.0, 111.0, 205.0, 427.0, 892.0, 1941.0, 4491.0, 12763.0, 45392.0, 203443.0, 520645.0, 193895.0, 43523.0, 12510.0, 4543.0, 1777.0, 876.0, 400.0, 212.0, 115.0, 71.0, 51.0, 21.0, 19.0, 14.0, 14.0, 10.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.953125, -11.5477294921875, -11.142333984375, -10.7369384765625, -10.33154296875, -9.9261474609375, -9.520751953125, -9.1153564453125, -8.7099609375, -8.3045654296875, -7.899169921875, -7.4937744140625, -7.08837890625, -6.6829833984375, -6.277587890625, -5.8721923828125, -5.466796875, -5.0614013671875, -4.656005859375, -4.2506103515625, -3.84521484375, -3.4398193359375, -3.034423828125, -2.6290283203125, -2.2236328125, -1.8182373046875, -1.412841796875, -1.0074462890625, -0.60205078125, -0.1966552734375, 0.208740234375, 0.6141357421875, 1.01953125, 1.4249267578125, 1.830322265625, 2.2357177734375, 2.64111328125, 3.0465087890625, 3.451904296875, 3.8572998046875, 4.2626953125, 4.6680908203125, 5.073486328125, 5.4788818359375, 5.88427734375, 6.2896728515625, 6.695068359375, 7.1004638671875, 7.505859375, 7.9112548828125, 8.316650390625, 8.7220458984375, 9.12744140625, 9.5328369140625, 9.938232421875, 10.3436279296875, 10.7490234375, 11.1544189453125, 11.559814453125, 11.9652099609375, 12.37060546875, 12.7760009765625, 13.181396484375, 13.5867919921875, 13.9921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 15.0, 18.0, 26.0, 35.0, 36.0, 72.0, 127.0, 211.0, 166.0, 95.0, 55.0, 33.0, 29.0, 15.0, 16.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002529144287109375, -0.002443850040435791, -0.002358555793762207, -0.002273261547088623, -0.002187967300415039, -0.002102673053741455, -0.002017378807067871, -0.0019320845603942871, -0.0018467903137207031, -0.0017614960670471191, -0.0016762018203735352, -0.0015909075736999512, -0.0015056133270263672, -0.0014203190803527832, -0.0013350248336791992, -0.0012497305870056152, -0.0011644363403320312, -0.0010791420936584473, -0.0009938478469848633, -0.0009085536003112793, -0.0008232593536376953, -0.0007379651069641113, -0.0006526708602905273, -0.0005673766136169434, -0.0004820823669433594, -0.0003967881202697754, -0.0003114938735961914, -0.00022619962692260742, -0.00014090538024902344, -5.561113357543945e-05, 2.968311309814453e-05, 0.00011497735977172852, 0.0002002716064453125, 0.0002855658531188965, 0.00037086009979248047, 0.00045615434646606445, 0.0005414485931396484, 0.0006267428398132324, 0.0007120370864868164, 0.0007973313331604004, 0.0008826255798339844, 0.0009679198265075684, 0.0010532140731811523, 0.0011385083198547363, 0.0012238025665283203, 0.0013090968132019043, 0.0013943910598754883, 0.0014796853065490723, 0.0015649795532226562, 0.0016502737998962402, 0.0017355680465698242, 0.0018208622932434082, 0.0019061565399169922, 0.001991450786590576, 0.00207674503326416, 0.002162039279937744, 0.002247333526611328, 0.002332627773284912, 0.002417922019958496, 0.00250321626663208, 0.002588510513305664, 0.002673804759979248, 0.002759099006652832, 0.002844393253326416, 0.0029296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 6.0, 9.0, 10.0, 17.0, 13.0, 20.0, 46.0, 53.0, 91.0, 145.0, 201.0, 393.0, 619.0, 1229.0, 2293.0, 4611.0, 10630.0, 29044.0, 97214.0, 341769.0, 385209.0, 118163.0, 33976.0, 12108.0, 5159.0, 2480.0, 1212.0, 701.0, 438.0, 249.0, 152.0, 88.0, 78.0, 48.0, 15.0, 16.0, 14.0, 11.0, 7.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7734375, -10.4375, -10.1015625, -9.765625, -9.4296875, -9.09375, -8.7578125, -8.421875, -8.0859375, -7.75, -7.4140625, -7.078125, -6.7421875, -6.40625, -6.0703125, -5.734375, -5.3984375, -5.0625, -4.7265625, -4.390625, -4.0546875, -3.71875, -3.3828125, -3.046875, -2.7109375, -2.375, -2.0390625, -1.703125, -1.3671875, -1.03125, -0.6953125, -0.359375, -0.0234375, 0.3125, 0.6484375, 0.984375, 1.3203125, 1.65625, 1.9921875, 2.328125, 2.6640625, 3.0, 3.3359375, 3.671875, 4.0078125, 4.34375, 4.6796875, 5.015625, 5.3515625, 5.6875, 6.0234375, 6.359375, 6.6953125, 7.03125, 7.3671875, 7.703125, 8.0390625, 8.375, 8.7109375, 9.046875, 9.3828125, 9.71875, 10.0546875, 10.390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 20.0, 25.0, 18.0, 38.0, 33.0, 63.0, 82.0, 84.0, 90.0, 113.0, 92.0, 81.0, 59.0, 41.0, 27.0, 21.0, 23.0, 17.0, 10.0, 12.0, 3.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.4921875, -11.20684814453125, -10.9215087890625, -10.63616943359375, -10.350830078125, -10.06549072265625, -9.7801513671875, -9.49481201171875, -9.20947265625, -8.92413330078125, -8.6387939453125, -8.35345458984375, -8.068115234375, -7.78277587890625, -7.4974365234375, -7.21209716796875, -6.9267578125, -6.64141845703125, -6.3560791015625, -6.07073974609375, -5.785400390625, -5.50006103515625, -5.2147216796875, -4.92938232421875, -4.64404296875, -4.35870361328125, -4.0733642578125, -3.78802490234375, -3.502685546875, -3.21734619140625, -2.9320068359375, -2.64666748046875, -2.361328125, -2.07598876953125, -1.7906494140625, -1.50531005859375, -1.219970703125, -0.93463134765625, -0.6492919921875, -0.36395263671875, -0.07861328125, 0.20672607421875, 0.4920654296875, 0.77740478515625, 1.062744140625, 1.34808349609375, 1.6334228515625, 1.91876220703125, 2.2041015625, 2.48944091796875, 2.7747802734375, 3.06011962890625, 3.345458984375, 3.63079833984375, 3.9161376953125, 4.20147705078125, 4.48681640625, 4.77215576171875, 5.0574951171875, 5.34283447265625, 5.628173828125, 5.91351318359375, 6.1988525390625, 6.48419189453125, 6.76953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 3.0, 10.0, 13.0, 22.0, 31.0, 34.0, 61.0, 72.0, 87.0, 118.0, 129.0, 102.0, 93.0, 64.0, 63.0, 19.0, 31.0, 20.0, 16.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-170.14627075195312, -165.8067169189453, -161.46717834472656, -157.12762451171875, -152.78807067871094, -148.4485321044922, -144.10897827148438, -139.76942443847656, -135.4298858642578, -131.09033203125, -126.75078582763672, -122.41123962402344, -118.07169342041016, -113.73214721679688, -109.39259338378906, -105.05304718017578, -100.71349334716797, -96.37394714355469, -92.03439331054688, -87.6948471069336, -83.35530090332031, -79.0157470703125, -74.67620086669922, -70.33665466308594, -65.99710083007812, -61.65755081176758, -57.3180046081543, -52.97845458984375, -48.63890838623047, -44.29935836791992, -39.959808349609375, -35.620262145996094, -31.280723571777344, -26.94117546081543, -22.601627349853516, -18.26207733154297, -13.922529220581055, -9.58298110961914, -5.243431091308594, -0.9038829803466797, 3.4356651306152344, 7.775213718414307, 12.114762306213379, 16.45431137084961, 20.793859481811523, 25.133407592773438, 29.472957611083984, 33.81250762939453, 38.15205383300781, 42.49160385131836, 46.83115005493164, 51.17070007324219, 55.51024627685547, 59.849796295166016, 64.18934631347656, 68.52889251708984, 72.86843872070312, 77.2079849243164, 81.54753875732422, 85.8870849609375, 90.22663116455078, 94.56617736816406, 98.90573120117188, 103.24527740478516, 107.58483123779297]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 8.0, 8.0, 19.0, 21.0, 26.0, 25.0, 37.0, 28.0, 45.0, 51.0, 52.0, 54.0, 48.0, 64.0, 45.0, 50.0, 55.0, 34.0, 43.0, 48.0, 35.0, 29.0, 17.0, 26.0, 24.0, 17.0, 19.0, 14.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.37962341308594, -102.38147735595703, -99.3833236694336, -96.38517761230469, -93.38702392578125, -90.38887786865234, -87.39073181152344, -84.392578125, -81.39442443847656, -78.39627838134766, -75.39812469482422, -72.39997863769531, -69.40182495117188, -66.40367889404297, -63.4055290222168, -60.407379150390625, -57.40923309326172, -54.41108322143555, -51.412933349609375, -48.41478729248047, -45.41663360595703, -42.418487548828125, -39.42033767700195, -36.42218780517578, -33.42403793334961, -30.425888061523438, -27.427738189697266, -24.429590225219727, -21.431440353393555, -18.433290481567383, -15.435142517089844, -12.436992645263672, -9.438850402832031, -6.440701007843018, -3.442551612854004, -0.44440269470214844, 2.5537471771240234, 5.551897048950195, 8.550045013427734, 11.548194885253906, 14.546344757080078, 17.54449462890625, 20.542644500732422, 23.54079246520996, 26.538942337036133, 29.537092208862305, 32.535240173339844, 35.533390045166016, 38.53153991699219, 41.52968978881836, 44.52783966064453, 47.52598571777344, 50.524139404296875, 53.52228546142578, 56.52043533325195, 59.518585205078125, 62.5167350769043, 65.51488494873047, 68.51303100585938, 71.51118469238281, 74.50933074951172, 77.50748443603516, 80.50563049316406, 83.5037841796875, 86.5019302368164]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 6.0, 5.0, 9.0, 14.0, 12.0, 27.0, 21.0, 36.0, 58.0, 74.0, 143.0, 240.0, 483.0, 1014.0, 2345.0, 7194.0, 38033.0, 3350046.0, 754917.0, 29646.0, 6160.0, 2021.0, 892.0, 412.0, 198.0, 109.0, 62.0, 38.0, 19.0, 13.0, 15.0, 7.0, 3.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.8125, -80.685546875, -78.55859375, -76.431640625, -74.3046875, -72.177734375, -70.05078125, -67.923828125, -65.796875, -63.669921875, -61.54296875, -59.416015625, -57.2890625, -55.162109375, -53.03515625, -50.908203125, -48.78125, -46.654296875, -44.52734375, -42.400390625, -40.2734375, -38.146484375, -36.01953125, -33.892578125, -31.765625, -29.638671875, -27.51171875, -25.384765625, -23.2578125, -21.130859375, -19.00390625, -16.876953125, -14.75, -12.623046875, -10.49609375, -8.369140625, -6.2421875, -4.115234375, -1.98828125, 0.138671875, 2.265625, 4.392578125, 6.51953125, 8.646484375, 10.7734375, 12.900390625, 15.02734375, 17.154296875, 19.28125, 21.408203125, 23.53515625, 25.662109375, 27.7890625, 29.916015625, 32.04296875, 34.169921875, 36.296875, 38.423828125, 40.55078125, 42.677734375, 44.8046875, 46.931640625, 49.05859375, 51.185546875, 53.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 21.0, 30.0, 39.0, 56.0, 59.0, 72.0, 86.0, 96.0, 82.0, 74.0, 82.0, 63.0, 60.0, 48.0, 36.0, 28.0, 18.0, 13.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.156982421875, -5.93896484375, -5.720947265625, -5.5029296875, -5.284912109375, -5.06689453125, -4.848876953125, -4.630859375, -4.412841796875, -4.19482421875, -3.976806640625, -3.7587890625, -3.540771484375, -3.32275390625, -3.104736328125, -2.88671875, -2.668701171875, -2.45068359375, -2.232666015625, -2.0146484375, -1.796630859375, -1.57861328125, -1.360595703125, -1.142578125, -0.924560546875, -0.70654296875, -0.488525390625, -0.2705078125, -0.052490234375, 0.16552734375, 0.383544921875, 0.6015625, 0.819580078125, 1.03759765625, 1.255615234375, 1.4736328125, 1.691650390625, 1.90966796875, 2.127685546875, 2.345703125, 2.563720703125, 2.78173828125, 2.999755859375, 3.2177734375, 3.435791015625, 3.65380859375, 3.871826171875, 4.08984375, 4.307861328125, 4.52587890625, 4.743896484375, 4.9619140625, 5.179931640625, 5.39794921875, 5.615966796875, 5.833984375, 6.052001953125, 6.27001953125, 6.488037109375, 6.7060546875, 6.924072265625, 7.14208984375, 7.360107421875, 7.578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 6.0, 7.0, 11.0, 8.0, 12.0, 14.0, 27.0, 31.0, 39.0, 54.0, 68.0, 117.0, 197.0, 347.0, 682.0, 1475.0, 3465.0, 10260.0, 37203.0, 190282.0, 3229945.0, 610808.0, 79842.0, 19075.0, 5847.0, 2347.0, 966.0, 443.0, 273.0, 144.0, 75.0, 47.0, 45.0, 21.0, 18.0, 19.0, 10.0, 11.0, 5.0, 11.0, 9.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.871337890625, -31.86767578125, -30.864013671875, -29.8603515625, -28.856689453125, -27.85302734375, -26.849365234375, -25.845703125, -24.842041015625, -23.83837890625, -22.834716796875, -21.8310546875, -20.827392578125, -19.82373046875, -18.820068359375, -17.81640625, -16.812744140625, -15.80908203125, -14.805419921875, -13.8017578125, -12.798095703125, -11.79443359375, -10.790771484375, -9.787109375, -8.783447265625, -7.77978515625, -6.776123046875, -5.7724609375, -4.768798828125, -3.76513671875, -2.761474609375, -1.7578125, -0.754150390625, 0.24951171875, 1.253173828125, 2.2568359375, 3.260498046875, 4.26416015625, 5.267822265625, 6.271484375, 7.275146484375, 8.27880859375, 9.282470703125, 10.2861328125, 11.289794921875, 12.29345703125, 13.297119140625, 14.30078125, 15.304443359375, 16.30810546875, 17.311767578125, 18.3154296875, 19.319091796875, 20.32275390625, 21.326416015625, 22.330078125, 23.333740234375, 24.33740234375, 25.341064453125, 26.3447265625, 27.348388671875, 28.35205078125, 29.355712890625, 30.359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 12.0, 12.0, 22.0, 29.0, 45.0, 58.0, 108.0, 154.0, 342.0, 1020.0, 1357.0, 392.0, 191.0, 125.0, 62.0, 47.0, 28.0, 17.0, 14.0, 8.0, 6.0, 3.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.4140625, -13.0616455078125, -12.709228515625, -12.3568115234375, -12.00439453125, -11.6519775390625, -11.299560546875, -10.9471435546875, -10.5947265625, -10.2423095703125, -9.889892578125, -9.5374755859375, -9.18505859375, -8.8326416015625, -8.480224609375, -8.1278076171875, -7.775390625, -7.4229736328125, -7.070556640625, -6.7181396484375, -6.36572265625, -6.0133056640625, -5.660888671875, -5.3084716796875, -4.9560546875, -4.6036376953125, -4.251220703125, -3.8988037109375, -3.54638671875, -3.1939697265625, -2.841552734375, -2.4891357421875, -2.13671875, -1.7843017578125, -1.431884765625, -1.0794677734375, -0.72705078125, -0.3746337890625, -0.022216796875, 0.3302001953125, 0.6826171875, 1.0350341796875, 1.387451171875, 1.7398681640625, 2.09228515625, 2.4447021484375, 2.797119140625, 3.1495361328125, 3.501953125, 3.8543701171875, 4.206787109375, 4.5592041015625, 4.91162109375, 5.2640380859375, 5.616455078125, 5.9688720703125, 6.3212890625, 6.6737060546875, 7.026123046875, 7.3785400390625, 7.73095703125, 8.0833740234375, 8.435791015625, 8.7882080078125, 9.140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 15.0, 26.0, 47.0, 74.0, 85.0, 113.0, 109.0, 139.0, 114.0, 92.0, 67.0, 46.0, 22.0, 16.0, 9.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.94747543334961, -52.6427116394043, -50.337947845458984, -48.03318405151367, -45.72842025756836, -43.42365646362305, -41.11888885498047, -38.814125061035156, -36.509361267089844, -34.20459747314453, -31.89983367919922, -29.595069885253906, -27.290306091308594, -24.98554229736328, -22.680776596069336, -20.376012802124023, -18.071250915527344, -15.766487121582031, -13.461723327636719, -11.15695858001709, -8.852194786071777, -6.547430992126465, -4.242666244506836, -1.9379024505615234, 0.36686134338378906, 2.6716253757476807, 4.976389408111572, 7.281153678894043, 9.585917472839355, 11.890681266784668, 14.195446014404297, 16.50020980834961, 18.804977416992188, 21.1097412109375, 23.414505004882812, 25.719268798828125, 28.024032592773438, 30.32879638671875, 32.63356018066406, 34.938323974609375, 37.24308776855469, 39.5478515625, 41.85261535644531, 44.157379150390625, 46.46214294433594, 48.76690673828125, 51.07167053222656, 53.376434326171875, 55.68120193481445, 57.985965728759766, 60.29072952270508, 62.59549331665039, 64.90026092529297, 67.20502471923828, 69.5097885131836, 71.8145523071289, 74.11931610107422, 76.42407989501953, 78.72884368896484, 81.03360748291016, 83.33837127685547, 85.64313507080078, 87.9478988647461, 90.2526626586914, 92.55742645263672]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 7.0, 12.0, 7.0, 18.0, 17.0, 22.0, 24.0, 29.0, 32.0, 34.0, 39.0, 38.0, 47.0, 44.0, 46.0, 49.0, 49.0, 45.0, 61.0, 47.0, 36.0, 33.0, 36.0, 29.0, 27.0, 29.0, 27.0, 13.0, 11.0, 18.0, 17.0, 12.0, 10.0, 2.0, 6.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.967315673828125, -27.91663360595703, -26.865951538085938, -25.815269470214844, -24.76458740234375, -23.713905334472656, -22.66322135925293, -21.612539291381836, -20.561857223510742, -19.51117515563965, -18.460493087768555, -17.40981101989746, -16.359127044677734, -15.308445930480957, -14.257762908935547, -13.207080841064453, -12.15639877319336, -11.105716705322266, -10.055034637451172, -9.004351615905762, -7.953669548034668, -6.902987480163574, -5.852304935455322, -4.80162239074707, -3.7509403228759766, -2.7002580165863037, -1.6495757102966309, -0.598893404006958, 0.45178890228271484, 1.5024709701538086, 2.5531535148620605, 3.6038360595703125, 4.654518127441406, 5.7052001953125, 6.755882740020752, 7.806565284729004, 8.857247352600098, 9.907929420471191, 10.958612442016602, 12.009294509887695, 13.059976577758789, 14.110658645629883, 15.161340713500977, 16.21202278137207, 17.262706756591797, 18.31338882446289, 19.364070892333984, 20.414752960205078, 21.465435028076172, 22.516117095947266, 23.56679916381836, 24.617481231689453, 25.668163299560547, 26.71884536743164, 27.769529342651367, 28.82021141052246, 29.870893478393555, 30.92157554626465, 31.972257614135742, 33.02294158935547, 34.07362365722656, 35.124305725097656, 36.17498779296875, 37.225669860839844, 38.27635192871094]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 13.0, 19.0, 30.0, 45.0, 82.0, 131.0, 230.0, 436.0, 819.0, 1665.0, 4472.0, 16688.0, 92402.0, 567229.0, 303889.0, 45137.0, 9726.0, 2923.0, 1204.0, 586.0, 286.0, 186.0, 119.0, 69.0, 45.0, 39.0, 21.0, 17.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.84375, -54.087890625, -52.33203125, -50.576171875, -48.8203125, -47.064453125, -45.30859375, -43.552734375, -41.796875, -40.041015625, -38.28515625, -36.529296875, -34.7734375, -33.017578125, -31.26171875, -29.505859375, -27.75, -25.994140625, -24.23828125, -22.482421875, -20.7265625, -18.970703125, -17.21484375, -15.458984375, -13.703125, -11.947265625, -10.19140625, -8.435546875, -6.6796875, -4.923828125, -3.16796875, -1.412109375, 0.34375, 2.099609375, 3.85546875, 5.611328125, 7.3671875, 9.123046875, 10.87890625, 12.634765625, 14.390625, 16.146484375, 17.90234375, 19.658203125, 21.4140625, 23.169921875, 24.92578125, 26.681640625, 28.4375, 30.193359375, 31.94921875, 33.705078125, 35.4609375, 37.216796875, 38.97265625, 40.728515625, 42.484375, 44.240234375, 45.99609375, 47.751953125, 49.5078125, 51.263671875, 53.01953125, 54.775390625, 56.53125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 7.0, 9.0, 24.0, 32.0, 42.0, 56.0, 52.0, 61.0, 98.0, 97.0, 77.0, 77.0, 73.0, 65.0, 60.0, 55.0, 36.0, 28.0, 15.0, 17.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.30877685546875, -6.0863037109375, -5.86383056640625, -5.641357421875, -5.41888427734375, -5.1964111328125, -4.97393798828125, -4.75146484375, -4.52899169921875, -4.3065185546875, -4.08404541015625, -3.861572265625, -3.63909912109375, -3.4166259765625, -3.19415283203125, -2.9716796875, -2.74920654296875, -2.5267333984375, -2.30426025390625, -2.081787109375, -1.85931396484375, -1.6368408203125, -1.41436767578125, -1.19189453125, -0.96942138671875, -0.7469482421875, -0.52447509765625, -0.302001953125, -0.07952880859375, 0.1429443359375, 0.36541748046875, 0.587890625, 0.81036376953125, 1.0328369140625, 1.25531005859375, 1.477783203125, 1.70025634765625, 1.9227294921875, 2.14520263671875, 2.36767578125, 2.59014892578125, 2.8126220703125, 3.03509521484375, 3.257568359375, 3.48004150390625, 3.7025146484375, 3.92498779296875, 4.1474609375, 4.36993408203125, 4.5924072265625, 4.81488037109375, 5.037353515625, 5.25982666015625, 5.4822998046875, 5.70477294921875, 5.92724609375, 6.14971923828125, 6.3721923828125, 6.59466552734375, 6.817138671875, 7.03961181640625, 7.2620849609375, 7.48455810546875, 7.70703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 3.0, 6.0, 14.0, 14.0, 19.0, 29.0, 43.0, 45.0, 88.0, 137.0, 228.0, 287.0, 477.0, 801.0, 1371.0, 2475.0, 5649.0, 13253.0, 34679.0, 94487.0, 274778.0, 385228.0, 146603.0, 52258.0, 19579.0, 8040.0, 3534.0, 1744.0, 998.0, 565.0, 332.0, 270.0, 162.0, 114.0, 73.0, 53.0, 39.0, 19.0, 18.0, 16.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -21.071533203125, -20.45556640625, -19.839599609375, -19.2236328125, -18.607666015625, -17.99169921875, -17.375732421875, -16.759765625, -16.143798828125, -15.52783203125, -14.911865234375, -14.2958984375, -13.679931640625, -13.06396484375, -12.447998046875, -11.83203125, -11.216064453125, -10.60009765625, -9.984130859375, -9.3681640625, -8.752197265625, -8.13623046875, -7.520263671875, -6.904296875, -6.288330078125, -5.67236328125, -5.056396484375, -4.4404296875, -3.824462890625, -3.20849609375, -2.592529296875, -1.9765625, -1.360595703125, -0.74462890625, -0.128662109375, 0.4873046875, 1.103271484375, 1.71923828125, 2.335205078125, 2.951171875, 3.567138671875, 4.18310546875, 4.799072265625, 5.4150390625, 6.031005859375, 6.64697265625, 7.262939453125, 7.87890625, 8.494873046875, 9.11083984375, 9.726806640625, 10.3427734375, 10.958740234375, 11.57470703125, 12.190673828125, 12.806640625, 13.422607421875, 14.03857421875, 14.654541015625, 15.2705078125, 15.886474609375, 16.50244140625, 17.118408203125, 17.734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 7.0, 9.0, 16.0, 11.0, 14.0, 23.0, 23.0, 24.0, 37.0, 36.0, 33.0, 42.0, 41.0, 39.0, 38.0, 50.0, 43.0, 54.0, 38.0, 38.0, 42.0, 55.0, 31.0, 36.0, 31.0, 37.0, 18.0, 15.0, 17.0, 16.0, 8.0, 11.0, 13.0, 6.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.171875, -14.7061767578125, -14.240478515625, -13.7747802734375, -13.30908203125, -12.8433837890625, -12.377685546875, -11.9119873046875, -11.4462890625, -10.9805908203125, -10.514892578125, -10.0491943359375, -9.58349609375, -9.1177978515625, -8.652099609375, -8.1864013671875, -7.720703125, -7.2550048828125, -6.789306640625, -6.3236083984375, -5.85791015625, -5.3922119140625, -4.926513671875, -4.4608154296875, -3.9951171875, -3.5294189453125, -3.063720703125, -2.5980224609375, -2.13232421875, -1.6666259765625, -1.200927734375, -0.7352294921875, -0.26953125, 0.1961669921875, 0.661865234375, 1.1275634765625, 1.59326171875, 2.0589599609375, 2.524658203125, 2.9903564453125, 3.4560546875, 3.9217529296875, 4.387451171875, 4.8531494140625, 5.31884765625, 5.7845458984375, 6.250244140625, 6.7159423828125, 7.181640625, 7.6473388671875, 8.113037109375, 8.5787353515625, 9.04443359375, 9.5101318359375, 9.975830078125, 10.4415283203125, 10.9072265625, 11.3729248046875, 11.838623046875, 12.3043212890625, 12.77001953125, 13.2357177734375, 13.701416015625, 14.1671142578125, 14.6328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 17.0, 8.0, 31.0, 44.0, 68.0, 114.0, 198.0, 325.0, 575.0, 1126.0, 2251.0, 4822.0, 11031.0, 26163.0, 67438.0, 184246.0, 377725.0, 231651.0, 83989.0, 32084.0, 13184.0, 5686.0, 2723.0, 1351.0, 707.0, 400.0, 231.0, 123.0, 100.0, 52.0, 32.0, 15.0, 12.0, 10.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.3125, -8.049560546875, -7.78662109375, -7.523681640625, -7.2607421875, -6.997802734375, -6.73486328125, -6.471923828125, -6.208984375, -5.946044921875, -5.68310546875, -5.420166015625, -5.1572265625, -4.894287109375, -4.63134765625, -4.368408203125, -4.10546875, -3.842529296875, -3.57958984375, -3.316650390625, -3.0537109375, -2.790771484375, -2.52783203125, -2.264892578125, -2.001953125, -1.739013671875, -1.47607421875, -1.213134765625, -0.9501953125, -0.687255859375, -0.42431640625, -0.161376953125, 0.1015625, 0.364501953125, 0.62744140625, 0.890380859375, 1.1533203125, 1.416259765625, 1.67919921875, 1.942138671875, 2.205078125, 2.468017578125, 2.73095703125, 2.993896484375, 3.2568359375, 3.519775390625, 3.78271484375, 4.045654296875, 4.30859375, 4.571533203125, 4.83447265625, 5.097412109375, 5.3603515625, 5.623291015625, 5.88623046875, 6.149169921875, 6.412109375, 6.675048828125, 6.93798828125, 7.200927734375, 7.4638671875, 7.726806640625, 7.98974609375, 8.252685546875, 8.515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 8.0, 6.0, 11.0, 8.0, 11.0, 23.0, 21.0, 30.0, 44.0, 48.0, 74.0, 104.0, 113.0, 108.0, 92.0, 57.0, 26.0, 40.0, 26.0, 26.0, 19.0, 19.0, 3.0, 15.0, 8.0, 10.0, 8.0, 2.0, 2.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001834869384765625, -0.0017755329608917236, -0.0017161965370178223, -0.001656860113143921, -0.0015975236892700195, -0.0015381872653961182, -0.0014788508415222168, -0.0014195144176483154, -0.001360177993774414, -0.0013008415699005127, -0.0012415051460266113, -0.00118216872215271, -0.0011228322982788086, -0.0010634958744049072, -0.0010041594505310059, -0.0009448230266571045, -0.0008854866027832031, -0.0008261501789093018, -0.0007668137550354004, -0.000707477331161499, -0.0006481409072875977, -0.0005888044834136963, -0.0005294680595397949, -0.00047013163566589355, -0.0004107952117919922, -0.0003514587879180908, -0.00029212236404418945, -0.00023278594017028809, -0.00017344951629638672, -0.00011411309242248535, -5.4776668548583984e-05, 4.559755325317383e-06, 6.389617919921875e-05, 0.00012323260307312012, 0.00018256902694702148, 0.00024190545082092285, 0.0003012418746948242, 0.0003605782985687256, 0.00041991472244262695, 0.0004792511463165283, 0.0005385875701904297, 0.0005979239940643311, 0.0006572604179382324, 0.0007165968418121338, 0.0007759332656860352, 0.0008352696895599365, 0.0008946061134338379, 0.0009539425373077393, 0.0010132789611816406, 0.001072615385055542, 0.0011319518089294434, 0.0011912882328033447, 0.001250624656677246, 0.0013099610805511475, 0.0013692975044250488, 0.0014286339282989502, 0.0014879703521728516, 0.001547306776046753, 0.0016066431999206543, 0.0016659796237945557, 0.001725316047668457, 0.0017846524715423584, 0.0018439888954162598, 0.0019033253192901611, 0.0019626617431640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 9.0, 19.0, 28.0, 36.0, 51.0, 88.0, 143.0, 240.0, 425.0, 784.0, 1666.0, 3846.0, 10448.0, 34081.0, 131925.0, 465155.0, 296204.0, 71667.0, 19805.0, 6646.0, 2674.0, 1198.0, 599.0, 328.0, 167.0, 110.0, 63.0, 45.0, 33.0, 21.0, 13.0, 12.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.261962890625, -7.91455078125, -7.567138671875, -7.2197265625, -6.872314453125, -6.52490234375, -6.177490234375, -5.830078125, -5.482666015625, -5.13525390625, -4.787841796875, -4.4404296875, -4.093017578125, -3.74560546875, -3.398193359375, -3.05078125, -2.703369140625, -2.35595703125, -2.008544921875, -1.6611328125, -1.313720703125, -0.96630859375, -0.618896484375, -0.271484375, 0.075927734375, 0.42333984375, 0.770751953125, 1.1181640625, 1.465576171875, 1.81298828125, 2.160400390625, 2.5078125, 2.855224609375, 3.20263671875, 3.550048828125, 3.8974609375, 4.244873046875, 4.59228515625, 4.939697265625, 5.287109375, 5.634521484375, 5.98193359375, 6.329345703125, 6.6767578125, 7.024169921875, 7.37158203125, 7.718994140625, 8.06640625, 8.413818359375, 8.76123046875, 9.108642578125, 9.4560546875, 9.803466796875, 10.15087890625, 10.498291015625, 10.845703125, 11.193115234375, 11.54052734375, 11.887939453125, 12.2353515625, 12.582763671875, 12.93017578125, 13.277587890625, 13.625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 8.0, 15.0, 13.0, 17.0, 30.0, 46.0, 42.0, 46.0, 94.0, 91.0, 91.0, 97.0, 93.0, 54.0, 66.0, 50.0, 27.0, 22.0, 18.0, 18.0, 17.0, 9.0, 10.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.7120361328125, -6.470947265625, -6.2298583984375, -5.98876953125, -5.7476806640625, -5.506591796875, -5.2655029296875, -5.0244140625, -4.7833251953125, -4.542236328125, -4.3011474609375, -4.06005859375, -3.8189697265625, -3.577880859375, -3.3367919921875, -3.095703125, -2.8546142578125, -2.613525390625, -2.3724365234375, -2.13134765625, -1.8902587890625, -1.649169921875, -1.4080810546875, -1.1669921875, -0.9259033203125, -0.684814453125, -0.4437255859375, -0.20263671875, 0.0384521484375, 0.279541015625, 0.5206298828125, 0.76171875, 1.0028076171875, 1.243896484375, 1.4849853515625, 1.72607421875, 1.9671630859375, 2.208251953125, 2.4493408203125, 2.6904296875, 2.9315185546875, 3.172607421875, 3.4136962890625, 3.65478515625, 3.8958740234375, 4.136962890625, 4.3780517578125, 4.619140625, 4.8602294921875, 5.101318359375, 5.3424072265625, 5.58349609375, 5.8245849609375, 6.065673828125, 6.3067626953125, 6.5478515625, 6.7889404296875, 7.030029296875, 7.2711181640625, 7.51220703125, 7.7532958984375, 7.994384765625, 8.2354736328125, 8.4765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 13.0, 15.0, 22.0, 37.0, 48.0, 59.0, 79.0, 94.0, 82.0, 95.0, 84.0, 85.0, 69.0, 56.0, 51.0, 27.0, 24.0, 21.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.95167541503906, -109.37156677246094, -105.79145812988281, -102.21135711669922, -98.6312484741211, -95.05113983154297, -91.47103881835938, -87.89093017578125, -84.31082153320312, -80.730712890625, -77.15060424804688, -73.57050323486328, -69.99039459228516, -66.41028594970703, -62.83018112182617, -59.25007629394531, -55.66996765136719, -52.08985900878906, -48.5097541809082, -44.929649353027344, -41.34954071044922, -37.769432067871094, -34.189327239990234, -30.609220504760742, -27.02911376953125, -23.449007034301758, -19.868900299072266, -16.288793563842773, -12.708686828613281, -9.128580093383789, -5.548473358154297, -1.9683666229248047, 1.6117401123046875, 5.19184684753418, 8.771953582763672, 12.352060317993164, 15.932167053222656, 19.51227378845215, 23.09238052368164, 26.672487258911133, 30.252593994140625, 33.83270263671875, 37.41280746459961, 40.99291229248047, 44.573020935058594, 48.15312957763672, 51.73323440551758, 55.31333923339844, 58.89344787597656, 62.47355651855469, 66.05366516113281, 69.6337661743164, 73.21387481689453, 76.79398345947266, 80.37408447265625, 83.95419311523438, 87.5343017578125, 91.11441040039062, 94.69451904296875, 98.27462005615234, 101.85472869873047, 105.4348373413086, 109.01493835449219, 112.59504699707031, 116.17515563964844]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 5.0, 4.0, 12.0, 12.0, 9.0, 10.0, 6.0, 17.0, 21.0, 22.0, 29.0, 30.0, 38.0, 32.0, 32.0, 45.0, 50.0, 51.0, 36.0, 53.0, 35.0, 46.0, 49.0, 38.0, 35.0, 34.0, 24.0, 35.0, 26.0, 30.0, 22.0, 18.0, 17.0, 11.0, 12.0, 9.0, 10.0, 8.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.69986724853516, -78.16695404052734, -75.63404083251953, -73.10112762451172, -70.5682144165039, -68.0353012084961, -65.50238800048828, -62.969478607177734, -60.43656539916992, -57.90365219116211, -55.3707389831543, -52.837825775146484, -50.30491638183594, -47.772003173828125, -45.23908996582031, -42.7061767578125, -40.17326354980469, -37.640350341796875, -35.10743713378906, -32.57452392578125, -30.04161262512207, -27.508699417114258, -24.975788116455078, -22.442874908447266, -19.909961700439453, -17.37704849243164, -14.844136238098145, -12.311223983764648, -9.778310775756836, -7.245397567749023, -4.712485313415527, -2.1795730590820312, 0.35333251953125, 2.8862452507019043, 5.419157981872559, 7.952070713043213, 10.484983444213867, 13.01789665222168, 15.550808906555176, 18.083721160888672, 20.616634368896484, 23.149547576904297, 25.68246078491211, 28.21537208557129, 30.7482852935791, 33.28119659423828, 35.814109802246094, 38.347023010253906, 40.87993621826172, 43.41284942626953, 45.945762634277344, 48.478675842285156, 51.01158905029297, 53.54450225830078, 56.07741165161133, 58.61032485961914, 61.14323806762695, 63.676151275634766, 66.20906066894531, 68.74197387695312, 71.27488708496094, 73.80780029296875, 76.34071350097656, 78.87362670898438, 81.40653991699219]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 14.0, 15.0, 13.0, 24.0, 37.0, 35.0, 66.0, 98.0, 183.0, 263.0, 489.0, 955.0, 2316.0, 7108.0, 35534.0, 625491.0, 3447203.0, 58876.0, 10271.0, 2996.0, 1142.0, 462.0, 266.0, 151.0, 97.0, 58.0, 32.0, 31.0, 12.0, 8.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-79.125, -77.04931640625, -74.9736328125, -72.89794921875, -70.822265625, -68.74658203125, -66.6708984375, -64.59521484375, -62.51953125, -60.44384765625, -58.3681640625, -56.29248046875, -54.216796875, -52.14111328125, -50.0654296875, -47.98974609375, -45.9140625, -43.83837890625, -41.7626953125, -39.68701171875, -37.611328125, -35.53564453125, -33.4599609375, -31.38427734375, -29.30859375, -27.23291015625, -25.1572265625, -23.08154296875, -21.005859375, -18.93017578125, -16.8544921875, -14.77880859375, -12.703125, -10.62744140625, -8.5517578125, -6.47607421875, -4.400390625, -2.32470703125, -0.2490234375, 1.82666015625, 3.90234375, 5.97802734375, 8.0537109375, 10.12939453125, 12.205078125, 14.28076171875, 16.3564453125, 18.43212890625, 20.5078125, 22.58349609375, 24.6591796875, 26.73486328125, 28.810546875, 30.88623046875, 32.9619140625, 35.03759765625, 37.11328125, 39.18896484375, 41.2646484375, 43.34033203125, 45.416015625, 47.49169921875, 49.5673828125, 51.64306640625, 53.71875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 14.0, 22.0, 32.0, 40.0, 54.0, 45.0, 69.0, 89.0, 88.0, 77.0, 85.0, 76.0, 68.0, 62.0, 47.0, 30.0, 22.0, 26.0, 14.0, 12.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.2451171875, -6.025390625, -5.8056640625, -5.5859375, -5.3662109375, -5.146484375, -4.9267578125, -4.70703125, -4.4873046875, -4.267578125, -4.0478515625, -3.828125, -3.6083984375, -3.388671875, -3.1689453125, -2.94921875, -2.7294921875, -2.509765625, -2.2900390625, -2.0703125, -1.8505859375, -1.630859375, -1.4111328125, -1.19140625, -0.9716796875, -0.751953125, -0.5322265625, -0.3125, -0.0927734375, 0.126953125, 0.3466796875, 0.56640625, 0.7861328125, 1.005859375, 1.2255859375, 1.4453125, 1.6650390625, 1.884765625, 2.1044921875, 2.32421875, 2.5439453125, 2.763671875, 2.9833984375, 3.203125, 3.4228515625, 3.642578125, 3.8623046875, 4.08203125, 4.3017578125, 4.521484375, 4.7412109375, 4.9609375, 5.1806640625, 5.400390625, 5.6201171875, 5.83984375, 6.0595703125, 6.279296875, 6.4990234375, 6.71875, 6.9384765625, 7.158203125, 7.3779296875, 7.59765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 15.0, 21.0, 18.0, 29.0, 33.0, 42.0, 57.0, 67.0, 103.0, 125.0, 212.0, 377.0, 815.0, 1847.0, 5395.0, 20291.0, 107753.0, 2051027.0, 1871753.0, 105220.0, 19908.0, 5440.0, 1837.0, 801.0, 327.0, 219.0, 135.0, 108.0, 75.0, 46.0, 37.0, 30.0, 31.0, 22.0, 16.0, 11.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-43.5, -42.29150390625, -41.0830078125, -39.87451171875, -38.666015625, -37.45751953125, -36.2490234375, -35.04052734375, -33.83203125, -32.62353515625, -31.4150390625, -30.20654296875, -28.998046875, -27.78955078125, -26.5810546875, -25.37255859375, -24.1640625, -22.95556640625, -21.7470703125, -20.53857421875, -19.330078125, -18.12158203125, -16.9130859375, -15.70458984375, -14.49609375, -13.28759765625, -12.0791015625, -10.87060546875, -9.662109375, -8.45361328125, -7.2451171875, -6.03662109375, -4.828125, -3.61962890625, -2.4111328125, -1.20263671875, 0.005859375, 1.21435546875, 2.4228515625, 3.63134765625, 4.83984375, 6.04833984375, 7.2568359375, 8.46533203125, 9.673828125, 10.88232421875, 12.0908203125, 13.29931640625, 14.5078125, 15.71630859375, 16.9248046875, 18.13330078125, 19.341796875, 20.55029296875, 21.7587890625, 22.96728515625, 24.17578125, 25.38427734375, 26.5927734375, 27.80126953125, 29.009765625, 30.21826171875, 31.4267578125, 32.63525390625, 33.84375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 9.0, 13.0, 19.0, 20.0, 32.0, 52.0, 66.0, 108.0, 169.0, 275.0, 644.0, 1451.0, 506.0, 235.0, 146.0, 93.0, 75.0, 47.0, 32.0, 17.0, 15.0, 15.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.703125, -14.3099365234375, -13.916748046875, -13.5235595703125, -13.13037109375, -12.7371826171875, -12.343994140625, -11.9508056640625, -11.5576171875, -11.1644287109375, -10.771240234375, -10.3780517578125, -9.98486328125, -9.5916748046875, -9.198486328125, -8.8052978515625, -8.412109375, -8.0189208984375, -7.625732421875, -7.2325439453125, -6.83935546875, -6.4461669921875, -6.052978515625, -5.6597900390625, -5.2666015625, -4.8734130859375, -4.480224609375, -4.0870361328125, -3.69384765625, -3.3006591796875, -2.907470703125, -2.5142822265625, -2.12109375, -1.7279052734375, -1.334716796875, -0.9415283203125, -0.54833984375, -0.1551513671875, 0.238037109375, 0.6312255859375, 1.0244140625, 1.4176025390625, 1.810791015625, 2.2039794921875, 2.59716796875, 2.9903564453125, 3.383544921875, 3.7767333984375, 4.169921875, 4.5631103515625, 4.956298828125, 5.3494873046875, 5.74267578125, 6.1358642578125, 6.529052734375, 6.9222412109375, 7.3154296875, 7.7086181640625, 8.101806640625, 8.4949951171875, 8.88818359375, 9.2813720703125, 9.674560546875, 10.0677490234375, 10.4609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 18.0, 23.0, 55.0, 63.0, 103.0, 127.0, 141.0, 144.0, 94.0, 81.0, 54.0, 36.0, 21.0, 16.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6307144165039, -72.41205596923828, -69.19338989257812, -65.9747314453125, -62.756072998046875, -59.53741455078125, -56.31875228881836, -53.10009002685547, -49.881431579589844, -46.66277313232422, -43.44411087036133, -40.22544860839844, -37.00679016113281, -33.78813171386719, -30.569469451904297, -27.35080909729004, -24.13214874267578, -20.913488388061523, -17.694828033447266, -14.476167678833008, -11.25750732421875, -8.038846969604492, -4.820186614990234, -1.6015262603759766, 1.6171340942382812, 4.835794448852539, 8.054454803466797, 11.273115158081055, 14.491775512695312, 17.71043586730957, 20.929096221923828, 24.147756576538086, 27.366409301757812, 30.58506965637207, 33.80373001098633, 37.02239227294922, 40.241050720214844, 43.45970916748047, 46.67837142944336, 49.89703369140625, 53.115692138671875, 56.3343505859375, 59.55301284790039, 62.77167510986328, 65.9903335571289, 69.20899200439453, 72.42765808105469, 75.64631652832031, 78.86497497558594, 82.08363342285156, 85.30229187011719, 88.52095794677734, 91.73961639404297, 94.9582748413086, 98.17694091796875, 101.39559936523438, 104.6142578125, 107.83291625976562, 111.05157470703125, 114.2702407836914, 117.48889923095703, 120.70755767822266, 123.92622375488281, 127.14488220214844, 130.36354064941406]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 15.0, 12.0, 15.0, 16.0, 24.0, 21.0, 21.0, 29.0, 34.0, 49.0, 41.0, 29.0, 44.0, 49.0, 47.0, 47.0, 59.0, 46.0, 36.0, 48.0, 45.0, 42.0, 25.0, 31.0, 32.0, 23.0, 18.0, 18.0, 11.0, 12.0, 6.0, 7.0, 11.0, 4.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.44134521484375, -35.189483642578125, -33.9376220703125, -32.685760498046875, -31.433900833129883, -30.182039260864258, -28.930179595947266, -27.67831802368164, -26.426456451416016, -25.17459487915039, -23.922733306884766, -22.670873641967773, -21.41901206970215, -20.167150497436523, -18.91529083251953, -17.663429260253906, -16.41156768798828, -15.159706115722656, -13.907845497131348, -12.655984878540039, -11.404123306274414, -10.152261734008789, -8.90040111541748, -7.648540496826172, -6.396678924560547, -5.14481782913208, -3.8929567337036133, -2.6410956382751465, -1.3892345428466797, -0.1373734474182129, 1.114487648010254, 2.3663482666015625, 3.618213653564453, 4.87007474899292, 6.121935844421387, 7.3737969398498535, 8.62565803527832, 9.877519607543945, 11.129380226135254, 12.381240844726562, 13.633102416992188, 14.884963989257812, 16.136825561523438, 17.38868522644043, 18.640546798706055, 19.89240837097168, 21.144268035888672, 22.396129608154297, 23.647991180419922, 24.899852752685547, 26.151714324951172, 27.403573989868164, 28.65543556213379, 29.907297134399414, 31.159156799316406, 32.41101837158203, 33.662879943847656, 34.91474151611328, 36.166603088378906, 37.41846466064453, 38.670326232910156, 39.922183990478516, 41.17404556274414, 42.425907135009766, 43.67776870727539]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 3.0, 4.0, 9.0, 9.0, 16.0, 26.0, 28.0, 37.0, 59.0, 80.0, 118.0, 182.0, 288.0, 538.0, 996.0, 2247.0, 5494.0, 17155.0, 70767.0, 503696.0, 367332.0, 56012.0, 14366.0, 4823.0, 1978.0, 952.0, 507.0, 286.0, 176.0, 119.0, 76.0, 39.0, 41.0, 27.0, 16.0, 13.0, 8.0, 3.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-50.15625, -48.72021484375, -47.2841796875, -45.84814453125, -44.412109375, -42.97607421875, -41.5400390625, -40.10400390625, -38.66796875, -37.23193359375, -35.7958984375, -34.35986328125, -32.923828125, -31.48779296875, -30.0517578125, -28.61572265625, -27.1796875, -25.74365234375, -24.3076171875, -22.87158203125, -21.435546875, -19.99951171875, -18.5634765625, -17.12744140625, -15.69140625, -14.25537109375, -12.8193359375, -11.38330078125, -9.947265625, -8.51123046875, -7.0751953125, -5.63916015625, -4.203125, -2.76708984375, -1.3310546875, 0.10498046875, 1.541015625, 2.97705078125, 4.4130859375, 5.84912109375, 7.28515625, 8.72119140625, 10.1572265625, 11.59326171875, 13.029296875, 14.46533203125, 15.9013671875, 17.33740234375, 18.7734375, 20.20947265625, 21.6455078125, 23.08154296875, 24.517578125, 25.95361328125, 27.3896484375, 28.82568359375, 30.26171875, 31.69775390625, 33.1337890625, 34.56982421875, 36.005859375, 37.44189453125, 38.8779296875, 40.31396484375, 41.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 17.0, 29.0, 27.0, 31.0, 57.0, 50.0, 77.0, 91.0, 76.0, 93.0, 72.0, 68.0, 68.0, 57.0, 42.0, 40.0, 31.0, 17.0, 10.0, 19.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3153076171875, -6.091552734375, -5.8677978515625, -5.64404296875, -5.4202880859375, -5.196533203125, -4.9727783203125, -4.7490234375, -4.5252685546875, -4.301513671875, -4.0777587890625, -3.85400390625, -3.6302490234375, -3.406494140625, -3.1827392578125, -2.958984375, -2.7352294921875, -2.511474609375, -2.2877197265625, -2.06396484375, -1.8402099609375, -1.616455078125, -1.3927001953125, -1.1689453125, -0.9451904296875, -0.721435546875, -0.4976806640625, -0.27392578125, -0.0501708984375, 0.173583984375, 0.3973388671875, 0.62109375, 0.8448486328125, 1.068603515625, 1.2923583984375, 1.51611328125, 1.7398681640625, 1.963623046875, 2.1873779296875, 2.4111328125, 2.6348876953125, 2.858642578125, 3.0823974609375, 3.30615234375, 3.5299072265625, 3.753662109375, 3.9774169921875, 4.201171875, 4.4249267578125, 4.648681640625, 4.8724365234375, 5.09619140625, 5.3199462890625, 5.543701171875, 5.7674560546875, 5.9912109375, 6.2149658203125, 6.438720703125, 6.6624755859375, 6.88623046875, 7.1099853515625, 7.333740234375, 7.5574951171875, 7.78125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 8.0, 8.0, 17.0, 5.0, 20.0, 24.0, 35.0, 49.0, 75.0, 101.0, 140.0, 190.0, 256.0, 464.0, 769.0, 1342.0, 2880.0, 6741.0, 17057.0, 48185.0, 152633.0, 491289.0, 222039.0, 65555.0, 22603.0, 8378.0, 3460.0, 1698.0, 878.0, 504.0, 372.0, 216.0, 146.0, 113.0, 87.0, 54.0, 40.0, 40.0, 30.0, 10.0, 13.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.515625, -20.8564453125, -20.197265625, -19.5380859375, -18.87890625, -18.2197265625, -17.560546875, -16.9013671875, -16.2421875, -15.5830078125, -14.923828125, -14.2646484375, -13.60546875, -12.9462890625, -12.287109375, -11.6279296875, -10.96875, -10.3095703125, -9.650390625, -8.9912109375, -8.33203125, -7.6728515625, -7.013671875, -6.3544921875, -5.6953125, -5.0361328125, -4.376953125, -3.7177734375, -3.05859375, -2.3994140625, -1.740234375, -1.0810546875, -0.421875, 0.2373046875, 0.896484375, 1.5556640625, 2.21484375, 2.8740234375, 3.533203125, 4.1923828125, 4.8515625, 5.5107421875, 6.169921875, 6.8291015625, 7.48828125, 8.1474609375, 8.806640625, 9.4658203125, 10.125, 10.7841796875, 11.443359375, 12.1025390625, 12.76171875, 13.4208984375, 14.080078125, 14.7392578125, 15.3984375, 16.0576171875, 16.716796875, 17.3759765625, 18.03515625, 18.6943359375, 19.353515625, 20.0126953125, 20.671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 8.0, 8.0, 11.0, 13.0, 20.0, 22.0, 21.0, 16.0, 28.0, 34.0, 39.0, 32.0, 53.0, 49.0, 40.0, 40.0, 45.0, 36.0, 54.0, 50.0, 34.0, 36.0, 50.0, 36.0, 28.0, 15.0, 28.0, 25.0, 18.0, 20.0, 18.0, 11.0, 12.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.6875, -16.1927490234375, -15.697998046875, -15.2032470703125, -14.70849609375, -14.2137451171875, -13.718994140625, -13.2242431640625, -12.7294921875, -12.2347412109375, -11.739990234375, -11.2452392578125, -10.75048828125, -10.2557373046875, -9.760986328125, -9.2662353515625, -8.771484375, -8.2767333984375, -7.781982421875, -7.2872314453125, -6.79248046875, -6.2977294921875, -5.802978515625, -5.3082275390625, -4.8134765625, -4.3187255859375, -3.823974609375, -3.3292236328125, -2.83447265625, -2.3397216796875, -1.844970703125, -1.3502197265625, -0.85546875, -0.3607177734375, 0.134033203125, 0.6287841796875, 1.12353515625, 1.6182861328125, 2.113037109375, 2.6077880859375, 3.1025390625, 3.5972900390625, 4.092041015625, 4.5867919921875, 5.08154296875, 5.5762939453125, 6.071044921875, 6.5657958984375, 7.060546875, 7.5552978515625, 8.050048828125, 8.5447998046875, 9.03955078125, 9.5343017578125, 10.029052734375, 10.5238037109375, 11.0185546875, 11.5133056640625, 12.008056640625, 12.5028076171875, 12.99755859375, 13.4923095703125, 13.987060546875, 14.4818115234375, 14.9765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 13.0, 22.0, 40.0, 52.0, 128.0, 243.0, 880.0, 4858.0, 137969.0, 888389.0, 13596.0, 1610.0, 411.0, 148.0, 77.0, 54.0, 18.0, 18.0, 9.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0, -38.67578125, -37.3515625, -36.02734375, -34.703125, -33.37890625, -32.0546875, -30.73046875, -29.40625, -28.08203125, -26.7578125, -25.43359375, -24.109375, -22.78515625, -21.4609375, -20.13671875, -18.8125, -17.48828125, -16.1640625, -14.83984375, -13.515625, -12.19140625, -10.8671875, -9.54296875, -8.21875, -6.89453125, -5.5703125, -4.24609375, -2.921875, -1.59765625, -0.2734375, 1.05078125, 2.375, 3.69921875, 5.0234375, 6.34765625, 7.671875, 8.99609375, 10.3203125, 11.64453125, 12.96875, 14.29296875, 15.6171875, 16.94140625, 18.265625, 19.58984375, 20.9140625, 22.23828125, 23.5625, 24.88671875, 26.2109375, 27.53515625, 28.859375, 30.18359375, 31.5078125, 32.83203125, 34.15625, 35.48046875, 36.8046875, 38.12890625, 39.453125, 40.77734375, 42.1015625, 43.42578125, 44.75]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 2.0, 9.0, 15.0, 14.0, 23.0, 26.0, 42.0, 57.0, 188.0, 291.0, 154.0, 41.0, 40.0, 23.0, 17.0, 12.0, 10.0, 8.0, 2.0, 2.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026874542236328125, -0.002589315176010132, -0.002491176128387451, -0.0023930370807647705, -0.00229489803314209, -0.002196758985519409, -0.0020986199378967285, -0.002000480890274048, -0.0019023418426513672, -0.0018042027950286865, -0.0017060637474060059, -0.0016079246997833252, -0.0015097856521606445, -0.0014116466045379639, -0.0013135075569152832, -0.0012153685092926025, -0.0011172294616699219, -0.0010190904140472412, -0.0009209513664245605, -0.0008228123188018799, -0.0007246732711791992, -0.0006265342235565186, -0.0005283951759338379, -0.0004302561283111572, -0.00033211708068847656, -0.0002339780330657959, -0.00013583898544311523, -3.769993782043457e-05, 6.0439109802246094e-05, 0.00015857815742492676, 0.0002567172050476074, 0.0003548562526702881, 0.00045299530029296875, 0.0005511343479156494, 0.0006492733955383301, 0.0007474124431610107, 0.0008455514907836914, 0.0009436905384063721, 0.0010418295860290527, 0.0011399686336517334, 0.001238107681274414, 0.0013362467288970947, 0.0014343857765197754, 0.001532524824142456, 0.0016306638717651367, 0.0017288029193878174, 0.001826941967010498, 0.0019250810146331787, 0.0020232200622558594, 0.00212135910987854, 0.0022194981575012207, 0.0023176372051239014, 0.002415776252746582, 0.0025139153003692627, 0.0026120543479919434, 0.002710193395614624, 0.0028083324432373047, 0.0029064714908599854, 0.003004610538482666, 0.0031027495861053467, 0.0032008886337280273, 0.003299027681350708, 0.0033971667289733887, 0.0034953057765960693, 0.00359344482421875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 7.0, 10.0, 12.0, 17.0, 22.0, 23.0, 33.0, 35.0, 59.0, 98.0, 124.0, 195.0, 339.0, 497.0, 791.0, 1407.0, 2589.0, 5371.0, 13662.0, 50592.0, 428704.0, 463779.0, 54019.0, 14073.0, 5622.0, 2700.0, 1408.0, 839.0, 500.0, 329.0, 212.0, 124.0, 85.0, 65.0, 46.0, 28.0, 24.0, 18.0, 12.0, 19.0, 9.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.3671875, -11.968505859375, -11.56982421875, -11.171142578125, -10.7724609375, -10.373779296875, -9.97509765625, -9.576416015625, -9.177734375, -8.779052734375, -8.38037109375, -7.981689453125, -7.5830078125, -7.184326171875, -6.78564453125, -6.386962890625, -5.98828125, -5.589599609375, -5.19091796875, -4.792236328125, -4.3935546875, -3.994873046875, -3.59619140625, -3.197509765625, -2.798828125, -2.400146484375, -2.00146484375, -1.602783203125, -1.2041015625, -0.805419921875, -0.40673828125, -0.008056640625, 0.390625, 0.789306640625, 1.18798828125, 1.586669921875, 1.9853515625, 2.384033203125, 2.78271484375, 3.181396484375, 3.580078125, 3.978759765625, 4.37744140625, 4.776123046875, 5.1748046875, 5.573486328125, 5.97216796875, 6.370849609375, 6.76953125, 7.168212890625, 7.56689453125, 7.965576171875, 8.3642578125, 8.762939453125, 9.16162109375, 9.560302734375, 9.958984375, 10.357666015625, 10.75634765625, 11.155029296875, 11.5537109375, 11.952392578125, 12.35107421875, 12.749755859375, 13.1484375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 7.0, 10.0, 12.0, 13.0, 28.0, 47.0, 89.0, 144.0, 182.0, 155.0, 113.0, 59.0, 38.0, 24.0, 18.0, 10.0, 5.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.40625, -12.0269775390625, -11.647705078125, -11.2684326171875, -10.88916015625, -10.5098876953125, -10.130615234375, -9.7513427734375, -9.3720703125, -8.9927978515625, -8.613525390625, -8.2342529296875, -7.85498046875, -7.4757080078125, -7.096435546875, -6.7171630859375, -6.337890625, -5.9586181640625, -5.579345703125, -5.2000732421875, -4.82080078125, -4.4415283203125, -4.062255859375, -3.6829833984375, -3.3037109375, -2.9244384765625, -2.545166015625, -2.1658935546875, -1.78662109375, -1.4073486328125, -1.028076171875, -0.6488037109375, -0.26953125, 0.1097412109375, 0.489013671875, 0.8682861328125, 1.24755859375, 1.6268310546875, 2.006103515625, 2.3853759765625, 2.7646484375, 3.1439208984375, 3.523193359375, 3.9024658203125, 4.28173828125, 4.6610107421875, 5.040283203125, 5.4195556640625, 5.798828125, 6.1781005859375, 6.557373046875, 6.9366455078125, 7.31591796875, 7.6951904296875, 8.074462890625, 8.4537353515625, 8.8330078125, 9.2122802734375, 9.591552734375, 9.9708251953125, 10.35009765625, 10.7293701171875, 11.108642578125, 11.4879150390625, 11.8671875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 24.0, 32.0, 72.0, 93.0, 167.0, 178.0, 173.0, 118.0, 71.0, 40.0, 17.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.31546020507812, -142.99058532714844, -135.66571044921875, -128.3408203125, -121.01595306396484, -113.69107055664062, -106.36619567871094, -99.04132080078125, -91.71644592285156, -84.39157104492188, -77.06668853759766, -69.74181365966797, -62.41693878173828, -55.09206008911133, -47.767181396484375, -40.44230651855469, -33.11742401123047, -25.79254722595215, -18.467670440673828, -11.142791748046875, -3.8179149627685547, 3.5069618225097656, 10.831840515136719, 18.156715393066406, 25.48159408569336, 32.80647277832031, 40.13134765625, 47.45622634887695, 54.781105041503906, 62.105979919433594, 69.43086242675781, 76.7557373046875, 84.08061218261719, 91.40548706054688, 98.7303695678711, 106.05524444580078, 113.38011932373047, 120.70500183105469, 128.02987670898438, 135.35475158691406, 142.67962646484375, 150.00450134277344, 157.32937622070312, 164.65426635742188, 171.97914123535156, 179.30401611328125, 186.62889099121094, 193.95376586914062, 201.27865600585938, 208.60353088378906, 215.92840576171875, 223.2532958984375, 230.5781707763672, 237.90304565429688, 245.22792053222656, 252.55279541015625, 259.8776550292969, 267.2025451660156, 274.52740478515625, 281.852294921875, 289.1771545410156, 296.5020446777344, 303.826904296875, 311.15179443359375, 318.4766845703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 7.0, 8.0, 10.0, 13.0, 18.0, 19.0, 10.0, 16.0, 23.0, 20.0, 32.0, 36.0, 40.0, 33.0, 35.0, 40.0, 39.0, 38.0, 41.0, 37.0, 35.0, 43.0, 38.0, 40.0, 37.0, 34.0, 29.0, 26.0, 27.0, 23.0, 17.0, 13.0, 24.0, 17.0, 15.0, 17.0, 11.0, 8.0, 3.0, 2.0, 8.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-80.02961730957031, -77.57621765136719, -75.12281036376953, -72.6694107055664, -70.21600341796875, -67.76260375976562, -65.3092041015625, -62.85580062866211, -60.40239715576172, -57.94899368286133, -55.49559020996094, -53.04219055175781, -50.58878707885742, -48.13538360595703, -45.681983947753906, -43.228580474853516, -40.775177001953125, -38.321773529052734, -35.868370056152344, -33.41497039794922, -30.961566925048828, -28.508163452148438, -26.05476188659668, -23.601360321044922, -21.14795684814453, -18.69455337524414, -16.241151809692383, -13.787749290466309, -11.334346771240234, -8.88094425201416, -6.427541732788086, -3.974140167236328, -1.5207366943359375, 0.9326658248901367, 3.386068344116211, 5.839470863342285, 8.29287338256836, 10.746275901794434, 13.199678421020508, 15.653079986572266, 18.106483459472656, 20.559886932373047, 23.013288497924805, 25.466690063476562, 27.920093536376953, 30.373497009277344, 32.82689666748047, 35.28030014038086, 37.73370361328125, 40.18710708618164, 42.64051055908203, 45.093910217285156, 47.54731369018555, 50.00071716308594, 52.45411682128906, 54.90752029418945, 57.360923767089844, 59.814327239990234, 62.267730712890625, 64.72113037109375, 67.17453002929688, 69.62793731689453, 72.08133697509766, 74.53474426269531, 76.98814392089844]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 12.0, 9.0, 11.0, 19.0, 26.0, 27.0, 33.0, 54.0, 72.0, 107.0, 177.0, 254.0, 354.0, 568.0, 1042.0, 2054.0, 4198.0, 10439.0, 33865.0, 211604.0, 3700480.0, 179090.0, 31305.0, 9918.0, 4037.0, 1904.0, 1009.0, 552.0, 335.0, 180.0, 144.0, 95.0, 60.0, 50.0, 36.0, 22.0, 16.0, 16.0, 16.0, 13.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-53.5, -51.94775390625, -50.3955078125, -48.84326171875, -47.291015625, -45.73876953125, -44.1865234375, -42.63427734375, -41.08203125, -39.52978515625, -37.9775390625, -36.42529296875, -34.873046875, -33.32080078125, -31.7685546875, -30.21630859375, -28.6640625, -27.11181640625, -25.5595703125, -24.00732421875, -22.455078125, -20.90283203125, -19.3505859375, -17.79833984375, -16.24609375, -14.69384765625, -13.1416015625, -11.58935546875, -10.037109375, -8.48486328125, -6.9326171875, -5.38037109375, -3.828125, -2.27587890625, -0.7236328125, 0.82861328125, 2.380859375, 3.93310546875, 5.4853515625, 7.03759765625, 8.58984375, 10.14208984375, 11.6943359375, 13.24658203125, 14.798828125, 16.35107421875, 17.9033203125, 19.45556640625, 21.0078125, 22.56005859375, 24.1123046875, 25.66455078125, 27.216796875, 28.76904296875, 30.3212890625, 31.87353515625, 33.42578125, 34.97802734375, 36.5302734375, 38.08251953125, 39.634765625, 41.18701171875, 42.7392578125, 44.29150390625, 45.84375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 10.0, 14.0, 15.0, 20.0, 28.0, 31.0, 48.0, 58.0, 58.0, 72.0, 84.0, 80.0, 77.0, 66.0, 70.0, 59.0, 60.0, 39.0, 32.0, 16.0, 21.0, 18.0, 14.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1451416015625, -5.923095703125, -5.7010498046875, -5.47900390625, -5.2569580078125, -5.034912109375, -4.8128662109375, -4.5908203125, -4.3687744140625, -4.146728515625, -3.9246826171875, -3.70263671875, -3.4805908203125, -3.258544921875, -3.0364990234375, -2.814453125, -2.5924072265625, -2.370361328125, -2.1483154296875, -1.92626953125, -1.7042236328125, -1.482177734375, -1.2601318359375, -1.0380859375, -0.8160400390625, -0.593994140625, -0.3719482421875, -0.14990234375, 0.0721435546875, 0.294189453125, 0.5162353515625, 0.73828125, 0.9603271484375, 1.182373046875, 1.4044189453125, 1.62646484375, 1.8485107421875, 2.070556640625, 2.2926025390625, 2.5146484375, 2.7366943359375, 2.958740234375, 3.1807861328125, 3.40283203125, 3.6248779296875, 3.846923828125, 4.0689697265625, 4.291015625, 4.5130615234375, 4.735107421875, 4.9571533203125, 5.17919921875, 5.4012451171875, 5.623291015625, 5.8453369140625, 6.0673828125, 6.2894287109375, 6.511474609375, 6.7335205078125, 6.95556640625, 7.1776123046875, 7.399658203125, 7.6217041015625, 7.84375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 12.0, 16.0, 21.0, 19.0, 38.0, 41.0, 75.0, 92.0, 133.0, 198.0, 348.0, 481.0, 812.0, 1296.0, 2405.0, 4291.0, 8080.0, 17318.0, 41866.0, 128503.0, 806137.0, 2844663.0, 228447.0, 62663.0, 23623.0, 10494.0, 5194.0, 2808.0, 1589.0, 993.0, 564.0, 359.0, 242.0, 130.0, 96.0, 63.0, 56.0, 29.0, 23.0, 11.0, 16.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.953125, -24.201416015625, -23.44970703125, -22.697998046875, -21.9462890625, -21.194580078125, -20.44287109375, -19.691162109375, -18.939453125, -18.187744140625, -17.43603515625, -16.684326171875, -15.9326171875, -15.180908203125, -14.42919921875, -13.677490234375, -12.92578125, -12.174072265625, -11.42236328125, -10.670654296875, -9.9189453125, -9.167236328125, -8.41552734375, -7.663818359375, -6.912109375, -6.160400390625, -5.40869140625, -4.656982421875, -3.9052734375, -3.153564453125, -2.40185546875, -1.650146484375, -0.8984375, -0.146728515625, 0.60498046875, 1.356689453125, 2.1083984375, 2.860107421875, 3.61181640625, 4.363525390625, 5.115234375, 5.866943359375, 6.61865234375, 7.370361328125, 8.1220703125, 8.873779296875, 9.62548828125, 10.377197265625, 11.12890625, 11.880615234375, 12.63232421875, 13.384033203125, 14.1357421875, 14.887451171875, 15.63916015625, 16.390869140625, 17.142578125, 17.894287109375, 18.64599609375, 19.397705078125, 20.1494140625, 20.901123046875, 21.65283203125, 22.404541015625, 23.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 10.0, 12.0, 8.0, 16.0, 14.0, 23.0, 31.0, 35.0, 61.0, 107.0, 192.0, 398.0, 1239.0, 1046.0, 341.0, 198.0, 101.0, 78.0, 45.0, 30.0, 22.0, 16.0, 12.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.59375, -13.2259521484375, -12.858154296875, -12.4903564453125, -12.12255859375, -11.7547607421875, -11.386962890625, -11.0191650390625, -10.6513671875, -10.2835693359375, -9.915771484375, -9.5479736328125, -9.18017578125, -8.8123779296875, -8.444580078125, -8.0767822265625, -7.708984375, -7.3411865234375, -6.973388671875, -6.6055908203125, -6.23779296875, -5.8699951171875, -5.502197265625, -5.1343994140625, -4.7666015625, -4.3988037109375, -4.031005859375, -3.6632080078125, -3.29541015625, -2.9276123046875, -2.559814453125, -2.1920166015625, -1.82421875, -1.4564208984375, -1.088623046875, -0.7208251953125, -0.35302734375, 0.0147705078125, 0.382568359375, 0.7503662109375, 1.1181640625, 1.4859619140625, 1.853759765625, 2.2215576171875, 2.58935546875, 2.9571533203125, 3.324951171875, 3.6927490234375, 4.060546875, 4.4283447265625, 4.796142578125, 5.1639404296875, 5.53173828125, 5.8995361328125, 6.267333984375, 6.6351318359375, 7.0029296875, 7.3707275390625, 7.738525390625, 8.1063232421875, 8.47412109375, 8.8419189453125, 9.209716796875, 9.5775146484375, 9.9453125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 9.0, 15.0, 16.0, 31.0, 51.0, 63.0, 97.0, 117.0, 120.0, 135.0, 93.0, 83.0, 59.0, 44.0, 19.0, 29.0, 7.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.90001678466797, -79.15853118896484, -76.41704559326172, -73.67555236816406, -70.93406677246094, -68.19258117675781, -65.45109558105469, -62.70960998535156, -59.96812057495117, -57.22663497924805, -54.485145568847656, -51.74365997314453, -49.002174377441406, -46.260684967041016, -43.51919937133789, -40.7777099609375, -38.036224365234375, -35.29473876953125, -32.55324935913086, -29.811763763427734, -27.070276260375977, -24.32878875732422, -21.587303161621094, -18.845815658569336, -16.104328155517578, -13.36284065246582, -10.621354103088379, -7.8798675537109375, -5.13838005065918, -2.396892547607422, 0.3445930480957031, 3.086080551147461, 5.827568054199219, 8.569055557250977, 11.310542106628418, 14.05202865600586, 16.793516159057617, 19.535003662109375, 22.2764892578125, 25.017976760864258, 27.759464263916016, 30.500951766967773, 33.24243927001953, 35.983924865722656, 38.72541046142578, 41.46689987182617, 44.2083854675293, 46.94987487792969, 49.69136047363281, 52.43284606933594, 55.17433547973633, 57.91582107543945, 60.657310485839844, 63.39879608154297, 66.1402816772461, 68.88176727294922, 71.62326049804688, 74.36474609375, 77.10623168945312, 79.84771728515625, 82.5892105102539, 85.33069610595703, 88.07218170166016, 90.81366729736328, 93.5551528930664]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 8.0, 23.0, 21.0, 25.0, 17.0, 30.0, 34.0, 33.0, 33.0, 43.0, 53.0, 57.0, 51.0, 62.0, 43.0, 54.0, 46.0, 43.0, 46.0, 41.0, 34.0, 34.0, 20.0, 21.0, 22.0, 16.0, 14.0, 15.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.453407287597656, -39.134368896484375, -37.81532669067383, -36.49628829956055, -35.177249908447266, -33.85820770263672, -32.53916931152344, -31.220130920410156, -29.901090621948242, -28.582050323486328, -27.263011932373047, -25.943971633911133, -24.62493133544922, -23.305892944335938, -21.986852645874023, -20.66781234741211, -19.348773956298828, -18.029733657836914, -16.710695266723633, -15.391654968261719, -14.072615623474121, -12.753576278686523, -11.43453598022461, -10.115496635437012, -8.796457290649414, -7.477417945861816, -6.1583781242370605, -4.839338302612305, -3.520298957824707, -2.2012596130371094, -0.8822197914123535, 0.43682003021240234, 1.755859375, 3.0748989582061768, 4.3939385414123535, 5.712978363037109, 7.032017707824707, 8.351057052612305, 9.670097351074219, 10.989136695861816, 12.308176040649414, 13.627215385437012, 14.94625473022461, 16.265295028686523, 17.584335327148438, 18.90337371826172, 20.222414016723633, 21.541454315185547, 22.860492706298828, 24.179533004760742, 25.498571395874023, 26.817611694335938, 28.13665008544922, 29.455690383911133, 30.774730682373047, 32.09376907348633, 33.412811279296875, 34.731849670410156, 36.0508918762207, 37.369930267333984, 38.688968658447266, 40.00801086425781, 41.327049255371094, 42.646087646484375, 43.965126037597656]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 7.0, 5.0, 11.0, 21.0, 21.0, 35.0, 53.0, 83.0, 129.0, 243.0, 439.0, 854.0, 2059.0, 7410.0, 36752.0, 299200.0, 622431.0, 62044.0, 11588.0, 2895.0, 1060.0, 461.0, 313.0, 174.0, 88.0, 55.0, 39.0, 25.0, 17.0, 11.0, 11.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.71875, -53.0166015625, -51.314453125, -49.6123046875, -47.91015625, -46.2080078125, -44.505859375, -42.8037109375, -41.1015625, -39.3994140625, -37.697265625, -35.9951171875, -34.29296875, -32.5908203125, -30.888671875, -29.1865234375, -27.484375, -25.7822265625, -24.080078125, -22.3779296875, -20.67578125, -18.9736328125, -17.271484375, -15.5693359375, -13.8671875, -12.1650390625, -10.462890625, -8.7607421875, -7.05859375, -5.3564453125, -3.654296875, -1.9521484375, -0.25, 1.4521484375, 3.154296875, 4.8564453125, 6.55859375, 8.2607421875, 9.962890625, 11.6650390625, 13.3671875, 15.0693359375, 16.771484375, 18.4736328125, 20.17578125, 21.8779296875, 23.580078125, 25.2822265625, 26.984375, 28.6865234375, 30.388671875, 32.0908203125, 33.79296875, 35.4951171875, 37.197265625, 38.8994140625, 40.6015625, 42.3037109375, 44.005859375, 45.7080078125, 47.41015625, 49.1123046875, 50.814453125, 52.5166015625, 54.21875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 13.0, 9.0, 32.0, 32.0, 45.0, 31.0, 53.0, 54.0, 66.0, 68.0, 75.0, 68.0, 61.0, 57.0, 67.0, 52.0, 58.0, 30.0, 38.0, 23.0, 13.0, 17.0, 16.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.453125, -6.23175048828125, -6.0103759765625, -5.78900146484375, -5.567626953125, -5.34625244140625, -5.1248779296875, -4.90350341796875, -4.68212890625, -4.46075439453125, -4.2393798828125, -4.01800537109375, -3.796630859375, -3.57525634765625, -3.3538818359375, -3.13250732421875, -2.9111328125, -2.68975830078125, -2.4683837890625, -2.24700927734375, -2.025634765625, -1.80426025390625, -1.5828857421875, -1.36151123046875, -1.14013671875, -0.91876220703125, -0.6973876953125, -0.47601318359375, -0.254638671875, -0.03326416015625, 0.1881103515625, 0.40948486328125, 0.630859375, 0.85223388671875, 1.0736083984375, 1.29498291015625, 1.516357421875, 1.73773193359375, 1.9591064453125, 2.18048095703125, 2.40185546875, 2.62322998046875, 2.8446044921875, 3.06597900390625, 3.287353515625, 3.50872802734375, 3.7301025390625, 3.95147705078125, 4.1728515625, 4.39422607421875, 4.6156005859375, 4.83697509765625, 5.058349609375, 5.27972412109375, 5.5010986328125, 5.72247314453125, 5.94384765625, 6.16522216796875, 6.3865966796875, 6.60797119140625, 6.829345703125, 7.05072021484375, 7.2720947265625, 7.49346923828125, 7.71484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 15.0, 21.0, 23.0, 24.0, 46.0, 91.0, 156.0, 226.0, 455.0, 853.0, 1937.0, 4635.0, 12262.0, 35784.0, 141052.0, 654659.0, 139948.0, 35693.0, 12267.0, 4619.0, 1865.0, 864.0, 429.0, 229.0, 130.0, 81.0, 57.0, 31.0, 15.0, 21.0, 6.0, 10.0, 12.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-27.859375, -26.974853515625, -26.09033203125, -25.205810546875, -24.3212890625, -23.436767578125, -22.55224609375, -21.667724609375, -20.783203125, -19.898681640625, -19.01416015625, -18.129638671875, -17.2451171875, -16.360595703125, -15.47607421875, -14.591552734375, -13.70703125, -12.822509765625, -11.93798828125, -11.053466796875, -10.1689453125, -9.284423828125, -8.39990234375, -7.515380859375, -6.630859375, -5.746337890625, -4.86181640625, -3.977294921875, -3.0927734375, -2.208251953125, -1.32373046875, -0.439208984375, 0.4453125, 1.329833984375, 2.21435546875, 3.098876953125, 3.9833984375, 4.867919921875, 5.75244140625, 6.636962890625, 7.521484375, 8.406005859375, 9.29052734375, 10.175048828125, 11.0595703125, 11.944091796875, 12.82861328125, 13.713134765625, 14.59765625, 15.482177734375, 16.36669921875, 17.251220703125, 18.1357421875, 19.020263671875, 19.90478515625, 20.789306640625, 21.673828125, 22.558349609375, 23.44287109375, 24.327392578125, 25.2119140625, 26.096435546875, 26.98095703125, 27.865478515625, 28.75]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 8.0, 14.0, 17.0, 23.0, 43.0, 42.0, 51.0, 54.0, 61.0, 87.0, 86.0, 69.0, 84.0, 69.0, 50.0, 55.0, 42.0, 37.0, 19.0, 14.0, 20.0, 17.0, 7.0, 8.0, 10.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.140625, -29.181884765625, -28.22314453125, -27.264404296875, -26.3056640625, -25.346923828125, -24.38818359375, -23.429443359375, -22.470703125, -21.511962890625, -20.55322265625, -19.594482421875, -18.6357421875, -17.677001953125, -16.71826171875, -15.759521484375, -14.80078125, -13.842041015625, -12.88330078125, -11.924560546875, -10.9658203125, -10.007080078125, -9.04833984375, -8.089599609375, -7.130859375, -6.172119140625, -5.21337890625, -4.254638671875, -3.2958984375, -2.337158203125, -1.37841796875, -0.419677734375, 0.5390625, 1.497802734375, 2.45654296875, 3.415283203125, 4.3740234375, 5.332763671875, 6.29150390625, 7.250244140625, 8.208984375, 9.167724609375, 10.12646484375, 11.085205078125, 12.0439453125, 13.002685546875, 13.96142578125, 14.920166015625, 15.87890625, 16.837646484375, 17.79638671875, 18.755126953125, 19.7138671875, 20.672607421875, 21.63134765625, 22.590087890625, 23.548828125, 24.507568359375, 25.46630859375, 26.425048828125, 27.3837890625, 28.342529296875, 29.30126953125, 30.260009765625, 31.21875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 14.0, 10.0, 20.0, 20.0, 28.0, 39.0, 75.0, 129.0, 238.0, 503.0, 1056.0, 2567.0, 7512.0, 22328.0, 82802.0, 685063.0, 193280.0, 35062.0, 11045.0, 3885.0, 1424.0, 713.0, 294.0, 150.0, 97.0, 61.0, 35.0, 29.0, 16.0, 21.0, 15.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.12744140625, -10.6767578125, -10.22607421875, -9.775390625, -9.32470703125, -8.8740234375, -8.42333984375, -7.97265625, -7.52197265625, -7.0712890625, -6.62060546875, -6.169921875, -5.71923828125, -5.2685546875, -4.81787109375, -4.3671875, -3.91650390625, -3.4658203125, -3.01513671875, -2.564453125, -2.11376953125, -1.6630859375, -1.21240234375, -0.76171875, -0.31103515625, 0.1396484375, 0.59033203125, 1.041015625, 1.49169921875, 1.9423828125, 2.39306640625, 2.84375, 3.29443359375, 3.7451171875, 4.19580078125, 4.646484375, 5.09716796875, 5.5478515625, 5.99853515625, 6.44921875, 6.89990234375, 7.3505859375, 7.80126953125, 8.251953125, 8.70263671875, 9.1533203125, 9.60400390625, 10.0546875, 10.50537109375, 10.9560546875, 11.40673828125, 11.857421875, 12.30810546875, 12.7587890625, 13.20947265625, 13.66015625, 14.11083984375, 14.5615234375, 15.01220703125, 15.462890625, 15.91357421875, 16.3642578125, 16.81494140625, 17.265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 13.0, 16.0, 22.0, 29.0, 20.0, 52.0, 119.0, 301.0, 213.0, 67.0, 21.0, 11.0, 14.0, 15.0, 8.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002307891845703125, -0.0022275447845458984, -0.002147197723388672, -0.0020668506622314453, -0.0019865036010742188, -0.0019061565399169922, -0.0018258094787597656, -0.001745462417602539, -0.0016651153564453125, -0.001584768295288086, -0.0015044212341308594, -0.0014240741729736328, -0.0013437271118164062, -0.0012633800506591797, -0.0011830329895019531, -0.0011026859283447266, -0.0010223388671875, -0.0009419918060302734, -0.0008616447448730469, -0.0007812976837158203, -0.0007009506225585938, -0.0006206035614013672, -0.0005402565002441406, -0.00045990943908691406, -0.0003795623779296875, -0.00029921531677246094, -0.00021886825561523438, -0.0001385211944580078, -5.817413330078125e-05, 2.2172927856445312e-05, 0.00010251998901367188, 0.00018286705017089844, 0.000263214111328125, 0.00034356117248535156, 0.0004239082336425781, 0.0005042552947998047, 0.0005846023559570312, 0.0006649494171142578, 0.0007452964782714844, 0.0008256435394287109, 0.0009059906005859375, 0.000986337661743164, 0.0010666847229003906, 0.0011470317840576172, 0.0012273788452148438, 0.0013077259063720703, 0.0013880729675292969, 0.0014684200286865234, 0.00154876708984375, 0.0016291141510009766, 0.0017094612121582031, 0.0017898082733154297, 0.0018701553344726562, 0.0019505023956298828, 0.0020308494567871094, 0.002111196517944336, 0.0021915435791015625, 0.002271890640258789, 0.0023522377014160156, 0.002432584762573242, 0.0025129318237304688, 0.0025932788848876953, 0.002673625946044922, 0.0027539730072021484, 0.002834320068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 21.0, 25.0, 30.0, 48.0, 54.0, 80.0, 139.0, 174.0, 332.0, 661.0, 1499.0, 4452.0, 15395.0, 56150.0, 615770.0, 298360.0, 38462.0, 10912.0, 3438.0, 1184.0, 557.0, 300.0, 163.0, 113.0, 60.0, 49.0, 32.0, 20.0, 16.0, 10.0, 13.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.484375, -14.982666015625, -14.48095703125, -13.979248046875, -13.4775390625, -12.975830078125, -12.47412109375, -11.972412109375, -11.470703125, -10.968994140625, -10.46728515625, -9.965576171875, -9.4638671875, -8.962158203125, -8.46044921875, -7.958740234375, -7.45703125, -6.955322265625, -6.45361328125, -5.951904296875, -5.4501953125, -4.948486328125, -4.44677734375, -3.945068359375, -3.443359375, -2.941650390625, -2.43994140625, -1.938232421875, -1.4365234375, -0.934814453125, -0.43310546875, 0.068603515625, 0.5703125, 1.072021484375, 1.57373046875, 2.075439453125, 2.5771484375, 3.078857421875, 3.58056640625, 4.082275390625, 4.583984375, 5.085693359375, 5.58740234375, 6.089111328125, 6.5908203125, 7.092529296875, 7.59423828125, 8.095947265625, 8.59765625, 9.099365234375, 9.60107421875, 10.102783203125, 10.6044921875, 11.106201171875, 11.60791015625, 12.109619140625, 12.611328125, 13.113037109375, 13.61474609375, 14.116455078125, 14.6181640625, 15.119873046875, 15.62158203125, 16.123291015625, 16.625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 10.0, 9.0, 11.0, 15.0, 13.0, 17.0, 26.0, 50.0, 105.0, 186.0, 171.0, 119.0, 82.0, 54.0, 25.0, 24.0, 12.0, 13.0, 13.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.28125, -10.9346923828125, -10.588134765625, -10.2415771484375, -9.89501953125, -9.5484619140625, -9.201904296875, -8.8553466796875, -8.5087890625, -8.1622314453125, -7.815673828125, -7.4691162109375, -7.12255859375, -6.7760009765625, -6.429443359375, -6.0828857421875, -5.736328125, -5.3897705078125, -5.043212890625, -4.6966552734375, -4.35009765625, -4.0035400390625, -3.656982421875, -3.3104248046875, -2.9638671875, -2.6173095703125, -2.270751953125, -1.9241943359375, -1.57763671875, -1.2310791015625, -0.884521484375, -0.5379638671875, -0.19140625, 0.1551513671875, 0.501708984375, 0.8482666015625, 1.19482421875, 1.5413818359375, 1.887939453125, 2.2344970703125, 2.5810546875, 2.9276123046875, 3.274169921875, 3.6207275390625, 3.96728515625, 4.3138427734375, 4.660400390625, 5.0069580078125, 5.353515625, 5.7000732421875, 6.046630859375, 6.3931884765625, 6.73974609375, 7.0863037109375, 7.432861328125, 7.7794189453125, 8.1259765625, 8.4725341796875, 8.819091796875, 9.1656494140625, 9.51220703125, 9.8587646484375, 10.205322265625, 10.5518798828125, 10.8984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 16.0, 34.0, 44.0, 83.0, 111.0, 133.0, 147.0, 145.0, 129.0, 76.0, 38.0, 20.0, 10.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.25495910644531, -88.2148208618164, -82.17469024658203, -76.13455200195312, -70.09442138671875, -64.05428314208984, -58.01414489746094, -51.9740104675293, -45.933876037597656, -39.893741607666016, -33.853607177734375, -27.81346893310547, -21.773334503173828, -15.733200073242188, -9.693061828613281, -3.6529273986816406, 2.38720703125, 8.427342414855957, 14.467477798461914, 20.507614135742188, 26.547748565673828, 32.58788299560547, 38.628021240234375, 44.668155670166016, 50.708290100097656, 56.7484245300293, 62.78855895996094, 68.82869720458984, 74.86883544921875, 80.90896606445312, 86.94910430908203, 92.98924255371094, 99.02938842773438, 105.06952667236328, 111.10965728759766, 117.14979553222656, 123.18992614746094, 129.23007202148438, 135.27020263671875, 141.31033325195312, 147.3504638671875, 153.39059448242188, 159.4307403564453, 165.4708709716797, 171.51100158691406, 177.5511474609375, 183.59127807617188, 189.63140869140625, 195.6715545654297, 201.71168518066406, 207.7518310546875, 213.79196166992188, 219.83209228515625, 225.87222290039062, 231.91236877441406, 237.95249938964844, 243.99264526367188, 250.03277587890625, 256.0729064941406, 262.113037109375, 268.1531982421875, 274.1933288574219, 280.23345947265625, 286.2735900878906, 292.313720703125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 1.0, 8.0, 10.0, 8.0, 13.0, 11.0, 14.0, 21.0, 25.0, 18.0, 25.0, 24.0, 34.0, 31.0, 26.0, 37.0, 42.0, 45.0, 37.0, 46.0, 27.0, 44.0, 40.0, 41.0, 39.0, 33.0, 37.0, 31.0, 23.0, 29.0, 23.0, 24.0, 18.0, 16.0, 17.0, 16.0, 15.0, 16.0, 9.0, 7.0, 3.0, 8.0, 6.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.92535400390625, -67.42276000976562, -64.920166015625, -62.41757583618164, -59.91498565673828, -57.412391662597656, -54.90979766845703, -52.407203674316406, -49.90461349487305, -47.40201950073242, -44.89942932128906, -42.39683532714844, -39.89424133300781, -37.39165115356445, -34.88905715942383, -32.38646697998047, -29.883872985839844, -27.38128089904785, -24.87868881225586, -22.376094818115234, -19.873502731323242, -17.37091064453125, -14.868317604064941, -12.365724563598633, -9.86313247680664, -7.36053991317749, -4.85794734954834, -2.3553547859191895, 0.14723777770996094, 2.649829864501953, 5.152422904968262, 7.65501594543457, 10.157608032226562, 12.660200119018555, 15.162793159484863, 17.665386199951172, 20.167978286743164, 22.670570373535156, 25.17316436767578, 27.675756454467773, 30.178348541259766, 32.68094253540039, 35.18353271484375, 37.686126708984375, 40.188720703125, 42.69131088256836, 45.193904876708984, 47.696495056152344, 50.19908905029297, 52.701683044433594, 55.20427322387695, 57.70686721801758, 60.20945739746094, 62.71205139160156, 65.21464538574219, 67.71723937988281, 70.21983337402344, 72.72242736816406, 75.22502136230469, 77.72760772705078, 80.2302017211914, 82.73279571533203, 85.23538970947266, 87.73798370361328, 90.24057006835938]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 6.0, 13.0, 20.0, 19.0, 20.0, 38.0, 58.0, 72.0, 87.0, 134.0, 193.0, 289.0, 443.0, 753.0, 1471.0, 3081.0, 7278.0, 20886.0, 78184.0, 2598929.0, 1373696.0, 74863.0, 20074.0, 7047.0, 3170.0, 1446.0, 809.0, 407.0, 247.0, 171.0, 108.0, 74.0, 54.0, 36.0, 27.0, 16.0, 11.0, 12.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.3125, -58.48388671875, -56.6552734375, -54.82666015625, -52.998046875, -51.16943359375, -49.3408203125, -47.51220703125, -45.68359375, -43.85498046875, -42.0263671875, -40.19775390625, -38.369140625, -36.54052734375, -34.7119140625, -32.88330078125, -31.0546875, -29.22607421875, -27.3974609375, -25.56884765625, -23.740234375, -21.91162109375, -20.0830078125, -18.25439453125, -16.42578125, -14.59716796875, -12.7685546875, -10.93994140625, -9.111328125, -7.28271484375, -5.4541015625, -3.62548828125, -1.796875, 0.03173828125, 1.8603515625, 3.68896484375, 5.517578125, 7.34619140625, 9.1748046875, 11.00341796875, 12.83203125, 14.66064453125, 16.4892578125, 18.31787109375, 20.146484375, 21.97509765625, 23.8037109375, 25.63232421875, 27.4609375, 29.28955078125, 31.1181640625, 32.94677734375, 34.775390625, 36.60400390625, 38.4326171875, 40.26123046875, 42.08984375, 43.91845703125, 45.7470703125, 47.57568359375, 49.404296875, 51.23291015625, 53.0615234375, 54.89013671875, 56.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 16.0, 12.0, 25.0, 25.0, 30.0, 40.0, 45.0, 50.0, 56.0, 61.0, 65.0, 65.0, 65.0, 67.0, 62.0, 53.0, 58.0, 43.0, 38.0, 21.0, 27.0, 15.0, 18.0, 10.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.30078125, -6.08184814453125, -5.8629150390625, -5.64398193359375, -5.425048828125, -5.20611572265625, -4.9871826171875, -4.76824951171875, -4.54931640625, -4.33038330078125, -4.1114501953125, -3.89251708984375, -3.673583984375, -3.45465087890625, -3.2357177734375, -3.01678466796875, -2.7978515625, -2.57891845703125, -2.3599853515625, -2.14105224609375, -1.922119140625, -1.70318603515625, -1.4842529296875, -1.26531982421875, -1.04638671875, -0.82745361328125, -0.6085205078125, -0.38958740234375, -0.170654296875, 0.04827880859375, 0.2672119140625, 0.48614501953125, 0.705078125, 0.92401123046875, 1.1429443359375, 1.36187744140625, 1.580810546875, 1.79974365234375, 2.0186767578125, 2.23760986328125, 2.45654296875, 2.67547607421875, 2.8944091796875, 3.11334228515625, 3.332275390625, 3.55120849609375, 3.7701416015625, 3.98907470703125, 4.2080078125, 4.42694091796875, 4.6458740234375, 4.86480712890625, 5.083740234375, 5.30267333984375, 5.5216064453125, 5.74053955078125, 5.95947265625, 6.17840576171875, 6.3973388671875, 6.61627197265625, 6.835205078125, 7.05413818359375, 7.2730712890625, 7.49200439453125, 7.7109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 4.0, 5.0, 4.0, 12.0, 13.0, 18.0, 20.0, 44.0, 50.0, 55.0, 87.0, 112.0, 172.0, 233.0, 341.0, 510.0, 861.0, 1468.0, 2629.0, 5180.0, 10668.0, 24235.0, 64335.0, 235996.0, 3121609.0, 553227.0, 106104.0, 36108.0, 14812.0, 6986.0, 3586.0, 1841.0, 1072.0, 610.0, 423.0, 243.0, 174.0, 120.0, 78.0, 51.0, 47.0, 39.0, 21.0, 17.0, 11.0, 14.0, 10.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.328125, -29.401123046875, -28.47412109375, -27.547119140625, -26.6201171875, -25.693115234375, -24.76611328125, -23.839111328125, -22.912109375, -21.985107421875, -21.05810546875, -20.131103515625, -19.2041015625, -18.277099609375, -17.35009765625, -16.423095703125, -15.49609375, -14.569091796875, -13.64208984375, -12.715087890625, -11.7880859375, -10.861083984375, -9.93408203125, -9.007080078125, -8.080078125, -7.153076171875, -6.22607421875, -5.299072265625, -4.3720703125, -3.445068359375, -2.51806640625, -1.591064453125, -0.6640625, 0.262939453125, 1.18994140625, 2.116943359375, 3.0439453125, 3.970947265625, 4.89794921875, 5.824951171875, 6.751953125, 7.678955078125, 8.60595703125, 9.532958984375, 10.4599609375, 11.386962890625, 12.31396484375, 13.240966796875, 14.16796875, 15.094970703125, 16.02197265625, 16.948974609375, 17.8759765625, 18.802978515625, 19.72998046875, 20.656982421875, 21.583984375, 22.510986328125, 23.43798828125, 24.364990234375, 25.2919921875, 26.218994140625, 27.14599609375, 28.072998046875, 29.0]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 9.0, 16.0, 22.0, 47.0, 45.0, 83.0, 157.0, 316.0, 1723.0, 982.0, 282.0, 145.0, 66.0, 42.0, 34.0, 21.0, 17.0, 10.0, 5.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.34375, -21.79736328125, -21.2509765625, -20.70458984375, -20.158203125, -19.61181640625, -19.0654296875, -18.51904296875, -17.97265625, -17.42626953125, -16.8798828125, -16.33349609375, -15.787109375, -15.24072265625, -14.6943359375, -14.14794921875, -13.6015625, -13.05517578125, -12.5087890625, -11.96240234375, -11.416015625, -10.86962890625, -10.3232421875, -9.77685546875, -9.23046875, -8.68408203125, -8.1376953125, -7.59130859375, -7.044921875, -6.49853515625, -5.9521484375, -5.40576171875, -4.859375, -4.31298828125, -3.7666015625, -3.22021484375, -2.673828125, -2.12744140625, -1.5810546875, -1.03466796875, -0.48828125, 0.05810546875, 0.6044921875, 1.15087890625, 1.697265625, 2.24365234375, 2.7900390625, 3.33642578125, 3.8828125, 4.42919921875, 4.9755859375, 5.52197265625, 6.068359375, 6.61474609375, 7.1611328125, 7.70751953125, 8.25390625, 8.80029296875, 9.3466796875, 9.89306640625, 10.439453125, 10.98583984375, 11.5322265625, 12.07861328125, 12.625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 14.0, 46.0, 75.0, 153.0, 196.0, 241.0, 143.0, 71.0, 37.0, 14.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-230.5846405029297, -225.5850830078125, -220.58551025390625, -215.58595275878906, -210.58639526367188, -205.58682250976562, -200.58726501464844, -195.58770751953125, -190.588134765625, -185.5885772705078, -180.58900451660156, -175.58944702148438, -170.5898895263672, -165.59031677246094, -160.59075927734375, -155.5911865234375, -150.59164428710938, -145.5920867919922, -140.59251403808594, -135.59295654296875, -130.59339904785156, -125.59382629394531, -120.59426879882812, -115.5947036743164, -110.59513854980469, -105.59557342529297, -100.59601593017578, -95.59645080566406, -90.59688568115234, -85.59732055664062, -80.59776306152344, -75.59819793701172, -70.59862518310547, -65.59906005859375, -60.5994987487793, -55.599937438964844, -50.600372314453125, -45.60081100463867, -40.60124969482422, -35.6016845703125, -30.602123260498047, -25.60256004333496, -20.602996826171875, -15.603435516357422, -10.603872299194336, -5.60430908203125, -0.6047477722167969, 4.394817352294922, 9.394378662109375, 14.393941879272461, 19.393505096435547, 24.39306640625, 29.392629623413086, 34.39219284057617, 39.391754150390625, 44.391319274902344, 49.3908805847168, 54.39044189453125, 59.39000701904297, 64.38957214355469, 69.38912963867188, 74.3886947631836, 79.38825988769531, 84.3878173828125, 89.38738250732422]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 5.0, 12.0, 19.0, 23.0, 26.0, 37.0, 35.0, 37.0, 40.0, 37.0, 47.0, 56.0, 42.0, 57.0, 59.0, 71.0, 49.0, 45.0, 43.0, 41.0, 32.0, 42.0, 34.0, 24.0, 21.0, 15.0, 11.0, 9.0, 7.0, 7.0, 2.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.89250564575195, -50.052852630615234, -48.213199615478516, -46.37354278564453, -44.53388977050781, -42.694236755371094, -40.854583740234375, -39.014930725097656, -37.17527770996094, -35.33562469482422, -33.4959716796875, -31.65631675720215, -29.816661834716797, -27.977008819580078, -26.13735580444336, -24.29770278930664, -22.458045959472656, -20.618392944335938, -18.778738021850586, -16.939085006713867, -15.099431037902832, -13.259777069091797, -11.420124053955078, -9.580470085144043, -7.740816116333008, -5.901162147521973, -4.061508655548096, -2.2218551635742188, -0.3822011947631836, 1.4574527740478516, 3.2971057891845703, 5.1367597579956055, 6.976417541503906, 8.816071510314941, 10.655725479125977, 12.495378494262695, 14.33503246307373, 16.174686431884766, 18.014339447021484, 19.853992462158203, 21.693647384643555, 23.533300399780273, 25.372955322265625, 27.212608337402344, 29.052261352539062, 30.891916275024414, 32.7315673828125, 34.571224212646484, 36.4108772277832, 38.25053024291992, 40.09018325805664, 41.929840087890625, 43.769493103027344, 45.60914611816406, 47.44879913330078, 49.2884521484375, 51.12810516357422, 52.96775817871094, 54.807411193847656, 56.647064208984375, 58.48672103881836, 60.32637405395508, 62.1660270690918, 64.00568389892578, 65.8453369140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 17.0, 26.0, 39.0, 60.0, 90.0, 139.0, 219.0, 388.0, 697.0, 1468.0, 3676.0, 11004.0, 41872.0, 175244.0, 570900.0, 181550.0, 42741.0, 11454.0, 3754.0, 1504.0, 694.0, 382.0, 212.0, 144.0, 92.0, 58.0, 37.0, 27.0, 18.0, 15.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.25, -40.9091796875, -39.568359375, -38.2275390625, -36.88671875, -35.5458984375, -34.205078125, -32.8642578125, -31.5234375, -30.1826171875, -28.841796875, -27.5009765625, -26.16015625, -24.8193359375, -23.478515625, -22.1376953125, -20.796875, -19.4560546875, -18.115234375, -16.7744140625, -15.43359375, -14.0927734375, -12.751953125, -11.4111328125, -10.0703125, -8.7294921875, -7.388671875, -6.0478515625, -4.70703125, -3.3662109375, -2.025390625, -0.6845703125, 0.65625, 1.9970703125, 3.337890625, 4.6787109375, 6.01953125, 7.3603515625, 8.701171875, 10.0419921875, 11.3828125, 12.7236328125, 14.064453125, 15.4052734375, 16.74609375, 18.0869140625, 19.427734375, 20.7685546875, 22.109375, 23.4501953125, 24.791015625, 26.1318359375, 27.47265625, 28.8134765625, 30.154296875, 31.4951171875, 32.8359375, 34.1767578125, 35.517578125, 36.8583984375, 38.19921875, 39.5400390625, 40.880859375, 42.2216796875, 43.5625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 11.0, 15.0, 28.0, 31.0, 34.0, 40.0, 50.0, 46.0, 47.0, 51.0, 57.0, 71.0, 53.0, 66.0, 62.0, 62.0, 43.0, 49.0, 36.0, 41.0, 26.0, 18.0, 20.0, 10.0, 6.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8125, -6.578125, -6.34375, -6.109375, -5.875, -5.640625, -5.40625, -5.171875, -4.9375, -4.703125, -4.46875, -4.234375, -4.0, -3.765625, -3.53125, -3.296875, -3.0625, -2.828125, -2.59375, -2.359375, -2.125, -1.890625, -1.65625, -1.421875, -1.1875, -0.953125, -0.71875, -0.484375, -0.25, -0.015625, 0.21875, 0.453125, 0.6875, 0.921875, 1.15625, 1.390625, 1.625, 1.859375, 2.09375, 2.328125, 2.5625, 2.796875, 3.03125, 3.265625, 3.5, 3.734375, 3.96875, 4.203125, 4.4375, 4.671875, 4.90625, 5.140625, 5.375, 5.609375, 5.84375, 6.078125, 6.3125, 6.546875, 6.78125, 7.015625, 7.25, 7.484375, 7.71875, 7.953125, 8.1875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 7.0, 5.0, 16.0, 13.0, 18.0, 27.0, 29.0, 68.0, 81.0, 122.0, 143.0, 217.0, 309.0, 440.0, 750.0, 1407.0, 2930.0, 7551.0, 23520.0, 81335.0, 331784.0, 443985.0, 105917.0, 30546.0, 9769.0, 3513.0, 1612.0, 806.0, 498.0, 313.0, 228.0, 160.0, 139.0, 73.0, 74.0, 39.0, 40.0, 26.0, 14.0, 11.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.6171875, -21.8125, -21.0078125, -20.203125, -19.3984375, -18.59375, -17.7890625, -16.984375, -16.1796875, -15.375, -14.5703125, -13.765625, -12.9609375, -12.15625, -11.3515625, -10.546875, -9.7421875, -8.9375, -8.1328125, -7.328125, -6.5234375, -5.71875, -4.9140625, -4.109375, -3.3046875, -2.5, -1.6953125, -0.890625, -0.0859375, 0.71875, 1.5234375, 2.328125, 3.1328125, 3.9375, 4.7421875, 5.546875, 6.3515625, 7.15625, 7.9609375, 8.765625, 9.5703125, 10.375, 11.1796875, 11.984375, 12.7890625, 13.59375, 14.3984375, 15.203125, 16.0078125, 16.8125, 17.6171875, 18.421875, 19.2265625, 20.03125, 20.8359375, 21.640625, 22.4453125, 23.25, 24.0546875, 24.859375, 25.6640625, 26.46875, 27.2734375, 28.078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 10.0, 4.0, 7.0, 15.0, 8.0, 14.0, 20.0, 18.0, 26.0, 27.0, 25.0, 37.0, 33.0, 32.0, 30.0, 40.0, 43.0, 38.0, 48.0, 61.0, 50.0, 46.0, 40.0, 49.0, 38.0, 33.0, 24.0, 26.0, 23.0, 28.0, 16.0, 24.0, 18.0, 5.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.640625, -20.98828125, -20.3359375, -19.68359375, -19.03125, -18.37890625, -17.7265625, -17.07421875, -16.421875, -15.76953125, -15.1171875, -14.46484375, -13.8125, -13.16015625, -12.5078125, -11.85546875, -11.203125, -10.55078125, -9.8984375, -9.24609375, -8.59375, -7.94140625, -7.2890625, -6.63671875, -5.984375, -5.33203125, -4.6796875, -4.02734375, -3.375, -2.72265625, -2.0703125, -1.41796875, -0.765625, -0.11328125, 0.5390625, 1.19140625, 1.84375, 2.49609375, 3.1484375, 3.80078125, 4.453125, 5.10546875, 5.7578125, 6.41015625, 7.0625, 7.71484375, 8.3671875, 9.01953125, 9.671875, 10.32421875, 10.9765625, 11.62890625, 12.28125, 12.93359375, 13.5859375, 14.23828125, 14.890625, 15.54296875, 16.1953125, 16.84765625, 17.5, 18.15234375, 18.8046875, 19.45703125, 20.109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 14.0, 7.0, 21.0, 24.0, 41.0, 49.0, 92.0, 120.0, 233.0, 408.0, 665.0, 1271.0, 2684.0, 6003.0, 15796.0, 46962.0, 162076.0, 521630.0, 201526.0, 56899.0, 18840.0, 7015.0, 2951.0, 1426.0, 741.0, 430.0, 240.0, 145.0, 93.0, 55.0, 32.0, 20.0, 18.0, 10.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.7529296875, -8.435546875, -8.1181640625, -7.80078125, -7.4833984375, -7.166015625, -6.8486328125, -6.53125, -6.2138671875, -5.896484375, -5.5791015625, -5.26171875, -4.9443359375, -4.626953125, -4.3095703125, -3.9921875, -3.6748046875, -3.357421875, -3.0400390625, -2.72265625, -2.4052734375, -2.087890625, -1.7705078125, -1.453125, -1.1357421875, -0.818359375, -0.5009765625, -0.18359375, 0.1337890625, 0.451171875, 0.7685546875, 1.0859375, 1.4033203125, 1.720703125, 2.0380859375, 2.35546875, 2.6728515625, 2.990234375, 3.3076171875, 3.625, 3.9423828125, 4.259765625, 4.5771484375, 4.89453125, 5.2119140625, 5.529296875, 5.8466796875, 6.1640625, 6.4814453125, 6.798828125, 7.1162109375, 7.43359375, 7.7509765625, 8.068359375, 8.3857421875, 8.703125, 9.0205078125, 9.337890625, 9.6552734375, 9.97265625, 10.2900390625, 10.607421875, 10.9248046875, 11.2421875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 10.0, 10.0, 6.0, 19.0, 14.0, 15.0, 30.0, 40.0, 35.0, 49.0, 92.0, 140.0, 168.0, 100.0, 48.0, 38.0, 29.0, 28.0, 26.0, 17.0, 16.0, 10.0, 8.0, 4.0, 8.0, 10.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018281936645507812, -0.0017672628164291382, -0.0017063319683074951, -0.001645401120185852, -0.001584470272064209, -0.001523539423942566, -0.0014626085758209229, -0.0014016777276992798, -0.0013407468795776367, -0.0012798160314559937, -0.0012188851833343506, -0.0011579543352127075, -0.0010970234870910645, -0.0010360926389694214, -0.0009751617908477783, -0.0009142309427261353, -0.0008533000946044922, -0.0007923692464828491, -0.0007314383983612061, -0.000670507550239563, -0.0006095767021179199, -0.0005486458539962769, -0.0004877150058746338, -0.0004267841577529907, -0.00036585330963134766, -0.0003049224615097046, -0.00024399161338806152, -0.00018306076526641846, -0.0001221299171447754, -6.119906902313232e-05, -2.682209014892578e-07, 6.066262722015381e-05, 0.00012159347534179688, 0.00018252432346343994, 0.000243455171585083, 0.0003043860197067261, 0.00036531686782836914, 0.0004262477159500122, 0.0004871785640716553, 0.0005481094121932983, 0.0006090402603149414, 0.0006699711084365845, 0.0007309019565582275, 0.0007918328046798706, 0.0008527636528015137, 0.0009136945009231567, 0.0009746253490447998, 0.0010355561971664429, 0.001096487045288086, 0.001157417893409729, 0.001218348741531372, 0.0012792795896530151, 0.0013402104377746582, 0.0014011412858963013, 0.0014620721340179443, 0.0015230029821395874, 0.0015839338302612305, 0.0016448646783828735, 0.0017057955265045166, 0.0017667263746261597, 0.0018276572227478027, 0.0018885880708694458, 0.0019495189189910889, 0.002010449767112732, 0.002071380615234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 12.0, 16.0, 26.0, 35.0, 58.0, 122.0, 246.0, 583.0, 1631.0, 5149.0, 25797.0, 306857.0, 642657.0, 53339.0, 8197.0, 2286.0, 809.0, 358.0, 151.0, 78.0, 55.0, 25.0, 24.0, 9.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.70654296875, -26.0068359375, -25.30712890625, -24.607421875, -23.90771484375, -23.2080078125, -22.50830078125, -21.80859375, -21.10888671875, -20.4091796875, -19.70947265625, -19.009765625, -18.31005859375, -17.6103515625, -16.91064453125, -16.2109375, -15.51123046875, -14.8115234375, -14.11181640625, -13.412109375, -12.71240234375, -12.0126953125, -11.31298828125, -10.61328125, -9.91357421875, -9.2138671875, -8.51416015625, -7.814453125, -7.11474609375, -6.4150390625, -5.71533203125, -5.015625, -4.31591796875, -3.6162109375, -2.91650390625, -2.216796875, -1.51708984375, -0.8173828125, -0.11767578125, 0.58203125, 1.28173828125, 1.9814453125, 2.68115234375, 3.380859375, 4.08056640625, 4.7802734375, 5.47998046875, 6.1796875, 6.87939453125, 7.5791015625, 8.27880859375, 8.978515625, 9.67822265625, 10.3779296875, 11.07763671875, 11.77734375, 12.47705078125, 13.1767578125, 13.87646484375, 14.576171875, 15.27587890625, 15.9755859375, 16.67529296875, 17.375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 6.0, 21.0, 13.0, 22.0, 24.0, 51.0, 79.0, 112.0, 119.0, 142.0, 139.0, 80.0, 56.0, 41.0, 31.0, 15.0, 12.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.3773193359375, -18.895263671875, -18.4132080078125, -17.93115234375, -17.4490966796875, -16.967041015625, -16.4849853515625, -16.0029296875, -15.5208740234375, -15.038818359375, -14.5567626953125, -14.07470703125, -13.5926513671875, -13.110595703125, -12.6285400390625, -12.146484375, -11.6644287109375, -11.182373046875, -10.7003173828125, -10.21826171875, -9.7362060546875, -9.254150390625, -8.7720947265625, -8.2900390625, -7.8079833984375, -7.325927734375, -6.8438720703125, -6.36181640625, -5.8797607421875, -5.397705078125, -4.9156494140625, -4.43359375, -3.9515380859375, -3.469482421875, -2.9874267578125, -2.50537109375, -2.0233154296875, -1.541259765625, -1.0592041015625, -0.5771484375, -0.0950927734375, 0.386962890625, 0.8690185546875, 1.35107421875, 1.8331298828125, 2.315185546875, 2.7972412109375, 3.279296875, 3.7613525390625, 4.243408203125, 4.7254638671875, 5.20751953125, 5.6895751953125, 6.171630859375, 6.6536865234375, 7.1357421875, 7.6177978515625, 8.099853515625, 8.5819091796875, 9.06396484375, 9.5460205078125, 10.028076171875, 10.5101318359375, 10.9921875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 19.0, 99.0, 272.0, 385.0, 185.0, 50.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.3323974609375, -154.78855895996094, -136.24472045898438, -117.70086669921875, -99.15702819824219, -80.61318969726562, -62.06934356689453, -43.52549743652344, -24.981658935546875, -6.437816619873047, 12.106025695800781, 30.64986801147461, 49.19371032714844, 67.737548828125, 86.2813949584961, 104.82524108886719, 123.36907958984375, 141.9129180908203, 160.45675659179688, 179.0006103515625, 197.54444885253906, 216.08828735351562, 234.63214111328125, 253.1759796142578, 271.7198181152344, 290.263671875, 308.8074951171875, 327.3513488769531, 345.89520263671875, 364.43902587890625, 382.9828796386719, 401.5267333984375, 420.07049560546875, 438.6143493652344, 457.1581726074219, 475.7020263671875, 494.245849609375, 512.7896728515625, 531.3335571289062, 549.8773803710938, 568.4212646484375, 586.965087890625, 605.5089721679688, 624.0527954101562, 642.5966186523438, 661.1405029296875, 679.684326171875, 698.2281494140625, 716.77197265625, 735.3157958984375, 753.8596801757812, 772.4035034179688, 790.9473266601562, 809.4912109375, 828.0350341796875, 846.578857421875, 865.1226806640625, 883.66650390625, 902.2103881835938, 920.7542114257812, 939.2980346679688, 957.8419189453125, 976.3857421875, 994.9295654296875, 1013.4734497070312]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 10.0, 7.0, 12.0, 10.0, 16.0, 20.0, 28.0, 26.0, 22.0, 25.0, 46.0, 37.0, 42.0, 40.0, 43.0, 42.0, 41.0, 50.0, 40.0, 47.0, 41.0, 38.0, 47.0, 42.0, 33.0, 30.0, 28.0, 18.0, 12.0, 20.0, 17.0, 13.0, 19.0, 9.0, 5.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.46636962890625, -107.0630111694336, -103.65966033935547, -100.25630187988281, -96.85295104980469, -93.44959259033203, -90.0462417602539, -86.64288330078125, -83.23953247070312, -79.83617401123047, -76.43282318115234, -73.02946472167969, -69.62611389160156, -66.2227554321289, -62.81940460205078, -59.416046142578125, -56.012691497802734, -52.609336853027344, -49.20598220825195, -45.80262756347656, -42.39927291870117, -38.99591827392578, -35.592559814453125, -32.189208984375, -28.785852432250977, -25.382497787475586, -21.979143142700195, -18.575786590576172, -15.172432899475098, -11.76907730102539, -8.36572265625, -4.962368011474609, -1.5590133666992188, 1.844341516494751, 5.247696399688721, 8.65105152130127, 12.05440616607666, 15.457761764526367, 18.861116409301758, 22.26447105407715, 25.66782569885254, 29.07118034362793, 32.47453689575195, 35.877891540527344, 39.281246185302734, 42.684600830078125, 46.087955474853516, 49.491310119628906, 52.8946647644043, 56.29801940917969, 59.70137405395508, 63.10472869873047, 66.50808715820312, 69.91143798828125, 73.3147964477539, 76.71814727783203, 80.12150573730469, 83.52486419677734, 86.92821502685547, 90.33157348632812, 93.73492431640625, 97.1382827758789, 100.54163360595703, 103.94499206542969, 107.34834289550781]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 16.0, 22.0, 26.0, 47.0, 40.0, 63.0, 99.0, 113.0, 226.0, 283.0, 489.0, 873.0, 1705.0, 3690.0, 9825.0, 31905.0, 156006.0, 3355582.0, 536644.0, 67453.0, 17510.0, 6224.0, 2539.0, 1254.0, 625.0, 357.0, 234.0, 140.0, 91.0, 46.0, 43.0, 29.0, 19.0, 8.0, 8.0, 7.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-61.3125, -59.64453125, -57.9765625, -56.30859375, -54.640625, -52.97265625, -51.3046875, -49.63671875, -47.96875, -46.30078125, -44.6328125, -42.96484375, -41.296875, -39.62890625, -37.9609375, -36.29296875, -34.625, -32.95703125, -31.2890625, -29.62109375, -27.953125, -26.28515625, -24.6171875, -22.94921875, -21.28125, -19.61328125, -17.9453125, -16.27734375, -14.609375, -12.94140625, -11.2734375, -9.60546875, -7.9375, -6.26953125, -4.6015625, -2.93359375, -1.265625, 0.40234375, 2.0703125, 3.73828125, 5.40625, 7.07421875, 8.7421875, 10.41015625, 12.078125, 13.74609375, 15.4140625, 17.08203125, 18.75, 20.41796875, 22.0859375, 23.75390625, 25.421875, 27.08984375, 28.7578125, 30.42578125, 32.09375, 33.76171875, 35.4296875, 37.09765625, 38.765625, 40.43359375, 42.1015625, 43.76953125, 45.4375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 9.0, 14.0, 16.0, 21.0, 23.0, 34.0, 43.0, 45.0, 51.0, 62.0, 46.0, 50.0, 60.0, 57.0, 66.0, 53.0, 77.0, 51.0, 48.0, 39.0, 30.0, 26.0, 26.0, 11.0, 10.0, 10.0, 3.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.67578125, -6.44586181640625, -6.2159423828125, -5.98602294921875, -5.756103515625, -5.52618408203125, -5.2962646484375, -5.06634521484375, -4.83642578125, -4.60650634765625, -4.3765869140625, -4.14666748046875, -3.916748046875, -3.68682861328125, -3.4569091796875, -3.22698974609375, -2.9970703125, -2.76715087890625, -2.5372314453125, -2.30731201171875, -2.077392578125, -1.84747314453125, -1.6175537109375, -1.38763427734375, -1.15771484375, -0.92779541015625, -0.6978759765625, -0.46795654296875, -0.238037109375, -0.00811767578125, 0.2218017578125, 0.45172119140625, 0.681640625, 0.91156005859375, 1.1414794921875, 1.37139892578125, 1.601318359375, 1.83123779296875, 2.0611572265625, 2.29107666015625, 2.52099609375, 2.75091552734375, 2.9808349609375, 3.21075439453125, 3.440673828125, 3.67059326171875, 3.9005126953125, 4.13043212890625, 4.3603515625, 4.59027099609375, 4.8201904296875, 5.05010986328125, 5.280029296875, 5.50994873046875, 5.7398681640625, 5.96978759765625, 6.19970703125, 6.42962646484375, 6.6595458984375, 6.88946533203125, 7.119384765625, 7.34930419921875, 7.5792236328125, 7.80914306640625, 8.0390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 7.0, 9.0, 14.0, 17.0, 30.0, 53.0, 59.0, 103.0, 145.0, 240.0, 331.0, 563.0, 1081.0, 2342.0, 5838.0, 18982.0, 84261.0, 629513.0, 3169822.0, 221557.0, 41242.0, 10627.0, 3719.0, 1598.0, 789.0, 504.0, 278.0, 184.0, 109.0, 77.0, 64.0, 25.0, 35.0, 19.0, 13.0, 7.0, 14.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-43.375, -42.109375, -40.84375, -39.578125, -38.3125, -37.046875, -35.78125, -34.515625, -33.25, -31.984375, -30.71875, -29.453125, -28.1875, -26.921875, -25.65625, -24.390625, -23.125, -21.859375, -20.59375, -19.328125, -18.0625, -16.796875, -15.53125, -14.265625, -13.0, -11.734375, -10.46875, -9.203125, -7.9375, -6.671875, -5.40625, -4.140625, -2.875, -1.609375, -0.34375, 0.921875, 2.1875, 3.453125, 4.71875, 5.984375, 7.25, 8.515625, 9.78125, 11.046875, 12.3125, 13.578125, 14.84375, 16.109375, 17.375, 18.640625, 19.90625, 21.171875, 22.4375, 23.703125, 24.96875, 26.234375, 27.5, 28.765625, 30.03125, 31.296875, 32.5625, 33.828125, 35.09375, 36.359375, 37.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 12.0, 12.0, 20.0, 24.0, 22.0, 50.0, 74.0, 114.0, 162.0, 313.0, 722.0, 1365.0, 485.0, 259.0, 125.0, 85.0, 73.0, 41.0, 26.0, 15.0, 18.0, 14.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.625, -18.0968017578125, -17.568603515625, -17.0404052734375, -16.51220703125, -15.9840087890625, -15.455810546875, -14.9276123046875, -14.3994140625, -13.8712158203125, -13.343017578125, -12.8148193359375, -12.28662109375, -11.7584228515625, -11.230224609375, -10.7020263671875, -10.173828125, -9.6456298828125, -9.117431640625, -8.5892333984375, -8.06103515625, -7.5328369140625, -7.004638671875, -6.4764404296875, -5.9482421875, -5.4200439453125, -4.891845703125, -4.3636474609375, -3.83544921875, -3.3072509765625, -2.779052734375, -2.2508544921875, -1.72265625, -1.1944580078125, -0.666259765625, -0.1380615234375, 0.39013671875, 0.9183349609375, 1.446533203125, 1.9747314453125, 2.5029296875, 3.0311279296875, 3.559326171875, 4.0875244140625, 4.61572265625, 5.1439208984375, 5.672119140625, 6.2003173828125, 6.728515625, 7.2567138671875, 7.784912109375, 8.3131103515625, 8.84130859375, 9.3695068359375, 9.897705078125, 10.4259033203125, 10.9541015625, 11.4822998046875, 12.010498046875, 12.5386962890625, 13.06689453125, 13.5950927734375, 14.123291015625, 14.6514892578125, 15.1796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 15.0, 19.0, 30.0, 41.0, 65.0, 94.0, 98.0, 111.0, 121.0, 125.0, 87.0, 68.0, 47.0, 26.0, 26.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.21259307861328, -84.56591796875, -80.91924285888672, -77.27256774902344, -73.62589263916016, -69.97921752929688, -66.3325424194336, -62.68586730957031, -59.03919219970703, -55.39251708984375, -51.74584197998047, -48.09916687011719, -44.452491760253906, -40.805816650390625, -37.159141540527344, -33.51246643066406, -29.86579132080078, -26.2191162109375, -22.57244110107422, -18.925765991210938, -15.279090881347656, -11.632415771484375, -7.985740661621094, -4.3390655517578125, -0.6923904418945312, 2.95428466796875, 6.600959777832031, 10.247634887695312, 13.894309997558594, 17.540985107421875, 21.187660217285156, 24.834335327148438, 28.48101806640625, 32.12769317626953, 35.77436828613281, 39.421043395996094, 43.067718505859375, 46.714393615722656, 50.36106872558594, 54.00774383544922, 57.6544189453125, 61.30109405517578, 64.94776916503906, 68.59444427490234, 72.24111938476562, 75.8877944946289, 79.53446960449219, 83.18114471435547, 86.82781982421875, 90.47449493408203, 94.12117004394531, 97.7678451538086, 101.41452026367188, 105.06119537353516, 108.70787048339844, 112.35454559326172, 116.001220703125, 119.64789581298828, 123.29457092285156, 126.94124603271484, 130.58792114257812, 134.23458862304688, 137.8812713623047, 141.5279541015625, 145.17462158203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 11.0, 14.0, 15.0, 12.0, 22.0, 35.0, 19.0, 29.0, 46.0, 49.0, 46.0, 56.0, 57.0, 45.0, 53.0, 74.0, 51.0, 61.0, 59.0, 40.0, 39.0, 34.0, 31.0, 21.0, 17.0, 11.0, 15.0, 4.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.87149047851562, -70.60835266113281, -68.34522247314453, -66.08208465576172, -63.818946838378906, -61.55581283569336, -59.29267883300781, -57.029541015625, -54.76640701293945, -52.503273010253906, -50.240135192871094, -47.97700119018555, -45.7138671875, -43.45072937011719, -41.18759536743164, -38.924461364746094, -36.66132354736328, -34.398189544677734, -32.13505172729492, -29.871917724609375, -27.608781814575195, -25.345645904541016, -23.08251190185547, -20.81937599182129, -18.55624008178711, -16.29310417175293, -14.029969215393066, -11.766834259033203, -9.503698348999023, -7.240562438964844, -4.9774274826049805, -2.714292526245117, -0.4511566162109375, 1.811978816986084, 4.0751142501831055, 6.338249683380127, 8.601385116577148, 10.864521026611328, 13.127655982971191, 15.390790939331055, 17.653926849365234, 19.917062759399414, 22.180198669433594, 24.44333267211914, 26.70646858215332, 28.9696044921875, 31.232738494873047, 33.495872497558594, 35.759010314941406, 38.02214431762695, 40.285282135009766, 42.54841613769531, 44.811553955078125, 47.07468795776367, 49.33782196044922, 51.60095977783203, 53.86409378051758, 56.127227783203125, 58.39036560058594, 60.653499603271484, 62.91663360595703, 65.17977142333984, 67.44290924072266, 69.70603942871094, 71.96917724609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 9.0, 15.0, 13.0, 24.0, 31.0, 32.0, 73.0, 101.0, 140.0, 216.0, 404.0, 780.0, 1578.0, 3671.0, 10028.0, 34147.0, 149603.0, 500407.0, 264418.0, 57745.0, 15580.0, 5145.0, 2054.0, 1021.0, 496.0, 286.0, 170.0, 103.0, 78.0, 57.0, 41.0, 18.0, 16.0, 6.0, 8.0, 7.0, 8.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-42.96875, -41.72998046875, -40.4912109375, -39.25244140625, -38.013671875, -36.77490234375, -35.5361328125, -34.29736328125, -33.05859375, -31.81982421875, -30.5810546875, -29.34228515625, -28.103515625, -26.86474609375, -25.6259765625, -24.38720703125, -23.1484375, -21.90966796875, -20.6708984375, -19.43212890625, -18.193359375, -16.95458984375, -15.7158203125, -14.47705078125, -13.23828125, -11.99951171875, -10.7607421875, -9.52197265625, -8.283203125, -7.04443359375, -5.8056640625, -4.56689453125, -3.328125, -2.08935546875, -0.8505859375, 0.38818359375, 1.626953125, 2.86572265625, 4.1044921875, 5.34326171875, 6.58203125, 7.82080078125, 9.0595703125, 10.29833984375, 11.537109375, 12.77587890625, 14.0146484375, 15.25341796875, 16.4921875, 17.73095703125, 18.9697265625, 20.20849609375, 21.447265625, 22.68603515625, 23.9248046875, 25.16357421875, 26.40234375, 27.64111328125, 28.8798828125, 30.11865234375, 31.357421875, 32.59619140625, 33.8349609375, 35.07373046875, 36.3125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 6.0, 14.0, 12.0, 20.0, 18.0, 23.0, 31.0, 38.0, 40.0, 65.0, 55.0, 58.0, 54.0, 59.0, 60.0, 58.0, 74.0, 44.0, 52.0, 43.0, 30.0, 33.0, 26.0, 17.0, 20.0, 15.0, 10.0, 4.0, 1.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.51171875, -7.26812744140625, -7.0245361328125, -6.78094482421875, -6.537353515625, -6.29376220703125, -6.0501708984375, -5.80657958984375, -5.56298828125, -5.31939697265625, -5.0758056640625, -4.83221435546875, -4.588623046875, -4.34503173828125, -4.1014404296875, -3.85784912109375, -3.6142578125, -3.37066650390625, -3.1270751953125, -2.88348388671875, -2.639892578125, -2.39630126953125, -2.1527099609375, -1.90911865234375, -1.66552734375, -1.42193603515625, -1.1783447265625, -0.93475341796875, -0.691162109375, -0.44757080078125, -0.2039794921875, 0.03961181640625, 0.283203125, 0.52679443359375, 0.7703857421875, 1.01397705078125, 1.257568359375, 1.50115966796875, 1.7447509765625, 1.98834228515625, 2.23193359375, 2.47552490234375, 2.7191162109375, 2.96270751953125, 3.206298828125, 3.44989013671875, 3.6934814453125, 3.93707275390625, 4.1806640625, 4.42425537109375, 4.6678466796875, 4.91143798828125, 5.155029296875, 5.39862060546875, 5.6422119140625, 5.88580322265625, 6.12939453125, 6.37298583984375, 6.6165771484375, 6.86016845703125, 7.103759765625, 7.34735107421875, 7.5909423828125, 7.83453369140625, 8.078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 12.0, 11.0, 12.0, 21.0, 40.0, 47.0, 62.0, 92.0, 135.0, 181.0, 222.0, 330.0, 446.0, 720.0, 1324.0, 2410.0, 5119.0, 11597.0, 29056.0, 88491.0, 320924.0, 403258.0, 119398.0, 37474.0, 14088.0, 5949.0, 2934.0, 1522.0, 826.0, 535.0, 378.0, 290.0, 173.0, 128.0, 104.0, 65.0, 44.0, 46.0, 25.0, 12.0, 14.0, 11.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.734375, -23.987548828125, -23.24072265625, -22.493896484375, -21.7470703125, -21.000244140625, -20.25341796875, -19.506591796875, -18.759765625, -18.012939453125, -17.26611328125, -16.519287109375, -15.7724609375, -15.025634765625, -14.27880859375, -13.531982421875, -12.78515625, -12.038330078125, -11.29150390625, -10.544677734375, -9.7978515625, -9.051025390625, -8.30419921875, -7.557373046875, -6.810546875, -6.063720703125, -5.31689453125, -4.570068359375, -3.8232421875, -3.076416015625, -2.32958984375, -1.582763671875, -0.8359375, -0.089111328125, 0.65771484375, 1.404541015625, 2.1513671875, 2.898193359375, 3.64501953125, 4.391845703125, 5.138671875, 5.885498046875, 6.63232421875, 7.379150390625, 8.1259765625, 8.872802734375, 9.61962890625, 10.366455078125, 11.11328125, 11.860107421875, 12.60693359375, 13.353759765625, 14.1005859375, 14.847412109375, 15.59423828125, 16.341064453125, 17.087890625, 17.834716796875, 18.58154296875, 19.328369140625, 20.0751953125, 20.822021484375, 21.56884765625, 22.315673828125, 23.0625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 9.0, 9.0, 8.0, 16.0, 25.0, 19.0, 28.0, 26.0, 29.0, 38.0, 48.0, 34.0, 59.0, 40.0, 71.0, 61.0, 54.0, 50.0, 49.0, 41.0, 49.0, 33.0, 30.0, 28.0, 19.0, 24.0, 25.0, 11.0, 7.0, 10.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.421875, -27.52490234375, -26.6279296875, -25.73095703125, -24.833984375, -23.93701171875, -23.0400390625, -22.14306640625, -21.24609375, -20.34912109375, -19.4521484375, -18.55517578125, -17.658203125, -16.76123046875, -15.8642578125, -14.96728515625, -14.0703125, -13.17333984375, -12.2763671875, -11.37939453125, -10.482421875, -9.58544921875, -8.6884765625, -7.79150390625, -6.89453125, -5.99755859375, -5.1005859375, -4.20361328125, -3.306640625, -2.40966796875, -1.5126953125, -0.61572265625, 0.28125, 1.17822265625, 2.0751953125, 2.97216796875, 3.869140625, 4.76611328125, 5.6630859375, 6.56005859375, 7.45703125, 8.35400390625, 9.2509765625, 10.14794921875, 11.044921875, 11.94189453125, 12.8388671875, 13.73583984375, 14.6328125, 15.52978515625, 16.4267578125, 17.32373046875, 18.220703125, 19.11767578125, 20.0146484375, 20.91162109375, 21.80859375, 22.70556640625, 23.6025390625, 24.49951171875, 25.396484375, 26.29345703125, 27.1904296875, 28.08740234375, 28.984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 19.0, 47.0, 69.0, 109.0, 244.0, 612.0, 1733.0, 7103.0, 53215.0, 536627.0, 403379.0, 37301.0, 5558.0, 1487.0, 514.0, 231.0, 94.0, 64.0, 43.0, 25.0, 10.0, 16.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.165283203125, -18.56494140625, -17.964599609375, -17.3642578125, -16.763916015625, -16.16357421875, -15.563232421875, -14.962890625, -14.362548828125, -13.76220703125, -13.161865234375, -12.5615234375, -11.961181640625, -11.36083984375, -10.760498046875, -10.16015625, -9.559814453125, -8.95947265625, -8.359130859375, -7.7587890625, -7.158447265625, -6.55810546875, -5.957763671875, -5.357421875, -4.757080078125, -4.15673828125, -3.556396484375, -2.9560546875, -2.355712890625, -1.75537109375, -1.155029296875, -0.5546875, 0.045654296875, 0.64599609375, 1.246337890625, 1.8466796875, 2.447021484375, 3.04736328125, 3.647705078125, 4.248046875, 4.848388671875, 5.44873046875, 6.049072265625, 6.6494140625, 7.249755859375, 7.85009765625, 8.450439453125, 9.05078125, 9.651123046875, 10.25146484375, 10.851806640625, 11.4521484375, 12.052490234375, 12.65283203125, 13.253173828125, 13.853515625, 14.453857421875, 15.05419921875, 15.654541015625, 16.2548828125, 16.855224609375, 17.45556640625, 18.055908203125, 18.65625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 17.0, 10.0, 22.0, 31.0, 36.0, 43.0, 54.0, 94.0, 85.0, 113.0, 116.0, 97.0, 68.0, 48.0, 47.0, 22.0, 22.0, 14.0, 18.0, 8.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00229644775390625, -0.0022340863943099976, -0.002171725034713745, -0.0021093636751174927, -0.0020470023155212402, -0.001984640955924988, -0.0019222795963287354, -0.001859918236732483, -0.0017975568771362305, -0.001735195517539978, -0.0016728341579437256, -0.0016104727983474731, -0.0015481114387512207, -0.0014857500791549683, -0.0014233887195587158, -0.0013610273599624634, -0.001298666000366211, -0.0012363046407699585, -0.001173943281173706, -0.0011115819215774536, -0.0010492205619812012, -0.0009868592023849487, -0.0009244978427886963, -0.0008621364831924438, -0.0007997751235961914, -0.000737413763999939, -0.0006750524044036865, -0.0006126910448074341, -0.0005503296852111816, -0.0004879683256149292, -0.00042560696601867676, -0.0003632456064224243, -0.0003008842468261719, -0.00023852288722991943, -0.000176161527633667, -0.00011380016803741455, -5.143880844116211e-05, 1.0922551155090332e-05, 7.328391075134277e-05, 0.00013564527034759521, 0.00019800662994384766, 0.0002603679895401001, 0.00032272934913635254, 0.000385090708732605, 0.0004474520683288574, 0.0005098134279251099, 0.0005721747875213623, 0.0006345361471176147, 0.0006968975067138672, 0.0007592588663101196, 0.0008216202259063721, 0.0008839815855026245, 0.000946342945098877, 0.0010087043046951294, 0.0010710656642913818, 0.0011334270238876343, 0.0011957883834838867, 0.0012581497430801392, 0.0013205111026763916, 0.001382872462272644, 0.0014452338218688965, 0.001507595181465149, 0.0015699565410614014, 0.0016323179006576538, 0.0016946792602539062]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 6.0, 15.0, 14.0, 32.0, 56.0, 107.0, 248.0, 603.0, 1883.0, 10689.0, 217064.0, 763655.0, 48082.0, 4312.0, 1037.0, 380.0, 188.0, 73.0, 45.0, 19.0, 19.0, 12.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.46875, -28.63330078125, -27.7978515625, -26.96240234375, -26.126953125, -25.29150390625, -24.4560546875, -23.62060546875, -22.78515625, -21.94970703125, -21.1142578125, -20.27880859375, -19.443359375, -18.60791015625, -17.7724609375, -16.93701171875, -16.1015625, -15.26611328125, -14.4306640625, -13.59521484375, -12.759765625, -11.92431640625, -11.0888671875, -10.25341796875, -9.41796875, -8.58251953125, -7.7470703125, -6.91162109375, -6.076171875, -5.24072265625, -4.4052734375, -3.56982421875, -2.734375, -1.89892578125, -1.0634765625, -0.22802734375, 0.607421875, 1.44287109375, 2.2783203125, 3.11376953125, 3.94921875, 4.78466796875, 5.6201171875, 6.45556640625, 7.291015625, 8.12646484375, 8.9619140625, 9.79736328125, 10.6328125, 11.46826171875, 12.3037109375, 13.13916015625, 13.974609375, 14.81005859375, 15.6455078125, 16.48095703125, 17.31640625, 18.15185546875, 18.9873046875, 19.82275390625, 20.658203125, 21.49365234375, 22.3291015625, 23.16455078125, 24.0]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 12.0, 20.0, 22.0, 36.0, 56.0, 75.0, 88.0, 121.0, 111.0, 121.0, 93.0, 77.0, 40.0, 35.0, 24.0, 21.0, 11.0, 4.0, 3.0, 1.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.015625, -18.542724609375, -18.06982421875, -17.596923828125, -17.1240234375, -16.651123046875, -16.17822265625, -15.705322265625, -15.232421875, -14.759521484375, -14.28662109375, -13.813720703125, -13.3408203125, -12.867919921875, -12.39501953125, -11.922119140625, -11.44921875, -10.976318359375, -10.50341796875, -10.030517578125, -9.5576171875, -9.084716796875, -8.61181640625, -8.138916015625, -7.666015625, -7.193115234375, -6.72021484375, -6.247314453125, -5.7744140625, -5.301513671875, -4.82861328125, -4.355712890625, -3.8828125, -3.409912109375, -2.93701171875, -2.464111328125, -1.9912109375, -1.518310546875, -1.04541015625, -0.572509765625, -0.099609375, 0.373291015625, 0.84619140625, 1.319091796875, 1.7919921875, 2.264892578125, 2.73779296875, 3.210693359375, 3.68359375, 4.156494140625, 4.62939453125, 5.102294921875, 5.5751953125, 6.048095703125, 6.52099609375, 6.993896484375, 7.466796875, 7.939697265625, 8.41259765625, 8.885498046875, 9.3583984375, 9.831298828125, 10.30419921875, 10.777099609375, 11.25]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 8.0, 21.0, 26.0, 35.0, 53.0, 64.0, 88.0, 102.0, 102.0, 99.0, 105.0, 85.0, 67.0, 48.0, 22.0, 23.0, 16.0, 13.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.3284454345703, -229.6723175048828, -224.0161895751953, -218.3600616455078, -212.7039337158203, -207.0478057861328, -201.39166259765625, -195.73553466796875, -190.07940673828125, -184.42327880859375, -178.76715087890625, -173.11102294921875, -167.45489501953125, -161.79876708984375, -156.14263916015625, -150.48651123046875, -144.83038330078125, -139.17425537109375, -133.51812744140625, -127.86199951171875, -122.20587158203125, -116.54974365234375, -110.89360809326172, -105.23748016357422, -99.58135223388672, -93.92522430419922, -88.26909637451172, -82.61296081542969, -76.95683288574219, -71.30070495605469, -65.64457702636719, -59.98844909667969, -54.33232116699219, -48.67619323730469, -43.02006530761719, -37.36393356323242, -31.707805633544922, -26.051677703857422, -20.395545959472656, -14.739418029785156, -9.083290100097656, -3.42716121673584, 2.2289676666259766, 7.885097503662109, 13.54122543334961, 19.19735336303711, 24.853485107421875, 30.509613037109375, 36.165740966796875, 41.821868896484375, 47.477996826171875, 53.13412857055664, 58.79025650024414, 64.44638061523438, 70.1025161743164, 75.7586441040039, 81.4147720336914, 87.0708999633789, 92.7270278930664, 98.38316345214844, 104.03929138183594, 109.69541931152344, 115.35154724121094, 121.00767517089844, 126.66380310058594]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 5.0, 5.0, 13.0, 13.0, 9.0, 10.0, 25.0, 18.0, 26.0, 30.0, 26.0, 34.0, 44.0, 34.0, 36.0, 39.0, 43.0, 52.0, 49.0, 40.0, 34.0, 46.0, 35.0, 46.0, 37.0, 33.0, 29.0, 39.0, 27.0, 18.0, 12.0, 10.0, 11.0, 14.0, 9.0, 13.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.31553649902344, -123.28887939453125, -119.2622299194336, -115.2355728149414, -111.20892333984375, -107.18226623535156, -103.15560913085938, -99.12895202636719, -95.10230255126953, -91.07564544677734, -87.04899597167969, -83.0223388671875, -78.99568176269531, -74.96903228759766, -70.94237518310547, -66.91572570800781, -62.889068603515625, -58.8624153137207, -54.83576202392578, -50.809104919433594, -46.78245162963867, -42.75579833984375, -38.72914123535156, -34.70248794555664, -30.67583465576172, -26.649181365966797, -22.622526168823242, -18.595870971679688, -14.569217681884766, -10.542564392089844, -6.515909194946289, -2.4892539978027344, 1.5373992919921875, 5.564053535461426, 9.590707778930664, 13.617362022399902, 17.64401626586914, 21.670669555664062, 25.697324752807617, 29.723979949951172, 33.750633239746094, 37.777286529541016, 41.80393981933594, 45.830596923828125, 49.85725021362305, 53.88390350341797, 57.910560607910156, 61.93721389770508, 65.9638671875, 69.99052429199219, 74.01717376708984, 78.04383087158203, 82.07048034667969, 86.09713745117188, 90.12379455566406, 94.15045166015625, 98.1771011352539, 102.2037582397461, 106.23040771484375, 110.25706481933594, 114.28372192382812, 118.31037139892578, 122.33702850341797, 126.36367797851562, 130.3903350830078]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 10.0, 11.0, 15.0, 16.0, 32.0, 35.0, 57.0, 58.0, 126.0, 147.0, 241.0, 415.0, 772.0, 1791.0, 4352.0, 13796.0, 106406.0, 4020231.0, 32475.0, 7768.0, 2773.0, 1191.0, 582.0, 332.0, 192.0, 129.0, 106.0, 68.0, 35.0, 27.0, 20.0, 21.0, 15.0, 11.0, 11.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-106.25, -103.611328125, -100.97265625, -98.333984375, -95.6953125, -93.056640625, -90.41796875, -87.779296875, -85.140625, -82.501953125, -79.86328125, -77.224609375, -74.5859375, -71.947265625, -69.30859375, -66.669921875, -64.03125, -61.392578125, -58.75390625, -56.115234375, -53.4765625, -50.837890625, -48.19921875, -45.560546875, -42.921875, -40.283203125, -37.64453125, -35.005859375, -32.3671875, -29.728515625, -27.08984375, -24.451171875, -21.8125, -19.173828125, -16.53515625, -13.896484375, -11.2578125, -8.619140625, -5.98046875, -3.341796875, -0.703125, 1.935546875, 4.57421875, 7.212890625, 9.8515625, 12.490234375, 15.12890625, 17.767578125, 20.40625, 23.044921875, 25.68359375, 28.322265625, 30.9609375, 33.599609375, 36.23828125, 38.876953125, 41.515625, 44.154296875, 46.79296875, 49.431640625, 52.0703125, 54.708984375, 57.34765625, 59.986328125, 62.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 7.0, 19.0, 10.0, 18.0, 24.0, 25.0, 28.0, 37.0, 44.0, 43.0, 41.0, 31.0, 49.0, 59.0, 49.0, 67.0, 55.0, 59.0, 55.0, 54.0, 41.0, 39.0, 39.0, 25.0, 13.0, 10.0, 10.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.1796875, -7.921142578125, -7.66259765625, -7.404052734375, -7.1455078125, -6.886962890625, -6.62841796875, -6.369873046875, -6.111328125, -5.852783203125, -5.59423828125, -5.335693359375, -5.0771484375, -4.818603515625, -4.56005859375, -4.301513671875, -4.04296875, -3.784423828125, -3.52587890625, -3.267333984375, -3.0087890625, -2.750244140625, -2.49169921875, -2.233154296875, -1.974609375, -1.716064453125, -1.45751953125, -1.198974609375, -0.9404296875, -0.681884765625, -0.42333984375, -0.164794921875, 0.09375, 0.352294921875, 0.61083984375, 0.869384765625, 1.1279296875, 1.386474609375, 1.64501953125, 1.903564453125, 2.162109375, 2.420654296875, 2.67919921875, 2.937744140625, 3.1962890625, 3.454833984375, 3.71337890625, 3.971923828125, 4.23046875, 4.489013671875, 4.74755859375, 5.006103515625, 5.2646484375, 5.523193359375, 5.78173828125, 6.040283203125, 6.298828125, 6.557373046875, 6.81591796875, 7.074462890625, 7.3330078125, 7.591552734375, 7.85009765625, 8.108642578125, 8.3671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 15.0, 29.0, 47.0, 86.0, 144.0, 243.0, 398.0, 769.0, 1257.0, 2575.0, 5422.0, 13504.0, 50659.0, 3791144.0, 280432.0, 29681.0, 9546.0, 4070.0, 1945.0, 1044.0, 562.0, 302.0, 183.0, 83.0, 51.0, 39.0, 26.0, 15.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.75, -51.3916015625, -50.033203125, -48.6748046875, -47.31640625, -45.9580078125, -44.599609375, -43.2412109375, -41.8828125, -40.5244140625, -39.166015625, -37.8076171875, -36.44921875, -35.0908203125, -33.732421875, -32.3740234375, -31.015625, -29.6572265625, -28.298828125, -26.9404296875, -25.58203125, -24.2236328125, -22.865234375, -21.5068359375, -20.1484375, -18.7900390625, -17.431640625, -16.0732421875, -14.71484375, -13.3564453125, -11.998046875, -10.6396484375, -9.28125, -7.9228515625, -6.564453125, -5.2060546875, -3.84765625, -2.4892578125, -1.130859375, 0.2275390625, 1.5859375, 2.9443359375, 4.302734375, 5.6611328125, 7.01953125, 8.3779296875, 9.736328125, 11.0947265625, 12.453125, 13.8115234375, 15.169921875, 16.5283203125, 17.88671875, 19.2451171875, 20.603515625, 21.9619140625, 23.3203125, 24.6787109375, 26.037109375, 27.3955078125, 28.75390625, 30.1123046875, 31.470703125, 32.8291015625, 34.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 6.0, 17.0, 18.0, 23.0, 23.0, 63.0, 106.0, 260.0, 3008.0, 286.0, 96.0, 58.0, 18.0, 11.0, 12.0, 7.0, 6.0, 6.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.2052001953125, -6.996337890625, -6.7874755859375, -6.57861328125, -6.3697509765625, -6.160888671875, -5.9520263671875, -5.7431640625, -5.5343017578125, -5.325439453125, -5.1165771484375, -4.90771484375, -4.6988525390625, -4.489990234375, -4.2811279296875, -4.072265625, -3.8634033203125, -3.654541015625, -3.4456787109375, -3.23681640625, -3.0279541015625, -2.819091796875, -2.6102294921875, -2.4013671875, -2.1925048828125, -1.983642578125, -1.7747802734375, -1.56591796875, -1.3570556640625, -1.148193359375, -0.9393310546875, -0.73046875, -0.5216064453125, -0.312744140625, -0.1038818359375, 0.10498046875, 0.3138427734375, 0.522705078125, 0.7315673828125, 0.9404296875, 1.1492919921875, 1.358154296875, 1.5670166015625, 1.77587890625, 1.9847412109375, 2.193603515625, 2.4024658203125, 2.611328125, 2.8201904296875, 3.029052734375, 3.2379150390625, 3.44677734375, 3.6556396484375, 3.864501953125, 4.0733642578125, 4.2822265625, 4.4910888671875, 4.699951171875, 4.9088134765625, 5.11767578125, 5.3265380859375, 5.535400390625, 5.7442626953125, 5.953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 2.0, 4.0, 10.0, 14.0, 12.0, 21.0, 24.0, 40.0, 55.0, 70.0, 93.0, 104.0, 115.0, 112.0, 89.0, 79.0, 48.0, 41.0, 23.0, 15.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.55391311645508, -39.42695999145508, -38.30000305175781, -37.17304992675781, -36.04609680175781, -34.91913986206055, -33.79218673706055, -32.66522979736328, -31.53827667236328, -30.41132164001465, -29.284366607666016, -28.157413482666016, -27.030458450317383, -25.90350341796875, -24.77655029296875, -23.649595260620117, -22.522640228271484, -21.39568519592285, -20.26873016357422, -19.14177703857422, -18.014822006225586, -16.887866973876953, -15.760912895202637, -14.63395881652832, -13.507003784179688, -12.380048751831055, -11.253094673156738, -10.126140594482422, -8.999185562133789, -7.8722310066223145, -6.74527645111084, -5.618321895599365, -4.491367340087891, -3.364412784576416, -2.2374582290649414, -1.1105036735534668, 0.016450881958007812, 1.1434054374694824, 2.270359992980957, 3.3973145484924316, 4.524269104003906, 5.651223659515381, 6.7781782150268555, 7.90513277053833, 9.032087326049805, 10.159042358398438, 11.285996437072754, 12.41295051574707, 13.539905548095703, 14.666860580444336, 15.793814659118652, 16.92076873779297, 18.0477237701416, 19.174678802490234, 20.301631927490234, 21.428586959838867, 22.5555419921875, 23.682497024536133, 24.809452056884766, 25.936405181884766, 27.0633602142334, 28.19031524658203, 29.31726837158203, 30.444223403930664, 31.571178436279297]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 19.0, 23.0, 21.0, 23.0, 12.0, 22.0, 32.0, 30.0, 31.0, 26.0, 33.0, 34.0, 38.0, 27.0, 41.0, 36.0, 35.0, 48.0, 37.0, 35.0, 43.0, 45.0, 38.0, 27.0, 39.0, 31.0, 30.0, 22.0, 23.0, 20.0, 10.0, 12.0, 10.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.270694732666016, -24.47759246826172, -23.684490203857422, -22.891387939453125, -22.098285675048828, -21.30518341064453, -20.512081146240234, -19.718978881835938, -18.92587661743164, -18.132774353027344, -17.339672088623047, -16.54656982421875, -15.753467559814453, -14.960365295410156, -14.167262077331543, -13.374159812927246, -12.581056594848633, -11.787954330444336, -10.994852066040039, -10.201749801635742, -9.408647537231445, -8.615545272827148, -7.822442054748535, -7.029339790344238, -6.236237525939941, -5.4431352615356445, -4.650032997131348, -3.8569302558898926, -3.0638279914855957, -2.270725727081299, -1.4776229858398438, -0.6845207214355469, 0.10858154296875, 0.9016839265823364, 1.6947863101959229, 2.487888813018799, 3.2809910774230957, 4.074093341827393, 4.867196083068848, 5.6602983474731445, 6.453400611877441, 7.246502876281738, 8.039605140686035, 8.832708358764648, 9.625810623168945, 10.418912887573242, 11.212015151977539, 12.005117416381836, 12.798219680786133, 13.59132194519043, 14.384424209594727, 15.177526473999023, 15.97062873840332, 16.763731002807617, 17.556835174560547, 18.349937438964844, 19.14303970336914, 19.936141967773438, 20.729244232177734, 21.52234649658203, 22.315448760986328, 23.108551025390625, 23.901653289794922, 24.69475555419922, 25.487857818603516]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 4.0, 6.0, 7.0, 4.0, 10.0, 12.0, 21.0, 35.0, 64.0, 69.0, 132.0, 179.0, 310.0, 595.0, 1216.0, 2852.0, 7145.0, 21009.0, 67947.0, 226928.0, 430164.0, 200170.0, 59791.0, 18445.0, 6373.0, 2520.0, 1167.0, 554.0, 321.0, 184.0, 103.0, 66.0, 58.0, 19.0, 22.0, 19.0, 12.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.71875, -29.77197265625, -28.8251953125, -27.87841796875, -26.931640625, -25.98486328125, -25.0380859375, -24.09130859375, -23.14453125, -22.19775390625, -21.2509765625, -20.30419921875, -19.357421875, -18.41064453125, -17.4638671875, -16.51708984375, -15.5703125, -14.62353515625, -13.6767578125, -12.72998046875, -11.783203125, -10.83642578125, -9.8896484375, -8.94287109375, -7.99609375, -7.04931640625, -6.1025390625, -5.15576171875, -4.208984375, -3.26220703125, -2.3154296875, -1.36865234375, -0.421875, 0.52490234375, 1.4716796875, 2.41845703125, 3.365234375, 4.31201171875, 5.2587890625, 6.20556640625, 7.15234375, 8.09912109375, 9.0458984375, 9.99267578125, 10.939453125, 11.88623046875, 12.8330078125, 13.77978515625, 14.7265625, 15.67333984375, 16.6201171875, 17.56689453125, 18.513671875, 19.46044921875, 20.4072265625, 21.35400390625, 22.30078125, 23.24755859375, 24.1943359375, 25.14111328125, 26.087890625, 27.03466796875, 27.9814453125, 28.92822265625, 29.875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 5.0, 8.0, 8.0, 9.0, 16.0, 15.0, 12.0, 22.0, 19.0, 38.0, 29.0, 31.0, 31.0, 41.0, 52.0, 40.0, 47.0, 37.0, 48.0, 52.0, 35.0, 49.0, 47.0, 48.0, 36.0, 46.0, 42.0, 28.0, 22.0, 22.0, 19.0, 7.0, 9.0, 5.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.34326171875, -8.0693359375, -7.79541015625, -7.521484375, -7.24755859375, -6.9736328125, -6.69970703125, -6.42578125, -6.15185546875, -5.8779296875, -5.60400390625, -5.330078125, -5.05615234375, -4.7822265625, -4.50830078125, -4.234375, -3.96044921875, -3.6865234375, -3.41259765625, -3.138671875, -2.86474609375, -2.5908203125, -2.31689453125, -2.04296875, -1.76904296875, -1.4951171875, -1.22119140625, -0.947265625, -0.67333984375, -0.3994140625, -0.12548828125, 0.1484375, 0.42236328125, 0.6962890625, 0.97021484375, 1.244140625, 1.51806640625, 1.7919921875, 2.06591796875, 2.33984375, 2.61376953125, 2.8876953125, 3.16162109375, 3.435546875, 3.70947265625, 3.9833984375, 4.25732421875, 4.53125, 4.80517578125, 5.0791015625, 5.35302734375, 5.626953125, 5.90087890625, 6.1748046875, 6.44873046875, 6.72265625, 6.99658203125, 7.2705078125, 7.54443359375, 7.818359375, 8.09228515625, 8.3662109375, 8.64013671875, 8.9140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 14.0, 25.0, 55.0, 110.0, 209.0, 464.0, 977.0, 2512.0, 18545.0, 562776.0, 443551.0, 15174.0, 2362.0, 938.0, 446.0, 199.0, 87.0, 49.0, 22.0, 9.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.28125, -56.03662109375, -53.7919921875, -51.54736328125, -49.302734375, -47.05810546875, -44.8134765625, -42.56884765625, -40.32421875, -38.07958984375, -35.8349609375, -33.59033203125, -31.345703125, -29.10107421875, -26.8564453125, -24.61181640625, -22.3671875, -20.12255859375, -17.8779296875, -15.63330078125, -13.388671875, -11.14404296875, -8.8994140625, -6.65478515625, -4.41015625, -2.16552734375, 0.0791015625, 2.32373046875, 4.568359375, 6.81298828125, 9.0576171875, 11.30224609375, 13.546875, 15.79150390625, 18.0361328125, 20.28076171875, 22.525390625, 24.77001953125, 27.0146484375, 29.25927734375, 31.50390625, 33.74853515625, 35.9931640625, 38.23779296875, 40.482421875, 42.72705078125, 44.9716796875, 47.21630859375, 49.4609375, 51.70556640625, 53.9501953125, 56.19482421875, 58.439453125, 60.68408203125, 62.9287109375, 65.17333984375, 67.41796875, 69.66259765625, 71.9072265625, 74.15185546875, 76.396484375, 78.64111328125, 80.8857421875, 83.13037109375, 85.375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 10.0, 13.0, 30.0, 44.0, 60.0, 77.0, 101.0, 98.0, 114.0, 118.0, 112.0, 76.0, 52.0, 39.0, 30.0, 22.0, 9.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.625, -107.6796875, -104.734375, -101.7890625, -98.84375, -95.8984375, -92.953125, -90.0078125, -87.0625, -84.1171875, -81.171875, -78.2265625, -75.28125, -72.3359375, -69.390625, -66.4453125, -63.5, -60.5546875, -57.609375, -54.6640625, -51.71875, -48.7734375, -45.828125, -42.8828125, -39.9375, -36.9921875, -34.046875, -31.1015625, -28.15625, -25.2109375, -22.265625, -19.3203125, -16.375, -13.4296875, -10.484375, -7.5390625, -4.59375, -1.6484375, 1.296875, 4.2421875, 7.1875, 10.1328125, 13.078125, 16.0234375, 18.96875, 21.9140625, 24.859375, 27.8046875, 30.75, 33.6953125, 36.640625, 39.5859375, 42.53125, 45.4765625, 48.421875, 51.3671875, 54.3125, 57.2578125, 60.203125, 63.1484375, 66.09375, 69.0390625, 71.984375, 74.9296875, 77.875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 9.0, 7.0, 15.0, 20.0, 44.0, 33.0, 62.0, 102.0, 148.0, 219.0, 473.0, 1057.0, 2538.0, 8309.0, 54343.0, 775019.0, 182709.0, 16536.0, 3967.0, 1442.0, 615.0, 348.0, 169.0, 121.0, 65.0, 52.0, 30.0, 26.0, 15.0, 16.0, 8.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.803466796875, -28.91943359375, -28.035400390625, -27.1513671875, -26.267333984375, -25.38330078125, -24.499267578125, -23.615234375, -22.731201171875, -21.84716796875, -20.963134765625, -20.0791015625, -19.195068359375, -18.31103515625, -17.427001953125, -16.54296875, -15.658935546875, -14.77490234375, -13.890869140625, -13.0068359375, -12.122802734375, -11.23876953125, -10.354736328125, -9.470703125, -8.586669921875, -7.70263671875, -6.818603515625, -5.9345703125, -5.050537109375, -4.16650390625, -3.282470703125, -2.3984375, -1.514404296875, -0.63037109375, 0.253662109375, 1.1376953125, 2.021728515625, 2.90576171875, 3.789794921875, 4.673828125, 5.557861328125, 6.44189453125, 7.325927734375, 8.2099609375, 9.093994140625, 9.97802734375, 10.862060546875, 11.74609375, 12.630126953125, 13.51416015625, 14.398193359375, 15.2822265625, 16.166259765625, 17.05029296875, 17.934326171875, 18.818359375, 19.702392578125, 20.58642578125, 21.470458984375, 22.3544921875, 23.238525390625, 24.12255859375, 25.006591796875, 25.890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 6.0, 7.0, 15.0, 24.0, 36.0, 64.0, 75.0, 118.0, 148.0, 126.0, 108.0, 87.0, 56.0, 32.0, 20.0, 19.0, 12.0, 8.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.003002166748046875, -0.0029165446758270264, -0.0028309226036071777, -0.002745300531387329, -0.0026596784591674805, -0.002574056386947632, -0.002488434314727783, -0.0024028122425079346, -0.002317190170288086, -0.0022315680980682373, -0.0021459460258483887, -0.00206032395362854, -0.0019747018814086914, -0.0018890798091888428, -0.0018034577369689941, -0.0017178356647491455, -0.0016322135925292969, -0.0015465915203094482, -0.0014609694480895996, -0.001375347375869751, -0.0012897253036499023, -0.0012041032314300537, -0.001118481159210205, -0.0010328590869903564, -0.0009472370147705078, -0.0008616149425506592, -0.0007759928703308105, -0.0006903707981109619, -0.0006047487258911133, -0.0005191266536712646, -0.000433504581451416, -0.0003478825092315674, -0.00026226043701171875, -0.00017663836479187012, -9.101629257202148e-05, -5.3942203521728516e-06, 8.022785186767578e-05, 0.00016584992408752441, 0.00025147199630737305, 0.0003370940685272217, 0.0004227161407470703, 0.0005083382129669189, 0.0005939602851867676, 0.0006795823574066162, 0.0007652044296264648, 0.0008508265018463135, 0.0009364485740661621, 0.0010220706462860107, 0.0011076927185058594, 0.001193314790725708, 0.0012789368629455566, 0.0013645589351654053, 0.001450181007385254, 0.0015358030796051025, 0.0016214251518249512, 0.0017070472240447998, 0.0017926692962646484, 0.001878291368484497, 0.0019639134407043457, 0.0020495355129241943, 0.002135157585144043, 0.0022207796573638916, 0.0023064017295837402, 0.002392023801803589, 0.0024776458740234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 3.0, 9.0, 7.0, 14.0, 13.0, 24.0, 44.0, 68.0, 116.0, 214.0, 567.0, 1869.0, 8555.0, 154911.0, 852601.0, 24143.0, 3608.0, 1005.0, 352.0, 162.0, 89.0, 46.0, 32.0, 25.0, 20.0, 18.0, 6.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.267578125, -42.00390625, -40.740234375, -39.4765625, -38.212890625, -36.94921875, -35.685546875, -34.421875, -33.158203125, -31.89453125, -30.630859375, -29.3671875, -28.103515625, -26.83984375, -25.576171875, -24.3125, -23.048828125, -21.78515625, -20.521484375, -19.2578125, -17.994140625, -16.73046875, -15.466796875, -14.203125, -12.939453125, -11.67578125, -10.412109375, -9.1484375, -7.884765625, -6.62109375, -5.357421875, -4.09375, -2.830078125, -1.56640625, -0.302734375, 0.9609375, 2.224609375, 3.48828125, 4.751953125, 6.015625, 7.279296875, 8.54296875, 9.806640625, 11.0703125, 12.333984375, 13.59765625, 14.861328125, 16.125, 17.388671875, 18.65234375, 19.916015625, 21.1796875, 22.443359375, 23.70703125, 24.970703125, 26.234375, 27.498046875, 28.76171875, 30.025390625, 31.2890625, 32.552734375, 33.81640625, 35.080078125, 36.34375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 25.0, 57.0, 129.0, 272.0, 260.0, 129.0, 51.0, 25.0, 18.0, 10.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.78125, -27.34130859375, -25.9013671875, -24.46142578125, -23.021484375, -21.58154296875, -20.1416015625, -18.70166015625, -17.26171875, -15.82177734375, -14.3818359375, -12.94189453125, -11.501953125, -10.06201171875, -8.6220703125, -7.18212890625, -5.7421875, -4.30224609375, -2.8623046875, -1.42236328125, 0.017578125, 1.45751953125, 2.8974609375, 4.33740234375, 5.77734375, 7.21728515625, 8.6572265625, 10.09716796875, 11.537109375, 12.97705078125, 14.4169921875, 15.85693359375, 17.296875, 18.73681640625, 20.1767578125, 21.61669921875, 23.056640625, 24.49658203125, 25.9365234375, 27.37646484375, 28.81640625, 30.25634765625, 31.6962890625, 33.13623046875, 34.576171875, 36.01611328125, 37.4560546875, 38.89599609375, 40.3359375, 41.77587890625, 43.2158203125, 44.65576171875, 46.095703125, 47.53564453125, 48.9755859375, 50.41552734375, 51.85546875, 53.29541015625, 54.7353515625, 56.17529296875, 57.615234375, 59.05517578125, 60.4951171875, 61.93505859375, 63.375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 12.0, 26.0, 39.0, 64.0, 79.0, 141.0, 136.0, 135.0, 111.0, 79.0, 63.0, 46.0, 28.0, 16.0, 9.0, 5.0, 5.0, 3.0], "bins": [-508.4969787597656, -498.9168395996094, -489.33673095703125, -479.756591796875, -470.17645263671875, -460.5963439941406, -451.0162048339844, -441.43609619140625, -431.85595703125, -422.27581787109375, -412.6957092285156, -403.1155700683594, -393.53546142578125, -383.955322265625, -374.37518310546875, -364.7950439453125, -355.2149353027344, -345.6347961425781, -336.0546875, -326.47454833984375, -316.8944091796875, -307.3143005371094, -297.7341613769531, -288.154052734375, -278.57391357421875, -268.9937744140625, -259.4136657714844, -249.83352661132812, -240.25340270996094, -230.67327880859375, -221.0931396484375, -211.5130157470703, -201.93287658691406, -192.35275268554688, -182.77261352539062, -173.19248962402344, -163.61236572265625, -154.03224182128906, -144.45211791992188, -134.87197875976562, -125.29185485839844, -115.71173095703125, -106.13159942626953, -96.55146789550781, -86.97134399414062, -77.39122009277344, -67.81108856201172, -58.23095703125, -48.65083312988281, -39.07070541381836, -29.490577697753906, -19.910449981689453, -10.330322265625, -0.7501945495605469, 8.829933166503906, 18.410064697265625, 27.990188598632812, 37.570316314697266, 47.15044403076172, 56.73057174682617, 66.31069946289062, 75.89082336425781, 85.47095489501953, 95.05108642578125, 104.63121032714844]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 11.0, 6.0, 14.0, 22.0, 25.0, 18.0, 22.0, 28.0, 31.0, 44.0, 33.0, 41.0, 48.0, 48.0, 48.0, 56.0, 48.0, 48.0, 46.0, 40.0, 47.0, 34.0, 42.0, 28.0, 26.0, 24.0, 21.0, 20.0, 20.0, 14.0, 12.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.62237548828125, -215.91629028320312, -209.210205078125, -202.50411987304688, -195.7980499267578, -189.0919647216797, -182.38587951660156, -175.67979431152344, -168.97372436523438, -162.26763916015625, -155.56155395507812, -148.85546875, -142.14939880371094, -135.4433135986328, -128.7372283935547, -122.03114318847656, -115.32505798339844, -108.61897277832031, -101.91289520263672, -95.2068099975586, -88.500732421875, -81.79464721679688, -75.08856201171875, -68.38247680664062, -61.67639923095703, -54.97031784057617, -48.26423645019531, -41.55815124511719, -34.85206985473633, -28.14598846435547, -21.439903259277344, -14.733821868896484, -8.027740478515625, -1.3216581344604492, 5.384424209594727, 12.090507507324219, 18.796588897705078, 25.502670288085938, 32.20875549316406, 38.91483688354492, 45.62091827392578, 52.32699966430664, 59.0330810546875, 65.73916625976562, 72.44525146484375, 79.15132904052734, 85.85741424560547, 92.56349182128906, 99.26957702636719, 105.97566223144531, 112.6817398071289, 119.38782501220703, 126.09390258789062, 132.79998779296875, 139.50607299804688, 146.212158203125, 152.91824340820312, 159.62432861328125, 166.33041381835938, 173.0364990234375, 179.74256896972656, 186.4486541748047, 193.1547393798828, 199.86082458496094, 206.56689453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 7.0, 9.0, 6.0, 12.0, 19.0, 31.0, 48.0, 51.0, 87.0, 109.0, 187.0, 348.0, 595.0, 1204.0, 2508.0, 6710.0, 25521.0, 3249366.0, 870753.0, 24844.0, 6616.0, 2555.0, 1210.0, 574.0, 321.0, 204.0, 123.0, 77.0, 45.0, 43.0, 32.0, 15.0, 20.0, 12.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-75.8125, -73.76318359375, -71.7138671875, -69.66455078125, -67.615234375, -65.56591796875, -63.5166015625, -61.46728515625, -59.41796875, -57.36865234375, -55.3193359375, -53.27001953125, -51.220703125, -49.17138671875, -47.1220703125, -45.07275390625, -43.0234375, -40.97412109375, -38.9248046875, -36.87548828125, -34.826171875, -32.77685546875, -30.7275390625, -28.67822265625, -26.62890625, -24.57958984375, -22.5302734375, -20.48095703125, -18.431640625, -16.38232421875, -14.3330078125, -12.28369140625, -10.234375, -8.18505859375, -6.1357421875, -4.08642578125, -2.037109375, 0.01220703125, 2.0615234375, 4.11083984375, 6.16015625, 8.20947265625, 10.2587890625, 12.30810546875, 14.357421875, 16.40673828125, 18.4560546875, 20.50537109375, 22.5546875, 24.60400390625, 26.6533203125, 28.70263671875, 30.751953125, 32.80126953125, 34.8505859375, 36.89990234375, 38.94921875, 40.99853515625, 43.0478515625, 45.09716796875, 47.146484375, 49.19580078125, 51.2451171875, 53.29443359375, 55.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 10.0, 9.0, 12.0, 19.0, 21.0, 26.0, 32.0, 20.0, 37.0, 32.0, 46.0, 46.0, 37.0, 46.0, 56.0, 55.0, 47.0, 64.0, 45.0, 41.0, 52.0, 46.0, 28.0, 28.0, 31.0, 28.0, 23.0, 15.0, 10.0, 7.0, 7.0, 5.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.2265625, -8.934814453125, -8.64306640625, -8.351318359375, -8.0595703125, -7.767822265625, -7.47607421875, -7.184326171875, -6.892578125, -6.600830078125, -6.30908203125, -6.017333984375, -5.7255859375, -5.433837890625, -5.14208984375, -4.850341796875, -4.55859375, -4.266845703125, -3.97509765625, -3.683349609375, -3.3916015625, -3.099853515625, -2.80810546875, -2.516357421875, -2.224609375, -1.932861328125, -1.64111328125, -1.349365234375, -1.0576171875, -0.765869140625, -0.47412109375, -0.182373046875, 0.109375, 0.401123046875, 0.69287109375, 0.984619140625, 1.2763671875, 1.568115234375, 1.85986328125, 2.151611328125, 2.443359375, 2.735107421875, 3.02685546875, 3.318603515625, 3.6103515625, 3.902099609375, 4.19384765625, 4.485595703125, 4.77734375, 5.069091796875, 5.36083984375, 5.652587890625, 5.9443359375, 6.236083984375, 6.52783203125, 6.819580078125, 7.111328125, 7.403076171875, 7.69482421875, 7.986572265625, 8.2783203125, 8.570068359375, 8.86181640625, 9.153564453125, 9.4453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 5.0, 7.0, 12.0, 19.0, 14.0, 21.0, 26.0, 33.0, 54.0, 90.0, 167.0, 248.0, 512.0, 1264.0, 3257.0, 10300.0, 61218.0, 3998428.0, 98831.0, 13069.0, 3915.0, 1393.0, 586.0, 292.0, 140.0, 115.0, 47.0, 42.0, 40.0, 21.0, 14.0, 18.0, 11.0, 18.0, 7.0, 12.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.09375, -55.22705078125, -53.3603515625, -51.49365234375, -49.626953125, -47.76025390625, -45.8935546875, -44.02685546875, -42.16015625, -40.29345703125, -38.4267578125, -36.56005859375, -34.693359375, -32.82666015625, -30.9599609375, -29.09326171875, -27.2265625, -25.35986328125, -23.4931640625, -21.62646484375, -19.759765625, -17.89306640625, -16.0263671875, -14.15966796875, -12.29296875, -10.42626953125, -8.5595703125, -6.69287109375, -4.826171875, -2.95947265625, -1.0927734375, 0.77392578125, 2.640625, 4.50732421875, 6.3740234375, 8.24072265625, 10.107421875, 11.97412109375, 13.8408203125, 15.70751953125, 17.57421875, 19.44091796875, 21.3076171875, 23.17431640625, 25.041015625, 26.90771484375, 28.7744140625, 30.64111328125, 32.5078125, 34.37451171875, 36.2412109375, 38.10791015625, 39.974609375, 41.84130859375, 43.7080078125, 45.57470703125, 47.44140625, 49.30810546875, 51.1748046875, 53.04150390625, 54.908203125, 56.77490234375, 58.6416015625, 60.50830078125, 62.375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 13.0, 18.0, 22.0, 51.0, 117.0, 448.0, 3049.0, 188.0, 71.0, 30.0, 16.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.74468994140625, -6.3526611328125, -5.96063232421875, -5.568603515625, -5.17657470703125, -4.7845458984375, -4.39251708984375, -4.00048828125, -3.60845947265625, -3.2164306640625, -2.82440185546875, -2.432373046875, -2.04034423828125, -1.6483154296875, -1.25628662109375, -0.8642578125, -0.47222900390625, -0.0802001953125, 0.31182861328125, 0.703857421875, 1.09588623046875, 1.4879150390625, 1.87994384765625, 2.27197265625, 2.66400146484375, 3.0560302734375, 3.44805908203125, 3.840087890625, 4.23211669921875, 4.6241455078125, 5.01617431640625, 5.408203125, 5.80023193359375, 6.1922607421875, 6.58428955078125, 6.976318359375, 7.36834716796875, 7.7603759765625, 8.15240478515625, 8.54443359375, 8.93646240234375, 9.3284912109375, 9.72052001953125, 10.112548828125, 10.50457763671875, 10.8966064453125, 11.28863525390625, 11.6806640625, 12.07269287109375, 12.4647216796875, 12.85675048828125, 13.248779296875, 13.64080810546875, 14.0328369140625, 14.42486572265625, 14.81689453125, 15.20892333984375, 15.6009521484375, 15.99298095703125, 16.385009765625, 16.77703857421875, 17.1690673828125, 17.56109619140625, 17.953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 19.0, 21.0, 32.0, 70.0, 101.0, 149.0, 154.0, 131.0, 121.0, 73.0, 61.0, 26.0, 17.0, 13.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-89.9949722290039, -88.09232330322266, -86.1896743774414, -84.28702545166016, -82.3843765258789, -80.48172760009766, -78.5790786743164, -76.67642974853516, -74.7737808227539, -72.87113189697266, -70.9684829711914, -69.06583404541016, -67.1631851196289, -65.26053619384766, -63.357887268066406, -61.455238342285156, -59.55258560180664, -57.64993667602539, -55.74728775024414, -53.84463882446289, -51.94198989868164, -50.03934097290039, -48.136688232421875, -46.234039306640625, -44.331390380859375, -42.428741455078125, -40.526092529296875, -38.623443603515625, -36.720794677734375, -34.818145751953125, -32.915496826171875, -31.012845993041992, -29.11020278930664, -27.20755386352539, -25.30490493774414, -23.40225601196289, -21.49960708618164, -19.59695816040039, -17.694307327270508, -15.791658401489258, -13.889009475708008, -11.986360549926758, -10.083711624145508, -8.181061744689941, -6.278412818908691, -4.375763893127441, -2.473114013671875, -0.570465087890625, 1.332183837890625, 3.234833002090454, 5.137482166290283, 7.040131568908691, 8.942780494689941, 10.845429420471191, 12.748079299926758, 14.650728225708008, 16.553377151489258, 18.456026077270508, 20.358675003051758, 22.26132583618164, 24.16397476196289, 26.06662368774414, 27.96927261352539, 29.87192153930664, 31.77457046508789]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 7.0, 10.0, 8.0, 10.0, 11.0, 24.0, 22.0, 26.0, 35.0, 41.0, 45.0, 49.0, 55.0, 37.0, 39.0, 45.0, 50.0, 45.0, 37.0, 46.0, 38.0, 47.0, 35.0, 35.0, 28.0, 23.0, 30.0, 14.0, 16.0, 19.0, 15.0, 18.0, 7.0, 8.0, 9.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.405664443969727, -25.60245704650879, -24.79924774169922, -23.99604034423828, -23.19283103942871, -22.389623641967773, -21.586414337158203, -20.783206939697266, -19.979997634887695, -19.176790237426758, -18.373580932617188, -17.57037353515625, -16.76716423034668, -15.963956832885742, -15.160747528076172, -14.357540130615234, -13.55433177947998, -12.751123428344727, -11.947915077209473, -11.144706726074219, -10.341498374938965, -9.538290023803711, -8.735082626342773, -7.931873798370361, -7.128665447235107, -6.3254570960998535, -5.5222487449646, -4.719040870666504, -3.915832281112671, -3.112624168395996, -2.309415817260742, -1.5062074661254883, -0.7029991149902344, 0.10020917654037476, 0.9034174680709839, 1.7066256999969482, 2.509834051132202, 3.313042163848877, 4.116250514984131, 4.919458866119385, 5.722667217254639, 6.525875568389893, 7.3290839195251465, 8.132291793823242, 8.935500144958496, 9.73870849609375, 10.541916847229004, 11.345125198364258, 12.148333549499512, 12.951541900634766, 13.75475025177002, 14.557958602905273, 15.361166954040527, 16.16437530517578, 16.96758270263672, 17.77079200744629, 18.573999404907227, 19.377206802368164, 20.180416107177734, 20.983623504638672, 21.786832809448242, 22.59004020690918, 23.39324951171875, 24.196456909179688, 24.999666213989258]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 11.0, 10.0, 13.0, 29.0, 30.0, 72.0, 142.0, 280.0, 552.0, 1234.0, 3571.0, 11198.0, 42035.0, 168499.0, 470327.0, 259883.0, 65539.0, 17063.0, 4869.0, 1750.0, 705.0, 331.0, 188.0, 98.0, 52.0, 27.0, 21.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.578125, -27.703125, -26.828125, -25.953125, -25.078125, -24.203125, -23.328125, -22.453125, -21.578125, -20.703125, -19.828125, -18.953125, -18.078125, -17.203125, -16.328125, -15.453125, -14.578125, -13.703125, -12.828125, -11.953125, -11.078125, -10.203125, -9.328125, -8.453125, -7.578125, -6.703125, -5.828125, -4.953125, -4.078125, -3.203125, -2.328125, -1.453125, -0.578125, 0.296875, 1.171875, 2.046875, 2.921875, 3.796875, 4.671875, 5.546875, 6.421875, 7.296875, 8.171875, 9.046875, 9.921875, 10.796875, 11.671875, 12.546875, 13.421875, 14.296875, 15.171875, 16.046875, 16.921875, 17.796875, 18.671875, 19.546875, 20.421875, 21.296875, 22.171875, 23.046875, 23.921875, 24.796875, 25.671875, 26.546875, 27.421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 4.0, 15.0, 10.0, 11.0, 14.0, 14.0, 30.0, 33.0, 33.0, 38.0, 34.0, 39.0, 44.0, 46.0, 39.0, 57.0, 47.0, 66.0, 44.0, 41.0, 46.0, 61.0, 38.0, 30.0, 24.0, 30.0, 24.0, 11.0, 16.0, 14.0, 9.0, 12.0, 4.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2734375, -8.977783203125, -8.68212890625, -8.386474609375, -8.0908203125, -7.795166015625, -7.49951171875, -7.203857421875, -6.908203125, -6.612548828125, -6.31689453125, -6.021240234375, -5.7255859375, -5.429931640625, -5.13427734375, -4.838623046875, -4.54296875, -4.247314453125, -3.95166015625, -3.656005859375, -3.3603515625, -3.064697265625, -2.76904296875, -2.473388671875, -2.177734375, -1.882080078125, -1.58642578125, -1.290771484375, -0.9951171875, -0.699462890625, -0.40380859375, -0.108154296875, 0.1875, 0.483154296875, 0.77880859375, 1.074462890625, 1.3701171875, 1.665771484375, 1.96142578125, 2.257080078125, 2.552734375, 2.848388671875, 3.14404296875, 3.439697265625, 3.7353515625, 4.031005859375, 4.32666015625, 4.622314453125, 4.91796875, 5.213623046875, 5.50927734375, 5.804931640625, 6.1005859375, 6.396240234375, 6.69189453125, 6.987548828125, 7.283203125, 7.578857421875, 7.87451171875, 8.170166015625, 8.4658203125, 8.761474609375, 9.05712890625, 9.352783203125, 9.6484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 15.0, 26.0, 34.0, 53.0, 79.0, 163.0, 288.0, 456.0, 833.0, 1662.0, 4774.0, 44373.0, 733209.0, 243451.0, 13688.0, 2734.0, 1184.0, 643.0, 377.0, 218.0, 121.0, 80.0, 40.0, 28.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.41796875, -36.8671875, -35.31640625, -33.765625, -32.21484375, -30.6640625, -29.11328125, -27.5625, -26.01171875, -24.4609375, -22.91015625, -21.359375, -19.80859375, -18.2578125, -16.70703125, -15.15625, -13.60546875, -12.0546875, -10.50390625, -8.953125, -7.40234375, -5.8515625, -4.30078125, -2.75, -1.19921875, 0.3515625, 1.90234375, 3.453125, 5.00390625, 6.5546875, 8.10546875, 9.65625, 11.20703125, 12.7578125, 14.30859375, 15.859375, 17.41015625, 18.9609375, 20.51171875, 22.0625, 23.61328125, 25.1640625, 26.71484375, 28.265625, 29.81640625, 31.3671875, 32.91796875, 34.46875, 36.01953125, 37.5703125, 39.12109375, 40.671875, 42.22265625, 43.7734375, 45.32421875, 46.875, 48.42578125, 49.9765625, 51.52734375, 53.078125, 54.62890625, 56.1796875, 57.73046875, 59.28125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 9.0, 15.0, 17.0, 20.0, 21.0, 42.0, 46.0, 50.0, 59.0, 70.0, 66.0, 75.0, 71.0, 74.0, 78.0, 58.0, 57.0, 46.0, 33.0, 30.0, 16.0, 15.0, 8.0, 10.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.59375, -41.77978515625, -39.9658203125, -38.15185546875, -36.337890625, -34.52392578125, -32.7099609375, -30.89599609375, -29.08203125, -27.26806640625, -25.4541015625, -23.64013671875, -21.826171875, -20.01220703125, -18.1982421875, -16.38427734375, -14.5703125, -12.75634765625, -10.9423828125, -9.12841796875, -7.314453125, -5.50048828125, -3.6865234375, -1.87255859375, -0.05859375, 1.75537109375, 3.5693359375, 5.38330078125, 7.197265625, 9.01123046875, 10.8251953125, 12.63916015625, 14.453125, 16.26708984375, 18.0810546875, 19.89501953125, 21.708984375, 23.52294921875, 25.3369140625, 27.15087890625, 28.96484375, 30.77880859375, 32.5927734375, 34.40673828125, 36.220703125, 38.03466796875, 39.8486328125, 41.66259765625, 43.4765625, 45.29052734375, 47.1044921875, 48.91845703125, 50.732421875, 52.54638671875, 54.3603515625, 56.17431640625, 57.98828125, 59.80224609375, 61.6162109375, 63.43017578125, 65.244140625, 67.05810546875, 68.8720703125, 70.68603515625, 72.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 12.0, 8.0, 10.0, 24.0, 45.0, 59.0, 89.0, 123.0, 238.0, 433.0, 850.0, 2036.0, 6585.0, 34613.0, 404461.0, 543005.0, 43727.0, 7843.0, 2284.0, 990.0, 457.0, 247.0, 126.0, 91.0, 57.0, 49.0, 27.0, 12.0, 16.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.1187744140625, -12.573486328125, -12.0281982421875, -11.48291015625, -10.9376220703125, -10.392333984375, -9.8470458984375, -9.3017578125, -8.7564697265625, -8.211181640625, -7.6658935546875, -7.12060546875, -6.5753173828125, -6.030029296875, -5.4847412109375, -4.939453125, -4.3941650390625, -3.848876953125, -3.3035888671875, -2.75830078125, -2.2130126953125, -1.667724609375, -1.1224365234375, -0.5771484375, -0.0318603515625, 0.513427734375, 1.0587158203125, 1.60400390625, 2.1492919921875, 2.694580078125, 3.2398681640625, 3.78515625, 4.3304443359375, 4.875732421875, 5.4210205078125, 5.96630859375, 6.5115966796875, 7.056884765625, 7.6021728515625, 8.1474609375, 8.6927490234375, 9.238037109375, 9.7833251953125, 10.32861328125, 10.8739013671875, 11.419189453125, 11.9644775390625, 12.509765625, 13.0550537109375, 13.600341796875, 14.1456298828125, 14.69091796875, 15.2362060546875, 15.781494140625, 16.3267822265625, 16.8720703125, 17.4173583984375, 17.962646484375, 18.5079345703125, 19.05322265625, 19.5985107421875, 20.143798828125, 20.6890869140625, 21.234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 14.0, 10.0, 14.0, 25.0, 31.0, 33.0, 54.0, 66.0, 99.0, 113.0, 127.0, 97.0, 74.0, 57.0, 45.0, 37.0, 23.0, 16.0, 10.0, 6.0, 6.0, 5.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001434326171875, -0.0013771653175354004, -0.0013200044631958008, -0.0012628436088562012, -0.0012056827545166016, -0.001148521900177002, -0.0010913610458374023, -0.0010342001914978027, -0.0009770393371582031, -0.0009198784828186035, -0.0008627176284790039, -0.0008055567741394043, -0.0007483959197998047, -0.0006912350654602051, -0.0006340742111206055, -0.0005769133567810059, -0.0005197525024414062, -0.00046259164810180664, -0.00040543079376220703, -0.0003482699394226074, -0.0002911090850830078, -0.0002339482307434082, -0.0001767873764038086, -0.00011962652206420898, -6.246566772460938e-05, -5.304813385009766e-06, 5.1856040954589844e-05, 0.00010901689529418945, 0.00016617774963378906, 0.00022333860397338867, 0.0002804994583129883, 0.0003376603126525879, 0.0003948211669921875, 0.0004519820213317871, 0.0005091428756713867, 0.0005663037300109863, 0.0006234645843505859, 0.0006806254386901855, 0.0007377862930297852, 0.0007949471473693848, 0.0008521080017089844, 0.000909268856048584, 0.0009664297103881836, 0.0010235905647277832, 0.0010807514190673828, 0.0011379122734069824, 0.001195073127746582, 0.0012522339820861816, 0.0013093948364257812, 0.0013665556907653809, 0.0014237165451049805, 0.00148087739944458, 0.0015380382537841797, 0.0015951991081237793, 0.001652359962463379, 0.0017095208168029785, 0.0017666816711425781, 0.0018238425254821777, 0.0018810033798217773, 0.001938164234161377, 0.0019953250885009766, 0.002052485942840576, 0.0021096467971801758, 0.0021668076515197754, 0.002223968505859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 14.0, 17.0, 26.0, 46.0, 55.0, 98.0, 165.0, 305.0, 585.0, 1263.0, 3653.0, 15599.0, 130711.0, 755682.0, 119440.0, 14740.0, 3647.0, 1174.0, 593.0, 299.0, 157.0, 94.0, 63.0, 33.0, 28.0, 16.0, 14.0, 8.0, 9.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.828125, -20.2724609375, -19.716796875, -19.1611328125, -18.60546875, -18.0498046875, -17.494140625, -16.9384765625, -16.3828125, -15.8271484375, -15.271484375, -14.7158203125, -14.16015625, -13.6044921875, -13.048828125, -12.4931640625, -11.9375, -11.3818359375, -10.826171875, -10.2705078125, -9.71484375, -9.1591796875, -8.603515625, -8.0478515625, -7.4921875, -6.9365234375, -6.380859375, -5.8251953125, -5.26953125, -4.7138671875, -4.158203125, -3.6025390625, -3.046875, -2.4912109375, -1.935546875, -1.3798828125, -0.82421875, -0.2685546875, 0.287109375, 0.8427734375, 1.3984375, 1.9541015625, 2.509765625, 3.0654296875, 3.62109375, 4.1767578125, 4.732421875, 5.2880859375, 5.84375, 6.3994140625, 6.955078125, 7.5107421875, 8.06640625, 8.6220703125, 9.177734375, 9.7333984375, 10.2890625, 10.8447265625, 11.400390625, 11.9560546875, 12.51171875, 13.0673828125, 13.623046875, 14.1787109375, 14.734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 13.0, 17.0, 36.0, 68.0, 133.0, 184.0, 240.0, 141.0, 57.0, 49.0, 26.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.33349609375, -18.4169921875, -17.50048828125, -16.583984375, -15.66748046875, -14.7509765625, -13.83447265625, -12.91796875, -12.00146484375, -11.0849609375, -10.16845703125, -9.251953125, -8.33544921875, -7.4189453125, -6.50244140625, -5.5859375, -4.66943359375, -3.7529296875, -2.83642578125, -1.919921875, -1.00341796875, -0.0869140625, 0.82958984375, 1.74609375, 2.66259765625, 3.5791015625, 4.49560546875, 5.412109375, 6.32861328125, 7.2451171875, 8.16162109375, 9.078125, 9.99462890625, 10.9111328125, 11.82763671875, 12.744140625, 13.66064453125, 14.5771484375, 15.49365234375, 16.41015625, 17.32666015625, 18.2431640625, 19.15966796875, 20.076171875, 20.99267578125, 21.9091796875, 22.82568359375, 23.7421875, 24.65869140625, 25.5751953125, 26.49169921875, 27.408203125, 28.32470703125, 29.2412109375, 30.15771484375, 31.07421875, 31.99072265625, 32.9072265625, 33.82373046875, 34.740234375, 35.65673828125, 36.5732421875, 37.48974609375, 38.40625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 25.0, 139.0, 441.0, 288.0, 96.0, 16.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.26541137695312, -218.94081115722656, -193.61619567871094, -168.29159545898438, -142.96697998046875, -117.64237976074219, -92.31777954101562, -66.9931640625, -41.66856384277344, -16.343957901000977, 8.980648040771484, 34.30525207519531, 59.629859924316406, 84.9544677734375, 110.27906799316406, 135.6036834716797, 160.92828369140625, 186.2528839111328, 211.57749938964844, 236.902099609375, 262.2267150878906, 287.55133056640625, 312.87591552734375, 338.2005310058594, 363.525146484375, 388.8497619628906, 414.1743469238281, 439.49896240234375, 464.8235778808594, 490.148193359375, 515.4727783203125, 540.79736328125, 566.1220092773438, 591.4465942382812, 616.771240234375, 642.0958251953125, 667.42041015625, 692.7450561523438, 718.0696411132812, 743.394287109375, 768.7188720703125, 794.04345703125, 819.3681030273438, 844.6926879882812, 870.0172729492188, 895.3419189453125, 920.66650390625, 945.9910888671875, 971.315673828125, 996.6402587890625, 1021.9649047851562, 1047.28955078125, 1072.6141357421875, 1097.938720703125, 1123.2633056640625, 1148.587890625, 1173.91259765625, 1199.2371826171875, 1224.561767578125, 1249.886474609375, 1275.2110595703125, 1300.53564453125, 1325.8602294921875, 1351.184814453125, 1376.5093994140625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 8.0, 4.0, 13.0, 6.0, 8.0, 11.0, 20.0, 29.0, 17.0, 19.0, 22.0, 26.0, 26.0, 49.0, 41.0, 36.0, 39.0, 49.0, 45.0, 42.0, 40.0, 43.0, 36.0, 48.0, 36.0, 38.0, 32.0, 27.0, 30.0, 20.0, 25.0, 15.0, 17.0, 18.0, 14.0, 5.0, 9.0, 6.0, 6.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-178.16281127929688, -173.02392578125, -167.88502502441406, -162.74612426757812, -157.60723876953125, -152.46835327148438, -147.32945251464844, -142.1905517578125, -137.05166625976562, -131.91278076171875, -126.77388000488281, -121.6349868774414, -116.49609375, -111.3572006225586, -106.21830749511719, -101.07941436767578, -95.94052124023438, -90.80162811279297, -85.66273498535156, -80.52384185791016, -75.38494873046875, -70.24605560302734, -65.10716247558594, -59.96826934814453, -54.829376220703125, -49.69048309326172, -44.55158996582031, -39.412696838378906, -34.2738037109375, -29.134910583496094, -23.996017456054688, -18.85712432861328, -13.718231201171875, -8.579338073730469, -3.4404449462890625, 1.6984481811523438, 6.83734130859375, 11.976234436035156, 17.115127563476562, 22.25402069091797, 27.392913818359375, 32.53180694580078, 37.67070007324219, 42.809593200683594, 47.948486328125, 53.087379455566406, 58.22627258300781, 63.36516571044922, 68.50405883789062, 73.64295196533203, 78.78184509277344, 83.92073822021484, 89.05963134765625, 94.19852447509766, 99.33741760253906, 104.47631072998047, 109.61520385742188, 114.75409698486328, 119.89299011230469, 125.0318832397461, 130.1707763671875, 135.30966186523438, 140.4485626220703, 145.58746337890625, 150.72634887695312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 11.0, 17.0, 18.0, 44.0, 65.0, 115.0, 141.0, 284.0, 490.0, 1038.0, 3321.0, 15871.0, 4115522.0, 48429.0, 5784.0, 1611.0, 645.0, 359.0, 201.0, 102.0, 70.0, 53.0, 28.0, 19.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-109.9375, -107.1689453125, -104.400390625, -101.6318359375, -98.86328125, -96.0947265625, -93.326171875, -90.5576171875, -87.7890625, -85.0205078125, -82.251953125, -79.4833984375, -76.71484375, -73.9462890625, -71.177734375, -68.4091796875, -65.640625, -62.8720703125, -60.103515625, -57.3349609375, -54.56640625, -51.7978515625, -49.029296875, -46.2607421875, -43.4921875, -40.7236328125, -37.955078125, -35.1865234375, -32.41796875, -29.6494140625, -26.880859375, -24.1123046875, -21.34375, -18.5751953125, -15.806640625, -13.0380859375, -10.26953125, -7.5009765625, -4.732421875, -1.9638671875, 0.8046875, 3.5732421875, 6.341796875, 9.1103515625, 11.87890625, 14.6474609375, 17.416015625, 20.1845703125, 22.953125, 25.7216796875, 28.490234375, 31.2587890625, 34.02734375, 36.7958984375, 39.564453125, 42.3330078125, 45.1015625, 47.8701171875, 50.638671875, 53.4072265625, 56.17578125, 58.9443359375, 61.712890625, 64.4814453125, 67.25]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 2.0, 1.0, 8.0, 9.0, 10.0, 13.0, 15.0, 27.0, 27.0, 32.0, 29.0, 38.0, 21.0, 45.0, 44.0, 33.0, 54.0, 58.0, 49.0, 51.0, 54.0, 45.0, 43.0, 50.0, 39.0, 31.0, 33.0, 30.0, 28.0, 16.0, 15.0, 7.0, 10.0, 5.0, 8.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.991455078125, -8.68603515625, -8.380615234375, -8.0751953125, -7.769775390625, -7.46435546875, -7.158935546875, -6.853515625, -6.548095703125, -6.24267578125, -5.937255859375, -5.6318359375, -5.326416015625, -5.02099609375, -4.715576171875, -4.41015625, -4.104736328125, -3.79931640625, -3.493896484375, -3.1884765625, -2.883056640625, -2.57763671875, -2.272216796875, -1.966796875, -1.661376953125, -1.35595703125, -1.050537109375, -0.7451171875, -0.439697265625, -0.13427734375, 0.171142578125, 0.4765625, 0.781982421875, 1.08740234375, 1.392822265625, 1.6982421875, 2.003662109375, 2.30908203125, 2.614501953125, 2.919921875, 3.225341796875, 3.53076171875, 3.836181640625, 4.1416015625, 4.447021484375, 4.75244140625, 5.057861328125, 5.36328125, 5.668701171875, 5.97412109375, 6.279541015625, 6.5849609375, 6.890380859375, 7.19580078125, 7.501220703125, 7.806640625, 8.112060546875, 8.41748046875, 8.722900390625, 9.0283203125, 9.333740234375, 9.63916015625, 9.944580078125, 10.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 6.0, 13.0, 13.0, 14.0, 13.0, 30.0, 25.0, 36.0, 42.0, 54.0, 69.0, 85.0, 125.0, 150.0, 233.0, 399.0, 925.0, 2327.0, 9396.0, 92209.0, 4059176.0, 21436.0, 4325.0, 1419.0, 595.0, 298.0, 205.0, 133.0, 105.0, 90.0, 61.0, 39.0, 43.0, 22.0, 37.0, 23.0, 22.0, 14.0, 14.0, 17.0, 7.0, 6.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0], "bins": [-67.0625, -65.2119140625, -63.361328125, -61.5107421875, -59.66015625, -57.8095703125, -55.958984375, -54.1083984375, -52.2578125, -50.4072265625, -48.556640625, -46.7060546875, -44.85546875, -43.0048828125, -41.154296875, -39.3037109375, -37.453125, -35.6025390625, -33.751953125, -31.9013671875, -30.05078125, -28.2001953125, -26.349609375, -24.4990234375, -22.6484375, -20.7978515625, -18.947265625, -17.0966796875, -15.24609375, -13.3955078125, -11.544921875, -9.6943359375, -7.84375, -5.9931640625, -4.142578125, -2.2919921875, -0.44140625, 1.4091796875, 3.259765625, 5.1103515625, 6.9609375, 8.8115234375, 10.662109375, 12.5126953125, 14.36328125, 16.2138671875, 18.064453125, 19.9150390625, 21.765625, 23.6162109375, 25.466796875, 27.3173828125, 29.16796875, 31.0185546875, 32.869140625, 34.7197265625, 36.5703125, 38.4208984375, 40.271484375, 42.1220703125, 43.97265625, 45.8232421875, 47.673828125, 49.5244140625, 51.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 20.0, 26.0, 61.0, 337.0, 3450.0, 91.0, 33.0, 19.0, 8.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6484375, -8.2745361328125, -7.900634765625, -7.5267333984375, -7.15283203125, -6.7789306640625, -6.405029296875, -6.0311279296875, -5.6572265625, -5.2833251953125, -4.909423828125, -4.5355224609375, -4.16162109375, -3.7877197265625, -3.413818359375, -3.0399169921875, -2.666015625, -2.2921142578125, -1.918212890625, -1.5443115234375, -1.17041015625, -0.7965087890625, -0.422607421875, -0.0487060546875, 0.3251953125, 0.6990966796875, 1.072998046875, 1.4468994140625, 1.82080078125, 2.1947021484375, 2.568603515625, 2.9425048828125, 3.31640625, 3.6903076171875, 4.064208984375, 4.4381103515625, 4.81201171875, 5.1859130859375, 5.559814453125, 5.9337158203125, 6.3076171875, 6.6815185546875, 7.055419921875, 7.4293212890625, 7.80322265625, 8.1771240234375, 8.551025390625, 8.9249267578125, 9.298828125, 9.6727294921875, 10.046630859375, 10.4205322265625, 10.79443359375, 11.1683349609375, 11.542236328125, 11.9161376953125, 12.2900390625, 12.6639404296875, 13.037841796875, 13.4117431640625, 13.78564453125, 14.1595458984375, 14.533447265625, 14.9073486328125, 15.28125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 7.0, 18.0, 22.0, 20.0, 42.0, 57.0, 101.0, 105.0, 109.0, 124.0, 87.0, 74.0, 63.0, 54.0, 29.0, 29.0, 14.0, 12.0, 11.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.419193267822266, -47.24048614501953, -46.0617790222168, -44.88307571411133, -43.704368591308594, -42.52566146850586, -41.346954345703125, -40.16824722290039, -38.989540100097656, -37.81083297729492, -36.63212585449219, -35.45342254638672, -34.274715423583984, -33.09600830078125, -31.917301177978516, -30.73859405517578, -29.559890747070312, -28.381183624267578, -27.202478408813477, -26.023771286010742, -24.84506607055664, -23.666358947753906, -22.487651824951172, -21.308944702148438, -20.130239486694336, -18.9515323638916, -17.7728271484375, -16.594120025634766, -15.415413856506348, -14.23670768737793, -13.058000564575195, -11.879294395446777, -10.700584411621094, -9.521878242492676, -8.343172073364258, -7.164464950561523, -5.9857587814331055, -4.8070526123046875, -3.6283459663391113, -2.449639320373535, -1.2709331512451172, -0.09222674369812012, 1.086479663848877, 2.265186071395874, 3.443892478942871, 4.622598648071289, 5.801305294036865, 6.980011940002441, 8.15871810913086, 9.337424278259277, 10.516130447387695, 11.69483757019043, 12.873543739318848, 14.052249908447266, 15.23095703125, 16.409664154052734, 17.588369369506836, 18.76707649230957, 19.945781707763672, 21.124488830566406, 22.30319595336914, 23.481901168823242, 24.660608291625977, 25.839313507080078, 27.018020629882812]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 11.0, 11.0, 10.0, 12.0, 12.0, 17.0, 23.0, 15.0, 20.0, 31.0, 30.0, 34.0, 29.0, 28.0, 34.0, 26.0, 22.0, 37.0, 34.0, 39.0, 32.0, 37.0, 48.0, 38.0, 33.0, 37.0, 33.0, 26.0, 31.0, 27.0, 22.0, 20.0, 20.0, 14.0, 14.0, 13.0, 10.0, 13.0, 10.0, 8.0, 11.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-19.241703033447266, -18.67993927001953, -18.118175506591797, -17.556411743164062, -16.994647979736328, -16.432884216308594, -15.871121406555176, -15.309357643127441, -14.747593879699707, -14.185830116271973, -13.624066352844238, -13.062302589416504, -12.500539779663086, -11.938776016235352, -11.377012252807617, -10.815248489379883, -10.253484725952148, -9.691720962524414, -9.12995719909668, -8.568193435668945, -8.006429672241211, -7.444666385650635, -6.882903099060059, -6.321139335632324, -5.75937557220459, -5.1976118087768555, -4.635848045349121, -4.074084758758545, -3.5123209953308105, -2.950557231903076, -2.388793706893921, -1.8270301818847656, -1.2652664184570312, -0.7035027742385864, -0.1417391300201416, 0.4200245141983032, 0.981788158416748, 1.5435519218444824, 2.1053154468536377, 2.667078971862793, 3.2288427352905273, 3.7906064987182617, 4.352370262145996, 4.914133548736572, 5.475897312164307, 6.037661075592041, 6.599424362182617, 7.161188125610352, 7.722951889038086, 8.28471565246582, 8.846479415893555, 9.408243179321289, 9.970006942749023, 10.531770706176758, 11.093533515930176, 11.65529727935791, 12.217061042785645, 12.778824806213379, 13.340588569641113, 13.902352333068848, 14.464115142822266, 15.02587890625, 15.587642669677734, 16.14940643310547, 16.711170196533203]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 17.0, 12.0, 38.0, 73.0, 120.0, 217.0, 428.0, 817.0, 1788.0, 4186.0, 10190.0, 27728.0, 79977.0, 236872.0, 404255.0, 183652.0, 62130.0, 21463.0, 8301.0, 3316.0, 1461.0, 692.0, 354.0, 196.0, 96.0, 56.0, 35.0, 25.0, 15.0, 10.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.166015625, -18.53515625, -17.904296875, -17.2734375, -16.642578125, -16.01171875, -15.380859375, -14.75, -14.119140625, -13.48828125, -12.857421875, -12.2265625, -11.595703125, -10.96484375, -10.333984375, -9.703125, -9.072265625, -8.44140625, -7.810546875, -7.1796875, -6.548828125, -5.91796875, -5.287109375, -4.65625, -4.025390625, -3.39453125, -2.763671875, -2.1328125, -1.501953125, -0.87109375, -0.240234375, 0.390625, 1.021484375, 1.65234375, 2.283203125, 2.9140625, 3.544921875, 4.17578125, 4.806640625, 5.4375, 6.068359375, 6.69921875, 7.330078125, 7.9609375, 8.591796875, 9.22265625, 9.853515625, 10.484375, 11.115234375, 11.74609375, 12.376953125, 13.0078125, 13.638671875, 14.26953125, 14.900390625, 15.53125, 16.162109375, 16.79296875, 17.423828125, 18.0546875, 18.685546875, 19.31640625, 19.947265625, 20.578125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 10.0, 13.0, 13.0, 19.0, 23.0, 34.0, 33.0, 40.0, 35.0, 46.0, 42.0, 53.0, 50.0, 51.0, 58.0, 39.0, 51.0, 56.0, 53.0, 44.0, 30.0, 37.0, 29.0, 15.0, 24.0, 19.0, 13.0, 10.0, 11.0, 7.0, 3.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.265625, -9.92431640625, -9.5830078125, -9.24169921875, -8.900390625, -8.55908203125, -8.2177734375, -7.87646484375, -7.53515625, -7.19384765625, -6.8525390625, -6.51123046875, -6.169921875, -5.82861328125, -5.4873046875, -5.14599609375, -4.8046875, -4.46337890625, -4.1220703125, -3.78076171875, -3.439453125, -3.09814453125, -2.7568359375, -2.41552734375, -2.07421875, -1.73291015625, -1.3916015625, -1.05029296875, -0.708984375, -0.36767578125, -0.0263671875, 0.31494140625, 0.65625, 0.99755859375, 1.3388671875, 1.68017578125, 2.021484375, 2.36279296875, 2.7041015625, 3.04541015625, 3.38671875, 3.72802734375, 4.0693359375, 4.41064453125, 4.751953125, 5.09326171875, 5.4345703125, 5.77587890625, 6.1171875, 6.45849609375, 6.7998046875, 7.14111328125, 7.482421875, 7.82373046875, 8.1650390625, 8.50634765625, 8.84765625, 9.18896484375, 9.5302734375, 9.87158203125, 10.212890625, 10.55419921875, 10.8955078125, 11.23681640625, 11.578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 10.0, 7.0, 9.0, 20.0, 22.0, 20.0, 36.0, 50.0, 76.0, 111.0, 173.0, 238.0, 347.0, 443.0, 708.0, 1154.0, 2318.0, 6471.0, 33648.0, 324858.0, 598475.0, 62309.0, 10067.0, 3040.0, 1395.0, 778.0, 538.0, 354.0, 270.0, 191.0, 115.0, 71.0, 64.0, 35.0, 26.0, 30.0, 17.0, 10.0, 12.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-31.765625, -30.745849609375, -29.72607421875, -28.706298828125, -27.6865234375, -26.666748046875, -25.64697265625, -24.627197265625, -23.607421875, -22.587646484375, -21.56787109375, -20.548095703125, -19.5283203125, -18.508544921875, -17.48876953125, -16.468994140625, -15.44921875, -14.429443359375, -13.40966796875, -12.389892578125, -11.3701171875, -10.350341796875, -9.33056640625, -8.310791015625, -7.291015625, -6.271240234375, -5.25146484375, -4.231689453125, -3.2119140625, -2.192138671875, -1.17236328125, -0.152587890625, 0.8671875, 1.886962890625, 2.90673828125, 3.926513671875, 4.9462890625, 5.966064453125, 6.98583984375, 8.005615234375, 9.025390625, 10.045166015625, 11.06494140625, 12.084716796875, 13.1044921875, 14.124267578125, 15.14404296875, 16.163818359375, 17.18359375, 18.203369140625, 19.22314453125, 20.242919921875, 21.2626953125, 22.282470703125, 23.30224609375, 24.322021484375, 25.341796875, 26.361572265625, 27.38134765625, 28.401123046875, 29.4208984375, 30.440673828125, 31.46044921875, 32.480224609375, 33.5]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 12.0, 7.0, 13.0, 17.0, 19.0, 19.0, 24.0, 42.0, 53.0, 55.0, 53.0, 53.0, 58.0, 54.0, 63.0, 54.0, 53.0, 42.0, 38.0, 51.0, 52.0, 36.0, 29.0, 24.0, 18.0, 23.0, 7.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.125, -53.56982421875, -52.0146484375, -50.45947265625, -48.904296875, -47.34912109375, -45.7939453125, -44.23876953125, -42.68359375, -41.12841796875, -39.5732421875, -38.01806640625, -36.462890625, -34.90771484375, -33.3525390625, -31.79736328125, -30.2421875, -28.68701171875, -27.1318359375, -25.57666015625, -24.021484375, -22.46630859375, -20.9111328125, -19.35595703125, -17.80078125, -16.24560546875, -14.6904296875, -13.13525390625, -11.580078125, -10.02490234375, -8.4697265625, -6.91455078125, -5.359375, -3.80419921875, -2.2490234375, -0.69384765625, 0.861328125, 2.41650390625, 3.9716796875, 5.52685546875, 7.08203125, 8.63720703125, 10.1923828125, 11.74755859375, 13.302734375, 14.85791015625, 16.4130859375, 17.96826171875, 19.5234375, 21.07861328125, 22.6337890625, 24.18896484375, 25.744140625, 27.29931640625, 28.8544921875, 30.40966796875, 31.96484375, 33.52001953125, 35.0751953125, 36.63037109375, 38.185546875, 39.74072265625, 41.2958984375, 42.85107421875, 44.40625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 9.0, 11.0, 5.0, 14.0, 28.0, 40.0, 49.0, 77.0, 119.0, 165.0, 288.0, 459.0, 798.0, 1317.0, 2793.0, 6530.0, 22286.0, 161042.0, 736286.0, 90036.0, 15713.0, 5184.0, 2346.0, 1136.0, 648.0, 424.0, 227.0, 161.0, 96.0, 66.0, 43.0, 34.0, 28.0, 13.0, 25.0, 17.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.3828125, -12.969482421875, -12.55615234375, -12.142822265625, -11.7294921875, -11.316162109375, -10.90283203125, -10.489501953125, -10.076171875, -9.662841796875, -9.24951171875, -8.836181640625, -8.4228515625, -8.009521484375, -7.59619140625, -7.182861328125, -6.76953125, -6.356201171875, -5.94287109375, -5.529541015625, -5.1162109375, -4.702880859375, -4.28955078125, -3.876220703125, -3.462890625, -3.049560546875, -2.63623046875, -2.222900390625, -1.8095703125, -1.396240234375, -0.98291015625, -0.569580078125, -0.15625, 0.257080078125, 0.67041015625, 1.083740234375, 1.4970703125, 1.910400390625, 2.32373046875, 2.737060546875, 3.150390625, 3.563720703125, 3.97705078125, 4.390380859375, 4.8037109375, 5.217041015625, 5.63037109375, 6.043701171875, 6.45703125, 6.870361328125, 7.28369140625, 7.697021484375, 8.1103515625, 8.523681640625, 8.93701171875, 9.350341796875, 9.763671875, 10.177001953125, 10.59033203125, 11.003662109375, 11.4169921875, 11.830322265625, 12.24365234375, 12.656982421875, 13.0703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 4.0, 8.0, 10.0, 15.0, 26.0, 35.0, 46.0, 91.0, 141.0, 190.0, 146.0, 96.0, 48.0, 32.0, 30.0, 18.0, 14.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002407073974609375, -0.0023307204246520996, -0.0022543668746948242, -0.002178013324737549, -0.0021016597747802734, -0.002025306224822998, -0.0019489526748657227, -0.0018725991249084473, -0.0017962455749511719, -0.0017198920249938965, -0.001643538475036621, -0.0015671849250793457, -0.0014908313751220703, -0.001414477825164795, -0.0013381242752075195, -0.0012617707252502441, -0.0011854171752929688, -0.0011090636253356934, -0.001032710075378418, -0.0009563565254211426, -0.0008800029754638672, -0.0008036494255065918, -0.0007272958755493164, -0.000650942325592041, -0.0005745887756347656, -0.0004982352256774902, -0.00042188167572021484, -0.00034552812576293945, -0.00026917457580566406, -0.00019282102584838867, -0.00011646747589111328, -4.011392593383789e-05, 3.62396240234375e-05, 0.00011259317398071289, 0.00018894672393798828, 0.00026530027389526367, 0.00034165382385253906, 0.00041800737380981445, 0.0004943609237670898, 0.0005707144737243652, 0.0006470680236816406, 0.000723421573638916, 0.0007997751235961914, 0.0008761286735534668, 0.0009524822235107422, 0.0010288357734680176, 0.001105189323425293, 0.0011815428733825684, 0.0012578964233398438, 0.0013342499732971191, 0.0014106035232543945, 0.00148695707321167, 0.0015633106231689453, 0.0016396641731262207, 0.001716017723083496, 0.0017923712730407715, 0.0018687248229980469, 0.0019450783729553223, 0.0020214319229125977, 0.002097785472869873, 0.0021741390228271484, 0.002250492572784424, 0.0023268461227416992, 0.0024031996726989746, 0.00247955322265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 9.0, 13.0, 16.0, 19.0, 33.0, 40.0, 55.0, 75.0, 97.0, 172.0, 291.0, 430.0, 718.0, 1195.0, 2318.0, 5579.0, 18537.0, 135847.0, 744524.0, 111568.0, 16597.0, 5078.0, 2202.0, 1246.0, 699.0, 369.0, 270.0, 160.0, 103.0, 76.0, 55.0, 42.0, 30.0, 14.0, 21.0, 8.0, 11.0, 9.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8984375, -14.439453125, -13.98046875, -13.521484375, -13.0625, -12.603515625, -12.14453125, -11.685546875, -11.2265625, -10.767578125, -10.30859375, -9.849609375, -9.390625, -8.931640625, -8.47265625, -8.013671875, -7.5546875, -7.095703125, -6.63671875, -6.177734375, -5.71875, -5.259765625, -4.80078125, -4.341796875, -3.8828125, -3.423828125, -2.96484375, -2.505859375, -2.046875, -1.587890625, -1.12890625, -0.669921875, -0.2109375, 0.248046875, 0.70703125, 1.166015625, 1.625, 2.083984375, 2.54296875, 3.001953125, 3.4609375, 3.919921875, 4.37890625, 4.837890625, 5.296875, 5.755859375, 6.21484375, 6.673828125, 7.1328125, 7.591796875, 8.05078125, 8.509765625, 8.96875, 9.427734375, 9.88671875, 10.345703125, 10.8046875, 11.263671875, 11.72265625, 12.181640625, 12.640625, 13.099609375, 13.55859375, 14.017578125, 14.4765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 12.0, 18.0, 27.0, 42.0, 67.0, 118.0, 174.0, 200.0, 141.0, 81.0, 38.0, 29.0, 14.0, 11.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.405517578125, -16.76416015625, -16.122802734375, -15.4814453125, -14.840087890625, -14.19873046875, -13.557373046875, -12.916015625, -12.274658203125, -11.63330078125, -10.991943359375, -10.3505859375, -9.709228515625, -9.06787109375, -8.426513671875, -7.78515625, -7.143798828125, -6.50244140625, -5.861083984375, -5.2197265625, -4.578369140625, -3.93701171875, -3.295654296875, -2.654296875, -2.012939453125, -1.37158203125, -0.730224609375, -0.0888671875, 0.552490234375, 1.19384765625, 1.835205078125, 2.4765625, 3.117919921875, 3.75927734375, 4.400634765625, 5.0419921875, 5.683349609375, 6.32470703125, 6.966064453125, 7.607421875, 8.248779296875, 8.89013671875, 9.531494140625, 10.1728515625, 10.814208984375, 11.45556640625, 12.096923828125, 12.73828125, 13.379638671875, 14.02099609375, 14.662353515625, 15.3037109375, 15.945068359375, 16.58642578125, 17.227783203125, 17.869140625, 18.510498046875, 19.15185546875, 19.793212890625, 20.4345703125, 21.075927734375, 21.71728515625, 22.358642578125, 23.0]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 13.0, 23.0, 78.0, 247.0, 405.0, 181.0, 49.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1205.760498046875, -1184.0751953125, -1162.389892578125, -1140.7044677734375, -1119.0191650390625, -1097.3338623046875, -1075.6485595703125, -1053.963134765625, -1032.27783203125, -1010.592529296875, -988.9071655273438, -967.2218627929688, -945.5364990234375, -923.8511962890625, -902.1658935546875, -880.4805297851562, -858.7952270507812, -837.1099243164062, -815.424560546875, -793.7392578125, -772.0538940429688, -750.3685913085938, -728.6832275390625, -706.9979248046875, -685.3126220703125, -663.6273193359375, -641.9419555664062, -620.2566528320312, -598.5712890625, -576.885986328125, -555.20068359375, -533.5153198242188, -511.83001708984375, -490.1446838378906, -468.4593505859375, -446.7740478515625, -425.08868408203125, -403.40338134765625, -381.7180480957031, -360.03271484375, -338.34735107421875, -316.6620178222656, -294.9766845703125, -273.2913818359375, -251.6060333251953, -229.9207000732422, -208.23538208007812, -186.550048828125, -164.86473083496094, -143.1793975830078, -121.49407196044922, -99.80874633789062, -78.1234130859375, -56.438079833984375, -34.75276184082031, -13.067428588867188, 8.617904663085938, 30.303234100341797, 51.988563537597656, 73.67388916015625, 95.35922241210938, 117.0445556640625, 138.72987365722656, 160.4152069091797, 182.1005401611328]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 11.0, 10.0, 17.0, 14.0, 16.0, 24.0, 21.0, 29.0, 25.0, 30.0, 41.0, 46.0, 37.0, 49.0, 64.0, 57.0, 51.0, 54.0, 48.0, 53.0, 45.0, 36.0, 33.0, 26.0, 31.0, 20.0, 25.0, 16.0, 8.0, 7.0, 13.0, 6.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-217.52169799804688, -211.4401397705078, -205.3585662841797, -199.27700805664062, -193.1954345703125, -187.11387634277344, -181.03231811523438, -174.95074462890625, -168.8691864013672, -162.78762817382812, -156.7060546875, -150.62449645996094, -144.54293823242188, -138.46136474609375, -132.3798065185547, -126.2982406616211, -120.2166748046875, -114.1351089477539, -108.05354309082031, -101.97198486328125, -95.89041900634766, -89.80885314941406, -83.727294921875, -77.6457290649414, -71.56416320800781, -65.48259735107422, -59.40103530883789, -53.31947326660156, -47.23790740966797, -41.156341552734375, -35.07477951049805, -28.99321746826172, -22.911636352539062, -16.8300724029541, -10.74850845336914, -4.66694450378418, 1.4146194458007812, 7.496183395385742, 13.577747344970703, 19.65930938720703, 25.740875244140625, 31.822439193725586, 37.90400314331055, 43.985565185546875, 50.06713104248047, 56.14869689941406, 62.23025894165039, 68.31182098388672, 74.39338684082031, 80.4749526977539, 86.5565185546875, 92.63807678222656, 98.71964263916016, 104.80120849609375, 110.88276672363281, 116.9643325805664, 123.0458984375, 129.12745666503906, 135.2090301513672, 141.29058837890625, 147.37216186523438, 153.45372009277344, 159.5352783203125, 165.61685180664062, 171.6984100341797]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 1.0, 4.0, 7.0, 11.0, 9.0, 17.0, 25.0, 30.0, 31.0, 55.0, 64.0, 81.0, 99.0, 137.0, 162.0, 306.0, 459.0, 803.0, 1498.0, 2904.0, 7437.0, 28103.0, 3862896.0, 258001.0, 19475.0, 6013.0, 2430.0, 1206.0, 682.0, 403.0, 251.0, 185.0, 119.0, 80.0, 58.0, 50.0, 52.0, 30.0, 36.0, 23.0, 19.0, 13.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.375, -41.0458984375, -39.716796875, -38.3876953125, -37.05859375, -35.7294921875, -34.400390625, -33.0712890625, -31.7421875, -30.4130859375, -29.083984375, -27.7548828125, -26.42578125, -25.0966796875, -23.767578125, -22.4384765625, -21.109375, -19.7802734375, -18.451171875, -17.1220703125, -15.79296875, -14.4638671875, -13.134765625, -11.8056640625, -10.4765625, -9.1474609375, -7.818359375, -6.4892578125, -5.16015625, -3.8310546875, -2.501953125, -1.1728515625, 0.15625, 1.4853515625, 2.814453125, 4.1435546875, 5.47265625, 6.8017578125, 8.130859375, 9.4599609375, 10.7890625, 12.1181640625, 13.447265625, 14.7763671875, 16.10546875, 17.4345703125, 18.763671875, 20.0927734375, 21.421875, 22.7509765625, 24.080078125, 25.4091796875, 26.73828125, 28.0673828125, 29.396484375, 30.7255859375, 32.0546875, 33.3837890625, 34.712890625, 36.0419921875, 37.37109375, 38.7001953125, 40.029296875, 41.3583984375, 42.6875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 9.0, 7.0, 9.0, 12.0, 10.0, 18.0, 25.0, 25.0, 40.0, 33.0, 48.0, 47.0, 49.0, 45.0, 51.0, 61.0, 46.0, 58.0, 57.0, 49.0, 47.0, 49.0, 32.0, 28.0, 24.0, 19.0, 18.0, 17.0, 18.0, 12.0, 10.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.984375, -11.65966796875, -11.3349609375, -11.01025390625, -10.685546875, -10.36083984375, -10.0361328125, -9.71142578125, -9.38671875, -9.06201171875, -8.7373046875, -8.41259765625, -8.087890625, -7.76318359375, -7.4384765625, -7.11376953125, -6.7890625, -6.46435546875, -6.1396484375, -5.81494140625, -5.490234375, -5.16552734375, -4.8408203125, -4.51611328125, -4.19140625, -3.86669921875, -3.5419921875, -3.21728515625, -2.892578125, -2.56787109375, -2.2431640625, -1.91845703125, -1.59375, -1.26904296875, -0.9443359375, -0.61962890625, -0.294921875, 0.02978515625, 0.3544921875, 0.67919921875, 1.00390625, 1.32861328125, 1.6533203125, 1.97802734375, 2.302734375, 2.62744140625, 2.9521484375, 3.27685546875, 3.6015625, 3.92626953125, 4.2509765625, 4.57568359375, 4.900390625, 5.22509765625, 5.5498046875, 5.87451171875, 6.19921875, 6.52392578125, 6.8486328125, 7.17333984375, 7.498046875, 7.82275390625, 8.1474609375, 8.47216796875, 8.796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 12.0, 15.0, 21.0, 33.0, 43.0, 56.0, 60.0, 106.0, 121.0, 177.0, 303.0, 503.0, 942.0, 2184.0, 6296.0, 25475.0, 3731981.0, 397021.0, 19553.0, 5216.0, 1893.0, 832.0, 456.0, 274.0, 174.0, 128.0, 99.0, 69.0, 56.0, 37.0, 26.0, 23.0, 13.0, 18.0, 14.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.9375, -44.49853515625, -43.0595703125, -41.62060546875, -40.181640625, -38.74267578125, -37.3037109375, -35.86474609375, -34.42578125, -32.98681640625, -31.5478515625, -30.10888671875, -28.669921875, -27.23095703125, -25.7919921875, -24.35302734375, -22.9140625, -21.47509765625, -20.0361328125, -18.59716796875, -17.158203125, -15.71923828125, -14.2802734375, -12.84130859375, -11.40234375, -9.96337890625, -8.5244140625, -7.08544921875, -5.646484375, -4.20751953125, -2.7685546875, -1.32958984375, 0.109375, 1.54833984375, 2.9873046875, 4.42626953125, 5.865234375, 7.30419921875, 8.7431640625, 10.18212890625, 11.62109375, 13.06005859375, 14.4990234375, 15.93798828125, 17.376953125, 18.81591796875, 20.2548828125, 21.69384765625, 23.1328125, 24.57177734375, 26.0107421875, 27.44970703125, 28.888671875, 30.32763671875, 31.7666015625, 33.20556640625, 34.64453125, 36.08349609375, 37.5224609375, 38.96142578125, 40.400390625, 41.83935546875, 43.2783203125, 44.71728515625, 46.15625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 11.0, 12.0, 18.0, 28.0, 66.0, 336.0, 3280.0, 188.0, 60.0, 34.0, 14.0, 8.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.2679443359375, -8.621826171875, -7.9757080078125, -7.32958984375, -6.6834716796875, -6.037353515625, -5.3912353515625, -4.7451171875, -4.0989990234375, -3.452880859375, -2.8067626953125, -2.16064453125, -1.5145263671875, -0.868408203125, -0.2222900390625, 0.423828125, 1.0699462890625, 1.716064453125, 2.3621826171875, 3.00830078125, 3.6544189453125, 4.300537109375, 4.9466552734375, 5.5927734375, 6.2388916015625, 6.885009765625, 7.5311279296875, 8.17724609375, 8.8233642578125, 9.469482421875, 10.1156005859375, 10.76171875, 11.4078369140625, 12.053955078125, 12.7000732421875, 13.34619140625, 13.9923095703125, 14.638427734375, 15.2845458984375, 15.9306640625, 16.5767822265625, 17.222900390625, 17.8690185546875, 18.51513671875, 19.1612548828125, 19.807373046875, 20.4534912109375, 21.099609375, 21.7457275390625, 22.391845703125, 23.0379638671875, 23.68408203125, 24.3302001953125, 24.976318359375, 25.6224365234375, 26.2685546875, 26.9146728515625, 27.560791015625, 28.2069091796875, 28.85302734375, 29.4991455078125, 30.145263671875, 30.7913818359375, 31.4375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 14.0, 23.0, 40.0, 51.0, 58.0, 91.0, 115.0, 106.0, 116.0, 100.0, 69.0, 63.0, 43.0, 34.0, 15.0, 15.0, 12.0, 4.0, 7.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.596824645996094, -38.90652084350586, -37.21621322631836, -35.525909423828125, -33.83560562133789, -32.145301818847656, -30.454994201660156, -28.764690399169922, -27.074386596679688, -25.38408088684082, -23.693777084350586, -22.00347137451172, -20.313167572021484, -18.622861862182617, -16.93255615234375, -15.242252349853516, -13.551946640014648, -11.861641883850098, -10.171337127685547, -8.48103141784668, -6.790727138519287, -5.100421905517578, -3.4101171493530273, -1.7198123931884766, -0.02950763702392578, 1.6607972383499146, 3.351102113723755, 5.041407108306885, 6.7317118644714355, 8.422017097473145, 10.112321853637695, 11.802626609802246, 13.492931365966797, 15.183236122131348, 16.8735408782959, 18.563846588134766, 20.254150390625, 21.944456100463867, 23.634761810302734, 25.32506561279297, 27.015369415283203, 28.70567512512207, 30.395978927612305, 32.08628463745117, 33.776588439941406, 35.466896057128906, 37.15719985961914, 38.847503662109375, 40.537811279296875, 42.22811508178711, 43.91842269897461, 45.608726501464844, 47.29903030395508, 48.98933410644531, 50.67964172363281, 52.36994552612305, 54.06024932861328, 55.750553131103516, 57.440860748291016, 59.13116455078125, 60.821468353271484, 62.51177215576172, 64.20207977294922, 65.89237976074219, 67.58268737792969]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 2.0, 8.0, 8.0, 13.0, 14.0, 20.0, 32.0, 39.0, 44.0, 45.0, 60.0, 57.0, 60.0, 64.0, 87.0, 57.0, 62.0, 45.0, 58.0, 47.0, 41.0, 26.0, 19.0, 25.0, 13.0, 15.0, 7.0, 6.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.510215759277344, -42.01044845581055, -40.510677337646484, -39.01091003417969, -37.511138916015625, -36.01137161254883, -34.51160430908203, -33.01183319091797, -31.51206398010254, -30.01229476928711, -28.51252555847168, -27.01275634765625, -25.512989044189453, -24.01321792602539, -22.513450622558594, -21.013681411743164, -19.513912200927734, -18.014142990112305, -16.514373779296875, -15.014605522155762, -13.514836311340332, -12.015067100524902, -10.515298843383789, -9.01552963256836, -7.51576042175293, -6.0159912109375, -4.5162224769592285, -3.016453742980957, -1.5166845321655273, -0.016915321350097656, 1.4828529357910156, 2.9826221466064453, 4.482391357421875, 5.982160568237305, 7.481929302215576, 8.981698036193848, 10.481467247009277, 11.981236457824707, 13.48100471496582, 14.98077392578125, 16.48054313659668, 17.98031234741211, 19.48008155822754, 20.97985076904297, 22.479618072509766, 23.979389190673828, 25.479156494140625, 26.978925704956055, 28.478694915771484, 29.978464126586914, 31.478233337402344, 32.97800064086914, 34.4777717590332, 35.9775390625, 37.47731018066406, 38.97707748413086, 40.476844787597656, 41.97661209106445, 43.476383209228516, 44.97615051269531, 46.475921630859375, 47.97568893432617, 49.47545623779297, 50.97522735595703, 52.474998474121094]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 6.0, 3.0, 12.0, 13.0, 23.0, 32.0, 53.0, 85.0, 124.0, 187.0, 329.0, 499.0, 869.0, 1549.0, 2925.0, 5946.0, 12910.0, 29176.0, 69268.0, 161973.0, 337900.0, 241252.0, 103173.0, 43808.0, 18909.0, 8463.0, 4073.0, 2094.0, 1205.0, 650.0, 376.0, 235.0, 145.0, 107.0, 66.0, 46.0, 26.0, 12.0, 15.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.609375, -21.918701171875, -21.22802734375, -20.537353515625, -19.8466796875, -19.156005859375, -18.46533203125, -17.774658203125, -17.083984375, -16.393310546875, -15.70263671875, -15.011962890625, -14.3212890625, -13.630615234375, -12.93994140625, -12.249267578125, -11.55859375, -10.867919921875, -10.17724609375, -9.486572265625, -8.7958984375, -8.105224609375, -7.41455078125, -6.723876953125, -6.033203125, -5.342529296875, -4.65185546875, -3.961181640625, -3.2705078125, -2.579833984375, -1.88916015625, -1.198486328125, -0.5078125, 0.182861328125, 0.87353515625, 1.564208984375, 2.2548828125, 2.945556640625, 3.63623046875, 4.326904296875, 5.017578125, 5.708251953125, 6.39892578125, 7.089599609375, 7.7802734375, 8.470947265625, 9.16162109375, 9.852294921875, 10.54296875, 11.233642578125, 11.92431640625, 12.614990234375, 13.3056640625, 13.996337890625, 14.68701171875, 15.377685546875, 16.068359375, 16.759033203125, 17.44970703125, 18.140380859375, 18.8310546875, 19.521728515625, 20.21240234375, 20.903076171875, 21.59375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 5.0, 4.0, 8.0, 12.0, 11.0, 19.0, 13.0, 25.0, 26.0, 32.0, 32.0, 40.0, 36.0, 44.0, 40.0, 31.0, 54.0, 53.0, 46.0, 42.0, 48.0, 54.0, 33.0, 41.0, 36.0, 38.0, 32.0, 18.0, 27.0, 16.0, 19.0, 10.0, 14.0, 6.0, 7.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8203125, -10.51025390625, -10.2001953125, -9.89013671875, -9.580078125, -9.27001953125, -8.9599609375, -8.64990234375, -8.33984375, -8.02978515625, -7.7197265625, -7.40966796875, -7.099609375, -6.78955078125, -6.4794921875, -6.16943359375, -5.859375, -5.54931640625, -5.2392578125, -4.92919921875, -4.619140625, -4.30908203125, -3.9990234375, -3.68896484375, -3.37890625, -3.06884765625, -2.7587890625, -2.44873046875, -2.138671875, -1.82861328125, -1.5185546875, -1.20849609375, -0.8984375, -0.58837890625, -0.2783203125, 0.03173828125, 0.341796875, 0.65185546875, 0.9619140625, 1.27197265625, 1.58203125, 1.89208984375, 2.2021484375, 2.51220703125, 2.822265625, 3.13232421875, 3.4423828125, 3.75244140625, 4.0625, 4.37255859375, 4.6826171875, 4.99267578125, 5.302734375, 5.61279296875, 5.9228515625, 6.23291015625, 6.54296875, 6.85302734375, 7.1630859375, 7.47314453125, 7.783203125, 8.09326171875, 8.4033203125, 8.71337890625, 9.0234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 14.0, 18.0, 16.0, 27.0, 42.0, 44.0, 77.0, 115.0, 170.0, 255.0, 442.0, 814.0, 1865.0, 5990.0, 31811.0, 339280.0, 600206.0, 53926.0, 8566.0, 2526.0, 938.0, 498.0, 286.0, 193.0, 127.0, 73.0, 55.0, 52.0, 30.0, 16.0, 19.0, 13.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.625, -45.126953125, -43.62890625, -42.130859375, -40.6328125, -39.134765625, -37.63671875, -36.138671875, -34.640625, -33.142578125, -31.64453125, -30.146484375, -28.6484375, -27.150390625, -25.65234375, -24.154296875, -22.65625, -21.158203125, -19.66015625, -18.162109375, -16.6640625, -15.166015625, -13.66796875, -12.169921875, -10.671875, -9.173828125, -7.67578125, -6.177734375, -4.6796875, -3.181640625, -1.68359375, -0.185546875, 1.3125, 2.810546875, 4.30859375, 5.806640625, 7.3046875, 8.802734375, 10.30078125, 11.798828125, 13.296875, 14.794921875, 16.29296875, 17.791015625, 19.2890625, 20.787109375, 22.28515625, 23.783203125, 25.28125, 26.779296875, 28.27734375, 29.775390625, 31.2734375, 32.771484375, 34.26953125, 35.767578125, 37.265625, 38.763671875, 40.26171875, 41.759765625, 43.2578125, 44.755859375, 46.25390625, 47.751953125, 49.25]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 11.0, 16.0, 22.0, 16.0, 15.0, 23.0, 29.0, 30.0, 27.0, 27.0, 33.0, 29.0, 41.0, 47.0, 51.0, 48.0, 38.0, 47.0, 56.0, 52.0, 48.0, 38.0, 24.0, 37.0, 29.0, 30.0, 12.0, 16.0, 18.0, 18.0, 10.0, 7.0, 9.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-45.1875, -43.9326171875, -42.677734375, -41.4228515625, -40.16796875, -38.9130859375, -37.658203125, -36.4033203125, -35.1484375, -33.8935546875, -32.638671875, -31.3837890625, -30.12890625, -28.8740234375, -27.619140625, -26.3642578125, -25.109375, -23.8544921875, -22.599609375, -21.3447265625, -20.08984375, -18.8349609375, -17.580078125, -16.3251953125, -15.0703125, -13.8154296875, -12.560546875, -11.3056640625, -10.05078125, -8.7958984375, -7.541015625, -6.2861328125, -5.03125, -3.7763671875, -2.521484375, -1.2666015625, -0.01171875, 1.2431640625, 2.498046875, 3.7529296875, 5.0078125, 6.2626953125, 7.517578125, 8.7724609375, 10.02734375, 11.2822265625, 12.537109375, 13.7919921875, 15.046875, 16.3017578125, 17.556640625, 18.8115234375, 20.06640625, 21.3212890625, 22.576171875, 23.8310546875, 25.0859375, 26.3408203125, 27.595703125, 28.8505859375, 30.10546875, 31.3603515625, 32.615234375, 33.8701171875, 35.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 11.0, 21.0, 15.0, 35.0, 38.0, 64.0, 89.0, 129.0, 210.0, 328.0, 523.0, 1007.0, 2122.0, 4875.0, 13264.0, 44023.0, 177114.0, 584329.0, 158966.0, 39975.0, 12414.0, 4636.0, 1956.0, 1004.0, 494.0, 283.0, 192.0, 123.0, 73.0, 62.0, 43.0, 28.0, 16.0, 21.0, 9.0, 10.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-10.71875, -10.41650390625, -10.1142578125, -9.81201171875, -9.509765625, -9.20751953125, -8.9052734375, -8.60302734375, -8.30078125, -7.99853515625, -7.6962890625, -7.39404296875, -7.091796875, -6.78955078125, -6.4873046875, -6.18505859375, -5.8828125, -5.58056640625, -5.2783203125, -4.97607421875, -4.673828125, -4.37158203125, -4.0693359375, -3.76708984375, -3.46484375, -3.16259765625, -2.8603515625, -2.55810546875, -2.255859375, -1.95361328125, -1.6513671875, -1.34912109375, -1.046875, -0.74462890625, -0.4423828125, -0.14013671875, 0.162109375, 0.46435546875, 0.7666015625, 1.06884765625, 1.37109375, 1.67333984375, 1.9755859375, 2.27783203125, 2.580078125, 2.88232421875, 3.1845703125, 3.48681640625, 3.7890625, 4.09130859375, 4.3935546875, 4.69580078125, 4.998046875, 5.30029296875, 5.6025390625, 5.90478515625, 6.20703125, 6.50927734375, 6.8115234375, 7.11376953125, 7.416015625, 7.71826171875, 8.0205078125, 8.32275390625, 8.625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 7.0, 9.0, 21.0, 19.0, 33.0, 56.0, 57.0, 83.0, 198.0, 179.0, 95.0, 69.0, 45.0, 25.0, 25.0, 18.0, 9.0, 11.0, 5.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00411224365234375, -0.004006743431091309, -0.003901243209838867, -0.0037957429885864258, -0.0036902427673339844, -0.003584742546081543, -0.0034792423248291016, -0.00337374210357666, -0.0032682418823242188, -0.0031627416610717773, -0.003057241439819336, -0.0029517412185668945, -0.002846240997314453, -0.0027407407760620117, -0.0026352405548095703, -0.002529740333557129, -0.0024242401123046875, -0.002318739891052246, -0.0022132396697998047, -0.0021077394485473633, -0.002002239227294922, -0.0018967390060424805, -0.001791238784790039, -0.0016857385635375977, -0.0015802383422851562, -0.0014747381210327148, -0.0013692378997802734, -0.001263737678527832, -0.0011582374572753906, -0.0010527372360229492, -0.0009472370147705078, -0.0008417367935180664, -0.000736236572265625, -0.0006307363510131836, -0.0005252361297607422, -0.0004197359085083008, -0.0003142356872558594, -0.00020873546600341797, -0.00010323524475097656, 2.2649765014648438e-06, 0.00010776519775390625, 0.00021326541900634766, 0.00031876564025878906, 0.00042426586151123047, 0.0005297660827636719, 0.0006352663040161133, 0.0007407665252685547, 0.0008462667465209961, 0.0009517669677734375, 0.001057267189025879, 0.0011627674102783203, 0.0012682676315307617, 0.0013737678527832031, 0.0014792680740356445, 0.001584768295288086, 0.0016902685165405273, 0.0017957687377929688, 0.0019012689590454102, 0.0020067691802978516, 0.002112269401550293, 0.0022177696228027344, 0.0023232698440551758, 0.002428770065307617, 0.0025342702865600586, 0.0026397705078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 12.0, 19.0, 39.0, 42.0, 66.0, 98.0, 153.0, 292.0, 527.0, 1187.0, 3305.0, 12039.0, 72217.0, 683106.0, 238393.0, 27326.0, 6133.0, 1895.0, 746.0, 347.0, 190.0, 107.0, 71.0, 53.0, 40.0, 36.0, 20.0, 15.0, 10.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.6875, -16.177978515625, -15.66845703125, -15.158935546875, -14.6494140625, -14.139892578125, -13.63037109375, -13.120849609375, -12.611328125, -12.101806640625, -11.59228515625, -11.082763671875, -10.5732421875, -10.063720703125, -9.55419921875, -9.044677734375, -8.53515625, -8.025634765625, -7.51611328125, -7.006591796875, -6.4970703125, -5.987548828125, -5.47802734375, -4.968505859375, -4.458984375, -3.949462890625, -3.43994140625, -2.930419921875, -2.4208984375, -1.911376953125, -1.40185546875, -0.892333984375, -0.3828125, 0.126708984375, 0.63623046875, 1.145751953125, 1.6552734375, 2.164794921875, 2.67431640625, 3.183837890625, 3.693359375, 4.202880859375, 4.71240234375, 5.221923828125, 5.7314453125, 6.240966796875, 6.75048828125, 7.260009765625, 7.76953125, 8.279052734375, 8.78857421875, 9.298095703125, 9.8076171875, 10.317138671875, 10.82666015625, 11.336181640625, 11.845703125, 12.355224609375, 12.86474609375, 13.374267578125, 13.8837890625, 14.393310546875, 14.90283203125, 15.412353515625, 15.921875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 12.0, 10.0, 9.0, 20.0, 16.0, 26.0, 34.0, 52.0, 49.0, 71.0, 81.0, 93.0, 113.0, 79.0, 57.0, 67.0, 47.0, 32.0, 22.0, 27.0, 15.0, 10.0, 6.0, 11.0, 2.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.9244384765625, -13.528564453125, -13.1326904296875, -12.73681640625, -12.3409423828125, -11.945068359375, -11.5491943359375, -11.1533203125, -10.7574462890625, -10.361572265625, -9.9656982421875, -9.56982421875, -9.1739501953125, -8.778076171875, -8.3822021484375, -7.986328125, -7.5904541015625, -7.194580078125, -6.7987060546875, -6.40283203125, -6.0069580078125, -5.611083984375, -5.2152099609375, -4.8193359375, -4.4234619140625, -4.027587890625, -3.6317138671875, -3.23583984375, -2.8399658203125, -2.444091796875, -2.0482177734375, -1.65234375, -1.2564697265625, -0.860595703125, -0.4647216796875, -0.06884765625, 0.3270263671875, 0.722900390625, 1.1187744140625, 1.5146484375, 1.9105224609375, 2.306396484375, 2.7022705078125, 3.09814453125, 3.4940185546875, 3.889892578125, 4.2857666015625, 4.681640625, 5.0775146484375, 5.473388671875, 5.8692626953125, 6.26513671875, 6.6610107421875, 7.056884765625, 7.4527587890625, 7.8486328125, 8.2445068359375, 8.640380859375, 9.0362548828125, 9.43212890625, 9.8280029296875, 10.223876953125, 10.6197509765625, 11.015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 12.0, 25.0, 42.0, 63.0, 101.0, 128.0, 147.0, 122.0, 101.0, 93.0, 48.0, 42.0, 27.0, 16.0, 12.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-323.1836242675781, -314.6053161621094, -306.0269775390625, -297.44866943359375, -288.870361328125, -280.29205322265625, -271.7137451171875, -263.1354064941406, -254.55709838867188, -245.97879028320312, -237.4004669189453, -228.8221435546875, -220.24383544921875, -211.66552734375, -203.0872039794922, -194.50888061523438, -185.93057250976562, -177.35226440429688, -168.77394104003906, -160.19561767578125, -151.6173095703125, -143.03900146484375, -134.46067810058594, -125.88236236572266, -117.30404663085938, -108.7257308959961, -100.14741516113281, -91.56909942626953, -82.99078369140625, -74.41246795654297, -65.83415222167969, -57.255836486816406, -48.67755126953125, -40.09923553466797, -31.520919799804688, -22.942604064941406, -14.364288330078125, -5.785972595214844, 2.7923431396484375, 11.370658874511719, 19.948974609375, 28.52729034423828, 37.10560607910156, 45.683921813964844, 54.262237548828125, 62.840553283691406, 71.41886901855469, 79.99718475341797, 88.57550048828125, 97.15381622314453, 105.73213195800781, 114.3104476928711, 122.88876342773438, 131.46707153320312, 140.04539489746094, 148.62371826171875, 157.2020263671875, 165.78033447265625, 174.35865783691406, 182.93698120117188, 191.51528930664062, 200.09359741210938, 208.6719207763672, 217.250244140625, 225.82855224609375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 7.0, 6.0, 10.0, 15.0, 13.0, 11.0, 14.0, 29.0, 22.0, 31.0, 39.0, 44.0, 45.0, 56.0, 57.0, 56.0, 55.0, 67.0, 55.0, 43.0, 47.0, 37.0, 34.0, 34.0, 34.0, 26.0, 25.0, 15.0, 14.0, 16.0, 13.0, 8.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.02838134765625, -204.46856689453125, -197.90875244140625, -191.34893798828125, -184.78912353515625, -178.22930908203125, -171.66949462890625, -165.10968017578125, -158.54986572265625, -151.99005126953125, -145.43023681640625, -138.87042236328125, -132.31060791015625, -125.75079345703125, -119.19097900390625, -112.63116455078125, -106.07135772705078, -99.51154327392578, -92.95172882080078, -86.39191436767578, -79.83209991455078, -73.27229309082031, -66.71247863769531, -60.15266036987305, -53.59284591674805, -47.03303146362305, -40.47321701049805, -33.91340637207031, -27.35359001159668, -20.793777465820312, -14.233963012695312, -7.6741485595703125, -1.1143341064453125, 5.445479869842529, 12.005293846130371, 18.565107345581055, 25.124921798706055, 31.684734344482422, 38.24454879760742, 44.80436325073242, 51.36417770385742, 57.92399215698242, 64.48380279541016, 71.04361724853516, 77.60343170166016, 84.16324615478516, 90.72306060791016, 97.28287506103516, 103.84268951416016, 110.40250396728516, 116.96231842041016, 123.52213287353516, 130.08193969726562, 136.64175415039062, 143.20156860351562, 149.76138305664062, 156.32119750976562, 162.88101196289062, 169.44082641601562, 176.00064086914062, 182.56045532226562, 189.12026977539062, 195.68008422851562, 202.23989868164062, 208.79971313476562]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 13.0, 9.0, 13.0, 18.0, 33.0, 40.0, 40.0, 92.0, 106.0, 187.0, 310.0, 590.0, 1064.0, 2054.0, 4515.0, 10056.0, 25994.0, 80283.0, 558579.0, 3138987.0, 277329.0, 58158.0, 20265.0, 8218.0, 3666.0, 1715.0, 878.0, 487.0, 239.0, 128.0, 73.0, 44.0, 35.0, 20.0, 13.0, 8.0, 5.0, 9.0, 2.0, 1.0], "bins": [-28.28125, -27.6290283203125, -26.976806640625, -26.3245849609375, -25.67236328125, -25.0201416015625, -24.367919921875, -23.7156982421875, -23.0634765625, -22.4112548828125, -21.759033203125, -21.1068115234375, -20.45458984375, -19.8023681640625, -19.150146484375, -18.4979248046875, -17.845703125, -17.1934814453125, -16.541259765625, -15.8890380859375, -15.23681640625, -14.5845947265625, -13.932373046875, -13.2801513671875, -12.6279296875, -11.9757080078125, -11.323486328125, -10.6712646484375, -10.01904296875, -9.3668212890625, -8.714599609375, -8.0623779296875, -7.41015625, -6.7579345703125, -6.105712890625, -5.4534912109375, -4.80126953125, -4.1490478515625, -3.496826171875, -2.8446044921875, -2.1923828125, -1.5401611328125, -0.887939453125, -0.2357177734375, 0.41650390625, 1.0687255859375, 1.720947265625, 2.3731689453125, 3.025390625, 3.6776123046875, 4.329833984375, 4.9820556640625, 5.63427734375, 6.2864990234375, 6.938720703125, 7.5909423828125, 8.2431640625, 8.8953857421875, 9.547607421875, 10.1998291015625, 10.85205078125, 11.5042724609375, 12.156494140625, 12.8087158203125, 13.4609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 12.0, 15.0, 10.0, 25.0, 36.0, 34.0, 61.0, 68.0, 106.0, 95.0, 96.0, 90.0, 89.0, 66.0, 67.0, 44.0, 33.0, 16.0, 19.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.46875, -25.9085693359375, -25.348388671875, -24.7882080078125, -24.22802734375, -23.6678466796875, -23.107666015625, -22.5474853515625, -21.9873046875, -21.4271240234375, -20.866943359375, -20.3067626953125, -19.74658203125, -19.1864013671875, -18.626220703125, -18.0660400390625, -17.505859375, -16.9456787109375, -16.385498046875, -15.8253173828125, -15.26513671875, -14.7049560546875, -14.144775390625, -13.5845947265625, -13.0244140625, -12.4642333984375, -11.904052734375, -11.3438720703125, -10.78369140625, -10.2235107421875, -9.663330078125, -9.1031494140625, -8.54296875, -7.9827880859375, -7.422607421875, -6.8624267578125, -6.30224609375, -5.7420654296875, -5.181884765625, -4.6217041015625, -4.0615234375, -3.5013427734375, -2.941162109375, -2.3809814453125, -1.82080078125, -1.2606201171875, -0.700439453125, -0.1402587890625, 0.419921875, 0.9801025390625, 1.540283203125, 2.1004638671875, 2.66064453125, 3.2208251953125, 3.781005859375, 4.3411865234375, 4.9013671875, 5.4615478515625, 6.021728515625, 6.5819091796875, 7.14208984375, 7.7022705078125, 8.262451171875, 8.8226318359375, 9.3828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 7.0, 14.0, 17.0, 27.0, 42.0, 67.0, 162.0, 292.0, 706.0, 1807.0, 5597.0, 21024.0, 128700.0, 3454732.0, 520909.0, 44914.0, 10075.0, 2995.0, 1183.0, 480.0, 223.0, 125.0, 68.0, 33.0, 20.0, 14.0, 9.0, 14.0, 7.0, 4.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.33251953125, -26.2275390625, -25.12255859375, -24.017578125, -22.91259765625, -21.8076171875, -20.70263671875, -19.59765625, -18.49267578125, -17.3876953125, -16.28271484375, -15.177734375, -14.07275390625, -12.9677734375, -11.86279296875, -10.7578125, -9.65283203125, -8.5478515625, -7.44287109375, -6.337890625, -5.23291015625, -4.1279296875, -3.02294921875, -1.91796875, -0.81298828125, 0.2919921875, 1.39697265625, 2.501953125, 3.60693359375, 4.7119140625, 5.81689453125, 6.921875, 8.02685546875, 9.1318359375, 10.23681640625, 11.341796875, 12.44677734375, 13.5517578125, 14.65673828125, 15.76171875, 16.86669921875, 17.9716796875, 19.07666015625, 20.181640625, 21.28662109375, 22.3916015625, 23.49658203125, 24.6015625, 25.70654296875, 26.8115234375, 27.91650390625, 29.021484375, 30.12646484375, 31.2314453125, 32.33642578125, 33.44140625, 34.54638671875, 35.6513671875, 36.75634765625, 37.861328125, 38.96630859375, 40.0712890625, 41.17626953125, 42.28125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 8.0, 8.0, 12.0, 11.0, 20.0, 25.0, 37.0, 55.0, 87.0, 142.0, 310.0, 651.0, 1208.0, 707.0, 346.0, 146.0, 101.0, 68.0, 44.0, 26.0, 13.0, 10.0, 8.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.625, -32.591796875, -31.55859375, -30.525390625, -29.4921875, -28.458984375, -27.42578125, -26.392578125, -25.359375, -24.326171875, -23.29296875, -22.259765625, -21.2265625, -20.193359375, -19.16015625, -18.126953125, -17.09375, -16.060546875, -15.02734375, -13.994140625, -12.9609375, -11.927734375, -10.89453125, -9.861328125, -8.828125, -7.794921875, -6.76171875, -5.728515625, -4.6953125, -3.662109375, -2.62890625, -1.595703125, -0.5625, 0.470703125, 1.50390625, 2.537109375, 3.5703125, 4.603515625, 5.63671875, 6.669921875, 7.703125, 8.736328125, 9.76953125, 10.802734375, 11.8359375, 12.869140625, 13.90234375, 14.935546875, 15.96875, 17.001953125, 18.03515625, 19.068359375, 20.1015625, 21.134765625, 22.16796875, 23.201171875, 24.234375, 25.267578125, 26.30078125, 27.333984375, 28.3671875, 29.400390625, 30.43359375, 31.466796875, 32.5]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 19.0, 29.0, 46.0, 60.0, 107.0, 128.0, 173.0, 149.0, 100.0, 66.0, 39.0, 21.0, 9.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-175.53738403320312, -168.53370666503906, -161.53001403808594, -154.52633666992188, -147.5226593017578, -140.5189666748047, -133.51528930664062, -126.51160430908203, -119.50791931152344, -112.50423431396484, -105.50055694580078, -98.49687194824219, -91.4931869506836, -84.489501953125, -77.48582458496094, -70.48213958740234, -63.47846221923828, -56.47478103637695, -49.47109603881836, -42.46741485595703, -35.46372985839844, -28.46004867553711, -21.45636749267578, -14.452682495117188, -7.449001312255859, -0.44531869888305664, 6.558363914489746, 13.56204605102539, 20.56572914123535, 27.569412231445312, 34.57309341430664, 41.576778411865234, 48.58045959472656, 55.58414077758789, 62.587825775146484, 69.59150695800781, 76.5951919555664, 83.598876953125, 90.60255432128906, 97.60623931884766, 104.60992431640625, 111.61360931396484, 118.6172866821289, 125.6209716796875, 132.62464904785156, 139.6283416748047, 146.63201904296875, 153.63571166992188, 160.63937377929688, 167.64305114746094, 174.64674377441406, 181.65042114257812, 188.6540985107422, 195.6577911376953, 202.66146850585938, 209.6651611328125, 216.66883850097656, 223.67251586914062, 230.67620849609375, 237.6798858642578, 244.68356323242188, 251.687255859375, 258.69091796875, 265.6946105957031, 272.69830322265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 7.0, 9.0, 18.0, 21.0, 19.0, 27.0, 41.0, 33.0, 41.0, 56.0, 55.0, 56.0, 58.0, 71.0, 66.0, 42.0, 52.0, 61.0, 45.0, 33.0, 39.0, 27.0, 23.0, 24.0, 13.0, 18.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.96173095703125, -142.18417358398438, -137.4066162109375, -132.62905883789062, -127.85150146484375, -123.07394409179688, -118.29638671875, -113.51882934570312, -108.74127197265625, -103.96371459960938, -99.1861572265625, -94.40859985351562, -89.63104248046875, -84.85348510742188, -80.075927734375, -75.29837036132812, -70.52080535888672, -65.74324798583984, -60.96569061279297, -56.188133239746094, -51.41057586669922, -46.633018493652344, -41.8554573059082, -37.07789993286133, -32.30034255981445, -27.522785186767578, -22.745227813720703, -17.967668533325195, -13.19011116027832, -8.412553787231445, -3.6349945068359375, 1.1425628662109375, 5.9201202392578125, 10.697677612304688, 15.475235939025879, 20.25279426574707, 25.030351638793945, 29.80790901184082, 34.58546829223633, 39.3630256652832, 44.14058303833008, 48.91814041137695, 53.69569778442383, 58.47325897216797, 63.250816345214844, 68.02837371826172, 72.8059310913086, 77.58348846435547, 82.36104583740234, 87.13860321044922, 91.9161605834961, 96.69371795654297, 101.47127532958984, 106.24883270263672, 111.02639770507812, 115.803955078125, 120.58151245117188, 125.35906982421875, 130.13662719726562, 134.9141845703125, 139.69174194335938, 144.46929931640625, 149.24685668945312, 154.0244140625, 158.80197143554688]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 15.0, 17.0, 35.0, 45.0, 62.0, 139.0, 216.0, 408.0, 765.0, 1281.0, 2781.0, 5798.0, 13661.0, 34182.0, 94420.0, 314450.0, 388709.0, 119561.0, 42097.0, 16246.0, 7066.0, 3191.0, 1527.0, 814.0, 444.0, 234.0, 137.0, 87.0, 57.0, 40.0, 22.0, 14.0, 7.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.625, -22.865478515625, -22.10595703125, -21.346435546875, -20.5869140625, -19.827392578125, -19.06787109375, -18.308349609375, -17.548828125, -16.789306640625, -16.02978515625, -15.270263671875, -14.5107421875, -13.751220703125, -12.99169921875, -12.232177734375, -11.47265625, -10.713134765625, -9.95361328125, -9.194091796875, -8.4345703125, -7.675048828125, -6.91552734375, -6.156005859375, -5.396484375, -4.636962890625, -3.87744140625, -3.117919921875, -2.3583984375, -1.598876953125, -0.83935546875, -0.079833984375, 0.6796875, 1.439208984375, 2.19873046875, 2.958251953125, 3.7177734375, 4.477294921875, 5.23681640625, 5.996337890625, 6.755859375, 7.515380859375, 8.27490234375, 9.034423828125, 9.7939453125, 10.553466796875, 11.31298828125, 12.072509765625, 12.83203125, 13.591552734375, 14.35107421875, 15.110595703125, 15.8701171875, 16.629638671875, 17.38916015625, 18.148681640625, 18.908203125, 19.667724609375, 20.42724609375, 21.186767578125, 21.9462890625, 22.705810546875, 23.46533203125, 24.224853515625, 24.984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 6.0, 9.0, 16.0, 14.0, 21.0, 26.0, 30.0, 38.0, 41.0, 57.0, 58.0, 80.0, 65.0, 61.0, 56.0, 57.0, 56.0, 54.0, 46.0, 46.0, 39.0, 35.0, 21.0, 9.0, 12.0, 10.0, 8.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.4296875, -15.057373046875, -14.68505859375, -14.312744140625, -13.9404296875, -13.568115234375, -13.19580078125, -12.823486328125, -12.451171875, -12.078857421875, -11.70654296875, -11.334228515625, -10.9619140625, -10.589599609375, -10.21728515625, -9.844970703125, -9.47265625, -9.100341796875, -8.72802734375, -8.355712890625, -7.9833984375, -7.611083984375, -7.23876953125, -6.866455078125, -6.494140625, -6.121826171875, -5.74951171875, -5.377197265625, -5.0048828125, -4.632568359375, -4.26025390625, -3.887939453125, -3.515625, -3.143310546875, -2.77099609375, -2.398681640625, -2.0263671875, -1.654052734375, -1.28173828125, -0.909423828125, -0.537109375, -0.164794921875, 0.20751953125, 0.579833984375, 0.9521484375, 1.324462890625, 1.69677734375, 2.069091796875, 2.44140625, 2.813720703125, 3.18603515625, 3.558349609375, 3.9306640625, 4.302978515625, 4.67529296875, 5.047607421875, 5.419921875, 5.792236328125, 6.16455078125, 6.536865234375, 6.9091796875, 7.281494140625, 7.65380859375, 8.026123046875, 8.3984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 4.0, 3.0, 9.0, 15.0, 18.0, 23.0, 32.0, 38.0, 73.0, 108.0, 150.0, 267.0, 498.0, 1234.0, 3812.0, 24015.0, 668599.0, 328827.0, 15663.0, 2914.0, 1011.0, 462.0, 276.0, 145.0, 106.0, 87.0, 52.0, 36.0, 29.0, 11.0, 13.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53125, -54.57568359375, -52.6201171875, -50.66455078125, -48.708984375, -46.75341796875, -44.7978515625, -42.84228515625, -40.88671875, -38.93115234375, -36.9755859375, -35.02001953125, -33.064453125, -31.10888671875, -29.1533203125, -27.19775390625, -25.2421875, -23.28662109375, -21.3310546875, -19.37548828125, -17.419921875, -15.46435546875, -13.5087890625, -11.55322265625, -9.59765625, -7.64208984375, -5.6865234375, -3.73095703125, -1.775390625, 0.18017578125, 2.1357421875, 4.09130859375, 6.046875, 8.00244140625, 9.9580078125, 11.91357421875, 13.869140625, 15.82470703125, 17.7802734375, 19.73583984375, 21.69140625, 23.64697265625, 25.6025390625, 27.55810546875, 29.513671875, 31.46923828125, 33.4248046875, 35.38037109375, 37.3359375, 39.29150390625, 41.2470703125, 43.20263671875, 45.158203125, 47.11376953125, 49.0693359375, 51.02490234375, 52.98046875, 54.93603515625, 56.8916015625, 58.84716796875, 60.802734375, 62.75830078125, 64.7138671875, 66.66943359375, 68.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 13.0, 9.0, 15.0, 23.0, 24.0, 26.0, 35.0, 38.0, 32.0, 43.0, 55.0, 51.0, 48.0, 51.0, 61.0, 46.0, 58.0, 55.0, 46.0, 45.0, 39.0, 24.0, 25.0, 25.0, 22.0, 14.0, 13.0, 14.0, 8.0, 7.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-48.65625, -47.298828125, -45.94140625, -44.583984375, -43.2265625, -41.869140625, -40.51171875, -39.154296875, -37.796875, -36.439453125, -35.08203125, -33.724609375, -32.3671875, -31.009765625, -29.65234375, -28.294921875, -26.9375, -25.580078125, -24.22265625, -22.865234375, -21.5078125, -20.150390625, -18.79296875, -17.435546875, -16.078125, -14.720703125, -13.36328125, -12.005859375, -10.6484375, -9.291015625, -7.93359375, -6.576171875, -5.21875, -3.861328125, -2.50390625, -1.146484375, 0.2109375, 1.568359375, 2.92578125, 4.283203125, 5.640625, 6.998046875, 8.35546875, 9.712890625, 11.0703125, 12.427734375, 13.78515625, 15.142578125, 16.5, 17.857421875, 19.21484375, 20.572265625, 21.9296875, 23.287109375, 24.64453125, 26.001953125, 27.359375, 28.716796875, 30.07421875, 31.431640625, 32.7890625, 34.146484375, 35.50390625, 36.861328125, 38.21875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 7.0, 11.0, 10.0, 26.0, 36.0, 36.0, 79.0, 135.0, 217.0, 512.0, 1391.0, 4739.0, 28253.0, 597664.0, 385559.0, 23670.0, 4000.0, 1190.0, 460.0, 219.0, 118.0, 79.0, 36.0, 22.0, 17.0, 12.0, 9.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0, -16.391845703125, -15.78369140625, -15.175537109375, -14.5673828125, -13.959228515625, -13.35107421875, -12.742919921875, -12.134765625, -11.526611328125, -10.91845703125, -10.310302734375, -9.7021484375, -9.093994140625, -8.48583984375, -7.877685546875, -7.26953125, -6.661376953125, -6.05322265625, -5.445068359375, -4.8369140625, -4.228759765625, -3.62060546875, -3.012451171875, -2.404296875, -1.796142578125, -1.18798828125, -0.579833984375, 0.0283203125, 0.636474609375, 1.24462890625, 1.852783203125, 2.4609375, 3.069091796875, 3.67724609375, 4.285400390625, 4.8935546875, 5.501708984375, 6.10986328125, 6.718017578125, 7.326171875, 7.934326171875, 8.54248046875, 9.150634765625, 9.7587890625, 10.366943359375, 10.97509765625, 11.583251953125, 12.19140625, 12.799560546875, 13.40771484375, 14.015869140625, 14.6240234375, 15.232177734375, 15.84033203125, 16.448486328125, 17.056640625, 17.664794921875, 18.27294921875, 18.881103515625, 19.4892578125, 20.097412109375, 20.70556640625, 21.313720703125, 21.921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 15.0, 17.0, 14.0, 32.0, 32.0, 42.0, 83.0, 166.0, 252.0, 111.0, 68.0, 38.0, 20.0, 35.0, 11.0, 17.0, 10.0, 11.0, 4.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024356842041015625, -0.002326756715774536, -0.0022178292274475098, -0.0021089017391204834, -0.001999974250793457, -0.0018910467624664307, -0.0017821192741394043, -0.001673191785812378, -0.0015642642974853516, -0.0014553368091583252, -0.0013464093208312988, -0.0012374818325042725, -0.001128554344177246, -0.0010196268558502197, -0.0009106993675231934, -0.000801771879196167, -0.0006928443908691406, -0.0005839169025421143, -0.0004749894142150879, -0.0003660619258880615, -0.00025713443756103516, -0.0001482069492340088, -3.927946090698242e-05, 6.964802742004395e-05, 0.0001785755157470703, 0.0002875030040740967, 0.00039643049240112305, 0.0005053579807281494, 0.0006142854690551758, 0.0007232129573822021, 0.0008321404457092285, 0.0009410679340362549, 0.0010499954223632812, 0.0011589229106903076, 0.001267850399017334, 0.0013767778873443604, 0.0014857053756713867, 0.001594632863998413, 0.0017035603523254395, 0.0018124878406524658, 0.0019214153289794922, 0.0020303428173065186, 0.002139270305633545, 0.0022481977939605713, 0.0023571252822875977, 0.002466052770614624, 0.0025749802589416504, 0.0026839077472686768, 0.002792835235595703, 0.0029017627239227295, 0.003010690212249756, 0.0031196177005767822, 0.0032285451889038086, 0.003337472677230835, 0.0034464001655578613, 0.0035553276538848877, 0.003664255142211914, 0.0037731826305389404, 0.003882110118865967, 0.003991037607192993, 0.0040999650955200195, 0.004208892583847046, 0.004317820072174072, 0.004426747560501099, 0.004535675048828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 17.0, 30.0, 79.0, 105.0, 163.0, 369.0, 807.0, 2690.0, 17775.0, 662528.0, 347841.0, 12518.0, 2184.0, 670.0, 332.0, 150.0, 79.0, 62.0, 36.0, 21.0, 21.0, 16.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.69189453125, -15.9306640625, -15.16943359375, -14.408203125, -13.64697265625, -12.8857421875, -12.12451171875, -11.36328125, -10.60205078125, -9.8408203125, -9.07958984375, -8.318359375, -7.55712890625, -6.7958984375, -6.03466796875, -5.2734375, -4.51220703125, -3.7509765625, -2.98974609375, -2.228515625, -1.46728515625, -0.7060546875, 0.05517578125, 0.81640625, 1.57763671875, 2.3388671875, 3.10009765625, 3.861328125, 4.62255859375, 5.3837890625, 6.14501953125, 6.90625, 7.66748046875, 8.4287109375, 9.18994140625, 9.951171875, 10.71240234375, 11.4736328125, 12.23486328125, 12.99609375, 13.75732421875, 14.5185546875, 15.27978515625, 16.041015625, 16.80224609375, 17.5634765625, 18.32470703125, 19.0859375, 19.84716796875, 20.6083984375, 21.36962890625, 22.130859375, 22.89208984375, 23.6533203125, 24.41455078125, 25.17578125, 25.93701171875, 26.6982421875, 27.45947265625, 28.220703125, 28.98193359375, 29.7431640625, 30.50439453125, 31.265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 5.0, 13.0, 10.0, 16.0, 14.0, 28.0, 30.0, 44.0, 49.0, 50.0, 64.0, 69.0, 75.0, 74.0, 73.0, 60.0, 53.0, 49.0, 44.0, 20.0, 22.0, 29.0, 13.0, 12.0, 11.0, 9.0, 8.0, 5.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5390625, -9.2216796875, -8.904296875, -8.5869140625, -8.26953125, -7.9521484375, -7.634765625, -7.3173828125, -7.0, -6.6826171875, -6.365234375, -6.0478515625, -5.73046875, -5.4130859375, -5.095703125, -4.7783203125, -4.4609375, -4.1435546875, -3.826171875, -3.5087890625, -3.19140625, -2.8740234375, -2.556640625, -2.2392578125, -1.921875, -1.6044921875, -1.287109375, -0.9697265625, -0.65234375, -0.3349609375, -0.017578125, 0.2998046875, 0.6171875, 0.9345703125, 1.251953125, 1.5693359375, 1.88671875, 2.2041015625, 2.521484375, 2.8388671875, 3.15625, 3.4736328125, 3.791015625, 4.1083984375, 4.42578125, 4.7431640625, 5.060546875, 5.3779296875, 5.6953125, 6.0126953125, 6.330078125, 6.6474609375, 6.96484375, 7.2822265625, 7.599609375, 7.9169921875, 8.234375, 8.5517578125, 8.869140625, 9.1865234375, 9.50390625, 9.8212890625, 10.138671875, 10.4560546875, 10.7734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 13.0, 46.0, 177.0, 352.0, 276.0, 97.0, 28.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.293212890625, -741.135986328125, -722.978759765625, -704.821533203125, -686.664306640625, -668.507080078125, -650.349853515625, -632.1925659179688, -614.0353393554688, -595.8781127929688, -577.7208862304688, -559.5636596679688, -541.4064331054688, -523.2491455078125, -505.0919494628906, -486.9347229003906, -468.7774963378906, -450.6202697753906, -432.4630432128906, -414.3057861328125, -396.1485595703125, -377.9913330078125, -359.8341064453125, -341.6768798828125, -323.5196533203125, -305.3624267578125, -287.2052001953125, -269.0479736328125, -250.89071655273438, -232.73348999023438, -214.57626342773438, -196.41903686523438, -178.26177978515625, -160.10455322265625, -141.9473114013672, -123.79008483886719, -105.63285064697266, -87.47561645507812, -69.31838989257812, -51.161155700683594, -33.00392150878906, -14.846689224243164, 3.3105430603027344, 21.4677734375, 39.62500762939453, 57.78224182128906, 75.93946838378906, 94.0967025756836, 112.25393676757812, 130.41116333007812, 148.5684051513672, 166.7256317138672, 184.88287353515625, 203.04010009765625, 221.19732666015625, 239.35455322265625, 257.51177978515625, 275.66900634765625, 293.82623291015625, 311.98345947265625, 330.1407165527344, 348.2979431152344, 366.4551696777344, 384.6123962402344, 402.7696533203125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 8.0, 17.0, 10.0, 11.0, 20.0, 20.0, 14.0, 37.0, 24.0, 26.0, 40.0, 35.0, 58.0, 47.0, 69.0, 64.0, 69.0, 67.0, 61.0, 41.0, 36.0, 37.0, 26.0, 34.0, 29.0, 20.0, 17.0, 12.0, 16.0, 11.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.42391967773438, -157.95399475097656, -152.48406982421875, -147.01414489746094, -141.54421997070312, -136.07431030273438, -130.60438537597656, -125.13446044921875, -119.66453552246094, -114.19461059570312, -108.72468566894531, -103.25476837158203, -97.78484344482422, -92.3149185180664, -86.84500122070312, -81.37507629394531, -75.9051513671875, -70.43522644042969, -64.96530151367188, -59.495384216308594, -54.02545928955078, -48.55553436279297, -43.08561325073242, -37.615692138671875, -32.14576721191406, -26.675844192504883, -21.205921173095703, -15.735998153686523, -10.266075134277344, -4.796152114868164, 0.6737709045410156, 6.1436920166015625, 11.613632202148438, 17.083555221557617, 22.553478240966797, 28.023401260375977, 33.493324279785156, 38.96324920654297, 44.433170318603516, 49.90309143066406, 55.373016357421875, 60.84294128417969, 66.3128662109375, 71.78278350830078, 77.2527084350586, 82.7226333618164, 88.19255065917969, 93.6624755859375, 99.13240051269531, 104.60232543945312, 110.07225036621094, 115.54216766357422, 121.01209259033203, 126.48201751708984, 131.95193481445312, 137.42185974121094, 142.89178466796875, 148.36170959472656, 153.83163452148438, 159.3015594482422, 164.771484375, 170.24139404296875, 175.71131896972656, 181.18124389648438, 186.6511688232422]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 12.0, 14.0, 16.0, 24.0, 41.0, 92.0, 161.0, 276.0, 478.0, 1049.0, 2305.0, 5380.0, 14836.0, 53818.0, 491048.0, 3361974.0, 208857.0, 35301.0, 10857.0, 4170.0, 1863.0, 806.0, 395.0, 198.0, 104.0, 85.0, 36.0, 30.0, 23.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.299072265625, -12.67626953125, -12.053466796875, -11.4306640625, -10.807861328125, -10.18505859375, -9.562255859375, -8.939453125, -8.316650390625, -7.69384765625, -7.071044921875, -6.4482421875, -5.825439453125, -5.20263671875, -4.579833984375, -3.95703125, -3.334228515625, -2.71142578125, -2.088623046875, -1.4658203125, -0.843017578125, -0.22021484375, 0.402587890625, 1.025390625, 1.648193359375, 2.27099609375, 2.893798828125, 3.5166015625, 4.139404296875, 4.76220703125, 5.385009765625, 6.0078125, 6.630615234375, 7.25341796875, 7.876220703125, 8.4990234375, 9.121826171875, 9.74462890625, 10.367431640625, 10.990234375, 11.613037109375, 12.23583984375, 12.858642578125, 13.4814453125, 14.104248046875, 14.72705078125, 15.349853515625, 15.97265625, 16.595458984375, 17.21826171875, 17.841064453125, 18.4638671875, 19.086669921875, 19.70947265625, 20.332275390625, 20.955078125, 21.577880859375, 22.20068359375, 22.823486328125, 23.4462890625, 24.069091796875, 24.69189453125, 25.314697265625, 25.9375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 14.0, 23.0, 22.0, 44.0, 41.0, 53.0, 78.0, 96.0, 87.0, 83.0, 96.0, 81.0, 79.0, 63.0, 41.0, 34.0, 18.0, 16.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.8736572265625, -11.364501953125, -10.8553466796875, -10.34619140625, -9.8370361328125, -9.327880859375, -8.8187255859375, -8.3095703125, -7.8004150390625, -7.291259765625, -6.7821044921875, -6.27294921875, -5.7637939453125, -5.254638671875, -4.7454833984375, -4.236328125, -3.7271728515625, -3.218017578125, -2.7088623046875, -2.19970703125, -1.6905517578125, -1.181396484375, -0.6722412109375, -0.1630859375, 0.3460693359375, 0.855224609375, 1.3643798828125, 1.87353515625, 2.3826904296875, 2.891845703125, 3.4010009765625, 3.91015625, 4.4193115234375, 4.928466796875, 5.4376220703125, 5.94677734375, 6.4559326171875, 6.965087890625, 7.4742431640625, 7.9833984375, 8.4925537109375, 9.001708984375, 9.5108642578125, 10.02001953125, 10.5291748046875, 11.038330078125, 11.5474853515625, 12.056640625, 12.5657958984375, 13.074951171875, 13.5841064453125, 14.09326171875, 14.6024169921875, 15.111572265625, 15.6207275390625, 16.1298828125, 16.6390380859375, 17.148193359375, 17.6573486328125, 18.16650390625, 18.6756591796875, 19.184814453125, 19.6939697265625, 20.203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 8.0, 27.0, 34.0, 59.0, 82.0, 168.0, 283.0, 528.0, 1030.0, 2070.0, 4214.0, 9500.0, 24550.0, 80043.0, 532537.0, 3136640.0, 306742.0, 60038.0, 19922.0, 8037.0, 3787.0, 1865.0, 1007.0, 514.0, 230.0, 147.0, 88.0, 33.0, 28.0, 30.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.0921630859375, -14.473388671875, -13.8546142578125, -13.23583984375, -12.6170654296875, -11.998291015625, -11.3795166015625, -10.7607421875, -10.1419677734375, -9.523193359375, -8.9044189453125, -8.28564453125, -7.6668701171875, -7.048095703125, -6.4293212890625, -5.810546875, -5.1917724609375, -4.572998046875, -3.9542236328125, -3.33544921875, -2.7166748046875, -2.097900390625, -1.4791259765625, -0.8603515625, -0.2415771484375, 0.377197265625, 0.9959716796875, 1.61474609375, 2.2335205078125, 2.852294921875, 3.4710693359375, 4.08984375, 4.7086181640625, 5.327392578125, 5.9461669921875, 6.56494140625, 7.1837158203125, 7.802490234375, 8.4212646484375, 9.0400390625, 9.6588134765625, 10.277587890625, 10.8963623046875, 11.51513671875, 12.1339111328125, 12.752685546875, 13.3714599609375, 13.990234375, 14.6090087890625, 15.227783203125, 15.8465576171875, 16.46533203125, 17.0841064453125, 17.702880859375, 18.3216552734375, 18.9404296875, 19.5592041015625, 20.177978515625, 20.7967529296875, 21.41552734375, 22.0343017578125, 22.653076171875, 23.2718505859375, 23.890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 13.0, 21.0, 12.0, 17.0, 39.0, 56.0, 56.0, 98.0, 166.0, 323.0, 592.0, 932.0, 724.0, 385.0, 197.0, 121.0, 79.0, 67.0, 32.0, 35.0, 16.0, 16.0, 7.0, 8.0, 6.0, 10.0, 5.0, 9.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-23.5, -22.822021484375, -22.14404296875, -21.466064453125, -20.7880859375, -20.110107421875, -19.43212890625, -18.754150390625, -18.076171875, -17.398193359375, -16.72021484375, -16.042236328125, -15.3642578125, -14.686279296875, -14.00830078125, -13.330322265625, -12.65234375, -11.974365234375, -11.29638671875, -10.618408203125, -9.9404296875, -9.262451171875, -8.58447265625, -7.906494140625, -7.228515625, -6.550537109375, -5.87255859375, -5.194580078125, -4.5166015625, -3.838623046875, -3.16064453125, -2.482666015625, -1.8046875, -1.126708984375, -0.44873046875, 0.229248046875, 0.9072265625, 1.585205078125, 2.26318359375, 2.941162109375, 3.619140625, 4.297119140625, 4.97509765625, 5.653076171875, 6.3310546875, 7.009033203125, 7.68701171875, 8.364990234375, 9.04296875, 9.720947265625, 10.39892578125, 11.076904296875, 11.7548828125, 12.432861328125, 13.11083984375, 13.788818359375, 14.466796875, 15.144775390625, 15.82275390625, 16.500732421875, 17.1787109375, 17.856689453125, 18.53466796875, 19.212646484375, 19.890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 17.0, 22.0, 45.0, 80.0, 180.0, 240.0, 218.0, 103.0, 52.0, 18.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.85206604003906, -152.69747924804688, -144.54290771484375, -136.38832092285156, -128.23373413085938, -120.07915496826172, -111.92457580566406, -103.76998901367188, -95.61540985107422, -87.46083068847656, -79.30624389648438, -71.15166473388672, -62.9970817565918, -54.842498779296875, -46.68791961669922, -38.5333366394043, -30.378753662109375, -22.224170684814453, -14.069589614868164, -5.915008544921875, 2.239574432373047, 10.394157409667969, 18.548736572265625, 26.703319549560547, 34.85790252685547, 43.01248550415039, 51.16706848144531, 59.32164764404297, 67.47622680664062, 75.63081359863281, 83.78539276123047, 91.93997192382812, 100.09454345703125, 108.2491226196289, 116.4037094116211, 124.55828857421875, 132.71287536621094, 140.86746215820312, 149.02203369140625, 157.17662048339844, 165.33120727539062, 173.4857940673828, 181.64036560058594, 189.79495239257812, 197.9495391845703, 206.1041259765625, 214.25869750976562, 222.4132843017578, 230.56785583496094, 238.72244262695312, 246.87701416015625, 255.03160095214844, 263.1861877441406, 271.34075927734375, 279.495361328125, 287.6499328613281, 295.80450439453125, 303.9590759277344, 312.1136779785156, 320.26824951171875, 328.4228210449219, 336.5774230957031, 344.73199462890625, 352.8865661621094, 361.0411682128906]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 20.0, 10.0, 24.0, 21.0, 38.0, 29.0, 35.0, 47.0, 41.0, 54.0, 54.0, 58.0, 43.0, 54.0, 53.0, 44.0, 43.0, 40.0, 35.0, 35.0, 40.0, 22.0, 26.0, 15.0, 18.0, 16.0, 6.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.60320281982422, -86.44063568115234, -83.278076171875, -80.11550903320312, -76.95294189453125, -73.79037475585938, -70.62781524658203, -67.46524810791016, -64.30268859863281, -61.1401252746582, -57.97755813598633, -54.81499481201172, -51.652427673339844, -48.489864349365234, -45.327301025390625, -42.16473388671875, -39.002166748046875, -35.839603424072266, -32.67703628540039, -29.51447296142578, -26.35190773010254, -23.189342498779297, -20.026779174804688, -16.864213943481445, -13.701648712158203, -10.539083480834961, -7.376519203186035, -4.213954925537109, -1.0513896942138672, 2.111175537109375, 5.273738861083984, 8.436304092407227, 11.598876953125, 14.761442184448242, 17.924007415771484, 21.086570739746094, 24.249135971069336, 27.411701202392578, 30.574264526367188, 33.73683166503906, 36.89939498901367, 40.06195831298828, 43.224525451660156, 46.387088775634766, 49.549652099609375, 52.71221923828125, 55.87478256225586, 59.03734588623047, 62.199913024902344, 65.36248016357422, 68.52503967285156, 71.68760681152344, 74.85017395019531, 78.01274108886719, 81.17530059814453, 84.3378677368164, 87.50042724609375, 90.66299438476562, 93.82555389404297, 96.98812103271484, 100.15068817138672, 103.31324768066406, 106.47581481933594, 109.63838195800781, 112.80094909667969]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 17.0, 28.0, 28.0, 60.0, 111.0, 148.0, 239.0, 461.0, 704.0, 1258.0, 2415.0, 4740.0, 9606.0, 21042.0, 49490.0, 131982.0, 349189.0, 296176.0, 105110.0, 40957.0, 17641.0, 8239.0, 4085.0, 2088.0, 1107.0, 665.0, 350.0, 223.0, 123.0, 91.0, 57.0, 42.0, 31.0, 16.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.40625, -17.8291015625, -17.251953125, -16.6748046875, -16.09765625, -15.5205078125, -14.943359375, -14.3662109375, -13.7890625, -13.2119140625, -12.634765625, -12.0576171875, -11.48046875, -10.9033203125, -10.326171875, -9.7490234375, -9.171875, -8.5947265625, -8.017578125, -7.4404296875, -6.86328125, -6.2861328125, -5.708984375, -5.1318359375, -4.5546875, -3.9775390625, -3.400390625, -2.8232421875, -2.24609375, -1.6689453125, -1.091796875, -0.5146484375, 0.0625, 0.6396484375, 1.216796875, 1.7939453125, 2.37109375, 2.9482421875, 3.525390625, 4.1025390625, 4.6796875, 5.2568359375, 5.833984375, 6.4111328125, 6.98828125, 7.5654296875, 8.142578125, 8.7197265625, 9.296875, 9.8740234375, 10.451171875, 11.0283203125, 11.60546875, 12.1826171875, 12.759765625, 13.3369140625, 13.9140625, 14.4912109375, 15.068359375, 15.6455078125, 16.22265625, 16.7998046875, 17.376953125, 17.9541015625, 18.53125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 14.0, 21.0, 20.0, 27.0, 25.0, 39.0, 54.0, 64.0, 48.0, 70.0, 58.0, 70.0, 59.0, 72.0, 76.0, 68.0, 55.0, 37.0, 22.0, 25.0, 14.0, 11.0, 6.0, 16.0, 4.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.5399169921875, -13.134521484375, -12.7291259765625, -12.32373046875, -11.9183349609375, -11.512939453125, -11.1075439453125, -10.7021484375, -10.2967529296875, -9.891357421875, -9.4859619140625, -9.08056640625, -8.6751708984375, -8.269775390625, -7.8643798828125, -7.458984375, -7.0535888671875, -6.648193359375, -6.2427978515625, -5.83740234375, -5.4320068359375, -5.026611328125, -4.6212158203125, -4.2158203125, -3.8104248046875, -3.405029296875, -2.9996337890625, -2.59423828125, -2.1888427734375, -1.783447265625, -1.3780517578125, -0.97265625, -0.5672607421875, -0.161865234375, 0.2435302734375, 0.64892578125, 1.0543212890625, 1.459716796875, 1.8651123046875, 2.2705078125, 2.6759033203125, 3.081298828125, 3.4866943359375, 3.89208984375, 4.2974853515625, 4.702880859375, 5.1082763671875, 5.513671875, 5.9190673828125, 6.324462890625, 6.7298583984375, 7.13525390625, 7.5406494140625, 7.946044921875, 8.3514404296875, 8.7568359375, 9.1622314453125, 9.567626953125, 9.9730224609375, 10.37841796875, 10.7838134765625, 11.189208984375, 11.5946044921875, 12.0]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 10.0, 9.0, 12.0, 18.0, 23.0, 34.0, 55.0, 57.0, 90.0, 131.0, 196.0, 372.0, 681.0, 1411.0, 3488.0, 11502.0, 54190.0, 426041.0, 475259.0, 56187.0, 12008.0, 3627.0, 1422.0, 716.0, 356.0, 213.0, 145.0, 90.0, 60.0, 36.0, 28.0, 24.0, 17.0, 10.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-38.6875, -37.58251953125, -36.4775390625, -35.37255859375, -34.267578125, -33.16259765625, -32.0576171875, -30.95263671875, -29.84765625, -28.74267578125, -27.6376953125, -26.53271484375, -25.427734375, -24.32275390625, -23.2177734375, -22.11279296875, -21.0078125, -19.90283203125, -18.7978515625, -17.69287109375, -16.587890625, -15.48291015625, -14.3779296875, -13.27294921875, -12.16796875, -11.06298828125, -9.9580078125, -8.85302734375, -7.748046875, -6.64306640625, -5.5380859375, -4.43310546875, -3.328125, -2.22314453125, -1.1181640625, -0.01318359375, 1.091796875, 2.19677734375, 3.3017578125, 4.40673828125, 5.51171875, 6.61669921875, 7.7216796875, 8.82666015625, 9.931640625, 11.03662109375, 12.1416015625, 13.24658203125, 14.3515625, 15.45654296875, 16.5615234375, 17.66650390625, 18.771484375, 19.87646484375, 20.9814453125, 22.08642578125, 23.19140625, 24.29638671875, 25.4013671875, 26.50634765625, 27.611328125, 28.71630859375, 29.8212890625, 30.92626953125, 32.03125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 3.0, 6.0, 10.0, 19.0, 19.0, 21.0, 29.0, 22.0, 44.0, 46.0, 47.0, 39.0, 37.0, 66.0, 50.0, 58.0, 59.0, 56.0, 50.0, 38.0, 50.0, 40.0, 34.0, 29.0, 18.0, 16.0, 17.0, 14.0, 9.0, 8.0, 7.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-41.5625, -40.29248046875, -39.0224609375, -37.75244140625, -36.482421875, -35.21240234375, -33.9423828125, -32.67236328125, -31.40234375, -30.13232421875, -28.8623046875, -27.59228515625, -26.322265625, -25.05224609375, -23.7822265625, -22.51220703125, -21.2421875, -19.97216796875, -18.7021484375, -17.43212890625, -16.162109375, -14.89208984375, -13.6220703125, -12.35205078125, -11.08203125, -9.81201171875, -8.5419921875, -7.27197265625, -6.001953125, -4.73193359375, -3.4619140625, -2.19189453125, -0.921875, 0.34814453125, 1.6181640625, 2.88818359375, 4.158203125, 5.42822265625, 6.6982421875, 7.96826171875, 9.23828125, 10.50830078125, 11.7783203125, 13.04833984375, 14.318359375, 15.58837890625, 16.8583984375, 18.12841796875, 19.3984375, 20.66845703125, 21.9384765625, 23.20849609375, 24.478515625, 25.74853515625, 27.0185546875, 28.28857421875, 29.55859375, 30.82861328125, 32.0986328125, 33.36865234375, 34.638671875, 35.90869140625, 37.1787109375, 38.44873046875, 39.71875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 8.0, 7.0, 18.0, 29.0, 87.0, 146.0, 571.0, 3590.0, 117607.0, 908200.0, 16480.0, 1285.0, 303.0, 109.0, 42.0, 28.0, 8.0, 9.0, 12.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.815185546875, -26.86474609375, -25.914306640625, -24.9638671875, -24.013427734375, -23.06298828125, -22.112548828125, -21.162109375, -20.211669921875, -19.26123046875, -18.310791015625, -17.3603515625, -16.409912109375, -15.45947265625, -14.509033203125, -13.55859375, -12.608154296875, -11.65771484375, -10.707275390625, -9.7568359375, -8.806396484375, -7.85595703125, -6.905517578125, -5.955078125, -5.004638671875, -4.05419921875, -3.103759765625, -2.1533203125, -1.202880859375, -0.25244140625, 0.697998046875, 1.6484375, 2.598876953125, 3.54931640625, 4.499755859375, 5.4501953125, 6.400634765625, 7.35107421875, 8.301513671875, 9.251953125, 10.202392578125, 11.15283203125, 12.103271484375, 13.0537109375, 14.004150390625, 14.95458984375, 15.905029296875, 16.85546875, 17.805908203125, 18.75634765625, 19.706787109375, 20.6572265625, 21.607666015625, 22.55810546875, 23.508544921875, 24.458984375, 25.409423828125, 26.35986328125, 27.310302734375, 28.2607421875, 29.211181640625, 30.16162109375, 31.112060546875, 32.0625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 6.0, 6.0, 13.0, 17.0, 23.0, 38.0, 50.0, 73.0, 102.0, 145.0, 149.0, 100.0, 65.0, 56.0, 32.0, 26.0, 14.0, 21.0, 17.0, 10.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002696990966796875, -0.002612859010696411, -0.0025287270545959473, -0.0024445950984954834, -0.0023604631423950195, -0.0022763311862945557, -0.002192199230194092, -0.002108067274093628, -0.002023935317993164, -0.0019398033618927002, -0.0018556714057922363, -0.0017715394496917725, -0.0016874074935913086, -0.0016032755374908447, -0.0015191435813903809, -0.001435011625289917, -0.0013508796691894531, -0.0012667477130889893, -0.0011826157569885254, -0.0010984838008880615, -0.0010143518447875977, -0.0009302198886871338, -0.0008460879325866699, -0.0007619559764862061, -0.0006778240203857422, -0.0005936920642852783, -0.0005095601081848145, -0.0004254281520843506, -0.0003412961959838867, -0.00025716423988342285, -0.00017303228378295898, -8.890032768249512e-05, -4.76837158203125e-06, 7.936358451843262e-05, 0.00016349554061889648, 0.00024762749671936035, 0.0003317594528198242, 0.0004158914089202881, 0.000500023365020752, 0.0005841553211212158, 0.0006682872772216797, 0.0007524192333221436, 0.0008365511894226074, 0.0009206831455230713, 0.0010048151016235352, 0.001088947057723999, 0.0011730790138244629, 0.0012572109699249268, 0.0013413429260253906, 0.0014254748821258545, 0.0015096068382263184, 0.0015937387943267822, 0.001677870750427246, 0.00176200270652771, 0.0018461346626281738, 0.0019302666187286377, 0.0020143985748291016, 0.0020985305309295654, 0.0021826624870300293, 0.002266794443130493, 0.002350926399230957, 0.002435058355331421, 0.0025191903114318848, 0.0026033222675323486, 0.0026874542236328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 4.0, 8.0, 7.0, 12.0, 16.0, 18.0, 43.0, 65.0, 73.0, 168.0, 242.0, 516.0, 1049.0, 2353.0, 8235.0, 43404.0, 483501.0, 453005.0, 43291.0, 8048.0, 2452.0, 908.0, 438.0, 287.0, 157.0, 102.0, 55.0, 29.0, 20.0, 12.0, 10.0, 5.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.95361328125, -10.5478515625, -10.14208984375, -9.736328125, -9.33056640625, -8.9248046875, -8.51904296875, -8.11328125, -7.70751953125, -7.3017578125, -6.89599609375, -6.490234375, -6.08447265625, -5.6787109375, -5.27294921875, -4.8671875, -4.46142578125, -4.0556640625, -3.64990234375, -3.244140625, -2.83837890625, -2.4326171875, -2.02685546875, -1.62109375, -1.21533203125, -0.8095703125, -0.40380859375, 0.001953125, 0.40771484375, 0.8134765625, 1.21923828125, 1.625, 2.03076171875, 2.4365234375, 2.84228515625, 3.248046875, 3.65380859375, 4.0595703125, 4.46533203125, 4.87109375, 5.27685546875, 5.6826171875, 6.08837890625, 6.494140625, 6.89990234375, 7.3056640625, 7.71142578125, 8.1171875, 8.52294921875, 8.9287109375, 9.33447265625, 9.740234375, 10.14599609375, 10.5517578125, 10.95751953125, 11.36328125, 11.76904296875, 12.1748046875, 12.58056640625, 12.986328125, 13.39208984375, 13.7978515625, 14.20361328125, 14.609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 17.0, 13.0, 15.0, 22.0, 25.0, 25.0, 40.0, 34.0, 38.0, 59.0, 61.0, 60.0, 57.0, 63.0, 69.0, 59.0, 49.0, 54.0, 36.0, 32.0, 29.0, 16.0, 19.0, 8.0, 13.0, 12.0, 8.0, 9.0, 6.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.78515625, -7.5465087890625, -7.307861328125, -7.0692138671875, -6.83056640625, -6.5919189453125, -6.353271484375, -6.1146240234375, -5.8759765625, -5.6373291015625, -5.398681640625, -5.1600341796875, -4.92138671875, -4.6827392578125, -4.444091796875, -4.2054443359375, -3.966796875, -3.7281494140625, -3.489501953125, -3.2508544921875, -3.01220703125, -2.7735595703125, -2.534912109375, -2.2962646484375, -2.0576171875, -1.8189697265625, -1.580322265625, -1.3416748046875, -1.10302734375, -0.8643798828125, -0.625732421875, -0.3870849609375, -0.1484375, 0.0902099609375, 0.328857421875, 0.5675048828125, 0.80615234375, 1.0447998046875, 1.283447265625, 1.5220947265625, 1.7607421875, 1.9993896484375, 2.238037109375, 2.4766845703125, 2.71533203125, 2.9539794921875, 3.192626953125, 3.4312744140625, 3.669921875, 3.9085693359375, 4.147216796875, 4.3858642578125, 4.62451171875, 4.8631591796875, 5.101806640625, 5.3404541015625, 5.5791015625, 5.8177490234375, 6.056396484375, 6.2950439453125, 6.53369140625, 6.7723388671875, 7.010986328125, 7.2496337890625, 7.48828125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 19.0, 16.0, 49.0, 76.0, 125.0, 181.0, 198.0, 128.0, 81.0, 47.0, 26.0, 19.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.72358703613281, -120.23841857910156, -112.75325012207031, -105.26807403564453, -97.78290557861328, -90.29773712158203, -82.81256103515625, -75.327392578125, -67.84222412109375, -60.3570556640625, -52.871883392333984, -45.38671112060547, -37.90154266357422, -30.41637420654297, -22.931201934814453, -15.446029663085938, -7.9608612060546875, -0.4756908416748047, 7.009479522705078, 14.494649887084961, 21.979820251464844, 29.464988708496094, 36.95016098022461, 44.435333251953125, 51.920501708984375, 59.405670166015625, 66.89083862304688, 74.37601470947266, 81.8611831665039, 89.34635162353516, 96.83152770996094, 104.31669616699219, 111.8018798828125, 119.28704833984375, 126.772216796875, 134.25738525390625, 141.7425537109375, 149.22772216796875, 156.71290588378906, 164.1980743408203, 171.68324279785156, 179.1684112548828, 186.65357971191406, 194.1387481689453, 201.62393188476562, 209.10910034179688, 216.59426879882812, 224.07943725585938, 231.56460571289062, 239.04977416992188, 246.53494262695312, 254.02011108398438, 261.5052795410156, 268.9904479980469, 276.4756164550781, 283.9608154296875, 291.44598388671875, 298.93115234375, 306.41632080078125, 313.9014892578125, 321.38665771484375, 328.871826171875, 336.35699462890625, 343.8421630859375, 351.32733154296875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 8.0, 11.0, 6.0, 13.0, 9.0, 15.0, 20.0, 22.0, 20.0, 39.0, 29.0, 49.0, 36.0, 42.0, 34.0, 54.0, 48.0, 52.0, 69.0, 49.0, 54.0, 40.0, 25.0, 33.0, 26.0, 32.0, 20.0, 19.0, 18.0, 10.0, 13.0, 16.0, 11.0, 14.0, 4.0, 9.0, 4.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-161.04635620117188, -156.62799072265625, -152.20962524414062, -147.79124450683594, -143.3728790283203, -138.9545135498047, -134.53614807128906, -130.11778259277344, -125.69940948486328, -121.28104400634766, -116.8626708984375, -112.44430541992188, -108.02593994140625, -103.6075668334961, -99.18920135498047, -94.77082824707031, -90.35246276855469, -85.93409729003906, -81.5157241821289, -77.09735870361328, -72.67898559570312, -68.2606201171875, -63.842254638671875, -59.423885345458984, -55.005516052246094, -50.5871467590332, -46.16877746582031, -41.75041198730469, -37.3320426940918, -32.913673400878906, -28.49530601501465, -24.07693862915039, -19.6585693359375, -15.240200996398926, -10.821832656860352, -6.403464317321777, -1.9850959777832031, 2.4332733154296875, 6.851640701293945, 11.270008087158203, 15.688377380371094, 20.106746673583984, 24.525114059448242, 28.9434814453125, 33.36185073852539, 37.78022003173828, 42.198585510253906, 46.6169548034668, 51.03532409667969, 55.45369338989258, 59.87206268310547, 64.2904281616211, 68.70880126953125, 73.12716674804688, 77.5455322265625, 81.96389770507812, 86.38227081298828, 90.8006362915039, 95.21900939941406, 99.63737487792969, 104.05574035644531, 108.47411346435547, 112.8924789428711, 117.31085205078125, 121.72921752929688]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 18.0, 19.0, 23.0, 46.0, 98.0, 154.0, 313.0, 695.0, 1589.0, 4021.0, 11284.0, 36967.0, 168136.0, 1368859.0, 2223541.0, 299672.0, 54776.0, 15164.0, 5174.0, 2064.0, 814.0, 392.0, 205.0, 85.0, 58.0, 36.0, 14.0, 11.0, 8.0, 11.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.859375, -12.418212890625, -11.97705078125, -11.535888671875, -11.0947265625, -10.653564453125, -10.21240234375, -9.771240234375, -9.330078125, -8.888916015625, -8.44775390625, -8.006591796875, -7.5654296875, -7.124267578125, -6.68310546875, -6.241943359375, -5.80078125, -5.359619140625, -4.91845703125, -4.477294921875, -4.0361328125, -3.594970703125, -3.15380859375, -2.712646484375, -2.271484375, -1.830322265625, -1.38916015625, -0.947998046875, -0.5068359375, -0.065673828125, 0.37548828125, 0.816650390625, 1.2578125, 1.698974609375, 2.14013671875, 2.581298828125, 3.0224609375, 3.463623046875, 3.90478515625, 4.345947265625, 4.787109375, 5.228271484375, 5.66943359375, 6.110595703125, 6.5517578125, 6.992919921875, 7.43408203125, 7.875244140625, 8.31640625, 8.757568359375, 9.19873046875, 9.639892578125, 10.0810546875, 10.522216796875, 10.96337890625, 11.404541015625, 11.845703125, 12.286865234375, 12.72802734375, 13.169189453125, 13.6103515625, 14.051513671875, 14.49267578125, 14.933837890625, 15.375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 18.0, 23.0, 33.0, 45.0, 48.0, 73.0, 61.0, 75.0, 89.0, 75.0, 95.0, 81.0, 63.0, 76.0, 36.0, 30.0, 22.0, 20.0, 9.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.7821044921875, -8.322021484375, -7.8619384765625, -7.40185546875, -6.9417724609375, -6.481689453125, -6.0216064453125, -5.5615234375, -5.1014404296875, -4.641357421875, -4.1812744140625, -3.72119140625, -3.2611083984375, -2.801025390625, -2.3409423828125, -1.880859375, -1.4207763671875, -0.960693359375, -0.5006103515625, -0.04052734375, 0.4195556640625, 0.879638671875, 1.3397216796875, 1.7998046875, 2.2598876953125, 2.719970703125, 3.1800537109375, 3.64013671875, 4.1002197265625, 4.560302734375, 5.0203857421875, 5.48046875, 5.9405517578125, 6.400634765625, 6.8607177734375, 7.32080078125, 7.7808837890625, 8.240966796875, 8.7010498046875, 9.1611328125, 9.6212158203125, 10.081298828125, 10.5413818359375, 11.00146484375, 11.4615478515625, 11.921630859375, 12.3817138671875, 12.841796875, 13.3018798828125, 13.761962890625, 14.2220458984375, 14.68212890625, 15.1422119140625, 15.602294921875, 16.0623779296875, 16.5224609375, 16.9825439453125, 17.442626953125, 17.9027099609375, 18.36279296875, 18.8228759765625, 19.282958984375, 19.7430419921875, 20.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 13.0, 11.0, 18.0, 26.0, 49.0, 57.0, 113.0, 230.0, 425.0, 976.0, 2402.0, 6760.0, 23376.0, 106262.0, 1004354.0, 2753207.0, 235013.0, 42635.0, 11734.0, 3880.0, 1451.0, 609.0, 273.0, 161.0, 71.0, 47.0, 42.0, 30.0, 18.0, 14.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.078125, -24.421875, -23.765625, -23.109375, -22.453125, -21.796875, -21.140625, -20.484375, -19.828125, -19.171875, -18.515625, -17.859375, -17.203125, -16.546875, -15.890625, -15.234375, -14.578125, -13.921875, -13.265625, -12.609375, -11.953125, -11.296875, -10.640625, -9.984375, -9.328125, -8.671875, -8.015625, -7.359375, -6.703125, -6.046875, -5.390625, -4.734375, -4.078125, -3.421875, -2.765625, -2.109375, -1.453125, -0.796875, -0.140625, 0.515625, 1.171875, 1.828125, 2.484375, 3.140625, 3.796875, 4.453125, 5.109375, 5.765625, 6.421875, 7.078125, 7.734375, 8.390625, 9.046875, 9.703125, 10.359375, 11.015625, 11.671875, 12.328125, 12.984375, 13.640625, 14.296875, 14.953125, 15.609375, 16.265625, 16.921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 10.0, 10.0, 17.0, 10.0, 18.0, 24.0, 41.0, 56.0, 77.0, 81.0, 138.0, 162.0, 268.0, 391.0, 526.0, 603.0, 510.0, 304.0, 215.0, 151.0, 104.0, 83.0, 63.0, 44.0, 25.0, 20.0, 19.0, 24.0, 8.0, 10.0, 8.0, 4.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.70703125, -20.0859375, -19.46484375, -18.84375, -18.22265625, -17.6015625, -16.98046875, -16.359375, -15.73828125, -15.1171875, -14.49609375, -13.875, -13.25390625, -12.6328125, -12.01171875, -11.390625, -10.76953125, -10.1484375, -9.52734375, -8.90625, -8.28515625, -7.6640625, -7.04296875, -6.421875, -5.80078125, -5.1796875, -4.55859375, -3.9375, -3.31640625, -2.6953125, -2.07421875, -1.453125, -0.83203125, -0.2109375, 0.41015625, 1.03125, 1.65234375, 2.2734375, 2.89453125, 3.515625, 4.13671875, 4.7578125, 5.37890625, 6.0, 6.62109375, 7.2421875, 7.86328125, 8.484375, 9.10546875, 9.7265625, 10.34765625, 10.96875, 11.58984375, 12.2109375, 12.83203125, 13.453125, 14.07421875, 14.6953125, 15.31640625, 15.9375, 16.55859375, 17.1796875, 17.80078125, 18.421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 14.0, 32.0, 57.0, 115.0, 191.0, 220.0, 146.0, 111.0, 47.0, 21.0, 17.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-387.7190246582031, -379.2105712890625, -370.7021484375, -362.1936950683594, -353.68524169921875, -345.17681884765625, -336.6683654785156, -328.159912109375, -319.6514892578125, -311.1430358886719, -302.6346130371094, -294.12615966796875, -285.6177062988281, -277.1092529296875, -268.600830078125, -260.0923767089844, -251.58392333984375, -243.0754852294922, -234.56703186035156, -226.05859375, -217.55014038085938, -209.0417022705078, -200.53326416015625, -192.02481079101562, -183.51637268066406, -175.0079345703125, -166.49948120117188, -157.9910430908203, -149.48260498046875, -140.97415161132812, -132.46571350097656, -123.95726776123047, -115.44882202148438, -106.94037628173828, -98.43193054199219, -89.92349243164062, -81.41504669189453, -72.90660095214844, -64.39816284179688, -55.88971710205078, -47.38127136230469, -38.872825622558594, -30.364383697509766, -21.855939865112305, -13.347496032714844, -4.83905029296875, 3.669391632080078, 12.177833557128906, 20.686279296875, 29.19472312927246, 37.70316696166992, 46.21160888671875, 54.720054626464844, 63.22850036621094, 71.7369384765625, 80.2453842163086, 88.75382995605469, 97.26227569580078, 105.77072143554688, 114.27915954589844, 122.78760528564453, 131.29605102539062, 139.8044891357422, 148.31292724609375, 156.82138061523438]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 9.0, 11.0, 17.0, 21.0, 28.0, 54.0, 38.0, 63.0, 70.0, 62.0, 73.0, 64.0, 84.0, 73.0, 69.0, 60.0, 43.0, 36.0, 35.0, 22.0, 20.0, 10.0, 9.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.76797485351562, -186.1566162109375, -180.5452423095703, -174.9338836669922, -169.322509765625, -163.71115112304688, -158.09979248046875, -152.48841857910156, -146.87705993652344, -141.2657012939453, -135.65432739257812, -130.04296875, -124.43160247802734, -118.82023620605469, -113.20886993408203, -107.59750366210938, -101.98613739013672, -96.37477111816406, -90.7634048461914, -85.15203857421875, -79.54067993164062, -73.92931365966797, -68.31794738769531, -62.70658493041992, -57.095218658447266, -51.48385238647461, -45.87248992919922, -40.26112365722656, -34.649757385253906, -29.038394927978516, -23.42702865600586, -17.81566619873047, -12.204299926757812, -6.592935085296631, -0.9815702438354492, 4.629795074462891, 10.241159439086914, 15.852523803710938, 21.463890075683594, 27.075252532958984, 32.68661880493164, 38.2979850769043, 43.90934753417969, 49.520713806152344, 55.132080078125, 60.74344253540039, 66.35481262207031, 71.96617126464844, 77.5775375366211, 83.18890380859375, 88.8002700805664, 94.41163635253906, 100.02299499511719, 105.63436126708984, 111.2457275390625, 116.85708618164062, 122.46846008300781, 128.07981872558594, 133.69119262695312, 139.30255126953125, 144.91392517089844, 150.52528381347656, 156.13665771484375, 161.74801635742188, 167.359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 6.0, 11.0, 16.0, 17.0, 24.0, 51.0, 55.0, 71.0, 127.0, 180.0, 340.0, 542.0, 887.0, 1668.0, 3149.0, 6180.0, 12952.0, 27516.0, 58961.0, 127150.0, 261667.0, 280633.0, 140905.0, 65970.0, 30837.0, 14005.0, 6923.0, 3430.0, 1699.0, 992.0, 561.0, 372.0, 218.0, 142.0, 93.0, 56.0, 39.0, 35.0, 22.0, 16.0, 12.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -14.7515869140625, -14.260986328125, -13.7703857421875, -13.27978515625, -12.7891845703125, -12.298583984375, -11.8079833984375, -11.3173828125, -10.8267822265625, -10.336181640625, -9.8455810546875, -9.35498046875, -8.8643798828125, -8.373779296875, -7.8831787109375, -7.392578125, -6.9019775390625, -6.411376953125, -5.9207763671875, -5.43017578125, -4.9395751953125, -4.448974609375, -3.9583740234375, -3.4677734375, -2.9771728515625, -2.486572265625, -1.9959716796875, -1.50537109375, -1.0147705078125, -0.524169921875, -0.0335693359375, 0.45703125, 0.9476318359375, 1.438232421875, 1.9288330078125, 2.41943359375, 2.9100341796875, 3.400634765625, 3.8912353515625, 4.3818359375, 4.8724365234375, 5.363037109375, 5.8536376953125, 6.34423828125, 6.8348388671875, 7.325439453125, 7.8160400390625, 8.306640625, 8.7972412109375, 9.287841796875, 9.7784423828125, 10.26904296875, 10.7596435546875, 11.250244140625, 11.7408447265625, 12.2314453125, 12.7220458984375, 13.212646484375, 13.7032470703125, 14.19384765625, 14.6844482421875, 15.175048828125, 15.6656494140625, 16.15625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 7.0, 14.0, 11.0, 17.0, 20.0, 22.0, 27.0, 29.0, 28.0, 21.0, 31.0, 33.0, 53.0, 46.0, 53.0, 46.0, 61.0, 47.0, 33.0, 53.0, 31.0, 41.0, 38.0, 36.0, 24.0, 24.0, 23.0, 18.0, 20.0, 12.0, 11.0, 7.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.125, -8.86468505859375, -8.6043701171875, -8.34405517578125, -8.083740234375, -7.82342529296875, -7.5631103515625, -7.30279541015625, -7.04248046875, -6.78216552734375, -6.5218505859375, -6.26153564453125, -6.001220703125, -5.74090576171875, -5.4805908203125, -5.22027587890625, -4.9599609375, -4.69964599609375, -4.4393310546875, -4.17901611328125, -3.918701171875, -3.65838623046875, -3.3980712890625, -3.13775634765625, -2.87744140625, -2.61712646484375, -2.3568115234375, -2.09649658203125, -1.836181640625, -1.57586669921875, -1.3155517578125, -1.05523681640625, -0.794921875, -0.53460693359375, -0.2742919921875, -0.01397705078125, 0.246337890625, 0.50665283203125, 0.7669677734375, 1.02728271484375, 1.28759765625, 1.54791259765625, 1.8082275390625, 2.06854248046875, 2.328857421875, 2.58917236328125, 2.8494873046875, 3.10980224609375, 3.3701171875, 3.63043212890625, 3.8907470703125, 4.15106201171875, 4.411376953125, 4.67169189453125, 4.9320068359375, 5.19232177734375, 5.45263671875, 5.71295166015625, 5.9732666015625, 6.23358154296875, 6.493896484375, 6.75421142578125, 7.0145263671875, 7.27484130859375, 7.53515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 4.0, 5.0, 3.0, 3.0, 11.0, 13.0, 19.0, 24.0, 42.0, 31.0, 64.0, 100.0, 133.0, 193.0, 354.0, 628.0, 1224.0, 2548.0, 8022.0, 59406.0, 783701.0, 169481.0, 15199.0, 3737.0, 1576.0, 822.0, 471.0, 257.0, 135.0, 112.0, 68.0, 54.0, 28.0, 23.0, 15.0, 13.0, 10.0, 7.0, 2.0, 3.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.34619140625, -46.6611328125, -44.97607421875, -43.291015625, -41.60595703125, -39.9208984375, -38.23583984375, -36.55078125, -34.86572265625, -33.1806640625, -31.49560546875, -29.810546875, -28.12548828125, -26.4404296875, -24.75537109375, -23.0703125, -21.38525390625, -19.7001953125, -18.01513671875, -16.330078125, -14.64501953125, -12.9599609375, -11.27490234375, -9.58984375, -7.90478515625, -6.2197265625, -4.53466796875, -2.849609375, -1.16455078125, 0.5205078125, 2.20556640625, 3.890625, 5.57568359375, 7.2607421875, 8.94580078125, 10.630859375, 12.31591796875, 14.0009765625, 15.68603515625, 17.37109375, 19.05615234375, 20.7412109375, 22.42626953125, 24.111328125, 25.79638671875, 27.4814453125, 29.16650390625, 30.8515625, 32.53662109375, 34.2216796875, 35.90673828125, 37.591796875, 39.27685546875, 40.9619140625, 42.64697265625, 44.33203125, 46.01708984375, 47.7021484375, 49.38720703125, 51.072265625, 52.75732421875, 54.4423828125, 56.12744140625, 57.8125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 11.0, 4.0, 9.0, 10.0, 20.0, 18.0, 22.0, 32.0, 30.0, 43.0, 43.0, 38.0, 53.0, 63.0, 64.0, 61.0, 50.0, 49.0, 44.0, 49.0, 41.0, 38.0, 34.0, 19.0, 23.0, 27.0, 17.0, 18.0, 19.0, 11.0, 9.0, 7.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -39.041015625, -37.67578125, -36.310546875, -34.9453125, -33.580078125, -32.21484375, -30.849609375, -29.484375, -28.119140625, -26.75390625, -25.388671875, -24.0234375, -22.658203125, -21.29296875, -19.927734375, -18.5625, -17.197265625, -15.83203125, -14.466796875, -13.1015625, -11.736328125, -10.37109375, -9.005859375, -7.640625, -6.275390625, -4.91015625, -3.544921875, -2.1796875, -0.814453125, 0.55078125, 1.916015625, 3.28125, 4.646484375, 6.01171875, 7.376953125, 8.7421875, 10.107421875, 11.47265625, 12.837890625, 14.203125, 15.568359375, 16.93359375, 18.298828125, 19.6640625, 21.029296875, 22.39453125, 23.759765625, 25.125, 26.490234375, 27.85546875, 29.220703125, 30.5859375, 31.951171875, 33.31640625, 34.681640625, 36.046875, 37.412109375, 38.77734375, 40.142578125, 41.5078125, 42.873046875, 44.23828125, 45.603515625, 46.96875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 11.0, 8.0, 15.0, 15.0, 19.0, 53.0, 85.0, 194.0, 448.0, 1451.0, 6795.0, 84091.0, 865932.0, 80445.0, 6541.0, 1499.0, 500.0, 205.0, 87.0, 54.0, 28.0, 17.0, 17.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.640625, -21.047607421875, -20.45458984375, -19.861572265625, -19.2685546875, -18.675537109375, -18.08251953125, -17.489501953125, -16.896484375, -16.303466796875, -15.71044921875, -15.117431640625, -14.5244140625, -13.931396484375, -13.33837890625, -12.745361328125, -12.15234375, -11.559326171875, -10.96630859375, -10.373291015625, -9.7802734375, -9.187255859375, -8.59423828125, -8.001220703125, -7.408203125, -6.815185546875, -6.22216796875, -5.629150390625, -5.0361328125, -4.443115234375, -3.85009765625, -3.257080078125, -2.6640625, -2.071044921875, -1.47802734375, -0.885009765625, -0.2919921875, 0.301025390625, 0.89404296875, 1.487060546875, 2.080078125, 2.673095703125, 3.26611328125, 3.859130859375, 4.4521484375, 5.045166015625, 5.63818359375, 6.231201171875, 6.82421875, 7.417236328125, 8.01025390625, 8.603271484375, 9.1962890625, 9.789306640625, 10.38232421875, 10.975341796875, 11.568359375, 12.161376953125, 12.75439453125, 13.347412109375, 13.9404296875, 14.533447265625, 15.12646484375, 15.719482421875, 16.3125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 10.0, 11.0, 7.0, 12.0, 20.0, 15.0, 25.0, 28.0, 28.0, 52.0, 49.0, 67.0, 95.0, 111.0, 91.0, 53.0, 56.0, 39.0, 35.0, 24.0, 24.0, 23.0, 18.0, 9.0, 10.0, 13.0, 5.0, 3.0, 7.0, 10.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0018405914306640625, -0.0017780065536499023, -0.0017154216766357422, -0.001652836799621582, -0.0015902519226074219, -0.0015276670455932617, -0.0014650821685791016, -0.0014024972915649414, -0.0013399124145507812, -0.001277327537536621, -0.001214742660522461, -0.0011521577835083008, -0.0010895729064941406, -0.0010269880294799805, -0.0009644031524658203, -0.0009018182754516602, -0.0008392333984375, -0.0007766485214233398, -0.0007140636444091797, -0.0006514787673950195, -0.0005888938903808594, -0.0005263090133666992, -0.00046372413635253906, -0.0004011392593383789, -0.00033855438232421875, -0.0002759695053100586, -0.00021338462829589844, -0.00015079975128173828, -8.821487426757812e-05, -2.562999725341797e-05, 3.695487976074219e-05, 9.953975677490234e-05, 0.0001621246337890625, 0.00022470951080322266, 0.0002872943878173828, 0.00034987926483154297, 0.0004124641418457031, 0.0004750490188598633, 0.0005376338958740234, 0.0006002187728881836, 0.0006628036499023438, 0.0007253885269165039, 0.0007879734039306641, 0.0008505582809448242, 0.0009131431579589844, 0.0009757280349731445, 0.0010383129119873047, 0.0011008977890014648, 0.001163482666015625, 0.0012260675430297852, 0.0012886524200439453, 0.0013512372970581055, 0.0014138221740722656, 0.0014764070510864258, 0.001538991928100586, 0.001601576805114746, 0.0016641616821289062, 0.0017267465591430664, 0.0017893314361572266, 0.0018519163131713867, 0.0019145011901855469, 0.001977086067199707, 0.002039670944213867, 0.0021022558212280273, 0.0021648406982421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 12.0, 11.0, 11.0, 25.0, 36.0, 58.0, 76.0, 113.0, 190.0, 278.0, 546.0, 1005.0, 2402.0, 7342.0, 43846.0, 638656.0, 316859.0, 27441.0, 5529.0, 1981.0, 862.0, 456.0, 292.0, 146.0, 120.0, 75.0, 58.0, 31.0, 25.0, 21.0, 9.0, 10.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.1015625, -12.72607421875, -12.3505859375, -11.97509765625, -11.599609375, -11.22412109375, -10.8486328125, -10.47314453125, -10.09765625, -9.72216796875, -9.3466796875, -8.97119140625, -8.595703125, -8.22021484375, -7.8447265625, -7.46923828125, -7.09375, -6.71826171875, -6.3427734375, -5.96728515625, -5.591796875, -5.21630859375, -4.8408203125, -4.46533203125, -4.08984375, -3.71435546875, -3.3388671875, -2.96337890625, -2.587890625, -2.21240234375, -1.8369140625, -1.46142578125, -1.0859375, -0.71044921875, -0.3349609375, 0.04052734375, 0.416015625, 0.79150390625, 1.1669921875, 1.54248046875, 1.91796875, 2.29345703125, 2.6689453125, 3.04443359375, 3.419921875, 3.79541015625, 4.1708984375, 4.54638671875, 4.921875, 5.29736328125, 5.6728515625, 6.04833984375, 6.423828125, 6.79931640625, 7.1748046875, 7.55029296875, 7.92578125, 8.30126953125, 8.6767578125, 9.05224609375, 9.427734375, 9.80322265625, 10.1787109375, 10.55419921875, 10.9296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 7.0, 6.0, 5.0, 12.0, 17.0, 22.0, 24.0, 27.0, 37.0, 41.0, 45.0, 54.0, 68.0, 65.0, 71.0, 59.0, 55.0, 55.0, 51.0, 48.0, 31.0, 39.0, 28.0, 27.0, 19.0, 23.0, 10.0, 8.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.0, -7.76959228515625, -7.5391845703125, -7.30877685546875, -7.078369140625, -6.84796142578125, -6.6175537109375, -6.38714599609375, -6.15673828125, -5.92633056640625, -5.6959228515625, -5.46551513671875, -5.235107421875, -5.00469970703125, -4.7742919921875, -4.54388427734375, -4.3134765625, -4.08306884765625, -3.8526611328125, -3.62225341796875, -3.391845703125, -3.16143798828125, -2.9310302734375, -2.70062255859375, -2.47021484375, -2.23980712890625, -2.0093994140625, -1.77899169921875, -1.548583984375, -1.31817626953125, -1.0877685546875, -0.85736083984375, -0.626953125, -0.39654541015625, -0.1661376953125, 0.06427001953125, 0.294677734375, 0.52508544921875, 0.7554931640625, 0.98590087890625, 1.21630859375, 1.44671630859375, 1.6771240234375, 1.90753173828125, 2.137939453125, 2.36834716796875, 2.5987548828125, 2.82916259765625, 3.0595703125, 3.28997802734375, 3.5203857421875, 3.75079345703125, 3.981201171875, 4.21160888671875, 4.4420166015625, 4.67242431640625, 4.90283203125, 5.13323974609375, 5.3636474609375, 5.59405517578125, 5.824462890625, 6.05487060546875, 6.2852783203125, 6.51568603515625, 6.74609375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 15.0, 17.0, 35.0, 54.0, 88.0, 102.0, 179.0, 177.0, 121.0, 75.0, 61.0, 35.0, 9.0, 9.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.99990844726562, -203.25262451171875, -196.50535583496094, -189.75807189941406, -183.0107879638672, -176.26351928710938, -169.5162353515625, -162.76895141601562, -156.0216827392578, -149.27439880371094, -142.52713012695312, -135.77984619140625, -129.03256225585938, -122.28529357910156, -115.53800964355469, -108.79073333740234, -102.04344940185547, -95.29617309570312, -88.54888916015625, -81.8016128540039, -75.05433654785156, -68.30705261230469, -61.559776306152344, -54.8125, -48.06521987915039, -41.31793975830078, -34.57066345214844, -27.823383331298828, -21.07610511779785, -14.328826904296875, -7.581546783447266, -0.8342704772949219, 5.9130096435546875, 12.660287857055664, 19.40756607055664, 26.15484619140625, 32.902122497558594, 39.6494026184082, 46.39668273925781, 53.143959045410156, 59.891239166259766, 66.63851928710938, 73.38579559326172, 80.13307189941406, 86.88035583496094, 93.62763214111328, 100.37490844726562, 107.1221923828125, 113.86946868896484, 120.61674499511719, 127.36402893066406, 134.11129760742188, 140.85858154296875, 147.60586547851562, 154.3531494140625, 161.1004180908203, 167.8477020263672, 174.59498596191406, 181.34225463867188, 188.08953857421875, 194.83682250976562, 201.58409118652344, 208.3313751220703, 215.07864379882812, 221.825927734375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 5.0, 3.0, 12.0, 7.0, 6.0, 12.0, 8.0, 8.0, 20.0, 13.0, 12.0, 18.0, 24.0, 24.0, 19.0, 29.0, 41.0, 42.0, 33.0, 46.0, 45.0, 58.0, 63.0, 43.0, 50.0, 40.0, 37.0, 31.0, 33.0, 16.0, 26.0, 21.0, 19.0, 17.0, 19.0, 14.0, 17.0, 6.0, 14.0, 5.0, 6.0, 7.0, 3.0, 6.0, 3.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.57177734375, -107.85650634765625, -104.14122772216797, -100.42595672607422, -96.71067810058594, -92.99540710449219, -89.28013610839844, -85.56485748291016, -81.8495864868164, -78.13431549072266, -74.41903686523438, -70.70376586914062, -66.98848724365234, -63.273216247558594, -59.55794143676758, -55.84266662597656, -52.12739181518555, -48.41211700439453, -44.696842193603516, -40.9815673828125, -37.26629638671875, -33.551021575927734, -29.83574676513672, -26.120473861694336, -22.40519905090332, -18.689924240112305, -14.974651336669922, -11.259376525878906, -7.544102668762207, -3.828828811645508, -0.11355400085449219, 3.6017189025878906, 7.316993713378906, 11.032267570495605, 14.747541427612305, 18.46281623840332, 22.178089141845703, 25.89336395263672, 29.608638763427734, 33.32391357421875, 37.0391845703125, 40.754459381103516, 44.46973419189453, 48.18500518798828, 51.9002799987793, 55.61555480957031, 59.33082962036133, 63.046104431152344, 66.76138305664062, 70.47665405273438, 74.19193267822266, 77.9072036743164, 81.62248229980469, 85.33775329589844, 89.05302429199219, 92.76830291748047, 96.48357391357422, 100.19884490966797, 103.91412353515625, 107.62939453125, 111.34467315673828, 115.05994415283203, 118.77522277832031, 122.49049377441406, 126.20576477050781]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 13.0, 24.0, 25.0, 46.0, 79.0, 123.0, 238.0, 523.0, 1121.0, 2725.0, 7525.0, 26153.0, 128974.0, 1537959.0, 2255109.0, 185679.0, 32980.0, 9229.0, 3272.0, 1250.0, 577.0, 282.0, 151.0, 91.0, 37.0, 32.0, 25.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8984375, -15.3870849609375, -14.875732421875, -14.3643798828125, -13.85302734375, -13.3416748046875, -12.830322265625, -12.3189697265625, -11.8076171875, -11.2962646484375, -10.784912109375, -10.2735595703125, -9.76220703125, -9.2508544921875, -8.739501953125, -8.2281494140625, -7.716796875, -7.2054443359375, -6.694091796875, -6.1827392578125, -5.67138671875, -5.1600341796875, -4.648681640625, -4.1373291015625, -3.6259765625, -3.1146240234375, -2.603271484375, -2.0919189453125, -1.58056640625, -1.0692138671875, -0.557861328125, -0.0465087890625, 0.46484375, 0.9761962890625, 1.487548828125, 1.9989013671875, 2.51025390625, 3.0216064453125, 3.532958984375, 4.0443115234375, 4.5556640625, 5.0670166015625, 5.578369140625, 6.0897216796875, 6.60107421875, 7.1124267578125, 7.623779296875, 8.1351318359375, 8.646484375, 9.1578369140625, 9.669189453125, 10.1805419921875, 10.69189453125, 11.2032470703125, 11.714599609375, 12.2259521484375, 12.7373046875, 13.2486572265625, 13.760009765625, 14.2713623046875, 14.78271484375, 15.2940673828125, 15.805419921875, 16.3167724609375, 16.828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 9.0, 4.0, 14.0, 18.0, 19.0, 19.0, 21.0, 29.0, 36.0, 41.0, 37.0, 37.0, 50.0, 54.0, 66.0, 55.0, 53.0, 48.0, 40.0, 43.0, 45.0, 43.0, 35.0, 25.0, 29.0, 27.0, 21.0, 9.0, 12.0, 14.0, 5.0, 11.0, 3.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.953125, -8.6717529296875, -8.390380859375, -8.1090087890625, -7.82763671875, -7.5462646484375, -7.264892578125, -6.9835205078125, -6.7021484375, -6.4207763671875, -6.139404296875, -5.8580322265625, -5.57666015625, -5.2952880859375, -5.013916015625, -4.7325439453125, -4.451171875, -4.1697998046875, -3.888427734375, -3.6070556640625, -3.32568359375, -3.0443115234375, -2.762939453125, -2.4815673828125, -2.2001953125, -1.9188232421875, -1.637451171875, -1.3560791015625, -1.07470703125, -0.7933349609375, -0.511962890625, -0.2305908203125, 0.05078125, 0.3321533203125, 0.613525390625, 0.8948974609375, 1.17626953125, 1.4576416015625, 1.739013671875, 2.0203857421875, 2.3017578125, 2.5831298828125, 2.864501953125, 3.1458740234375, 3.42724609375, 3.7086181640625, 3.989990234375, 4.2713623046875, 4.552734375, 4.8341064453125, 5.115478515625, 5.3968505859375, 5.67822265625, 5.9595947265625, 6.240966796875, 6.5223388671875, 6.8037109375, 7.0850830078125, 7.366455078125, 7.6478271484375, 7.92919921875, 8.2105712890625, 8.491943359375, 8.7733154296875, 9.0546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 8.0, 3.0, 16.0, 12.0, 28.0, 38.0, 77.0, 146.0, 308.0, 637.0, 1476.0, 4008.0, 14277.0, 76936.0, 1282585.0, 2650944.0, 130460.0, 22837.0, 5879.0, 2064.0, 785.0, 356.0, 176.0, 90.0, 53.0, 35.0, 17.0, 10.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.453125, -25.57470703125, -24.6962890625, -23.81787109375, -22.939453125, -22.06103515625, -21.1826171875, -20.30419921875, -19.42578125, -18.54736328125, -17.6689453125, -16.79052734375, -15.912109375, -15.03369140625, -14.1552734375, -13.27685546875, -12.3984375, -11.52001953125, -10.6416015625, -9.76318359375, -8.884765625, -8.00634765625, -7.1279296875, -6.24951171875, -5.37109375, -4.49267578125, -3.6142578125, -2.73583984375, -1.857421875, -0.97900390625, -0.1005859375, 0.77783203125, 1.65625, 2.53466796875, 3.4130859375, 4.29150390625, 5.169921875, 6.04833984375, 6.9267578125, 7.80517578125, 8.68359375, 9.56201171875, 10.4404296875, 11.31884765625, 12.197265625, 13.07568359375, 13.9541015625, 14.83251953125, 15.7109375, 16.58935546875, 17.4677734375, 18.34619140625, 19.224609375, 20.10302734375, 20.9814453125, 21.85986328125, 22.73828125, 23.61669921875, 24.4951171875, 25.37353515625, 26.251953125, 27.13037109375, 28.0087890625, 28.88720703125, 29.765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 9.0, 13.0, 20.0, 24.0, 32.0, 34.0, 70.0, 113.0, 163.0, 270.0, 375.0, 537.0, 717.0, 590.0, 361.0, 223.0, 136.0, 69.0, 77.0, 62.0, 34.0, 31.0, 20.0, 16.0, 11.0, 13.0, 4.0, 9.0, 4.0, 1.0, 6.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.453125, -22.729736328125, -22.00634765625, -21.282958984375, -20.5595703125, -19.836181640625, -19.11279296875, -18.389404296875, -17.666015625, -16.942626953125, -16.21923828125, -15.495849609375, -14.7724609375, -14.049072265625, -13.32568359375, -12.602294921875, -11.87890625, -11.155517578125, -10.43212890625, -9.708740234375, -8.9853515625, -8.261962890625, -7.53857421875, -6.815185546875, -6.091796875, -5.368408203125, -4.64501953125, -3.921630859375, -3.1982421875, -2.474853515625, -1.75146484375, -1.028076171875, -0.3046875, 0.418701171875, 1.14208984375, 1.865478515625, 2.5888671875, 3.312255859375, 4.03564453125, 4.759033203125, 5.482421875, 6.205810546875, 6.92919921875, 7.652587890625, 8.3759765625, 9.099365234375, 9.82275390625, 10.546142578125, 11.26953125, 11.992919921875, 12.71630859375, 13.439697265625, 14.1630859375, 14.886474609375, 15.60986328125, 16.333251953125, 17.056640625, 17.780029296875, 18.50341796875, 19.226806640625, 19.9501953125, 20.673583984375, 21.39697265625, 22.120361328125, 22.84375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 11.0, 25.0, 64.0, 123.0, 150.0, 164.0, 144.0, 128.0, 83.0, 39.0, 25.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-236.2582550048828, -228.53550720214844, -220.812744140625, -213.08999633789062, -205.36724853515625, -197.6444854736328, -189.92173767089844, -182.198974609375, -174.47622680664062, -166.75347900390625, -159.0307159423828, -151.30796813964844, -143.585205078125, -135.86245727539062, -128.13970947265625, -120.41695404052734, -112.69419860839844, -104.97144317626953, -97.24868774414062, -89.52593994140625, -81.80318450927734, -74.08042907714844, -66.35768127441406, -58.634925842285156, -50.91217041015625, -43.189414978027344, -35.4666633605957, -27.74390983581543, -20.021156311035156, -12.29840087890625, -4.575649261474609, 3.1471023559570312, 10.869873046875, 18.592626571655273, 26.315380096435547, 34.03813171386719, 41.760887145996094, 49.483642578125, 57.20639419555664, 64.92914581298828, 72.65190124511719, 80.3746566772461, 88.097412109375, 95.82015991210938, 103.54291534423828, 111.26567077636719, 118.98841857910156, 126.71117401123047, 134.43392944335938, 142.15667724609375, 149.8794403076172, 157.60218811035156, 165.324951171875, 173.04769897460938, 180.77044677734375, 188.49319458007812, 196.21595764160156, 203.93870544433594, 211.66146850585938, 219.38421630859375, 227.10696411132812, 234.82972717285156, 242.55247497558594, 250.27523803710938, 257.99798583984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 8.0, 15.0, 9.0, 17.0, 17.0, 8.0, 21.0, 18.0, 27.0, 36.0, 21.0, 49.0, 36.0, 58.0, 33.0, 41.0, 36.0, 47.0, 50.0, 52.0, 32.0, 34.0, 43.0, 49.0, 31.0, 29.0, 39.0, 21.0, 21.0, 13.0, 16.0, 12.0, 13.0, 14.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-109.94772338867188, -106.66331481933594, -103.37890625, -100.09449768066406, -96.81008911132812, -93.52568054199219, -90.24127197265625, -86.95685577392578, -83.67244720458984, -80.3880386352539, -77.10363006591797, -73.81922149658203, -70.5348129272461, -67.25039672851562, -63.96599197387695, -60.68157958984375, -57.39717483520508, -54.11276626586914, -50.8283576965332, -47.5439453125, -44.25953674316406, -40.975128173828125, -37.69071960449219, -34.40631103515625, -31.12190055847168, -27.837491989135742, -24.553081512451172, -21.268672943115234, -17.984264373779297, -14.699853897094727, -11.415445327758789, -8.131034851074219, -4.846626281738281, -1.5622169971466064, 1.7221922874450684, 5.006601333618164, 8.291010856628418, 11.575420379638672, 14.85982894897461, 18.14423942565918, 21.428647994995117, 24.713056564331055, 27.997467041015625, 31.281875610351562, 34.5662841796875, 37.85069274902344, 41.135101318359375, 44.41951370239258, 47.703922271728516, 50.98833084106445, 54.27273941040039, 57.557151794433594, 60.84156036376953, 64.12596893310547, 67.4103775024414, 70.69478607177734, 73.97919464111328, 77.26360321044922, 80.54801177978516, 83.8324203491211, 87.11682891845703, 90.4012451171875, 93.68565368652344, 96.97006225585938, 100.25447082519531]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 10.0, 19.0, 12.0, 25.0, 47.0, 58.0, 87.0, 136.0, 250.0, 345.0, 539.0, 892.0, 1500.0, 2559.0, 4573.0, 8199.0, 15835.0, 31512.0, 65515.0, 144740.0, 287233.0, 255090.0, 118550.0, 54101.0, 26469.0, 13404.0, 7049.0, 4025.0, 2248.0, 1310.0, 817.0, 478.0, 324.0, 176.0, 131.0, 81.0, 74.0, 45.0, 28.0, 14.0, 15.0, 11.0, 5.0, 2.0, 8.0, 2.0, 1.0, 4.0, 2.0, 1.0], "bins": [-15.53125, -15.0859375, -14.640625, -14.1953125, -13.75, -13.3046875, -12.859375, -12.4140625, -11.96875, -11.5234375, -11.078125, -10.6328125, -10.1875, -9.7421875, -9.296875, -8.8515625, -8.40625, -7.9609375, -7.515625, -7.0703125, -6.625, -6.1796875, -5.734375, -5.2890625, -4.84375, -4.3984375, -3.953125, -3.5078125, -3.0625, -2.6171875, -2.171875, -1.7265625, -1.28125, -0.8359375, -0.390625, 0.0546875, 0.5, 0.9453125, 1.390625, 1.8359375, 2.28125, 2.7265625, 3.171875, 3.6171875, 4.0625, 4.5078125, 4.953125, 5.3984375, 5.84375, 6.2890625, 6.734375, 7.1796875, 7.625, 8.0703125, 8.515625, 8.9609375, 9.40625, 9.8515625, 10.296875, 10.7421875, 11.1875, 11.6328125, 12.078125, 12.5234375, 12.96875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 12.0, 7.0, 10.0, 13.0, 12.0, 23.0, 16.0, 24.0, 30.0, 41.0, 31.0, 40.0, 42.0, 34.0, 49.0, 47.0, 43.0, 34.0, 35.0, 43.0, 38.0, 42.0, 47.0, 34.0, 37.0, 50.0, 25.0, 21.0, 16.0, 26.0, 10.0, 15.0, 19.0, 6.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.921875, -8.6478271484375, -8.373779296875, -8.0997314453125, -7.82568359375, -7.5516357421875, -7.277587890625, -7.0035400390625, -6.7294921875, -6.4554443359375, -6.181396484375, -5.9073486328125, -5.63330078125, -5.3592529296875, -5.085205078125, -4.8111572265625, -4.537109375, -4.2630615234375, -3.989013671875, -3.7149658203125, -3.44091796875, -3.1668701171875, -2.892822265625, -2.6187744140625, -2.3447265625, -2.0706787109375, -1.796630859375, -1.5225830078125, -1.24853515625, -0.9744873046875, -0.700439453125, -0.4263916015625, -0.15234375, 0.1217041015625, 0.395751953125, 0.6697998046875, 0.94384765625, 1.2178955078125, 1.491943359375, 1.7659912109375, 2.0400390625, 2.3140869140625, 2.588134765625, 2.8621826171875, 3.13623046875, 3.4102783203125, 3.684326171875, 3.9583740234375, 4.232421875, 4.5064697265625, 4.780517578125, 5.0545654296875, 5.32861328125, 5.6026611328125, 5.876708984375, 6.1507568359375, 6.4248046875, 6.6988525390625, 6.972900390625, 7.2469482421875, 7.52099609375, 7.7950439453125, 8.069091796875, 8.3431396484375, 8.6171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 12.0, 10.0, 14.0, 19.0, 31.0, 30.0, 47.0, 61.0, 81.0, 99.0, 194.0, 259.0, 393.0, 657.0, 1069.0, 2140.0, 5073.0, 17493.0, 96416.0, 704505.0, 179430.0, 27498.0, 6951.0, 2654.0, 1294.0, 791.0, 463.0, 287.0, 177.0, 118.0, 84.0, 47.0, 39.0, 34.0, 13.0, 21.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-38.84375, -37.72265625, -36.6015625, -35.48046875, -34.359375, -33.23828125, -32.1171875, -30.99609375, -29.875, -28.75390625, -27.6328125, -26.51171875, -25.390625, -24.26953125, -23.1484375, -22.02734375, -20.90625, -19.78515625, -18.6640625, -17.54296875, -16.421875, -15.30078125, -14.1796875, -13.05859375, -11.9375, -10.81640625, -9.6953125, -8.57421875, -7.453125, -6.33203125, -5.2109375, -4.08984375, -2.96875, -1.84765625, -0.7265625, 0.39453125, 1.515625, 2.63671875, 3.7578125, 4.87890625, 6.0, 7.12109375, 8.2421875, 9.36328125, 10.484375, 11.60546875, 12.7265625, 13.84765625, 14.96875, 16.08984375, 17.2109375, 18.33203125, 19.453125, 20.57421875, 21.6953125, 22.81640625, 23.9375, 25.05859375, 26.1796875, 27.30078125, 28.421875, 29.54296875, 30.6640625, 31.78515625, 32.90625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 11.0, 11.0, 11.0, 18.0, 27.0, 22.0, 31.0, 46.0, 50.0, 57.0, 56.0, 65.0, 66.0, 64.0, 70.0, 57.0, 63.0, 44.0, 45.0, 36.0, 29.0, 30.0, 22.0, 16.0, 10.0, 10.0, 9.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.25, -47.78271484375, -46.3154296875, -44.84814453125, -43.380859375, -41.91357421875, -40.4462890625, -38.97900390625, -37.51171875, -36.04443359375, -34.5771484375, -33.10986328125, -31.642578125, -30.17529296875, -28.7080078125, -27.24072265625, -25.7734375, -24.30615234375, -22.8388671875, -21.37158203125, -19.904296875, -18.43701171875, -16.9697265625, -15.50244140625, -14.03515625, -12.56787109375, -11.1005859375, -9.63330078125, -8.166015625, -6.69873046875, -5.2314453125, -3.76416015625, -2.296875, -0.82958984375, 0.6376953125, 2.10498046875, 3.572265625, 5.03955078125, 6.5068359375, 7.97412109375, 9.44140625, 10.90869140625, 12.3759765625, 13.84326171875, 15.310546875, 16.77783203125, 18.2451171875, 19.71240234375, 21.1796875, 22.64697265625, 24.1142578125, 25.58154296875, 27.048828125, 28.51611328125, 29.9833984375, 31.45068359375, 32.91796875, 34.38525390625, 35.8525390625, 37.31982421875, 38.787109375, 40.25439453125, 41.7216796875, 43.18896484375, 44.65625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 6.0, 10.0, 5.0, 14.0, 11.0, 20.0, 32.0, 55.0, 94.0, 191.0, 357.0, 868.0, 2865.0, 13837.0, 127510.0, 803874.0, 84491.0, 10474.0, 2342.0, 761.0, 324.0, 177.0, 79.0, 47.0, 24.0, 21.0, 16.0, 17.0, 11.0, 12.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.274658203125, -15.86181640625, -15.448974609375, -15.0361328125, -14.623291015625, -14.21044921875, -13.797607421875, -13.384765625, -12.971923828125, -12.55908203125, -12.146240234375, -11.7333984375, -11.320556640625, -10.90771484375, -10.494873046875, -10.08203125, -9.669189453125, -9.25634765625, -8.843505859375, -8.4306640625, -8.017822265625, -7.60498046875, -7.192138671875, -6.779296875, -6.366455078125, -5.95361328125, -5.540771484375, -5.1279296875, -4.715087890625, -4.30224609375, -3.889404296875, -3.4765625, -3.063720703125, -2.65087890625, -2.238037109375, -1.8251953125, -1.412353515625, -0.99951171875, -0.586669921875, -0.173828125, 0.239013671875, 0.65185546875, 1.064697265625, 1.4775390625, 1.890380859375, 2.30322265625, 2.716064453125, 3.12890625, 3.541748046875, 3.95458984375, 4.367431640625, 4.7802734375, 5.193115234375, 5.60595703125, 6.018798828125, 6.431640625, 6.844482421875, 7.25732421875, 7.670166015625, 8.0830078125, 8.495849609375, 8.90869140625, 9.321533203125, 9.734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 5.0, 12.0, 11.0, 16.0, 22.0, 25.0, 18.0, 39.0, 77.0, 130.0, 143.0, 118.0, 107.0, 77.0, 53.0, 37.0, 27.0, 13.0, 19.0, 13.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022945404052734375, -0.002214968204498291, -0.0021353960037231445, -0.002055823802947998, -0.0019762516021728516, -0.001896679401397705, -0.0018171072006225586, -0.0017375349998474121, -0.0016579627990722656, -0.0015783905982971191, -0.0014988183975219727, -0.0014192461967468262, -0.0013396739959716797, -0.0012601017951965332, -0.0011805295944213867, -0.0011009573936462402, -0.0010213851928710938, -0.0009418129920959473, -0.0008622407913208008, -0.0007826685905456543, -0.0007030963897705078, -0.0006235241889953613, -0.0005439519882202148, -0.00046437978744506836, -0.0003848075866699219, -0.0003052353858947754, -0.0002256631851196289, -0.00014609098434448242, -6.651878356933594e-05, 1.3053417205810547e-05, 9.262561798095703e-05, 0.00017219781875610352, 0.00025177001953125, 0.0003313422203063965, 0.00041091442108154297, 0.0004904866218566895, 0.0005700588226318359, 0.0006496310234069824, 0.0007292032241821289, 0.0008087754249572754, 0.0008883476257324219, 0.0009679198265075684, 0.0010474920272827148, 0.0011270642280578613, 0.0012066364288330078, 0.0012862086296081543, 0.0013657808303833008, 0.0014453530311584473, 0.0015249252319335938, 0.0016044974327087402, 0.0016840696334838867, 0.0017636418342590332, 0.0018432140350341797, 0.0019227862358093262, 0.0020023584365844727, 0.002081930637359619, 0.0021615028381347656, 0.002241075038909912, 0.0023206472396850586, 0.002400219440460205, 0.0024797916412353516, 0.002559363842010498, 0.0026389360427856445, 0.002718508243560791, 0.0027980804443359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 4.0, 7.0, 15.0, 21.0, 25.0, 36.0, 66.0, 116.0, 198.0, 361.0, 714.0, 1591.0, 4217.0, 17275.0, 153733.0, 755797.0, 95625.0, 12519.0, 3447.0, 1358.0, 683.0, 318.0, 174.0, 81.0, 65.0, 33.0, 23.0, 16.0, 12.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.80859375, -5.49298095703125, -5.1773681640625, -4.86175537109375, -4.546142578125, -4.23052978515625, -3.9149169921875, -3.59930419921875, -3.28369140625, -2.96807861328125, -2.6524658203125, -2.33685302734375, -2.021240234375, -1.70562744140625, -1.3900146484375, -1.07440185546875, -0.7587890625, -0.44317626953125, -0.1275634765625, 0.18804931640625, 0.503662109375, 0.81927490234375, 1.1348876953125, 1.45050048828125, 1.76611328125, 2.08172607421875, 2.3973388671875, 2.71295166015625, 3.028564453125, 3.34417724609375, 3.6597900390625, 3.97540283203125, 4.291015625, 4.60662841796875, 4.9222412109375, 5.23785400390625, 5.553466796875, 5.86907958984375, 6.1846923828125, 6.50030517578125, 6.81591796875, 7.13153076171875, 7.4471435546875, 7.76275634765625, 8.078369140625, 8.39398193359375, 8.7095947265625, 9.02520751953125, 9.3408203125, 9.65643310546875, 9.9720458984375, 10.28765869140625, 10.603271484375, 10.91888427734375, 11.2344970703125, 11.55010986328125, 11.86572265625, 12.18133544921875, 12.4969482421875, 12.81256103515625, 13.128173828125, 13.44378662109375, 13.7593994140625, 14.07501220703125, 14.390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 11.0, 8.0, 14.0, 9.0, 15.0, 13.0, 38.0, 25.0, 38.0, 38.0, 58.0, 71.0, 62.0, 58.0, 79.0, 83.0, 89.0, 46.0, 60.0, 47.0, 25.0, 26.0, 17.0, 16.0, 17.0, 14.0, 4.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3984375, -5.181884765625, -4.96533203125, -4.748779296875, -4.5322265625, -4.315673828125, -4.09912109375, -3.882568359375, -3.666015625, -3.449462890625, -3.23291015625, -3.016357421875, -2.7998046875, -2.583251953125, -2.36669921875, -2.150146484375, -1.93359375, -1.717041015625, -1.50048828125, -1.283935546875, -1.0673828125, -0.850830078125, -0.63427734375, -0.417724609375, -0.201171875, 0.015380859375, 0.23193359375, 0.448486328125, 0.6650390625, 0.881591796875, 1.09814453125, 1.314697265625, 1.53125, 1.747802734375, 1.96435546875, 2.180908203125, 2.3974609375, 2.614013671875, 2.83056640625, 3.047119140625, 3.263671875, 3.480224609375, 3.69677734375, 3.913330078125, 4.1298828125, 4.346435546875, 4.56298828125, 4.779541015625, 4.99609375, 5.212646484375, 5.42919921875, 5.645751953125, 5.8623046875, 6.078857421875, 6.29541015625, 6.511962890625, 6.728515625, 6.945068359375, 7.16162109375, 7.378173828125, 7.5947265625, 7.811279296875, 8.02783203125, 8.244384765625, 8.4609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 9.0, 18.0, 26.0, 42.0, 42.0, 95.0, 88.0, 162.0, 145.0, 108.0, 71.0, 60.0, 45.0, 23.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.34353637695312, -129.54766845703125, -124.75180053710938, -119.9559326171875, -115.16007232666016, -110.36420440673828, -105.5683364868164, -100.77247619628906, -95.97660827636719, -91.18074035644531, -86.38487243652344, -81.58900451660156, -76.79314422607422, -71.99727630615234, -67.20140838623047, -62.40554428100586, -57.60967254638672, -52.813804626464844, -48.017940521240234, -43.22207260131836, -38.42620849609375, -33.630340576171875, -28.83447265625, -24.03860855102539, -19.242740631103516, -14.446874618530273, -9.651007652282715, -4.855140686035156, -0.05927467346191406, 4.736591339111328, 9.532459259033203, 14.328323364257812, 19.124191284179688, 23.92005729675293, 28.715923309326172, 33.51179122924805, 38.307655334472656, 43.10352325439453, 47.899391174316406, 52.695255279541016, 57.49112319946289, 62.286991119384766, 67.08285522460938, 71.87872314453125, 76.67459106445312, 81.470458984375, 86.26632690429688, 91.06218719482422, 95.8580551147461, 100.65392303466797, 105.44979095458984, 110.24565124511719, 115.04151916503906, 119.83738708496094, 124.63325500488281, 129.4291229248047, 134.22499084472656, 139.02085876464844, 143.8167266845703, 148.6125946044922, 153.40846252441406, 158.20431518554688, 163.00018310546875, 167.79605102539062, 172.5919189453125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 10.0, 8.0, 5.0, 8.0, 17.0, 14.0, 20.0, 28.0, 24.0, 22.0, 29.0, 29.0, 40.0, 57.0, 49.0, 71.0, 65.0, 60.0, 53.0, 42.0, 40.0, 41.0, 24.0, 31.0, 31.0, 18.0, 20.0, 14.0, 9.0, 16.0, 15.0, 16.0, 11.0, 13.0, 11.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-134.8965301513672, -130.94078063964844, -126.98502349853516, -123.0292739868164, -119.07351684570312, -115.11776733398438, -111.16201782226562, -107.20626068115234, -103.25050354003906, -99.29475402832031, -95.33899688720703, -91.38324737548828, -87.427490234375, -83.47174072265625, -79.5159912109375, -75.56023406982422, -71.60448455810547, -67.64873504638672, -63.69297790527344, -59.73722839355469, -55.781471252441406, -51.825721740722656, -47.86996841430664, -43.914215087890625, -39.95846176147461, -36.002708435058594, -32.04695510864258, -28.091203689575195, -24.13545036315918, -20.179697036743164, -16.22394561767578, -12.268192291259766, -8.31243896484375, -4.356686115264893, -0.40093326568603516, 3.554819107055664, 7.51057243347168, 11.466325759887695, 15.422077178955078, 19.377830505371094, 23.33358383178711, 27.289337158203125, 31.24509048461914, 35.200843811035156, 39.156593322753906, 43.11235046386719, 47.06809997558594, 51.02385330200195, 54.97960662841797, 58.935359954833984, 62.89111328125, 66.84686279296875, 70.80261993408203, 74.75836944580078, 78.71412658691406, 82.66987609863281, 86.62562561035156, 90.58137512207031, 94.5371322631836, 98.49288177490234, 102.44863891601562, 106.40438842773438, 110.36013793945312, 114.3158950805664, 118.27165222167969]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 13.0, 18.0, 29.0, 27.0, 32.0, 83.0, 87.0, 161.0, 213.0, 387.0, 704.0, 1200.0, 2277.0, 4474.0, 9704.0, 25516.0, 94732.0, 692234.0, 2582123.0, 646031.0, 90286.0, 24958.0, 9448.0, 4380.0, 2202.0, 1204.0, 677.0, 385.0, 243.0, 146.0, 107.0, 63.0, 43.0, 17.0, 19.0, 17.0, 8.0, 7.0, 7.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-13.3671875, -12.990478515625, -12.61376953125, -12.237060546875, -11.8603515625, -11.483642578125, -11.10693359375, -10.730224609375, -10.353515625, -9.976806640625, -9.60009765625, -9.223388671875, -8.8466796875, -8.469970703125, -8.09326171875, -7.716552734375, -7.33984375, -6.963134765625, -6.58642578125, -6.209716796875, -5.8330078125, -5.456298828125, -5.07958984375, -4.702880859375, -4.326171875, -3.949462890625, -3.57275390625, -3.196044921875, -2.8193359375, -2.442626953125, -2.06591796875, -1.689208984375, -1.3125, -0.935791015625, -0.55908203125, -0.182373046875, 0.1943359375, 0.571044921875, 0.94775390625, 1.324462890625, 1.701171875, 2.077880859375, 2.45458984375, 2.831298828125, 3.2080078125, 3.584716796875, 3.96142578125, 4.338134765625, 4.71484375, 5.091552734375, 5.46826171875, 5.844970703125, 6.2216796875, 6.598388671875, 6.97509765625, 7.351806640625, 7.728515625, 8.105224609375, 8.48193359375, 8.858642578125, 9.2353515625, 9.612060546875, 9.98876953125, 10.365478515625, 10.7421875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 6.0, 11.0, 8.0, 12.0, 16.0, 15.0, 36.0, 43.0, 32.0, 50.0, 47.0, 56.0, 72.0, 52.0, 67.0, 72.0, 62.0, 58.0, 45.0, 43.0, 59.0, 35.0, 26.0, 24.0, 14.0, 15.0, 6.0, 7.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.90771484375, -10.5498046875, -10.19189453125, -9.833984375, -9.47607421875, -9.1181640625, -8.76025390625, -8.40234375, -8.04443359375, -7.6865234375, -7.32861328125, -6.970703125, -6.61279296875, -6.2548828125, -5.89697265625, -5.5390625, -5.18115234375, -4.8232421875, -4.46533203125, -4.107421875, -3.74951171875, -3.3916015625, -3.03369140625, -2.67578125, -2.31787109375, -1.9599609375, -1.60205078125, -1.244140625, -0.88623046875, -0.5283203125, -0.17041015625, 0.1875, 0.54541015625, 0.9033203125, 1.26123046875, 1.619140625, 1.97705078125, 2.3349609375, 2.69287109375, 3.05078125, 3.40869140625, 3.7666015625, 4.12451171875, 4.482421875, 4.84033203125, 5.1982421875, 5.55615234375, 5.9140625, 6.27197265625, 6.6298828125, 6.98779296875, 7.345703125, 7.70361328125, 8.0615234375, 8.41943359375, 8.77734375, 9.13525390625, 9.4931640625, 9.85107421875, 10.208984375, 10.56689453125, 10.9248046875, 11.28271484375, 11.640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 7.0, 7.0, 21.0, 28.0, 47.0, 76.0, 103.0, 234.0, 448.0, 977.0, 2685.0, 10107.0, 56151.0, 1060055.0, 2930452.0, 110042.0, 16673.0, 3885.0, 1254.0, 510.0, 254.0, 95.0, 54.0, 41.0, 28.0, 12.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.46875, -25.5908203125, -24.712890625, -23.8349609375, -22.95703125, -22.0791015625, -21.201171875, -20.3232421875, -19.4453125, -18.5673828125, -17.689453125, -16.8115234375, -15.93359375, -15.0556640625, -14.177734375, -13.2998046875, -12.421875, -11.5439453125, -10.666015625, -9.7880859375, -8.91015625, -8.0322265625, -7.154296875, -6.2763671875, -5.3984375, -4.5205078125, -3.642578125, -2.7646484375, -1.88671875, -1.0087890625, -0.130859375, 0.7470703125, 1.625, 2.5029296875, 3.380859375, 4.2587890625, 5.13671875, 6.0146484375, 6.892578125, 7.7705078125, 8.6484375, 9.5263671875, 10.404296875, 11.2822265625, 12.16015625, 13.0380859375, 13.916015625, 14.7939453125, 15.671875, 16.5498046875, 17.427734375, 18.3056640625, 19.18359375, 20.0615234375, 20.939453125, 21.8173828125, 22.6953125, 23.5732421875, 24.451171875, 25.3291015625, 26.20703125, 27.0849609375, 27.962890625, 28.8408203125, 29.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 17.0, 21.0, 24.0, 46.0, 61.0, 108.0, 190.0, 363.0, 622.0, 875.0, 718.0, 434.0, 204.0, 104.0, 79.0, 68.0, 35.0, 31.0, 20.0, 11.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-36.90625, -36.061767578125, -35.21728515625, -34.372802734375, -33.5283203125, -32.683837890625, -31.83935546875, -30.994873046875, -30.150390625, -29.305908203125, -28.46142578125, -27.616943359375, -26.7724609375, -25.927978515625, -25.08349609375, -24.239013671875, -23.39453125, -22.550048828125, -21.70556640625, -20.861083984375, -20.0166015625, -19.172119140625, -18.32763671875, -17.483154296875, -16.638671875, -15.794189453125, -14.94970703125, -14.105224609375, -13.2607421875, -12.416259765625, -11.57177734375, -10.727294921875, -9.8828125, -9.038330078125, -8.19384765625, -7.349365234375, -6.5048828125, -5.660400390625, -4.81591796875, -3.971435546875, -3.126953125, -2.282470703125, -1.43798828125, -0.593505859375, 0.2509765625, 1.095458984375, 1.93994140625, 2.784423828125, 3.62890625, 4.473388671875, 5.31787109375, 6.162353515625, 7.0068359375, 7.851318359375, 8.69580078125, 9.540283203125, 10.384765625, 11.229248046875, 12.07373046875, 12.918212890625, 13.7626953125, 14.607177734375, 15.45166015625, 16.296142578125, 17.140625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 24.0, 49.0, 87.0, 132.0, 172.0, 192.0, 145.0, 82.0, 49.0, 15.0, 16.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-195.04254150390625, -188.08555603027344, -181.12857055664062, -174.17160034179688, -167.21461486816406, -160.25762939453125, -153.30064392089844, -146.34365844726562, -139.38668823242188, -132.42970275878906, -125.47272491455078, -118.51573944091797, -111.55876159667969, -104.60177612304688, -97.64479064941406, -90.68780517578125, -83.73081970214844, -76.77383422851562, -69.81685638427734, -62.85987091064453, -55.902889251708984, -48.94590759277344, -41.988922119140625, -35.03194046020508, -28.07495880126953, -21.117977142333984, -14.160993576049805, -7.204010009765625, -0.24702835083007812, 6.709953308105469, 13.666938781738281, 20.623920440673828, 27.580886840820312, 34.53786849975586, 41.494850158691406, 48.45183563232422, 55.408817291259766, 62.36579895019531, 69.32278442382812, 76.27976989746094, 83.23674774169922, 90.19373321533203, 97.15071105957031, 104.10769653320312, 111.06468200683594, 118.02165985107422, 124.97864532470703, 131.9356231689453, 138.89260864257812, 145.84959411621094, 152.80657958984375, 159.7635498046875, 166.7205352783203, 173.67752075195312, 180.63450622558594, 187.59149169921875, 194.5484619140625, 201.5054473876953, 208.46243286132812, 215.41940307617188, 222.3763885498047, 229.3333740234375, 236.2903594970703, 243.24734497070312, 250.20433044433594]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 8.0, 9.0, 9.0, 19.0, 22.0, 18.0, 31.0, 30.0, 27.0, 42.0, 47.0, 41.0, 39.0, 52.0, 52.0, 57.0, 47.0, 46.0, 45.0, 50.0, 36.0, 42.0, 45.0, 36.0, 32.0, 18.0, 20.0, 20.0, 16.0, 8.0, 8.0, 2.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.86061096191406, -95.53082275390625, -92.20103454589844, -88.87124633789062, -85.54145812988281, -82.211669921875, -78.88188171386719, -75.55209350585938, -72.22230529785156, -68.89251708984375, -65.56272888183594, -62.232940673828125, -58.90315246582031, -55.5733642578125, -52.24357223510742, -48.91378402709961, -45.58399200439453, -42.25420379638672, -38.924415588378906, -35.594627380371094, -32.26483917236328, -28.935049057006836, -25.60525894165039, -22.275470733642578, -18.945682525634766, -15.615894317626953, -12.286105155944824, -8.956315994262695, -5.626527786254883, -2.2967395782470703, 1.033050537109375, 4.3628387451171875, 7.692634582519531, 11.022422790527344, 14.352211952209473, 17.6820011138916, 21.011789321899414, 24.341577529907227, 27.671367645263672, 31.001155853271484, 34.3309440612793, 37.66073226928711, 40.99052047729492, 44.3203125, 47.65010070800781, 50.979888916015625, 54.30967712402344, 57.63946533203125, 60.96925354003906, 64.29904174804688, 67.62882995605469, 70.9586181640625, 74.28840637207031, 77.61819458007812, 80.94798278808594, 84.27777099609375, 87.60755920410156, 90.93734741210938, 94.26713562011719, 97.596923828125, 100.92671203613281, 104.25650024414062, 107.58628845214844, 110.91607666015625, 114.2458724975586]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 2.0, 12.0, 18.0, 20.0, 32.0, 39.0, 58.0, 81.0, 117.0, 187.0, 251.0, 407.0, 586.0, 914.0, 1349.0, 2199.0, 3779.0, 6185.0, 11124.0, 19682.0, 36638.0, 69382.0, 125813.0, 199962.0, 218867.0, 155312.0, 88962.0, 47591.0, 25280.0, 13679.0, 7812.0, 4574.0, 2735.0, 1718.0, 1086.0, 662.0, 463.0, 290.0, 212.0, 133.0, 97.0, 66.0, 61.0, 31.0, 17.0, 15.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0], "bins": [-9.109375, -8.843017578125, -8.57666015625, -8.310302734375, -8.0439453125, -7.777587890625, -7.51123046875, -7.244873046875, -6.978515625, -6.712158203125, -6.44580078125, -6.179443359375, -5.9130859375, -5.646728515625, -5.38037109375, -5.114013671875, -4.84765625, -4.581298828125, -4.31494140625, -4.048583984375, -3.7822265625, -3.515869140625, -3.24951171875, -2.983154296875, -2.716796875, -2.450439453125, -2.18408203125, -1.917724609375, -1.6513671875, -1.385009765625, -1.11865234375, -0.852294921875, -0.5859375, -0.319580078125, -0.05322265625, 0.213134765625, 0.4794921875, 0.745849609375, 1.01220703125, 1.278564453125, 1.544921875, 1.811279296875, 2.07763671875, 2.343994140625, 2.6103515625, 2.876708984375, 3.14306640625, 3.409423828125, 3.67578125, 3.942138671875, 4.20849609375, 4.474853515625, 4.7412109375, 5.007568359375, 5.27392578125, 5.540283203125, 5.806640625, 6.072998046875, 6.33935546875, 6.605712890625, 6.8720703125, 7.138427734375, 7.40478515625, 7.671142578125, 7.9375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 5.0, 8.0, 13.0, 16.0, 8.0, 22.0, 29.0, 25.0, 40.0, 26.0, 45.0, 39.0, 30.0, 40.0, 43.0, 32.0, 49.0, 58.0, 51.0, 36.0, 40.0, 47.0, 34.0, 22.0, 33.0, 46.0, 23.0, 23.0, 19.0, 17.0, 12.0, 15.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-9.6484375, -9.3707275390625, -9.093017578125, -8.8153076171875, -8.53759765625, -8.2598876953125, -7.982177734375, -7.7044677734375, -7.4267578125, -7.1490478515625, -6.871337890625, -6.5936279296875, -6.31591796875, -6.0382080078125, -5.760498046875, -5.4827880859375, -5.205078125, -4.9273681640625, -4.649658203125, -4.3719482421875, -4.09423828125, -3.8165283203125, -3.538818359375, -3.2611083984375, -2.9833984375, -2.7056884765625, -2.427978515625, -2.1502685546875, -1.87255859375, -1.5948486328125, -1.317138671875, -1.0394287109375, -0.76171875, -0.4840087890625, -0.206298828125, 0.0714111328125, 0.34912109375, 0.6268310546875, 0.904541015625, 1.1822509765625, 1.4599609375, 1.7376708984375, 2.015380859375, 2.2930908203125, 2.57080078125, 2.8485107421875, 3.126220703125, 3.4039306640625, 3.681640625, 3.9593505859375, 4.237060546875, 4.5147705078125, 4.79248046875, 5.0701904296875, 5.347900390625, 5.6256103515625, 5.9033203125, 6.1810302734375, 6.458740234375, 6.7364501953125, 7.01416015625, 7.2918701171875, 7.569580078125, 7.8472900390625, 8.125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 9.0, 16.0, 10.0, 23.0, 64.0, 93.0, 201.0, 529.0, 1769.0, 7521.0, 54523.0, 689451.0, 263447.0, 24765.0, 4292.0, 1101.0, 394.0, 132.0, 84.0, 55.0, 25.0, 15.0, 9.0, 9.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.46875, -38.3017578125, -37.134765625, -35.9677734375, -34.80078125, -33.6337890625, -32.466796875, -31.2998046875, -30.1328125, -28.9658203125, -27.798828125, -26.6318359375, -25.46484375, -24.2978515625, -23.130859375, -21.9638671875, -20.796875, -19.6298828125, -18.462890625, -17.2958984375, -16.12890625, -14.9619140625, -13.794921875, -12.6279296875, -11.4609375, -10.2939453125, -9.126953125, -7.9599609375, -6.79296875, -5.6259765625, -4.458984375, -3.2919921875, -2.125, -0.9580078125, 0.208984375, 1.3759765625, 2.54296875, 3.7099609375, 4.876953125, 6.0439453125, 7.2109375, 8.3779296875, 9.544921875, 10.7119140625, 11.87890625, 13.0458984375, 14.212890625, 15.3798828125, 16.546875, 17.7138671875, 18.880859375, 20.0478515625, 21.21484375, 22.3818359375, 23.548828125, 24.7158203125, 25.8828125, 27.0498046875, 28.216796875, 29.3837890625, 30.55078125, 31.7177734375, 32.884765625, 34.0517578125, 35.21875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 12.0, 12.0, 13.0, 20.0, 32.0, 26.0, 32.0, 50.0, 60.0, 53.0, 75.0, 60.0, 59.0, 69.0, 72.0, 61.0, 63.0, 44.0, 45.0, 30.0, 17.0, 18.0, 13.0, 17.0, 8.0, 11.0, 4.0, 6.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.2333984375, -45.779296875, -44.3251953125, -42.87109375, -41.4169921875, -39.962890625, -38.5087890625, -37.0546875, -35.6005859375, -34.146484375, -32.6923828125, -31.23828125, -29.7841796875, -28.330078125, -26.8759765625, -25.421875, -23.9677734375, -22.513671875, -21.0595703125, -19.60546875, -18.1513671875, -16.697265625, -15.2431640625, -13.7890625, -12.3349609375, -10.880859375, -9.4267578125, -7.97265625, -6.5185546875, -5.064453125, -3.6103515625, -2.15625, -0.7021484375, 0.751953125, 2.2060546875, 3.66015625, 5.1142578125, 6.568359375, 8.0224609375, 9.4765625, 10.9306640625, 12.384765625, 13.8388671875, 15.29296875, 16.7470703125, 18.201171875, 19.6552734375, 21.109375, 22.5634765625, 24.017578125, 25.4716796875, 26.92578125, 28.3798828125, 29.833984375, 31.2880859375, 32.7421875, 34.1962890625, 35.650390625, 37.1044921875, 38.55859375, 40.0126953125, 41.466796875, 42.9208984375, 44.375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 11.0, 3.0, 11.0, 13.0, 16.0, 18.0, 34.0, 64.0, 97.0, 170.0, 290.0, 616.0, 1352.0, 3858.0, 12069.0, 50173.0, 262702.0, 599656.0, 88265.0, 19710.0, 5697.0, 2006.0, 841.0, 366.0, 193.0, 108.0, 73.0, 45.0, 27.0, 17.0, 14.0, 18.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.21502685546875, -6.0277099609375, -5.84039306640625, -5.653076171875, -5.46575927734375, -5.2784423828125, -5.09112548828125, -4.90380859375, -4.71649169921875, -4.5291748046875, -4.34185791015625, -4.154541015625, -3.96722412109375, -3.7799072265625, -3.59259033203125, -3.4052734375, -3.21795654296875, -3.0306396484375, -2.84332275390625, -2.656005859375, -2.46868896484375, -2.2813720703125, -2.09405517578125, -1.90673828125, -1.71942138671875, -1.5321044921875, -1.34478759765625, -1.157470703125, -0.97015380859375, -0.7828369140625, -0.59552001953125, -0.408203125, -0.22088623046875, -0.0335693359375, 0.15374755859375, 0.341064453125, 0.52838134765625, 0.7156982421875, 0.90301513671875, 1.09033203125, 1.27764892578125, 1.4649658203125, 1.65228271484375, 1.839599609375, 2.02691650390625, 2.2142333984375, 2.40155029296875, 2.5888671875, 2.77618408203125, 2.9635009765625, 3.15081787109375, 3.338134765625, 3.52545166015625, 3.7127685546875, 3.90008544921875, 4.08740234375, 4.27471923828125, 4.4620361328125, 4.64935302734375, 4.836669921875, 5.02398681640625, 5.2113037109375, 5.39862060546875, 5.5859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 7.0, 8.0, 20.0, 25.0, 39.0, 67.0, 98.0, 136.0, 149.0, 133.0, 100.0, 66.0, 50.0, 23.0, 15.0, 9.0, 16.0, 6.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013942718505859375, -0.0013399720191955566, -0.0012856721878051758, -0.001231372356414795, -0.001177072525024414, -0.0011227726936340332, -0.0010684728622436523, -0.0010141730308532715, -0.0009598731994628906, -0.0009055733680725098, -0.0008512735366821289, -0.000796973705291748, -0.0007426738739013672, -0.0006883740425109863, -0.0006340742111206055, -0.0005797743797302246, -0.0005254745483398438, -0.0004711747169494629, -0.00041687488555908203, -0.00036257505416870117, -0.0003082752227783203, -0.00025397539138793945, -0.0001996755599975586, -0.00014537572860717773, -9.107589721679688e-05, -3.6776065826416016e-05, 1.7523765563964844e-05, 7.18235969543457e-05, 0.00012612342834472656, 0.00018042325973510742, 0.00023472309112548828, 0.00028902292251586914, 0.00034332275390625, 0.00039762258529663086, 0.0004519224166870117, 0.0005062222480773926, 0.0005605220794677734, 0.0006148219108581543, 0.0006691217422485352, 0.000723421573638916, 0.0007777214050292969, 0.0008320212364196777, 0.0008863210678100586, 0.0009406208992004395, 0.0009949207305908203, 0.0010492205619812012, 0.001103520393371582, 0.0011578202247619629, 0.0012121200561523438, 0.0012664198875427246, 0.0013207197189331055, 0.0013750195503234863, 0.0014293193817138672, 0.001483619213104248, 0.001537919044494629, 0.0015922188758850098, 0.0016465187072753906, 0.0017008185386657715, 0.0017551183700561523, 0.0018094182014465332, 0.001863718032836914, 0.001918017864227295, 0.0019723176956176758, 0.0020266175270080566, 0.0020809173583984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 21.0, 16.0, 21.0, 46.0, 70.0, 110.0, 175.0, 393.0, 608.0, 1264.0, 2667.0, 7161.0, 21799.0, 84201.0, 513893.0, 314695.0, 71189.0, 18890.0, 6233.0, 2456.0, 1188.0, 602.0, 289.0, 192.0, 128.0, 65.0, 39.0, 36.0, 18.0, 12.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.04296875, -5.86492919921875, -5.6868896484375, -5.50885009765625, -5.330810546875, -5.15277099609375, -4.9747314453125, -4.79669189453125, -4.61865234375, -4.44061279296875, -4.2625732421875, -4.08453369140625, -3.906494140625, -3.72845458984375, -3.5504150390625, -3.37237548828125, -3.1943359375, -3.01629638671875, -2.8382568359375, -2.66021728515625, -2.482177734375, -2.30413818359375, -2.1260986328125, -1.94805908203125, -1.77001953125, -1.59197998046875, -1.4139404296875, -1.23590087890625, -1.057861328125, -0.87982177734375, -0.7017822265625, -0.52374267578125, -0.345703125, -0.16766357421875, 0.0103759765625, 0.18841552734375, 0.366455078125, 0.54449462890625, 0.7225341796875, 0.90057373046875, 1.07861328125, 1.25665283203125, 1.4346923828125, 1.61273193359375, 1.790771484375, 1.96881103515625, 2.1468505859375, 2.32489013671875, 2.5029296875, 2.68096923828125, 2.8590087890625, 3.03704833984375, 3.215087890625, 3.39312744140625, 3.5711669921875, 3.74920654296875, 3.92724609375, 4.10528564453125, 4.2833251953125, 4.46136474609375, 4.639404296875, 4.81744384765625, 4.9954833984375, 5.17352294921875, 5.3515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 6.0, 8.0, 9.0, 14.0, 25.0, 13.0, 36.0, 34.0, 49.0, 44.0, 64.0, 73.0, 77.0, 75.0, 83.0, 81.0, 57.0, 58.0, 52.0, 25.0, 24.0, 20.0, 17.0, 13.0, 10.0, 7.0, 4.0, 6.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.7890625, -5.61181640625, -5.4345703125, -5.25732421875, -5.080078125, -4.90283203125, -4.7255859375, -4.54833984375, -4.37109375, -4.19384765625, -4.0166015625, -3.83935546875, -3.662109375, -3.48486328125, -3.3076171875, -3.13037109375, -2.953125, -2.77587890625, -2.5986328125, -2.42138671875, -2.244140625, -2.06689453125, -1.8896484375, -1.71240234375, -1.53515625, -1.35791015625, -1.1806640625, -1.00341796875, -0.826171875, -0.64892578125, -0.4716796875, -0.29443359375, -0.1171875, 0.06005859375, 0.2373046875, 0.41455078125, 0.591796875, 0.76904296875, 0.9462890625, 1.12353515625, 1.30078125, 1.47802734375, 1.6552734375, 1.83251953125, 2.009765625, 2.18701171875, 2.3642578125, 2.54150390625, 2.71875, 2.89599609375, 3.0732421875, 3.25048828125, 3.427734375, 3.60498046875, 3.7822265625, 3.95947265625, 4.13671875, 4.31396484375, 4.4912109375, 4.66845703125, 4.845703125, 5.02294921875, 5.2001953125, 5.37744140625, 5.5546875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 13.0, 18.0, 31.0, 51.0, 105.0, 136.0, 253.0, 182.0, 82.0, 51.0, 20.0, 16.0, 9.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-205.0234375, -199.57162475585938, -194.11981201171875, -188.66799926757812, -183.21620178222656, -177.76438903808594, -172.3125762939453, -166.8607635498047, -161.40896606445312, -155.9571533203125, -150.50534057617188, -145.05352783203125, -139.6017303466797, -134.14991760253906, -128.69810485839844, -123.24629211425781, -117.79447937011719, -112.34266662597656, -106.89086151123047, -101.43904876708984, -95.98724365234375, -90.53543090820312, -85.0836181640625, -79.63180541992188, -74.18000030517578, -68.72818756103516, -63.27638244628906, -57.82456970214844, -52.37276077270508, -46.92095184326172, -41.469139099121094, -36.017330169677734, -30.565521240234375, -25.113712310791016, -19.661901473999023, -14.210090637207031, -8.758281707763672, -3.3064727783203125, 2.1453399658203125, 7.597148895263672, 13.048957824707031, 18.50076675415039, 23.952577590942383, 29.404388427734375, 34.856197357177734, 40.308006286621094, 45.75981903076172, 51.21162796020508, 56.66343688964844, 62.1152458190918, 67.56705474853516, 73.01886749267578, 78.47067260742188, 83.9224853515625, 89.37429809570312, 94.82611083984375, 100.27791595458984, 105.72972869873047, 111.18153381347656, 116.63334655761719, 122.08515930175781, 127.5369644165039, 132.98876953125, 138.44058227539062, 143.89239501953125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 14.0, 5.0, 17.0, 19.0, 17.0, 19.0, 15.0, 36.0, 30.0, 33.0, 28.0, 29.0, 35.0, 45.0, 66.0, 72.0, 84.0, 79.0, 48.0, 46.0, 24.0, 31.0, 31.0, 27.0, 27.0, 15.0, 18.0, 14.0, 10.0, 8.0, 9.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-127.94464874267578, -123.81725311279297, -119.68984985351562, -115.56245422363281, -111.43505096435547, -107.30765533447266, -103.18025207519531, -99.0528564453125, -94.92546081542969, -90.79806518554688, -86.67066192626953, -82.54326629638672, -78.41586303710938, -74.28846740722656, -70.16107177734375, -66.0336685180664, -61.90626525878906, -57.778865814208984, -53.651466369628906, -49.524070739746094, -45.39666748046875, -41.26927185058594, -37.14187240600586, -33.01447296142578, -28.887073516845703, -24.759674072265625, -20.632274627685547, -16.5048770904541, -12.377477645874023, -8.250078201293945, -4.1226806640625, 0.004718780517578125, 4.1321258544921875, 8.259525299072266, 12.386923789978027, 16.51432228088379, 20.641721725463867, 24.769121170043945, 28.89651870727539, 33.02391815185547, 37.15131759643555, 41.278717041015625, 45.4061164855957, 49.53351593017578, 53.660911560058594, 57.78831481933594, 61.91571044921875, 66.04310607910156, 70.1705093383789, 74.29790496826172, 78.42530822753906, 82.55270385742188, 86.68010711669922, 90.80750274658203, 94.93490600585938, 99.06230163574219, 103.189697265625, 107.31709289550781, 111.44449615478516, 115.57189178466797, 119.69929504394531, 123.82669067382812, 127.95408630371094, 132.08148193359375, 136.20889282226562]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 16.0, 23.0, 33.0, 50.0, 75.0, 123.0, 204.0, 381.0, 617.0, 1156.0, 2366.0, 5134.0, 13302.0, 42798.0, 196682.0, 1096309.0, 2129235.0, 557554.0, 104343.0, 26856.0, 9229.0, 3778.0, 1786.0, 939.0, 492.0, 298.0, 189.0, 93.0, 64.0, 34.0, 41.0, 16.0, 12.0, 16.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.97119140625, -8.6845703125, -8.39794921875, -8.111328125, -7.82470703125, -7.5380859375, -7.25146484375, -6.96484375, -6.67822265625, -6.3916015625, -6.10498046875, -5.818359375, -5.53173828125, -5.2451171875, -4.95849609375, -4.671875, -4.38525390625, -4.0986328125, -3.81201171875, -3.525390625, -3.23876953125, -2.9521484375, -2.66552734375, -2.37890625, -2.09228515625, -1.8056640625, -1.51904296875, -1.232421875, -0.94580078125, -0.6591796875, -0.37255859375, -0.0859375, 0.20068359375, 0.4873046875, 0.77392578125, 1.060546875, 1.34716796875, 1.6337890625, 1.92041015625, 2.20703125, 2.49365234375, 2.7802734375, 3.06689453125, 3.353515625, 3.64013671875, 3.9267578125, 4.21337890625, 4.5, 4.78662109375, 5.0732421875, 5.35986328125, 5.646484375, 5.93310546875, 6.2197265625, 6.50634765625, 6.79296875, 7.07958984375, 7.3662109375, 7.65283203125, 7.939453125, 8.22607421875, 8.5126953125, 8.79931640625, 9.0859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 16.0, 10.0, 17.0, 25.0, 22.0, 27.0, 26.0, 33.0, 44.0, 45.0, 48.0, 55.0, 53.0, 59.0, 48.0, 54.0, 49.0, 27.0, 52.0, 47.0, 30.0, 22.0, 31.0, 26.0, 27.0, 20.0, 18.0, 10.0, 2.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3175048828125, -9.025634765625, -8.7337646484375, -8.44189453125, -8.1500244140625, -7.858154296875, -7.5662841796875, -7.2744140625, -6.9825439453125, -6.690673828125, -6.3988037109375, -6.10693359375, -5.8150634765625, -5.523193359375, -5.2313232421875, -4.939453125, -4.6475830078125, -4.355712890625, -4.0638427734375, -3.77197265625, -3.4801025390625, -3.188232421875, -2.8963623046875, -2.6044921875, -2.3126220703125, -2.020751953125, -1.7288818359375, -1.43701171875, -1.1451416015625, -0.853271484375, -0.5614013671875, -0.26953125, 0.0223388671875, 0.314208984375, 0.6060791015625, 0.89794921875, 1.1898193359375, 1.481689453125, 1.7735595703125, 2.0654296875, 2.3572998046875, 2.649169921875, 2.9410400390625, 3.23291015625, 3.5247802734375, 3.816650390625, 4.1085205078125, 4.400390625, 4.6922607421875, 4.984130859375, 5.2760009765625, 5.56787109375, 5.8597412109375, 6.151611328125, 6.4434814453125, 6.7353515625, 7.0272216796875, 7.319091796875, 7.6109619140625, 7.90283203125, 8.1947021484375, 8.486572265625, 8.7784423828125, 9.0703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 15.0, 16.0, 31.0, 37.0, 62.0, 91.0, 209.0, 608.0, 2767.0, 16524.0, 286867.0, 3753722.0, 119788.0, 10569.0, 1974.0, 530.0, 197.0, 80.0, 63.0, 36.0, 22.0, 20.0, 9.0, 9.0, 6.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -36.15185546875, -35.2099609375, -34.26806640625, -33.326171875, -32.38427734375, -31.4423828125, -30.50048828125, -29.55859375, -28.61669921875, -27.6748046875, -26.73291015625, -25.791015625, -24.84912109375, -23.9072265625, -22.96533203125, -22.0234375, -21.08154296875, -20.1396484375, -19.19775390625, -18.255859375, -17.31396484375, -16.3720703125, -15.43017578125, -14.48828125, -13.54638671875, -12.6044921875, -11.66259765625, -10.720703125, -9.77880859375, -8.8369140625, -7.89501953125, -6.953125, -6.01123046875, -5.0693359375, -4.12744140625, -3.185546875, -2.24365234375, -1.3017578125, -0.35986328125, 0.58203125, 1.52392578125, 2.4658203125, 3.40771484375, 4.349609375, 5.29150390625, 6.2333984375, 7.17529296875, 8.1171875, 9.05908203125, 10.0009765625, 10.94287109375, 11.884765625, 12.82666015625, 13.7685546875, 14.71044921875, 15.65234375, 16.59423828125, 17.5361328125, 18.47802734375, 19.419921875, 20.36181640625, 21.3037109375, 22.24560546875, 23.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 14.0, 11.0, 10.0, 20.0, 26.0, 47.0, 46.0, 73.0, 127.0, 224.0, 316.0, 492.0, 656.0, 624.0, 494.0, 289.0, 181.0, 128.0, 65.0, 62.0, 39.0, 28.0, 17.0, 22.0, 13.0, 10.0, 6.0, 10.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4765625, -14.9232177734375, -14.369873046875, -13.8165283203125, -13.26318359375, -12.7098388671875, -12.156494140625, -11.6031494140625, -11.0498046875, -10.4964599609375, -9.943115234375, -9.3897705078125, -8.83642578125, -8.2830810546875, -7.729736328125, -7.1763916015625, -6.623046875, -6.0697021484375, -5.516357421875, -4.9630126953125, -4.40966796875, -3.8563232421875, -3.302978515625, -2.7496337890625, -2.1962890625, -1.6429443359375, -1.089599609375, -0.5362548828125, 0.01708984375, 0.5704345703125, 1.123779296875, 1.6771240234375, 2.23046875, 2.7838134765625, 3.337158203125, 3.8905029296875, 4.44384765625, 4.9971923828125, 5.550537109375, 6.1038818359375, 6.6572265625, 7.2105712890625, 7.763916015625, 8.3172607421875, 8.87060546875, 9.4239501953125, 9.977294921875, 10.5306396484375, 11.083984375, 11.6373291015625, 12.190673828125, 12.7440185546875, 13.29736328125, 13.8507080078125, 14.404052734375, 14.9573974609375, 15.5107421875, 16.0640869140625, 16.617431640625, 17.1707763671875, 17.72412109375, 18.2774658203125, 18.830810546875, 19.3841552734375, 19.9375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 2.0, 14.0, 26.0, 61.0, 107.0, 158.0, 213.0, 186.0, 107.0, 52.0, 38.0, 7.0, 6.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-180.15582275390625, -174.40408325195312, -168.65232849121094, -162.9005889892578, -157.14883422851562, -151.3970947265625, -145.64535522460938, -139.8936004638672, -134.14186096191406, -128.39012145996094, -122.63836669921875, -116.88662719726562, -111.13488006591797, -105.38313293457031, -99.63138580322266, -93.879638671875, -88.12789154052734, -82.37614440917969, -76.62439727783203, -70.87265014648438, -65.12091064453125, -59.369163513183594, -53.61741638183594, -47.86567306518555, -42.11392593383789, -36.362178802490234, -30.610435485839844, -24.858688354492188, -19.106943130493164, -13.35519790649414, -7.603450775146484, -1.8517074584960938, 3.9000396728515625, 9.651784896850586, 15.403531074523926, 21.155277252197266, 26.90702247619629, 32.65876770019531, 38.41051483154297, 44.16225814819336, 49.914005279541016, 55.66575241088867, 61.41749572753906, 67.16924285888672, 72.92098999023438, 78.6727294921875, 84.42448425292969, 90.17622375488281, 95.92797088623047, 101.67971801757812, 107.43146514892578, 113.18321228027344, 118.93495178222656, 124.68669891357422, 130.43844604492188, 136.190185546875, 141.9419403076172, 147.6936798095703, 153.4454345703125, 159.19717407226562, 164.9489288330078, 170.70066833496094, 176.45242309570312, 182.20416259765625, 187.95590209960938]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 7.0, 8.0, 13.0, 11.0, 18.0, 20.0, 23.0, 30.0, 28.0, 32.0, 40.0, 33.0, 43.0, 52.0, 55.0, 45.0, 49.0, 45.0, 56.0, 47.0, 49.0, 44.0, 28.0, 36.0, 21.0, 28.0, 22.0, 16.0, 14.0, 23.0, 7.0, 13.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-84.37347412109375, -82.02715301513672, -79.68082427978516, -77.33450317382812, -74.9881820678711, -72.64185333251953, -70.2955322265625, -67.94920349121094, -65.6028823852539, -63.25655746459961, -60.91023635864258, -58.56391143798828, -56.217586517333984, -53.87126159667969, -51.524940490722656, -49.17861557006836, -46.83229446411133, -44.48596954345703, -42.1396484375, -39.7933235168457, -37.446998596191406, -35.100677490234375, -32.75435256958008, -30.40802764892578, -28.061704635620117, -25.715381622314453, -23.369056701660156, -21.022733688354492, -18.676410675048828, -16.33008575439453, -13.983762741088867, -11.63743782043457, -9.291114807128906, -6.944790840148926, -4.5984673500061035, -2.2521438598632812, 0.09418010711669922, 2.4405040740966797, 4.786827087402344, 7.133152008056641, 9.479475021362305, 11.825798988342285, 14.172122955322266, 16.51844596862793, 18.864768981933594, 21.21109390258789, 23.557416915893555, 25.90374183654785, 28.250064849853516, 30.59638786315918, 32.942710876464844, 35.28903579711914, 37.63536071777344, 39.98168182373047, 42.328006744384766, 44.67433166503906, 47.020652770996094, 49.36697769165039, 51.71329879760742, 54.05962371826172, 56.405948638916016, 58.75227355957031, 61.098594665527344, 63.44491958618164, 65.79124450683594]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 10.0, 6.0, 24.0, 27.0, 26.0, 42.0, 52.0, 61.0, 142.0, 169.0, 281.0, 389.0, 604.0, 995.0, 1552.0, 2475.0, 4153.0, 7235.0, 13018.0, 24064.0, 45385.0, 87082.0, 157752.0, 236027.0, 205549.0, 121508.0, 64117.0, 33438.0, 17921.0, 9960.0, 5619.0, 3390.0, 1958.0, 1209.0, 765.0, 470.0, 339.0, 237.0, 158.0, 93.0, 71.0, 51.0, 37.0, 32.0, 11.0, 8.0, 14.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0, -7.7481689453125, -7.496337890625, -7.2445068359375, -6.99267578125, -6.7408447265625, -6.489013671875, -6.2371826171875, -5.9853515625, -5.7335205078125, -5.481689453125, -5.2298583984375, -4.97802734375, -4.7261962890625, -4.474365234375, -4.2225341796875, -3.970703125, -3.7188720703125, -3.467041015625, -3.2152099609375, -2.96337890625, -2.7115478515625, -2.459716796875, -2.2078857421875, -1.9560546875, -1.7042236328125, -1.452392578125, -1.2005615234375, -0.94873046875, -0.6968994140625, -0.445068359375, -0.1932373046875, 0.05859375, 0.3104248046875, 0.562255859375, 0.8140869140625, 1.06591796875, 1.3177490234375, 1.569580078125, 1.8214111328125, 2.0732421875, 2.3250732421875, 2.576904296875, 2.8287353515625, 3.08056640625, 3.3323974609375, 3.584228515625, 3.8360595703125, 4.087890625, 4.3397216796875, 4.591552734375, 4.8433837890625, 5.09521484375, 5.3470458984375, 5.598876953125, 5.8507080078125, 6.1025390625, 6.3543701171875, 6.606201171875, 6.8580322265625, 7.10986328125, 7.3616943359375, 7.613525390625, 7.8653564453125, 8.1171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 6.0, 6.0, 6.0, 9.0, 16.0, 17.0, 27.0, 29.0, 23.0, 41.0, 35.0, 41.0, 44.0, 37.0, 43.0, 51.0, 50.0, 55.0, 45.0, 45.0, 45.0, 36.0, 41.0, 32.0, 35.0, 34.0, 29.0, 17.0, 17.0, 17.0, 9.0, 4.0, 13.0, 8.0, 4.0, 1.0, 6.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5352783203125, -8.250244140625, -7.9652099609375, -7.68017578125, -7.3951416015625, -7.110107421875, -6.8250732421875, -6.5400390625, -6.2550048828125, -5.969970703125, -5.6849365234375, -5.39990234375, -5.1148681640625, -4.829833984375, -4.5447998046875, -4.259765625, -3.9747314453125, -3.689697265625, -3.4046630859375, -3.11962890625, -2.8345947265625, -2.549560546875, -2.2645263671875, -1.9794921875, -1.6944580078125, -1.409423828125, -1.1243896484375, -0.83935546875, -0.5543212890625, -0.269287109375, 0.0157470703125, 0.30078125, 0.5858154296875, 0.870849609375, 1.1558837890625, 1.44091796875, 1.7259521484375, 2.010986328125, 2.2960205078125, 2.5810546875, 2.8660888671875, 3.151123046875, 3.4361572265625, 3.72119140625, 4.0062255859375, 4.291259765625, 4.5762939453125, 4.861328125, 5.1463623046875, 5.431396484375, 5.7164306640625, 6.00146484375, 6.2864990234375, 6.571533203125, 6.8565673828125, 7.1416015625, 7.4266357421875, 7.711669921875, 7.9967041015625, 8.28173828125, 8.5667724609375, 8.851806640625, 9.1368408203125, 9.421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 11.0, 12.0, 13.0, 16.0, 22.0, 55.0, 51.0, 81.0, 119.0, 147.0, 210.0, 313.0, 521.0, 893.0, 1632.0, 3562.0, 9034.0, 28702.0, 111642.0, 595057.0, 218812.0, 52194.0, 14914.0, 5286.0, 2253.0, 1131.0, 625.0, 411.0, 245.0, 155.0, 120.0, 80.0, 69.0, 35.0, 27.0, 20.0, 16.0, 10.0, 14.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-19.5, -18.921875, -18.34375, -17.765625, -17.1875, -16.609375, -16.03125, -15.453125, -14.875, -14.296875, -13.71875, -13.140625, -12.5625, -11.984375, -11.40625, -10.828125, -10.25, -9.671875, -9.09375, -8.515625, -7.9375, -7.359375, -6.78125, -6.203125, -5.625, -5.046875, -4.46875, -3.890625, -3.3125, -2.734375, -2.15625, -1.578125, -1.0, -0.421875, 0.15625, 0.734375, 1.3125, 1.890625, 2.46875, 3.046875, 3.625, 4.203125, 4.78125, 5.359375, 5.9375, 6.515625, 7.09375, 7.671875, 8.25, 8.828125, 9.40625, 9.984375, 10.5625, 11.140625, 11.71875, 12.296875, 12.875, 13.453125, 14.03125, 14.609375, 15.1875, 15.765625, 16.34375, 16.921875, 17.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 6.0, 8.0, 14.0, 11.0, 9.0, 16.0, 15.0, 22.0, 31.0, 37.0, 35.0, 41.0, 65.0, 65.0, 66.0, 76.0, 64.0, 53.0, 50.0, 54.0, 52.0, 44.0, 35.0, 21.0, 26.0, 15.0, 20.0, 9.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.03125, -41.7705078125, -40.509765625, -39.2490234375, -37.98828125, -36.7275390625, -35.466796875, -34.2060546875, -32.9453125, -31.6845703125, -30.423828125, -29.1630859375, -27.90234375, -26.6416015625, -25.380859375, -24.1201171875, -22.859375, -21.5986328125, -20.337890625, -19.0771484375, -17.81640625, -16.5556640625, -15.294921875, -14.0341796875, -12.7734375, -11.5126953125, -10.251953125, -8.9912109375, -7.73046875, -6.4697265625, -5.208984375, -3.9482421875, -2.6875, -1.4267578125, -0.166015625, 1.0947265625, 2.35546875, 3.6162109375, 4.876953125, 6.1376953125, 7.3984375, 8.6591796875, 9.919921875, 11.1806640625, 12.44140625, 13.7021484375, 14.962890625, 16.2236328125, 17.484375, 18.7451171875, 20.005859375, 21.2666015625, 22.52734375, 23.7880859375, 25.048828125, 26.3095703125, 27.5703125, 28.8310546875, 30.091796875, 31.3525390625, 32.61328125, 33.8740234375, 35.134765625, 36.3955078125, 37.65625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 11.0, 17.0, 13.0, 26.0, 27.0, 35.0, 53.0, 84.0, 120.0, 191.0, 312.0, 474.0, 872.0, 1671.0, 3576.0, 8041.0, 21809.0, 71017.0, 533259.0, 307647.0, 64307.0, 20316.0, 7552.0, 3296.0, 1604.0, 870.0, 478.0, 275.0, 174.0, 126.0, 89.0, 66.0, 23.0, 32.0, 19.0, 8.0, 10.0, 10.0, 6.0, 4.0, 1.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.706024169921875, -3.57806396484375, -3.450103759765625, -3.3221435546875, -3.194183349609375, -3.06622314453125, -2.938262939453125, -2.810302734375, -2.682342529296875, -2.55438232421875, -2.426422119140625, -2.2984619140625, -2.170501708984375, -2.04254150390625, -1.914581298828125, -1.78662109375, -1.658660888671875, -1.53070068359375, -1.402740478515625, -1.2747802734375, -1.146820068359375, -1.01885986328125, -0.890899658203125, -0.762939453125, -0.634979248046875, -0.50701904296875, -0.379058837890625, -0.2510986328125, -0.123138427734375, 0.00482177734375, 0.132781982421875, 0.2607421875, 0.388702392578125, 0.51666259765625, 0.644622802734375, 0.7725830078125, 0.900543212890625, 1.02850341796875, 1.156463623046875, 1.284423828125, 1.412384033203125, 1.54034423828125, 1.668304443359375, 1.7962646484375, 1.924224853515625, 2.05218505859375, 2.180145263671875, 2.30810546875, 2.436065673828125, 2.56402587890625, 2.691986083984375, 2.8199462890625, 2.947906494140625, 3.07586669921875, 3.203826904296875, 3.331787109375, 3.459747314453125, 3.58770751953125, 3.715667724609375, 3.8436279296875, 3.971588134765625, 4.09954833984375, 4.227508544921875, 4.35546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 9.0, 16.0, 23.0, 28.0, 29.0, 50.0, 59.0, 92.0, 150.0, 160.0, 114.0, 60.0, 57.0, 45.0, 23.0, 16.0, 8.0, 13.0, 8.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013828277587890625, -0.0013410300016403198, -0.0012992322444915771, -0.0012574344873428345, -0.0012156367301940918, -0.0011738389730453491, -0.0011320412158966064, -0.0010902434587478638, -0.001048445701599121, -0.0010066479444503784, -0.0009648501873016357, -0.0009230524301528931, -0.0008812546730041504, -0.0008394569158554077, -0.000797659158706665, -0.0007558614015579224, -0.0007140636444091797, -0.000672265887260437, -0.0006304681301116943, -0.0005886703729629517, -0.000546872615814209, -0.0005050748586654663, -0.00046327710151672363, -0.00042147934436798096, -0.0003796815872192383, -0.0003378838300704956, -0.00029608607292175293, -0.00025428831577301025, -0.00021249055862426758, -0.0001706928014755249, -0.00012889504432678223, -8.709728717803955e-05, -4.5299530029296875e-05, -3.5017728805541992e-06, 3.8295984268188477e-05, 8.009374141693115e-05, 0.00012189149856567383, 0.0001636892557144165, 0.00020548701286315918, 0.00024728477001190186, 0.00028908252716064453, 0.0003308802843093872, 0.0003726780414581299, 0.00041447579860687256, 0.00045627355575561523, 0.0004980713129043579, 0.0005398690700531006, 0.0005816668272018433, 0.0006234645843505859, 0.0006652623414993286, 0.0007070600986480713, 0.000748857855796814, 0.0007906556129455566, 0.0008324533700942993, 0.000874251127243042, 0.0009160488843917847, 0.0009578466415405273, 0.00099964439868927, 0.0010414421558380127, 0.0010832399129867554, 0.001125037670135498, 0.0011668354272842407, 0.0012086331844329834, 0.001250430941581726, 0.0012922286987304688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 9.0, 9.0, 18.0, 24.0, 35.0, 45.0, 85.0, 115.0, 175.0, 308.0, 577.0, 1063.0, 2345.0, 5857.0, 19205.0, 81502.0, 669564.0, 211296.0, 38646.0, 10418.0, 3786.0, 1589.0, 770.0, 420.0, 265.0, 133.0, 84.0, 47.0, 53.0, 36.0, 18.0, 16.0, 10.0, 4.0, 10.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2432861328125, -4.064697265625, -3.8861083984375, -3.70751953125, -3.5289306640625, -3.350341796875, -3.1717529296875, -2.9931640625, -2.8145751953125, -2.635986328125, -2.4573974609375, -2.27880859375, -2.1002197265625, -1.921630859375, -1.7430419921875, -1.564453125, -1.3858642578125, -1.207275390625, -1.0286865234375, -0.85009765625, -0.6715087890625, -0.492919921875, -0.3143310546875, -0.1357421875, 0.0428466796875, 0.221435546875, 0.4000244140625, 0.57861328125, 0.7572021484375, 0.935791015625, 1.1143798828125, 1.29296875, 1.4715576171875, 1.650146484375, 1.8287353515625, 2.00732421875, 2.1859130859375, 2.364501953125, 2.5430908203125, 2.7216796875, 2.9002685546875, 3.078857421875, 3.2574462890625, 3.43603515625, 3.6146240234375, 3.793212890625, 3.9718017578125, 4.150390625, 4.3289794921875, 4.507568359375, 4.6861572265625, 4.86474609375, 5.0433349609375, 5.221923828125, 5.4005126953125, 5.5791015625, 5.7576904296875, 5.936279296875, 6.1148681640625, 6.29345703125, 6.4720458984375, 6.650634765625, 6.8292236328125, 7.0078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 25.0, 20.0, 48.0, 58.0, 84.0, 118.0, 136.0, 135.0, 91.0, 84.0, 46.0, 32.0, 24.0, 18.0, 17.0, 10.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.828125, -9.56207275390625, -9.2960205078125, -9.02996826171875, -8.763916015625, -8.49786376953125, -8.2318115234375, -7.96575927734375, -7.69970703125, -7.43365478515625, -7.1676025390625, -6.90155029296875, -6.635498046875, -6.36944580078125, -6.1033935546875, -5.83734130859375, -5.5712890625, -5.30523681640625, -5.0391845703125, -4.77313232421875, -4.507080078125, -4.24102783203125, -3.9749755859375, -3.70892333984375, -3.44287109375, -3.17681884765625, -2.9107666015625, -2.64471435546875, -2.378662109375, -2.11260986328125, -1.8465576171875, -1.58050537109375, -1.314453125, -1.04840087890625, -0.7823486328125, -0.51629638671875, -0.250244140625, 0.01580810546875, 0.2818603515625, 0.54791259765625, 0.81396484375, 1.08001708984375, 1.3460693359375, 1.61212158203125, 1.878173828125, 2.14422607421875, 2.4102783203125, 2.67633056640625, 2.9423828125, 3.20843505859375, 3.4744873046875, 3.74053955078125, 4.006591796875, 4.27264404296875, 4.5386962890625, 4.80474853515625, 5.07080078125, 5.33685302734375, 5.6029052734375, 5.86895751953125, 6.135009765625, 6.40106201171875, 6.6671142578125, 6.93316650390625, 7.19921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 16.0, 21.0, 48.0, 66.0, 109.0, 203.0, 229.0, 86.0, 75.0, 48.0, 36.0, 12.0, 4.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.24506378173828, -116.77388000488281, -112.30268859863281, -107.83150482177734, -103.36032104492188, -98.8891372680664, -94.41795349121094, -89.94676208496094, -85.47557830810547, -81.00439453125, -76.533203125, -72.06201934814453, -67.59083557128906, -63.119651794433594, -58.64846420288086, -54.177276611328125, -49.706092834472656, -45.23490905761719, -40.76372146606445, -36.29253387451172, -31.82135009765625, -27.35016441345215, -22.878978729248047, -18.407793045043945, -13.936607360839844, -9.465421676635742, -4.994235992431641, -0.5230503082275391, 3.9481353759765625, 8.419321060180664, 12.890506744384766, 17.361692428588867, 21.8328857421875, 26.3040714263916, 30.775257110595703, 35.24644470214844, 39.717628479003906, 44.188812255859375, 48.65999984741211, 53.131187438964844, 57.60237121582031, 62.07355499267578, 66.54473876953125, 71.01593017578125, 75.48711395263672, 79.95829772949219, 84.42948913574219, 88.90067291259766, 93.37185668945312, 97.8430404663086, 102.31422424316406, 106.78541564941406, 111.25659942626953, 115.727783203125, 120.198974609375, 124.67015838623047, 129.14134216308594, 133.61253356933594, 138.08370971679688, 142.55490112304688, 147.02609252929688, 151.4972686767578, 155.9684600830078, 160.43963623046875, 164.91082763671875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 2.0, 7.0, 7.0, 8.0, 13.0, 15.0, 11.0, 23.0, 18.0, 17.0, 24.0, 24.0, 25.0, 35.0, 43.0, 46.0, 78.0, 100.0, 101.0, 56.0, 41.0, 33.0, 34.0, 32.0, 26.0, 31.0, 28.0, 22.0, 13.0, 11.0, 14.0, 8.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-138.1339874267578, -134.18905639648438, -130.244140625, -126.29920959472656, -122.35428619384766, -118.40935516357422, -114.46443176269531, -110.51950073242188, -106.57457733154297, -102.62965393066406, -98.68472290039062, -94.73979949951172, -90.79487609863281, -86.84994506835938, -82.90502166748047, -78.96009826660156, -75.01516723632812, -71.07024383544922, -67.12531280517578, -63.180389404296875, -59.2354621887207, -55.29053497314453, -51.345611572265625, -47.40068435668945, -43.45576477050781, -39.51083755493164, -35.565914154052734, -31.620986938476562, -27.67605972290039, -23.73113441467285, -19.786209106445312, -15.84128189086914, -11.896354675292969, -7.951428413391113, -4.006502628326416, -0.06157684326171875, 3.8833494186401367, 7.828275680541992, 11.773200988769531, 15.718128204345703, 19.663053512573242, 23.60797882080078, 27.552906036376953, 31.497831344604492, 35.44275665283203, 39.3876838684082, 43.332611083984375, 47.27753448486328, 51.22246170043945, 55.167388916015625, 59.11231231689453, 63.0572395324707, 67.00216674804688, 70.94709014892578, 74.89201354980469, 78.83694458007812, 82.78186798095703, 86.72679138183594, 90.67172241210938, 94.61664581298828, 98.56156921386719, 102.50650024414062, 106.45142364501953, 110.39634704589844, 114.34127807617188]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 12.0, 11.0, 10.0, 17.0, 23.0, 39.0, 66.0, 65.0, 116.0, 168.0, 248.0, 424.0, 759.0, 1388.0, 2719.0, 5688.0, 13087.0, 34265.0, 108575.0, 414201.0, 1455456.0, 1524402.0, 448673.0, 120043.0, 37879.0, 13800.0, 5844.0, 2829.0, 1485.0, 769.0, 401.0, 287.0, 170.0, 111.0, 76.0, 47.0, 33.0, 27.0, 17.0, 16.0, 11.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.94140625, -7.68548583984375, -7.4295654296875, -7.17364501953125, -6.917724609375, -6.66180419921875, -6.4058837890625, -6.14996337890625, -5.89404296875, -5.63812255859375, -5.3822021484375, -5.12628173828125, -4.870361328125, -4.61444091796875, -4.3585205078125, -4.10260009765625, -3.8466796875, -3.59075927734375, -3.3348388671875, -3.07891845703125, -2.822998046875, -2.56707763671875, -2.3111572265625, -2.05523681640625, -1.79931640625, -1.54339599609375, -1.2874755859375, -1.03155517578125, -0.775634765625, -0.51971435546875, -0.2637939453125, -0.00787353515625, 0.248046875, 0.50396728515625, 0.7598876953125, 1.01580810546875, 1.271728515625, 1.52764892578125, 1.7835693359375, 2.03948974609375, 2.29541015625, 2.55133056640625, 2.8072509765625, 3.06317138671875, 3.319091796875, 3.57501220703125, 3.8309326171875, 4.08685302734375, 4.3427734375, 4.59869384765625, 4.8546142578125, 5.11053466796875, 5.366455078125, 5.62237548828125, 5.8782958984375, 6.13421630859375, 6.39013671875, 6.64605712890625, 6.9019775390625, 7.15789794921875, 7.413818359375, 7.66973876953125, 7.9256591796875, 8.18157958984375, 8.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 10.0, 1.0, 4.0, 4.0, 6.0, 15.0, 11.0, 25.0, 22.0, 22.0, 30.0, 38.0, 42.0, 42.0, 49.0, 49.0, 53.0, 47.0, 57.0, 58.0, 36.0, 47.0, 40.0, 49.0, 42.0, 36.0, 29.0, 33.0, 21.0, 20.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.828125, -8.527587890625, -8.22705078125, -7.926513671875, -7.6259765625, -7.325439453125, -7.02490234375, -6.724365234375, -6.423828125, -6.123291015625, -5.82275390625, -5.522216796875, -5.2216796875, -4.921142578125, -4.62060546875, -4.320068359375, -4.01953125, -3.718994140625, -3.41845703125, -3.117919921875, -2.8173828125, -2.516845703125, -2.21630859375, -1.915771484375, -1.615234375, -1.314697265625, -1.01416015625, -0.713623046875, -0.4130859375, -0.112548828125, 0.18798828125, 0.488525390625, 0.7890625, 1.089599609375, 1.39013671875, 1.690673828125, 1.9912109375, 2.291748046875, 2.59228515625, 2.892822265625, 3.193359375, 3.493896484375, 3.79443359375, 4.094970703125, 4.3955078125, 4.696044921875, 4.99658203125, 5.297119140625, 5.59765625, 5.898193359375, 6.19873046875, 6.499267578125, 6.7998046875, 7.100341796875, 7.40087890625, 7.701416015625, 8.001953125, 8.302490234375, 8.60302734375, 8.903564453125, 9.2041015625, 9.504638671875, 9.80517578125, 10.105712890625, 10.40625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 11.0, 15.0, 23.0, 31.0, 58.0, 85.0, 158.0, 348.0, 952.0, 3981.0, 33527.0, 1595886.0, 2509063.0, 43742.0, 4621.0, 1010.0, 375.0, 159.0, 77.0, 48.0, 27.0, 24.0, 15.0, 8.0, 8.0, 11.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.3125, -27.400634765625, -26.48876953125, -25.576904296875, -24.6650390625, -23.753173828125, -22.84130859375, -21.929443359375, -21.017578125, -20.105712890625, -19.19384765625, -18.281982421875, -17.3701171875, -16.458251953125, -15.54638671875, -14.634521484375, -13.72265625, -12.810791015625, -11.89892578125, -10.987060546875, -10.0751953125, -9.163330078125, -8.25146484375, -7.339599609375, -6.427734375, -5.515869140625, -4.60400390625, -3.692138671875, -2.7802734375, -1.868408203125, -0.95654296875, -0.044677734375, 0.8671875, 1.779052734375, 2.69091796875, 3.602783203125, 4.5146484375, 5.426513671875, 6.33837890625, 7.250244140625, 8.162109375, 9.073974609375, 9.98583984375, 10.897705078125, 11.8095703125, 12.721435546875, 13.63330078125, 14.545166015625, 15.45703125, 16.368896484375, 17.28076171875, 18.192626953125, 19.1044921875, 20.016357421875, 20.92822265625, 21.840087890625, 22.751953125, 23.663818359375, 24.57568359375, 25.487548828125, 26.3994140625, 27.311279296875, 28.22314453125, 29.135009765625, 30.046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 9.0, 4.0, 7.0, 19.0, 30.0, 35.0, 39.0, 55.0, 100.0, 153.0, 229.0, 373.0, 542.0, 684.0, 609.0, 395.0, 257.0, 152.0, 112.0, 70.0, 62.0, 39.0, 24.0, 17.0, 15.0, 12.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.91943359375, -18.3232421875, -17.72705078125, -17.130859375, -16.53466796875, -15.9384765625, -15.34228515625, -14.74609375, -14.14990234375, -13.5537109375, -12.95751953125, -12.361328125, -11.76513671875, -11.1689453125, -10.57275390625, -9.9765625, -9.38037109375, -8.7841796875, -8.18798828125, -7.591796875, -6.99560546875, -6.3994140625, -5.80322265625, -5.20703125, -4.61083984375, -4.0146484375, -3.41845703125, -2.822265625, -2.22607421875, -1.6298828125, -1.03369140625, -0.4375, 0.15869140625, 0.7548828125, 1.35107421875, 1.947265625, 2.54345703125, 3.1396484375, 3.73583984375, 4.33203125, 4.92822265625, 5.5244140625, 6.12060546875, 6.716796875, 7.31298828125, 7.9091796875, 8.50537109375, 9.1015625, 9.69775390625, 10.2939453125, 10.89013671875, 11.486328125, 12.08251953125, 12.6787109375, 13.27490234375, 13.87109375, 14.46728515625, 15.0634765625, 15.65966796875, 16.255859375, 16.85205078125, 17.4482421875, 18.04443359375, 18.640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 29.0, 38.0, 61.0, 92.0, 147.0, 161.0, 160.0, 131.0, 59.0, 44.0, 22.0, 14.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.23345947265625, -152.586669921875, -147.93988037109375, -143.29307556152344, -138.6462860107422, -133.99949645996094, -129.3527069091797, -124.7059097290039, -120.05911254882812, -115.41232299804688, -110.7655258178711, -106.11873626708984, -101.47193908691406, -96.82514953613281, -92.17835998535156, -87.53156280517578, -82.88477325439453, -78.23798370361328, -73.5911865234375, -68.94439697265625, -64.29759979248047, -59.65081024169922, -55.0040168762207, -50.35722351074219, -45.71043014526367, -41.063636779785156, -36.41684341430664, -31.770051956176758, -27.123258590698242, -22.476465225219727, -17.829673767089844, -13.182880401611328, -8.536087036132812, -3.889294147491455, 0.7574987411499023, 5.404291152954102, 10.051084518432617, 14.697877883911133, 19.344669342041016, 23.99146270751953, 28.638256072998047, 33.28504943847656, 37.93184280395508, 42.578636169433594, 47.225425720214844, 51.872222900390625, 56.519012451171875, 61.16580581665039, 65.8125991821289, 70.45938873291016, 75.10618591308594, 79.75297546386719, 84.39977264404297, 89.04656219482422, 93.693359375, 98.34014892578125, 102.9869384765625, 107.63372802734375, 112.28052520751953, 116.92731475830078, 121.57411193847656, 126.22090148925781, 130.86769104003906, 135.51449584960938, 140.16128540039062]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 13.0, 19.0, 14.0, 22.0, 20.0, 14.0, 26.0, 23.0, 39.0, 30.0, 35.0, 41.0, 38.0, 32.0, 38.0, 41.0, 51.0, 52.0, 37.0, 30.0, 43.0, 44.0, 42.0, 28.0, 29.0, 34.0, 21.0, 22.0, 21.0, 12.0, 14.0, 15.0, 7.0, 4.0, 7.0, 5.0, 4.0, 0.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.135498046875, -78.60028076171875, -76.0650634765625, -73.52985382080078, -70.99463653564453, -68.45941925048828, -65.92420196533203, -63.38898468017578, -60.8537712097168, -58.31855392456055, -55.78334045410156, -53.24812316894531, -50.71290588378906, -48.17769241333008, -45.64247512817383, -43.107261657714844, -40.572044372558594, -38.036827087402344, -35.50161361694336, -32.96639633178711, -30.431180953979492, -27.895965576171875, -25.360748291015625, -22.825532913208008, -20.29031753540039, -17.755102157592773, -15.21988582611084, -12.684669494628906, -10.149454116821289, -7.614238739013672, -5.079022407531738, -2.5438060760498047, -0.0085906982421875, 2.526625156402588, 5.061841011047363, 7.597056865692139, 10.132272720336914, 12.667488098144531, 15.202704429626465, 17.7379207611084, 20.273136138916016, 22.808351516723633, 25.34356689453125, 27.8787841796875, 30.413999557495117, 32.949214935302734, 35.484432220458984, 38.01964569091797, 40.55486297607422, 43.09008026123047, 45.62529373168945, 48.1605110168457, 50.69572448730469, 53.23094177246094, 55.76615905761719, 58.30137634277344, 60.83658981323242, 63.37180709838867, 65.90702056884766, 68.4422378540039, 70.97745513916016, 73.51266479492188, 76.04788208007812, 78.58309936523438, 81.11831665039062]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 7.0, 10.0, 17.0, 36.0, 43.0, 87.0, 149.0, 229.0, 414.0, 723.0, 1365.0, 2702.0, 5568.0, 11989.0, 28238.0, 70062.0, 181946.0, 358186.0, 231795.0, 90294.0, 35999.0, 14966.0, 6899.0, 3149.0, 1669.0, 899.0, 476.0, 266.0, 129.0, 76.0, 58.0, 36.0, 25.0, 17.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.22216796875, -13.8115234375, -13.40087890625, -12.990234375, -12.57958984375, -12.1689453125, -11.75830078125, -11.34765625, -10.93701171875, -10.5263671875, -10.11572265625, -9.705078125, -9.29443359375, -8.8837890625, -8.47314453125, -8.0625, -7.65185546875, -7.2412109375, -6.83056640625, -6.419921875, -6.00927734375, -5.5986328125, -5.18798828125, -4.77734375, -4.36669921875, -3.9560546875, -3.54541015625, -3.134765625, -2.72412109375, -2.3134765625, -1.90283203125, -1.4921875, -1.08154296875, -0.6708984375, -0.26025390625, 0.150390625, 0.56103515625, 0.9716796875, 1.38232421875, 1.79296875, 2.20361328125, 2.6142578125, 3.02490234375, 3.435546875, 3.84619140625, 4.2568359375, 4.66748046875, 5.078125, 5.48876953125, 5.8994140625, 6.31005859375, 6.720703125, 7.13134765625, 7.5419921875, 7.95263671875, 8.36328125, 8.77392578125, 9.1845703125, 9.59521484375, 10.005859375, 10.41650390625, 10.8271484375, 11.23779296875, 11.6484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 10.0, 11.0, 19.0, 22.0, 15.0, 29.0, 26.0, 25.0, 39.0, 34.0, 40.0, 42.0, 55.0, 59.0, 57.0, 40.0, 48.0, 52.0, 50.0, 41.0, 49.0, 42.0, 27.0, 23.0, 30.0, 18.0, 13.0, 17.0, 12.0, 11.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.361572265625, -8.05126953125, -7.740966796875, -7.4306640625, -7.120361328125, -6.81005859375, -6.499755859375, -6.189453125, -5.879150390625, -5.56884765625, -5.258544921875, -4.9482421875, -4.637939453125, -4.32763671875, -4.017333984375, -3.70703125, -3.396728515625, -3.08642578125, -2.776123046875, -2.4658203125, -2.155517578125, -1.84521484375, -1.534912109375, -1.224609375, -0.914306640625, -0.60400390625, -0.293701171875, 0.0166015625, 0.326904296875, 0.63720703125, 0.947509765625, 1.2578125, 1.568115234375, 1.87841796875, 2.188720703125, 2.4990234375, 2.809326171875, 3.11962890625, 3.429931640625, 3.740234375, 4.050537109375, 4.36083984375, 4.671142578125, 4.9814453125, 5.291748046875, 5.60205078125, 5.912353515625, 6.22265625, 6.532958984375, 6.84326171875, 7.153564453125, 7.4638671875, 7.774169921875, 8.08447265625, 8.394775390625, 8.705078125, 9.015380859375, 9.32568359375, 9.635986328125, 9.9462890625, 10.256591796875, 10.56689453125, 10.877197265625, 11.1875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 12.0, 23.0, 31.0, 32.0, 56.0, 58.0, 87.0, 142.0, 191.0, 254.0, 354.0, 641.0, 924.0, 1666.0, 3669.0, 10293.0, 40822.0, 246439.0, 653307.0, 64671.0, 14654.0, 4858.0, 2047.0, 1182.0, 689.0, 428.0, 262.0, 218.0, 140.0, 100.0, 80.0, 58.0, 36.0, 34.0, 29.0, 11.0, 10.0, 11.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -22.163330078125, -21.45166015625, -20.739990234375, -20.0283203125, -19.316650390625, -18.60498046875, -17.893310546875, -17.181640625, -16.469970703125, -15.75830078125, -15.046630859375, -14.3349609375, -13.623291015625, -12.91162109375, -12.199951171875, -11.48828125, -10.776611328125, -10.06494140625, -9.353271484375, -8.6416015625, -7.929931640625, -7.21826171875, -6.506591796875, -5.794921875, -5.083251953125, -4.37158203125, -3.659912109375, -2.9482421875, -2.236572265625, -1.52490234375, -0.813232421875, -0.1015625, 0.610107421875, 1.32177734375, 2.033447265625, 2.7451171875, 3.456787109375, 4.16845703125, 4.880126953125, 5.591796875, 6.303466796875, 7.01513671875, 7.726806640625, 8.4384765625, 9.150146484375, 9.86181640625, 10.573486328125, 11.28515625, 11.996826171875, 12.70849609375, 13.420166015625, 14.1318359375, 14.843505859375, 15.55517578125, 16.266845703125, 16.978515625, 17.690185546875, 18.40185546875, 19.113525390625, 19.8251953125, 20.536865234375, 21.24853515625, 21.960205078125, 22.671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 3.0, 9.0, 15.0, 10.0, 17.0, 20.0, 23.0, 19.0, 28.0, 29.0, 46.0, 40.0, 55.0, 58.0, 68.0, 68.0, 48.0, 55.0, 54.0, 59.0, 45.0, 39.0, 37.0, 20.0, 28.0, 23.0, 12.0, 14.0, 11.0, 2.0, 10.0, 13.0, 3.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.1875, -37.0224609375, -35.857421875, -34.6923828125, -33.52734375, -32.3623046875, -31.197265625, -30.0322265625, -28.8671875, -27.7021484375, -26.537109375, -25.3720703125, -24.20703125, -23.0419921875, -21.876953125, -20.7119140625, -19.546875, -18.3818359375, -17.216796875, -16.0517578125, -14.88671875, -13.7216796875, -12.556640625, -11.3916015625, -10.2265625, -9.0615234375, -7.896484375, -6.7314453125, -5.56640625, -4.4013671875, -3.236328125, -2.0712890625, -0.90625, 0.2587890625, 1.423828125, 2.5888671875, 3.75390625, 4.9189453125, 6.083984375, 7.2490234375, 8.4140625, 9.5791015625, 10.744140625, 11.9091796875, 13.07421875, 14.2392578125, 15.404296875, 16.5693359375, 17.734375, 18.8994140625, 20.064453125, 21.2294921875, 22.39453125, 23.5595703125, 24.724609375, 25.8896484375, 27.0546875, 28.2197265625, 29.384765625, 30.5498046875, 31.71484375, 32.8798828125, 34.044921875, 35.2099609375, 36.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 14.0, 16.0, 25.0, 21.0, 26.0, 43.0, 63.0, 111.0, 151.0, 233.0, 477.0, 956.0, 2433.0, 7993.0, 37578.0, 711626.0, 251592.0, 25201.0, 6104.0, 1979.0, 837.0, 396.0, 224.0, 127.0, 87.0, 65.0, 20.0, 32.0, 23.0, 21.0, 19.0, 10.0, 7.0, 12.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0546875, -4.89105224609375, -4.7274169921875, -4.56378173828125, -4.400146484375, -4.23651123046875, -4.0728759765625, -3.90924072265625, -3.74560546875, -3.58197021484375, -3.4183349609375, -3.25469970703125, -3.091064453125, -2.92742919921875, -2.7637939453125, -2.60015869140625, -2.4365234375, -2.27288818359375, -2.1092529296875, -1.94561767578125, -1.781982421875, -1.61834716796875, -1.4547119140625, -1.29107666015625, -1.12744140625, -0.96380615234375, -0.8001708984375, -0.63653564453125, -0.472900390625, -0.30926513671875, -0.1456298828125, 0.01800537109375, 0.181640625, 0.34527587890625, 0.5089111328125, 0.67254638671875, 0.836181640625, 0.99981689453125, 1.1634521484375, 1.32708740234375, 1.49072265625, 1.65435791015625, 1.8179931640625, 1.98162841796875, 2.145263671875, 2.30889892578125, 2.4725341796875, 2.63616943359375, 2.7998046875, 2.96343994140625, 3.1270751953125, 3.29071044921875, 3.454345703125, 3.61798095703125, 3.7816162109375, 3.94525146484375, 4.10888671875, 4.27252197265625, 4.4361572265625, 4.59979248046875, 4.763427734375, 4.92706298828125, 5.0906982421875, 5.25433349609375, 5.41796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 7.0, 13.0, 15.0, 21.0, 34.0, 58.0, 81.0, 116.0, 170.0, 143.0, 104.0, 70.0, 31.0, 23.0, 11.0, 7.0, 11.0, 8.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012054443359375, -0.0011696070432662964, -0.0011337697505950928, -0.0010979324579238892, -0.0010620951652526855, -0.001026257872581482, -0.0009904205799102783, -0.0009545832872390747, -0.0009187459945678711, -0.0008829087018966675, -0.0008470714092254639, -0.0008112341165542603, -0.0007753968238830566, -0.000739559531211853, -0.0007037222385406494, -0.0006678849458694458, -0.0006320476531982422, -0.0005962103605270386, -0.000560373067855835, -0.0005245357751846313, -0.0004886984825134277, -0.0004528611898422241, -0.0004170238971710205, -0.0003811866044998169, -0.0003453493118286133, -0.00030951201915740967, -0.00027367472648620605, -0.00023783743381500244, -0.00020200014114379883, -0.00016616284847259521, -0.0001303255558013916, -9.448826313018799e-05, -5.8650970458984375e-05, -2.2813677787780762e-05, 1.3023614883422852e-05, 4.8860907554626465e-05, 8.469820022583008e-05, 0.00012053549289703369, 0.0001563727855682373, 0.00019221007823944092, 0.00022804737091064453, 0.00026388466358184814, 0.00029972195625305176, 0.00033555924892425537, 0.000371396541595459, 0.0004072338342666626, 0.0004430711269378662, 0.0004789084196090698, 0.0005147457122802734, 0.000550583004951477, 0.0005864202976226807, 0.0006222575902938843, 0.0006580948829650879, 0.0006939321756362915, 0.0007297694683074951, 0.0007656067609786987, 0.0008014440536499023, 0.000837281346321106, 0.0008731186389923096, 0.0009089559316635132, 0.0009447932243347168, 0.0009806305170059204, 0.001016467809677124, 0.0010523051023483276, 0.0010881423950195312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 14.0, 19.0, 32.0, 35.0, 35.0, 71.0, 107.0, 153.0, 246.0, 371.0, 639.0, 1143.0, 2335.0, 5153.0, 13697.0, 48232.0, 272256.0, 614091.0, 61475.0, 16460.0, 6026.0, 2583.0, 1306.0, 727.0, 447.0, 304.0, 179.0, 120.0, 82.0, 60.0, 31.0, 28.0, 26.0, 16.0, 16.0, 13.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.302337646484375, -3.18475341796875, -3.067169189453125, -2.9495849609375, -2.832000732421875, -2.71441650390625, -2.596832275390625, -2.479248046875, -2.361663818359375, -2.24407958984375, -2.126495361328125, -2.0089111328125, -1.891326904296875, -1.77374267578125, -1.656158447265625, -1.53857421875, -1.420989990234375, -1.30340576171875, -1.185821533203125, -1.0682373046875, -0.950653076171875, -0.83306884765625, -0.715484619140625, -0.597900390625, -0.480316162109375, -0.36273193359375, -0.245147705078125, -0.1275634765625, -0.009979248046875, 0.10760498046875, 0.225189208984375, 0.3427734375, 0.460357666015625, 0.57794189453125, 0.695526123046875, 0.8131103515625, 0.930694580078125, 1.04827880859375, 1.165863037109375, 1.283447265625, 1.401031494140625, 1.51861572265625, 1.636199951171875, 1.7537841796875, 1.871368408203125, 1.98895263671875, 2.106536865234375, 2.22412109375, 2.341705322265625, 2.45928955078125, 2.576873779296875, 2.6944580078125, 2.812042236328125, 2.92962646484375, 3.047210693359375, 3.164794921875, 3.282379150390625, 3.39996337890625, 3.517547607421875, 3.6351318359375, 3.752716064453125, 3.87030029296875, 3.987884521484375, 4.10546875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 9.0, 8.0, 14.0, 20.0, 27.0, 29.0, 34.0, 35.0, 54.0, 74.0, 90.0, 77.0, 81.0, 84.0, 67.0, 63.0, 34.0, 38.0, 32.0, 18.0, 22.0, 19.0, 12.0, 7.0, 5.0, 5.0, 7.0, 3.0, 2.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.47265625, -4.341278076171875, -4.20989990234375, -4.078521728515625, -3.9471435546875, -3.815765380859375, -3.68438720703125, -3.553009033203125, -3.421630859375, -3.290252685546875, -3.15887451171875, -3.027496337890625, -2.8961181640625, -2.764739990234375, -2.63336181640625, -2.501983642578125, -2.37060546875, -2.239227294921875, -2.10784912109375, -1.976470947265625, -1.8450927734375, -1.713714599609375, -1.58233642578125, -1.450958251953125, -1.319580078125, -1.188201904296875, -1.05682373046875, -0.925445556640625, -0.7940673828125, -0.662689208984375, -0.53131103515625, -0.399932861328125, -0.2685546875, -0.137176513671875, -0.00579833984375, 0.125579833984375, 0.2569580078125, 0.388336181640625, 0.51971435546875, 0.651092529296875, 0.782470703125, 0.913848876953125, 1.04522705078125, 1.176605224609375, 1.3079833984375, 1.439361572265625, 1.57073974609375, 1.702117919921875, 1.83349609375, 1.964874267578125, 2.09625244140625, 2.227630615234375, 2.3590087890625, 2.490386962890625, 2.62176513671875, 2.753143310546875, 2.884521484375, 3.015899658203125, 3.14727783203125, 3.278656005859375, 3.4100341796875, 3.541412353515625, 3.67279052734375, 3.804168701171875, 3.935546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 9.0, 17.0, 44.0, 55.0, 127.0, 380.0, 166.0, 101.0, 42.0, 19.0, 17.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.843505859375, -179.34193420410156, -173.84036254882812, -168.3387908935547, -162.83721923828125, -157.33566284179688, -151.83409118652344, -146.33251953125, -140.83094787597656, -135.32937622070312, -129.8278045654297, -124.32624053955078, -118.82466888427734, -113.3230972290039, -107.821533203125, -102.31996154785156, -96.81838989257812, -91.31681823730469, -85.81524658203125, -80.31368255615234, -74.8121109008789, -69.31053924560547, -63.8089714050293, -58.307403564453125, -52.80583190917969, -47.30426025390625, -41.80269241333008, -36.301124572753906, -30.79955291748047, -25.297983169555664, -19.79641342163086, -14.294845581054688, -8.79327392578125, -3.2917041778564453, 2.2098655700683594, 7.711435317993164, 13.213005065917969, 18.714574813842773, 24.216144561767578, 29.71771240234375, 35.21928405761719, 40.720855712890625, 46.2224235534668, 51.72399139404297, 57.225563049316406, 62.727134704589844, 68.22869873046875, 73.73027038574219, 79.23184204101562, 84.73341369628906, 90.2349853515625, 95.7365493774414, 101.23812103271484, 106.73969268798828, 112.24125671386719, 117.74282836914062, 123.24440002441406, 128.7459716796875, 134.24754333496094, 139.74911499023438, 145.25067138671875, 150.7522430419922, 156.25381469726562, 161.75538635253906, 167.2569580078125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 11.0, 2.0, 7.0, 14.0, 18.0, 18.0, 22.0, 22.0, 33.0, 26.0, 36.0, 23.0, 44.0, 52.0, 114.0, 120.0, 77.0, 57.0, 30.0, 34.0, 33.0, 26.0, 23.0, 22.0, 18.0, 18.0, 14.0, 19.0, 11.0, 10.0, 9.0, 3.0, 4.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.07186126708984, -120.24730682373047, -116.4227523803711, -112.59819793701172, -108.77363586425781, -104.94908142089844, -101.12452697753906, -97.29997253417969, -93.47541809082031, -89.65086364746094, -85.82630920410156, -82.00175476074219, -78.17720031738281, -74.35264587402344, -70.52808380126953, -66.70352935791016, -62.87897491455078, -59.054420471191406, -55.22986602783203, -51.40530776977539, -47.580753326416016, -43.75619888305664, -39.931640625, -36.107086181640625, -32.28253173828125, -28.457977294921875, -24.633420944213867, -20.80886459350586, -16.984310150146484, -13.15975570678711, -9.335199356079102, -5.510643005371094, -1.6860809326171875, 2.138474464416504, 5.963029861450195, 9.787585258483887, 13.612140655517578, 17.436695098876953, 21.26125144958496, 25.08580780029297, 28.910362243652344, 32.73491668701172, 36.559471130371094, 40.384029388427734, 44.20858383178711, 48.033138275146484, 51.857696533203125, 55.6822509765625, 59.506805419921875, 63.33135986328125, 67.15591430664062, 70.98046875, 74.80502319335938, 78.62957763671875, 82.45413970947266, 86.27869415283203, 90.1032485961914, 93.92780303955078, 97.75235748291016, 101.57691192626953, 105.40147399902344, 109.22602844238281, 113.05058288574219, 116.87513732910156, 120.69969177246094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 12.0, 8.0, 10.0, 9.0, 19.0, 20.0, 40.0, 53.0, 70.0, 106.0, 146.0, 225.0, 320.0, 548.0, 888.0, 1536.0, 2958.0, 6238.0, 15937.0, 54800.0, 263145.0, 1170191.0, 1907127.0, 598606.0, 122088.0, 29766.0, 9790.0, 4293.0, 2203.0, 1182.0, 669.0, 439.0, 256.0, 169.0, 128.0, 84.0, 57.0, 40.0, 23.0, 17.0, 18.0, 14.0, 8.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-12.6171875, -12.2489013671875, -11.880615234375, -11.5123291015625, -11.14404296875, -10.7757568359375, -10.407470703125, -10.0391845703125, -9.6708984375, -9.3026123046875, -8.934326171875, -8.5660400390625, -8.19775390625, -7.8294677734375, -7.461181640625, -7.0928955078125, -6.724609375, -6.3563232421875, -5.988037109375, -5.6197509765625, -5.25146484375, -4.8831787109375, -4.514892578125, -4.1466064453125, -3.7783203125, -3.4100341796875, -3.041748046875, -2.6734619140625, -2.30517578125, -1.9368896484375, -1.568603515625, -1.2003173828125, -0.83203125, -0.4637451171875, -0.095458984375, 0.2728271484375, 0.64111328125, 1.0093994140625, 1.377685546875, 1.7459716796875, 2.1142578125, 2.4825439453125, 2.850830078125, 3.2191162109375, 3.58740234375, 3.9556884765625, 4.323974609375, 4.6922607421875, 5.060546875, 5.4288330078125, 5.797119140625, 6.1654052734375, 6.53369140625, 6.9019775390625, 7.270263671875, 7.6385498046875, 8.0068359375, 8.3751220703125, 8.743408203125, 9.1116943359375, 9.47998046875, 9.8482666015625, 10.216552734375, 10.5848388671875, 10.953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 8.0, 16.0, 12.0, 14.0, 21.0, 20.0, 26.0, 20.0, 29.0, 33.0, 42.0, 41.0, 43.0, 65.0, 48.0, 41.0, 46.0, 53.0, 66.0, 41.0, 42.0, 47.0, 31.0, 31.0, 22.0, 28.0, 19.0, 21.0, 13.0, 10.0, 4.0, 12.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.41357421875, -8.1318359375, -7.85009765625, -7.568359375, -7.28662109375, -7.0048828125, -6.72314453125, -6.44140625, -6.15966796875, -5.8779296875, -5.59619140625, -5.314453125, -5.03271484375, -4.7509765625, -4.46923828125, -4.1875, -3.90576171875, -3.6240234375, -3.34228515625, -3.060546875, -2.77880859375, -2.4970703125, -2.21533203125, -1.93359375, -1.65185546875, -1.3701171875, -1.08837890625, -0.806640625, -0.52490234375, -0.2431640625, 0.03857421875, 0.3203125, 0.60205078125, 0.8837890625, 1.16552734375, 1.447265625, 1.72900390625, 2.0107421875, 2.29248046875, 2.57421875, 2.85595703125, 3.1376953125, 3.41943359375, 3.701171875, 3.98291015625, 4.2646484375, 4.54638671875, 4.828125, 5.10986328125, 5.3916015625, 5.67333984375, 5.955078125, 6.23681640625, 6.5185546875, 6.80029296875, 7.08203125, 7.36376953125, 7.6455078125, 7.92724609375, 8.208984375, 8.49072265625, 8.7724609375, 9.05419921875, 9.3359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 13.0, 10.0, 10.0, 17.0, 18.0, 30.0, 38.0, 44.0, 84.0, 113.0, 156.0, 208.0, 364.0, 603.0, 1185.0, 3048.0, 10677.0, 72664.0, 3065464.0, 988634.0, 39085.0, 7153.0, 2191.0, 963.0, 513.0, 307.0, 205.0, 135.0, 85.0, 67.0, 56.0, 41.0, 31.0, 13.0, 15.0, 8.0, 10.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.453125, -25.567626953125, -24.68212890625, -23.796630859375, -22.9111328125, -22.025634765625, -21.14013671875, -20.254638671875, -19.369140625, -18.483642578125, -17.59814453125, -16.712646484375, -15.8271484375, -14.941650390625, -14.05615234375, -13.170654296875, -12.28515625, -11.399658203125, -10.51416015625, -9.628662109375, -8.7431640625, -7.857666015625, -6.97216796875, -6.086669921875, -5.201171875, -4.315673828125, -3.43017578125, -2.544677734375, -1.6591796875, -0.773681640625, 0.11181640625, 0.997314453125, 1.8828125, 2.768310546875, 3.65380859375, 4.539306640625, 5.4248046875, 6.310302734375, 7.19580078125, 8.081298828125, 8.966796875, 9.852294921875, 10.73779296875, 11.623291015625, 12.5087890625, 13.394287109375, 14.27978515625, 15.165283203125, 16.05078125, 16.936279296875, 17.82177734375, 18.707275390625, 19.5927734375, 20.478271484375, 21.36376953125, 22.249267578125, 23.134765625, 24.020263671875, 24.90576171875, 25.791259765625, 26.6767578125, 27.562255859375, 28.44775390625, 29.333251953125, 30.21875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 7.0, 15.0, 12.0, 18.0, 30.0, 28.0, 39.0, 66.0, 77.0, 97.0, 130.0, 211.0, 307.0, 370.0, 492.0, 501.0, 434.0, 358.0, 246.0, 171.0, 119.0, 77.0, 56.0, 41.0, 28.0, 25.0, 16.0, 19.0, 11.0, 8.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.2099609375, -20.576171875, -19.9423828125, -19.30859375, -18.6748046875, -18.041015625, -17.4072265625, -16.7734375, -16.1396484375, -15.505859375, -14.8720703125, -14.23828125, -13.6044921875, -12.970703125, -12.3369140625, -11.703125, -11.0693359375, -10.435546875, -9.8017578125, -9.16796875, -8.5341796875, -7.900390625, -7.2666015625, -6.6328125, -5.9990234375, -5.365234375, -4.7314453125, -4.09765625, -3.4638671875, -2.830078125, -2.1962890625, -1.5625, -0.9287109375, -0.294921875, 0.3388671875, 0.97265625, 1.6064453125, 2.240234375, 2.8740234375, 3.5078125, 4.1416015625, 4.775390625, 5.4091796875, 6.04296875, 6.6767578125, 7.310546875, 7.9443359375, 8.578125, 9.2119140625, 9.845703125, 10.4794921875, 11.11328125, 11.7470703125, 12.380859375, 13.0146484375, 13.6484375, 14.2822265625, 14.916015625, 15.5498046875, 16.18359375, 16.8173828125, 17.451171875, 18.0849609375, 18.71875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 10.0, 16.0, 25.0, 31.0, 45.0, 77.0, 125.0, 153.0, 164.0, 129.0, 88.0, 41.0, 31.0, 22.0, 14.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.49951171875, -172.38548278808594, -165.27145385742188, -158.15740966796875, -151.0433807373047, -143.92935180664062, -136.81532287597656, -129.7012939453125, -122.5872573852539, -115.47322845458984, -108.35919189453125, -101.24516296386719, -94.13113403320312, -87.01709747314453, -79.90306854248047, -72.78903198242188, -65.67500305175781, -58.560970306396484, -51.446937561035156, -44.332908630371094, -37.218875885009766, -30.104843139648438, -22.990814208984375, -15.876781463623047, -8.762748718261719, -1.648716926574707, 5.465314865112305, 12.579345703125, 19.693378448486328, 26.807411193847656, 33.92144012451172, 41.03547286987305, 48.149505615234375, 55.2635383605957, 62.37757110595703, 69.4916000366211, 76.60563659667969, 83.71966552734375, 90.83369445800781, 97.94772338867188, 105.06175994873047, 112.17578887939453, 119.28982543945312, 126.40385437011719, 133.51788330078125, 140.63192749023438, 147.74594116210938, 154.8599853515625, 161.97401428222656, 169.08804321289062, 176.2020721435547, 183.31610107421875, 190.43014526367188, 197.54417419433594, 204.658203125, 211.77223205566406, 218.88626098632812, 226.0002899169922, 233.11431884765625, 240.22836303710938, 247.34239196777344, 254.4564208984375, 261.5704345703125, 268.6844787597656, 275.79852294921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 15.0, 8.0, 9.0, 11.0, 9.0, 19.0, 20.0, 26.0, 22.0, 26.0, 31.0, 27.0, 34.0, 34.0, 53.0, 37.0, 49.0, 57.0, 51.0, 50.0, 32.0, 36.0, 39.0, 29.0, 33.0, 30.0, 31.0, 36.0, 18.0, 25.0, 18.0, 15.0, 6.0, 12.0, 3.0, 4.0, 5.0, 5.0, 3.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-104.94803619384766, -101.1576156616211, -97.36720275878906, -93.5767822265625, -89.78636169433594, -85.99594116210938, -82.20552825927734, -78.41510772705078, -74.62469482421875, -70.83427429199219, -67.04386138916016, -63.253440856933594, -59.46302032470703, -55.672603607177734, -51.88218688964844, -48.091766357421875, -44.30134582519531, -40.510929107666016, -36.72050857543945, -32.930091857910156, -29.139673233032227, -25.349254608154297, -21.558837890625, -17.76841926574707, -13.97800064086914, -10.187582015991211, -6.397164344787598, -2.6067466735839844, 1.1836719512939453, 4.974090576171875, 8.764507293701172, 12.554925918579102, 16.345352172851562, 20.135770797729492, 23.926189422607422, 27.71660614013672, 31.50702476501465, 35.29744338989258, 39.087860107421875, 42.87828063964844, 46.668697357177734, 50.45911407470703, 54.249534606933594, 58.03995132446289, 61.83036804199219, 65.62078857421875, 69.41120910644531, 73.20162200927734, 76.9920425415039, 80.78246307373047, 84.5728759765625, 88.36329650878906, 92.15371704101562, 95.94413757324219, 99.73455047607422, 103.52497100830078, 107.31538391113281, 111.10580444335938, 114.8962173461914, 118.68663787841797, 122.47705841064453, 126.26747131347656, 130.05789184570312, 133.8483123779297, 137.63873291015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 10.0, 10.0, 20.0, 34.0, 56.0, 98.0, 171.0, 269.0, 452.0, 796.0, 1531.0, 3245.0, 7660.0, 20067.0, 61939.0, 223328.0, 498038.0, 157852.0, 45725.0, 15496.0, 6059.0, 2780.0, 1277.0, 653.0, 378.0, 240.0, 136.0, 83.0, 58.0, 33.0, 18.0, 16.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.8125, -17.32275390625, -16.8330078125, -16.34326171875, -15.853515625, -15.36376953125, -14.8740234375, -14.38427734375, -13.89453125, -13.40478515625, -12.9150390625, -12.42529296875, -11.935546875, -11.44580078125, -10.9560546875, -10.46630859375, -9.9765625, -9.48681640625, -8.9970703125, -8.50732421875, -8.017578125, -7.52783203125, -7.0380859375, -6.54833984375, -6.05859375, -5.56884765625, -5.0791015625, -4.58935546875, -4.099609375, -3.60986328125, -3.1201171875, -2.63037109375, -2.140625, -1.65087890625, -1.1611328125, -0.67138671875, -0.181640625, 0.30810546875, 0.7978515625, 1.28759765625, 1.77734375, 2.26708984375, 2.7568359375, 3.24658203125, 3.736328125, 4.22607421875, 4.7158203125, 5.20556640625, 5.6953125, 6.18505859375, 6.6748046875, 7.16455078125, 7.654296875, 8.14404296875, 8.6337890625, 9.12353515625, 9.61328125, 10.10302734375, 10.5927734375, 11.08251953125, 11.572265625, 12.06201171875, 12.5517578125, 13.04150390625, 13.53125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 10.0, 7.0, 12.0, 22.0, 25.0, 31.0, 28.0, 39.0, 37.0, 36.0, 48.0, 55.0, 67.0, 58.0, 51.0, 59.0, 61.0, 46.0, 59.0, 51.0, 35.0, 36.0, 26.0, 20.0, 16.0, 13.0, 8.0, 11.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.8675537109375, -12.500732421875, -12.1339111328125, -11.76708984375, -11.4002685546875, -11.033447265625, -10.6666259765625, -10.2998046875, -9.9329833984375, -9.566162109375, -9.1993408203125, -8.83251953125, -8.4656982421875, -8.098876953125, -7.7320556640625, -7.365234375, -6.9984130859375, -6.631591796875, -6.2647705078125, -5.89794921875, -5.5311279296875, -5.164306640625, -4.7974853515625, -4.4306640625, -4.0638427734375, -3.697021484375, -3.3302001953125, -2.96337890625, -2.5965576171875, -2.229736328125, -1.8629150390625, -1.49609375, -1.1292724609375, -0.762451171875, -0.3956298828125, -0.02880859375, 0.3380126953125, 0.704833984375, 1.0716552734375, 1.4384765625, 1.8052978515625, 2.172119140625, 2.5389404296875, 2.90576171875, 3.2725830078125, 3.639404296875, 4.0062255859375, 4.373046875, 4.7398681640625, 5.106689453125, 5.4735107421875, 5.84033203125, 6.2071533203125, 6.573974609375, 6.9407958984375, 7.3076171875, 7.6744384765625, 8.041259765625, 8.4080810546875, 8.77490234375, 9.1417236328125, 9.508544921875, 9.8753662109375, 10.2421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 5.0, 6.0, 4.0, 10.0, 22.0, 33.0, 34.0, 52.0, 89.0, 130.0, 233.0, 422.0, 854.0, 2374.0, 10242.0, 122118.0, 858776.0, 44252.0, 5667.0, 1605.0, 667.0, 346.0, 175.0, 128.0, 103.0, 52.0, 52.0, 17.0, 18.0, 15.0, 13.0, 7.0, 10.0, 8.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.859375, -22.080078125, -21.30078125, -20.521484375, -19.7421875, -18.962890625, -18.18359375, -17.404296875, -16.625, -15.845703125, -15.06640625, -14.287109375, -13.5078125, -12.728515625, -11.94921875, -11.169921875, -10.390625, -9.611328125, -8.83203125, -8.052734375, -7.2734375, -6.494140625, -5.71484375, -4.935546875, -4.15625, -3.376953125, -2.59765625, -1.818359375, -1.0390625, -0.259765625, 0.51953125, 1.298828125, 2.078125, 2.857421875, 3.63671875, 4.416015625, 5.1953125, 5.974609375, 6.75390625, 7.533203125, 8.3125, 9.091796875, 9.87109375, 10.650390625, 11.4296875, 12.208984375, 12.98828125, 13.767578125, 14.546875, 15.326171875, 16.10546875, 16.884765625, 17.6640625, 18.443359375, 19.22265625, 20.001953125, 20.78125, 21.560546875, 22.33984375, 23.119140625, 23.8984375, 24.677734375, 25.45703125, 26.236328125, 27.015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 6.0, 9.0, 13.0, 13.0, 16.0, 30.0, 29.0, 43.0, 45.0, 54.0, 69.0, 101.0, 93.0, 99.0, 62.0, 52.0, 45.0, 33.0, 27.0, 37.0, 29.0, 19.0, 12.0, 13.0, 7.0, 6.0, 9.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.24658203125, -37.7119140625, -36.17724609375, -34.642578125, -33.10791015625, -31.5732421875, -30.03857421875, -28.50390625, -26.96923828125, -25.4345703125, -23.89990234375, -22.365234375, -20.83056640625, -19.2958984375, -17.76123046875, -16.2265625, -14.69189453125, -13.1572265625, -11.62255859375, -10.087890625, -8.55322265625, -7.0185546875, -5.48388671875, -3.94921875, -2.41455078125, -0.8798828125, 0.65478515625, 2.189453125, 3.72412109375, 5.2587890625, 6.79345703125, 8.328125, 9.86279296875, 11.3974609375, 12.93212890625, 14.466796875, 16.00146484375, 17.5361328125, 19.07080078125, 20.60546875, 22.14013671875, 23.6748046875, 25.20947265625, 26.744140625, 28.27880859375, 29.8134765625, 31.34814453125, 32.8828125, 34.41748046875, 35.9521484375, 37.48681640625, 39.021484375, 40.55615234375, 42.0908203125, 43.62548828125, 45.16015625, 46.69482421875, 48.2294921875, 49.76416015625, 51.298828125, 52.83349609375, 54.3681640625, 55.90283203125, 57.4375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 17.0, 10.0, 20.0, 27.0, 56.0, 48.0, 133.0, 173.0, 258.0, 561.0, 1280.0, 3705.0, 14211.0, 92873.0, 868815.0, 51813.0, 9707.0, 2708.0, 988.0, 411.0, 240.0, 154.0, 104.0, 58.0, 35.0, 26.0, 23.0, 13.0, 11.0, 10.0, 10.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2835693359375, -2.205810546875, -2.1280517578125, -2.05029296875, -1.9725341796875, -1.894775390625, -1.8170166015625, -1.7392578125, -1.6614990234375, -1.583740234375, -1.5059814453125, -1.42822265625, -1.3504638671875, -1.272705078125, -1.1949462890625, -1.1171875, -1.0394287109375, -0.961669921875, -0.8839111328125, -0.80615234375, -0.7283935546875, -0.650634765625, -0.5728759765625, -0.4951171875, -0.4173583984375, -0.339599609375, -0.2618408203125, -0.18408203125, -0.1063232421875, -0.028564453125, 0.0491943359375, 0.126953125, 0.2047119140625, 0.282470703125, 0.3602294921875, 0.43798828125, 0.5157470703125, 0.593505859375, 0.6712646484375, 0.7490234375, 0.8267822265625, 0.904541015625, 0.9822998046875, 1.06005859375, 1.1378173828125, 1.215576171875, 1.2933349609375, 1.37109375, 1.4488525390625, 1.526611328125, 1.6043701171875, 1.68212890625, 1.7598876953125, 1.837646484375, 1.9154052734375, 1.9931640625, 2.0709228515625, 2.148681640625, 2.2264404296875, 2.30419921875, 2.3819580078125, 2.459716796875, 2.5374755859375, 2.615234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 11.0, 10.0, 13.0, 12.0, 16.0, 22.0, 34.0, 35.0, 65.0, 105.0, 116.0, 126.0, 111.0, 105.0, 58.0, 31.0, 25.0, 22.0, 14.0, 14.0, 7.0, 7.0, 13.0, 7.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005545616149902344, -0.0005383715033531189, -0.0005221813917160034, -0.0005059912800788879, -0.0004898011684417725, -0.000473611056804657, -0.0004574209451675415, -0.000441230833530426, -0.00042504072189331055, -0.00040885061025619507, -0.0003926604986190796, -0.0003764703869819641, -0.00036028027534484863, -0.00034409016370773315, -0.0003279000520706177, -0.0003117099404335022, -0.0002955198287963867, -0.00027932971715927124, -0.00026313960552215576, -0.0002469494938850403, -0.0002307593822479248, -0.00021456927061080933, -0.00019837915897369385, -0.00018218904733657837, -0.0001659989356994629, -0.0001498088240623474, -0.00013361871242523193, -0.00011742860078811646, -0.00010123848915100098, -8.50483775138855e-05, -6.885826587677002e-05, -5.266815423965454e-05, -3.647804260253906e-05, -2.0287930965423584e-05, -4.0978193283081055e-06, 1.2092292308807373e-05, 2.828240394592285e-05, 4.447251558303833e-05, 6.066262722015381e-05, 7.685273885726929e-05, 9.304285049438477e-05, 0.00010923296213150024, 0.00012542307376861572, 0.0001416131854057312, 0.00015780329704284668, 0.00017399340867996216, 0.00019018352031707764, 0.00020637363195419312, 0.0002225637435913086, 0.00023875385522842407, 0.00025494396686553955, 0.00027113407850265503, 0.0002873241901397705, 0.000303514301776886, 0.00031970441341400146, 0.00033589452505111694, 0.0003520846366882324, 0.0003682747483253479, 0.0003844648599624634, 0.00040065497159957886, 0.00041684508323669434, 0.0004330351948738098, 0.0004492253065109253, 0.00046541541814804077, 0.00048160552978515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 2.0, 7.0, 7.0, 11.0, 18.0, 22.0, 51.0, 62.0, 100.0, 131.0, 205.0, 353.0, 588.0, 1080.0, 2223.0, 4893.0, 12605.0, 38467.0, 230551.0, 662821.0, 63326.0, 18174.0, 6579.0, 2927.0, 1343.0, 785.0, 435.0, 245.0, 165.0, 110.0, 71.0, 55.0, 34.0, 27.0, 14.0, 9.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.66015625, -1.6085662841796875, -1.556976318359375, -1.5053863525390625, -1.45379638671875, -1.4022064208984375, -1.350616455078125, -1.2990264892578125, -1.2474365234375, -1.1958465576171875, -1.144256591796875, -1.0926666259765625, -1.04107666015625, -0.9894866943359375, -0.937896728515625, -0.8863067626953125, -0.834716796875, -0.7831268310546875, -0.731536865234375, -0.6799468994140625, -0.62835693359375, -0.5767669677734375, -0.525177001953125, -0.4735870361328125, -0.4219970703125, -0.3704071044921875, -0.318817138671875, -0.2672271728515625, -0.21563720703125, -0.1640472412109375, -0.112457275390625, -0.0608673095703125, -0.00927734375, 0.0423126220703125, 0.093902587890625, 0.1454925537109375, 0.19708251953125, 0.2486724853515625, 0.300262451171875, 0.3518524169921875, 0.4034423828125, 0.4550323486328125, 0.506622314453125, 0.5582122802734375, 0.60980224609375, 0.6613922119140625, 0.712982177734375, 0.7645721435546875, 0.816162109375, 0.8677520751953125, 0.919342041015625, 0.9709320068359375, 1.02252197265625, 1.0741119384765625, 1.125701904296875, 1.1772918701171875, 1.2288818359375, 1.2804718017578125, 1.332061767578125, 1.3836517333984375, 1.43524169921875, 1.4868316650390625, 1.538421630859375, 1.5900115966796875, 1.6416015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 7.0, 19.0, 17.0, 17.0, 20.0, 53.0, 37.0, 42.0, 74.0, 91.0, 125.0, 126.0, 83.0, 60.0, 46.0, 35.0, 38.0, 21.0, 18.0, 8.0, 14.0, 7.0, 7.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.4447021484375, -2.346435546875, -2.2481689453125, -2.14990234375, -2.0516357421875, -1.953369140625, -1.8551025390625, -1.7568359375, -1.6585693359375, -1.560302734375, -1.4620361328125, -1.36376953125, -1.2655029296875, -1.167236328125, -1.0689697265625, -0.970703125, -0.8724365234375, -0.774169921875, -0.6759033203125, -0.57763671875, -0.4793701171875, -0.381103515625, -0.2828369140625, -0.1845703125, -0.0863037109375, 0.011962890625, 0.1102294921875, 0.20849609375, 0.3067626953125, 0.405029296875, 0.5032958984375, 0.6015625, 0.6998291015625, 0.798095703125, 0.8963623046875, 0.99462890625, 1.0928955078125, 1.191162109375, 1.2894287109375, 1.3876953125, 1.4859619140625, 1.584228515625, 1.6824951171875, 1.78076171875, 1.8790283203125, 1.977294921875, 2.0755615234375, 2.173828125, 2.2720947265625, 2.370361328125, 2.4686279296875, 2.56689453125, 2.6651611328125, 2.763427734375, 2.8616943359375, 2.9599609375, 3.0582275390625, 3.156494140625, 3.2547607421875, 3.35302734375, 3.4512939453125, 3.549560546875, 3.6478271484375, 3.74609375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 3.0, 5.0, 15.0, 12.0, 16.0, 34.0, 75.0, 186.0, 267.0, 203.0, 93.0, 48.0, 18.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-147.26199340820312, -142.27487182617188, -137.2877655029297, -132.30064392089844, -127.31353759765625, -122.326416015625, -117.33930206298828, -112.35218811035156, -107.36507415771484, -102.37796020507812, -97.3908462524414, -92.40373229980469, -87.41661071777344, -82.42950439453125, -77.4423828125, -72.45526885986328, -67.46815490722656, -62.481040954589844, -57.493927001953125, -52.50680923461914, -47.51969528198242, -42.5325813293457, -37.54546356201172, -32.558349609375, -27.57123565673828, -22.584121704101562, -17.59700584411621, -12.609890937805176, -7.622776031494141, -2.635662078857422, 2.3514537811279297, 7.338569641113281, 12.325698852539062, 17.31281280517578, 22.299928665161133, 27.287044525146484, 32.2741584777832, 37.26127243041992, 42.248390197753906, 47.235504150390625, 52.222618103027344, 57.20973205566406, 62.19684600830078, 67.1839599609375, 72.17108154296875, 77.15818786621094, 82.14530944824219, 87.1324234008789, 92.11953735351562, 97.10665130615234, 102.09376525878906, 107.08087921142578, 112.0679931640625, 117.05511474609375, 122.04222869873047, 127.02934265136719, 132.01644897460938, 137.00357055664062, 141.9906768798828, 146.97779846191406, 151.96490478515625, 156.9520263671875, 161.9391326904297, 166.92625427246094, 171.9133758544922]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 7.0, 12.0, 9.0, 16.0, 19.0, 23.0, 24.0, 61.0, 112.0, 98.0, 44.0, 46.0, 41.0, 35.0, 63.0, 84.0, 94.0, 55.0, 38.0, 14.0, 21.0, 10.0, 11.0, 9.0, 6.0, 3.0, 7.0, 6.0, 1.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-124.95172882080078, -121.33545684814453, -117.71917724609375, -114.1029052734375, -110.48663330078125, -106.870361328125, -103.25408935546875, -99.63780975341797, -96.02153778076172, -92.40526580810547, -88.78898620605469, -85.17271423339844, -81.55644226074219, -77.94017028808594, -74.32389831542969, -70.7076187133789, -67.09134674072266, -63.475074768066406, -59.85879898071289, -56.242523193359375, -52.626251220703125, -49.009979248046875, -45.39370346069336, -41.777427673339844, -38.161155700683594, -34.544883728027344, -30.928607940673828, -27.312334060668945, -23.696060180664062, -20.07978630065918, -16.463512420654297, -12.847238540649414, -9.230972290039062, -5.61469841003418, -1.9984245300292969, 1.617849349975586, 5.234123229980469, 8.850397109985352, 12.466670989990234, 16.082944869995117, 19.69921875, 23.315492630004883, 26.931766510009766, 30.54804039001465, 34.16431427001953, 37.78058624267578, 41.3968620300293, 45.01313781738281, 48.62940979003906, 52.24568176269531, 55.86195755004883, 59.478233337402344, 63.094505310058594, 66.71077728271484, 70.32705688476562, 73.94332885742188, 77.55960083007812, 81.17587280273438, 84.79214477539062, 88.4084243774414, 92.02469635009766, 95.6409683227539, 99.25724792480469, 102.87351989746094, 106.48979187011719]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 8.0, 7.0, 9.0, 9.0, 14.0, 5.0, 15.0, 14.0, 23.0, 32.0, 25.0, 32.0, 32.0, 48.0, 94.0, 246.0, 96.0, 42.0, 25.0, 37.0, 33.0, 16.0, 17.0, 21.0, 14.0, 9.0, 16.0, 10.0, 5.0, 5.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.34576416015625, -7.0782470703125, -6.81072998046875, -6.543212890625, -6.27569580078125, -6.0081787109375, -5.74066162109375, -5.47314453125, -5.20562744140625, -4.9381103515625, -4.67059326171875, -4.403076171875, -4.13555908203125, -3.8680419921875, -3.60052490234375, -3.3330078125, -3.06549072265625, -2.7979736328125, -2.53045654296875, -2.262939453125, -1.99542236328125, -1.7279052734375, -1.46038818359375, -1.19287109375, -0.92535400390625, -0.6578369140625, -0.39031982421875, -0.122802734375, 0.14471435546875, 0.4122314453125, 0.67974853515625, 0.947265625, 1.21478271484375, 1.4822998046875, 1.74981689453125, 2.017333984375, 2.28485107421875, 2.5523681640625, 2.81988525390625, 3.08740234375, 3.35491943359375, 3.6224365234375, 3.88995361328125, 4.157470703125, 4.42498779296875, 4.6925048828125, 4.96002197265625, 5.2275390625, 5.49505615234375, 5.7625732421875, 6.03009033203125, 6.297607421875, 6.56512451171875, 6.8326416015625, 7.10015869140625, 7.36767578125, 7.63519287109375, 7.9027099609375, 8.17022705078125, 8.437744140625, 8.70526123046875, 8.9727783203125, 9.24029541015625, 9.5078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 5.0, 10.0, 8.0, 12.0, 23.0, 38.0, 42.0, 75.0, 92.0, 187.0, 331.0, 764.0, 2098.0, 6646.0, 74963.0, 8287627.0, 10675.0, 2911.0, 1032.0, 449.0, 194.0, 133.0, 69.0, 44.0, 29.0, 16.0, 10.0, 16.0, 12.0, 7.0, 11.0, 9.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-82.97441101074219, -80.68035888671875, -78.38629913330078, -76.09224700927734, -73.79818725585938, -71.50413513183594, -69.21007537841797, -66.91602325439453, -64.62196350097656, -62.32790756225586, -60.033851623535156, -57.73979568481445, -55.44573974609375, -53.15168380737305, -50.857627868652344, -48.563575744628906, -46.2695198059082, -43.9754638671875, -41.6814079284668, -39.387351989746094, -37.09329605102539, -34.79924011230469, -32.50518798828125, -30.211130142211914, -27.91707420349121, -25.623018264770508, -23.328962326049805, -21.034908294677734, -18.74085235595703, -16.446796417236328, -14.152740478515625, -11.858684539794922, -9.564624786376953, -7.27056884765625, -4.976513385772705, -2.68245792388916, -0.38840198516845703, 1.905653953552246, 4.199708938598633, 6.493764877319336, 8.787820816040039, 11.081876754760742, 13.375932693481445, 15.669987678527832, 17.96404266357422, 20.258098602294922, 22.552154541015625, 24.846210479736328, 27.14026641845703, 29.434322357177734, 31.728378295898438, 34.02243423461914, 36.316490173339844, 38.61054611206055, 40.90460205078125, 43.19865417480469, 45.492713928222656, 47.78676986694336, 50.08082580566406, 52.374881744384766, 54.66893768310547, 56.96299362182617, 59.257049560546875, 61.55110168457031, 63.845157623291016]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 8.0, 2.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-137.78854370117188, -133.39793395996094, -129.00733947753906, -124.61672973632812, -120.22612762451172, -115.83552551269531, -111.44491577148438, -107.05431365966797, -102.66371154785156, -98.27310943603516, -93.88250732421875, -89.49189758300781, -85.1012954711914, -80.710693359375, -76.32008361816406, -71.92948150634766, -67.53887939453125, -63.148277282714844, -58.75767135620117, -54.3670654296875, -49.976463317871094, -45.58586120605469, -41.195255279541016, -36.804649353027344, -32.41404724121094, -28.0234432220459, -23.63283920288086, -19.24223518371582, -14.851631164550781, -10.461027145385742, -6.070423126220703, -1.679819107055664, 2.7107696533203125, 7.101373672485352, 11.49197769165039, 15.88258171081543, 20.27318572998047, 24.663789749145508, 29.054393768310547, 33.44499969482422, 37.835601806640625, 42.22620391845703, 46.6168098449707, 51.007415771484375, 55.39801788330078, 59.78861999511719, 64.17922973632812, 68.56983184814453, 72.96043395996094, 77.35103607177734, 81.74163818359375, 86.13224792480469, 90.5228500366211, 94.9134521484375, 99.30406188964844, 103.69466400146484, 108.08526611328125, 112.47586822509766, 116.86647033691406, 121.257080078125, 125.6476821899414, 130.0382843017578, 134.42889404296875, 138.81948852539062, 143.21009826660156]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 14.0, 22.0, 27.0, 38.0, 58.0, 84.0, 190.0, 311.0, 605.0, 1232.0, 2483.0, 5178.0, 11607.0, 25812.0, 60052.0, 127009.0, 148140.0, 78800.0, 34558.0, 15165.0, 6690.0, 3061.0, 1483.0, 734.0, 368.0, 219.0, 97.0, 86.0, 47.0, 33.0, 19.0, 9.0, 5.0, 7.0, 6.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.1875, -53.52294921875, -51.8583984375, -50.19384765625, -48.529296875, -46.86474609375, -45.2001953125, -43.53564453125, -41.87109375, -40.20654296875, -38.5419921875, -36.87744140625, -35.212890625, -33.54833984375, -31.8837890625, -30.21923828125, -28.5546875, -26.89013671875, -25.2255859375, -23.56103515625, -21.896484375, -20.23193359375, -18.5673828125, -16.90283203125, -15.23828125, -13.57373046875, -11.9091796875, -10.24462890625, -8.580078125, -6.91552734375, -5.2509765625, -3.58642578125, -1.921875, -0.25732421875, 1.4072265625, 3.07177734375, 4.736328125, 6.40087890625, 8.0654296875, 9.72998046875, 11.39453125, 13.05908203125, 14.7236328125, 16.38818359375, 18.052734375, 19.71728515625, 21.3818359375, 23.04638671875, 24.7109375, 26.37548828125, 28.0400390625, 29.70458984375, 31.369140625, 33.03369140625, 34.6982421875, 36.36279296875, 38.02734375, 39.69189453125, 41.3564453125, 43.02099609375, 44.685546875, 46.35009765625, 48.0146484375, 49.67919921875, 51.34375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 7.0, 6.0, 13.0, 10.0, 19.0, 12.0, 27.0, 26.0, 42.0, 45.0, 54.0, 47.0, 38.0, 52.0, 63.0, 60.0, 72.0, 67.0, 48.0, 50.0, 52.0, 40.0, 33.0, 29.0, 15.0, 13.0, 7.0, 9.0, 10.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.654052734375, -11.30029296875, -10.946533203125, -10.5927734375, -10.239013671875, -9.88525390625, -9.531494140625, -9.177734375, -8.823974609375, -8.47021484375, -8.116455078125, -7.7626953125, -7.408935546875, -7.05517578125, -6.701416015625, -6.34765625, -5.993896484375, -5.64013671875, -5.286376953125, -4.9326171875, -4.578857421875, -4.22509765625, -3.871337890625, -3.517578125, -3.163818359375, -2.81005859375, -2.456298828125, -2.1025390625, -1.748779296875, -1.39501953125, -1.041259765625, -0.6875, -0.333740234375, 0.02001953125, 0.373779296875, 0.7275390625, 1.081298828125, 1.43505859375, 1.788818359375, 2.142578125, 2.496337890625, 2.85009765625, 3.203857421875, 3.5576171875, 3.911376953125, 4.26513671875, 4.618896484375, 4.97265625, 5.326416015625, 5.68017578125, 6.033935546875, 6.3876953125, 6.741455078125, 7.09521484375, 7.448974609375, 7.802734375, 8.156494140625, 8.51025390625, 8.864013671875, 9.2177734375, 9.571533203125, 9.92529296875, 10.279052734375, 10.6328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 3.0, 7.0, 10.0, 24.0, 93.0, 127.0, 108.0, 48.0, 16.0, 15.0, 6.0, 14.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.16116333007812, -144.475830078125, -140.79049682617188, -137.10516357421875, -133.41983032226562, -129.73448181152344, -126.04914855957031, -122.36381530761719, -118.67848205566406, -114.99314880371094, -111.30781555175781, -107.62247467041016, -103.93714141845703, -100.2518081665039, -96.56646728515625, -92.88113403320312, -89.19580078125, -85.51046752929688, -81.82513427734375, -78.1397933959961, -74.45446014404297, -70.76912689208984, -67.08378601074219, -63.39845275878906, -59.71311950683594, -56.02778625488281, -52.34244918823242, -48.65711212158203, -44.971778869628906, -41.28644561767578, -37.60110855102539, -33.915771484375, -30.230438232421875, -26.545103073120117, -22.85976791381836, -19.1744327545166, -15.489097595214844, -11.803762435913086, -8.118427276611328, -4.43309211730957, -0.7477569580078125, 2.9375782012939453, 6.622913360595703, 10.308248519897461, 13.993583679199219, 17.678918838500977, 21.364253997802734, 25.049589157104492, 28.73492431640625, 32.420257568359375, 36.105594635009766, 39.790931701660156, 43.47626495361328, 47.161598205566406, 50.8469352722168, 54.53227233886719, 58.21760559082031, 61.90293884277344, 65.58827209472656, 69.27361297607422, 72.95894622802734, 76.64427947998047, 80.32962036132812, 84.01495361328125, 87.70028686523438]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 6.0, 0.0, 3.0, 5.0, 11.0, 15.0, 28.0, 72.0, 94.0, 74.0, 52.0, 26.0, 19.0, 16.0, 4.0, 6.0, 8.0, 5.0, 4.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.82432556152344, -51.05133819580078, -49.27835464477539, -47.50537109375, -45.732383728027344, -43.95939636230469, -42.1864128112793, -40.413429260253906, -38.64044189453125, -36.867454528808594, -35.0944709777832, -33.32148742675781, -31.548500061035156, -29.775514602661133, -28.00252914428711, -26.229543685913086, -24.456558227539062, -22.68357276916504, -20.910587310791016, -19.137601852416992, -17.36461639404297, -15.591630935668945, -13.818645477294922, -12.045660018920898, -10.272674560546875, -8.499689102172852, -6.726703643798828, -4.953718185424805, -3.1807327270507812, -1.4077472686767578, 0.3652381896972656, 2.138223648071289, 3.911212921142578, 5.684198379516602, 7.457183837890625, 9.230169296264648, 11.003154754638672, 12.776140213012695, 14.549125671386719, 16.322111129760742, 18.095096588134766, 19.86808204650879, 21.641067504882812, 23.414052963256836, 25.18703842163086, 26.960023880004883, 28.733009338378906, 30.50599479675293, 32.27898025512695, 34.051963806152344, 35.824951171875, 37.597938537597656, 39.37092208862305, 41.14390563964844, 42.916893005371094, 44.68988037109375, 46.46286392211914, 48.23584747314453, 50.00883483886719, 51.781822204589844, 53.554805755615234, 55.327789306640625, 57.10077667236328, 58.87376403808594, 60.64674758911133]}, "eval/loss": 0.9911340475082397, "eval/wer": 0.14885806694842946, "eval/runtime": 870.6822, "eval/samples_per_second": 3.034, "eval/steps_per_second": 0.38} \ No newline at end of file +{"train/loss": 0.4733, "train/learning_rate": 2.396080760095012e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 107983, "_timestamp": 1646769222, "_step": 16510, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 10.0, 29843.0, 559.0, 32.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.375, -148.1171875, -143.859375, -139.6015625, -135.34375, -131.0859375, -126.828125, -122.5703125, -118.3125, -114.0546875, -109.796875, -105.5390625, -101.28125, -97.0234375, -92.765625, -88.5078125, -84.25, -79.9921875, -75.734375, -71.4765625, -67.21875, -62.9609375, -58.703125, -54.4453125, -50.1875, -45.9296875, -41.671875, -37.4140625, -33.15625, -28.8984375, -24.640625, -20.3828125, -16.125, -11.8671875, -7.609375, -3.3515625, 0.90625, 5.1640625, 9.421875, 13.6796875, 17.9375, 22.1953125, 26.453125, 30.7109375, 34.96875, 39.2265625, 43.484375, 47.7421875, 52.0, 56.2578125, 60.515625, 64.7734375, 69.03125, 73.2890625, 77.546875, 81.8046875, 86.0625, 90.3203125, 94.578125, 98.8359375, 103.09375, 107.3515625, 111.609375, 115.8671875, 120.125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 10.0, 20.0, 13.0, 18.0, 20.0, 19.0, 21.0, 35.0, 34.0, 44.0, 48.0, 45.0, 48.0, 44.0, 60.0, 34.0, 58.0, 57.0, 54.0, 59.0, 45.0, 45.0, 39.0, 28.0, 17.0, 17.0, 19.0, 14.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.37356567382812, -89.39723205566406, -87.4208984375, -85.44456481933594, -83.46823120117188, -81.49189758300781, -79.51555633544922, -77.53922271728516, -75.5628890991211, -73.58655548095703, -71.61022186279297, -69.6338882446289, -67.65755462646484, -65.68121337890625, -63.70488357543945, -61.728546142578125, -59.75221252441406, -57.77587890625, -55.79954528808594, -53.82320785522461, -51.84687423706055, -49.870540618896484, -47.89420700073242, -45.917869567871094, -43.9415397644043, -41.965206146240234, -39.98887252807617, -38.012535095214844, -36.03620147705078, -34.05986785888672, -32.083534240722656, -30.10719871520996, -28.130863189697266, -26.154529571533203, -24.178194046020508, -22.201860427856445, -20.22552490234375, -18.249191284179688, -16.272857666015625, -14.29652214050293, -12.32018756866455, -10.343852996826172, -8.367518424987793, -6.391184329986572, -4.414849758148193, -2.4385156631469727, -0.46218109130859375, 1.5141534805297852, 3.490488052368164, 5.466822624206543, 7.443157196044922, 9.419490814208984, 11.39582633972168, 13.372159957885742, 15.348494529724121, 17.3248291015625, 19.301162719726562, 21.277496337890625, 23.25383186340332, 25.230165481567383, 27.206501007080078, 29.18283462524414, 31.159168243408203, 33.13550567626953, 35.111839294433594]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 8.0, 8.0, 9.0, 11.0, 17.0, 11.0, 12.0, 15.0, 18.0, 20.0, 17.0, 28.0, 28.0, 31.0, 35.0, 38.0, 38.0, 42.0, 36.0, 36.0, 37.0, 44.0, 33.0, 33.0, 31.0, 35.0, 23.0, 34.0, 30.0, 35.0, 20.0, 19.0, 24.0, 22.0, 14.0, 17.0, 11.0, 13.0, 9.0, 9.0, 7.0, 8.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.794132232666016, -35.45803451538086, -34.12193298339844, -32.78583526611328, -31.44973373413086, -30.113636016845703, -28.777536392211914, -27.441436767578125, -26.105337142944336, -24.769237518310547, -23.433137893676758, -22.09703826904297, -20.760940551757812, -19.42483901977539, -18.088741302490234, -16.752641677856445, -15.416542053222656, -14.080442428588867, -12.744342803955078, -11.408244132995605, -10.072144508361816, -8.736044883728027, -7.399946212768555, -6.063846588134766, -4.727746963500977, -3.3916475772857666, -2.0555481910705566, -0.7194490432739258, 0.6166505813598633, 1.9527502059936523, 3.288848876953125, 4.624948501586914, 5.961051940917969, 7.297151565551758, 8.633251190185547, 9.96934986114502, 11.305449485778809, 12.641549110412598, 13.97764778137207, 15.31374740600586, 16.64984703063965, 17.985946655273438, 19.322046279907227, 20.658145904541016, 21.994243621826172, 23.330345153808594, 24.66644287109375, 26.00254249572754, 27.338642120361328, 28.674741744995117, 30.010841369628906, 31.346939086914062, 32.683040618896484, 34.01913833618164, 35.35523986816406, 36.69133758544922, 38.027435302734375, 39.36353302001953, 40.69963455200195, 42.03573226928711, 43.37183380126953, 44.70793151855469, 46.044029235839844, 47.380130767822266, 48.71623229980469]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 13.0, 13.0, 24.0, 26.0, 56.0, 72.0, 129.0, 197.0, 328.0, 491.0, 764.0, 1168.0, 1827.0, 2862.0, 4224.0, 6468.0, 9429.0, 13568.0, 19808.0, 27758.0, 37523.0, 49670.0, 63077.0, 76823.0, 89742.0, 106775.0, 116325.0, 91238.0, 79377.0, 65309.0, 51533.0, 38934.0, 28801.0, 20435.0, 14370.0, 9832.0, 6658.0, 4510.0, 2917.0, 1975.0, 1319.0, 828.0, 522.0, 319.0, 179.0, 135.0, 78.0, 55.0, 27.0, 19.0, 14.0, 12.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-156.75, -151.861328125, -146.97265625, -142.083984375, -137.1953125, -132.306640625, -127.41796875, -122.529296875, -117.640625, -112.751953125, -107.86328125, -102.974609375, -98.0859375, -93.197265625, -88.30859375, -83.419921875, -78.53125, -73.642578125, -68.75390625, -63.865234375, -58.9765625, -54.087890625, -49.19921875, -44.310546875, -39.421875, -34.533203125, -29.64453125, -24.755859375, -19.8671875, -14.978515625, -10.08984375, -5.201171875, -0.3125, 4.576171875, 9.46484375, 14.353515625, 19.2421875, 24.130859375, 29.01953125, 33.908203125, 38.796875, 43.685546875, 48.57421875, 53.462890625, 58.3515625, 63.240234375, 68.12890625, 73.017578125, 77.90625, 82.794921875, 87.68359375, 92.572265625, 97.4609375, 102.349609375, 107.23828125, 112.126953125, 117.015625, 121.904296875, 126.79296875, 131.681640625, 136.5703125, 141.458984375, 146.34765625, 151.236328125, 156.125]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 10.0, 13.0, 14.0, 12.0, 21.0, 15.0, 27.0, 33.0, 40.0, 29.0, 34.0, 40.0, 39.0, 41.0, 29.0, 44.0, 67.0, 51.0, 45.0, 44.0, 36.0, 47.0, 32.0, 36.0, 31.0, 26.0, 22.0, 15.0, 19.0, 7.0, 16.0, 15.0, 9.0, 5.0, 4.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.8125, -73.2578125, -70.703125, -68.1484375, -65.59375, -63.0390625, -60.484375, -57.9296875, -55.375, -52.8203125, -50.265625, -47.7109375, -45.15625, -42.6015625, -40.046875, -37.4921875, -34.9375, -32.3828125, -29.828125, -27.2734375, -24.71875, -22.1640625, -19.609375, -17.0546875, -14.5, -11.9453125, -9.390625, -6.8359375, -4.28125, -1.7265625, 0.828125, 3.3828125, 5.9375, 8.4921875, 11.046875, 13.6015625, 16.15625, 18.7109375, 21.265625, 23.8203125, 26.375, 28.9296875, 31.484375, 34.0390625, 36.59375, 39.1484375, 41.703125, 44.2578125, 46.8125, 49.3671875, 51.921875, 54.4765625, 57.03125, 59.5859375, 62.140625, 64.6953125, 67.25, 69.8046875, 72.359375, 74.9140625, 77.46875, 80.0234375, 82.578125, 85.1328125, 87.6875]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 7.0, 14.0, 32.0, 16.0, 13.0, 30.0, 26.0, 42.0, 48.0, 44.0, 53.0, 56.0, 50.0, 44.0, 59.0, 54.0, 51.0, 45.0, 36.0, 41.0, 29.0, 30.0, 26.0, 17.0, 19.0, 22.0, 21.0, 18.0, 3.0, 10.0, 7.0, 7.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.42303466796875, -63.57600021362305, -61.728965759277344, -59.881927490234375, -58.03489303588867, -56.18785858154297, -54.340824127197266, -52.49378967285156, -50.646751403808594, -48.79971694946289, -46.95268249511719, -45.10564422607422, -43.258609771728516, -41.41157531738281, -39.56454086303711, -37.717506408691406, -35.87046813964844, -34.023433685302734, -32.17639923095703, -30.329362869262695, -28.48232650756836, -26.635292053222656, -24.788257598876953, -22.941221237182617, -21.094188690185547, -19.247154235839844, -17.400117874145508, -15.553083419799805, -13.706047058105469, -11.859012603759766, -10.011977195739746, -8.164941787719727, -6.317905426025391, -4.470870018005371, -2.6238348484039307, -0.7767996788024902, 1.0702357292175293, 2.9172706604003906, 4.76430606842041, 6.61134147644043, 8.45837688446045, 10.305412292480469, 12.152447700500488, 13.999483108520508, 15.846517562866211, 17.693553924560547, 19.54058837890625, 21.387622833251953, 23.23465919494629, 25.081693649291992, 26.928730010986328, 28.77576446533203, 30.622800827026367, 32.46983337402344, 34.316871643066406, 36.16390609741211, 38.01094055175781, 39.857975006103516, 41.70500946044922, 43.55204772949219, 45.39908218383789, 47.246116638183594, 49.0931510925293, 50.940185546875, 52.78722381591797]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 5.0, 12.0, 11.0, 12.0, 14.0, 19.0, 23.0, 21.0, 28.0, 32.0, 33.0, 30.0, 28.0, 37.0, 43.0, 36.0, 38.0, 54.0, 46.0, 48.0, 36.0, 23.0, 36.0, 30.0, 29.0, 37.0, 23.0, 35.0, 15.0, 19.0, 26.0, 25.0, 16.0, 14.0, 10.0, 9.0, 2.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.88264846801758, -49.40705871582031, -47.93146896362305, -46.45587921142578, -44.98028564453125, -43.504695892333984, -42.02910614013672, -40.55351638793945, -39.07792663574219, -37.60233688354492, -36.126747131347656, -34.651153564453125, -33.17556381225586, -31.699974060058594, -30.224384307861328, -28.748794555664062, -27.27320098876953, -25.797611236572266, -24.322019577026367, -22.8464298248291, -21.370838165283203, -19.895248413085938, -18.419658660888672, -16.944068908691406, -15.468477249145508, -13.992886543273926, -12.517295837402344, -11.041706085205078, -9.566115379333496, -8.090524673461914, -6.614934921264648, -5.139344215393066, -3.6637496948242188, -2.188159227371216, -0.7125687599182129, 0.7630214691162109, 2.238612174987793, 3.714202880859375, 5.189792633056641, 6.665383338928223, 8.140974044799805, 9.616564750671387, 11.092155456542969, 12.567745208740234, 14.043335914611816, 15.518926620483398, 16.994516372680664, 18.470108032226562, 19.945697784423828, 21.421287536621094, 22.896879196166992, 24.372468948364258, 25.848060607910156, 27.323650360107422, 28.799240112304688, 30.274829864501953, 31.75042152404785, 33.22601318359375, 34.701602935791016, 36.17719268798828, 37.65278244018555, 39.12837219238281, 40.603965759277344, 42.07955551147461, 43.555145263671875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 0.0, 9.0, 13.0, 15.0, 32.0, 58.0, 85.0, 139.0, 202.0, 366.0, 617.0, 961.0, 1654.0, 2701.0, 4324.0, 7131.0, 11835.0, 19698.0, 31826.0, 52893.0, 87757.0, 144813.0, 240014.0, 393268.0, 625653.0, 817063.0, 671117.0, 427333.0, 259498.0, 155774.0, 94216.0, 56348.0, 34108.0, 20619.0, 12445.0, 7630.0, 4643.0, 2879.0, 1673.0, 1125.0, 641.0, 427.0, 252.0, 170.0, 98.0, 57.0, 44.0, 20.0, 18.0, 13.0, 8.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-72.75, -70.291015625, -67.83203125, -65.373046875, -62.9140625, -60.455078125, -57.99609375, -55.537109375, -53.078125, -50.619140625, -48.16015625, -45.701171875, -43.2421875, -40.783203125, -38.32421875, -35.865234375, -33.40625, -30.947265625, -28.48828125, -26.029296875, -23.5703125, -21.111328125, -18.65234375, -16.193359375, -13.734375, -11.275390625, -8.81640625, -6.357421875, -3.8984375, -1.439453125, 1.01953125, 3.478515625, 5.9375, 8.396484375, 10.85546875, 13.314453125, 15.7734375, 18.232421875, 20.69140625, 23.150390625, 25.609375, 28.068359375, 30.52734375, 32.986328125, 35.4453125, 37.904296875, 40.36328125, 42.822265625, 45.28125, 47.740234375, 50.19921875, 52.658203125, 55.1171875, 57.576171875, 60.03515625, 62.494140625, 64.953125, 67.412109375, 69.87109375, 72.330078125, 74.7890625, 77.248046875, 79.70703125, 82.166015625, 84.625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 1.0, 5.0, 6.0, 7.0, 3.0, 7.0, 12.0, 14.0, 11.0, 15.0, 15.0, 30.0, 21.0, 29.0, 36.0, 31.0, 34.0, 33.0, 36.0, 35.0, 47.0, 52.0, 47.0, 48.0, 42.0, 32.0, 32.0, 36.0, 33.0, 37.0, 23.0, 33.0, 36.0, 18.0, 17.0, 16.0, 14.0, 16.0, 10.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.681640625, -40.26953125, -38.857421875, -37.4453125, -36.033203125, -34.62109375, -33.208984375, -31.796875, -30.384765625, -28.97265625, -27.560546875, -26.1484375, -24.736328125, -23.32421875, -21.912109375, -20.5, -19.087890625, -17.67578125, -16.263671875, -14.8515625, -13.439453125, -12.02734375, -10.615234375, -9.203125, -7.791015625, -6.37890625, -4.966796875, -3.5546875, -2.142578125, -0.73046875, 0.681640625, 2.09375, 3.505859375, 4.91796875, 6.330078125, 7.7421875, 9.154296875, 10.56640625, 11.978515625, 13.390625, 14.802734375, 16.21484375, 17.626953125, 19.0390625, 20.451171875, 21.86328125, 23.275390625, 24.6875, 26.099609375, 27.51171875, 28.923828125, 30.3359375, 31.748046875, 33.16015625, 34.572265625, 35.984375, 37.396484375, 38.80859375, 40.220703125, 41.6328125, 43.044921875, 44.45703125, 45.869140625, 47.28125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 19.0, 28.0, 46.0, 57.0, 121.0, 151.0, 266.0, 375.0, 623.0, 993.0, 1590.0, 2507.0, 4097.0, 6662.0, 11216.0, 18623.0, 30088.0, 49947.0, 81719.0, 129107.0, 203494.0, 311466.0, 457373.0, 615137.0, 666599.0, 538384.0, 380723.0, 253529.0, 162996.0, 103030.0, 63514.0, 38639.0, 23834.0, 14575.0, 8728.0, 5461.0, 3263.0, 1994.0, 1229.0, 728.0, 504.0, 309.0, 189.0, 111.0, 83.0, 46.0, 43.0, 26.0, 13.0, 5.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-52.125, -50.5087890625, -48.892578125, -47.2763671875, -45.66015625, -44.0439453125, -42.427734375, -40.8115234375, -39.1953125, -37.5791015625, -35.962890625, -34.3466796875, -32.73046875, -31.1142578125, -29.498046875, -27.8818359375, -26.265625, -24.6494140625, -23.033203125, -21.4169921875, -19.80078125, -18.1845703125, -16.568359375, -14.9521484375, -13.3359375, -11.7197265625, -10.103515625, -8.4873046875, -6.87109375, -5.2548828125, -3.638671875, -2.0224609375, -0.40625, 1.2099609375, 2.826171875, 4.4423828125, 6.05859375, 7.6748046875, 9.291015625, 10.9072265625, 12.5234375, 14.1396484375, 15.755859375, 17.3720703125, 18.98828125, 20.6044921875, 22.220703125, 23.8369140625, 25.453125, 27.0693359375, 28.685546875, 30.3017578125, 31.91796875, 33.5341796875, 35.150390625, 36.7666015625, 38.3828125, 39.9990234375, 41.615234375, 43.2314453125, 44.84765625, 46.4638671875, 48.080078125, 49.6962890625, 51.3125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 9.0, 11.0, 16.0, 17.0, 28.0, 20.0, 34.0, 37.0, 60.0, 69.0, 81.0, 90.0, 101.0, 114.0, 149.0, 167.0, 208.0, 223.0, 194.0, 227.0, 215.0, 214.0, 230.0, 228.0, 201.0, 179.0, 138.0, 119.0, 129.0, 102.0, 83.0, 74.0, 64.0, 43.0, 37.0, 27.0, 27.0, 20.0, 18.0, 19.0, 9.0, 3.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-20.640625, -19.992919921875, -19.34521484375, -18.697509765625, -18.0498046875, -17.402099609375, -16.75439453125, -16.106689453125, -15.458984375, -14.811279296875, -14.16357421875, -13.515869140625, -12.8681640625, -12.220458984375, -11.57275390625, -10.925048828125, -10.27734375, -9.629638671875, -8.98193359375, -8.334228515625, -7.6865234375, -7.038818359375, -6.39111328125, -5.743408203125, -5.095703125, -4.447998046875, -3.80029296875, -3.152587890625, -2.5048828125, -1.857177734375, -1.20947265625, -0.561767578125, 0.0859375, 0.733642578125, 1.38134765625, 2.029052734375, 2.6767578125, 3.324462890625, 3.97216796875, 4.619873046875, 5.267578125, 5.915283203125, 6.56298828125, 7.210693359375, 7.8583984375, 8.506103515625, 9.15380859375, 9.801513671875, 10.44921875, 11.096923828125, 11.74462890625, 12.392333984375, 13.0400390625, 13.687744140625, 14.33544921875, 14.983154296875, 15.630859375, 16.278564453125, 16.92626953125, 17.573974609375, 18.2216796875, 18.869384765625, 19.51708984375, 20.164794921875, 20.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 11.0, 17.0, 10.0, 16.0, 24.0, 29.0, 34.0, 32.0, 45.0, 58.0, 47.0, 58.0, 58.0, 58.0, 55.0, 52.0, 64.0, 52.0, 30.0, 43.0, 32.0, 19.0, 29.0, 29.0, 21.0, 12.0, 8.0, 16.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.025115966796875, -51.130428314208984, -49.23573684692383, -47.34104919433594, -45.44636154174805, -43.551673889160156, -41.656982421875, -39.76229476928711, -37.86760711669922, -35.97291946411133, -34.07822799682617, -32.18354034423828, -30.28885269165039, -28.394163131713867, -26.499473571777344, -24.604785919189453, -22.71009635925293, -20.815406799316406, -18.920719146728516, -17.026029586791992, -15.131341934204102, -13.236652374267578, -11.341963768005371, -9.447275161743164, -7.552586555480957, -5.65789794921875, -3.763209104537964, -1.8685202598571777, 0.026168346405029297, 1.9208574295043945, 3.8155460357666016, 5.710234642028809, 7.604923248291016, 9.499611854553223, 11.39430046081543, 13.288990020751953, 15.183677673339844, 17.078367233276367, 18.97305679321289, 20.86774444580078, 22.762432098388672, 24.657121658325195, 26.551809310913086, 28.44649887084961, 30.3411865234375, 32.235877990722656, 34.13056564331055, 36.02525329589844, 37.919944763183594, 39.814632415771484, 41.70932388305664, 43.60401153564453, 45.49869918823242, 47.39338684082031, 49.28807830810547, 51.18276596069336, 53.07745361328125, 54.97214126586914, 56.8668327331543, 58.76152038574219, 60.65620803833008, 62.55089569091797, 64.44558715820312, 66.34027099609375, 68.2349624633789]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 4.0, 14.0, 8.0, 16.0, 15.0, 23.0, 25.0, 27.0, 20.0, 41.0, 42.0, 39.0, 38.0, 33.0, 45.0, 40.0, 44.0, 42.0, 54.0, 39.0, 33.0, 46.0, 49.0, 27.0, 36.0, 30.0, 19.0, 23.0, 22.0, 15.0, 16.0, 13.0, 10.0, 10.0, 10.0, 6.0, 9.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.110984802246094, -49.5527458190918, -47.9945068359375, -46.4362678527832, -44.878028869628906, -43.319786071777344, -41.76155090332031, -40.20330810546875, -38.64506912231445, -37.086830139160156, -35.52859115600586, -33.97035217285156, -32.412113189697266, -30.853872299194336, -29.29563331604004, -27.73739242553711, -26.179155349731445, -24.62091636657715, -23.06267738342285, -21.504436492919922, -19.946197509765625, -18.387958526611328, -16.82971954345703, -15.271479606628418, -13.713240623474121, -12.155001640319824, -10.596761703491211, -9.038522720336914, -7.480283260345459, -5.922043800354004, -4.363804817199707, -2.8055648803710938, -1.2473258972167969, 0.31091344356536865, 1.8691527843475342, 3.42739200592041, 4.985631465911865, 6.54387092590332, 8.102109909057617, 9.66034984588623, 11.218588829040527, 12.776827812194824, 14.335067749023438, 15.893306732177734, 17.45154571533203, 19.009784698486328, 20.568023681640625, 22.126264572143555, 23.68450355529785, 25.24274253845215, 26.800981521606445, 28.359222412109375, 29.917461395263672, 31.47570037841797, 33.033939361572266, 34.59217834472656, 36.15041732788086, 37.708656311035156, 39.26689529418945, 40.82513427734375, 42.38337326049805, 43.941612243652344, 45.499855041503906, 47.0580940246582, 48.6163330078125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 15.0, 23.0, 32.0, 44.0, 73.0, 96.0, 157.0, 248.0, 396.0, 589.0, 920.0, 1469.0, 2392.0, 3856.0, 6127.0, 10113.0, 16022.0, 25536.0, 41061.0, 64380.0, 99191.0, 141595.0, 167529.0, 152642.0, 112334.0, 74454.0, 47626.0, 30105.0, 18746.0, 11643.0, 7161.0, 4525.0, 2804.0, 1726.0, 1059.0, 675.0, 424.0, 261.0, 175.0, 113.0, 71.0, 50.0, 39.0, 16.0, 19.0, 14.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.77734375, -65.4921875, -63.20703125, -60.921875, -58.63671875, -56.3515625, -54.06640625, -51.78125, -49.49609375, -47.2109375, -44.92578125, -42.640625, -40.35546875, -38.0703125, -35.78515625, -33.5, -31.21484375, -28.9296875, -26.64453125, -24.359375, -22.07421875, -19.7890625, -17.50390625, -15.21875, -12.93359375, -10.6484375, -8.36328125, -6.078125, -3.79296875, -1.5078125, 0.77734375, 3.0625, 5.34765625, 7.6328125, 9.91796875, 12.203125, 14.48828125, 16.7734375, 19.05859375, 21.34375, 23.62890625, 25.9140625, 28.19921875, 30.484375, 32.76953125, 35.0546875, 37.33984375, 39.625, 41.91015625, 44.1953125, 46.48046875, 48.765625, 51.05078125, 53.3359375, 55.62109375, 57.90625, 60.19140625, 62.4765625, 64.76171875, 67.046875, 69.33203125, 71.6171875, 73.90234375, 76.1875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 14.0, 15.0, 15.0, 19.0, 25.0, 32.0, 34.0, 38.0, 37.0, 34.0, 42.0, 49.0, 42.0, 35.0, 37.0, 38.0, 48.0, 39.0, 32.0, 42.0, 44.0, 43.0, 29.0, 43.0, 24.0, 24.0, 15.0, 15.0, 17.0, 6.0, 12.0, 8.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.8125, -47.40771484375, -46.0029296875, -44.59814453125, -43.193359375, -41.78857421875, -40.3837890625, -38.97900390625, -37.57421875, -36.16943359375, -34.7646484375, -33.35986328125, -31.955078125, -30.55029296875, -29.1455078125, -27.74072265625, -26.3359375, -24.93115234375, -23.5263671875, -22.12158203125, -20.716796875, -19.31201171875, -17.9072265625, -16.50244140625, -15.09765625, -13.69287109375, -12.2880859375, -10.88330078125, -9.478515625, -8.07373046875, -6.6689453125, -5.26416015625, -3.859375, -2.45458984375, -1.0498046875, 0.35498046875, 1.759765625, 3.16455078125, 4.5693359375, 5.97412109375, 7.37890625, 8.78369140625, 10.1884765625, 11.59326171875, 12.998046875, 14.40283203125, 15.8076171875, 17.21240234375, 18.6171875, 20.02197265625, 21.4267578125, 22.83154296875, 24.236328125, 25.64111328125, 27.0458984375, 28.45068359375, 29.85546875, 31.26025390625, 32.6650390625, 34.06982421875, 35.474609375, 36.87939453125, 38.2841796875, 39.68896484375, 41.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 4.0, 14.0, 13.0, 26.0, 37.0, 72.0, 92.0, 107.0, 181.0, 215.0, 342.0, 490.0, 779.0, 1210.0, 1768.0, 2678.0, 4109.0, 6199.0, 10165.0, 15909.0, 25812.0, 43268.0, 75312.0, 130976.0, 204790.0, 204443.0, 131067.0, 75118.0, 43207.0, 25931.0, 15873.0, 9891.0, 6455.0, 4074.0, 2661.0, 1782.0, 1066.0, 750.0, 507.0, 349.0, 232.0, 181.0, 118.0, 96.0, 60.0, 39.0, 27.0, 21.0, 17.0, 7.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-86.1875, -83.4072265625, -80.626953125, -77.8466796875, -75.06640625, -72.2861328125, -69.505859375, -66.7255859375, -63.9453125, -61.1650390625, -58.384765625, -55.6044921875, -52.82421875, -50.0439453125, -47.263671875, -44.4833984375, -41.703125, -38.9228515625, -36.142578125, -33.3623046875, -30.58203125, -27.8017578125, -25.021484375, -22.2412109375, -19.4609375, -16.6806640625, -13.900390625, -11.1201171875, -8.33984375, -5.5595703125, -2.779296875, 0.0009765625, 2.78125, 5.5615234375, 8.341796875, 11.1220703125, 13.90234375, 16.6826171875, 19.462890625, 22.2431640625, 25.0234375, 27.8037109375, 30.583984375, 33.3642578125, 36.14453125, 38.9248046875, 41.705078125, 44.4853515625, 47.265625, 50.0458984375, 52.826171875, 55.6064453125, 58.38671875, 61.1669921875, 63.947265625, 66.7275390625, 69.5078125, 72.2880859375, 75.068359375, 77.8486328125, 80.62890625, 83.4091796875, 86.189453125, 88.9697265625, 91.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 8.0, 10.0, 6.0, 14.0, 21.0, 14.0, 15.0, 21.0, 18.0, 24.0, 30.0, 26.0, 31.0, 26.0, 41.0, 39.0, 43.0, 35.0, 50.0, 42.0, 52.0, 41.0, 33.0, 35.0, 45.0, 37.0, 33.0, 28.0, 22.0, 29.0, 28.0, 17.0, 15.0, 15.0, 14.0, 13.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.953125, -28.998046875, -28.04296875, -27.087890625, -26.1328125, -25.177734375, -24.22265625, -23.267578125, -22.3125, -21.357421875, -20.40234375, -19.447265625, -18.4921875, -17.537109375, -16.58203125, -15.626953125, -14.671875, -13.716796875, -12.76171875, -11.806640625, -10.8515625, -9.896484375, -8.94140625, -7.986328125, -7.03125, -6.076171875, -5.12109375, -4.166015625, -3.2109375, -2.255859375, -1.30078125, -0.345703125, 0.609375, 1.564453125, 2.51953125, 3.474609375, 4.4296875, 5.384765625, 6.33984375, 7.294921875, 8.25, 9.205078125, 10.16015625, 11.115234375, 12.0703125, 13.025390625, 13.98046875, 14.935546875, 15.890625, 16.845703125, 17.80078125, 18.755859375, 19.7109375, 20.666015625, 21.62109375, 22.576171875, 23.53125, 24.486328125, 25.44140625, 26.396484375, 27.3515625, 28.306640625, 29.26171875, 30.216796875, 31.171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 11.0, 20.0, 20.0, 33.0, 32.0, 59.0, 86.0, 143.0, 202.0, 262.0, 384.0, 597.0, 883.0, 1433.0, 2373.0, 3931.0, 7266.0, 13785.0, 28084.0, 61056.0, 138088.0, 277547.0, 267570.0, 130051.0, 57779.0, 26888.0, 12982.0, 6872.0, 3877.0, 2180.0, 1405.0, 841.0, 563.0, 378.0, 267.0, 187.0, 110.0, 96.0, 58.0, 41.0, 33.0, 25.0, 12.0, 11.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.40625, -50.6572265625, -48.908203125, -47.1591796875, -45.41015625, -43.6611328125, -41.912109375, -40.1630859375, -38.4140625, -36.6650390625, -34.916015625, -33.1669921875, -31.41796875, -29.6689453125, -27.919921875, -26.1708984375, -24.421875, -22.6728515625, -20.923828125, -19.1748046875, -17.42578125, -15.6767578125, -13.927734375, -12.1787109375, -10.4296875, -8.6806640625, -6.931640625, -5.1826171875, -3.43359375, -1.6845703125, 0.064453125, 1.8134765625, 3.5625, 5.3115234375, 7.060546875, 8.8095703125, 10.55859375, 12.3076171875, 14.056640625, 15.8056640625, 17.5546875, 19.3037109375, 21.052734375, 22.8017578125, 24.55078125, 26.2998046875, 28.048828125, 29.7978515625, 31.546875, 33.2958984375, 35.044921875, 36.7939453125, 38.54296875, 40.2919921875, 42.041015625, 43.7900390625, 45.5390625, 47.2880859375, 49.037109375, 50.7861328125, 52.53515625, 54.2841796875, 56.033203125, 57.7822265625, 59.53125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 2.0, 5.0, 7.0, 10.0, 12.0, 20.0, 31.0, 35.0, 71.0, 92.0, 128.0, 149.0, 134.0, 93.0, 67.0, 39.0, 30.0, 19.0, 11.0, 8.0, 7.0, 7.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007198333740234375, -0.007005929946899414, -0.006813526153564453, -0.006621122360229492, -0.006428718566894531, -0.00623631477355957, -0.006043910980224609, -0.0058515071868896484, -0.0056591033935546875, -0.0054666996002197266, -0.005274295806884766, -0.005081892013549805, -0.004889488220214844, -0.004697084426879883, -0.004504680633544922, -0.004312276840209961, -0.004119873046875, -0.003927469253540039, -0.003735065460205078, -0.003542661666870117, -0.0033502578735351562, -0.0031578540802001953, -0.0029654502868652344, -0.0027730464935302734, -0.0025806427001953125, -0.0023882389068603516, -0.0021958351135253906, -0.0020034313201904297, -0.0018110275268554688, -0.0016186237335205078, -0.0014262199401855469, -0.001233816146850586, -0.001041412353515625, -0.0008490085601806641, -0.0006566047668457031, -0.0004642009735107422, -0.00027179718017578125, -7.939338684082031e-05, 0.00011301040649414062, 0.00030541419982910156, 0.0004978179931640625, 0.0006902217864990234, 0.0008826255798339844, 0.0010750293731689453, 0.0012674331665039062, 0.0014598369598388672, 0.0016522407531738281, 0.001844644546508789, 0.00203704833984375, 0.002229452133178711, 0.002421855926513672, 0.002614259719848633, 0.0028066635131835938, 0.0029990673065185547, 0.0031914710998535156, 0.0033838748931884766, 0.0035762786865234375, 0.0037686824798583984, 0.003961086273193359, 0.00415349006652832, 0.004345893859863281, 0.004538297653198242, 0.004730701446533203, 0.004923105239868164, 0.005115509033203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 10.0, 10.0, 10.0, 17.0, 18.0, 31.0, 41.0, 45.0, 82.0, 104.0, 154.0, 186.0, 235.0, 395.0, 515.0, 709.0, 1013.0, 1583.0, 2290.0, 3754.0, 6352.0, 11129.0, 20777.0, 42057.0, 85285.0, 160447.0, 234828.0, 212059.0, 127680.0, 64996.0, 31925.0, 16417.0, 8811.0, 5042.0, 3152.0, 1983.0, 1323.0, 885.0, 655.0, 410.0, 332.0, 203.0, 171.0, 125.0, 97.0, 60.0, 42.0, 39.0, 30.0, 17.0, 8.0, 5.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-58.9375, -57.08447265625, -55.2314453125, -53.37841796875, -51.525390625, -49.67236328125, -47.8193359375, -45.96630859375, -44.11328125, -42.26025390625, -40.4072265625, -38.55419921875, -36.701171875, -34.84814453125, -32.9951171875, -31.14208984375, -29.2890625, -27.43603515625, -25.5830078125, -23.72998046875, -21.876953125, -20.02392578125, -18.1708984375, -16.31787109375, -14.46484375, -12.61181640625, -10.7587890625, -8.90576171875, -7.052734375, -5.19970703125, -3.3466796875, -1.49365234375, 0.359375, 2.21240234375, 4.0654296875, 5.91845703125, 7.771484375, 9.62451171875, 11.4775390625, 13.33056640625, 15.18359375, 17.03662109375, 18.8896484375, 20.74267578125, 22.595703125, 24.44873046875, 26.3017578125, 28.15478515625, 30.0078125, 31.86083984375, 33.7138671875, 35.56689453125, 37.419921875, 39.27294921875, 41.1259765625, 42.97900390625, 44.83203125, 46.68505859375, 48.5380859375, 50.39111328125, 52.244140625, 54.09716796875, 55.9501953125, 57.80322265625, 59.65625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 7.0, 5.0, 5.0, 7.0, 13.0, 11.0, 16.0, 29.0, 38.0, 46.0, 65.0, 78.0, 77.0, 69.0, 91.0, 65.0, 74.0, 53.0, 55.0, 46.0, 34.0, 33.0, 23.0, 14.0, 7.0, 7.0, 8.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.684326171875, -22.99365234375, -22.302978515625, -21.6123046875, -20.921630859375, -20.23095703125, -19.540283203125, -18.849609375, -18.158935546875, -17.46826171875, -16.777587890625, -16.0869140625, -15.396240234375, -14.70556640625, -14.014892578125, -13.32421875, -12.633544921875, -11.94287109375, -11.252197265625, -10.5615234375, -9.870849609375, -9.18017578125, -8.489501953125, -7.798828125, -7.108154296875, -6.41748046875, -5.726806640625, -5.0361328125, -4.345458984375, -3.65478515625, -2.964111328125, -2.2734375, -1.582763671875, -0.89208984375, -0.201416015625, 0.4892578125, 1.179931640625, 1.87060546875, 2.561279296875, 3.251953125, 3.942626953125, 4.63330078125, 5.323974609375, 6.0146484375, 6.705322265625, 7.39599609375, 8.086669921875, 8.77734375, 9.468017578125, 10.15869140625, 10.849365234375, 11.5400390625, 12.230712890625, 12.92138671875, 13.612060546875, 14.302734375, 14.993408203125, 15.68408203125, 16.374755859375, 17.0654296875, 17.756103515625, 18.44677734375, 19.137451171875, 19.828125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 11.0, 12.0, 8.0, 20.0, 20.0, 27.0, 36.0, 38.0, 47.0, 42.0, 46.0, 48.0, 54.0, 59.0, 65.0, 41.0, 61.0, 45.0, 43.0, 37.0, 24.0, 37.0, 33.0, 20.0, 19.0, 16.0, 11.0, 14.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.323360443115234, -46.77022171020508, -45.21708297729492, -43.663944244384766, -42.110809326171875, -40.55767059326172, -39.00453186035156, -37.451393127441406, -35.89825439453125, -34.345115661621094, -32.79197692871094, -31.238840103149414, -29.685701370239258, -28.1325626373291, -26.579425811767578, -25.026287078857422, -23.473148345947266, -21.92000961303711, -20.366870880126953, -18.81373405456543, -17.260595321655273, -15.707456588745117, -14.154318809509277, -12.601181030273438, -11.048042297363281, -9.494903564453125, -7.941765785217285, -6.388627529144287, -4.835489273071289, -3.282351016998291, -1.729212760925293, -0.17607498168945312, 1.3770599365234375, 2.9301981925964355, 4.483336448669434, 6.036474704742432, 7.58961296081543, 9.142751693725586, 10.695889472961426, 12.249027252197266, 13.802165985107422, 15.355304718017578, 16.908443450927734, 18.461580276489258, 20.014719009399414, 21.56785774230957, 23.120994567871094, 24.67413330078125, 26.227272033691406, 27.780410766601562, 29.33354949951172, 30.886686325073242, 32.43982696533203, 33.99296188354492, 35.54610061645508, 37.099239349365234, 38.65237808227539, 40.20551681518555, 41.7586555480957, 43.31179428100586, 44.86492919921875, 46.418067932128906, 47.97120666503906, 49.52434539794922, 51.077484130859375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 12.0, 10.0, 15.0, 15.0, 21.0, 18.0, 23.0, 28.0, 28.0, 33.0, 41.0, 38.0, 45.0, 24.0, 31.0, 42.0, 44.0, 43.0, 41.0, 43.0, 40.0, 39.0, 28.0, 46.0, 32.0, 21.0, 26.0, 21.0, 26.0, 19.0, 18.0, 10.0, 11.0, 10.0, 9.0, 13.0, 7.0, 8.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.124786376953125, -38.834556579589844, -37.54433059692383, -36.25410079956055, -34.963871002197266, -33.67364501953125, -32.38341522216797, -31.093185424804688, -29.80295753479004, -28.51272964477539, -27.22249984741211, -25.93227195739746, -24.642044067382812, -23.35181427001953, -22.061586380004883, -20.771358489990234, -19.481128692626953, -18.190900802612305, -16.900671005249023, -15.610443115234375, -14.32021427154541, -13.029985427856445, -11.739757537841797, -10.449528694152832, -9.159299850463867, -7.869071006774902, -6.578842639923096, -5.288614273071289, -3.998385429382324, -2.7081565856933594, -1.4179282188415527, -0.1276998519897461, 1.1625289916992188, 2.4527575969696045, 3.7429862022399902, 5.033214569091797, 6.323443412780762, 7.613672256469727, 8.903900146484375, 10.19412899017334, 11.484357833862305, 12.77458667755127, 14.064815521240234, 15.355043411254883, 16.64527130126953, 17.935501098632812, 19.22572898864746, 20.51595687866211, 21.80618667602539, 23.09641456604004, 24.38664436340332, 25.67687225341797, 26.96710205078125, 28.2573299407959, 29.547557830810547, 30.837787628173828, 32.128013610839844, 33.418243408203125, 34.70846939086914, 35.99869918823242, 37.2889289855957, 38.57915496826172, 39.869384765625, 41.15961456298828, 42.44984436035156]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 10.0, 22.0, 25.0, 34.0, 65.0, 92.0, 124.0, 219.0, 334.0, 530.0, 757.0, 1176.0, 1829.0, 2873.0, 4350.0, 6533.0, 9795.0, 14543.0, 21615.0, 30894.0, 43421.0, 58789.0, 77051.0, 95229.0, 109021.0, 113198.0, 106108.0, 91761.0, 73891.0, 55727.0, 40390.0, 28460.0, 19735.0, 13406.0, 8986.0, 6073.0, 3986.0, 2581.0, 1672.0, 1154.0, 748.0, 475.0, 305.0, 220.0, 132.0, 79.0, 54.0, 33.0, 20.0, 12.0, 11.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.71875, -44.16357421875, -42.6083984375, -41.05322265625, -39.498046875, -37.94287109375, -36.3876953125, -34.83251953125, -33.27734375, -31.72216796875, -30.1669921875, -28.61181640625, -27.056640625, -25.50146484375, -23.9462890625, -22.39111328125, -20.8359375, -19.28076171875, -17.7255859375, -16.17041015625, -14.615234375, -13.06005859375, -11.5048828125, -9.94970703125, -8.39453125, -6.83935546875, -5.2841796875, -3.72900390625, -2.173828125, -0.61865234375, 0.9365234375, 2.49169921875, 4.046875, 5.60205078125, 7.1572265625, 8.71240234375, 10.267578125, 11.82275390625, 13.3779296875, 14.93310546875, 16.48828125, 18.04345703125, 19.5986328125, 21.15380859375, 22.708984375, 24.26416015625, 25.8193359375, 27.37451171875, 28.9296875, 30.48486328125, 32.0400390625, 33.59521484375, 35.150390625, 36.70556640625, 38.2607421875, 39.81591796875, 41.37109375, 42.92626953125, 44.4814453125, 46.03662109375, 47.591796875, 49.14697265625, 50.7021484375, 52.25732421875, 53.8125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 11.0, 13.0, 16.0, 22.0, 24.0, 27.0, 23.0, 20.0, 42.0, 39.0, 32.0, 40.0, 30.0, 41.0, 36.0, 47.0, 40.0, 41.0, 43.0, 38.0, 33.0, 43.0, 28.0, 36.0, 25.0, 20.0, 30.0, 18.0, 23.0, 15.0, 20.0, 11.0, 9.0, 9.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.71875, -39.4833984375, -38.248046875, -37.0126953125, -35.77734375, -34.5419921875, -33.306640625, -32.0712890625, -30.8359375, -29.6005859375, -28.365234375, -27.1298828125, -25.89453125, -24.6591796875, -23.423828125, -22.1884765625, -20.953125, -19.7177734375, -18.482421875, -17.2470703125, -16.01171875, -14.7763671875, -13.541015625, -12.3056640625, -11.0703125, -9.8349609375, -8.599609375, -7.3642578125, -6.12890625, -4.8935546875, -3.658203125, -2.4228515625, -1.1875, 0.0478515625, 1.283203125, 2.5185546875, 3.75390625, 4.9892578125, 6.224609375, 7.4599609375, 8.6953125, 9.9306640625, 11.166015625, 12.4013671875, 13.63671875, 14.8720703125, 16.107421875, 17.3427734375, 18.578125, 19.8134765625, 21.048828125, 22.2841796875, 23.51953125, 24.7548828125, 25.990234375, 27.2255859375, 28.4609375, 29.6962890625, 30.931640625, 32.1669921875, 33.40234375, 34.6376953125, 35.873046875, 37.1083984375, 38.34375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 12.0, 17.0, 24.0, 33.0, 55.0, 71.0, 142.0, 207.0, 381.0, 584.0, 1000.0, 1550.0, 2660.0, 4235.0, 6869.0, 10683.0, 16924.0, 26056.0, 39306.0, 56705.0, 77478.0, 99242.0, 116452.0, 122375.0, 116808.0, 100090.0, 78909.0, 57618.0, 39550.0, 26481.0, 17060.0, 10829.0, 6885.0, 4226.0, 2632.0, 1666.0, 1041.0, 657.0, 371.0, 259.0, 138.0, 121.0, 67.0, 30.0, 17.0, 20.0, 7.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.09375, -47.5361328125, -45.978515625, -44.4208984375, -42.86328125, -41.3056640625, -39.748046875, -38.1904296875, -36.6328125, -35.0751953125, -33.517578125, -31.9599609375, -30.40234375, -28.8447265625, -27.287109375, -25.7294921875, -24.171875, -22.6142578125, -21.056640625, -19.4990234375, -17.94140625, -16.3837890625, -14.826171875, -13.2685546875, -11.7109375, -10.1533203125, -8.595703125, -7.0380859375, -5.48046875, -3.9228515625, -2.365234375, -0.8076171875, 0.75, 2.3076171875, 3.865234375, 5.4228515625, 6.98046875, 8.5380859375, 10.095703125, 11.6533203125, 13.2109375, 14.7685546875, 16.326171875, 17.8837890625, 19.44140625, 20.9990234375, 22.556640625, 24.1142578125, 25.671875, 27.2294921875, 28.787109375, 30.3447265625, 31.90234375, 33.4599609375, 35.017578125, 36.5751953125, 38.1328125, 39.6904296875, 41.248046875, 42.8056640625, 44.36328125, 45.9208984375, 47.478515625, 49.0361328125, 50.59375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 8.0, 14.0, 14.0, 14.0, 30.0, 31.0, 35.0, 38.0, 36.0, 41.0, 46.0, 42.0, 48.0, 41.0, 44.0, 33.0, 47.0, 41.0, 41.0, 44.0, 39.0, 32.0, 28.0, 21.0, 25.0, 21.0, 24.0, 12.0, 14.0, 12.0, 9.0, 13.0, 10.0, 8.0, 4.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.7744140625, -24.892578125, -24.0107421875, -23.12890625, -22.2470703125, -21.365234375, -20.4833984375, -19.6015625, -18.7197265625, -17.837890625, -16.9560546875, -16.07421875, -15.1923828125, -14.310546875, -13.4287109375, -12.546875, -11.6650390625, -10.783203125, -9.9013671875, -9.01953125, -8.1376953125, -7.255859375, -6.3740234375, -5.4921875, -4.6103515625, -3.728515625, -2.8466796875, -1.96484375, -1.0830078125, -0.201171875, 0.6806640625, 1.5625, 2.4443359375, 3.326171875, 4.2080078125, 5.08984375, 5.9716796875, 6.853515625, 7.7353515625, 8.6171875, 9.4990234375, 10.380859375, 11.2626953125, 12.14453125, 13.0263671875, 13.908203125, 14.7900390625, 15.671875, 16.5537109375, 17.435546875, 18.3173828125, 19.19921875, 20.0810546875, 20.962890625, 21.8447265625, 22.7265625, 23.6083984375, 24.490234375, 25.3720703125, 26.25390625, 27.1357421875, 28.017578125, 28.8994140625, 29.78125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 10.0, 12.0, 10.0, 20.0, 24.0, 26.0, 50.0, 82.0, 110.0, 180.0, 264.0, 447.0, 674.0, 1102.0, 1866.0, 3084.0, 5350.0, 9154.0, 16577.0, 30117.0, 55293.0, 96902.0, 152385.0, 191425.0, 180564.0, 128160.0, 76956.0, 43129.0, 23697.0, 12963.0, 7333.0, 4182.0, 2379.0, 1464.0, 902.0, 575.0, 379.0, 247.0, 132.0, 99.0, 74.0, 42.0, 34.0, 27.0, 17.0, 13.0, 7.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.4375, -31.4775390625, -30.517578125, -29.5576171875, -28.59765625, -27.6376953125, -26.677734375, -25.7177734375, -24.7578125, -23.7978515625, -22.837890625, -21.8779296875, -20.91796875, -19.9580078125, -18.998046875, -18.0380859375, -17.078125, -16.1181640625, -15.158203125, -14.1982421875, -13.23828125, -12.2783203125, -11.318359375, -10.3583984375, -9.3984375, -8.4384765625, -7.478515625, -6.5185546875, -5.55859375, -4.5986328125, -3.638671875, -2.6787109375, -1.71875, -0.7587890625, 0.201171875, 1.1611328125, 2.12109375, 3.0810546875, 4.041015625, 5.0009765625, 5.9609375, 6.9208984375, 7.880859375, 8.8408203125, 9.80078125, 10.7607421875, 11.720703125, 12.6806640625, 13.640625, 14.6005859375, 15.560546875, 16.5205078125, 17.48046875, 18.4404296875, 19.400390625, 20.3603515625, 21.3203125, 22.2802734375, 23.240234375, 24.2001953125, 25.16015625, 26.1201171875, 27.080078125, 28.0400390625, 29.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 8.0, 7.0, 12.0, 14.0, 33.0, 21.0, 35.0, 44.0, 51.0, 63.0, 73.0, 79.0, 72.0, 90.0, 71.0, 64.0, 51.0, 49.0, 34.0, 33.0, 18.0, 21.0, 14.0, 11.0, 7.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00359344482421875, -0.0034618377685546875, -0.003330230712890625, -0.0031986236572265625, -0.0030670166015625, -0.0029354095458984375, -0.002803802490234375, -0.0026721954345703125, -0.00254058837890625, -0.0024089813232421875, -0.002277374267578125, -0.0021457672119140625, -0.00201416015625, -0.0018825531005859375, -0.001750946044921875, -0.0016193389892578125, -0.00148773193359375, -0.0013561248779296875, -0.001224517822265625, -0.0010929107666015625, -0.0009613037109375, -0.0008296966552734375, -0.000698089599609375, -0.0005664825439453125, -0.00043487548828125, -0.0003032684326171875, -0.000171661376953125, -4.00543212890625e-05, 9.1552734375e-05, 0.0002231597900390625, 0.000354766845703125, 0.0004863739013671875, 0.00061798095703125, 0.0007495880126953125, 0.000881195068359375, 0.0010128021240234375, 0.0011444091796875, 0.0012760162353515625, 0.001407623291015625, 0.0015392303466796875, 0.00167083740234375, 0.0018024444580078125, 0.001934051513671875, 0.0020656585693359375, 0.002197265625, 0.0023288726806640625, 0.002460479736328125, 0.0025920867919921875, 0.00272369384765625, 0.0028553009033203125, 0.002986907958984375, 0.0031185150146484375, 0.0032501220703125, 0.0033817291259765625, 0.003513336181640625, 0.0036449432373046875, 0.00377655029296875, 0.0039081573486328125, 0.004039764404296875, 0.0041713714599609375, 0.004302978515625, 0.0044345855712890625, 0.004566192626953125, 0.0046977996826171875, 0.00482940673828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 9.0, 9.0, 11.0, 17.0, 22.0, 55.0, 66.0, 91.0, 177.0, 327.0, 505.0, 915.0, 1496.0, 2697.0, 4865.0, 8771.0, 15906.0, 28275.0, 50341.0, 86621.0, 137645.0, 181689.0, 182552.0, 138966.0, 88788.0, 51775.0, 29160.0, 16305.0, 8878.0, 4953.0, 2863.0, 1590.0, 904.0, 521.0, 327.0, 165.0, 112.0, 67.0, 41.0, 28.0, 19.0, 14.0, 6.0, 8.0, 8.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.0625, -30.175537109375, -29.28857421875, -28.401611328125, -27.5146484375, -26.627685546875, -25.74072265625, -24.853759765625, -23.966796875, -23.079833984375, -22.19287109375, -21.305908203125, -20.4189453125, -19.531982421875, -18.64501953125, -17.758056640625, -16.87109375, -15.984130859375, -15.09716796875, -14.210205078125, -13.3232421875, -12.436279296875, -11.54931640625, -10.662353515625, -9.775390625, -8.888427734375, -8.00146484375, -7.114501953125, -6.2275390625, -5.340576171875, -4.45361328125, -3.566650390625, -2.6796875, -1.792724609375, -0.90576171875, -0.018798828125, 0.8681640625, 1.755126953125, 2.64208984375, 3.529052734375, 4.416015625, 5.302978515625, 6.18994140625, 7.076904296875, 7.9638671875, 8.850830078125, 9.73779296875, 10.624755859375, 11.51171875, 12.398681640625, 13.28564453125, 14.172607421875, 15.0595703125, 15.946533203125, 16.83349609375, 17.720458984375, 18.607421875, 19.494384765625, 20.38134765625, 21.268310546875, 22.1552734375, 23.042236328125, 23.92919921875, 24.816162109375, 25.703125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 4.0, 16.0, 8.0, 6.0, 13.0, 16.0, 21.0, 23.0, 23.0, 21.0, 35.0, 32.0, 36.0, 44.0, 38.0, 39.0, 41.0, 51.0, 39.0, 51.0, 38.0, 43.0, 27.0, 34.0, 37.0, 34.0, 18.0, 31.0, 19.0, 17.0, 21.0, 25.0, 17.0, 6.0, 13.0, 15.0, 7.0, 7.0, 1.0, 8.0, 1.0, 4.0, 4.0, 4.0, 3.0, 2.0], "bins": [-8.2265625, -8.0003662109375, -7.774169921875, -7.5479736328125, -7.32177734375, -7.0955810546875, -6.869384765625, -6.6431884765625, -6.4169921875, -6.1907958984375, -5.964599609375, -5.7384033203125, -5.51220703125, -5.2860107421875, -5.059814453125, -4.8336181640625, -4.607421875, -4.3812255859375, -4.155029296875, -3.9288330078125, -3.70263671875, -3.4764404296875, -3.250244140625, -3.0240478515625, -2.7978515625, -2.5716552734375, -2.345458984375, -2.1192626953125, -1.89306640625, -1.6668701171875, -1.440673828125, -1.2144775390625, -0.98828125, -0.7620849609375, -0.535888671875, -0.3096923828125, -0.08349609375, 0.1427001953125, 0.368896484375, 0.5950927734375, 0.8212890625, 1.0474853515625, 1.273681640625, 1.4998779296875, 1.72607421875, 1.9522705078125, 2.178466796875, 2.4046630859375, 2.630859375, 2.8570556640625, 3.083251953125, 3.3094482421875, 3.53564453125, 3.7618408203125, 3.988037109375, 4.2142333984375, 4.4404296875, 4.6666259765625, 4.892822265625, 5.1190185546875, 5.34521484375, 5.5714111328125, 5.797607421875, 6.0238037109375, 6.25]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 8.0, 10.0, 12.0, 20.0, 17.0, 18.0, 20.0, 28.0, 35.0, 45.0, 50.0, 37.0, 49.0, 40.0, 51.0, 52.0, 53.0, 64.0, 46.0, 40.0, 44.0, 38.0, 37.0, 25.0, 31.0, 29.0, 13.0, 15.0, 9.0, 15.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.981536865234375, -49.49579620361328, -48.01005554199219, -46.524314880371094, -45.03857421875, -43.55283737182617, -42.06709671020508, -40.581356048583984, -39.09561538696289, -37.6098747253418, -36.1241340637207, -34.63839340209961, -33.15265655517578, -31.666913986206055, -30.181175231933594, -28.6954345703125, -27.209693908691406, -25.723953247070312, -24.23821258544922, -22.752473831176758, -21.266733169555664, -19.78099250793457, -18.29525375366211, -16.809513092041016, -15.323772430419922, -13.838031768798828, -12.35229206085205, -10.866552352905273, -9.38081169128418, -7.895071506500244, -6.409331321716309, -4.923591613769531, -3.4378509521484375, -1.952110767364502, -0.4663705825805664, 1.0193696022033691, 2.5051097869873047, 3.9908499717712402, 5.476590156555176, 6.962329864501953, 8.448070526123047, 9.93381118774414, 11.419550895690918, 12.905290603637695, 14.391031265258789, 15.876771926879883, 17.362510681152344, 18.848251342773438, 20.33399200439453, 21.819732666015625, 23.30547332763672, 24.79121208190918, 26.276952743530273, 27.762693405151367, 29.248432159423828, 30.734172821044922, 32.219913482666016, 33.70565414428711, 35.1913948059082, 36.6771354675293, 38.162872314453125, 39.64861297607422, 41.13435363769531, 42.620094299316406, 44.1058349609375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 15.0, 15.0, 10.0, 17.0, 14.0, 19.0, 20.0, 21.0, 11.0, 29.0, 25.0, 35.0, 36.0, 45.0, 39.0, 41.0, 36.0, 40.0, 28.0, 41.0, 46.0, 40.0, 32.0, 33.0, 40.0, 33.0, 32.0, 22.0, 26.0, 22.0, 22.0, 20.0, 19.0, 11.0, 11.0, 7.0, 8.0, 8.0, 6.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.29981994628906, -37.08195495605469, -35.86408615112305, -34.64622116088867, -33.42835235595703, -32.210487365722656, -30.99262237548828, -29.774755477905273, -28.556888580322266, -27.339021682739258, -26.12115478515625, -24.903289794921875, -23.685422897338867, -22.46755599975586, -21.249691009521484, -20.031824111938477, -18.81395721435547, -17.59609031677246, -16.378223419189453, -15.160358428955078, -13.94249153137207, -12.724624633789062, -11.506758689880371, -10.28889274597168, -9.071025848388672, -7.853159427642822, -6.635293006896973, -5.417426586151123, -4.199560165405273, -2.981693744659424, -1.7638273239135742, -0.5459613800048828, 0.6719093322753906, 1.8897757530212402, 3.10764217376709, 4.3255085945129395, 5.543375015258789, 6.761241436004639, 7.979107856750488, 9.19697380065918, 10.414840698242188, 11.632707595825195, 12.850573539733887, 14.068439483642578, 15.286306381225586, 16.504173278808594, 17.72203826904297, 18.939905166625977, 20.157772064208984, 21.375638961791992, 22.593505859375, 23.811370849609375, 25.029237747192383, 26.24710464477539, 27.464969635009766, 28.682836532592773, 29.90070343017578, 31.11857032775879, 32.3364372253418, 33.55430221557617, 34.77217102050781, 35.99003601074219, 37.20790100097656, 38.42576599121094, 39.64363479614258]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 7.0, 14.0, 14.0, 27.0, 32.0, 53.0, 98.0, 152.0, 244.0, 431.0, 643.0, 972.0, 1822.0, 2874.0, 4797.0, 7849.0, 12910.0, 21224.0, 35494.0, 59015.0, 97620.0, 162853.0, 274503.0, 456357.0, 697170.0, 792942.0, 609792.0, 381767.0, 229022.0, 136434.0, 81559.0, 49406.0, 29688.0, 18009.0, 11093.0, 6715.0, 4018.0, 2559.0, 1595.0, 933.0, 577.0, 393.0, 223.0, 150.0, 98.0, 65.0, 23.0, 21.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.21875, -46.57373046875, -44.9287109375, -43.28369140625, -41.638671875, -39.99365234375, -38.3486328125, -36.70361328125, -35.05859375, -33.41357421875, -31.7685546875, -30.12353515625, -28.478515625, -26.83349609375, -25.1884765625, -23.54345703125, -21.8984375, -20.25341796875, -18.6083984375, -16.96337890625, -15.318359375, -13.67333984375, -12.0283203125, -10.38330078125, -8.73828125, -7.09326171875, -5.4482421875, -3.80322265625, -2.158203125, -0.51318359375, 1.1318359375, 2.77685546875, 4.421875, 6.06689453125, 7.7119140625, 9.35693359375, 11.001953125, 12.64697265625, 14.2919921875, 15.93701171875, 17.58203125, 19.22705078125, 20.8720703125, 22.51708984375, 24.162109375, 25.80712890625, 27.4521484375, 29.09716796875, 30.7421875, 32.38720703125, 34.0322265625, 35.67724609375, 37.322265625, 38.96728515625, 40.6123046875, 42.25732421875, 43.90234375, 45.54736328125, 47.1923828125, 48.83740234375, 50.482421875, 52.12744140625, 53.7724609375, 55.41748046875, 57.0625]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 10.0, 14.0, 13.0, 9.0, 18.0, 16.0, 18.0, 24.0, 24.0, 22.0, 21.0, 26.0, 35.0, 48.0, 40.0, 29.0, 31.0, 44.0, 33.0, 27.0, 48.0, 48.0, 32.0, 33.0, 41.0, 29.0, 36.0, 26.0, 22.0, 18.0, 19.0, 23.0, 17.0, 15.0, 16.0, 10.0, 12.0, 6.0, 5.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.421875, -25.588134765625, -24.75439453125, -23.920654296875, -23.0869140625, -22.253173828125, -21.41943359375, -20.585693359375, -19.751953125, -18.918212890625, -18.08447265625, -17.250732421875, -16.4169921875, -15.583251953125, -14.74951171875, -13.915771484375, -13.08203125, -12.248291015625, -11.41455078125, -10.580810546875, -9.7470703125, -8.913330078125, -8.07958984375, -7.245849609375, -6.412109375, -5.578369140625, -4.74462890625, -3.910888671875, -3.0771484375, -2.243408203125, -1.40966796875, -0.575927734375, 0.2578125, 1.091552734375, 1.92529296875, 2.759033203125, 3.5927734375, 4.426513671875, 5.26025390625, 6.093994140625, 6.927734375, 7.761474609375, 8.59521484375, 9.428955078125, 10.2626953125, 11.096435546875, 11.93017578125, 12.763916015625, 13.59765625, 14.431396484375, 15.26513671875, 16.098876953125, 16.9326171875, 17.766357421875, 18.60009765625, 19.433837890625, 20.267578125, 21.101318359375, 21.93505859375, 22.768798828125, 23.6025390625, 24.436279296875, 25.27001953125, 26.103759765625, 26.9375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 11.0, 15.0, 18.0, 36.0, 53.0, 83.0, 110.0, 187.0, 294.0, 440.0, 638.0, 1099.0, 1673.0, 2685.0, 4127.0, 6414.0, 10538.0, 16654.0, 27840.0, 44657.0, 72249.0, 115211.0, 182281.0, 279534.0, 412011.0, 554941.0, 634405.0, 574812.0, 433036.0, 296568.0, 194404.0, 124004.0, 77427.0, 47157.0, 29709.0, 18295.0, 11438.0, 6991.0, 4440.0, 2814.0, 1806.0, 1102.0, 696.0, 486.0, 285.0, 202.0, 127.0, 99.0, 57.0, 34.0, 40.0, 20.0, 13.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-33.15625, -32.07177734375, -30.9873046875, -29.90283203125, -28.818359375, -27.73388671875, -26.6494140625, -25.56494140625, -24.48046875, -23.39599609375, -22.3115234375, -21.22705078125, -20.142578125, -19.05810546875, -17.9736328125, -16.88916015625, -15.8046875, -14.72021484375, -13.6357421875, -12.55126953125, -11.466796875, -10.38232421875, -9.2978515625, -8.21337890625, -7.12890625, -6.04443359375, -4.9599609375, -3.87548828125, -2.791015625, -1.70654296875, -0.6220703125, 0.46240234375, 1.546875, 2.63134765625, 3.7158203125, 4.80029296875, 5.884765625, 6.96923828125, 8.0537109375, 9.13818359375, 10.22265625, 11.30712890625, 12.3916015625, 13.47607421875, 14.560546875, 15.64501953125, 16.7294921875, 17.81396484375, 18.8984375, 19.98291015625, 21.0673828125, 22.15185546875, 23.236328125, 24.32080078125, 25.4052734375, 26.48974609375, 27.57421875, 28.65869140625, 29.7431640625, 30.82763671875, 31.912109375, 32.99658203125, 34.0810546875, 35.16552734375, 36.25]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 10.0, 5.0, 5.0, 5.0, 11.0, 14.0, 13.0, 14.0, 30.0, 21.0, 31.0, 42.0, 67.0, 75.0, 80.0, 80.0, 86.0, 125.0, 124.0, 167.0, 188.0, 176.0, 212.0, 193.0, 213.0, 223.0, 215.0, 172.0, 188.0, 172.0, 171.0, 151.0, 122.0, 110.0, 110.0, 85.0, 72.0, 55.0, 41.0, 34.0, 42.0, 24.0, 23.0, 15.0, 14.0, 14.0, 8.0, 9.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-13.8828125, -13.4676513671875, -13.052490234375, -12.6373291015625, -12.22216796875, -11.8070068359375, -11.391845703125, -10.9766845703125, -10.5615234375, -10.1463623046875, -9.731201171875, -9.3160400390625, -8.90087890625, -8.4857177734375, -8.070556640625, -7.6553955078125, -7.240234375, -6.8250732421875, -6.409912109375, -5.9947509765625, -5.57958984375, -5.1644287109375, -4.749267578125, -4.3341064453125, -3.9189453125, -3.5037841796875, -3.088623046875, -2.6734619140625, -2.25830078125, -1.8431396484375, -1.427978515625, -1.0128173828125, -0.59765625, -0.1824951171875, 0.232666015625, 0.6478271484375, 1.06298828125, 1.4781494140625, 1.893310546875, 2.3084716796875, 2.7236328125, 3.1387939453125, 3.553955078125, 3.9691162109375, 4.38427734375, 4.7994384765625, 5.214599609375, 5.6297607421875, 6.044921875, 6.4600830078125, 6.875244140625, 7.2904052734375, 7.70556640625, 8.1207275390625, 8.535888671875, 8.9510498046875, 9.3662109375, 9.7813720703125, 10.196533203125, 10.6116943359375, 11.02685546875, 11.4420166015625, 11.857177734375, 12.2723388671875, 12.6875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 10.0, 8.0, 10.0, 17.0, 22.0, 12.0, 20.0, 22.0, 23.0, 27.0, 37.0, 24.0, 49.0, 36.0, 46.0, 49.0, 45.0, 42.0, 52.0, 39.0, 45.0, 56.0, 32.0, 40.0, 41.0, 30.0, 19.0, 23.0, 22.0, 18.0, 25.0, 12.0, 4.0, 16.0, 6.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.14870071411133, -34.011474609375, -32.87424850463867, -31.737022399902344, -30.599796295166016, -29.462570190429688, -28.32534408569336, -27.18811798095703, -26.050891876220703, -24.913665771484375, -23.776439666748047, -22.63921356201172, -21.50198745727539, -20.364761352539062, -19.227535247802734, -18.090309143066406, -16.953083038330078, -15.81585693359375, -14.678630828857422, -13.541404724121094, -12.404178619384766, -11.266952514648438, -10.12972640991211, -8.992500305175781, -7.855274200439453, -6.718048095703125, -5.580821990966797, -4.443595886230469, -3.3063697814941406, -2.1691436767578125, -1.0319175720214844, 0.10530853271484375, 1.2425384521484375, 2.3797645568847656, 3.5169906616210938, 4.654216766357422, 5.79144287109375, 6.928668975830078, 8.065895080566406, 9.203121185302734, 10.340347290039062, 11.47757339477539, 12.614799499511719, 13.752025604248047, 14.889251708984375, 16.026477813720703, 17.16370391845703, 18.30093002319336, 19.438156127929688, 20.575382232666016, 21.712608337402344, 22.849834442138672, 23.987060546875, 25.124286651611328, 26.261512756347656, 27.398738861083984, 28.535964965820312, 29.67319107055664, 30.81041717529297, 31.947643280029297, 33.084869384765625, 34.22209548950195, 35.35932159423828, 36.49654769897461, 37.63377380371094]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 2.0, 7.0, 3.0, 10.0, 11.0, 12.0, 10.0, 6.0, 20.0, 25.0, 19.0, 25.0, 34.0, 21.0, 41.0, 32.0, 36.0, 38.0, 41.0, 41.0, 36.0, 34.0, 41.0, 28.0, 47.0, 43.0, 42.0, 39.0, 31.0, 23.0, 19.0, 25.0, 23.0, 21.0, 11.0, 15.0, 20.0, 21.0, 7.0, 3.0, 5.0, 9.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-34.7421989440918, -33.759281158447266, -32.776363372802734, -31.793445587158203, -30.810527801513672, -29.82761001586914, -28.84469223022461, -27.861774444580078, -26.878856658935547, -25.895938873291016, -24.913021087646484, -23.930103302001953, -22.947185516357422, -21.96426773071289, -20.98134994506836, -19.998432159423828, -19.01551628112793, -18.0325984954834, -17.049680709838867, -16.066762924194336, -15.083845138549805, -14.100927352905273, -13.118010520935059, -12.135092735290527, -11.152174949645996, -10.169257164001465, -9.186339378356934, -8.203422546386719, -7.220504283905029, -6.237586498260498, -5.254669189453125, -4.271751403808594, -3.2888355255126953, -2.305917739868164, -1.323000192642212, -0.34008264541625977, 0.6428351402282715, 1.6257529258728027, 2.608670234680176, 3.591588020324707, 4.574505805969238, 5.5574235916137695, 6.540341377258301, 7.523258686065674, 8.506175994873047, 9.489093780517578, 10.47201156616211, 11.45492935180664, 12.437847137451172, 13.420764923095703, 14.403682708740234, 15.386600494384766, 16.369518280029297, 17.352436065673828, 18.33535385131836, 19.31827163696289, 20.301189422607422, 21.284107208251953, 22.267024993896484, 23.249942779541016, 24.232860565185547, 25.215778350830078, 26.19869613647461, 27.18161392211914, 28.16452980041504]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 14.0, 21.0, 23.0, 32.0, 59.0, 81.0, 143.0, 234.0, 367.0, 557.0, 950.0, 1498.0, 2338.0, 3804.0, 6295.0, 10408.0, 17148.0, 27423.0, 43267.0, 64741.0, 92306.0, 119095.0, 136371.0, 136208.0, 117855.0, 90910.0, 63828.0, 42380.0, 26948.0, 16931.0, 10093.0, 6295.0, 3809.0, 2284.0, 1412.0, 907.0, 561.0, 357.0, 219.0, 139.0, 73.0, 59.0, 38.0, 22.0, 19.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-63.4375, -61.3896484375, -59.341796875, -57.2939453125, -55.24609375, -53.1982421875, -51.150390625, -49.1025390625, -47.0546875, -45.0068359375, -42.958984375, -40.9111328125, -38.86328125, -36.8154296875, -34.767578125, -32.7197265625, -30.671875, -28.6240234375, -26.576171875, -24.5283203125, -22.48046875, -20.4326171875, -18.384765625, -16.3369140625, -14.2890625, -12.2412109375, -10.193359375, -8.1455078125, -6.09765625, -4.0498046875, -2.001953125, 0.0458984375, 2.09375, 4.1416015625, 6.189453125, 8.2373046875, 10.28515625, 12.3330078125, 14.380859375, 16.4287109375, 18.4765625, 20.5244140625, 22.572265625, 24.6201171875, 26.66796875, 28.7158203125, 30.763671875, 32.8115234375, 34.859375, 36.9072265625, 38.955078125, 41.0029296875, 43.05078125, 45.0986328125, 47.146484375, 49.1943359375, 51.2421875, 53.2900390625, 55.337890625, 57.3857421875, 59.43359375, 61.4814453125, 63.529296875, 65.5771484375, 67.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 8.0, 11.0, 13.0, 13.0, 9.0, 13.0, 25.0, 25.0, 17.0, 20.0, 29.0, 24.0, 28.0, 38.0, 38.0, 37.0, 37.0, 38.0, 43.0, 32.0, 32.0, 43.0, 37.0, 40.0, 34.0, 39.0, 35.0, 22.0, 28.0, 18.0, 29.0, 21.0, 17.0, 15.0, 15.0, 8.0, 8.0, 7.0, 10.0, 8.0, 2.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-21.8125, -21.13916015625, -20.4658203125, -19.79248046875, -19.119140625, -18.44580078125, -17.7724609375, -17.09912109375, -16.42578125, -15.75244140625, -15.0791015625, -14.40576171875, -13.732421875, -13.05908203125, -12.3857421875, -11.71240234375, -11.0390625, -10.36572265625, -9.6923828125, -9.01904296875, -8.345703125, -7.67236328125, -6.9990234375, -6.32568359375, -5.65234375, -4.97900390625, -4.3056640625, -3.63232421875, -2.958984375, -2.28564453125, -1.6123046875, -0.93896484375, -0.265625, 0.40771484375, 1.0810546875, 1.75439453125, 2.427734375, 3.10107421875, 3.7744140625, 4.44775390625, 5.12109375, 5.79443359375, 6.4677734375, 7.14111328125, 7.814453125, 8.48779296875, 9.1611328125, 9.83447265625, 10.5078125, 11.18115234375, 11.8544921875, 12.52783203125, 13.201171875, 13.87451171875, 14.5478515625, 15.22119140625, 15.89453125, 16.56787109375, 17.2412109375, 17.91455078125, 18.587890625, 19.26123046875, 19.9345703125, 20.60791015625, 21.28125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 12.0, 16.0, 14.0, 22.0, 35.0, 53.0, 68.0, 102.0, 135.0, 209.0, 335.0, 485.0, 770.0, 1204.0, 1908.0, 3059.0, 5209.0, 8505.0, 14525.0, 24673.0, 43364.0, 73875.0, 123686.0, 185867.0, 201833.0, 144874.0, 88896.0, 51515.0, 29689.0, 17296.0, 10216.0, 6028.0, 3740.0, 2330.0, 1391.0, 924.0, 537.0, 368.0, 232.0, 177.0, 110.0, 85.0, 61.0, 46.0, 22.0, 20.0, 5.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-87.8125, -85.1650390625, -82.517578125, -79.8701171875, -77.22265625, -74.5751953125, -71.927734375, -69.2802734375, -66.6328125, -63.9853515625, -61.337890625, -58.6904296875, -56.04296875, -53.3955078125, -50.748046875, -48.1005859375, -45.453125, -42.8056640625, -40.158203125, -37.5107421875, -34.86328125, -32.2158203125, -29.568359375, -26.9208984375, -24.2734375, -21.6259765625, -18.978515625, -16.3310546875, -13.68359375, -11.0361328125, -8.388671875, -5.7412109375, -3.09375, -0.4462890625, 2.201171875, 4.8486328125, 7.49609375, 10.1435546875, 12.791015625, 15.4384765625, 18.0859375, 20.7333984375, 23.380859375, 26.0283203125, 28.67578125, 31.3232421875, 33.970703125, 36.6181640625, 39.265625, 41.9130859375, 44.560546875, 47.2080078125, 49.85546875, 52.5029296875, 55.150390625, 57.7978515625, 60.4453125, 63.0927734375, 65.740234375, 68.3876953125, 71.03515625, 73.6826171875, 76.330078125, 78.9775390625, 81.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 14.0, 8.0, 17.0, 21.0, 12.0, 27.0, 19.0, 26.0, 33.0, 29.0, 30.0, 32.0, 37.0, 35.0, 39.0, 47.0, 27.0, 45.0, 38.0, 36.0, 43.0, 37.0, 39.0, 26.0, 45.0, 28.0, 19.0, 26.0, 23.0, 25.0, 16.0, 11.0, 14.0, 8.0, 4.0, 8.0, 6.0, 1.0, 9.0, 1.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-17.1875, -16.66455078125, -16.1416015625, -15.61865234375, -15.095703125, -14.57275390625, -14.0498046875, -13.52685546875, -13.00390625, -12.48095703125, -11.9580078125, -11.43505859375, -10.912109375, -10.38916015625, -9.8662109375, -9.34326171875, -8.8203125, -8.29736328125, -7.7744140625, -7.25146484375, -6.728515625, -6.20556640625, -5.6826171875, -5.15966796875, -4.63671875, -4.11376953125, -3.5908203125, -3.06787109375, -2.544921875, -2.02197265625, -1.4990234375, -0.97607421875, -0.453125, 0.06982421875, 0.5927734375, 1.11572265625, 1.638671875, 2.16162109375, 2.6845703125, 3.20751953125, 3.73046875, 4.25341796875, 4.7763671875, 5.29931640625, 5.822265625, 6.34521484375, 6.8681640625, 7.39111328125, 7.9140625, 8.43701171875, 8.9599609375, 9.48291015625, 10.005859375, 10.52880859375, 11.0517578125, 11.57470703125, 12.09765625, 12.62060546875, 13.1435546875, 13.66650390625, 14.189453125, 14.71240234375, 15.2353515625, 15.75830078125, 16.28125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [6.0, 1.0, 1.0, 5.0, 11.0, 10.0, 21.0, 24.0, 25.0, 40.0, 61.0, 112.0, 125.0, 168.0, 261.0, 381.0, 598.0, 927.0, 1362.0, 2084.0, 3203.0, 4990.0, 8069.0, 13036.0, 22977.0, 40316.0, 75764.0, 150583.0, 272433.0, 212684.0, 106720.0, 55556.0, 30286.0, 17504.0, 10365.0, 6394.0, 3956.0, 2584.0, 1603.0, 1085.0, 711.0, 491.0, 328.0, 214.0, 150.0, 106.0, 87.0, 50.0, 28.0, 23.0, 18.0, 10.0, 4.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-44.71875, -43.16357421875, -41.6083984375, -40.05322265625, -38.498046875, -36.94287109375, -35.3876953125, -33.83251953125, -32.27734375, -30.72216796875, -29.1669921875, -27.61181640625, -26.056640625, -24.50146484375, -22.9462890625, -21.39111328125, -19.8359375, -18.28076171875, -16.7255859375, -15.17041015625, -13.615234375, -12.06005859375, -10.5048828125, -8.94970703125, -7.39453125, -5.83935546875, -4.2841796875, -2.72900390625, -1.173828125, 0.38134765625, 1.9365234375, 3.49169921875, 5.046875, 6.60205078125, 8.1572265625, 9.71240234375, 11.267578125, 12.82275390625, 14.3779296875, 15.93310546875, 17.48828125, 19.04345703125, 20.5986328125, 22.15380859375, 23.708984375, 25.26416015625, 26.8193359375, 28.37451171875, 29.9296875, 31.48486328125, 33.0400390625, 34.59521484375, 36.150390625, 37.70556640625, 39.2607421875, 40.81591796875, 42.37109375, 43.92626953125, 45.4814453125, 47.03662109375, 48.591796875, 50.14697265625, 51.7021484375, 53.25732421875, 54.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 12.0, 14.0, 17.0, 21.0, 22.0, 25.0, 45.0, 49.0, 65.0, 61.0, 83.0, 84.0, 68.0, 77.0, 74.0, 47.0, 44.0, 29.0, 29.0, 19.0, 22.0, 11.0, 10.0, 9.0, 13.0, 9.0, 6.0, 6.0, 2.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00629425048828125, -0.006113946437835693, -0.005933642387390137, -0.00575333833694458, -0.0055730342864990234, -0.005392730236053467, -0.00521242618560791, -0.0050321221351623535, -0.004851818084716797, -0.00467151403427124, -0.004491209983825684, -0.004310905933380127, -0.00413060188293457, -0.003950297832489014, -0.003769993782043457, -0.0035896897315979004, -0.0034093856811523438, -0.003229081630706787, -0.0030487775802612305, -0.002868473529815674, -0.002688169479370117, -0.0025078654289245605, -0.002327561378479004, -0.0021472573280334473, -0.0019669532775878906, -0.001786649227142334, -0.0016063451766967773, -0.0014260411262512207, -0.001245737075805664, -0.0010654330253601074, -0.0008851289749145508, -0.0007048249244689941, -0.0005245208740234375, -0.00034421682357788086, -0.00016391277313232422, 1.6391277313232422e-05, 0.00019669532775878906, 0.0003769993782043457, 0.0005573034286499023, 0.000737607479095459, 0.0009179115295410156, 0.0010982155799865723, 0.001278519630432129, 0.0014588236808776855, 0.0016391277313232422, 0.0018194317817687988, 0.0019997358322143555, 0.002180039882659912, 0.0023603439331054688, 0.0025406479835510254, 0.002720952033996582, 0.0029012560844421387, 0.0030815601348876953, 0.003261864185333252, 0.0034421682357788086, 0.0036224722862243652, 0.003802776336669922, 0.0039830803871154785, 0.004163384437561035, 0.004343688488006592, 0.0045239925384521484, 0.004704296588897705, 0.004884600639343262, 0.005064904689788818, 0.005245208740234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [6.0, 0.0, 5.0, 3.0, 7.0, 9.0, 12.0, 17.0, 17.0, 30.0, 36.0, 58.0, 94.0, 97.0, 146.0, 242.0, 361.0, 437.0, 687.0, 933.0, 1386.0, 1950.0, 2952.0, 4184.0, 6316.0, 9500.0, 14604.0, 22662.0, 37091.0, 60431.0, 97744.0, 152891.0, 193256.0, 160675.0, 105038.0, 64728.0, 39074.0, 24263.0, 15574.0, 10086.0, 6727.0, 4479.0, 3023.0, 2085.0, 1434.0, 965.0, 613.0, 479.0, 362.0, 236.0, 160.0, 107.0, 80.0, 60.0, 53.0, 31.0, 23.0, 21.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0], "bins": [-29.171875, -28.276123046875, -27.38037109375, -26.484619140625, -25.5888671875, -24.693115234375, -23.79736328125, -22.901611328125, -22.005859375, -21.110107421875, -20.21435546875, -19.318603515625, -18.4228515625, -17.527099609375, -16.63134765625, -15.735595703125, -14.83984375, -13.944091796875, -13.04833984375, -12.152587890625, -11.2568359375, -10.361083984375, -9.46533203125, -8.569580078125, -7.673828125, -6.778076171875, -5.88232421875, -4.986572265625, -4.0908203125, -3.195068359375, -2.29931640625, -1.403564453125, -0.5078125, 0.387939453125, 1.28369140625, 2.179443359375, 3.0751953125, 3.970947265625, 4.86669921875, 5.762451171875, 6.658203125, 7.553955078125, 8.44970703125, 9.345458984375, 10.2412109375, 11.136962890625, 12.03271484375, 12.928466796875, 13.82421875, 14.719970703125, 15.61572265625, 16.511474609375, 17.4072265625, 18.302978515625, 19.19873046875, 20.094482421875, 20.990234375, 21.885986328125, 22.78173828125, 23.677490234375, 24.5732421875, 25.468994140625, 26.36474609375, 27.260498046875, 28.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 6.0, 14.0, 10.0, 11.0, 16.0, 24.0, 18.0, 26.0, 26.0, 30.0, 33.0, 33.0, 49.0, 38.0, 49.0, 60.0, 49.0, 54.0, 57.0, 47.0, 33.0, 36.0, 33.0, 21.0, 34.0, 25.0, 20.0, 20.0, 12.0, 17.0, 10.0, 9.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.609375, -8.3157958984375, -8.022216796875, -7.7286376953125, -7.43505859375, -7.1414794921875, -6.847900390625, -6.5543212890625, -6.2607421875, -5.9671630859375, -5.673583984375, -5.3800048828125, -5.08642578125, -4.7928466796875, -4.499267578125, -4.2056884765625, -3.912109375, -3.6185302734375, -3.324951171875, -3.0313720703125, -2.73779296875, -2.4442138671875, -2.150634765625, -1.8570556640625, -1.5634765625, -1.2698974609375, -0.976318359375, -0.6827392578125, -0.38916015625, -0.0955810546875, 0.197998046875, 0.4915771484375, 0.78515625, 1.0787353515625, 1.372314453125, 1.6658935546875, 1.95947265625, 2.2530517578125, 2.546630859375, 2.8402099609375, 3.1337890625, 3.4273681640625, 3.720947265625, 4.0145263671875, 4.30810546875, 4.6016845703125, 4.895263671875, 5.1888427734375, 5.482421875, 5.7760009765625, 6.069580078125, 6.3631591796875, 6.65673828125, 6.9503173828125, 7.243896484375, 7.5374755859375, 7.8310546875, 8.1246337890625, 8.418212890625, 8.7117919921875, 9.00537109375, 9.2989501953125, 9.592529296875, 9.8861083984375, 10.1796875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 4.0, 9.0, 11.0, 14.0, 14.0, 18.0, 18.0, 18.0, 29.0, 30.0, 29.0, 38.0, 39.0, 65.0, 43.0, 40.0, 40.0, 55.0, 52.0, 43.0, 46.0, 38.0, 41.0, 48.0, 27.0, 27.0, 36.0, 18.0, 12.0, 12.0, 15.0, 18.0, 11.0, 7.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.590118408203125, -25.74036407470703, -24.890609741210938, -24.040857315063477, -23.191102981567383, -22.34134864807129, -21.491596221923828, -20.641841888427734, -19.79208755493164, -18.942333221435547, -18.092578887939453, -17.242826461791992, -16.3930721282959, -15.543317794799805, -14.693564414978027, -13.84381103515625, -12.994056701660156, -12.144302368164062, -11.294548988342285, -10.444795608520508, -9.595041275024414, -8.74528694152832, -7.895533561706543, -7.045779705047607, -6.196025848388672, -5.346271991729736, -4.496518135070801, -3.6467642784118652, -2.7970104217529297, -1.9472565650939941, -1.0975027084350586, -0.24774885177612305, 0.6020069122314453, 1.4517607688903809, 2.3015146255493164, 3.151268482208252, 4.0010223388671875, 4.850776195526123, 5.700530052185059, 6.550283908843994, 7.40003776550293, 8.249792098999023, 9.0995454788208, 9.949298858642578, 10.799053192138672, 11.648807525634766, 12.498560905456543, 13.34831428527832, 14.198068618774414, 15.047822952270508, 15.897576332092285, 16.747329711914062, 17.597084045410156, 18.44683837890625, 19.296592712402344, 20.146345138549805, 20.9960994720459, 21.845853805541992, 22.695606231689453, 23.545360565185547, 24.39511489868164, 25.244869232177734, 26.094623565673828, 26.94437599182129, 27.794130325317383]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 5.0, 9.0, 7.0, 12.0, 27.0, 17.0, 15.0, 19.0, 25.0, 23.0, 39.0, 35.0, 30.0, 40.0, 25.0, 38.0, 46.0, 39.0, 38.0, 41.0, 40.0, 53.0, 41.0, 34.0, 32.0, 21.0, 27.0, 25.0, 24.0, 20.0, 20.0, 16.0, 17.0, 9.0, 14.0, 12.0, 4.0, 13.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.874345779418945, -22.16553497314453, -21.45672607421875, -20.747915267944336, -20.039104461669922, -19.330293655395508, -18.621482849121094, -17.912673950195312, -17.2038631439209, -16.495052337646484, -15.786242485046387, -15.077432632446289, -14.368621826171875, -13.659811019897461, -12.951001167297363, -12.242191314697266, -11.533380508422852, -10.824569702148438, -10.11575984954834, -9.406949996948242, -8.698139190673828, -7.989328861236572, -7.280518531799316, -6.5717082023620605, -5.862897872924805, -5.154087543487549, -4.445277214050293, -3.736466884613037, -3.0276565551757812, -2.3188462257385254, -1.6100358963012695, -0.9012255668640137, -0.19241714477539062, 0.5163931846618652, 1.225203514099121, 1.934013843536377, 2.642824172973633, 3.3516345024108887, 4.0604448318481445, 4.7692551612854, 5.478065490722656, 6.186875820159912, 6.895686149597168, 7.604496479034424, 8.31330680847168, 9.022117614746094, 9.730927467346191, 10.439737319946289, 11.148548126220703, 11.857358932495117, 12.566168785095215, 13.274978637695312, 13.983789443969727, 14.69260025024414, 15.401410102844238, 16.110219955444336, 16.81903076171875, 17.527841567993164, 18.236652374267578, 18.94546127319336, 19.654272079467773, 20.363082885742188, 21.07189178466797, 21.780702590942383, 22.489513397216797]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 20.0, 40.0, 59.0, 81.0, 127.0, 204.0, 334.0, 521.0, 774.0, 1313.0, 2046.0, 3265.0, 5196.0, 7942.0, 12459.0, 19258.0, 29706.0, 44334.0, 63675.0, 86913.0, 111440.0, 127943.0, 129319.0, 112850.0, 89917.0, 66041.0, 46022.0, 30572.0, 20257.0, 13050.0, 8375.0, 5225.0, 3394.0, 2198.0, 1306.0, 852.0, 562.0, 369.0, 223.0, 138.0, 94.0, 47.0, 33.0, 13.0, 15.0, 6.0, 12.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.588134765625, -19.87939453125, -19.170654296875, -18.4619140625, -17.753173828125, -17.04443359375, -16.335693359375, -15.626953125, -14.918212890625, -14.20947265625, -13.500732421875, -12.7919921875, -12.083251953125, -11.37451171875, -10.665771484375, -9.95703125, -9.248291015625, -8.53955078125, -7.830810546875, -7.1220703125, -6.413330078125, -5.70458984375, -4.995849609375, -4.287109375, -3.578369140625, -2.86962890625, -2.160888671875, -1.4521484375, -0.743408203125, -0.03466796875, 0.674072265625, 1.3828125, 2.091552734375, 2.80029296875, 3.509033203125, 4.2177734375, 4.926513671875, 5.63525390625, 6.343994140625, 7.052734375, 7.761474609375, 8.47021484375, 9.178955078125, 9.8876953125, 10.596435546875, 11.30517578125, 12.013916015625, 12.72265625, 13.431396484375, 14.14013671875, 14.848876953125, 15.5576171875, 16.266357421875, 16.97509765625, 17.683837890625, 18.392578125, 19.101318359375, 19.81005859375, 20.518798828125, 21.2275390625, 21.936279296875, 22.64501953125, 23.353759765625, 24.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 6.0, 11.0, 7.0, 5.0, 10.0, 8.0, 9.0, 15.0, 18.0, 18.0, 21.0, 23.0, 26.0, 28.0, 26.0, 42.0, 35.0, 43.0, 32.0, 42.0, 39.0, 53.0, 34.0, 41.0, 35.0, 36.0, 37.0, 29.0, 34.0, 38.0, 26.0, 17.0, 23.0, 23.0, 8.0, 14.0, 15.0, 11.0, 11.0, 7.0, 10.0, 7.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-21.4375, -20.774658203125, -20.11181640625, -19.448974609375, -18.7861328125, -18.123291015625, -17.46044921875, -16.797607421875, -16.134765625, -15.471923828125, -14.80908203125, -14.146240234375, -13.4833984375, -12.820556640625, -12.15771484375, -11.494873046875, -10.83203125, -10.169189453125, -9.50634765625, -8.843505859375, -8.1806640625, -7.517822265625, -6.85498046875, -6.192138671875, -5.529296875, -4.866455078125, -4.20361328125, -3.540771484375, -2.8779296875, -2.215087890625, -1.55224609375, -0.889404296875, -0.2265625, 0.436279296875, 1.09912109375, 1.761962890625, 2.4248046875, 3.087646484375, 3.75048828125, 4.413330078125, 5.076171875, 5.739013671875, 6.40185546875, 7.064697265625, 7.7275390625, 8.390380859375, 9.05322265625, 9.716064453125, 10.37890625, 11.041748046875, 11.70458984375, 12.367431640625, 13.0302734375, 13.693115234375, 14.35595703125, 15.018798828125, 15.681640625, 16.344482421875, 17.00732421875, 17.670166015625, 18.3330078125, 18.995849609375, 19.65869140625, 20.321533203125, 20.984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 21.0, 43.0, 48.0, 83.0, 126.0, 154.0, 295.0, 424.0, 777.0, 1230.0, 2023.0, 3193.0, 5300.0, 8592.0, 14011.0, 22927.0, 37107.0, 58574.0, 87670.0, 122809.0, 151272.0, 151534.0, 126653.0, 91761.0, 60990.0, 38877.0, 23782.0, 14914.0, 9060.0, 5516.0, 3265.0, 2073.0, 1296.0, 803.0, 472.0, 339.0, 195.0, 130.0, 76.0, 47.0, 23.0, 24.0, 8.0, 14.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.3125, -26.432861328125, -25.55322265625, -24.673583984375, -23.7939453125, -22.914306640625, -22.03466796875, -21.155029296875, -20.275390625, -19.395751953125, -18.51611328125, -17.636474609375, -16.7568359375, -15.877197265625, -14.99755859375, -14.117919921875, -13.23828125, -12.358642578125, -11.47900390625, -10.599365234375, -9.7197265625, -8.840087890625, -7.96044921875, -7.080810546875, -6.201171875, -5.321533203125, -4.44189453125, -3.562255859375, -2.6826171875, -1.802978515625, -0.92333984375, -0.043701171875, 0.8359375, 1.715576171875, 2.59521484375, 3.474853515625, 4.3544921875, 5.234130859375, 6.11376953125, 6.993408203125, 7.873046875, 8.752685546875, 9.63232421875, 10.511962890625, 11.3916015625, 12.271240234375, 13.15087890625, 14.030517578125, 14.91015625, 15.789794921875, 16.66943359375, 17.549072265625, 18.4287109375, 19.308349609375, 20.18798828125, 21.067626953125, 21.947265625, 22.826904296875, 23.70654296875, 24.586181640625, 25.4658203125, 26.345458984375, 27.22509765625, 28.104736328125, 28.984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 1.0, 6.0, 9.0, 5.0, 7.0, 8.0, 17.0, 20.0, 24.0, 28.0, 20.0, 27.0, 34.0, 11.0, 27.0, 38.0, 31.0, 36.0, 35.0, 35.0, 52.0, 40.0, 41.0, 37.0, 34.0, 33.0, 33.0, 32.0, 40.0, 32.0, 21.0, 22.0, 19.0, 22.0, 23.0, 11.0, 16.0, 11.0, 15.0, 10.0, 5.0, 8.0, 8.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 5.0, 1.0], "bins": [-16.171875, -15.698486328125, -15.22509765625, -14.751708984375, -14.2783203125, -13.804931640625, -13.33154296875, -12.858154296875, -12.384765625, -11.911376953125, -11.43798828125, -10.964599609375, -10.4912109375, -10.017822265625, -9.54443359375, -9.071044921875, -8.59765625, -8.124267578125, -7.65087890625, -7.177490234375, -6.7041015625, -6.230712890625, -5.75732421875, -5.283935546875, -4.810546875, -4.337158203125, -3.86376953125, -3.390380859375, -2.9169921875, -2.443603515625, -1.97021484375, -1.496826171875, -1.0234375, -0.550048828125, -0.07666015625, 0.396728515625, 0.8701171875, 1.343505859375, 1.81689453125, 2.290283203125, 2.763671875, 3.237060546875, 3.71044921875, 4.183837890625, 4.6572265625, 5.130615234375, 5.60400390625, 6.077392578125, 6.55078125, 7.024169921875, 7.49755859375, 7.970947265625, 8.4443359375, 8.917724609375, 9.39111328125, 9.864501953125, 10.337890625, 10.811279296875, 11.28466796875, 11.758056640625, 12.2314453125, 12.704833984375, 13.17822265625, 13.651611328125, 14.125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 12.0, 24.0, 35.0, 52.0, 67.0, 88.0, 122.0, 216.0, 296.0, 468.0, 736.0, 1181.0, 2031.0, 3690.0, 7434.0, 15823.0, 37305.0, 93890.0, 226332.0, 328168.0, 193503.0, 77735.0, 31130.0, 13556.0, 6455.0, 3311.0, 1820.0, 1038.0, 640.0, 439.0, 304.0, 197.0, 140.0, 98.0, 68.0, 53.0, 26.0, 23.0, 10.0, 8.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.47119140625, -31.2861328125, -30.10107421875, -28.916015625, -27.73095703125, -26.5458984375, -25.36083984375, -24.17578125, -22.99072265625, -21.8056640625, -20.62060546875, -19.435546875, -18.25048828125, -17.0654296875, -15.88037109375, -14.6953125, -13.51025390625, -12.3251953125, -11.14013671875, -9.955078125, -8.77001953125, -7.5849609375, -6.39990234375, -5.21484375, -4.02978515625, -2.8447265625, -1.65966796875, -0.474609375, 0.71044921875, 1.8955078125, 3.08056640625, 4.265625, 5.45068359375, 6.6357421875, 7.82080078125, 9.005859375, 10.19091796875, 11.3759765625, 12.56103515625, 13.74609375, 14.93115234375, 16.1162109375, 17.30126953125, 18.486328125, 19.67138671875, 20.8564453125, 22.04150390625, 23.2265625, 24.41162109375, 25.5966796875, 26.78173828125, 27.966796875, 29.15185546875, 30.3369140625, 31.52197265625, 32.70703125, 33.89208984375, 35.0771484375, 36.26220703125, 37.447265625, 38.63232421875, 39.8173828125, 41.00244140625, 42.1875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 7.0, 9.0, 13.0, 6.0, 17.0, 23.0, 34.0, 41.0, 66.0, 66.0, 66.0, 65.0, 88.0, 85.0, 72.0, 80.0, 54.0, 51.0, 36.0, 24.0, 22.0, 13.0, 17.0, 14.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00267791748046875, -0.0025843679904937744, -0.002490818500518799, -0.0023972690105438232, -0.0023037195205688477, -0.002210170030593872, -0.0021166205406188965, -0.002023071050643921, -0.0019295215606689453, -0.0018359720706939697, -0.0017424225807189941, -0.0016488730907440186, -0.001555323600769043, -0.0014617741107940674, -0.0013682246208190918, -0.0012746751308441162, -0.0011811256408691406, -0.001087576150894165, -0.0009940266609191895, -0.0009004771709442139, -0.0008069276809692383, -0.0007133781909942627, -0.0006198287010192871, -0.0005262792110443115, -0.00043272972106933594, -0.00033918023109436035, -0.00024563074111938477, -0.00015208125114440918, -5.8531761169433594e-05, 3.501772880554199e-05, 0.00012856721878051758, 0.00022211670875549316, 0.00031566619873046875, 0.00040921568870544434, 0.0005027651786804199, 0.0005963146686553955, 0.0006898641586303711, 0.0007834136486053467, 0.0008769631385803223, 0.0009705126285552979, 0.0010640621185302734, 0.001157611608505249, 0.0012511610984802246, 0.0013447105884552002, 0.0014382600784301758, 0.0015318095684051514, 0.001625359058380127, 0.0017189085483551025, 0.0018124580383300781, 0.0019060075283050537, 0.0019995570182800293, 0.002093106508255005, 0.0021866559982299805, 0.002280205488204956, 0.0023737549781799316, 0.0024673044681549072, 0.002560853958129883, 0.0026544034481048584, 0.002747952938079834, 0.0028415024280548096, 0.002935051918029785, 0.0030286014080047607, 0.0031221508979797363, 0.003215700387954712, 0.0033092498779296875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 10.0, 15.0, 13.0, 32.0, 32.0, 42.0, 72.0, 108.0, 123.0, 165.0, 265.0, 378.0, 569.0, 855.0, 1403.0, 2232.0, 3779.0, 6572.0, 12301.0, 23380.0, 46768.0, 92495.0, 167042.0, 230618.0, 201879.0, 124093.0, 64306.0, 31377.0, 16330.0, 8788.0, 4843.0, 2773.0, 1625.0, 1033.0, 682.0, 460.0, 335.0, 226.0, 127.0, 113.0, 89.0, 54.0, 49.0, 42.0, 20.0, 13.0, 4.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-23.96875, -23.236328125, -22.50390625, -21.771484375, -21.0390625, -20.306640625, -19.57421875, -18.841796875, -18.109375, -17.376953125, -16.64453125, -15.912109375, -15.1796875, -14.447265625, -13.71484375, -12.982421875, -12.25, -11.517578125, -10.78515625, -10.052734375, -9.3203125, -8.587890625, -7.85546875, -7.123046875, -6.390625, -5.658203125, -4.92578125, -4.193359375, -3.4609375, -2.728515625, -1.99609375, -1.263671875, -0.53125, 0.201171875, 0.93359375, 1.666015625, 2.3984375, 3.130859375, 3.86328125, 4.595703125, 5.328125, 6.060546875, 6.79296875, 7.525390625, 8.2578125, 8.990234375, 9.72265625, 10.455078125, 11.1875, 11.919921875, 12.65234375, 13.384765625, 14.1171875, 14.849609375, 15.58203125, 16.314453125, 17.046875, 17.779296875, 18.51171875, 19.244140625, 19.9765625, 20.708984375, 21.44140625, 22.173828125, 22.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 3.0, 7.0, 9.0, 22.0, 18.0, 29.0, 27.0, 30.0, 43.0, 54.0, 53.0, 59.0, 58.0, 67.0, 70.0, 66.0, 69.0, 58.0, 48.0, 31.0, 35.0, 29.0, 17.0, 20.0, 10.0, 12.0, 10.0, 7.0, 5.0, 7.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.08990478515625, -7.8360595703125, -7.58221435546875, -7.328369140625, -7.07452392578125, -6.8206787109375, -6.56683349609375, -6.31298828125, -6.05914306640625, -5.8052978515625, -5.55145263671875, -5.297607421875, -5.04376220703125, -4.7899169921875, -4.53607177734375, -4.2822265625, -4.02838134765625, -3.7745361328125, -3.52069091796875, -3.266845703125, -3.01300048828125, -2.7591552734375, -2.50531005859375, -2.25146484375, -1.99761962890625, -1.7437744140625, -1.48992919921875, -1.236083984375, -0.98223876953125, -0.7283935546875, -0.47454833984375, -0.220703125, 0.03314208984375, 0.2869873046875, 0.54083251953125, 0.794677734375, 1.04852294921875, 1.3023681640625, 1.55621337890625, 1.81005859375, 2.06390380859375, 2.3177490234375, 2.57159423828125, 2.825439453125, 3.07928466796875, 3.3331298828125, 3.58697509765625, 3.8408203125, 4.09466552734375, 4.3485107421875, 4.60235595703125, 4.856201171875, 5.11004638671875, 5.3638916015625, 5.61773681640625, 5.87158203125, 6.12542724609375, 6.3792724609375, 6.63311767578125, 6.886962890625, 7.14080810546875, 7.3946533203125, 7.64849853515625, 7.90234375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 2.0, 9.0, 16.0, 15.0, 16.0, 17.0, 15.0, 21.0, 19.0, 23.0, 38.0, 34.0, 37.0, 48.0, 59.0, 58.0, 51.0, 55.0, 58.0, 56.0, 53.0, 34.0, 37.0, 33.0, 29.0, 24.0, 21.0, 26.0, 21.0, 12.0, 7.0, 14.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.149505615234375, -26.284074783325195, -25.418643951416016, -24.553211212158203, -23.687780380249023, -22.822349548339844, -21.95691680908203, -21.09148597717285, -20.226055145263672, -19.360624313354492, -18.495193481445312, -17.6297607421875, -16.76432991027832, -15.89889907836914, -15.033467292785645, -14.168035507202148, -13.302604675292969, -12.437173843383789, -11.571742057800293, -10.706310272216797, -9.840879440307617, -8.975448608398438, -8.110016822814941, -7.2445855140686035, -6.379154205322266, -5.513722896575928, -4.64829158782959, -3.782860279083252, -2.917428970336914, -2.051997661590576, -1.1865663528442383, -0.3211350440979004, 0.5442943572998047, 1.4097256660461426, 2.2751569747924805, 3.1405882835388184, 4.006019592285156, 4.871450901031494, 5.736882209777832, 6.60231351852417, 7.467744827270508, 8.333175659179688, 9.198607444763184, 10.06403923034668, 10.92947006225586, 11.794900894165039, 12.660332679748535, 13.525764465332031, 14.391195297241211, 15.25662612915039, 16.122058868408203, 16.987489700317383, 17.852920532226562, 18.718351364135742, 19.583782196044922, 20.449214935302734, 21.314645767211914, 22.180076599121094, 23.045509338378906, 23.910940170288086, 24.776371002197266, 25.641801834106445, 26.507232666015625, 27.372665405273438, 28.238096237182617]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 7.0, 10.0, 6.0, 19.0, 19.0, 15.0, 7.0, 21.0, 25.0, 31.0, 31.0, 38.0, 26.0, 40.0, 39.0, 30.0, 50.0, 43.0, 42.0, 42.0, 33.0, 49.0, 38.0, 42.0, 27.0, 34.0, 20.0, 21.0, 32.0, 11.0, 18.0, 13.0, 26.0, 12.0, 10.0, 9.0, 8.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-25.594215393066406, -24.87730598449707, -24.160396575927734, -23.443485260009766, -22.72657585144043, -22.009666442871094, -21.292757034301758, -20.575847625732422, -19.858936309814453, -19.142026901245117, -18.42511749267578, -17.708206176757812, -16.991296768188477, -16.27438735961914, -15.557477951049805, -14.840567588806152, -14.123658180236816, -13.40674877166748, -12.689838409423828, -11.972929000854492, -11.25601863861084, -10.539109230041504, -9.822198867797852, -9.105289459228516, -8.38838005065918, -7.6714701652526855, -6.954560279846191, -6.2376508712768555, -5.520740509033203, -4.803831100463867, -4.086921215057373, -3.370011329650879, -2.6531009674072266, -1.9361910820007324, -1.2192813158035278, -0.5023715496063232, 0.2145383358001709, 0.931448221206665, 1.64835786819458, 2.365267753601074, 3.0821776390075684, 3.7990875244140625, 4.515997409820557, 5.232907295227051, 5.949816703796387, 6.666727066040039, 7.383636474609375, 8.100545883178711, 8.817456245422363, 9.5343656539917, 10.251276016235352, 10.968185424804688, 11.68509578704834, 12.402005195617676, 13.118915557861328, 13.835824966430664, 14.552734375, 15.269643783569336, 15.986554145812988, 16.70346450805664, 17.420373916625977, 18.137283325195312, 18.85419273376465, 19.571102142333984, 20.288013458251953]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 16.0, 19.0, 29.0, 40.0, 40.0, 73.0, 135.0, 203.0, 392.0, 638.0, 1095.0, 1944.0, 3739.0, 7189.0, 14545.0, 29801.0, 64075.0, 140770.0, 328985.0, 757380.0, 1198534.0, 902649.0, 411310.0, 176298.0, 79609.0, 37178.0, 18053.0, 8925.0, 4641.0, 2539.0, 1422.0, 746.0, 473.0, 294.0, 164.0, 109.0, 68.0, 49.0, 34.0, 22.0, 18.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.0625, -29.0126953125, -27.962890625, -26.9130859375, -25.86328125, -24.8134765625, -23.763671875, -22.7138671875, -21.6640625, -20.6142578125, -19.564453125, -18.5146484375, -17.46484375, -16.4150390625, -15.365234375, -14.3154296875, -13.265625, -12.2158203125, -11.166015625, -10.1162109375, -9.06640625, -8.0166015625, -6.966796875, -5.9169921875, -4.8671875, -3.8173828125, -2.767578125, -1.7177734375, -0.66796875, 0.3818359375, 1.431640625, 2.4814453125, 3.53125, 4.5810546875, 5.630859375, 6.6806640625, 7.73046875, 8.7802734375, 9.830078125, 10.8798828125, 11.9296875, 12.9794921875, 14.029296875, 15.0791015625, 16.12890625, 17.1787109375, 18.228515625, 19.2783203125, 20.328125, 21.3779296875, 22.427734375, 23.4775390625, 24.52734375, 25.5771484375, 26.626953125, 27.6767578125, 28.7265625, 29.7763671875, 30.826171875, 31.8759765625, 32.92578125, 33.9755859375, 35.025390625, 36.0751953125, 37.125]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 6.0, 7.0, 6.0, 3.0, 15.0, 12.0, 14.0, 18.0, 16.0, 16.0, 20.0, 30.0, 34.0, 26.0, 31.0, 37.0, 37.0, 40.0, 39.0, 48.0, 37.0, 48.0, 34.0, 42.0, 28.0, 32.0, 46.0, 45.0, 32.0, 40.0, 24.0, 16.0, 21.0, 19.0, 14.0, 16.0, 7.0, 11.0, 10.0, 7.0, 8.0, 6.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0], "bins": [-20.140625, -19.5838623046875, -19.027099609375, -18.4703369140625, -17.91357421875, -17.3568115234375, -16.800048828125, -16.2432861328125, -15.6865234375, -15.1297607421875, -14.572998046875, -14.0162353515625, -13.45947265625, -12.9027099609375, -12.345947265625, -11.7891845703125, -11.232421875, -10.6756591796875, -10.118896484375, -9.5621337890625, -9.00537109375, -8.4486083984375, -7.891845703125, -7.3350830078125, -6.7783203125, -6.2215576171875, -5.664794921875, -5.1080322265625, -4.55126953125, -3.9945068359375, -3.437744140625, -2.8809814453125, -2.32421875, -1.7674560546875, -1.210693359375, -0.6539306640625, -0.09716796875, 0.4595947265625, 1.016357421875, 1.5731201171875, 2.1298828125, 2.6866455078125, 3.243408203125, 3.8001708984375, 4.35693359375, 4.9136962890625, 5.470458984375, 6.0272216796875, 6.583984375, 7.1407470703125, 7.697509765625, 8.2542724609375, 8.81103515625, 9.3677978515625, 9.924560546875, 10.4813232421875, 11.0380859375, 11.5948486328125, 12.151611328125, 12.7083740234375, 13.26513671875, 13.8218994140625, 14.378662109375, 14.9354248046875, 15.4921875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 8.0, 8.0, 8.0, 13.0, 22.0, 37.0, 47.0, 94.0, 125.0, 200.0, 389.0, 600.0, 1098.0, 2135.0, 3979.0, 7384.0, 14308.0, 28427.0, 56037.0, 110949.0, 219489.0, 422902.0, 746622.0, 972283.0, 742610.0, 420364.0, 218103.0, 110824.0, 56435.0, 28199.0, 14584.0, 7456.0, 3878.0, 2027.0, 1090.0, 603.0, 341.0, 193.0, 151.0, 82.0, 49.0, 45.0, 25.0, 14.0, 9.0, 13.0, 4.0, 4.0, 3.0, 4.0, 1.0, 6.0, 0.0, 1.0], "bins": [-29.546875, -28.664794921875, -27.78271484375, -26.900634765625, -26.0185546875, -25.136474609375, -24.25439453125, -23.372314453125, -22.490234375, -21.608154296875, -20.72607421875, -19.843994140625, -18.9619140625, -18.079833984375, -17.19775390625, -16.315673828125, -15.43359375, -14.551513671875, -13.66943359375, -12.787353515625, -11.9052734375, -11.023193359375, -10.14111328125, -9.259033203125, -8.376953125, -7.494873046875, -6.61279296875, -5.730712890625, -4.8486328125, -3.966552734375, -3.08447265625, -2.202392578125, -1.3203125, -0.438232421875, 0.44384765625, 1.325927734375, 2.2080078125, 3.090087890625, 3.97216796875, 4.854248046875, 5.736328125, 6.618408203125, 7.50048828125, 8.382568359375, 9.2646484375, 10.146728515625, 11.02880859375, 11.910888671875, 12.79296875, 13.675048828125, 14.55712890625, 15.439208984375, 16.3212890625, 17.203369140625, 18.08544921875, 18.967529296875, 19.849609375, 20.731689453125, 21.61376953125, 22.495849609375, 23.3779296875, 24.260009765625, 25.14208984375, 26.024169921875, 26.90625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 9.0, 11.0, 14.0, 24.0, 24.0, 29.0, 34.0, 50.0, 50.0, 62.0, 83.0, 108.0, 119.0, 169.0, 169.0, 184.0, 211.0, 261.0, 263.0, 260.0, 264.0, 261.0, 225.0, 226.0, 178.0, 152.0, 128.0, 108.0, 92.0, 66.0, 59.0, 47.0, 35.0, 33.0, 16.0, 19.0, 15.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-11.265625, -10.98223876953125, -10.6988525390625, -10.41546630859375, -10.132080078125, -9.84869384765625, -9.5653076171875, -9.28192138671875, -8.99853515625, -8.71514892578125, -8.4317626953125, -8.14837646484375, -7.864990234375, -7.58160400390625, -7.2982177734375, -7.01483154296875, -6.7314453125, -6.44805908203125, -6.1646728515625, -5.88128662109375, -5.597900390625, -5.31451416015625, -5.0311279296875, -4.74774169921875, -4.46435546875, -4.18096923828125, -3.8975830078125, -3.61419677734375, -3.330810546875, -3.04742431640625, -2.7640380859375, -2.48065185546875, -2.197265625, -1.91387939453125, -1.6304931640625, -1.34710693359375, -1.063720703125, -0.78033447265625, -0.4969482421875, -0.21356201171875, 0.06982421875, 0.35321044921875, 0.6365966796875, 0.91998291015625, 1.203369140625, 1.48675537109375, 1.7701416015625, 2.05352783203125, 2.3369140625, 2.62030029296875, 2.9036865234375, 3.18707275390625, 3.470458984375, 3.75384521484375, 4.0372314453125, 4.32061767578125, 4.60400390625, 4.88739013671875, 5.1707763671875, 5.45416259765625, 5.737548828125, 6.02093505859375, 6.3043212890625, 6.58770751953125, 6.87109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 3.0, 9.0, 8.0, 16.0, 10.0, 17.0, 18.0, 25.0, 30.0, 30.0, 44.0, 32.0, 35.0, 52.0, 49.0, 54.0, 57.0, 62.0, 48.0, 60.0, 54.0, 51.0, 34.0, 31.0, 24.0, 29.0, 23.0, 22.0, 15.0, 12.0, 15.0, 9.0, 7.0, 6.0, 0.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.61591148376465, -25.807968139648438, -25.000022888183594, -24.192079544067383, -23.384136199951172, -22.576190948486328, -21.768247604370117, -20.960304260253906, -20.152359008789062, -19.34441566467285, -18.536470413208008, -17.728527069091797, -16.920581817626953, -16.112638473510742, -15.304695129394531, -14.496750831604004, -13.688806533813477, -12.88086223602295, -12.072917938232422, -11.264974594116211, -10.457030296325684, -9.649085998535156, -8.841142654418945, -8.033198356628418, -7.225254058837891, -6.417309761047363, -5.609365940093994, -4.801422119140625, -3.9934778213500977, -3.1855335235595703, -2.377589702606201, -1.569645881652832, -0.7617034912109375, 0.04624056816101074, 0.854184627532959, 1.6621286869049072, 2.4700727462768555, 3.278017044067383, 4.085960865020752, 4.893904685974121, 5.701848983764648, 6.509793281555176, 7.317737102508545, 8.125680923461914, 8.933625221252441, 9.741569519042969, 10.54951286315918, 11.357457160949707, 12.165401458740234, 12.973345756530762, 13.781290054321289, 14.5892333984375, 15.397177696228027, 16.205121994018555, 17.013065338134766, 17.82101058959961, 18.62895393371582, 19.43689727783203, 20.244842529296875, 21.052785873413086, 21.860729217529297, 22.66867446899414, 23.47661781311035, 24.284561157226562, 25.092506408691406]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 15.0, 8.0, 10.0, 8.0, 15.0, 19.0, 10.0, 13.0, 20.0, 14.0, 21.0, 24.0, 35.0, 37.0, 26.0, 27.0, 26.0, 33.0, 43.0, 24.0, 38.0, 39.0, 34.0, 41.0, 44.0, 32.0, 26.0, 39.0, 27.0, 23.0, 21.0, 28.0, 24.0, 27.0, 27.0, 25.0, 16.0, 10.0, 3.0, 8.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-18.963850021362305, -18.39661979675293, -17.829391479492188, -17.262161254882812, -16.694931030273438, -16.127700805664062, -15.56047248840332, -14.993242263793945, -14.426012992858887, -13.858783721923828, -13.291553497314453, -12.724324226379395, -12.157094955444336, -11.589864730834961, -11.022635459899902, -10.455406188964844, -9.888175964355469, -9.32094669342041, -8.753716468811035, -8.186487197875977, -7.61925745010376, -7.052027702331543, -6.484798431396484, -5.917568683624268, -5.350338935852051, -4.783109188079834, -4.215879440307617, -3.6486501693725586, -3.081420421600342, -2.514190673828125, -1.9469611644744873, -1.3797316551208496, -0.8125038146972656, -0.24527418613433838, 0.32195544242858887, 0.8891850709915161, 1.4564146995544434, 2.02364444732666, 2.590873956680298, 3.1581034660339355, 3.7253332138061523, 4.292562961578369, 4.859792709350586, 5.4270219802856445, 5.994251728057861, 6.561481475830078, 7.128710746765137, 7.6959404945373535, 8.26317024230957, 8.830399513244629, 9.397629737854004, 9.964859008789062, 10.532089233398438, 11.099318504333496, 11.666547775268555, 12.23377799987793, 12.801007270812988, 13.368236541748047, 13.935466766357422, 14.50269603729248, 15.069925308227539, 15.637155532836914, 16.20438575744629, 16.77161407470703, 17.338844299316406]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 8.0, 14.0, 19.0, 26.0, 39.0, 58.0, 93.0, 152.0, 204.0, 334.0, 495.0, 743.0, 1109.0, 1628.0, 2787.0, 4120.0, 6520.0, 10517.0, 17327.0, 27917.0, 45801.0, 73928.0, 116221.0, 165047.0, 180387.0, 143419.0, 94948.0, 59323.0, 36292.0, 21903.0, 13584.0, 8538.0, 5369.0, 3271.0, 2237.0, 1384.0, 964.0, 604.0, 414.0, 283.0, 166.0, 131.0, 84.0, 55.0, 26.0, 25.0, 17.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-55.03125, -53.42529296875, -51.8193359375, -50.21337890625, -48.607421875, -47.00146484375, -45.3955078125, -43.78955078125, -42.18359375, -40.57763671875, -38.9716796875, -37.36572265625, -35.759765625, -34.15380859375, -32.5478515625, -30.94189453125, -29.3359375, -27.72998046875, -26.1240234375, -24.51806640625, -22.912109375, -21.30615234375, -19.7001953125, -18.09423828125, -16.48828125, -14.88232421875, -13.2763671875, -11.67041015625, -10.064453125, -8.45849609375, -6.8525390625, -5.24658203125, -3.640625, -2.03466796875, -0.4287109375, 1.17724609375, 2.783203125, 4.38916015625, 5.9951171875, 7.60107421875, 9.20703125, 10.81298828125, 12.4189453125, 14.02490234375, 15.630859375, 17.23681640625, 18.8427734375, 20.44873046875, 22.0546875, 23.66064453125, 25.2666015625, 26.87255859375, 28.478515625, 30.08447265625, 31.6904296875, 33.29638671875, 34.90234375, 36.50830078125, 38.1142578125, 39.72021484375, 41.326171875, 42.93212890625, 44.5380859375, 46.14404296875, 47.75]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 11.0, 15.0, 11.0, 18.0, 18.0, 20.0, 20.0, 20.0, 23.0, 32.0, 27.0, 24.0, 33.0, 31.0, 55.0, 38.0, 33.0, 36.0, 47.0, 37.0, 45.0, 53.0, 31.0, 45.0, 28.0, 33.0, 33.0, 23.0, 28.0, 27.0, 18.0, 14.0, 16.0, 17.0, 7.0, 5.0, 5.0, 1.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -19.167236328125, -18.60009765625, -18.032958984375, -17.4658203125, -16.898681640625, -16.33154296875, -15.764404296875, -15.197265625, -14.630126953125, -14.06298828125, -13.495849609375, -12.9287109375, -12.361572265625, -11.79443359375, -11.227294921875, -10.66015625, -10.093017578125, -9.52587890625, -8.958740234375, -8.3916015625, -7.824462890625, -7.25732421875, -6.690185546875, -6.123046875, -5.555908203125, -4.98876953125, -4.421630859375, -3.8544921875, -3.287353515625, -2.72021484375, -2.153076171875, -1.5859375, -1.018798828125, -0.45166015625, 0.115478515625, 0.6826171875, 1.249755859375, 1.81689453125, 2.384033203125, 2.951171875, 3.518310546875, 4.08544921875, 4.652587890625, 5.2197265625, 5.786865234375, 6.35400390625, 6.921142578125, 7.48828125, 8.055419921875, 8.62255859375, 9.189697265625, 9.7568359375, 10.323974609375, 10.89111328125, 11.458251953125, 12.025390625, 12.592529296875, 13.15966796875, 13.726806640625, 14.2939453125, 14.861083984375, 15.42822265625, 15.995361328125, 16.5625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 13.0, 20.0, 23.0, 33.0, 55.0, 50.0, 110.0, 195.0, 278.0, 390.0, 628.0, 999.0, 1556.0, 2499.0, 4050.0, 6426.0, 10859.0, 17719.0, 29636.0, 51209.0, 89309.0, 151029.0, 218621.0, 186587.0, 114507.0, 66139.0, 38094.0, 22564.0, 13515.0, 8048.0, 4951.0, 3092.0, 1924.0, 1239.0, 788.0, 476.0, 342.0, 204.0, 129.0, 82.0, 61.0, 32.0, 24.0, 12.0, 15.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0], "bins": [-55.25, -53.70361328125, -52.1572265625, -50.61083984375, -49.064453125, -47.51806640625, -45.9716796875, -44.42529296875, -42.87890625, -41.33251953125, -39.7861328125, -38.23974609375, -36.693359375, -35.14697265625, -33.6005859375, -32.05419921875, -30.5078125, -28.96142578125, -27.4150390625, -25.86865234375, -24.322265625, -22.77587890625, -21.2294921875, -19.68310546875, -18.13671875, -16.59033203125, -15.0439453125, -13.49755859375, -11.951171875, -10.40478515625, -8.8583984375, -7.31201171875, -5.765625, -4.21923828125, -2.6728515625, -1.12646484375, 0.419921875, 1.96630859375, 3.5126953125, 5.05908203125, 6.60546875, 8.15185546875, 9.6982421875, 11.24462890625, 12.791015625, 14.33740234375, 15.8837890625, 17.43017578125, 18.9765625, 20.52294921875, 22.0693359375, 23.61572265625, 25.162109375, 26.70849609375, 28.2548828125, 29.80126953125, 31.34765625, 32.89404296875, 34.4404296875, 35.98681640625, 37.533203125, 39.07958984375, 40.6259765625, 42.17236328125, 43.71875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 10.0, 10.0, 8.0, 17.0, 16.0, 28.0, 18.0, 26.0, 31.0, 42.0, 26.0, 47.0, 44.0, 42.0, 44.0, 53.0, 51.0, 41.0, 54.0, 37.0, 39.0, 36.0, 43.0, 41.0, 19.0, 31.0, 25.0, 23.0, 12.0, 13.0, 12.0, 12.0, 11.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.203125, -12.738525390625, -12.27392578125, -11.809326171875, -11.3447265625, -10.880126953125, -10.41552734375, -9.950927734375, -9.486328125, -9.021728515625, -8.55712890625, -8.092529296875, -7.6279296875, -7.163330078125, -6.69873046875, -6.234130859375, -5.76953125, -5.304931640625, -4.84033203125, -4.375732421875, -3.9111328125, -3.446533203125, -2.98193359375, -2.517333984375, -2.052734375, -1.588134765625, -1.12353515625, -0.658935546875, -0.1943359375, 0.270263671875, 0.73486328125, 1.199462890625, 1.6640625, 2.128662109375, 2.59326171875, 3.057861328125, 3.5224609375, 3.987060546875, 4.45166015625, 4.916259765625, 5.380859375, 5.845458984375, 6.31005859375, 6.774658203125, 7.2392578125, 7.703857421875, 8.16845703125, 8.633056640625, 9.09765625, 9.562255859375, 10.02685546875, 10.491455078125, 10.9560546875, 11.420654296875, 11.88525390625, 12.349853515625, 12.814453125, 13.279052734375, 13.74365234375, 14.208251953125, 14.6728515625, 15.137451171875, 15.60205078125, 16.066650390625, 16.53125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 12.0, 14.0, 8.0, 23.0, 39.0, 36.0, 54.0, 119.0, 160.0, 270.0, 448.0, 712.0, 1374.0, 2695.0, 5023.0, 10373.0, 23981.0, 59545.0, 173257.0, 422047.0, 221130.0, 73494.0, 28639.0, 12327.0, 5922.0, 3004.0, 1594.0, 866.0, 538.0, 292.0, 169.0, 124.0, 95.0, 54.0, 34.0, 19.0, 14.0, 7.0, 9.0, 7.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.6875, -46.1787109375, -44.669921875, -43.1611328125, -41.65234375, -40.1435546875, -38.634765625, -37.1259765625, -35.6171875, -34.1083984375, -32.599609375, -31.0908203125, -29.58203125, -28.0732421875, -26.564453125, -25.0556640625, -23.546875, -22.0380859375, -20.529296875, -19.0205078125, -17.51171875, -16.0029296875, -14.494140625, -12.9853515625, -11.4765625, -9.9677734375, -8.458984375, -6.9501953125, -5.44140625, -3.9326171875, -2.423828125, -0.9150390625, 0.59375, 2.1025390625, 3.611328125, 5.1201171875, 6.62890625, 8.1376953125, 9.646484375, 11.1552734375, 12.6640625, 14.1728515625, 15.681640625, 17.1904296875, 18.69921875, 20.2080078125, 21.716796875, 23.2255859375, 24.734375, 26.2431640625, 27.751953125, 29.2607421875, 30.76953125, 32.2783203125, 33.787109375, 35.2958984375, 36.8046875, 38.3134765625, 39.822265625, 41.3310546875, 42.83984375, 44.3486328125, 45.857421875, 47.3662109375, 48.875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 12.0, 26.0, 18.0, 39.0, 75.0, 101.0, 154.0, 179.0, 123.0, 84.0, 45.0, 43.0, 23.0, 13.0, 13.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0063323974609375, -0.006166338920593262, -0.0060002803802490234, -0.005834221839904785, -0.005668163299560547, -0.005502104759216309, -0.00533604621887207, -0.005169987678527832, -0.005003929138183594, -0.0048378705978393555, -0.004671812057495117, -0.004505753517150879, -0.004339694976806641, -0.004173636436462402, -0.004007577896118164, -0.0038415193557739258, -0.0036754608154296875, -0.0035094022750854492, -0.003343343734741211, -0.0031772851943969727, -0.0030112266540527344, -0.002845168113708496, -0.002679109573364258, -0.0025130510330200195, -0.0023469924926757812, -0.002180933952331543, -0.0020148754119873047, -0.0018488168716430664, -0.0016827583312988281, -0.0015166997909545898, -0.0013506412506103516, -0.0011845827102661133, -0.001018524169921875, -0.0008524656295776367, -0.0006864070892333984, -0.0005203485488891602, -0.0003542900085449219, -0.0001882314682006836, -2.2172927856445312e-05, 0.00014388561248779297, 0.00030994415283203125, 0.00047600269317626953, 0.0006420612335205078, 0.0008081197738647461, 0.0009741783142089844, 0.0011402368545532227, 0.001306295394897461, 0.0014723539352416992, 0.0016384124755859375, 0.0018044710159301758, 0.001970529556274414, 0.0021365880966186523, 0.0023026466369628906, 0.002468705177307129, 0.002634763717651367, 0.0028008222579956055, 0.0029668807983398438, 0.003132939338684082, 0.0032989978790283203, 0.0034650564193725586, 0.003631114959716797, 0.003797173500061035, 0.0039632320404052734, 0.004129290580749512, 0.00429534912109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 12.0, 16.0, 14.0, 26.0, 38.0, 57.0, 103.0, 148.0, 232.0, 370.0, 579.0, 952.0, 1470.0, 2456.0, 3779.0, 6862.0, 11724.0, 20516.0, 36638.0, 66921.0, 121261.0, 197310.0, 222119.0, 155425.0, 88166.0, 48194.0, 26423.0, 14909.0, 8535.0, 5194.0, 3051.0, 1879.0, 1195.0, 691.0, 454.0, 297.0, 184.0, 111.0, 75.0, 57.0, 38.0, 18.0, 17.0, 12.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0], "bins": [-24.046875, -23.3642578125, -22.681640625, -21.9990234375, -21.31640625, -20.6337890625, -19.951171875, -19.2685546875, -18.5859375, -17.9033203125, -17.220703125, -16.5380859375, -15.85546875, -15.1728515625, -14.490234375, -13.8076171875, -13.125, -12.4423828125, -11.759765625, -11.0771484375, -10.39453125, -9.7119140625, -9.029296875, -8.3466796875, -7.6640625, -6.9814453125, -6.298828125, -5.6162109375, -4.93359375, -4.2509765625, -3.568359375, -2.8857421875, -2.203125, -1.5205078125, -0.837890625, -0.1552734375, 0.52734375, 1.2099609375, 1.892578125, 2.5751953125, 3.2578125, 3.9404296875, 4.623046875, 5.3056640625, 5.98828125, 6.6708984375, 7.353515625, 8.0361328125, 8.71875, 9.4013671875, 10.083984375, 10.7666015625, 11.44921875, 12.1318359375, 12.814453125, 13.4970703125, 14.1796875, 14.8623046875, 15.544921875, 16.2275390625, 16.91015625, 17.5927734375, 18.275390625, 18.9580078125, 19.640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 3.0, 9.0, 8.0, 7.0, 16.0, 11.0, 16.0, 19.0, 22.0, 38.0, 35.0, 31.0, 38.0, 41.0, 66.0, 61.0, 57.0, 60.0, 64.0, 56.0, 36.0, 50.0, 43.0, 31.0, 31.0, 32.0, 26.0, 17.0, 15.0, 11.0, 10.0, 7.0, 7.0, 7.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.89984130859375, -5.6785888671875, -5.45733642578125, -5.236083984375, -5.01483154296875, -4.7935791015625, -4.57232666015625, -4.35107421875, -4.12982177734375, -3.9085693359375, -3.68731689453125, -3.466064453125, -3.24481201171875, -3.0235595703125, -2.80230712890625, -2.5810546875, -2.35980224609375, -2.1385498046875, -1.91729736328125, -1.696044921875, -1.47479248046875, -1.2535400390625, -1.03228759765625, -0.81103515625, -0.58978271484375, -0.3685302734375, -0.14727783203125, 0.073974609375, 0.29522705078125, 0.5164794921875, 0.73773193359375, 0.958984375, 1.18023681640625, 1.4014892578125, 1.62274169921875, 1.843994140625, 2.06524658203125, 2.2864990234375, 2.50775146484375, 2.72900390625, 2.95025634765625, 3.1715087890625, 3.39276123046875, 3.614013671875, 3.83526611328125, 4.0565185546875, 4.27777099609375, 4.4990234375, 4.72027587890625, 4.9415283203125, 5.16278076171875, 5.384033203125, 5.60528564453125, 5.8265380859375, 6.04779052734375, 6.26904296875, 6.49029541015625, 6.7115478515625, 6.93280029296875, 7.154052734375, 7.37530517578125, 7.5965576171875, 7.81781005859375, 8.0390625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 5.0, 2.0, 7.0, 3.0, 11.0, 17.0, 21.0, 12.0, 14.0, 18.0, 28.0, 41.0, 28.0, 40.0, 42.0, 42.0, 46.0, 60.0, 53.0, 58.0, 47.0, 49.0, 48.0, 44.0, 32.0, 30.0, 28.0, 34.0, 22.0, 17.0, 13.0, 16.0, 13.0, 13.0, 14.0, 8.0, 2.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.716218948364258, -17.10547637939453, -16.494731903076172, -15.883988380432129, -15.273244857788086, -14.66250228881836, -14.051758766174316, -13.441015243530273, -12.83027172088623, -12.219528198242188, -11.608784675598145, -10.998041152954102, -10.387298583984375, -9.776554107666016, -9.165811538696289, -8.555068016052246, -7.944324493408203, -7.33358097076416, -6.722837448120117, -6.112094402313232, -5.5013508796691895, -4.8906073570251465, -4.279864311218262, -3.6691207885742188, -3.058377265930176, -2.447633743286133, -1.836890459060669, -1.2261470556259155, -0.6154036521911621, -0.004660129547119141, 0.6060831546783447, 1.2168264389038086, 1.8275699615478516, 2.4383134841918945, 3.0490567684173584, 3.6598000526428223, 4.270543575286865, 4.881287097930908, 5.492030143737793, 6.102773666381836, 6.713517189025879, 7.324260711669922, 7.935004234313965, 8.545747756958008, 9.156490325927734, 9.767234802246094, 10.37797737121582, 10.988720893859863, 11.599464416503906, 12.21020793914795, 12.820951461791992, 13.431694984436035, 14.042438507080078, 14.653181076049805, 15.263924598693848, 15.87466812133789, 16.48541259765625, 17.096155166625977, 17.706899642944336, 18.317642211914062, 18.928386688232422, 19.53912925720215, 20.149873733520508, 20.760616302490234, 21.37135887145996]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 3.0, 10.0, 3.0, 11.0, 7.0, 11.0, 9.0, 16.0, 19.0, 25.0, 7.0, 20.0, 16.0, 16.0, 31.0, 28.0, 25.0, 27.0, 26.0, 31.0, 38.0, 37.0, 48.0, 34.0, 33.0, 34.0, 38.0, 40.0, 24.0, 26.0, 36.0, 30.0, 39.0, 28.0, 26.0, 23.0, 20.0, 16.0, 14.0, 14.0, 11.0, 7.0, 10.0, 3.0, 8.0, 5.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0], "bins": [-15.952142715454102, -15.489089965820312, -15.026036262512207, -14.562983512878418, -14.099930763244629, -13.636877059936523, -13.173824310302734, -12.710771560668945, -12.247718811035156, -11.784666061401367, -11.321612358093262, -10.858559608459473, -10.395506858825684, -9.932453155517578, -9.469400405883789, -9.00634765625, -8.543293952941895, -8.080241203308105, -7.617187976837158, -7.154134750366211, -6.691082000732422, -6.228028774261475, -5.764975547790527, -5.301922798156738, -4.838869571685791, -4.375816345214844, -3.9127635955810547, -3.4497103691101074, -2.9866573810577393, -2.523604393005371, -2.060551166534424, -1.5974981784820557, -1.1344451904296875, -0.6713921427726746, -0.20833909511566162, 0.2547140121459961, 0.7177670001983643, 1.1808199882507324, 1.6438732147216797, 2.106926202774048, 2.569979190826416, 3.033032178878784, 3.4960851669311523, 3.9591383934020996, 4.422191619873047, 4.885244369506836, 5.348297595977783, 5.8113508224487305, 6.2744035720825195, 6.737456798553467, 7.200509548187256, 7.663562774658203, 8.126615524291992, 8.589668273925781, 9.052721977233887, 9.515774726867676, 9.978828430175781, 10.44188117980957, 10.904934883117676, 11.367987632751465, 11.831040382385254, 12.29409408569336, 12.757146835327148, 13.220199584960938, 13.683252334594727]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 9.0, 16.0, 19.0, 29.0, 47.0, 55.0, 109.0, 171.0, 228.0, 376.0, 600.0, 933.0, 1345.0, 2104.0, 3200.0, 4914.0, 7927.0, 11628.0, 17931.0, 26828.0, 39293.0, 56017.0, 76647.0, 97887.0, 116202.0, 122878.0, 115679.0, 97586.0, 75650.0, 55746.0, 39352.0, 26012.0, 17682.0, 11662.0, 7668.0, 4910.0, 3145.0, 2144.0, 1325.0, 860.0, 589.0, 427.0, 249.0, 151.0, 98.0, 66.0, 62.0, 39.0, 33.0, 10.0, 5.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0], "bins": [-14.1015625, -13.66748046875, -13.2333984375, -12.79931640625, -12.365234375, -11.93115234375, -11.4970703125, -11.06298828125, -10.62890625, -10.19482421875, -9.7607421875, -9.32666015625, -8.892578125, -8.45849609375, -8.0244140625, -7.59033203125, -7.15625, -6.72216796875, -6.2880859375, -5.85400390625, -5.419921875, -4.98583984375, -4.5517578125, -4.11767578125, -3.68359375, -3.24951171875, -2.8154296875, -2.38134765625, -1.947265625, -1.51318359375, -1.0791015625, -0.64501953125, -0.2109375, 0.22314453125, 0.6572265625, 1.09130859375, 1.525390625, 1.95947265625, 2.3935546875, 2.82763671875, 3.26171875, 3.69580078125, 4.1298828125, 4.56396484375, 4.998046875, 5.43212890625, 5.8662109375, 6.30029296875, 6.734375, 7.16845703125, 7.6025390625, 8.03662109375, 8.470703125, 8.90478515625, 9.3388671875, 9.77294921875, 10.20703125, 10.64111328125, 11.0751953125, 11.50927734375, 11.943359375, 12.37744140625, 12.8115234375, 13.24560546875, 13.6796875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 7.0, 11.0, 10.0, 12.0, 13.0, 13.0, 15.0, 26.0, 21.0, 26.0, 22.0, 19.0, 26.0, 31.0, 33.0, 45.0, 34.0, 38.0, 26.0, 41.0, 36.0, 34.0, 41.0, 46.0, 41.0, 38.0, 31.0, 39.0, 35.0, 24.0, 22.0, 26.0, 18.0, 24.0, 12.0, 13.0, 6.0, 8.0, 3.0, 4.0, 9.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.0, -16.5118408203125, -16.023681640625, -15.5355224609375, -15.04736328125, -14.5592041015625, -14.071044921875, -13.5828857421875, -13.0947265625, -12.6065673828125, -12.118408203125, -11.6302490234375, -11.14208984375, -10.6539306640625, -10.165771484375, -9.6776123046875, -9.189453125, -8.7012939453125, -8.213134765625, -7.7249755859375, -7.23681640625, -6.7486572265625, -6.260498046875, -5.7723388671875, -5.2841796875, -4.7960205078125, -4.307861328125, -3.8197021484375, -3.33154296875, -2.8433837890625, -2.355224609375, -1.8670654296875, -1.37890625, -0.8907470703125, -0.402587890625, 0.0855712890625, 0.57373046875, 1.0618896484375, 1.550048828125, 2.0382080078125, 2.5263671875, 3.0145263671875, 3.502685546875, 3.9908447265625, 4.47900390625, 4.9671630859375, 5.455322265625, 5.9434814453125, 6.431640625, 6.9197998046875, 7.407958984375, 7.8961181640625, 8.38427734375, 8.8724365234375, 9.360595703125, 9.8487548828125, 10.3369140625, 10.8250732421875, 11.313232421875, 11.8013916015625, 12.28955078125, 12.7777099609375, 13.265869140625, 13.7540283203125, 14.2421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 18.0, 26.0, 38.0, 65.0, 96.0, 138.0, 245.0, 403.0, 635.0, 1006.0, 1641.0, 2600.0, 4256.0, 7128.0, 11837.0, 19805.0, 33984.0, 56633.0, 90273.0, 131245.0, 162559.0, 163079.0, 131186.0, 89765.0, 56385.0, 33461.0, 19884.0, 11973.0, 7049.0, 4295.0, 2544.0, 1616.0, 994.0, 577.0, 409.0, 243.0, 167.0, 112.0, 60.0, 45.0, 26.0, 16.0, 8.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.9375, -18.3963623046875, -17.855224609375, -17.3140869140625, -16.77294921875, -16.2318115234375, -15.690673828125, -15.1495361328125, -14.6083984375, -14.0672607421875, -13.526123046875, -12.9849853515625, -12.44384765625, -11.9027099609375, -11.361572265625, -10.8204345703125, -10.279296875, -9.7381591796875, -9.197021484375, -8.6558837890625, -8.11474609375, -7.5736083984375, -7.032470703125, -6.4913330078125, -5.9501953125, -5.4090576171875, -4.867919921875, -4.3267822265625, -3.78564453125, -3.2445068359375, -2.703369140625, -2.1622314453125, -1.62109375, -1.0799560546875, -0.538818359375, 0.0023193359375, 0.54345703125, 1.0845947265625, 1.625732421875, 2.1668701171875, 2.7080078125, 3.2491455078125, 3.790283203125, 4.3314208984375, 4.87255859375, 5.4136962890625, 5.954833984375, 6.4959716796875, 7.037109375, 7.5782470703125, 8.119384765625, 8.6605224609375, 9.20166015625, 9.7427978515625, 10.283935546875, 10.8250732421875, 11.3662109375, 11.9073486328125, 12.448486328125, 12.9896240234375, 13.53076171875, 14.0718994140625, 14.613037109375, 15.1541748046875, 15.6953125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 5.0, 9.0, 6.0, 8.0, 13.0, 7.0, 11.0, 16.0, 20.0, 31.0, 26.0, 29.0, 24.0, 42.0, 57.0, 40.0, 39.0, 28.0, 37.0, 36.0, 51.0, 46.0, 37.0, 39.0, 52.0, 41.0, 38.0, 25.0, 30.0, 25.0, 21.0, 17.0, 20.0, 20.0, 10.0, 10.0, 11.0, 7.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-12.0859375, -11.73095703125, -11.3759765625, -11.02099609375, -10.666015625, -10.31103515625, -9.9560546875, -9.60107421875, -9.24609375, -8.89111328125, -8.5361328125, -8.18115234375, -7.826171875, -7.47119140625, -7.1162109375, -6.76123046875, -6.40625, -6.05126953125, -5.6962890625, -5.34130859375, -4.986328125, -4.63134765625, -4.2763671875, -3.92138671875, -3.56640625, -3.21142578125, -2.8564453125, -2.50146484375, -2.146484375, -1.79150390625, -1.4365234375, -1.08154296875, -0.7265625, -0.37158203125, -0.0166015625, 0.33837890625, 0.693359375, 1.04833984375, 1.4033203125, 1.75830078125, 2.11328125, 2.46826171875, 2.8232421875, 3.17822265625, 3.533203125, 3.88818359375, 4.2431640625, 4.59814453125, 4.953125, 5.30810546875, 5.6630859375, 6.01806640625, 6.373046875, 6.72802734375, 7.0830078125, 7.43798828125, 7.79296875, 8.14794921875, 8.5029296875, 8.85791015625, 9.212890625, 9.56787109375, 9.9228515625, 10.27783203125, 10.6328125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 10.0, 11.0, 11.0, 16.0, 45.0, 49.0, 67.0, 116.0, 182.0, 265.0, 416.0, 721.0, 1105.0, 1865.0, 3070.0, 5470.0, 9774.0, 18251.0, 36446.0, 75226.0, 151489.0, 243525.0, 230707.0, 134680.0, 65333.0, 32259.0, 16489.0, 8825.0, 4873.0, 2820.0, 1666.0, 1007.0, 639.0, 410.0, 247.0, 168.0, 100.0, 66.0, 53.0, 30.0, 15.0, 9.0, 6.0, 5.0, 1.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.203125, -14.67724609375, -14.1513671875, -13.62548828125, -13.099609375, -12.57373046875, -12.0478515625, -11.52197265625, -10.99609375, -10.47021484375, -9.9443359375, -9.41845703125, -8.892578125, -8.36669921875, -7.8408203125, -7.31494140625, -6.7890625, -6.26318359375, -5.7373046875, -5.21142578125, -4.685546875, -4.15966796875, -3.6337890625, -3.10791015625, -2.58203125, -2.05615234375, -1.5302734375, -1.00439453125, -0.478515625, 0.04736328125, 0.5732421875, 1.09912109375, 1.625, 2.15087890625, 2.6767578125, 3.20263671875, 3.728515625, 4.25439453125, 4.7802734375, 5.30615234375, 5.83203125, 6.35791015625, 6.8837890625, 7.40966796875, 7.935546875, 8.46142578125, 8.9873046875, 9.51318359375, 10.0390625, 10.56494140625, 11.0908203125, 11.61669921875, 12.142578125, 12.66845703125, 13.1943359375, 13.72021484375, 14.24609375, 14.77197265625, 15.2978515625, 15.82373046875, 16.349609375, 16.87548828125, 17.4013671875, 17.92724609375, 18.453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 27.0, 28.0, 47.0, 38.0, 59.0, 71.0, 82.0, 73.0, 90.0, 77.0, 64.0, 57.0, 42.0, 46.0, 39.0, 28.0, 18.0, 11.0, 8.0, 12.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019388198852539062, -0.0018799751996994019, -0.0018211305141448975, -0.001762285828590393, -0.0017034411430358887, -0.0016445964574813843, -0.0015857517719268799, -0.0015269070863723755, -0.001468062400817871, -0.0014092177152633667, -0.0013503730297088623, -0.001291528344154358, -0.0012326836585998535, -0.0011738389730453491, -0.0011149942874908447, -0.0010561496019363403, -0.000997304916381836, -0.0009384602308273315, -0.0008796155452728271, -0.0008207708597183228, -0.0007619261741638184, -0.000703081488609314, -0.0006442368030548096, -0.0005853921175003052, -0.0005265474319458008, -0.0004677027463912964, -0.000408858060836792, -0.0003500133752822876, -0.0002911686897277832, -0.0002323240041732788, -0.00017347931861877441, -0.00011463463306427002, -5.5789947509765625e-05, 3.0547380447387695e-06, 6.189942359924316e-05, 0.00012074410915374756, 0.00017958879470825195, 0.00023843348026275635, 0.00029727816581726074, 0.00035612285137176514, 0.00041496753692626953, 0.0004738122224807739, 0.0005326569080352783, 0.0005915015935897827, 0.0006503462791442871, 0.0007091909646987915, 0.0007680356502532959, 0.0008268803358078003, 0.0008857250213623047, 0.0009445697069168091, 0.0010034143924713135, 0.0010622590780258179, 0.0011211037635803223, 0.0011799484491348267, 0.001238793134689331, 0.0012976378202438354, 0.0013564825057983398, 0.0014153271913528442, 0.0014741718769073486, 0.001533016562461853, 0.0015918612480163574, 0.0016507059335708618, 0.0017095506191253662, 0.0017683953046798706, 0.001827239990234375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 14.0, 17.0, 28.0, 33.0, 44.0, 73.0, 77.0, 131.0, 203.0, 269.0, 393.0, 583.0, 917.0, 1412.0, 2358.0, 3821.0, 6765.0, 11526.0, 21451.0, 39784.0, 74939.0, 134561.0, 205545.0, 213045.0, 148133.0, 83228.0, 44121.0, 23500.0, 13006.0, 7272.0, 4198.0, 2532.0, 1511.0, 1013.0, 617.0, 451.0, 293.0, 203.0, 160.0, 101.0, 48.0, 57.0, 28.0, 21.0, 21.0, 9.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.7890625, -14.328125, -13.8671875, -13.40625, -12.9453125, -12.484375, -12.0234375, -11.5625, -11.1015625, -10.640625, -10.1796875, -9.71875, -9.2578125, -8.796875, -8.3359375, -7.875, -7.4140625, -6.953125, -6.4921875, -6.03125, -5.5703125, -5.109375, -4.6484375, -4.1875, -3.7265625, -3.265625, -2.8046875, -2.34375, -1.8828125, -1.421875, -0.9609375, -0.5, -0.0390625, 0.421875, 0.8828125, 1.34375, 1.8046875, 2.265625, 2.7265625, 3.1875, 3.6484375, 4.109375, 4.5703125, 5.03125, 5.4921875, 5.953125, 6.4140625, 6.875, 7.3359375, 7.796875, 8.2578125, 8.71875, 9.1796875, 9.640625, 10.1015625, 10.5625, 11.0234375, 11.484375, 11.9453125, 12.40625, 12.8671875, 13.328125, 13.7890625, 14.25, 14.7109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 4.0, 6.0, 4.0, 8.0, 13.0, 16.0, 14.0, 16.0, 22.0, 27.0, 35.0, 43.0, 39.0, 35.0, 48.0, 52.0, 57.0, 58.0, 47.0, 48.0, 51.0, 48.0, 47.0, 29.0, 38.0, 39.0, 35.0, 22.0, 9.0, 18.0, 9.0, 7.0, 11.0, 7.0, 6.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.91998291015625, -3.8009033203125, -3.68182373046875, -3.562744140625, -3.44366455078125, -3.3245849609375, -3.20550537109375, -3.08642578125, -2.96734619140625, -2.8482666015625, -2.72918701171875, -2.610107421875, -2.49102783203125, -2.3719482421875, -2.25286865234375, -2.1337890625, -2.01470947265625, -1.8956298828125, -1.77655029296875, -1.657470703125, -1.53839111328125, -1.4193115234375, -1.30023193359375, -1.18115234375, -1.06207275390625, -0.9429931640625, -0.82391357421875, -0.704833984375, -0.58575439453125, -0.4666748046875, -0.34759521484375, -0.228515625, -0.10943603515625, 0.0096435546875, 0.12872314453125, 0.247802734375, 0.36688232421875, 0.4859619140625, 0.60504150390625, 0.72412109375, 0.84320068359375, 0.9622802734375, 1.08135986328125, 1.200439453125, 1.31951904296875, 1.4385986328125, 1.55767822265625, 1.6767578125, 1.79583740234375, 1.9149169921875, 2.03399658203125, 2.153076171875, 2.27215576171875, 2.3912353515625, 2.51031494140625, 2.62939453125, 2.74847412109375, 2.8675537109375, 2.98663330078125, 3.105712890625, 3.22479248046875, 3.3438720703125, 3.46295166015625, 3.58203125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 7.0, 8.0, 9.0, 14.0, 13.0, 20.0, 21.0, 16.0, 24.0, 41.0, 44.0, 29.0, 54.0, 54.0, 49.0, 49.0, 61.0, 53.0, 53.0, 38.0, 56.0, 35.0, 31.0, 33.0, 23.0, 34.0, 19.0, 20.0, 22.0, 9.0, 7.0, 11.0, 6.0, 6.0, 3.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.620800018310547, -17.036314010620117, -16.451826095581055, -15.867340087890625, -15.282854080200195, -14.69836711883545, -14.113880157470703, -13.529394149780273, -12.944907188415527, -12.360420227050781, -11.775934219360352, -11.191447257995605, -10.60696029663086, -10.02247428894043, -9.437987327575684, -8.853500366210938, -8.269014358520508, -7.68452787399292, -7.100041389465332, -6.515554428100586, -5.931067943572998, -5.34658145904541, -4.762094497680664, -4.177608013153076, -3.5931215286254883, -3.0086350440979004, -2.4241483211517334, -1.839661717414856, -1.2551751136779785, -0.6706886291503906, -0.08620190620422363, 0.49828481674194336, 1.082773208618164, 1.6672598123550415, 2.251746416091919, 2.836233139038086, 3.420719623565674, 4.005206108093262, 4.589693069458008, 5.174179553985596, 5.758666038513184, 6.3431525230407715, 6.927639007568359, 7.5121259689331055, 8.096612930297852, 8.681098937988281, 9.265585899353027, 9.850072860717773, 10.434558868408203, 11.01904582977295, 11.603531837463379, 12.188018798828125, 12.772504806518555, 13.3569917678833, 13.941478729248047, 14.525964736938477, 15.110451698303223, 15.694938659667969, 16.2794246673584, 16.863910675048828, 17.44839859008789, 18.03288459777832, 18.61737060546875, 19.201858520507812, 19.786344528198242]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 10.0, 12.0, 11.0, 7.0, 16.0, 13.0, 12.0, 15.0, 19.0, 21.0, 24.0, 18.0, 24.0, 31.0, 31.0, 28.0, 30.0, 32.0, 36.0, 39.0, 38.0, 34.0, 37.0, 33.0, 42.0, 35.0, 36.0, 29.0, 34.0, 34.0, 21.0, 28.0, 23.0, 21.0, 24.0, 14.0, 11.0, 13.0, 18.0, 10.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.68523120880127, -14.213888168334961, -13.742544174194336, -13.271201133728027, -12.799858093261719, -12.328514099121094, -11.857171058654785, -11.385828018188477, -10.914484024047852, -10.443140983581543, -9.971796989440918, -9.50045394897461, -9.029109954833984, -8.557766914367676, -8.086423873901367, -7.6150803565979, -7.143736839294434, -6.672393321990967, -6.2010498046875, -5.729706764221191, -5.258363246917725, -4.787019729614258, -4.315676689147949, -3.8443331718444824, -3.3729896545410156, -2.901646137237549, -2.430302858352661, -1.9589594602584839, -1.4876160621643066, -1.0162725448608398, -0.5449292659759521, -0.07358598709106445, 0.39775657653808594, 0.8690999746322632, 1.3404433727264404, 1.8117867708206177, 2.283130168914795, 2.7544736862182617, 3.2258169651031494, 3.697160243988037, 4.168503761291504, 4.639847278594971, 5.1111907958984375, 5.582533836364746, 6.053877353668213, 6.52522087097168, 6.996563911437988, 7.467907428741455, 7.939250946044922, 8.41059398651123, 8.881937980651855, 9.353281021118164, 9.824625015258789, 10.295968055725098, 10.767311096191406, 11.238655090332031, 11.70999813079834, 12.181341171264648, 12.652685165405273, 13.124028205871582, 13.59537124633789, 14.066715240478516, 14.538058280944824, 15.009401321411133, 15.480745315551758]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 30.0, 21.0, 30.0, 45.0, 78.0, 125.0, 181.0, 256.0, 409.0, 629.0, 987.0, 1613.0, 2600.0, 3996.0, 6389.0, 10570.0, 17536.0, 29591.0, 52230.0, 95677.0, 185083.0, 375865.0, 697923.0, 940429.0, 801701.0, 469654.0, 231632.0, 117300.0, 62804.0, 35188.0, 20507.0, 12638.0, 7662.0, 4791.0, 2964.0, 1800.0, 1173.0, 777.0, 508.0, 308.0, 203.0, 125.0, 93.0, 58.0, 29.0, 23.0, 13.0, 10.0, 6.0, 8.0, 1.0, 0.0, 3.0], "bins": [-16.5625, -16.084716796875, -15.60693359375, -15.129150390625, -14.6513671875, -14.173583984375, -13.69580078125, -13.218017578125, -12.740234375, -12.262451171875, -11.78466796875, -11.306884765625, -10.8291015625, -10.351318359375, -9.87353515625, -9.395751953125, -8.91796875, -8.440185546875, -7.96240234375, -7.484619140625, -7.0068359375, -6.529052734375, -6.05126953125, -5.573486328125, -5.095703125, -4.617919921875, -4.14013671875, -3.662353515625, -3.1845703125, -2.706787109375, -2.22900390625, -1.751220703125, -1.2734375, -0.795654296875, -0.31787109375, 0.159912109375, 0.6376953125, 1.115478515625, 1.59326171875, 2.071044921875, 2.548828125, 3.026611328125, 3.50439453125, 3.982177734375, 4.4599609375, 4.937744140625, 5.41552734375, 5.893310546875, 6.37109375, 6.848876953125, 7.32666015625, 7.804443359375, 8.2822265625, 8.760009765625, 9.23779296875, 9.715576171875, 10.193359375, 10.671142578125, 11.14892578125, 11.626708984375, 12.1044921875, 12.582275390625, 13.06005859375, 13.537841796875, 14.015625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 12.0, 11.0, 10.0, 11.0, 12.0, 17.0, 18.0, 32.0, 22.0, 23.0, 25.0, 22.0, 29.0, 38.0, 26.0, 41.0, 40.0, 50.0, 35.0, 39.0, 39.0, 44.0, 38.0, 35.0, 43.0, 30.0, 28.0, 31.0, 21.0, 34.0, 26.0, 14.0, 20.0, 11.0, 10.0, 9.0, 9.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.015625, -11.651123046875, -11.28662109375, -10.922119140625, -10.5576171875, -10.193115234375, -9.82861328125, -9.464111328125, -9.099609375, -8.735107421875, -8.37060546875, -8.006103515625, -7.6416015625, -7.277099609375, -6.91259765625, -6.548095703125, -6.18359375, -5.819091796875, -5.45458984375, -5.090087890625, -4.7255859375, -4.361083984375, -3.99658203125, -3.632080078125, -3.267578125, -2.903076171875, -2.53857421875, -2.174072265625, -1.8095703125, -1.445068359375, -1.08056640625, -0.716064453125, -0.3515625, 0.012939453125, 0.37744140625, 0.741943359375, 1.1064453125, 1.470947265625, 1.83544921875, 2.199951171875, 2.564453125, 2.928955078125, 3.29345703125, 3.657958984375, 4.0224609375, 4.386962890625, 4.75146484375, 5.115966796875, 5.48046875, 5.844970703125, 6.20947265625, 6.573974609375, 6.9384765625, 7.302978515625, 7.66748046875, 8.031982421875, 8.396484375, 8.760986328125, 9.12548828125, 9.489990234375, 9.8544921875, 10.218994140625, 10.58349609375, 10.947998046875, 11.3125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 14.0, 18.0, 25.0, 33.0, 62.0, 110.0, 158.0, 211.0, 351.0, 505.0, 831.0, 1294.0, 2048.0, 3141.0, 4922.0, 8049.0, 12843.0, 21172.0, 35686.0, 60859.0, 103867.0, 179548.0, 311525.0, 527289.0, 787556.0, 801985.0, 548323.0, 326000.0, 188539.0, 108952.0, 63584.0, 37184.0, 22432.0, 13162.0, 8182.0, 5080.0, 3242.0, 2012.0, 1257.0, 820.0, 518.0, 330.0, 228.0, 122.0, 70.0, 54.0, 36.0, 18.0, 12.0, 10.0, 6.0, 5.0, 6.0, 2.0], "bins": [-15.984375, -15.5281982421875, -15.072021484375, -14.6158447265625, -14.15966796875, -13.7034912109375, -13.247314453125, -12.7911376953125, -12.3349609375, -11.8787841796875, -11.422607421875, -10.9664306640625, -10.51025390625, -10.0540771484375, -9.597900390625, -9.1417236328125, -8.685546875, -8.2293701171875, -7.773193359375, -7.3170166015625, -6.86083984375, -6.4046630859375, -5.948486328125, -5.4923095703125, -5.0361328125, -4.5799560546875, -4.123779296875, -3.6676025390625, -3.21142578125, -2.7552490234375, -2.299072265625, -1.8428955078125, -1.38671875, -0.9305419921875, -0.474365234375, -0.0181884765625, 0.43798828125, 0.8941650390625, 1.350341796875, 1.8065185546875, 2.2626953125, 2.7188720703125, 3.175048828125, 3.6312255859375, 4.08740234375, 4.5435791015625, 4.999755859375, 5.4559326171875, 5.912109375, 6.3682861328125, 6.824462890625, 7.2806396484375, 7.73681640625, 8.1929931640625, 8.649169921875, 9.1053466796875, 9.5615234375, 10.0177001953125, 10.473876953125, 10.9300537109375, 11.38623046875, 11.8424072265625, 12.298583984375, 12.7547607421875, 13.2109375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 5.0, 13.0, 16.0, 16.0, 29.0, 33.0, 39.0, 51.0, 65.0, 96.0, 113.0, 118.0, 152.0, 189.0, 217.0, 217.0, 226.0, 276.0, 251.0, 289.0, 236.0, 225.0, 205.0, 167.0, 132.0, 134.0, 102.0, 85.0, 88.0, 53.0, 40.0, 28.0, 34.0, 25.0, 19.0, 21.0, 13.0, 12.0, 12.0, 7.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.8671875, -5.6893310546875, -5.511474609375, -5.3336181640625, -5.15576171875, -4.9779052734375, -4.800048828125, -4.6221923828125, -4.4443359375, -4.2664794921875, -4.088623046875, -3.9107666015625, -3.73291015625, -3.5550537109375, -3.377197265625, -3.1993408203125, -3.021484375, -2.8436279296875, -2.665771484375, -2.4879150390625, -2.31005859375, -2.1322021484375, -1.954345703125, -1.7764892578125, -1.5986328125, -1.4207763671875, -1.242919921875, -1.0650634765625, -0.88720703125, -0.7093505859375, -0.531494140625, -0.3536376953125, -0.17578125, 0.0020751953125, 0.179931640625, 0.3577880859375, 0.53564453125, 0.7135009765625, 0.891357421875, 1.0692138671875, 1.2470703125, 1.4249267578125, 1.602783203125, 1.7806396484375, 1.95849609375, 2.1363525390625, 2.314208984375, 2.4920654296875, 2.669921875, 2.8477783203125, 3.025634765625, 3.2034912109375, 3.38134765625, 3.5592041015625, 3.737060546875, 3.9149169921875, 4.0927734375, 4.2706298828125, 4.448486328125, 4.6263427734375, 4.80419921875, 4.9820556640625, 5.159912109375, 5.3377685546875, 5.515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 8.0, 8.0, 17.0, 14.0, 21.0, 23.0, 20.0, 29.0, 42.0, 27.0, 38.0, 53.0, 50.0, 50.0, 53.0, 52.0, 57.0, 53.0, 52.0, 46.0, 47.0, 42.0, 37.0, 26.0, 26.0, 21.0, 16.0, 12.0, 19.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.505298614501953, -13.981097221374512, -13.45689582824707, -12.932694435119629, -12.408493041992188, -11.88429069519043, -11.360089302062988, -10.835887908935547, -10.311686515808105, -9.787485122680664, -9.263283729553223, -8.739082336425781, -8.214879989624023, -7.69067907333374, -7.166477203369141, -6.642275810241699, -6.118074417114258, -5.593873023986816, -5.069671630859375, -4.545469760894775, -4.021268367767334, -3.4970669746398926, -2.972865343093872, -2.4486637115478516, -1.9244623184204102, -1.4002608060836792, -0.8760592937469482, -0.3518577814102173, 0.17234373092651367, 0.6965451240539551, 1.2207467555999756, 1.744948387145996, 2.2691497802734375, 2.793351173400879, 3.3175528049468994, 3.84175443649292, 4.365955829620361, 4.890157222747803, 5.414359092712402, 5.938560485839844, 6.462761878967285, 6.986963272094727, 7.511164665222168, 8.03536605834961, 8.559568405151367, 9.083768844604492, 9.60797119140625, 10.132172584533691, 10.656373977661133, 11.180575370788574, 11.704776763916016, 12.228978157043457, 12.753179550170898, 13.277381896972656, 13.801583290100098, 14.325784683227539, 14.84998607635498, 15.374187469482422, 15.898388862609863, 16.422590255737305, 16.946792602539062, 17.470993041992188, 17.995195388793945, 18.519397735595703, 19.043598175048828]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 10.0, 9.0, 8.0, 10.0, 14.0, 14.0, 16.0, 12.0, 21.0, 38.0, 21.0, 32.0, 33.0, 30.0, 37.0, 42.0, 43.0, 41.0, 45.0, 42.0, 36.0, 46.0, 47.0, 27.0, 42.0, 44.0, 30.0, 28.0, 25.0, 19.0, 19.0, 21.0, 14.0, 15.0, 10.0, 13.0, 8.0, 6.0, 8.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.387277603149414, -14.947333335876465, -14.507389068603516, -14.067444801330566, -13.627500534057617, -13.187556266784668, -12.747611999511719, -12.30766773223877, -11.86772346496582, -11.427779197692871, -10.987834930419922, -10.547890663146973, -10.107946395874023, -9.668002128601074, -9.228057861328125, -8.788113594055176, -8.348169326782227, -7.908225059509277, -7.468280792236328, -7.028336524963379, -6.58839225769043, -6.1484479904174805, -5.708503723144531, -5.268559455871582, -4.828614234924316, -4.388669967651367, -3.948725700378418, -3.5087814331054688, -3.0688371658325195, -2.628892660140991, -2.188948392868042, -1.7490041255950928, -1.3090600967407227, -0.8691158294677734, -0.42917150259017944, 0.01077282428741455, 0.45071709156036377, 0.8906614780426025, 1.3306057453155518, 1.770550012588501, 2.21049427986145, 2.6504385471343994, 3.0903828144073486, 3.530327320098877, 3.970271587371826, 4.410215854644775, 4.850160121917725, 5.290104389190674, 5.730048656463623, 6.169992923736572, 6.6099371910095215, 7.049881458282471, 7.48982572555542, 7.929770469665527, 8.369714736938477, 8.809659004211426, 9.249603271484375, 9.689547538757324, 10.129491806030273, 10.569436073303223, 11.009380340576172, 11.449324607849121, 11.88926887512207, 12.32921314239502, 12.769157409667969]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 10.0, 13.0, 27.0, 27.0, 34.0, 59.0, 93.0, 116.0, 147.0, 186.0, 262.0, 399.0, 612.0, 923.0, 1307.0, 1826.0, 2898.0, 4759.0, 7747.0, 13245.0, 23766.0, 46432.0, 95602.0, 198380.0, 276168.0, 185866.0, 88857.0, 43253.0, 22529.0, 12530.0, 7337.0, 4540.0, 2825.0, 1807.0, 1236.0, 824.0, 553.0, 408.0, 288.0, 197.0, 128.0, 93.0, 65.0, 58.0, 30.0, 26.0, 17.0, 14.0, 8.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.09375, -32.04150390625, -30.9892578125, -29.93701171875, -28.884765625, -27.83251953125, -26.7802734375, -25.72802734375, -24.67578125, -23.62353515625, -22.5712890625, -21.51904296875, -20.466796875, -19.41455078125, -18.3623046875, -17.31005859375, -16.2578125, -15.20556640625, -14.1533203125, -13.10107421875, -12.048828125, -10.99658203125, -9.9443359375, -8.89208984375, -7.83984375, -6.78759765625, -5.7353515625, -4.68310546875, -3.630859375, -2.57861328125, -1.5263671875, -0.47412109375, 0.578125, 1.63037109375, 2.6826171875, 3.73486328125, 4.787109375, 5.83935546875, 6.8916015625, 7.94384765625, 8.99609375, 10.04833984375, 11.1005859375, 12.15283203125, 13.205078125, 14.25732421875, 15.3095703125, 16.36181640625, 17.4140625, 18.46630859375, 19.5185546875, 20.57080078125, 21.623046875, 22.67529296875, 23.7275390625, 24.77978515625, 25.83203125, 26.88427734375, 27.9365234375, 28.98876953125, 30.041015625, 31.09326171875, 32.1455078125, 33.19775390625, 34.25]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 12.0, 6.0, 17.0, 7.0, 8.0, 14.0, 14.0, 13.0, 22.0, 21.0, 27.0, 32.0, 35.0, 38.0, 43.0, 36.0, 54.0, 39.0, 39.0, 38.0, 46.0, 40.0, 46.0, 43.0, 41.0, 39.0, 36.0, 27.0, 25.0, 22.0, 23.0, 14.0, 17.0, 16.0, 11.0, 11.0, 10.0, 6.0, 2.0, 7.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.203125, -14.77294921875, -14.3427734375, -13.91259765625, -13.482421875, -13.05224609375, -12.6220703125, -12.19189453125, -11.76171875, -11.33154296875, -10.9013671875, -10.47119140625, -10.041015625, -9.61083984375, -9.1806640625, -8.75048828125, -8.3203125, -7.89013671875, -7.4599609375, -7.02978515625, -6.599609375, -6.16943359375, -5.7392578125, -5.30908203125, -4.87890625, -4.44873046875, -4.0185546875, -3.58837890625, -3.158203125, -2.72802734375, -2.2978515625, -1.86767578125, -1.4375, -1.00732421875, -0.5771484375, -0.14697265625, 0.283203125, 0.71337890625, 1.1435546875, 1.57373046875, 2.00390625, 2.43408203125, 2.8642578125, 3.29443359375, 3.724609375, 4.15478515625, 4.5849609375, 5.01513671875, 5.4453125, 5.87548828125, 6.3056640625, 6.73583984375, 7.166015625, 7.59619140625, 8.0263671875, 8.45654296875, 8.88671875, 9.31689453125, 9.7470703125, 10.17724609375, 10.607421875, 11.03759765625, 11.4677734375, 11.89794921875, 12.328125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 7.0, 5.0, 9.0, 12.0, 9.0, 27.0, 35.0, 42.0, 84.0, 89.0, 132.0, 211.0, 263.0, 389.0, 588.0, 859.0, 1283.0, 1930.0, 2967.0, 4638.0, 7539.0, 11937.0, 20456.0, 36812.0, 71375.0, 146917.0, 266219.0, 228071.0, 114650.0, 56152.0, 29907.0, 16871.0, 10020.0, 6206.0, 3929.0, 2624.0, 1740.0, 1072.0, 771.0, 519.0, 373.0, 237.0, 172.0, 125.0, 78.0, 52.0, 50.0, 35.0, 26.0, 14.0, 11.0, 11.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.359375, -26.442138671875, -25.52490234375, -24.607666015625, -23.6904296875, -22.773193359375, -21.85595703125, -20.938720703125, -20.021484375, -19.104248046875, -18.18701171875, -17.269775390625, -16.3525390625, -15.435302734375, -14.51806640625, -13.600830078125, -12.68359375, -11.766357421875, -10.84912109375, -9.931884765625, -9.0146484375, -8.097412109375, -7.18017578125, -6.262939453125, -5.345703125, -4.428466796875, -3.51123046875, -2.593994140625, -1.6767578125, -0.759521484375, 0.15771484375, 1.074951171875, 1.9921875, 2.909423828125, 3.82666015625, 4.743896484375, 5.6611328125, 6.578369140625, 7.49560546875, 8.412841796875, 9.330078125, 10.247314453125, 11.16455078125, 12.081787109375, 12.9990234375, 13.916259765625, 14.83349609375, 15.750732421875, 16.66796875, 17.585205078125, 18.50244140625, 19.419677734375, 20.3369140625, 21.254150390625, 22.17138671875, 23.088623046875, 24.005859375, 24.923095703125, 25.84033203125, 26.757568359375, 27.6748046875, 28.592041015625, 29.50927734375, 30.426513671875, 31.34375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 5.0, 8.0, 9.0, 12.0, 13.0, 19.0, 15.0, 11.0, 19.0, 21.0, 21.0, 22.0, 28.0, 28.0, 37.0, 36.0, 47.0, 47.0, 42.0, 44.0, 45.0, 47.0, 30.0, 50.0, 35.0, 35.0, 30.0, 35.0, 34.0, 22.0, 21.0, 22.0, 15.0, 22.0, 11.0, 11.0, 11.0, 4.0, 9.0, 7.0, 5.0, 2.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.453125, -9.178466796875, -8.90380859375, -8.629150390625, -8.3544921875, -8.079833984375, -7.80517578125, -7.530517578125, -7.255859375, -6.981201171875, -6.70654296875, -6.431884765625, -6.1572265625, -5.882568359375, -5.60791015625, -5.333251953125, -5.05859375, -4.783935546875, -4.50927734375, -4.234619140625, -3.9599609375, -3.685302734375, -3.41064453125, -3.135986328125, -2.861328125, -2.586669921875, -2.31201171875, -2.037353515625, -1.7626953125, -1.488037109375, -1.21337890625, -0.938720703125, -0.6640625, -0.389404296875, -0.11474609375, 0.159912109375, 0.4345703125, 0.709228515625, 0.98388671875, 1.258544921875, 1.533203125, 1.807861328125, 2.08251953125, 2.357177734375, 2.6318359375, 2.906494140625, 3.18115234375, 3.455810546875, 3.73046875, 4.005126953125, 4.27978515625, 4.554443359375, 4.8291015625, 5.103759765625, 5.37841796875, 5.653076171875, 5.927734375, 6.202392578125, 6.47705078125, 6.751708984375, 7.0263671875, 7.301025390625, 7.57568359375, 7.850341796875, 8.125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 15.0, 10.0, 13.0, 22.0, 35.0, 30.0, 66.0, 75.0, 92.0, 175.0, 229.0, 402.0, 639.0, 965.0, 1491.0, 2669.0, 4641.0, 8698.0, 17820.0, 39572.0, 95947.0, 240864.0, 342642.0, 168155.0, 65911.0, 27937.0, 13161.0, 6754.0, 3739.0, 2122.0, 1328.0, 800.0, 497.0, 328.0, 195.0, 155.0, 95.0, 81.0, 54.0, 44.0, 23.0, 13.0, 13.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.828125, -15.3056640625, -14.783203125, -14.2607421875, -13.73828125, -13.2158203125, -12.693359375, -12.1708984375, -11.6484375, -11.1259765625, -10.603515625, -10.0810546875, -9.55859375, -9.0361328125, -8.513671875, -7.9912109375, -7.46875, -6.9462890625, -6.423828125, -5.9013671875, -5.37890625, -4.8564453125, -4.333984375, -3.8115234375, -3.2890625, -2.7666015625, -2.244140625, -1.7216796875, -1.19921875, -0.6767578125, -0.154296875, 0.3681640625, 0.890625, 1.4130859375, 1.935546875, 2.4580078125, 2.98046875, 3.5029296875, 4.025390625, 4.5478515625, 5.0703125, 5.5927734375, 6.115234375, 6.6376953125, 7.16015625, 7.6826171875, 8.205078125, 8.7275390625, 9.25, 9.7724609375, 10.294921875, 10.8173828125, 11.33984375, 11.8623046875, 12.384765625, 12.9072265625, 13.4296875, 13.9521484375, 14.474609375, 14.9970703125, 15.51953125, 16.0419921875, 16.564453125, 17.0869140625, 17.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 1.0, 9.0, 15.0, 18.0, 21.0, 41.0, 48.0, 94.0, 139.0, 159.0, 133.0, 102.0, 81.0, 36.0, 19.0, 19.0, 14.0, 14.0, 11.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017681121826171875, -0.0017173439264297485, -0.0016665756702423096, -0.0016158074140548706, -0.0015650391578674316, -0.0015142709016799927, -0.0014635026454925537, -0.0014127343893051147, -0.0013619661331176758, -0.0013111978769302368, -0.0012604296207427979, -0.0012096613645553589, -0.00115889310836792, -0.001108124852180481, -0.001057356595993042, -0.001006588339805603, -0.0009558200836181641, -0.0009050518274307251, -0.0008542835712432861, -0.0008035153150558472, -0.0007527470588684082, -0.0007019788026809692, -0.0006512105464935303, -0.0006004422903060913, -0.0005496740341186523, -0.0004989057779312134, -0.0004481375217437744, -0.00039736926555633545, -0.0003466010093688965, -0.0002958327531814575, -0.00024506449699401855, -0.0001942962408065796, -0.00014352798461914062, -9.275972843170166e-05, -4.1991472244262695e-05, 8.77678394317627e-06, 5.9545040130615234e-05, 0.0001103132963180542, 0.00016108155250549316, 0.00021184980869293213, 0.0002626180648803711, 0.00031338632106781006, 0.000364154577255249, 0.000414922833442688, 0.00046569108963012695, 0.0005164593458175659, 0.0005672276020050049, 0.0006179958581924438, 0.0006687641143798828, 0.0007195323705673218, 0.0007703006267547607, 0.0008210688829421997, 0.0008718371391296387, 0.0009226053953170776, 0.0009733736515045166, 0.0010241419076919556, 0.0010749101638793945, 0.0011256784200668335, 0.0011764466762542725, 0.0012272149324417114, 0.0012779831886291504, 0.0013287514448165894, 0.0013795197010040283, 0.0014302879571914673, 0.0014810562133789062]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 16.0, 21.0, 24.0, 35.0, 42.0, 65.0, 90.0, 111.0, 199.0, 268.0, 386.0, 546.0, 809.0, 1258.0, 1930.0, 3094.0, 5016.0, 8425.0, 14298.0, 25466.0, 46627.0, 87067.0, 152642.0, 216686.0, 198496.0, 126866.0, 69326.0, 37567.0, 20630.0, 11877.0, 6947.0, 4130.0, 2626.0, 1626.0, 1033.0, 721.0, 458.0, 317.0, 226.0, 180.0, 112.0, 73.0, 53.0, 43.0, 33.0, 27.0, 19.0, 14.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-10.9140625, -10.5599365234375, -10.205810546875, -9.8516845703125, -9.49755859375, -9.1434326171875, -8.789306640625, -8.4351806640625, -8.0810546875, -7.7269287109375, -7.372802734375, -7.0186767578125, -6.66455078125, -6.3104248046875, -5.956298828125, -5.6021728515625, -5.248046875, -4.8939208984375, -4.539794921875, -4.1856689453125, -3.83154296875, -3.4774169921875, -3.123291015625, -2.7691650390625, -2.4150390625, -2.0609130859375, -1.706787109375, -1.3526611328125, -0.99853515625, -0.6444091796875, -0.290283203125, 0.0638427734375, 0.41796875, 0.7720947265625, 1.126220703125, 1.4803466796875, 1.83447265625, 2.1885986328125, 2.542724609375, 2.8968505859375, 3.2509765625, 3.6051025390625, 3.959228515625, 4.3133544921875, 4.66748046875, 5.0216064453125, 5.375732421875, 5.7298583984375, 6.083984375, 6.4381103515625, 6.792236328125, 7.1463623046875, 7.50048828125, 7.8546142578125, 8.208740234375, 8.5628662109375, 8.9169921875, 9.2711181640625, 9.625244140625, 9.9793701171875, 10.33349609375, 10.6876220703125, 11.041748046875, 11.3958740234375, 11.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 9.0, 12.0, 20.0, 25.0, 20.0, 32.0, 30.0, 43.0, 63.0, 60.0, 67.0, 79.0, 77.0, 65.0, 72.0, 53.0, 56.0, 49.0, 35.0, 22.0, 22.0, 17.0, 19.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.68359375, -4.53759765625, -4.3916015625, -4.24560546875, -4.099609375, -3.95361328125, -3.8076171875, -3.66162109375, -3.515625, -3.36962890625, -3.2236328125, -3.07763671875, -2.931640625, -2.78564453125, -2.6396484375, -2.49365234375, -2.34765625, -2.20166015625, -2.0556640625, -1.90966796875, -1.763671875, -1.61767578125, -1.4716796875, -1.32568359375, -1.1796875, -1.03369140625, -0.8876953125, -0.74169921875, -0.595703125, -0.44970703125, -0.3037109375, -0.15771484375, -0.01171875, 0.13427734375, 0.2802734375, 0.42626953125, 0.572265625, 0.71826171875, 0.8642578125, 1.01025390625, 1.15625, 1.30224609375, 1.4482421875, 1.59423828125, 1.740234375, 1.88623046875, 2.0322265625, 2.17822265625, 2.32421875, 2.47021484375, 2.6162109375, 2.76220703125, 2.908203125, 3.05419921875, 3.2001953125, 3.34619140625, 3.4921875, 3.63818359375, 3.7841796875, 3.93017578125, 4.076171875, 4.22216796875, 4.3681640625, 4.51416015625, 4.66015625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 9.0, 12.0, 18.0, 19.0, 19.0, 32.0, 36.0, 28.0, 35.0, 42.0, 47.0, 57.0, 58.0, 32.0, 42.0, 52.0, 57.0, 33.0, 39.0, 47.0, 37.0, 34.0, 30.0, 27.0, 23.0, 22.0, 19.0, 11.0, 10.0, 14.0, 14.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.578789710998535, -12.14874267578125, -11.718695640563965, -11.28864860534668, -10.858601570129395, -10.42855453491211, -9.998507499694824, -9.568460464477539, -9.138413429260254, -8.708366394042969, -8.278319358825684, -7.848272323608398, -7.418225288391113, -6.988178253173828, -6.558131217956543, -6.128084182739258, -5.698037147521973, -5.2679901123046875, -4.837943077087402, -4.407896041870117, -3.977849006652832, -3.547801971435547, -3.1177549362182617, -2.6877079010009766, -2.2576608657836914, -1.8276138305664062, -1.397566795349121, -0.9675197601318359, -0.5374727249145508, -0.10742568969726562, 0.32262134552001953, 0.7526683807373047, 1.1827163696289062, 1.6127634048461914, 2.0428104400634766, 2.4728574752807617, 2.902904510498047, 3.332951545715332, 3.762998580932617, 4.193045616149902, 4.6230926513671875, 5.053139686584473, 5.483186721801758, 5.913233757019043, 6.343280792236328, 6.773327827453613, 7.203374862670898, 7.633421897888184, 8.063468933105469, 8.493515968322754, 8.923563003540039, 9.353610038757324, 9.78365707397461, 10.213704109191895, 10.64375114440918, 11.073798179626465, 11.50384521484375, 11.933892250061035, 12.36393928527832, 12.793986320495605, 13.22403335571289, 13.654080390930176, 14.084127426147461, 14.514174461364746, 14.944221496582031]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 11.0, 6.0, 6.0, 12.0, 15.0, 8.0, 11.0, 14.0, 24.0, 19.0, 32.0, 29.0, 34.0, 25.0, 30.0, 44.0, 37.0, 43.0, 43.0, 46.0, 46.0, 31.0, 33.0, 40.0, 43.0, 33.0, 44.0, 30.0, 39.0, 32.0, 18.0, 20.0, 17.0, 19.0, 12.0, 10.0, 13.0, 10.0, 5.0, 1.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-14.63601016998291, -14.240499496459961, -13.844987869262695, -13.449477195739746, -13.053966522216797, -12.658454895019531, -12.262944221496582, -11.867433547973633, -11.471921920776367, -11.076411247253418, -10.680899620056152, -10.285388946533203, -9.889877319335938, -9.494366645812988, -9.098855972290039, -8.703344345092773, -8.307833671569824, -7.912322521209717, -7.516811370849609, -7.12130069732666, -6.725789546966553, -6.330278396606445, -5.934767723083496, -5.539256572723389, -5.143745422363281, -4.748234272003174, -4.352723121643066, -3.957212448120117, -3.5617012977600098, -3.1661901473999023, -2.770679235458374, -2.3751683235168457, -1.9796571731567383, -1.5841461420059204, -1.1886351108551025, -0.7931240797042847, -0.3976130485534668, -0.0021020174026489258, 0.39340901374816895, 0.7889199256896973, 1.1844310760498047, 1.5799421072006226, 1.9754531383514404, 2.3709640502929688, 2.766475200653076, 3.1619863510131836, 3.557497262954712, 3.9530081748962402, 4.348519325256348, 4.744030475616455, 5.1395416259765625, 5.535052299499512, 5.930563449859619, 6.326074600219727, 6.721585273742676, 7.117096424102783, 7.512607574462891, 7.908118724822998, 8.303629875183105, 8.699140548706055, 9.09465217590332, 9.49016284942627, 9.885673522949219, 10.281185150146484, 10.676695823669434]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 7.0, 15.0, 16.0, 31.0, 31.0, 70.0, 80.0, 144.0, 210.0, 282.0, 394.0, 624.0, 907.0, 1482.0, 2297.0, 3690.0, 6124.0, 10139.0, 16718.0, 28431.0, 47503.0, 77761.0, 117695.0, 155682.0, 167804.0, 143378.0, 102504.0, 65265.0, 39603.0, 23519.0, 13893.0, 8438.0, 5120.0, 3115.0, 1946.0, 1234.0, 772.0, 541.0, 363.0, 220.0, 147.0, 105.0, 76.0, 54.0, 38.0, 25.0, 25.0, 13.0, 10.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.078125, -11.651611328125, -11.22509765625, -10.798583984375, -10.3720703125, -9.945556640625, -9.51904296875, -9.092529296875, -8.666015625, -8.239501953125, -7.81298828125, -7.386474609375, -6.9599609375, -6.533447265625, -6.10693359375, -5.680419921875, -5.25390625, -4.827392578125, -4.40087890625, -3.974365234375, -3.5478515625, -3.121337890625, -2.69482421875, -2.268310546875, -1.841796875, -1.415283203125, -0.98876953125, -0.562255859375, -0.1357421875, 0.290771484375, 0.71728515625, 1.143798828125, 1.5703125, 1.996826171875, 2.42333984375, 2.849853515625, 3.2763671875, 3.702880859375, 4.12939453125, 4.555908203125, 4.982421875, 5.408935546875, 5.83544921875, 6.261962890625, 6.6884765625, 7.114990234375, 7.54150390625, 7.968017578125, 8.39453125, 8.821044921875, 9.24755859375, 9.674072265625, 10.1005859375, 10.527099609375, 10.95361328125, 11.380126953125, 11.806640625, 12.233154296875, 12.65966796875, 13.086181640625, 13.5126953125, 13.939208984375, 14.36572265625, 14.792236328125, 15.21875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 9.0, 2.0, 4.0, 6.0, 7.0, 10.0, 8.0, 13.0, 17.0, 15.0, 28.0, 24.0, 26.0, 23.0, 36.0, 45.0, 29.0, 43.0, 29.0, 43.0, 33.0, 35.0, 42.0, 42.0, 42.0, 46.0, 29.0, 39.0, 31.0, 39.0, 31.0, 24.0, 26.0, 25.0, 16.0, 19.0, 15.0, 17.0, 12.0, 8.0, 4.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.7667236328125, -12.392822265625, -12.0189208984375, -11.64501953125, -11.2711181640625, -10.897216796875, -10.5233154296875, -10.1494140625, -9.7755126953125, -9.401611328125, -9.0277099609375, -8.65380859375, -8.2799072265625, -7.906005859375, -7.5321044921875, -7.158203125, -6.7843017578125, -6.410400390625, -6.0364990234375, -5.66259765625, -5.2886962890625, -4.914794921875, -4.5408935546875, -4.1669921875, -3.7930908203125, -3.419189453125, -3.0452880859375, -2.67138671875, -2.2974853515625, -1.923583984375, -1.5496826171875, -1.17578125, -0.8018798828125, -0.427978515625, -0.0540771484375, 0.31982421875, 0.6937255859375, 1.067626953125, 1.4415283203125, 1.8154296875, 2.1893310546875, 2.563232421875, 2.9371337890625, 3.31103515625, 3.6849365234375, 4.058837890625, 4.4327392578125, 4.806640625, 5.1805419921875, 5.554443359375, 5.9283447265625, 6.30224609375, 6.6761474609375, 7.050048828125, 7.4239501953125, 7.7978515625, 8.1717529296875, 8.545654296875, 8.9195556640625, 9.29345703125, 9.6673583984375, 10.041259765625, 10.4151611328125, 10.7890625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 13.0, 17.0, 20.0, 48.0, 58.0, 68.0, 113.0, 180.0, 271.0, 413.0, 627.0, 961.0, 1566.0, 2298.0, 3713.0, 6050.0, 9960.0, 16559.0, 27015.0, 44098.0, 70615.0, 106525.0, 143676.0, 163237.0, 146870.0, 110821.0, 73704.0, 46668.0, 28161.0, 17125.0, 10179.0, 6204.0, 3937.0, 2462.0, 1533.0, 962.0, 613.0, 432.0, 261.0, 184.0, 109.0, 75.0, 44.0, 41.0, 24.0, 13.0, 11.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.8828125, -11.506103515625, -11.12939453125, -10.752685546875, -10.3759765625, -9.999267578125, -9.62255859375, -9.245849609375, -8.869140625, -8.492431640625, -8.11572265625, -7.739013671875, -7.3623046875, -6.985595703125, -6.60888671875, -6.232177734375, -5.85546875, -5.478759765625, -5.10205078125, -4.725341796875, -4.3486328125, -3.971923828125, -3.59521484375, -3.218505859375, -2.841796875, -2.465087890625, -2.08837890625, -1.711669921875, -1.3349609375, -0.958251953125, -0.58154296875, -0.204833984375, 0.171875, 0.548583984375, 0.92529296875, 1.302001953125, 1.6787109375, 2.055419921875, 2.43212890625, 2.808837890625, 3.185546875, 3.562255859375, 3.93896484375, 4.315673828125, 4.6923828125, 5.069091796875, 5.44580078125, 5.822509765625, 6.19921875, 6.575927734375, 6.95263671875, 7.329345703125, 7.7060546875, 8.082763671875, 8.45947265625, 8.836181640625, 9.212890625, 9.589599609375, 9.96630859375, 10.343017578125, 10.7197265625, 11.096435546875, 11.47314453125, 11.849853515625, 12.2265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 8.0, 9.0, 5.0, 9.0, 10.0, 13.0, 14.0, 17.0, 27.0, 21.0, 27.0, 37.0, 39.0, 32.0, 39.0, 49.0, 39.0, 38.0, 56.0, 38.0, 39.0, 41.0, 44.0, 46.0, 49.0, 32.0, 31.0, 27.0, 26.0, 24.0, 17.0, 20.0, 24.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.6484375, -8.39251708984375, -8.1365966796875, -7.88067626953125, -7.624755859375, -7.36883544921875, -7.1129150390625, -6.85699462890625, -6.60107421875, -6.34515380859375, -6.0892333984375, -5.83331298828125, -5.577392578125, -5.32147216796875, -5.0655517578125, -4.80963134765625, -4.5537109375, -4.29779052734375, -4.0418701171875, -3.78594970703125, -3.530029296875, -3.27410888671875, -3.0181884765625, -2.76226806640625, -2.50634765625, -2.25042724609375, -1.9945068359375, -1.73858642578125, -1.482666015625, -1.22674560546875, -0.9708251953125, -0.71490478515625, -0.458984375, -0.20306396484375, 0.0528564453125, 0.30877685546875, 0.564697265625, 0.82061767578125, 1.0765380859375, 1.33245849609375, 1.58837890625, 1.84429931640625, 2.1002197265625, 2.35614013671875, 2.612060546875, 2.86798095703125, 3.1239013671875, 3.37982177734375, 3.6357421875, 3.89166259765625, 4.1475830078125, 4.40350341796875, 4.659423828125, 4.91534423828125, 5.1712646484375, 5.42718505859375, 5.68310546875, 5.93902587890625, 6.1949462890625, 6.45086669921875, 6.706787109375, 6.96270751953125, 7.2186279296875, 7.47454833984375, 7.73046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 2.0, 6.0, 20.0, 26.0, 33.0, 70.0, 82.0, 161.0, 224.0, 352.0, 528.0, 848.0, 1361.0, 2393.0, 3981.0, 7199.0, 13620.0, 26235.0, 54431.0, 113385.0, 209110.0, 254724.0, 177759.0, 91318.0, 43414.0, 21381.0, 11179.0, 5907.0, 3563.0, 2030.0, 1202.0, 740.0, 460.0, 282.0, 185.0, 116.0, 87.0, 45.0, 41.0, 19.0, 11.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.2056884765625, -9.880126953125, -9.5545654296875, -9.22900390625, -8.9034423828125, -8.577880859375, -8.2523193359375, -7.9267578125, -7.6011962890625, -7.275634765625, -6.9500732421875, -6.62451171875, -6.2989501953125, -5.973388671875, -5.6478271484375, -5.322265625, -4.9967041015625, -4.671142578125, -4.3455810546875, -4.02001953125, -3.6944580078125, -3.368896484375, -3.0433349609375, -2.7177734375, -2.3922119140625, -2.066650390625, -1.7410888671875, -1.41552734375, -1.0899658203125, -0.764404296875, -0.4388427734375, -0.11328125, 0.2122802734375, 0.537841796875, 0.8634033203125, 1.18896484375, 1.5145263671875, 1.840087890625, 2.1656494140625, 2.4912109375, 2.8167724609375, 3.142333984375, 3.4678955078125, 3.79345703125, 4.1190185546875, 4.444580078125, 4.7701416015625, 5.095703125, 5.4212646484375, 5.746826171875, 6.0723876953125, 6.39794921875, 6.7235107421875, 7.049072265625, 7.3746337890625, 7.7001953125, 8.0257568359375, 8.351318359375, 8.6768798828125, 9.00244140625, 9.3280029296875, 9.653564453125, 9.9791259765625, 10.3046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 17.0, 25.0, 46.0, 47.0, 73.0, 94.0, 133.0, 116.0, 92.0, 97.0, 65.0, 53.0, 42.0, 24.0, 26.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0021343231201171875, -0.0020851343870162964, -0.0020359456539154053, -0.001986756920814514, -0.001937568187713623, -0.001888379454612732, -0.0018391907215118408, -0.0017900019884109497, -0.0017408132553100586, -0.0016916245222091675, -0.0016424357891082764, -0.0015932470560073853, -0.0015440583229064941, -0.001494869589805603, -0.001445680856704712, -0.0013964921236038208, -0.0013473033905029297, -0.0012981146574020386, -0.0012489259243011475, -0.0011997371912002563, -0.0011505484580993652, -0.0011013597249984741, -0.001052170991897583, -0.001002982258796692, -0.0009537935256958008, -0.0009046047925949097, -0.0008554160594940186, -0.0008062273263931274, -0.0007570385932922363, -0.0007078498601913452, -0.0006586611270904541, -0.000609472393989563, -0.0005602836608886719, -0.0005110949277877808, -0.00046190619468688965, -0.00041271746158599854, -0.0003635287284851074, -0.0003143399953842163, -0.0002651512622833252, -0.00021596252918243408, -0.00016677379608154297, -0.00011758506298065186, -6.839632987976074e-05, -1.920759677886963e-05, 2.9981136322021484e-05, 7.91698694229126e-05, 0.0001283586025238037, 0.00017754733562469482, 0.00022673606872558594, 0.00027592480182647705, 0.00032511353492736816, 0.0003743022680282593, 0.0004234910011291504, 0.0004726797342300415, 0.0005218684673309326, 0.0005710572004318237, 0.0006202459335327148, 0.000669434666633606, 0.0007186233997344971, 0.0007678121328353882, 0.0008170008659362793, 0.0008661895990371704, 0.0009153783321380615, 0.0009645670652389526, 0.0010137557983398438]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 19.0, 17.0, 37.0, 50.0, 85.0, 128.0, 192.0, 300.0, 442.0, 725.0, 1097.0, 1782.0, 2842.0, 4494.0, 7609.0, 12551.0, 21610.0, 38563.0, 68470.0, 119530.0, 179449.0, 199626.0, 157692.0, 99249.0, 55819.0, 31591.0, 17762.0, 10454.0, 6131.0, 3799.0, 2372.0, 1442.0, 922.0, 601.0, 367.0, 264.0, 159.0, 108.0, 62.0, 39.0, 33.0, 17.0, 9.0, 10.0, 3.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.328125, -8.08544921875, -7.8427734375, -7.60009765625, -7.357421875, -7.11474609375, -6.8720703125, -6.62939453125, -6.38671875, -6.14404296875, -5.9013671875, -5.65869140625, -5.416015625, -5.17333984375, -4.9306640625, -4.68798828125, -4.4453125, -4.20263671875, -3.9599609375, -3.71728515625, -3.474609375, -3.23193359375, -2.9892578125, -2.74658203125, -2.50390625, -2.26123046875, -2.0185546875, -1.77587890625, -1.533203125, -1.29052734375, -1.0478515625, -0.80517578125, -0.5625, -0.31982421875, -0.0771484375, 0.16552734375, 0.408203125, 0.65087890625, 0.8935546875, 1.13623046875, 1.37890625, 1.62158203125, 1.8642578125, 2.10693359375, 2.349609375, 2.59228515625, 2.8349609375, 3.07763671875, 3.3203125, 3.56298828125, 3.8056640625, 4.04833984375, 4.291015625, 4.53369140625, 4.7763671875, 5.01904296875, 5.26171875, 5.50439453125, 5.7470703125, 5.98974609375, 6.232421875, 6.47509765625, 6.7177734375, 6.96044921875, 7.203125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 3.0, 12.0, 12.0, 16.0, 24.0, 24.0, 21.0, 26.0, 34.0, 57.0, 57.0, 47.0, 58.0, 50.0, 72.0, 79.0, 57.0, 57.0, 43.0, 37.0, 29.0, 30.0, 26.0, 18.0, 17.0, 18.0, 18.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.424346923828125, -2.34478759765625, -2.265228271484375, -2.1856689453125, -2.106109619140625, -2.02655029296875, -1.946990966796875, -1.867431640625, -1.787872314453125, -1.70831298828125, -1.628753662109375, -1.5491943359375, -1.469635009765625, -1.39007568359375, -1.310516357421875, -1.23095703125, -1.151397705078125, -1.07183837890625, -0.992279052734375, -0.9127197265625, -0.833160400390625, -0.75360107421875, -0.674041748046875, -0.594482421875, -0.514923095703125, -0.43536376953125, -0.355804443359375, -0.2762451171875, -0.196685791015625, -0.11712646484375, -0.037567138671875, 0.0419921875, 0.121551513671875, 0.20111083984375, 0.280670166015625, 0.3602294921875, 0.439788818359375, 0.51934814453125, 0.598907470703125, 0.678466796875, 0.758026123046875, 0.83758544921875, 0.917144775390625, 0.9967041015625, 1.076263427734375, 1.15582275390625, 1.235382080078125, 1.31494140625, 1.394500732421875, 1.47406005859375, 1.553619384765625, 1.6331787109375, 1.712738037109375, 1.79229736328125, 1.871856689453125, 1.951416015625, 2.030975341796875, 2.11053466796875, 2.190093994140625, 2.2696533203125, 2.349212646484375, 2.42877197265625, 2.508331298828125, 2.587890625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 6.0, 9.0, 14.0, 14.0, 19.0, 17.0, 27.0, 31.0, 29.0, 45.0, 45.0, 41.0, 45.0, 47.0, 46.0, 50.0, 55.0, 37.0, 57.0, 43.0, 29.0, 41.0, 33.0, 31.0, 24.0, 19.0, 22.0, 11.0, 22.0, 13.0, 9.0, 8.0, 6.0, 15.0, 2.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.397566795349121, -10.998830795288086, -10.600095748901367, -10.201360702514648, -9.802624702453613, -9.403888702392578, -9.00515365600586, -8.60641860961914, -8.207682609558105, -7.8089470863342285, -7.410211563110352, -7.011476039886475, -6.612740516662598, -6.214004993438721, -5.815269470214844, -5.416533946990967, -5.01779842376709, -4.619062900543213, -4.220327377319336, -3.821591854095459, -3.422856330871582, -3.024120807647705, -2.625385284423828, -2.226649761199951, -1.8279142379760742, -1.4291787147521973, -1.0304431915283203, -0.6317076683044434, -0.2329721450805664, 0.16576337814331055, 0.5644989013671875, 0.9632344245910645, 1.3619709014892578, 1.7607064247131348, 2.1594419479370117, 2.5581774711608887, 2.9569129943847656, 3.3556485176086426, 3.7543840408325195, 4.1531195640563965, 4.551855087280273, 4.95059061050415, 5.349326133728027, 5.748061656951904, 6.146797180175781, 6.545532703399658, 6.944268226623535, 7.343003749847412, 7.741739273071289, 8.140474319458008, 8.539210319519043, 8.937946319580078, 9.336681365966797, 9.735416412353516, 10.13415241241455, 10.532888412475586, 10.931623458862305, 11.330358505249023, 11.729094505310059, 12.127830505371094, 12.526565551757812, 12.925300598144531, 13.324036598205566, 13.722772598266602, 14.12150764465332]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 5.0, 5.0, 7.0, 12.0, 15.0, 15.0, 10.0, 17.0, 25.0, 24.0, 26.0, 35.0, 37.0, 33.0, 42.0, 33.0, 43.0, 41.0, 40.0, 35.0, 43.0, 50.0, 37.0, 33.0, 36.0, 34.0, 38.0, 32.0, 35.0, 23.0, 14.0, 16.0, 18.0, 15.0, 17.0, 9.0, 11.0, 10.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.395416259765625, -12.01191234588623, -11.628408432006836, -11.244904518127441, -10.861400604248047, -10.477897644042969, -10.094393730163574, -9.71088981628418, -9.327385902404785, -8.94388198852539, -8.560378074645996, -8.176874160766602, -7.793370723724365, -7.409866809844971, -7.026363372802734, -6.64285945892334, -6.259355545043945, -5.875851631164551, -5.492347717285156, -5.10884428024292, -4.725340366363525, -4.341836452484131, -3.9583327770233154, -3.5748291015625, -3.1913251876831055, -2.807821273803711, -2.4243175983428955, -2.04081392288208, -1.6573100090026855, -1.2738062143325806, -0.8903024196624756, -0.5067987442016602, -0.12329387664794922, 0.26020991802215576, 0.6437137126922607, 1.0272175073623657, 1.4107213020324707, 1.7942250967025757, 2.1777288913726807, 2.561232566833496, 2.9447364807128906, 3.328240394592285, 3.7117440700531006, 4.095247745513916, 4.4787516593933105, 4.862255573272705, 5.245759010314941, 5.629262924194336, 6.0127668380737305, 6.396270751953125, 6.7797746658325195, 7.163278102874756, 7.54678201675415, 7.930285930633545, 8.313789367675781, 8.697293281555176, 9.08079719543457, 9.464301109313965, 9.84780502319336, 10.231308937072754, 10.614812850952148, 10.998315811157227, 11.381819725036621, 11.765323638916016, 12.14882755279541]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 11.0, 17.0, 29.0, 33.0, 41.0, 82.0, 121.0, 191.0, 276.0, 397.0, 603.0, 1008.0, 1611.0, 2398.0, 3763.0, 6099.0, 9619.0, 15834.0, 26346.0, 45316.0, 80786.0, 152619.0, 304567.0, 592754.0, 899280.0, 878975.0, 559437.0, 283765.0, 143461.0, 76367.0, 43122.0, 25189.0, 15179.0, 9206.0, 5683.0, 3611.0, 2309.0, 1471.0, 922.0, 635.0, 383.0, 245.0, 173.0, 120.0, 84.0, 45.0, 36.0, 21.0, 11.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.84375, -10.493408203125, -10.14306640625, -9.792724609375, -9.4423828125, -9.092041015625, -8.74169921875, -8.391357421875, -8.041015625, -7.690673828125, -7.34033203125, -6.989990234375, -6.6396484375, -6.289306640625, -5.93896484375, -5.588623046875, -5.23828125, -4.887939453125, -4.53759765625, -4.187255859375, -3.8369140625, -3.486572265625, -3.13623046875, -2.785888671875, -2.435546875, -2.085205078125, -1.73486328125, -1.384521484375, -1.0341796875, -0.683837890625, -0.33349609375, 0.016845703125, 0.3671875, 0.717529296875, 1.06787109375, 1.418212890625, 1.7685546875, 2.118896484375, 2.46923828125, 2.819580078125, 3.169921875, 3.520263671875, 3.87060546875, 4.220947265625, 4.5712890625, 4.921630859375, 5.27197265625, 5.622314453125, 5.97265625, 6.322998046875, 6.67333984375, 7.023681640625, 7.3740234375, 7.724365234375, 8.07470703125, 8.425048828125, 8.775390625, 9.125732421875, 9.47607421875, 9.826416015625, 10.1767578125, 10.527099609375, 10.87744140625, 11.227783203125, 11.578125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 8.0, 8.0, 17.0, 17.0, 20.0, 18.0, 28.0, 30.0, 20.0, 25.0, 38.0, 37.0, 40.0, 33.0, 52.0, 35.0, 45.0, 55.0, 32.0, 41.0, 31.0, 27.0, 46.0, 31.0, 33.0, 26.0, 27.0, 26.0, 35.0, 19.0, 14.0, 9.0, 8.0, 11.0, 9.0, 2.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.2330322265625, -7.966064453125, -7.6990966796875, -7.43212890625, -7.1651611328125, -6.898193359375, -6.6312255859375, -6.3642578125, -6.0972900390625, -5.830322265625, -5.5633544921875, -5.29638671875, -5.0294189453125, -4.762451171875, -4.4954833984375, -4.228515625, -3.9615478515625, -3.694580078125, -3.4276123046875, -3.16064453125, -2.8936767578125, -2.626708984375, -2.3597412109375, -2.0927734375, -1.8258056640625, -1.558837890625, -1.2918701171875, -1.02490234375, -0.7579345703125, -0.490966796875, -0.2239990234375, 0.04296875, 0.3099365234375, 0.576904296875, 0.8438720703125, 1.11083984375, 1.3778076171875, 1.644775390625, 1.9117431640625, 2.1787109375, 2.4456787109375, 2.712646484375, 2.9796142578125, 3.24658203125, 3.5135498046875, 3.780517578125, 4.0474853515625, 4.314453125, 4.5814208984375, 4.848388671875, 5.1153564453125, 5.38232421875, 5.6492919921875, 5.916259765625, 6.1832275390625, 6.4501953125, 6.7171630859375, 6.984130859375, 7.2510986328125, 7.51806640625, 7.7850341796875, 8.052001953125, 8.3189697265625, 8.5859375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 20.0, 18.0, 42.0, 67.0, 110.0, 153.0, 242.0, 348.0, 553.0, 799.0, 1235.0, 1933.0, 3030.0, 4760.0, 7380.0, 11968.0, 19924.0, 32950.0, 55844.0, 96219.0, 167308.0, 294294.0, 507852.0, 776066.0, 824888.0, 578420.0, 340347.0, 193891.0, 111207.0, 64525.0, 37841.0, 23028.0, 13783.0, 8461.0, 5401.0, 3304.0, 2121.0, 1442.0, 871.0, 527.0, 379.0, 251.0, 155.0, 107.0, 66.0, 47.0, 44.0, 16.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0], "bins": [-10.984375, -10.65283203125, -10.3212890625, -9.98974609375, -9.658203125, -9.32666015625, -8.9951171875, -8.66357421875, -8.33203125, -8.00048828125, -7.6689453125, -7.33740234375, -7.005859375, -6.67431640625, -6.3427734375, -6.01123046875, -5.6796875, -5.34814453125, -5.0166015625, -4.68505859375, -4.353515625, -4.02197265625, -3.6904296875, -3.35888671875, -3.02734375, -2.69580078125, -2.3642578125, -2.03271484375, -1.701171875, -1.36962890625, -1.0380859375, -0.70654296875, -0.375, -0.04345703125, 0.2880859375, 0.61962890625, 0.951171875, 1.28271484375, 1.6142578125, 1.94580078125, 2.27734375, 2.60888671875, 2.9404296875, 3.27197265625, 3.603515625, 3.93505859375, 4.2666015625, 4.59814453125, 4.9296875, 5.26123046875, 5.5927734375, 5.92431640625, 6.255859375, 6.58740234375, 6.9189453125, 7.25048828125, 7.58203125, 7.91357421875, 8.2451171875, 8.57666015625, 8.908203125, 9.23974609375, 9.5712890625, 9.90283203125, 10.234375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 10.0, 7.0, 11.0, 8.0, 9.0, 30.0, 20.0, 37.0, 42.0, 57.0, 61.0, 99.0, 99.0, 145.0, 175.0, 238.0, 273.0, 290.0, 305.0, 295.0, 290.0, 294.0, 233.0, 215.0, 164.0, 138.0, 131.0, 86.0, 75.0, 64.0, 49.0, 32.0, 27.0, 20.0, 11.0, 10.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.47296142578125, -4.3248291015625, -4.17669677734375, -4.028564453125, -3.88043212890625, -3.7322998046875, -3.58416748046875, -3.43603515625, -3.28790283203125, -3.1397705078125, -2.99163818359375, -2.843505859375, -2.69537353515625, -2.5472412109375, -2.39910888671875, -2.2509765625, -2.10284423828125, -1.9547119140625, -1.80657958984375, -1.658447265625, -1.51031494140625, -1.3621826171875, -1.21405029296875, -1.06591796875, -0.91778564453125, -0.7696533203125, -0.62152099609375, -0.473388671875, -0.32525634765625, -0.1771240234375, -0.02899169921875, 0.119140625, 0.26727294921875, 0.4154052734375, 0.56353759765625, 0.711669921875, 0.85980224609375, 1.0079345703125, 1.15606689453125, 1.30419921875, 1.45233154296875, 1.6004638671875, 1.74859619140625, 1.896728515625, 2.04486083984375, 2.1929931640625, 2.34112548828125, 2.4892578125, 2.63739013671875, 2.7855224609375, 2.93365478515625, 3.081787109375, 3.22991943359375, 3.3780517578125, 3.52618408203125, 3.67431640625, 3.82244873046875, 3.9705810546875, 4.11871337890625, 4.266845703125, 4.41497802734375, 4.5631103515625, 4.71124267578125, 4.859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 9.0, 16.0, 9.0, 19.0, 27.0, 28.0, 36.0, 40.0, 38.0, 46.0, 44.0, 52.0, 52.0, 50.0, 49.0, 57.0, 48.0, 51.0, 49.0, 39.0, 29.0, 27.0, 25.0, 31.0, 18.0, 19.0, 16.0, 11.0, 10.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.619545936584473, -11.259020805358887, -10.8984956741333, -10.537969589233398, -10.177444458007812, -9.816919326782227, -9.45639419555664, -9.095869064331055, -8.735343933105469, -8.374818801879883, -8.014293670654297, -7.653768062591553, -7.293242454528809, -6.932717323303223, -6.572192192077637, -6.211667060852051, -5.851140975952148, -5.4906158447265625, -5.130090236663818, -4.769565105438232, -4.409039497375488, -4.048514366149902, -3.6879892349243164, -3.3274638652801514, -2.9669384956359863, -2.6064131259918213, -2.2458877563476562, -1.8853626251220703, -1.5248372554779053, -1.1643118858337402, -0.8037867546081543, -0.44326138496398926, -0.08273601531982422, 0.27778929471969604, 0.6383146047592163, 0.9988398551940918, 1.3593652248382568, 1.7198905944824219, 2.080415725708008, 2.440941095352173, 2.801466464996338, 3.161991834640503, 3.522517204284668, 3.883042335510254, 4.24356746673584, 4.604093074798584, 4.96461820602417, 5.325143814086914, 5.6856689453125, 6.046194076538086, 6.40671968460083, 6.767244815826416, 7.12777042388916, 7.488295555114746, 7.848820686340332, 8.209345817565918, 8.56987190246582, 8.930397033691406, 9.290922164916992, 9.651447296142578, 10.01197338104248, 10.372498512268066, 10.733023643493652, 11.093548774719238, 11.454073905944824]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 4.0, 5.0, 18.0, 11.0, 12.0, 20.0, 20.0, 30.0, 37.0, 30.0, 34.0, 24.0, 37.0, 34.0, 32.0, 46.0, 43.0, 39.0, 46.0, 29.0, 49.0, 27.0, 45.0, 31.0, 41.0, 31.0, 24.0, 24.0, 23.0, 28.0, 18.0, 16.0, 15.0, 8.0, 11.0, 10.0, 9.0, 2.0, 11.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.037527084350586, -9.726256370544434, -9.414985656738281, -9.103713989257812, -8.79244327545166, -8.481172561645508, -8.169900894165039, -7.858630180358887, -7.547359466552734, -7.236088752746582, -6.9248175621032715, -6.613546371459961, -6.302275657653809, -5.991004943847656, -5.679733753204346, -5.368462562561035, -5.057191848754883, -4.7459211349487305, -4.43464994430542, -4.123378753662109, -3.812108039855957, -3.5008370876312256, -3.189566135406494, -2.8782951831817627, -2.5670242309570312, -2.2557532787323, -1.9444823265075684, -1.633211374282837, -1.3219404220581055, -1.010669469833374, -0.6993985176086426, -0.38812756538391113, -0.07685661315917969, 0.23441433906555176, 0.5456852912902832, 0.8569562435150146, 1.168227195739746, 1.4794981479644775, 1.790769100189209, 2.1020400524139404, 2.413311004638672, 2.7245819568634033, 3.0358529090881348, 3.347123861312866, 3.6583948135375977, 3.969665765762329, 4.2809367179870605, 4.592207908630371, 4.903478622436523, 5.214749336242676, 5.526020526885986, 5.837291717529297, 6.148562431335449, 6.459833145141602, 6.771104335784912, 7.082375526428223, 7.393646240234375, 7.704916954040527, 8.01618766784668, 8.327459335327148, 8.6387300491333, 8.950000762939453, 9.261272430419922, 9.572543144226074, 9.883813858032227]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 8.0, 36.0, 33.0, 52.0, 77.0, 101.0, 134.0, 178.0, 293.0, 417.0, 586.0, 935.0, 1276.0, 1850.0, 2864.0, 4375.0, 6599.0, 9638.0, 14367.0, 21960.0, 33026.0, 48157.0, 70267.0, 97131.0, 122556.0, 136834.0, 128011.0, 104503.0, 77274.0, 54280.0, 37025.0, 24495.0, 16119.0, 10863.0, 7317.0, 4799.0, 3349.0, 2141.0, 1463.0, 1035.0, 660.0, 441.0, 335.0, 241.0, 132.0, 99.0, 67.0, 37.0, 40.0, 22.0, 25.0, 7.0, 12.0, 6.0, 3.0, 0.0, 4.0], "bins": [-9.71875, -9.4210205078125, -9.123291015625, -8.8255615234375, -8.52783203125, -8.2301025390625, -7.932373046875, -7.6346435546875, -7.3369140625, -7.0391845703125, -6.741455078125, -6.4437255859375, -6.14599609375, -5.8482666015625, -5.550537109375, -5.2528076171875, -4.955078125, -4.6573486328125, -4.359619140625, -4.0618896484375, -3.76416015625, -3.4664306640625, -3.168701171875, -2.8709716796875, -2.5732421875, -2.2755126953125, -1.977783203125, -1.6800537109375, -1.38232421875, -1.0845947265625, -0.786865234375, -0.4891357421875, -0.19140625, 0.1063232421875, 0.404052734375, 0.7017822265625, 0.99951171875, 1.2972412109375, 1.594970703125, 1.8927001953125, 2.1904296875, 2.4881591796875, 2.785888671875, 3.0836181640625, 3.38134765625, 3.6790771484375, 3.976806640625, 4.2745361328125, 4.572265625, 4.8699951171875, 5.167724609375, 5.4654541015625, 5.76318359375, 6.0609130859375, 6.358642578125, 6.6563720703125, 6.9541015625, 7.2518310546875, 7.549560546875, 7.8472900390625, 8.14501953125, 8.4427490234375, 8.740478515625, 9.0382080078125, 9.3359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 13.0, 8.0, 17.0, 17.0, 19.0, 23.0, 28.0, 23.0, 27.0, 37.0, 35.0, 42.0, 32.0, 34.0, 32.0, 39.0, 31.0, 36.0, 38.0, 37.0, 32.0, 37.0, 27.0, 35.0, 35.0, 33.0, 33.0, 25.0, 20.0, 19.0, 14.0, 12.0, 11.0, 11.0, 14.0, 10.0, 5.0, 10.0, 3.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.1015625, -8.8089599609375, -8.516357421875, -8.2237548828125, -7.93115234375, -7.6385498046875, -7.345947265625, -7.0533447265625, -6.7607421875, -6.4681396484375, -6.175537109375, -5.8829345703125, -5.59033203125, -5.2977294921875, -5.005126953125, -4.7125244140625, -4.419921875, -4.1273193359375, -3.834716796875, -3.5421142578125, -3.24951171875, -2.9569091796875, -2.664306640625, -2.3717041015625, -2.0791015625, -1.7864990234375, -1.493896484375, -1.2012939453125, -0.90869140625, -0.6160888671875, -0.323486328125, -0.0308837890625, 0.26171875, 0.5543212890625, 0.846923828125, 1.1395263671875, 1.43212890625, 1.7247314453125, 2.017333984375, 2.3099365234375, 2.6025390625, 2.8951416015625, 3.187744140625, 3.4803466796875, 3.77294921875, 4.0655517578125, 4.358154296875, 4.6507568359375, 4.943359375, 5.2359619140625, 5.528564453125, 5.8211669921875, 6.11376953125, 6.4063720703125, 6.698974609375, 6.9915771484375, 7.2841796875, 7.5767822265625, 7.869384765625, 8.1619873046875, 8.45458984375, 8.7471923828125, 9.039794921875, 9.3323974609375, 9.625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 14.0, 22.0, 27.0, 49.0, 57.0, 84.0, 126.0, 174.0, 242.0, 306.0, 514.0, 778.0, 1208.0, 1875.0, 3174.0, 5432.0, 9791.0, 18925.0, 38520.0, 81819.0, 173019.0, 284674.0, 217106.0, 107364.0, 49922.0, 24185.0, 12439.0, 6473.0, 3757.0, 2264.0, 1387.0, 922.0, 615.0, 347.0, 280.0, 208.0, 139.0, 75.0, 80.0, 35.0, 35.0, 15.0, 16.0, 13.0, 11.0, 9.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-20.421875, -19.796875, -19.171875, -18.546875, -17.921875, -17.296875, -16.671875, -16.046875, -15.421875, -14.796875, -14.171875, -13.546875, -12.921875, -12.296875, -11.671875, -11.046875, -10.421875, -9.796875, -9.171875, -8.546875, -7.921875, -7.296875, -6.671875, -6.046875, -5.421875, -4.796875, -4.171875, -3.546875, -2.921875, -2.296875, -1.671875, -1.046875, -0.421875, 0.203125, 0.828125, 1.453125, 2.078125, 2.703125, 3.328125, 3.953125, 4.578125, 5.203125, 5.828125, 6.453125, 7.078125, 7.703125, 8.328125, 8.953125, 9.578125, 10.203125, 10.828125, 11.453125, 12.078125, 12.703125, 13.328125, 13.953125, 14.578125, 15.203125, 15.828125, 16.453125, 17.078125, 17.703125, 18.328125, 18.953125, 19.578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 11.0, 20.0, 7.0, 12.0, 13.0, 23.0, 28.0, 26.0, 26.0, 30.0, 31.0, 38.0, 58.0, 30.0, 31.0, 45.0, 42.0, 42.0, 34.0, 48.0, 40.0, 33.0, 44.0, 40.0, 23.0, 30.0, 30.0, 24.0, 17.0, 28.0, 15.0, 16.0, 11.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.89892578125, -6.6806640625, -6.46240234375, -6.244140625, -6.02587890625, -5.8076171875, -5.58935546875, -5.37109375, -5.15283203125, -4.9345703125, -4.71630859375, -4.498046875, -4.27978515625, -4.0615234375, -3.84326171875, -3.625, -3.40673828125, -3.1884765625, -2.97021484375, -2.751953125, -2.53369140625, -2.3154296875, -2.09716796875, -1.87890625, -1.66064453125, -1.4423828125, -1.22412109375, -1.005859375, -0.78759765625, -0.5693359375, -0.35107421875, -0.1328125, 0.08544921875, 0.3037109375, 0.52197265625, 0.740234375, 0.95849609375, 1.1767578125, 1.39501953125, 1.61328125, 1.83154296875, 2.0498046875, 2.26806640625, 2.486328125, 2.70458984375, 2.9228515625, 3.14111328125, 3.359375, 3.57763671875, 3.7958984375, 4.01416015625, 4.232421875, 4.45068359375, 4.6689453125, 4.88720703125, 5.10546875, 5.32373046875, 5.5419921875, 5.76025390625, 5.978515625, 6.19677734375, 6.4150390625, 6.63330078125, 6.8515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 3.0, 15.0, 12.0, 23.0, 21.0, 41.0, 72.0, 110.0, 144.0, 269.0, 462.0, 879.0, 1779.0, 3947.0, 8599.0, 21817.0, 59921.0, 182656.0, 409839.0, 234512.0, 77137.0, 26985.0, 10443.0, 4447.0, 2001.0, 1053.0, 548.0, 310.0, 162.0, 113.0, 65.0, 51.0, 35.0, 18.0, 17.0, 11.0, 7.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.0390625, -13.594970703125, -13.15087890625, -12.706787109375, -12.2626953125, -11.818603515625, -11.37451171875, -10.930419921875, -10.486328125, -10.042236328125, -9.59814453125, -9.154052734375, -8.7099609375, -8.265869140625, -7.82177734375, -7.377685546875, -6.93359375, -6.489501953125, -6.04541015625, -5.601318359375, -5.1572265625, -4.713134765625, -4.26904296875, -3.824951171875, -3.380859375, -2.936767578125, -2.49267578125, -2.048583984375, -1.6044921875, -1.160400390625, -0.71630859375, -0.272216796875, 0.171875, 0.615966796875, 1.06005859375, 1.504150390625, 1.9482421875, 2.392333984375, 2.83642578125, 3.280517578125, 3.724609375, 4.168701171875, 4.61279296875, 5.056884765625, 5.5009765625, 5.945068359375, 6.38916015625, 6.833251953125, 7.27734375, 7.721435546875, 8.16552734375, 8.609619140625, 9.0537109375, 9.497802734375, 9.94189453125, 10.385986328125, 10.830078125, 11.274169921875, 11.71826171875, 12.162353515625, 12.6064453125, 13.050537109375, 13.49462890625, 13.938720703125, 14.3828125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 16.0, 14.0, 20.0, 32.0, 41.0, 40.0, 66.0, 85.0, 84.0, 93.0, 104.0, 86.0, 70.0, 46.0, 43.0, 29.0, 25.0, 13.0, 15.0, 13.0, 11.0, 3.0, 4.0, 10.0, 7.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006146430969238281, -0.0005947276949882507, -0.0005748122930526733, -0.000554896891117096, -0.0005349814891815186, -0.0005150660872459412, -0.0004951506853103638, -0.0004752352833747864, -0.000455319881439209, -0.0004354044795036316, -0.0004154890775680542, -0.0003955736756324768, -0.0003756582736968994, -0.000355742871761322, -0.00033582746982574463, -0.00031591206789016724, -0.00029599666595458984, -0.00027608126401901245, -0.00025616586208343506, -0.00023625046014785767, -0.00021633505821228027, -0.00019641965627670288, -0.0001765042543411255, -0.0001565888524055481, -0.0001366734504699707, -0.00011675804853439331, -9.684264659881592e-05, -7.692724466323853e-05, -5.701184272766113e-05, -3.709644079208374e-05, -1.7181038856506348e-05, 2.734363079071045e-06, 2.2649765014648438e-05, 4.256516695022583e-05, 6.248056888580322e-05, 8.239597082138062e-05, 0.00010231137275695801, 0.0001222267746925354, 0.0001421421766281128, 0.00016205757856369019, 0.00018197298049926758, 0.00020188838243484497, 0.00022180378437042236, 0.00024171918630599976, 0.00026163458824157715, 0.00028154999017715454, 0.00030146539211273193, 0.0003213807940483093, 0.0003412961959838867, 0.0003612115979194641, 0.0003811269998550415, 0.0004010424017906189, 0.0004209578037261963, 0.0004408732056617737, 0.0004607886075973511, 0.00048070400953292847, 0.0005006194114685059, 0.0005205348134040833, 0.0005404502153396606, 0.000560365617275238, 0.0005802810192108154, 0.0006001964211463928, 0.0006201118230819702, 0.0006400272250175476, 0.000659942626953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 15.0, 13.0, 22.0, 45.0, 58.0, 77.0, 108.0, 161.0, 257.0, 370.0, 533.0, 785.0, 1240.0, 2007.0, 3337.0, 5263.0, 8777.0, 14567.0, 25191.0, 43964.0, 74912.0, 122044.0, 170988.0, 184085.0, 149997.0, 97944.0, 58572.0, 33782.0, 19376.0, 11586.0, 6874.0, 4254.0, 2568.0, 1652.0, 1079.0, 717.0, 423.0, 281.0, 196.0, 143.0, 84.0, 60.0, 49.0, 20.0, 24.0, 22.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.63671875, -6.4310302734375, -6.225341796875, -6.0196533203125, -5.81396484375, -5.6082763671875, -5.402587890625, -5.1968994140625, -4.9912109375, -4.7855224609375, -4.579833984375, -4.3741455078125, -4.16845703125, -3.9627685546875, -3.757080078125, -3.5513916015625, -3.345703125, -3.1400146484375, -2.934326171875, -2.7286376953125, -2.52294921875, -2.3172607421875, -2.111572265625, -1.9058837890625, -1.7001953125, -1.4945068359375, -1.288818359375, -1.0831298828125, -0.87744140625, -0.6717529296875, -0.466064453125, -0.2603759765625, -0.0546875, 0.1510009765625, 0.356689453125, 0.5623779296875, 0.76806640625, 0.9737548828125, 1.179443359375, 1.3851318359375, 1.5908203125, 1.7965087890625, 2.002197265625, 2.2078857421875, 2.41357421875, 2.6192626953125, 2.824951171875, 3.0306396484375, 3.236328125, 3.4420166015625, 3.647705078125, 3.8533935546875, 4.05908203125, 4.2647705078125, 4.470458984375, 4.6761474609375, 4.8818359375, 5.0875244140625, 5.293212890625, 5.4989013671875, 5.70458984375, 5.9102783203125, 6.115966796875, 6.3216552734375, 6.52734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 14.0, 10.0, 15.0, 21.0, 36.0, 29.0, 54.0, 70.0, 73.0, 65.0, 68.0, 74.0, 71.0, 82.0, 67.0, 56.0, 39.0, 34.0, 25.0, 31.0, 12.0, 16.0, 6.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.55828857421875, -3.4447021484375, -3.33111572265625, -3.217529296875, -3.10394287109375, -2.9903564453125, -2.87677001953125, -2.76318359375, -2.64959716796875, -2.5360107421875, -2.42242431640625, -2.308837890625, -2.19525146484375, -2.0816650390625, -1.96807861328125, -1.8544921875, -1.74090576171875, -1.6273193359375, -1.51373291015625, -1.400146484375, -1.28656005859375, -1.1729736328125, -1.05938720703125, -0.94580078125, -0.83221435546875, -0.7186279296875, -0.60504150390625, -0.491455078125, -0.37786865234375, -0.2642822265625, -0.15069580078125, -0.037109375, 0.07647705078125, 0.1900634765625, 0.30364990234375, 0.417236328125, 0.53082275390625, 0.6444091796875, 0.75799560546875, 0.87158203125, 0.98516845703125, 1.0987548828125, 1.21234130859375, 1.325927734375, 1.43951416015625, 1.5531005859375, 1.66668701171875, 1.7802734375, 1.89385986328125, 2.0074462890625, 2.12103271484375, 2.234619140625, 2.34820556640625, 2.4617919921875, 2.57537841796875, 2.68896484375, 2.80255126953125, 2.9161376953125, 3.02972412109375, 3.143310546875, 3.25689697265625, 3.3704833984375, 3.48406982421875, 3.59765625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 8.0, 13.0, 9.0, 12.0, 27.0, 14.0, 31.0, 27.0, 32.0, 35.0, 39.0, 47.0, 32.0, 45.0, 52.0, 51.0, 57.0, 50.0, 40.0, 49.0, 53.0, 41.0, 44.0, 19.0, 25.0, 18.0, 16.0, 13.0, 19.0, 17.0, 11.0, 9.0, 5.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.239821434020996, -9.9097261428833, -9.579631805419922, -9.249536514282227, -8.919442176818848, -8.589346885681152, -8.259252548217773, -7.929157257080078, -7.599062442779541, -7.268967628479004, -6.938872814178467, -6.60877799987793, -6.278682708740234, -5.9485883712768555, -5.61849308013916, -5.288398265838623, -4.958303451538086, -4.628208637237549, -4.298113822937012, -3.9680187702178955, -3.6379239559173584, -3.3078291416168213, -2.977734088897705, -2.647639274597168, -2.317544460296631, -1.9874496459960938, -1.657354712486267, -1.3272597789764404, -0.9971649646759033, -0.6670701503753662, -0.33697521686553955, -0.006880283355712891, 0.3232154846191406, 0.6533103585243225, 0.9834052324295044, 1.313500165939331, 1.6435949802398682, 1.9736897945404053, 2.3037848472595215, 2.6338796615600586, 2.9639744758605957, 3.294069290161133, 3.62416410446167, 3.954259157180786, 4.284354209899902, 4.614448547363281, 4.944543838500977, 5.274638652801514, 5.604733467102051, 5.934828281402588, 6.264923095703125, 6.595017910003662, 6.925112724304199, 7.2552080154418945, 7.585302829742432, 7.915397644042969, 8.245492935180664, 8.57558822631836, 8.905682563781738, 9.235777854919434, 9.565872192382812, 9.895967483520508, 10.226061820983887, 10.556157112121582, 10.886251449584961]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 15.0, 14.0, 12.0, 19.0, 20.0, 27.0, 29.0, 33.0, 25.0, 36.0, 35.0, 50.0, 35.0, 40.0, 40.0, 38.0, 43.0, 41.0, 46.0, 41.0, 41.0, 34.0, 30.0, 42.0, 22.0, 29.0, 20.0, 18.0, 19.0, 17.0, 14.0, 14.0, 8.0, 3.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.418608665466309, -10.10146427154541, -9.784318923950195, -9.467174530029297, -9.150030136108398, -8.8328857421875, -8.515740394592285, -8.198596000671387, -7.88145112991333, -7.564306259155273, -7.247161865234375, -6.930016994476318, -6.612872123718262, -6.295727729797363, -5.978582859039307, -5.66143798828125, -5.344293594360352, -5.027148723602295, -4.7100043296813965, -4.39285945892334, -4.075715065002441, -3.7585701942443848, -3.441425323486328, -3.1242806911468506, -2.807136058807373, -2.4899914264678955, -2.172846794128418, -1.8557019233703613, -1.5385572910308838, -1.2214126586914062, -0.9042679071426392, -0.5871231555938721, -0.2699775695800781, 0.04716712236404419, 0.3643118143081665, 0.6814565062522888, 0.9986011981964111, 1.3157458305358887, 1.6328905820846558, 1.9500353336334229, 2.2671799659729004, 2.584324598312378, 2.9014692306518555, 3.218614101409912, 3.5357587337493896, 3.852903366088867, 4.170048236846924, 4.4871931076049805, 4.804337501525879, 5.1214823722839355, 5.438626766204834, 5.755771636962891, 6.072916030883789, 6.390060901641846, 6.707205772399902, 7.024350166320801, 7.341495037078857, 7.658639907836914, 7.9757843017578125, 8.292928695678711, 8.610074043273926, 8.927218437194824, 9.244362831115723, 9.561508178710938, 9.878652572631836]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 6.0, 8.0, 19.0, 35.0, 35.0, 62.0, 110.0, 182.0, 250.0, 423.0, 662.0, 961.0, 1592.0, 2441.0, 3735.0, 5823.0, 8993.0, 13921.0, 21888.0, 33646.0, 50021.0, 72179.0, 97642.0, 121185.0, 133872.0, 126920.0, 106555.0, 79921.0, 56601.0, 38230.0, 24994.0, 16292.0, 10499.0, 6819.0, 4282.0, 2781.0, 1798.0, 1142.0, 695.0, 501.0, 305.0, 185.0, 120.0, 74.0, 60.0, 25.0, 23.0, 16.0, 9.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.2421875, -8.959228515625, -8.67626953125, -8.393310546875, -8.1103515625, -7.827392578125, -7.54443359375, -7.261474609375, -6.978515625, -6.695556640625, -6.41259765625, -6.129638671875, -5.8466796875, -5.563720703125, -5.28076171875, -4.997802734375, -4.71484375, -4.431884765625, -4.14892578125, -3.865966796875, -3.5830078125, -3.300048828125, -3.01708984375, -2.734130859375, -2.451171875, -2.168212890625, -1.88525390625, -1.602294921875, -1.3193359375, -1.036376953125, -0.75341796875, -0.470458984375, -0.1875, 0.095458984375, 0.37841796875, 0.661376953125, 0.9443359375, 1.227294921875, 1.51025390625, 1.793212890625, 2.076171875, 2.359130859375, 2.64208984375, 2.925048828125, 3.2080078125, 3.490966796875, 3.77392578125, 4.056884765625, 4.33984375, 4.622802734375, 4.90576171875, 5.188720703125, 5.4716796875, 5.754638671875, 6.03759765625, 6.320556640625, 6.603515625, 6.886474609375, 7.16943359375, 7.452392578125, 7.7353515625, 8.018310546875, 8.30126953125, 8.584228515625, 8.8671875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 5.0, 3.0, 4.0, 4.0, 11.0, 14.0, 9.0, 10.0, 16.0, 16.0, 18.0, 26.0, 32.0, 30.0, 34.0, 35.0, 33.0, 33.0, 45.0, 39.0, 28.0, 45.0, 36.0, 38.0, 48.0, 32.0, 32.0, 39.0, 37.0, 35.0, 25.0, 31.0, 27.0, 23.0, 16.0, 9.0, 17.0, 21.0, 7.0, 5.0, 7.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.78125, -8.4896240234375, -8.197998046875, -7.9063720703125, -7.61474609375, -7.3231201171875, -7.031494140625, -6.7398681640625, -6.4482421875, -6.1566162109375, -5.864990234375, -5.5733642578125, -5.28173828125, -4.9901123046875, -4.698486328125, -4.4068603515625, -4.115234375, -3.8236083984375, -3.531982421875, -3.2403564453125, -2.94873046875, -2.6571044921875, -2.365478515625, -2.0738525390625, -1.7822265625, -1.4906005859375, -1.198974609375, -0.9073486328125, -0.61572265625, -0.3240966796875, -0.032470703125, 0.2591552734375, 0.55078125, 0.8424072265625, 1.134033203125, 1.4256591796875, 1.71728515625, 2.0089111328125, 2.300537109375, 2.5921630859375, 2.8837890625, 3.1754150390625, 3.467041015625, 3.7586669921875, 4.05029296875, 4.3419189453125, 4.633544921875, 4.9251708984375, 5.216796875, 5.5084228515625, 5.800048828125, 6.0916748046875, 6.38330078125, 6.6749267578125, 6.966552734375, 7.2581787109375, 7.5498046875, 7.8414306640625, 8.133056640625, 8.4246826171875, 8.71630859375, 9.0079345703125, 9.299560546875, 9.5911865234375, 9.8828125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 12.0, 16.0, 22.0, 34.0, 36.0, 58.0, 89.0, 121.0, 202.0, 275.0, 409.0, 662.0, 1031.0, 1431.0, 2301.0, 3449.0, 5294.0, 8079.0, 12488.0, 19132.0, 29676.0, 43812.0, 63608.0, 86665.0, 111966.0, 128151.0, 128587.0, 112715.0, 89528.0, 65518.0, 45277.0, 30475.0, 20101.0, 12969.0, 8360.0, 5526.0, 3514.0, 2370.0, 1589.0, 985.0, 680.0, 441.0, 270.0, 222.0, 121.0, 83.0, 69.0, 46.0, 32.0, 18.0, 11.0, 9.0, 6.0, 4.0, 3.0, 4.0], "bins": [-8.53125, -8.2806396484375, -8.030029296875, -7.7794189453125, -7.52880859375, -7.2781982421875, -7.027587890625, -6.7769775390625, -6.5263671875, -6.2757568359375, -6.025146484375, -5.7745361328125, -5.52392578125, -5.2733154296875, -5.022705078125, -4.7720947265625, -4.521484375, -4.2708740234375, -4.020263671875, -3.7696533203125, -3.51904296875, -3.2684326171875, -3.017822265625, -2.7672119140625, -2.5166015625, -2.2659912109375, -2.015380859375, -1.7647705078125, -1.51416015625, -1.2635498046875, -1.012939453125, -0.7623291015625, -0.51171875, -0.2611083984375, -0.010498046875, 0.2401123046875, 0.49072265625, 0.7413330078125, 0.991943359375, 1.2425537109375, 1.4931640625, 1.7437744140625, 1.994384765625, 2.2449951171875, 2.49560546875, 2.7462158203125, 2.996826171875, 3.2474365234375, 3.498046875, 3.7486572265625, 3.999267578125, 4.2498779296875, 4.50048828125, 4.7510986328125, 5.001708984375, 5.2523193359375, 5.5029296875, 5.7535400390625, 6.004150390625, 6.2547607421875, 6.50537109375, 6.7559814453125, 7.006591796875, 7.2572021484375, 7.5078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 1.0, 4.0, 6.0, 14.0, 11.0, 12.0, 13.0, 16.0, 13.0, 16.0, 19.0, 33.0, 33.0, 32.0, 40.0, 33.0, 40.0, 34.0, 40.0, 46.0, 50.0, 36.0, 32.0, 32.0, 32.0, 33.0, 38.0, 40.0, 26.0, 34.0, 24.0, 25.0, 26.0, 16.0, 19.0, 15.0, 14.0, 10.0, 3.0, 5.0, 5.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.23046875, -5.04217529296875, -4.8538818359375, -4.66558837890625, -4.477294921875, -4.28900146484375, -4.1007080078125, -3.91241455078125, -3.72412109375, -3.53582763671875, -3.3475341796875, -3.15924072265625, -2.970947265625, -2.78265380859375, -2.5943603515625, -2.40606689453125, -2.2177734375, -2.02947998046875, -1.8411865234375, -1.65289306640625, -1.464599609375, -1.27630615234375, -1.0880126953125, -0.89971923828125, -0.71142578125, -0.52313232421875, -0.3348388671875, -0.14654541015625, 0.041748046875, 0.23004150390625, 0.4183349609375, 0.60662841796875, 0.794921875, 0.98321533203125, 1.1715087890625, 1.35980224609375, 1.548095703125, 1.73638916015625, 1.9246826171875, 2.11297607421875, 2.30126953125, 2.48956298828125, 2.6778564453125, 2.86614990234375, 3.054443359375, 3.24273681640625, 3.4310302734375, 3.61932373046875, 3.8076171875, 3.99591064453125, 4.1842041015625, 4.37249755859375, 4.560791015625, 4.74908447265625, 4.9373779296875, 5.12567138671875, 5.31396484375, 5.50225830078125, 5.6905517578125, 5.87884521484375, 6.067138671875, 6.25543212890625, 6.4437255859375, 6.63201904296875, 6.8203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 10.0, 13.0, 22.0, 34.0, 57.0, 68.0, 123.0, 155.0, 246.0, 384.0, 624.0, 957.0, 1582.0, 2530.0, 4354.0, 7638.0, 13975.0, 26162.0, 49621.0, 96548.0, 171746.0, 229258.0, 194631.0, 116454.0, 61012.0, 31737.0, 16468.0, 9128.0, 5062.0, 3082.0, 1777.0, 1144.0, 653.0, 441.0, 281.0, 188.0, 129.0, 82.0, 56.0, 38.0, 26.0, 24.0, 8.0, 14.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.890625, -8.634033203125, -8.37744140625, -8.120849609375, -7.8642578125, -7.607666015625, -7.35107421875, -7.094482421875, -6.837890625, -6.581298828125, -6.32470703125, -6.068115234375, -5.8115234375, -5.554931640625, -5.29833984375, -5.041748046875, -4.78515625, -4.528564453125, -4.27197265625, -4.015380859375, -3.7587890625, -3.502197265625, -3.24560546875, -2.989013671875, -2.732421875, -2.475830078125, -2.21923828125, -1.962646484375, -1.7060546875, -1.449462890625, -1.19287109375, -0.936279296875, -0.6796875, -0.423095703125, -0.16650390625, 0.090087890625, 0.3466796875, 0.603271484375, 0.85986328125, 1.116455078125, 1.373046875, 1.629638671875, 1.88623046875, 2.142822265625, 2.3994140625, 2.656005859375, 2.91259765625, 3.169189453125, 3.42578125, 3.682373046875, 3.93896484375, 4.195556640625, 4.4521484375, 4.708740234375, 4.96533203125, 5.221923828125, 5.478515625, 5.735107421875, 5.99169921875, 6.248291015625, 6.5048828125, 6.761474609375, 7.01806640625, 7.274658203125, 7.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 10.0, 7.0, 8.0, 7.0, 15.0, 18.0, 37.0, 34.0, 52.0, 70.0, 54.0, 90.0, 83.0, 86.0, 88.0, 82.0, 61.0, 44.0, 38.0, 26.0, 21.0, 20.0, 12.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010852813720703125, -0.001055017113685608, -0.0010247528553009033, -0.0009944885969161987, -0.0009642243385314941, -0.0009339600801467896, -0.000903695821762085, -0.0008734315633773804, -0.0008431673049926758, -0.0008129030466079712, -0.0007826387882232666, -0.000752374529838562, -0.0007221102714538574, -0.0006918460130691528, -0.0006615817546844482, -0.0006313174962997437, -0.0006010532379150391, -0.0005707889795303345, -0.0005405247211456299, -0.0005102604627609253, -0.0004799962043762207, -0.0004497319459915161, -0.0004194676876068115, -0.00038920342922210693, -0.00035893917083740234, -0.00032867491245269775, -0.00029841065406799316, -0.0002681463956832886, -0.00023788213729858398, -0.0002076178789138794, -0.0001773536205291748, -0.00014708936214447021, -0.00011682510375976562, -8.656084537506104e-05, -5.6296586990356445e-05, -2.6032328605651855e-05, 4.231929779052734e-06, 3.4496188163757324e-05, 6.476044654846191e-05, 9.50247049331665e-05, 0.0001252889633178711, 0.00015555322170257568, 0.00018581748008728027, 0.00021608173847198486, 0.00024634599685668945, 0.00027661025524139404, 0.00030687451362609863, 0.0003371387720108032, 0.0003674030303955078, 0.0003976672887802124, 0.000427931547164917, 0.0004581958055496216, 0.0004884600639343262, 0.0005187243223190308, 0.0005489885807037354, 0.0005792528390884399, 0.0006095170974731445, 0.0006397813558578491, 0.0006700456142425537, 0.0007003098726272583, 0.0007305741310119629, 0.0007608383893966675, 0.0007911026477813721, 0.0008213669061660767, 0.0008516311645507812]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 3.0, 2.0, 5.0, 10.0, 21.0, 11.0, 35.0, 49.0, 64.0, 96.0, 146.0, 225.0, 357.0, 523.0, 900.0, 1388.0, 2291.0, 3667.0, 6571.0, 10770.0, 18799.0, 32708.0, 56964.0, 93410.0, 142855.0, 180411.0, 172318.0, 127256.0, 81352.0, 48207.0, 27849.0, 16176.0, 9161.0, 5407.0, 3147.0, 1935.0, 1268.0, 738.0, 525.0, 332.0, 208.0, 127.0, 91.0, 48.0, 42.0, 27.0, 22.0, 19.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.63671875, -5.44134521484375, -5.2459716796875, -5.05059814453125, -4.855224609375, -4.65985107421875, -4.4644775390625, -4.26910400390625, -4.07373046875, -3.87835693359375, -3.6829833984375, -3.48760986328125, -3.292236328125, -3.09686279296875, -2.9014892578125, -2.70611572265625, -2.5107421875, -2.31536865234375, -2.1199951171875, -1.92462158203125, -1.729248046875, -1.53387451171875, -1.3385009765625, -1.14312744140625, -0.94775390625, -0.75238037109375, -0.5570068359375, -0.36163330078125, -0.166259765625, 0.02911376953125, 0.2244873046875, 0.41986083984375, 0.615234375, 0.81060791015625, 1.0059814453125, 1.20135498046875, 1.396728515625, 1.59210205078125, 1.7874755859375, 1.98284912109375, 2.17822265625, 2.37359619140625, 2.5689697265625, 2.76434326171875, 2.959716796875, 3.15509033203125, 3.3504638671875, 3.54583740234375, 3.7412109375, 3.93658447265625, 4.1319580078125, 4.32733154296875, 4.522705078125, 4.71807861328125, 4.9134521484375, 5.10882568359375, 5.30419921875, 5.49957275390625, 5.6949462890625, 5.89031982421875, 6.085693359375, 6.28106689453125, 6.4764404296875, 6.67181396484375, 6.8671875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 12.0, 9.0, 14.0, 13.0, 19.0, 18.0, 23.0, 22.0, 38.0, 36.0, 44.0, 61.0, 62.0, 69.0, 55.0, 53.0, 51.0, 62.0, 44.0, 45.0, 34.0, 39.0, 17.0, 19.0, 19.0, 16.0, 13.0, 13.0, 9.0, 6.0, 4.0, 7.0, 5.0, 3.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.099609375, -2.037750244140625, -1.97589111328125, -1.914031982421875, -1.8521728515625, -1.790313720703125, -1.72845458984375, -1.666595458984375, -1.604736328125, -1.542877197265625, -1.48101806640625, -1.419158935546875, -1.3572998046875, -1.295440673828125, -1.23358154296875, -1.171722412109375, -1.10986328125, -1.048004150390625, -0.98614501953125, -0.924285888671875, -0.8624267578125, -0.800567626953125, -0.73870849609375, -0.676849365234375, -0.614990234375, -0.553131103515625, -0.49127197265625, -0.429412841796875, -0.3675537109375, -0.305694580078125, -0.24383544921875, -0.181976318359375, -0.1201171875, -0.058258056640625, 0.00360107421875, 0.065460205078125, 0.1273193359375, 0.189178466796875, 0.25103759765625, 0.312896728515625, 0.374755859375, 0.436614990234375, 0.49847412109375, 0.560333251953125, 0.6221923828125, 0.684051513671875, 0.74591064453125, 0.807769775390625, 0.86962890625, 0.931488037109375, 0.99334716796875, 1.055206298828125, 1.1170654296875, 1.178924560546875, 1.24078369140625, 1.302642822265625, 1.364501953125, 1.426361083984375, 1.48822021484375, 1.550079345703125, 1.6119384765625, 1.673797607421875, 1.73565673828125, 1.797515869140625, 1.859375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 7.0, 9.0, 8.0, 5.0, 9.0, 15.0, 16.0, 19.0, 30.0, 35.0, 27.0, 43.0, 27.0, 35.0, 50.0, 51.0, 59.0, 57.0, 52.0, 55.0, 59.0, 63.0, 38.0, 27.0, 30.0, 30.0, 15.0, 20.0, 22.0, 13.0, 21.0, 13.0, 13.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8006591796875, -10.46111011505127, -10.121562004089355, -9.782012939453125, -9.442464828491211, -9.10291576385498, -8.76336669921875, -8.423818588256836, -8.084270477294922, -7.74472188949585, -7.405173301696777, -7.065624237060547, -6.726076126098633, -6.386527061462402, -6.04697847366333, -5.707429885864258, -5.367880821228027, -5.028332233428955, -4.688783645629883, -4.349234580993652, -4.009686470031738, -3.670137643814087, -3.3305888175964355, -2.9910402297973633, -2.651491641998291, -2.3119430541992188, -1.972394347190857, -1.6328456401824951, -1.2932970523834229, -0.9537484645843506, -0.6141996383666992, -0.27465105056762695, 0.0648965835571289, 0.40444523096084595, 0.743993878364563, 1.0835425853729248, 1.423091173171997, 1.7626397609710693, 2.1021885871887207, 2.441737174987793, 2.7812857627868652, 3.1208343505859375, 3.4603829383850098, 3.799931764602661, 4.1394805908203125, 4.479028701782227, 4.818577766418457, 5.158126354217529, 5.497674942016602, 5.837223529815674, 6.176772117614746, 6.516321182250977, 6.855869293212891, 7.195418357849121, 7.534966945648193, 7.874515533447266, 8.21406364440918, 8.55361270904541, 8.893160820007324, 9.232709884643555, 9.572257995605469, 9.9118070602417, 10.25135612487793, 10.590904235839844, 10.930453300476074]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 11.0, 4.0, 7.0, 7.0, 5.0, 22.0, 19.0, 18.0, 18.0, 29.0, 30.0, 22.0, 41.0, 32.0, 32.0, 37.0, 46.0, 43.0, 43.0, 57.0, 47.0, 42.0, 41.0, 39.0, 42.0, 50.0, 25.0, 25.0, 30.0, 21.0, 20.0, 15.0, 14.0, 13.0, 12.0, 6.0, 14.0, 13.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.268064498901367, -11.931300163269043, -11.594535827636719, -11.257771492004395, -10.92100715637207, -10.58424186706543, -10.247477531433105, -9.910713195800781, -9.573948860168457, -9.237184524536133, -8.900420188903809, -8.563655853271484, -8.226890563964844, -7.890126705169678, -7.553361892700195, -7.216597557067871, -6.879833221435547, -6.543068885803223, -6.206304550170898, -5.869539737701416, -5.532775402069092, -5.196011066436768, -4.859246253967285, -4.522481918334961, -4.185717582702637, -3.8489532470703125, -3.512188673019409, -3.175424098968506, -2.8386597633361816, -2.5018954277038574, -2.165130853652954, -1.8283662796020508, -1.4916009902954102, -1.1548365354537964, -0.8180720806121826, -0.48130762577056885, -0.14454317092895508, 0.1922212839126587, 0.5289857387542725, 0.8657503128051758, 1.2025146484375, 1.5392791032791138, 1.8760435581207275, 2.212808132171631, 2.549572467803955, 2.8863368034362793, 3.2231013774871826, 3.559865951538086, 3.89663028717041, 4.233394622802734, 4.570158958435059, 4.906923770904541, 5.243688106536865, 5.5804524421691895, 5.917217254638672, 6.253981590270996, 6.59074592590332, 6.9275102615356445, 7.264274597167969, 7.601039409637451, 7.937803745269775, 8.274568557739258, 8.611332893371582, 8.948097229003906, 9.28486156463623]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 17.0, 22.0, 21.0, 41.0, 77.0, 91.0, 121.0, 218.0, 316.0, 478.0, 824.0, 1276.0, 2062.0, 3310.0, 5614.0, 9646.0, 17168.0, 31603.0, 60088.0, 124412.0, 277687.0, 632249.0, 1075374.0, 988782.0, 520217.0, 225755.0, 102809.0, 50870.0, 27109.0, 14856.0, 8553.0, 4830.0, 2987.0, 1799.0, 1101.0, 683.0, 399.0, 272.0, 175.0, 111.0, 71.0, 57.0, 31.0, 22.0, 16.0, 9.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-11.6484375, -11.3045654296875, -10.960693359375, -10.6168212890625, -10.27294921875, -9.9290771484375, -9.585205078125, -9.2413330078125, -8.8974609375, -8.5535888671875, -8.209716796875, -7.8658447265625, -7.52197265625, -7.1781005859375, -6.834228515625, -6.4903564453125, -6.146484375, -5.8026123046875, -5.458740234375, -5.1148681640625, -4.77099609375, -4.4271240234375, -4.083251953125, -3.7393798828125, -3.3955078125, -3.0516357421875, -2.707763671875, -2.3638916015625, -2.02001953125, -1.6761474609375, -1.332275390625, -0.9884033203125, -0.64453125, -0.3006591796875, 0.043212890625, 0.3870849609375, 0.73095703125, 1.0748291015625, 1.418701171875, 1.7625732421875, 2.1064453125, 2.4503173828125, 2.794189453125, 3.1380615234375, 3.48193359375, 3.8258056640625, 4.169677734375, 4.5135498046875, 4.857421875, 5.2012939453125, 5.545166015625, 5.8890380859375, 6.23291015625, 6.5767822265625, 6.920654296875, 7.2645263671875, 7.6083984375, 7.9522705078125, 8.296142578125, 8.6400146484375, 8.98388671875, 9.3277587890625, 9.671630859375, 10.0155029296875, 10.359375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 11.0, 7.0, 6.0, 10.0, 11.0, 20.0, 15.0, 18.0, 28.0, 23.0, 37.0, 34.0, 37.0, 27.0, 37.0, 33.0, 50.0, 46.0, 54.0, 58.0, 52.0, 39.0, 48.0, 46.0, 32.0, 39.0, 17.0, 29.0, 15.0, 21.0, 16.0, 16.0, 18.0, 14.0, 9.0, 3.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.6484375, -8.41119384765625, -8.1739501953125, -7.93670654296875, -7.699462890625, -7.46221923828125, -7.2249755859375, -6.98773193359375, -6.75048828125, -6.51324462890625, -6.2760009765625, -6.03875732421875, -5.801513671875, -5.56427001953125, -5.3270263671875, -5.08978271484375, -4.8525390625, -4.61529541015625, -4.3780517578125, -4.14080810546875, -3.903564453125, -3.66632080078125, -3.4290771484375, -3.19183349609375, -2.95458984375, -2.71734619140625, -2.4801025390625, -2.24285888671875, -2.005615234375, -1.76837158203125, -1.5311279296875, -1.29388427734375, -1.056640625, -0.81939697265625, -0.5821533203125, -0.34490966796875, -0.107666015625, 0.12957763671875, 0.3668212890625, 0.60406494140625, 0.84130859375, 1.07855224609375, 1.3157958984375, 1.55303955078125, 1.790283203125, 2.02752685546875, 2.2647705078125, 2.50201416015625, 2.7392578125, 2.97650146484375, 3.2137451171875, 3.45098876953125, 3.688232421875, 3.92547607421875, 4.1627197265625, 4.39996337890625, 4.63720703125, 4.87445068359375, 5.1116943359375, 5.34893798828125, 5.586181640625, 5.82342529296875, 6.0606689453125, 6.29791259765625, 6.53515625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 7.0, 17.0, 33.0, 46.0, 64.0, 105.0, 159.0, 263.0, 398.0, 602.0, 986.0, 1540.0, 2371.0, 3925.0, 6503.0, 10916.0, 18999.0, 32902.0, 58653.0, 107317.0, 199822.0, 370548.0, 654602.0, 926608.0, 776236.0, 461904.0, 252151.0, 134907.0, 73940.0, 40775.0, 23056.0, 13468.0, 8070.0, 4720.0, 2927.0, 1754.0, 1072.0, 682.0, 449.0, 276.0, 175.0, 131.0, 67.0, 41.0, 38.0, 26.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4453125, -9.147216796875, -8.84912109375, -8.551025390625, -8.2529296875, -7.954833984375, -7.65673828125, -7.358642578125, -7.060546875, -6.762451171875, -6.46435546875, -6.166259765625, -5.8681640625, -5.570068359375, -5.27197265625, -4.973876953125, -4.67578125, -4.377685546875, -4.07958984375, -3.781494140625, -3.4833984375, -3.185302734375, -2.88720703125, -2.589111328125, -2.291015625, -1.992919921875, -1.69482421875, -1.396728515625, -1.0986328125, -0.800537109375, -0.50244140625, -0.204345703125, 0.09375, 0.391845703125, 0.68994140625, 0.988037109375, 1.2861328125, 1.584228515625, 1.88232421875, 2.180419921875, 2.478515625, 2.776611328125, 3.07470703125, 3.372802734375, 3.6708984375, 3.968994140625, 4.26708984375, 4.565185546875, 4.86328125, 5.161376953125, 5.45947265625, 5.757568359375, 6.0556640625, 6.353759765625, 6.65185546875, 6.949951171875, 7.248046875, 7.546142578125, 7.84423828125, 8.142333984375, 8.4404296875, 8.738525390625, 9.03662109375, 9.334716796875, 9.6328125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 14.0, 16.0, 21.0, 27.0, 44.0, 51.0, 69.0, 70.0, 78.0, 113.0, 159.0, 162.0, 202.0, 257.0, 258.0, 260.0, 323.0, 283.0, 272.0, 243.0, 195.0, 162.0, 147.0, 112.0, 113.0, 83.0, 75.0, 53.0, 39.0, 36.0, 31.0, 23.0, 21.0, 13.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.6328125, -3.51702880859375, -3.4012451171875, -3.28546142578125, -3.169677734375, -3.05389404296875, -2.9381103515625, -2.82232666015625, -2.70654296875, -2.59075927734375, -2.4749755859375, -2.35919189453125, -2.243408203125, -2.12762451171875, -2.0118408203125, -1.89605712890625, -1.7802734375, -1.66448974609375, -1.5487060546875, -1.43292236328125, -1.317138671875, -1.20135498046875, -1.0855712890625, -0.96978759765625, -0.85400390625, -0.73822021484375, -0.6224365234375, -0.50665283203125, -0.390869140625, -0.27508544921875, -0.1593017578125, -0.04351806640625, 0.072265625, 0.18804931640625, 0.3038330078125, 0.41961669921875, 0.535400390625, 0.65118408203125, 0.7669677734375, 0.88275146484375, 0.99853515625, 1.11431884765625, 1.2301025390625, 1.34588623046875, 1.461669921875, 1.57745361328125, 1.6932373046875, 1.80902099609375, 1.9248046875, 2.04058837890625, 2.1563720703125, 2.27215576171875, 2.387939453125, 2.50372314453125, 2.6195068359375, 2.73529052734375, 2.85107421875, 2.96685791015625, 3.0826416015625, 3.19842529296875, 3.314208984375, 3.42999267578125, 3.5457763671875, 3.66156005859375, 3.77734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 6.0, 12.0, 10.0, 18.0, 12.0, 16.0, 19.0, 33.0, 28.0, 28.0, 34.0, 34.0, 44.0, 48.0, 45.0, 47.0, 49.0, 54.0, 63.0, 53.0, 34.0, 39.0, 42.0, 35.0, 28.0, 25.0, 19.0, 17.0, 21.0, 12.0, 14.0, 8.0, 7.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.11755084991455, -7.827308177947998, -7.537065505981445, -7.246822834014893, -6.95658016204834, -6.666337966918945, -6.376095294952393, -6.08585262298584, -5.795609951019287, -5.505367279052734, -5.215124607086182, -4.924881935119629, -4.634639739990234, -4.344396591186523, -4.054154396057129, -3.763911724090576, -3.4736690521240234, -3.1834263801574707, -2.893183708190918, -2.6029412746429443, -2.3126986026763916, -2.022455930709839, -1.7322133779525757, -1.4419708251953125, -1.1517281532287598, -0.8614855408668518, -0.5712429285049438, -0.2810003161430359, 0.00924229621887207, 0.2994849681854248, 0.589727520942688, 0.8799700736999512, 1.170212745666504, 1.4604554176330566, 1.7506979703903198, 2.040940523147583, 2.3311831951141357, 2.6214258670806885, 2.911668300628662, 3.201910972595215, 3.4921536445617676, 3.7823963165283203, 4.072638988494873, 4.362881660461426, 4.65312385559082, 4.943367004394531, 5.233609199523926, 5.5238518714904785, 5.814094543457031, 6.104337215423584, 6.394579887390137, 6.6848225593566895, 6.975065231323242, 7.265307426452637, 7.5555500984191895, 7.845792770385742, 8.136035919189453, 8.426278114318848, 8.716521263122559, 9.006763458251953, 9.297006607055664, 9.587248802185059, 9.87749195098877, 10.167734146118164, 10.457976341247559]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 4.0, 9.0, 5.0, 11.0, 19.0, 18.0, 14.0, 22.0, 17.0, 22.0, 33.0, 30.0, 27.0, 26.0, 37.0, 34.0, 37.0, 42.0, 34.0, 38.0, 37.0, 48.0, 44.0, 41.0, 38.0, 29.0, 38.0, 31.0, 31.0, 22.0, 23.0, 26.0, 22.0, 17.0, 13.0, 9.0, 4.0, 9.0, 12.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-9.299307823181152, -9.035682678222656, -8.77205753326416, -8.508432388305664, -8.244807243347168, -7.981182098388672, -7.717556953430176, -7.45393180847168, -7.190306663513184, -6.9266815185546875, -6.663056373596191, -6.399431228637695, -6.135806083679199, -5.872180938720703, -5.608555793762207, -5.344930648803711, -5.081305503845215, -4.817680358886719, -4.554055213928223, -4.290430068969727, -4.0268049240112305, -3.7631797790527344, -3.4995546340942383, -3.235929489135742, -2.972304344177246, -2.70867919921875, -2.445054054260254, -2.181428909301758, -1.9178037643432617, -1.6541786193847656, -1.3905534744262695, -1.1269283294677734, -0.8633027076721191, -0.599677562713623, -0.33605241775512695, -0.07242727279663086, 0.19119787216186523, 0.45482301712036133, 0.7184481620788574, 0.9820733070373535, 1.2456984519958496, 1.5093235969543457, 1.7729487419128418, 2.036573886871338, 2.300199031829834, 2.56382417678833, 2.827449321746826, 3.0910744667053223, 3.3546996116638184, 3.6183247566223145, 3.8819499015808105, 4.145575046539307, 4.409200191497803, 4.672825336456299, 4.936450481414795, 5.200075626373291, 5.463700771331787, 5.727325916290283, 5.990951061248779, 6.254576206207275, 6.5182013511657715, 6.781826496124268, 7.045451641082764, 7.30907678604126, 7.572701930999756]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 7.0, 12.0, 20.0, 21.0, 44.0, 57.0, 77.0, 130.0, 192.0, 328.0, 585.0, 896.0, 1584.0, 2774.0, 5339.0, 10190.0, 21926.0, 50461.0, 119766.0, 249268.0, 289674.0, 166022.0, 70617.0, 29736.0, 13641.0, 6595.0, 3606.0, 1978.0, 1183.0, 687.0, 422.0, 234.0, 169.0, 115.0, 71.0, 47.0, 25.0, 19.0, 18.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.352783203125, -13.87744140625, -13.402099609375, -12.9267578125, -12.451416015625, -11.97607421875, -11.500732421875, -11.025390625, -10.550048828125, -10.07470703125, -9.599365234375, -9.1240234375, -8.648681640625, -8.17333984375, -7.697998046875, -7.22265625, -6.747314453125, -6.27197265625, -5.796630859375, -5.3212890625, -4.845947265625, -4.37060546875, -3.895263671875, -3.419921875, -2.944580078125, -2.46923828125, -1.993896484375, -1.5185546875, -1.043212890625, -0.56787109375, -0.092529296875, 0.3828125, 0.858154296875, 1.33349609375, 1.808837890625, 2.2841796875, 2.759521484375, 3.23486328125, 3.710205078125, 4.185546875, 4.660888671875, 5.13623046875, 5.611572265625, 6.0869140625, 6.562255859375, 7.03759765625, 7.512939453125, 7.98828125, 8.463623046875, 8.93896484375, 9.414306640625, 9.8896484375, 10.364990234375, 10.84033203125, 11.315673828125, 11.791015625, 12.266357421875, 12.74169921875, 13.217041015625, 13.6923828125, 14.167724609375, 14.64306640625, 15.118408203125, 15.59375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 9.0, 5.0, 6.0, 8.0, 21.0, 14.0, 14.0, 17.0, 18.0, 23.0, 27.0, 22.0, 29.0, 22.0, 44.0, 31.0, 26.0, 30.0, 41.0, 38.0, 35.0, 46.0, 40.0, 43.0, 33.0, 34.0, 23.0, 24.0, 33.0, 34.0, 28.0, 23.0, 25.0, 22.0, 15.0, 12.0, 11.0, 13.0, 8.0, 14.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.45703125, -7.20892333984375, -6.9608154296875, -6.71270751953125, -6.464599609375, -6.21649169921875, -5.9683837890625, -5.72027587890625, -5.47216796875, -5.22406005859375, -4.9759521484375, -4.72784423828125, -4.479736328125, -4.23162841796875, -3.9835205078125, -3.73541259765625, -3.4873046875, -3.23919677734375, -2.9910888671875, -2.74298095703125, -2.494873046875, -2.24676513671875, -1.9986572265625, -1.75054931640625, -1.50244140625, -1.25433349609375, -1.0062255859375, -0.75811767578125, -0.510009765625, -0.26190185546875, -0.0137939453125, 0.23431396484375, 0.482421875, 0.73052978515625, 0.9786376953125, 1.22674560546875, 1.474853515625, 1.72296142578125, 1.9710693359375, 2.21917724609375, 2.46728515625, 2.71539306640625, 2.9635009765625, 3.21160888671875, 3.459716796875, 3.70782470703125, 3.9559326171875, 4.20404052734375, 4.4521484375, 4.70025634765625, 4.9483642578125, 5.19647216796875, 5.444580078125, 5.69268798828125, 5.9407958984375, 6.18890380859375, 6.43701171875, 6.68511962890625, 6.9332275390625, 7.18133544921875, 7.429443359375, 7.67755126953125, 7.9256591796875, 8.17376708984375, 8.421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 13.0, 6.0, 15.0, 23.0, 23.0, 23.0, 36.0, 70.0, 69.0, 98.0, 151.0, 247.0, 308.0, 434.0, 692.0, 1018.0, 1587.0, 2460.0, 4074.0, 6903.0, 12094.0, 23674.0, 47711.0, 105733.0, 224292.0, 292118.0, 170421.0, 76708.0, 35422.0, 17595.0, 9592.0, 5523.0, 3340.0, 2012.0, 1280.0, 864.0, 573.0, 398.0, 272.0, 202.0, 133.0, 121.0, 59.0, 51.0, 42.0, 24.0, 11.0, 9.0, 14.0, 9.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.3359375, -13.89208984375, -13.4482421875, -13.00439453125, -12.560546875, -12.11669921875, -11.6728515625, -11.22900390625, -10.78515625, -10.34130859375, -9.8974609375, -9.45361328125, -9.009765625, -8.56591796875, -8.1220703125, -7.67822265625, -7.234375, -6.79052734375, -6.3466796875, -5.90283203125, -5.458984375, -5.01513671875, -4.5712890625, -4.12744140625, -3.68359375, -3.23974609375, -2.7958984375, -2.35205078125, -1.908203125, -1.46435546875, -1.0205078125, -0.57666015625, -0.1328125, 0.31103515625, 0.7548828125, 1.19873046875, 1.642578125, 2.08642578125, 2.5302734375, 2.97412109375, 3.41796875, 3.86181640625, 4.3056640625, 4.74951171875, 5.193359375, 5.63720703125, 6.0810546875, 6.52490234375, 6.96875, 7.41259765625, 7.8564453125, 8.30029296875, 8.744140625, 9.18798828125, 9.6318359375, 10.07568359375, 10.51953125, 10.96337890625, 11.4072265625, 11.85107421875, 12.294921875, 12.73876953125, 13.1826171875, 13.62646484375, 14.0703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0, 4.0, 3.0, 8.0, 12.0, 12.0, 14.0, 12.0, 19.0, 19.0, 13.0, 19.0, 19.0, 23.0, 33.0, 33.0, 31.0, 39.0, 37.0, 31.0, 37.0, 27.0, 48.0, 41.0, 32.0, 38.0, 43.0, 45.0, 36.0, 32.0, 25.0, 25.0, 26.0, 26.0, 23.0, 22.0, 14.0, 3.0, 13.0, 16.0, 7.0, 10.0, 2.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.11328125, -4.95416259765625, -4.7950439453125, -4.63592529296875, -4.476806640625, -4.31768798828125, -4.1585693359375, -3.99945068359375, -3.84033203125, -3.68121337890625, -3.5220947265625, -3.36297607421875, -3.203857421875, -3.04473876953125, -2.8856201171875, -2.72650146484375, -2.5673828125, -2.40826416015625, -2.2491455078125, -2.09002685546875, -1.930908203125, -1.77178955078125, -1.6126708984375, -1.45355224609375, -1.29443359375, -1.13531494140625, -0.9761962890625, -0.81707763671875, -0.657958984375, -0.49884033203125, -0.3397216796875, -0.18060302734375, -0.021484375, 0.13763427734375, 0.2967529296875, 0.45587158203125, 0.614990234375, 0.77410888671875, 0.9332275390625, 1.09234619140625, 1.25146484375, 1.41058349609375, 1.5697021484375, 1.72882080078125, 1.887939453125, 2.04705810546875, 2.2061767578125, 2.36529541015625, 2.5244140625, 2.68353271484375, 2.8426513671875, 3.00177001953125, 3.160888671875, 3.32000732421875, 3.4791259765625, 3.63824462890625, 3.79736328125, 3.95648193359375, 4.1156005859375, 4.27471923828125, 4.433837890625, 4.59295654296875, 4.7520751953125, 4.91119384765625, 5.0703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 9.0, 5.0, 10.0, 17.0, 22.0, 45.0, 40.0, 52.0, 93.0, 153.0, 243.0, 344.0, 570.0, 1019.0, 1755.0, 3206.0, 6234.0, 13189.0, 30150.0, 77326.0, 212385.0, 376333.0, 198360.0, 72801.0, 28520.0, 12586.0, 5895.0, 3054.0, 1616.0, 918.0, 563.0, 360.0, 207.0, 153.0, 90.0, 66.0, 49.0, 36.0, 26.0, 11.0, 14.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.4453125, -9.1630859375, -8.880859375, -8.5986328125, -8.31640625, -8.0341796875, -7.751953125, -7.4697265625, -7.1875, -6.9052734375, -6.623046875, -6.3408203125, -6.05859375, -5.7763671875, -5.494140625, -5.2119140625, -4.9296875, -4.6474609375, -4.365234375, -4.0830078125, -3.80078125, -3.5185546875, -3.236328125, -2.9541015625, -2.671875, -2.3896484375, -2.107421875, -1.8251953125, -1.54296875, -1.2607421875, -0.978515625, -0.6962890625, -0.4140625, -0.1318359375, 0.150390625, 0.4326171875, 0.71484375, 0.9970703125, 1.279296875, 1.5615234375, 1.84375, 2.1259765625, 2.408203125, 2.6904296875, 2.97265625, 3.2548828125, 3.537109375, 3.8193359375, 4.1015625, 4.3837890625, 4.666015625, 4.9482421875, 5.23046875, 5.5126953125, 5.794921875, 6.0771484375, 6.359375, 6.6416015625, 6.923828125, 7.2060546875, 7.48828125, 7.7705078125, 8.052734375, 8.3349609375, 8.6171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 5.0, 9.0, 19.0, 20.0, 31.0, 67.0, 71.0, 99.0, 122.0, 112.0, 114.0, 85.0, 65.0, 49.0, 34.0, 28.0, 13.0, 7.0, 11.0, 9.0, 3.0, 2.0, 1.0, 0.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006365776062011719, -0.000620424747467041, -0.0006042718887329102, -0.0005881190299987793, -0.0005719661712646484, -0.0005558133125305176, -0.0005396604537963867, -0.0005235075950622559, -0.000507354736328125, -0.0004912018775939941, -0.0004750490188598633, -0.0004588961601257324, -0.00044274330139160156, -0.0004265904426574707, -0.00041043758392333984, -0.000394284725189209, -0.0003781318664550781, -0.00036197900772094727, -0.0003458261489868164, -0.00032967329025268555, -0.0003135204315185547, -0.00029736757278442383, -0.00028121471405029297, -0.0002650618553161621, -0.00024890899658203125, -0.0002327561378479004, -0.00021660327911376953, -0.00020045042037963867, -0.0001842975616455078, -0.00016814470291137695, -0.0001519918441772461, -0.00013583898544311523, -0.00011968612670898438, -0.00010353326797485352, -8.738040924072266e-05, -7.12275505065918e-05, -5.507469177246094e-05, -3.892183303833008e-05, -2.276897430419922e-05, -6.616115570068359e-06, 9.5367431640625e-06, 2.568960189819336e-05, 4.184246063232422e-05, 5.799531936645508e-05, 7.414817810058594e-05, 9.03010368347168e-05, 0.00010645389556884766, 0.00012260675430297852, 0.00013875961303710938, 0.00015491247177124023, 0.0001710653305053711, 0.00018721818923950195, 0.0002033710479736328, 0.00021952390670776367, 0.00023567676544189453, 0.0002518296241760254, 0.00026798248291015625, 0.0002841353416442871, 0.00030028820037841797, 0.00031644105911254883, 0.0003325939178466797, 0.00034874677658081055, 0.0003648996353149414, 0.00038105249404907227, 0.0003972053527832031]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 18.0, 18.0, 21.0, 32.0, 52.0, 95.0, 91.0, 153.0, 237.0, 310.0, 475.0, 717.0, 1003.0, 1589.0, 2434.0, 3913.0, 6300.0, 10331.0, 18282.0, 32711.0, 59126.0, 103962.0, 163185.0, 200628.0, 174180.0, 114559.0, 66198.0, 36686.0, 20475.0, 11675.0, 6891.0, 4305.0, 2662.0, 1715.0, 1109.0, 768.0, 526.0, 366.0, 219.0, 170.0, 120.0, 80.0, 57.0, 37.0, 23.0, 15.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.22265625, -5.06243896484375, -4.9022216796875, -4.74200439453125, -4.581787109375, -4.42156982421875, -4.2613525390625, -4.10113525390625, -3.94091796875, -3.78070068359375, -3.6204833984375, -3.46026611328125, -3.300048828125, -3.13983154296875, -2.9796142578125, -2.81939697265625, -2.6591796875, -2.49896240234375, -2.3387451171875, -2.17852783203125, -2.018310546875, -1.85809326171875, -1.6978759765625, -1.53765869140625, -1.37744140625, -1.21722412109375, -1.0570068359375, -0.89678955078125, -0.736572265625, -0.57635498046875, -0.4161376953125, -0.25592041015625, -0.095703125, 0.06451416015625, 0.2247314453125, 0.38494873046875, 0.545166015625, 0.70538330078125, 0.8656005859375, 1.02581787109375, 1.18603515625, 1.34625244140625, 1.5064697265625, 1.66668701171875, 1.826904296875, 1.98712158203125, 2.1473388671875, 2.30755615234375, 2.4677734375, 2.62799072265625, 2.7882080078125, 2.94842529296875, 3.108642578125, 3.26885986328125, 3.4290771484375, 3.58929443359375, 3.74951171875, 3.90972900390625, 4.0699462890625, 4.23016357421875, 4.390380859375, 4.55059814453125, 4.7108154296875, 4.87103271484375, 5.03125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 4.0, 8.0, 6.0, 11.0, 15.0, 14.0, 19.0, 20.0, 37.0, 50.0, 57.0, 52.0, 56.0, 68.0, 86.0, 79.0, 67.0, 56.0, 63.0, 44.0, 40.0, 42.0, 30.0, 19.0, 14.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8837890625, -1.8101654052734375, -1.736541748046875, -1.6629180908203125, -1.58929443359375, -1.5156707763671875, -1.442047119140625, -1.3684234619140625, -1.2947998046875, -1.2211761474609375, -1.147552490234375, -1.0739288330078125, -1.00030517578125, -0.9266815185546875, -0.853057861328125, -0.7794342041015625, -0.705810546875, -0.6321868896484375, -0.558563232421875, -0.4849395751953125, -0.41131591796875, -0.3376922607421875, -0.264068603515625, -0.1904449462890625, -0.1168212890625, -0.0431976318359375, 0.030426025390625, 0.1040496826171875, 0.17767333984375, 0.2512969970703125, 0.324920654296875, 0.3985443115234375, 0.47216796875, 0.5457916259765625, 0.619415283203125, 0.6930389404296875, 0.76666259765625, 0.8402862548828125, 0.913909912109375, 0.9875335693359375, 1.0611572265625, 1.1347808837890625, 1.208404541015625, 1.2820281982421875, 1.35565185546875, 1.4292755126953125, 1.502899169921875, 1.5765228271484375, 1.650146484375, 1.7237701416015625, 1.797393798828125, 1.8710174560546875, 1.94464111328125, 2.0182647705078125, 2.091888427734375, 2.1655120849609375, 2.2391357421875, 2.3127593994140625, 2.386383056640625, 2.4600067138671875, 2.53363037109375, 2.6072540283203125, 2.680877685546875, 2.7545013427734375, 2.828125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 9.0, 3.0, 6.0, 6.0, 16.0, 11.0, 18.0, 15.0, 22.0, 24.0, 35.0, 32.0, 40.0, 45.0, 41.0, 57.0, 47.0, 58.0, 63.0, 47.0, 62.0, 48.0, 39.0, 40.0, 38.0, 35.0, 38.0, 16.0, 15.0, 13.0, 12.0, 10.0, 10.0, 11.0, 3.0, 1.0, 4.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.010624885559082, -8.702438354492188, -8.394251823425293, -8.086066246032715, -7.77787971496582, -7.469693183898926, -7.161506652832031, -6.853320121765137, -6.5451340675354, -6.236947536468506, -5.9287614822387695, -5.620574951171875, -5.3123884201049805, -5.004202365875244, -4.69601583480835, -4.387829780578613, -4.079643249511719, -3.7714569568634033, -3.463270664215088, -3.1550841331481934, -2.846897840499878, -2.5387115478515625, -2.230525016784668, -1.9223387241363525, -1.614152431488037, -1.3059661388397217, -0.9977797269821167, -0.6895933747291565, -0.3814070224761963, -0.07322072982788086, 0.23496568202972412, 0.5431520938873291, 0.8513393402099609, 1.1595256328582764, 1.4677120447158813, 1.7758984565734863, 2.0840847492218018, 2.392271041870117, 2.7004575729370117, 3.008643865585327, 3.3168301582336426, 3.625016450881958, 3.9332027435302734, 4.241389274597168, 4.5495758056640625, 4.857761859893799, 5.165948390960693, 5.47413444519043, 5.782320976257324, 6.090507507324219, 6.398693561553955, 6.70688009262085, 7.015066146850586, 7.3232526779174805, 7.631439208984375, 7.9396257400512695, 8.247812271118164, 8.555998802185059, 8.864185333251953, 9.172370910644531, 9.480557441711426, 9.78874397277832, 10.096930503845215, 10.40511703491211, 10.713302612304688]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 10.0, 9.0, 13.0, 9.0, 12.0, 25.0, 15.0, 14.0, 15.0, 29.0, 40.0, 29.0, 36.0, 29.0, 29.0, 44.0, 35.0, 45.0, 33.0, 37.0, 40.0, 39.0, 42.0, 42.0, 37.0, 33.0, 26.0, 24.0, 24.0, 29.0, 26.0, 24.0, 13.0, 17.0, 16.0, 17.0, 5.0, 2.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.665674209594727, -8.413859367370605, -8.162044525146484, -7.910229206085205, -7.658413887023926, -7.406599044799805, -7.154784202575684, -6.9029693603515625, -6.651154041290283, -6.399339199066162, -6.147523880004883, -5.895709037780762, -5.643894195556641, -5.392078876495361, -5.14026403427124, -4.888448715209961, -4.63663387298584, -4.384819030761719, -4.1330037117004395, -3.8811888694763184, -3.629373788833618, -3.377558708190918, -3.125743865966797, -2.8739287853240967, -2.6221137046813965, -2.3702986240386963, -2.118483543395996, -1.866668701171875, -1.6148536205291748, -1.3630385398864746, -1.111223578453064, -0.8594086170196533, -0.6075940132141113, -0.3557789921760559, -0.10396397113800049, 0.14785104990005493, 0.39966607093811035, 0.6514811515808105, 0.9032961130142212, 1.1551110744476318, 1.406926155090332, 1.6587412357330322, 1.9105561971664429, 2.1623711585998535, 2.4141862392425537, 2.666001319885254, 2.917816162109375, 3.169631242752075, 3.4214463233947754, 3.6732614040374756, 3.925076484680176, 4.176891326904297, 4.428706169128418, 4.680521488189697, 4.932336330413818, 5.184151649475098, 5.435966491699219, 5.68778133392334, 5.939596652984619, 6.19141149520874, 6.4432268142700195, 6.695041656494141, 6.946856498718262, 7.198671340942383, 7.450486660003662]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 9.0, 12.0, 18.0, 30.0, 39.0, 52.0, 73.0, 109.0, 176.0, 281.0, 443.0, 720.0, 1193.0, 1974.0, 3288.0, 5630.0, 9326.0, 15531.0, 26110.0, 42995.0, 67321.0, 101188.0, 135950.0, 154823.0, 147126.0, 117176.0, 82002.0, 53437.0, 32730.0, 19465.0, 11689.0, 6887.0, 4174.0, 2515.0, 1536.0, 922.0, 578.0, 351.0, 207.0, 166.0, 89.0, 63.0, 42.0, 30.0, 23.0, 12.0, 12.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-9.3515625, -9.0657958984375, -8.780029296875, -8.4942626953125, -8.20849609375, -7.9227294921875, -7.636962890625, -7.3511962890625, -7.0654296875, -6.7796630859375, -6.493896484375, -6.2081298828125, -5.92236328125, -5.6365966796875, -5.350830078125, -5.0650634765625, -4.779296875, -4.4935302734375, -4.207763671875, -3.9219970703125, -3.63623046875, -3.3504638671875, -3.064697265625, -2.7789306640625, -2.4931640625, -2.2073974609375, -1.921630859375, -1.6358642578125, -1.35009765625, -1.0643310546875, -0.778564453125, -0.4927978515625, -0.20703125, 0.0787353515625, 0.364501953125, 0.6502685546875, 0.93603515625, 1.2218017578125, 1.507568359375, 1.7933349609375, 2.0791015625, 2.3648681640625, 2.650634765625, 2.9364013671875, 3.22216796875, 3.5079345703125, 3.793701171875, 4.0794677734375, 4.365234375, 4.6510009765625, 4.936767578125, 5.2225341796875, 5.50830078125, 5.7940673828125, 6.079833984375, 6.3656005859375, 6.6513671875, 6.9371337890625, 7.222900390625, 7.5086669921875, 7.79443359375, 8.0802001953125, 8.365966796875, 8.6517333984375, 8.9375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 4.0, 8.0, 2.0, 10.0, 9.0, 9.0, 13.0, 14.0, 14.0, 18.0, 17.0, 18.0, 27.0, 30.0, 25.0, 35.0, 29.0, 33.0, 31.0, 31.0, 35.0, 38.0, 41.0, 36.0, 35.0, 35.0, 30.0, 29.0, 33.0, 21.0, 30.0, 25.0, 23.0, 35.0, 14.0, 20.0, 24.0, 12.0, 14.0, 22.0, 10.0, 15.0, 7.0, 6.0, 10.0, 4.0, 4.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.87890625, -6.653564453125, -6.42822265625, -6.202880859375, -5.9775390625, -5.752197265625, -5.52685546875, -5.301513671875, -5.076171875, -4.850830078125, -4.62548828125, -4.400146484375, -4.1748046875, -3.949462890625, -3.72412109375, -3.498779296875, -3.2734375, -3.048095703125, -2.82275390625, -2.597412109375, -2.3720703125, -2.146728515625, -1.92138671875, -1.696044921875, -1.470703125, -1.245361328125, -1.02001953125, -0.794677734375, -0.5693359375, -0.343994140625, -0.11865234375, 0.106689453125, 0.33203125, 0.557373046875, 0.78271484375, 1.008056640625, 1.2333984375, 1.458740234375, 1.68408203125, 1.909423828125, 2.134765625, 2.360107421875, 2.58544921875, 2.810791015625, 3.0361328125, 3.261474609375, 3.48681640625, 3.712158203125, 3.9375, 4.162841796875, 4.38818359375, 4.613525390625, 4.8388671875, 5.064208984375, 5.28955078125, 5.514892578125, 5.740234375, 5.965576171875, 6.19091796875, 6.416259765625, 6.6416015625, 6.866943359375, 7.09228515625, 7.317626953125, 7.54296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 8.0, 11.0, 22.0, 27.0, 33.0, 54.0, 91.0, 119.0, 214.0, 286.0, 446.0, 687.0, 1030.0, 1700.0, 2657.0, 3910.0, 5970.0, 9360.0, 14171.0, 21582.0, 32463.0, 47757.0, 68149.0, 91514.0, 113580.0, 127454.0, 125147.0, 108459.0, 83984.0, 61314.0, 42701.0, 28864.0, 19078.0, 12480.0, 8138.0, 5150.0, 3551.0, 2257.0, 1422.0, 968.0, 596.0, 374.0, 264.0, 170.0, 130.0, 75.0, 44.0, 35.0, 23.0, 16.0, 6.0, 4.0, 2.0, 7.0, 3.0, 1.0], "bins": [-7.15234375, -6.9410400390625, -6.729736328125, -6.5184326171875, -6.30712890625, -6.0958251953125, -5.884521484375, -5.6732177734375, -5.4619140625, -5.2506103515625, -5.039306640625, -4.8280029296875, -4.61669921875, -4.4053955078125, -4.194091796875, -3.9827880859375, -3.771484375, -3.5601806640625, -3.348876953125, -3.1375732421875, -2.92626953125, -2.7149658203125, -2.503662109375, -2.2923583984375, -2.0810546875, -1.8697509765625, -1.658447265625, -1.4471435546875, -1.23583984375, -1.0245361328125, -0.813232421875, -0.6019287109375, -0.390625, -0.1793212890625, 0.031982421875, 0.2432861328125, 0.45458984375, 0.6658935546875, 0.877197265625, 1.0885009765625, 1.2998046875, 1.5111083984375, 1.722412109375, 1.9337158203125, 2.14501953125, 2.3563232421875, 2.567626953125, 2.7789306640625, 2.990234375, 3.2015380859375, 3.412841796875, 3.6241455078125, 3.83544921875, 4.0467529296875, 4.258056640625, 4.4693603515625, 4.6806640625, 4.8919677734375, 5.103271484375, 5.3145751953125, 5.52587890625, 5.7371826171875, 5.948486328125, 6.1597900390625, 6.37109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 3.0, 10.0, 11.0, 17.0, 25.0, 24.0, 33.0, 26.0, 43.0, 35.0, 40.0, 28.0, 47.0, 41.0, 51.0, 44.0, 38.0, 48.0, 48.0, 38.0, 51.0, 32.0, 35.0, 39.0, 32.0, 31.0, 18.0, 19.0, 20.0, 14.0, 7.0, 8.0, 7.0, 2.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5546875, -5.36761474609375, -5.1805419921875, -4.99346923828125, -4.806396484375, -4.61932373046875, -4.4322509765625, -4.24517822265625, -4.05810546875, -3.87103271484375, -3.6839599609375, -3.49688720703125, -3.309814453125, -3.12274169921875, -2.9356689453125, -2.74859619140625, -2.5615234375, -2.37445068359375, -2.1873779296875, -2.00030517578125, -1.813232421875, -1.62615966796875, -1.4390869140625, -1.25201416015625, -1.06494140625, -0.87786865234375, -0.6907958984375, -0.50372314453125, -0.316650390625, -0.12957763671875, 0.0574951171875, 0.24456787109375, 0.431640625, 0.61871337890625, 0.8057861328125, 0.99285888671875, 1.179931640625, 1.36700439453125, 1.5540771484375, 1.74114990234375, 1.92822265625, 2.11529541015625, 2.3023681640625, 2.48944091796875, 2.676513671875, 2.86358642578125, 3.0506591796875, 3.23773193359375, 3.4248046875, 3.61187744140625, 3.7989501953125, 3.98602294921875, 4.173095703125, 4.36016845703125, 4.5472412109375, 4.73431396484375, 4.92138671875, 5.10845947265625, 5.2955322265625, 5.48260498046875, 5.669677734375, 5.85675048828125, 6.0438232421875, 6.23089599609375, 6.41796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 16.0, 20.0, 37.0, 44.0, 73.0, 101.0, 158.0, 257.0, 401.0, 602.0, 1000.0, 1670.0, 2692.0, 4770.0, 8815.0, 16704.0, 34548.0, 74534.0, 155945.0, 256776.0, 236743.0, 130563.0, 61501.0, 28654.0, 13913.0, 7541.0, 4065.0, 2393.0, 1515.0, 911.0, 559.0, 319.0, 252.0, 164.0, 90.0, 58.0, 42.0, 23.0, 18.0, 14.0, 5.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.27587890625, -7.9892578125, -7.70263671875, -7.416015625, -7.12939453125, -6.8427734375, -6.55615234375, -6.26953125, -5.98291015625, -5.6962890625, -5.40966796875, -5.123046875, -4.83642578125, -4.5498046875, -4.26318359375, -3.9765625, -3.68994140625, -3.4033203125, -3.11669921875, -2.830078125, -2.54345703125, -2.2568359375, -1.97021484375, -1.68359375, -1.39697265625, -1.1103515625, -0.82373046875, -0.537109375, -0.25048828125, 0.0361328125, 0.32275390625, 0.609375, 0.89599609375, 1.1826171875, 1.46923828125, 1.755859375, 2.04248046875, 2.3291015625, 2.61572265625, 2.90234375, 3.18896484375, 3.4755859375, 3.76220703125, 4.048828125, 4.33544921875, 4.6220703125, 4.90869140625, 5.1953125, 5.48193359375, 5.7685546875, 6.05517578125, 6.341796875, 6.62841796875, 6.9150390625, 7.20166015625, 7.48828125, 7.77490234375, 8.0615234375, 8.34814453125, 8.634765625, 8.92138671875, 9.2080078125, 9.49462890625, 9.78125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 17.0, 13.0, 19.0, 21.0, 33.0, 61.0, 68.0, 91.0, 102.0, 120.0, 95.0, 97.0, 57.0, 48.0, 40.0, 32.0, 18.0, 22.0, 10.0, 10.0, 8.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0012416839599609375, -0.0012094229459762573, -0.0011771619319915771, -0.001144900918006897, -0.0011126399040222168, -0.0010803788900375366, -0.0010481178760528564, -0.0010158568620681763, -0.000983595848083496, -0.0009513348340988159, -0.0009190738201141357, -0.0008868128061294556, -0.0008545517921447754, -0.0008222907781600952, -0.000790029764175415, -0.0007577687501907349, -0.0007255077362060547, -0.0006932467222213745, -0.0006609857082366943, -0.0006287246942520142, -0.000596463680267334, -0.0005642026662826538, -0.0005319416522979736, -0.0004996806383132935, -0.0004674196243286133, -0.0004351586103439331, -0.00040289759635925293, -0.00037063658237457275, -0.0003383755683898926, -0.0003061145544052124, -0.0002738535404205322, -0.00024159252643585205, -0.00020933151245117188, -0.0001770704984664917, -0.00014480948448181152, -0.00011254847049713135, -8.028745651245117e-05, -4.8026442527770996e-05, -1.576542854309082e-05, 1.6495585441589355e-05, 4.875659942626953e-05, 8.101761341094971e-05, 0.00011327862739562988, 0.00014553964138031006, 0.00017780065536499023, 0.0002100616693496704, 0.00024232268333435059, 0.00027458369731903076, 0.00030684471130371094, 0.0003391057252883911, 0.0003713667392730713, 0.00040362775325775146, 0.00043588876724243164, 0.0004681497812271118, 0.000500410795211792, 0.0005326718091964722, 0.0005649328231811523, 0.0005971938371658325, 0.0006294548511505127, 0.0006617158651351929, 0.000693976879119873, 0.0007262378931045532, 0.0007584989070892334, 0.0007907599210739136, 0.0008230209350585938]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 2.0, 12.0, 20.0, 13.0, 27.0, 39.0, 64.0, 57.0, 111.0, 189.0, 245.0, 391.0, 569.0, 1039.0, 1679.0, 2733.0, 4863.0, 8579.0, 15785.0, 30056.0, 58159.0, 108594.0, 176748.0, 215984.0, 180739.0, 112454.0, 60435.0, 31173.0, 16351.0, 8855.0, 5034.0, 2922.0, 1713.0, 1002.0, 666.0, 417.0, 266.0, 178.0, 119.0, 88.0, 63.0, 38.0, 22.0, 14.0, 13.0, 8.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.41015625, -6.2001953125, -5.990234375, -5.7802734375, -5.5703125, -5.3603515625, -5.150390625, -4.9404296875, -4.73046875, -4.5205078125, -4.310546875, -4.1005859375, -3.890625, -3.6806640625, -3.470703125, -3.2607421875, -3.05078125, -2.8408203125, -2.630859375, -2.4208984375, -2.2109375, -2.0009765625, -1.791015625, -1.5810546875, -1.37109375, -1.1611328125, -0.951171875, -0.7412109375, -0.53125, -0.3212890625, -0.111328125, 0.0986328125, 0.30859375, 0.5185546875, 0.728515625, 0.9384765625, 1.1484375, 1.3583984375, 1.568359375, 1.7783203125, 1.98828125, 2.1982421875, 2.408203125, 2.6181640625, 2.828125, 3.0380859375, 3.248046875, 3.4580078125, 3.66796875, 3.8779296875, 4.087890625, 4.2978515625, 4.5078125, 4.7177734375, 4.927734375, 5.1376953125, 5.34765625, 5.5576171875, 5.767578125, 5.9775390625, 6.1875, 6.3974609375, 6.607421875, 6.8173828125, 7.02734375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 11.0, 5.0, 11.0, 4.0, 15.0, 26.0, 22.0, 37.0, 45.0, 59.0, 64.0, 74.0, 76.0, 75.0, 84.0, 58.0, 63.0, 57.0, 44.0, 46.0, 26.0, 31.0, 12.0, 11.0, 8.0, 4.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.30859375, -3.215850830078125, -3.12310791015625, -3.030364990234375, -2.9376220703125, -2.844879150390625, -2.75213623046875, -2.659393310546875, -2.566650390625, -2.473907470703125, -2.38116455078125, -2.288421630859375, -2.1956787109375, -2.102935791015625, -2.01019287109375, -1.917449951171875, -1.82470703125, -1.731964111328125, -1.63922119140625, -1.546478271484375, -1.4537353515625, -1.360992431640625, -1.26824951171875, -1.175506591796875, -1.082763671875, -0.990020751953125, -0.89727783203125, -0.804534912109375, -0.7117919921875, -0.619049072265625, -0.52630615234375, -0.433563232421875, -0.3408203125, -0.248077392578125, -0.15533447265625, -0.062591552734375, 0.0301513671875, 0.122894287109375, 0.21563720703125, 0.308380126953125, 0.401123046875, 0.493865966796875, 0.58660888671875, 0.679351806640625, 0.7720947265625, 0.864837646484375, 0.95758056640625, 1.050323486328125, 1.14306640625, 1.235809326171875, 1.32855224609375, 1.421295166015625, 1.5140380859375, 1.606781005859375, 1.69952392578125, 1.792266845703125, 1.885009765625, 1.977752685546875, 2.07049560546875, 2.163238525390625, 2.2559814453125, 2.348724365234375, 2.44146728515625, 2.534210205078125, 2.626953125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 11.0, 10.0, 22.0, 23.0, 18.0, 29.0, 25.0, 32.0, 39.0, 43.0, 51.0, 49.0, 55.0, 59.0, 50.0, 65.0, 62.0, 53.0, 37.0, 38.0, 41.0, 45.0, 25.0, 28.0, 19.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 7.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.412333488464355, -8.092952728271484, -7.773571968078613, -7.454191207885742, -7.134810447692871, -6.8154296875, -6.496048450469971, -6.1766676902771, -5.8572869300842285, -5.537906169891357, -5.218525409698486, -4.899144649505615, -4.579763412475586, -4.260382652282715, -3.9410018920898438, -3.6216211318969727, -3.3022403717041016, -2.9828596115112305, -2.6634788513183594, -2.344097852706909, -2.024717092514038, -1.705336332321167, -1.3859554529190063, -1.0665745735168457, -0.7471938133239746, -0.42781299352645874, -0.10843217372894287, 0.210948646068573, 0.5303294658660889, 0.84971022605896, 1.1690911054611206, 1.4884719848632812, 1.8078536987304688, 2.12723445892334, 2.446615219116211, 2.765996217727661, 3.0853769779205322, 3.4047577381134033, 3.7241387367248535, 4.043519496917725, 4.362900257110596, 4.682281017303467, 5.001661777496338, 5.321042537689209, 5.640423774719238, 5.959804534912109, 6.2791852951049805, 6.598566055297852, 6.917946815490723, 7.237327575683594, 7.556708335876465, 7.876089096069336, 8.195469856262207, 8.514850616455078, 8.83423137664795, 9.15361213684082, 9.472993850708008, 9.792374610900879, 10.11175537109375, 10.431136131286621, 10.750516891479492, 11.069897651672363, 11.389278411865234, 11.708660125732422, 12.028039932250977]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 9.0, 15.0, 12.0, 18.0, 17.0, 14.0, 23.0, 24.0, 27.0, 29.0, 33.0, 28.0, 37.0, 31.0, 44.0, 37.0, 48.0, 46.0, 46.0, 44.0, 40.0, 41.0, 29.0, 26.0, 38.0, 35.0, 28.0, 22.0, 16.0, 21.0, 19.0, 18.0, 13.0, 14.0, 8.0, 9.0, 8.0, 7.0, 1.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.691641807556152, -9.422221183776855, -9.152799606323242, -8.883378982543945, -8.613957405090332, -8.344536781311035, -8.075115203857422, -7.805694580078125, -7.536273002624512, -7.266851902008057, -6.997430801391602, -6.7280097007751465, -6.458588600158691, -6.189167499542236, -5.919746398925781, -5.650325775146484, -5.380904674530029, -5.111483573913574, -4.842062473297119, -4.572641372680664, -4.303220272064209, -4.033799171447754, -3.764378309249878, -3.494957208633423, -3.2255361080169678, -2.9561150074005127, -2.6866939067840576, -2.4172730445861816, -2.1478519439697266, -1.878430724143982, -1.6090097427368164, -1.3395886421203613, -1.070167064666748, -0.800745964050293, -0.5313249230384827, -0.26190388202667236, 0.007517218589782715, 0.2769383192062378, 0.5463593006134033, 0.8157804012298584, 1.0852015018463135, 1.3546226024627686, 1.6240437030792236, 1.8934646844863892, 2.1628856658935547, 2.4323067665100098, 2.701727867126465, 2.97114896774292, 3.240570068359375, 3.50999116897583, 3.779412269592285, 4.04883337020874, 4.318254470825195, 4.58767557144165, 4.8570966720581055, 5.126517295837402, 5.395938873291016, 5.665359973907471, 5.934781074523926, 6.204202175140381, 6.473623275756836, 6.743044376373291, 7.012465476989746, 7.281886100769043, 7.551307201385498]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 6.0, 8.0, 9.0, 15.0, 33.0, 52.0, 63.0, 79.0, 131.0, 198.0, 262.0, 400.0, 555.0, 882.0, 1403.0, 2204.0, 3425.0, 5551.0, 9113.0, 15598.0, 26807.0, 49146.0, 94682.0, 197171.0, 430146.0, 815170.0, 1029720.0, 755643.0, 379749.0, 175733.0, 86202.0, 46235.0, 26099.0, 15258.0, 9420.0, 5809.0, 3765.0, 2476.0, 1637.0, 1087.0, 742.0, 500.0, 344.0, 231.0, 162.0, 123.0, 72.0, 61.0, 38.0, 31.0, 14.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0], "bins": [-8.734375, -8.47314453125, -8.2119140625, -7.95068359375, -7.689453125, -7.42822265625, -7.1669921875, -6.90576171875, -6.64453125, -6.38330078125, -6.1220703125, -5.86083984375, -5.599609375, -5.33837890625, -5.0771484375, -4.81591796875, -4.5546875, -4.29345703125, -4.0322265625, -3.77099609375, -3.509765625, -3.24853515625, -2.9873046875, -2.72607421875, -2.46484375, -2.20361328125, -1.9423828125, -1.68115234375, -1.419921875, -1.15869140625, -0.8974609375, -0.63623046875, -0.375, -0.11376953125, 0.1474609375, 0.40869140625, 0.669921875, 0.93115234375, 1.1923828125, 1.45361328125, 1.71484375, 1.97607421875, 2.2373046875, 2.49853515625, 2.759765625, 3.02099609375, 3.2822265625, 3.54345703125, 3.8046875, 4.06591796875, 4.3271484375, 4.58837890625, 4.849609375, 5.11083984375, 5.3720703125, 5.63330078125, 5.89453125, 6.15576171875, 6.4169921875, 6.67822265625, 6.939453125, 7.20068359375, 7.4619140625, 7.72314453125, 7.984375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 13.0, 9.0, 18.0, 15.0, 21.0, 11.0, 24.0, 31.0, 23.0, 34.0, 32.0, 31.0, 36.0, 36.0, 50.0, 43.0, 48.0, 49.0, 39.0, 34.0, 29.0, 37.0, 46.0, 24.0, 24.0, 32.0, 19.0, 27.0, 22.0, 19.0, 23.0, 11.0, 14.0, 10.0, 13.0, 10.0, 4.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.73876953125, -5.5556640625, -5.37255859375, -5.189453125, -5.00634765625, -4.8232421875, -4.64013671875, -4.45703125, -4.27392578125, -4.0908203125, -3.90771484375, -3.724609375, -3.54150390625, -3.3583984375, -3.17529296875, -2.9921875, -2.80908203125, -2.6259765625, -2.44287109375, -2.259765625, -2.07666015625, -1.8935546875, -1.71044921875, -1.52734375, -1.34423828125, -1.1611328125, -0.97802734375, -0.794921875, -0.61181640625, -0.4287109375, -0.24560546875, -0.0625, 0.12060546875, 0.3037109375, 0.48681640625, 0.669921875, 0.85302734375, 1.0361328125, 1.21923828125, 1.40234375, 1.58544921875, 1.7685546875, 1.95166015625, 2.134765625, 2.31787109375, 2.5009765625, 2.68408203125, 2.8671875, 3.05029296875, 3.2333984375, 3.41650390625, 3.599609375, 3.78271484375, 3.9658203125, 4.14892578125, 4.33203125, 4.51513671875, 4.6982421875, 4.88134765625, 5.064453125, 5.24755859375, 5.4306640625, 5.61376953125, 5.796875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 14.0, 15.0, 21.0, 33.0, 63.0, 82.0, 127.0, 185.0, 312.0, 511.0, 829.0, 1396.0, 2371.0, 3907.0, 6757.0, 11809.0, 20883.0, 38197.0, 72521.0, 141952.0, 290136.0, 587033.0, 997201.0, 947898.0, 531914.0, 262511.0, 129056.0, 65925.0, 34974.0, 19134.0, 10830.0, 6366.0, 3777.0, 2185.0, 1289.0, 790.0, 483.0, 303.0, 188.0, 125.0, 61.0, 41.0, 31.0, 20.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5234375, -8.2386474609375, -7.953857421875, -7.6690673828125, -7.38427734375, -7.0994873046875, -6.814697265625, -6.5299072265625, -6.2451171875, -5.9603271484375, -5.675537109375, -5.3907470703125, -5.10595703125, -4.8211669921875, -4.536376953125, -4.2515869140625, -3.966796875, -3.6820068359375, -3.397216796875, -3.1124267578125, -2.82763671875, -2.5428466796875, -2.258056640625, -1.9732666015625, -1.6884765625, -1.4036865234375, -1.118896484375, -0.8341064453125, -0.54931640625, -0.2645263671875, 0.020263671875, 0.3050537109375, 0.58984375, 0.8746337890625, 1.159423828125, 1.4442138671875, 1.72900390625, 2.0137939453125, 2.298583984375, 2.5833740234375, 2.8681640625, 3.1529541015625, 3.437744140625, 3.7225341796875, 4.00732421875, 4.2921142578125, 4.576904296875, 4.8616943359375, 5.146484375, 5.4312744140625, 5.716064453125, 6.0008544921875, 6.28564453125, 6.5704345703125, 6.855224609375, 7.1400146484375, 7.4248046875, 7.7095947265625, 7.994384765625, 8.2791748046875, 8.56396484375, 8.8487548828125, 9.133544921875, 9.4183349609375, 9.703125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 4.0, 11.0, 18.0, 18.0, 32.0, 38.0, 24.0, 41.0, 61.0, 82.0, 84.0, 123.0, 164.0, 165.0, 186.0, 241.0, 327.0, 291.0, 299.0, 310.0, 248.0, 247.0, 197.0, 170.0, 152.0, 96.0, 81.0, 82.0, 47.0, 57.0, 41.0, 18.0, 30.0, 21.0, 17.0, 12.0, 10.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.306640625, -3.20794677734375, -3.1092529296875, -3.01055908203125, -2.911865234375, -2.81317138671875, -2.7144775390625, -2.61578369140625, -2.51708984375, -2.41839599609375, -2.3197021484375, -2.22100830078125, -2.122314453125, -2.02362060546875, -1.9249267578125, -1.82623291015625, -1.7275390625, -1.62884521484375, -1.5301513671875, -1.43145751953125, -1.332763671875, -1.23406982421875, -1.1353759765625, -1.03668212890625, -0.93798828125, -0.83929443359375, -0.7406005859375, -0.64190673828125, -0.543212890625, -0.44451904296875, -0.3458251953125, -0.24713134765625, -0.1484375, -0.04974365234375, 0.0489501953125, 0.14764404296875, 0.246337890625, 0.34503173828125, 0.4437255859375, 0.54241943359375, 0.64111328125, 0.73980712890625, 0.8385009765625, 0.93719482421875, 1.035888671875, 1.13458251953125, 1.2332763671875, 1.33197021484375, 1.4306640625, 1.52935791015625, 1.6280517578125, 1.72674560546875, 1.825439453125, 1.92413330078125, 2.0228271484375, 2.12152099609375, 2.22021484375, 2.31890869140625, 2.4176025390625, 2.51629638671875, 2.614990234375, 2.71368408203125, 2.8123779296875, 2.91107177734375, 3.009765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 14.0, 20.0, 30.0, 21.0, 25.0, 46.0, 42.0, 65.0, 60.0, 48.0, 58.0, 49.0, 68.0, 49.0, 42.0, 46.0, 53.0, 45.0, 23.0, 32.0, 20.0, 18.0, 12.0, 17.0, 11.0, 6.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.733976364135742, -7.454599380493164, -7.175222873687744, -6.895845890045166, -6.616469383239746, -6.337092399597168, -6.05771541595459, -5.778338432312012, -5.498961925506592, -5.219584941864014, -4.940208435058594, -4.660831451416016, -4.3814544677734375, -4.102077960968018, -3.8227009773254395, -3.5433242321014404, -3.2639474868774414, -2.9845707416534424, -2.7051939964294434, -2.4258170127868652, -2.146440267562866, -1.8670635223388672, -1.5876866579055786, -1.30830979347229, -1.028933048248291, -0.7495562434196472, -0.4701794385910034, -0.19080263376235962, 0.08857417106628418, 0.3679509162902832, 0.6473277807235718, 0.9267046451568604, 1.2060813903808594, 1.4854581356048584, 1.764835000038147, 2.0442118644714355, 2.3235886096954346, 2.6029653549194336, 2.8823423385620117, 3.1617190837860107, 3.4410958290100098, 3.720472574234009, 3.999849319458008, 4.279226303100586, 4.558603286743164, 4.837979793548584, 5.117356777191162, 5.396733283996582, 5.67611026763916, 5.955487251281738, 6.234863758087158, 6.514240741729736, 6.793617248535156, 7.072994232177734, 7.3523712158203125, 7.631748199462891, 7.9111247062683105, 8.19050121307373, 8.469878196716309, 8.749255180358887, 9.028632164001465, 9.308008193969727, 9.587385177612305, 9.866762161254883, 10.146139144897461]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 9.0, 11.0, 8.0, 4.0, 11.0, 10.0, 16.0, 30.0, 21.0, 25.0, 26.0, 42.0, 31.0, 33.0, 30.0, 33.0, 41.0, 44.0, 50.0, 41.0, 24.0, 42.0, 40.0, 40.0, 39.0, 37.0, 36.0, 36.0, 27.0, 17.0, 20.0, 20.0, 14.0, 14.0, 19.0, 12.0, 6.0, 4.0, 9.0, 8.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.681656837463379, -7.452150821685791, -7.222645282745361, -6.993139266967773, -6.7636332511901855, -6.534127235412598, -6.304621696472168, -6.07511568069458, -5.845609664916992, -5.616103649139404, -5.386598110198975, -5.157092094421387, -4.927586078643799, -4.698080062866211, -4.468574523925781, -4.239068508148193, -4.0095624923706055, -3.7800567150115967, -3.550550699234009, -3.321044921875, -3.091538906097412, -2.8620331287384033, -2.6325273513793945, -2.4030213356018066, -2.173515796661377, -1.9440099000930786, -1.7145040035247803, -1.4849982261657715, -1.2554922103881836, -1.0259864330291748, -0.7964805364608765, -0.5669746398925781, -0.33746862411499023, -0.10796274244785309, 0.12154313921928406, 0.35104900598526, 0.5805549025535583, 0.8100607395172119, 1.0395666360855103, 1.2690725326538086, 1.498578429222107, 1.7280843257904053, 1.9575902223587036, 2.187096118927002, 2.4166018962860107, 2.6461076736450195, 2.8756136894226074, 3.1051197052001953, 3.334625482559204, 3.564131259918213, 3.793637275695801, 4.023143291473389, 4.252648830413818, 4.482154846191406, 4.711660861968994, 4.941166877746582, 5.170672416687012, 5.4001784324646, 5.629683971405029, 5.859189987182617, 6.088696002960205, 6.318202018737793, 6.547707557678223, 6.7772135734558105, 7.006719589233398]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 18.0, 13.0, 29.0, 27.0, 52.0, 72.0, 129.0, 201.0, 283.0, 435.0, 690.0, 1049.0, 1664.0, 2794.0, 4524.0, 7591.0, 12918.0, 22226.0, 38997.0, 66864.0, 109370.0, 163683.0, 191177.0, 160623.0, 108132.0, 64615.0, 37503.0, 21291.0, 12594.0, 7442.0, 4495.0, 2512.0, 1669.0, 1062.0, 626.0, 404.0, 273.0, 165.0, 108.0, 75.0, 46.0, 38.0, 23.0, 13.0, 11.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.4140625, -7.18572998046875, -6.9573974609375, -6.72906494140625, -6.500732421875, -6.27239990234375, -6.0440673828125, -5.81573486328125, -5.58740234375, -5.35906982421875, -5.1307373046875, -4.90240478515625, -4.674072265625, -4.44573974609375, -4.2174072265625, -3.98907470703125, -3.7607421875, -3.53240966796875, -3.3040771484375, -3.07574462890625, -2.847412109375, -2.61907958984375, -2.3907470703125, -2.16241455078125, -1.93408203125, -1.70574951171875, -1.4774169921875, -1.24908447265625, -1.020751953125, -0.79241943359375, -0.5640869140625, -0.33575439453125, -0.107421875, 0.12091064453125, 0.3492431640625, 0.57757568359375, 0.805908203125, 1.03424072265625, 1.2625732421875, 1.49090576171875, 1.71923828125, 1.94757080078125, 2.1759033203125, 2.40423583984375, 2.632568359375, 2.86090087890625, 3.0892333984375, 3.31756591796875, 3.5458984375, 3.77423095703125, 4.0025634765625, 4.23089599609375, 4.459228515625, 4.68756103515625, 4.9158935546875, 5.14422607421875, 5.37255859375, 5.60089111328125, 5.8292236328125, 6.05755615234375, 6.285888671875, 6.51422119140625, 6.7425537109375, 6.97088623046875, 7.19921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 5.0, 9.0, 10.0, 9.0, 13.0, 22.0, 24.0, 23.0, 16.0, 25.0, 32.0, 36.0, 48.0, 29.0, 29.0, 44.0, 49.0, 46.0, 52.0, 36.0, 49.0, 36.0, 41.0, 35.0, 35.0, 37.0, 25.0, 33.0, 16.0, 20.0, 18.0, 13.0, 17.0, 9.0, 10.0, 10.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.3011474609375, -7.059326171875, -6.8175048828125, -6.57568359375, -6.3338623046875, -6.092041015625, -5.8502197265625, -5.6083984375, -5.3665771484375, -5.124755859375, -4.8829345703125, -4.64111328125, -4.3992919921875, -4.157470703125, -3.9156494140625, -3.673828125, -3.4320068359375, -3.190185546875, -2.9483642578125, -2.70654296875, -2.4647216796875, -2.222900390625, -1.9810791015625, -1.7392578125, -1.4974365234375, -1.255615234375, -1.0137939453125, -0.77197265625, -0.5301513671875, -0.288330078125, -0.0465087890625, 0.1953125, 0.4371337890625, 0.678955078125, 0.9207763671875, 1.16259765625, 1.4044189453125, 1.646240234375, 1.8880615234375, 2.1298828125, 2.3717041015625, 2.613525390625, 2.8553466796875, 3.09716796875, 3.3389892578125, 3.580810546875, 3.8226318359375, 4.064453125, 4.3062744140625, 4.548095703125, 4.7899169921875, 5.03173828125, 5.2735595703125, 5.515380859375, 5.7572021484375, 5.9990234375, 6.2408447265625, 6.482666015625, 6.7244873046875, 6.96630859375, 7.2081298828125, 7.449951171875, 7.6917724609375, 7.93359375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 11.0, 8.0, 21.0, 26.0, 29.0, 48.0, 75.0, 91.0, 117.0, 160.0, 223.0, 352.0, 541.0, 825.0, 1310.0, 2185.0, 3876.0, 7299.0, 15025.0, 31988.0, 76720.0, 181123.0, 319365.0, 227762.0, 99179.0, 41130.0, 18485.0, 8989.0, 4715.0, 2483.0, 1489.0, 972.0, 591.0, 379.0, 242.0, 205.0, 123.0, 99.0, 79.0, 48.0, 55.0, 28.0, 24.0, 21.0, 7.0, 5.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0], "bins": [-13.859375, -13.4593505859375, -13.059326171875, -12.6593017578125, -12.25927734375, -11.8592529296875, -11.459228515625, -11.0592041015625, -10.6591796875, -10.2591552734375, -9.859130859375, -9.4591064453125, -9.05908203125, -8.6590576171875, -8.259033203125, -7.8590087890625, -7.458984375, -7.0589599609375, -6.658935546875, -6.2589111328125, -5.85888671875, -5.4588623046875, -5.058837890625, -4.6588134765625, -4.2587890625, -3.8587646484375, -3.458740234375, -3.0587158203125, -2.65869140625, -2.2586669921875, -1.858642578125, -1.4586181640625, -1.05859375, -0.6585693359375, -0.258544921875, 0.1414794921875, 0.54150390625, 0.9415283203125, 1.341552734375, 1.7415771484375, 2.1416015625, 2.5416259765625, 2.941650390625, 3.3416748046875, 3.74169921875, 4.1417236328125, 4.541748046875, 4.9417724609375, 5.341796875, 5.7418212890625, 6.141845703125, 6.5418701171875, 6.94189453125, 7.3419189453125, 7.741943359375, 8.1419677734375, 8.5419921875, 8.9420166015625, 9.342041015625, 9.7420654296875, 10.14208984375, 10.5421142578125, 10.942138671875, 11.3421630859375, 11.7421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 10.0, 13.0, 19.0, 28.0, 11.0, 19.0, 21.0, 30.0, 38.0, 34.0, 25.0, 40.0, 35.0, 46.0, 47.0, 41.0, 47.0, 39.0, 53.0, 41.0, 43.0, 40.0, 33.0, 39.0, 29.0, 33.0, 21.0, 22.0, 23.0, 12.0, 19.0, 6.0, 9.0, 5.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.712158203125, -4.54931640625, -4.386474609375, -4.2236328125, -4.060791015625, -3.89794921875, -3.735107421875, -3.572265625, -3.409423828125, -3.24658203125, -3.083740234375, -2.9208984375, -2.758056640625, -2.59521484375, -2.432373046875, -2.26953125, -2.106689453125, -1.94384765625, -1.781005859375, -1.6181640625, -1.455322265625, -1.29248046875, -1.129638671875, -0.966796875, -0.803955078125, -0.64111328125, -0.478271484375, -0.3154296875, -0.152587890625, 0.01025390625, 0.173095703125, 0.3359375, 0.498779296875, 0.66162109375, 0.824462890625, 0.9873046875, 1.150146484375, 1.31298828125, 1.475830078125, 1.638671875, 1.801513671875, 1.96435546875, 2.127197265625, 2.2900390625, 2.452880859375, 2.61572265625, 2.778564453125, 2.94140625, 3.104248046875, 3.26708984375, 3.429931640625, 3.5927734375, 3.755615234375, 3.91845703125, 4.081298828125, 4.244140625, 4.406982421875, 4.56982421875, 4.732666015625, 4.8955078125, 5.058349609375, 5.22119140625, 5.384033203125, 5.546875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 10.0, 5.0, 17.0, 20.0, 23.0, 27.0, 62.0, 85.0, 101.0, 180.0, 223.0, 384.0, 516.0, 856.0, 1306.0, 2155.0, 3672.0, 6552.0, 12387.0, 25074.0, 54565.0, 125007.0, 266034.0, 285703.0, 142542.0, 61476.0, 28270.0, 13755.0, 7170.0, 3959.0, 2379.0, 1396.0, 917.0, 567.0, 376.0, 250.0, 162.0, 106.0, 85.0, 59.0, 43.0, 25.0, 16.0, 11.0, 10.0, 6.0, 4.0, 9.0, 4.0, 0.0, 1.0], "bins": [-6.1015625, -5.93243408203125, -5.7633056640625, -5.59417724609375, -5.425048828125, -5.25592041015625, -5.0867919921875, -4.91766357421875, -4.74853515625, -4.57940673828125, -4.4102783203125, -4.24114990234375, -4.072021484375, -3.90289306640625, -3.7337646484375, -3.56463623046875, -3.3955078125, -3.22637939453125, -3.0572509765625, -2.88812255859375, -2.718994140625, -2.54986572265625, -2.3807373046875, -2.21160888671875, -2.04248046875, -1.87335205078125, -1.7042236328125, -1.53509521484375, -1.365966796875, -1.19683837890625, -1.0277099609375, -0.85858154296875, -0.689453125, -0.52032470703125, -0.3511962890625, -0.18206787109375, -0.012939453125, 0.15618896484375, 0.3253173828125, 0.49444580078125, 0.66357421875, 0.83270263671875, 1.0018310546875, 1.17095947265625, 1.340087890625, 1.50921630859375, 1.6783447265625, 1.84747314453125, 2.0166015625, 2.18572998046875, 2.3548583984375, 2.52398681640625, 2.693115234375, 2.86224365234375, 3.0313720703125, 3.20050048828125, 3.36962890625, 3.53875732421875, 3.7078857421875, 3.87701416015625, 4.046142578125, 4.21527099609375, 4.3843994140625, 4.55352783203125, 4.72265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 8.0, 15.0, 14.0, 23.0, 22.0, 40.0, 51.0, 69.0, 80.0, 105.0, 117.0, 105.0, 81.0, 71.0, 48.0, 48.0, 21.0, 14.0, 11.0, 14.0, 9.0, 5.0, 4.0, 13.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003571510314941406, -0.00034651532769203186, -0.0003358796238899231, -0.00032524392008781433, -0.00031460821628570557, -0.0003039725124835968, -0.00029333680868148804, -0.00028270110487937927, -0.0002720654010772705, -0.00026142969727516174, -0.000250793993473053, -0.00024015828967094421, -0.00022952258586883545, -0.00021888688206672668, -0.00020825117826461792, -0.00019761547446250916, -0.0001869797706604004, -0.00017634406685829163, -0.00016570836305618286, -0.0001550726592540741, -0.00014443695545196533, -0.00013380125164985657, -0.0001231655478477478, -0.00011252984404563904, -0.00010189414024353027, -9.125843644142151e-05, -8.062273263931274e-05, -6.998702883720398e-05, -5.9351325035095215e-05, -4.871562123298645e-05, -3.8079917430877686e-05, -2.744421362876892e-05, -1.6808509826660156e-05, -6.172806024551392e-06, 4.462897777557373e-06, 1.5098601579666138e-05, 2.5734305381774902e-05, 3.637000918388367e-05, 4.700571298599243e-05, 5.7641416788101196e-05, 6.827712059020996e-05, 7.891282439231873e-05, 8.954852819442749e-05, 0.00010018423199653625, 0.00011081993579864502, 0.00012145563960075378, 0.00013209134340286255, 0.0001427270472049713, 0.00015336275100708008, 0.00016399845480918884, 0.0001746341586112976, 0.00018526986241340637, 0.00019590556621551514, 0.0002065412700176239, 0.00021717697381973267, 0.00022781267762184143, 0.0002384483814239502, 0.00024908408522605896, 0.0002597197890281677, 0.0002703554928302765, 0.00028099119663238525, 0.000291626900434494, 0.0003022626042366028, 0.00031289830803871155, 0.0003235340118408203]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 14.0, 17.0, 21.0, 20.0, 36.0, 44.0, 47.0, 73.0, 98.0, 181.0, 243.0, 394.0, 573.0, 910.0, 1454.0, 2318.0, 3771.0, 6674.0, 12107.0, 23892.0, 48988.0, 103099.0, 197215.0, 258012.0, 190718.0, 99392.0, 47025.0, 22994.0, 11659.0, 6563.0, 3716.0, 2245.0, 1372.0, 886.0, 593.0, 361.0, 228.0, 186.0, 128.0, 76.0, 70.0, 40.0, 22.0, 28.0, 20.0, 7.0, 13.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-4.69140625, -4.54693603515625, -4.4024658203125, -4.25799560546875, -4.113525390625, -3.96905517578125, -3.8245849609375, -3.68011474609375, -3.53564453125, -3.39117431640625, -3.2467041015625, -3.10223388671875, -2.957763671875, -2.81329345703125, -2.6688232421875, -2.52435302734375, -2.3798828125, -2.23541259765625, -2.0909423828125, -1.94647216796875, -1.802001953125, -1.65753173828125, -1.5130615234375, -1.36859130859375, -1.22412109375, -1.07965087890625, -0.9351806640625, -0.79071044921875, -0.646240234375, -0.50177001953125, -0.3572998046875, -0.21282958984375, -0.068359375, 0.07611083984375, 0.2205810546875, 0.36505126953125, 0.509521484375, 0.65399169921875, 0.7984619140625, 0.94293212890625, 1.08740234375, 1.23187255859375, 1.3763427734375, 1.52081298828125, 1.665283203125, 1.80975341796875, 1.9542236328125, 2.09869384765625, 2.2431640625, 2.38763427734375, 2.5321044921875, 2.67657470703125, 2.821044921875, 2.96551513671875, 3.1099853515625, 3.25445556640625, 3.39892578125, 3.54339599609375, 3.6878662109375, 3.83233642578125, 3.976806640625, 4.12127685546875, 4.2657470703125, 4.41021728515625, 4.5546875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 4.0, 10.0, 10.0, 17.0, 19.0, 21.0, 36.0, 31.0, 45.0, 59.0, 63.0, 55.0, 85.0, 75.0, 66.0, 72.0, 66.0, 50.0, 41.0, 35.0, 22.0, 20.0, 22.0, 16.0, 9.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6279296875, -1.5830841064453125, -1.538238525390625, -1.4933929443359375, -1.44854736328125, -1.4037017822265625, -1.358856201171875, -1.3140106201171875, -1.2691650390625, -1.2243194580078125, -1.179473876953125, -1.1346282958984375, -1.08978271484375, -1.0449371337890625, -1.000091552734375, -0.9552459716796875, -0.910400390625, -0.8655548095703125, -0.820709228515625, -0.7758636474609375, -0.73101806640625, -0.6861724853515625, -0.641326904296875, -0.5964813232421875, -0.5516357421875, -0.5067901611328125, -0.461944580078125, -0.4170989990234375, -0.37225341796875, -0.3274078369140625, -0.282562255859375, -0.2377166748046875, -0.19287109375, -0.1480255126953125, -0.103179931640625, -0.0583343505859375, -0.01348876953125, 0.0313568115234375, 0.076202392578125, 0.1210479736328125, 0.1658935546875, 0.2107391357421875, 0.255584716796875, 0.3004302978515625, 0.34527587890625, 0.3901214599609375, 0.434967041015625, 0.4798126220703125, 0.524658203125, 0.5695037841796875, 0.614349365234375, 0.6591949462890625, 0.70404052734375, 0.7488861083984375, 0.793731689453125, 0.8385772705078125, 0.8834228515625, 0.9282684326171875, 0.973114013671875, 1.0179595947265625, 1.06280517578125, 1.1076507568359375, 1.152496337890625, 1.1973419189453125, 1.2421875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 5.0, 8.0, 14.0, 7.0, 10.0, 17.0, 11.0, 19.0, 30.0, 22.0, 42.0, 43.0, 45.0, 59.0, 58.0, 65.0, 52.0, 65.0, 41.0, 50.0, 55.0, 38.0, 32.0, 34.0, 34.0, 31.0, 24.0, 14.0, 12.0, 12.0, 8.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.885694980621338, -6.6188063621521, -6.351917743682861, -6.085029125213623, -5.818140506744385, -5.5512518882751465, -5.284363746643066, -5.017475128173828, -4.75058650970459, -4.483697891235352, -4.216809272766113, -3.949920654296875, -3.6830320358276367, -3.4161434173583984, -3.1492550373077393, -2.882366418838501, -2.6154775619506836, -2.3485889434814453, -2.081700325012207, -1.8148118257522583, -1.54792320728302, -1.2810345888137817, -1.014146089553833, -0.7472574710845947, -0.48036885261535645, -0.21348026394844055, 0.05340832471847534, 0.32029688358306885, 0.5871855020523071, 0.8540741205215454, 1.1209626197814941, 1.3878512382507324, 1.654740333557129, 1.9216289520263672, 2.1885175704956055, 2.4554061889648438, 2.722294807434082, 2.9891834259033203, 3.2560718059539795, 3.5229604244232178, 3.789849042892456, 4.056737422943115, 4.3236260414123535, 4.590514659881592, 4.85740327835083, 5.124291896820068, 5.391180515289307, 5.658069133758545, 5.924957752227783, 6.1918463706970215, 6.45873498916626, 6.725623607635498, 6.992512226104736, 7.259400844573975, 7.526288986206055, 7.793177604675293, 8.060066223144531, 8.32695484161377, 8.593843460083008, 8.860732078552246, 9.127620697021484, 9.394509315490723, 9.661397933959961, 9.9282865524292, 10.195175170898438]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 8.0, 7.0, 8.0, 10.0, 11.0, 10.0, 12.0, 26.0, 24.0, 23.0, 16.0, 33.0, 32.0, 38.0, 38.0, 24.0, 45.0, 32.0, 42.0, 43.0, 34.0, 37.0, 36.0, 39.0, 36.0, 35.0, 33.0, 42.0, 29.0, 26.0, 20.0, 22.0, 12.0, 15.0, 25.0, 16.0, 7.0, 9.0, 10.0, 5.0, 4.0, 4.0, 6.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.1655449867248535, -6.950623989105225, -6.735702991485596, -6.520781993865967, -6.305860996246338, -6.090939998626709, -5.876018524169922, -5.661097526550293, -5.446176528930664, -5.231255531311035, -5.016334533691406, -4.801413536071777, -4.586492538452148, -4.3715715408325195, -4.156650543212891, -3.9417293071746826, -3.726808547973633, -3.511887550354004, -3.296966552734375, -3.082045555114746, -2.867124557495117, -2.6522035598754883, -2.4372823238372803, -2.2223613262176514, -2.0074403285980225, -1.7925193309783936, -1.5775983333587646, -1.3626772165298462, -1.1477562189102173, -0.9328352212905884, -0.7179141044616699, -0.502993106842041, -0.2880721092224121, -0.07315108180046082, 0.14176994562149048, 0.35669100284576416, 0.5716120004653931, 0.786532998085022, 1.0014541149139404, 1.2163751125335693, 1.4312961101531982, 1.6462171077728271, 1.861138105392456, 2.076059341430664, 2.290980339050293, 2.505901336669922, 2.720822334289551, 2.9357433319091797, 3.1506643295288086, 3.3655853271484375, 3.5805063247680664, 3.7954273223876953, 4.010348320007324, 4.225269317626953, 4.440190315246582, 4.655111312866211, 4.87003231048584, 5.084953308105469, 5.299874305725098, 5.514795303344727, 5.7297163009643555, 5.944637298583984, 6.159558296203613, 6.374479293823242, 6.589400768280029]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 13.0, 14.0, 20.0, 59.0, 81.0, 148.0, 213.0, 382.0, 601.0, 992.0, 1608.0, 2738.0, 4449.0, 7430.0, 12477.0, 20704.0, 33686.0, 55469.0, 87031.0, 124376.0, 156408.0, 159675.0, 131610.0, 93800.0, 60237.0, 37511.0, 22523.0, 13613.0, 8193.0, 5009.0, 2962.0, 1787.0, 1073.0, 646.0, 378.0, 243.0, 168.0, 85.0, 59.0, 32.0, 11.0, 17.0, 1.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.52569580078125, -6.3013916015625, -6.07708740234375, -5.852783203125, -5.62847900390625, -5.4041748046875, -5.17987060546875, -4.95556640625, -4.73126220703125, -4.5069580078125, -4.28265380859375, -4.058349609375, -3.83404541015625, -3.6097412109375, -3.38543701171875, -3.1611328125, -2.93682861328125, -2.7125244140625, -2.48822021484375, -2.263916015625, -2.03961181640625, -1.8153076171875, -1.59100341796875, -1.36669921875, -1.14239501953125, -0.9180908203125, -0.69378662109375, -0.469482421875, -0.24517822265625, -0.0208740234375, 0.20343017578125, 0.427734375, 0.65203857421875, 0.8763427734375, 1.10064697265625, 1.324951171875, 1.54925537109375, 1.7735595703125, 1.99786376953125, 2.22216796875, 2.44647216796875, 2.6707763671875, 2.89508056640625, 3.119384765625, 3.34368896484375, 3.5679931640625, 3.79229736328125, 4.0166015625, 4.24090576171875, 4.4652099609375, 4.68951416015625, 4.913818359375, 5.13812255859375, 5.3624267578125, 5.58673095703125, 5.81103515625, 6.03533935546875, 6.2596435546875, 6.48394775390625, 6.708251953125, 6.93255615234375, 7.1568603515625, 7.38116455078125, 7.60546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 8.0, 4.0, 9.0, 14.0, 18.0, 12.0, 16.0, 15.0, 31.0, 26.0, 22.0, 33.0, 32.0, 28.0, 53.0, 34.0, 36.0, 48.0, 39.0, 42.0, 42.0, 28.0, 42.0, 23.0, 42.0, 33.0, 35.0, 27.0, 33.0, 21.0, 20.0, 21.0, 18.0, 14.0, 11.0, 15.0, 13.0, 8.0, 5.0, 2.0, 4.0, 4.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-7.30859375, -7.09014892578125, -6.8717041015625, -6.65325927734375, -6.434814453125, -6.21636962890625, -5.9979248046875, -5.77947998046875, -5.56103515625, -5.34259033203125, -5.1241455078125, -4.90570068359375, -4.687255859375, -4.46881103515625, -4.2503662109375, -4.03192138671875, -3.8134765625, -3.59503173828125, -3.3765869140625, -3.15814208984375, -2.939697265625, -2.72125244140625, -2.5028076171875, -2.28436279296875, -2.06591796875, -1.84747314453125, -1.6290283203125, -1.41058349609375, -1.192138671875, -0.97369384765625, -0.7552490234375, -0.53680419921875, -0.318359375, -0.09991455078125, 0.1185302734375, 0.33697509765625, 0.555419921875, 0.77386474609375, 0.9923095703125, 1.21075439453125, 1.42919921875, 1.64764404296875, 1.8660888671875, 2.08453369140625, 2.302978515625, 2.52142333984375, 2.7398681640625, 2.95831298828125, 3.1767578125, 3.39520263671875, 3.6136474609375, 3.83209228515625, 4.050537109375, 4.26898193359375, 4.4874267578125, 4.70587158203125, 4.92431640625, 5.14276123046875, 5.3612060546875, 5.57965087890625, 5.798095703125, 6.01654052734375, 6.2349853515625, 6.45343017578125, 6.671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 5.0, 11.0, 11.0, 20.0, 30.0, 52.0, 65.0, 90.0, 110.0, 206.0, 282.0, 432.0, 656.0, 932.0, 1437.0, 2200.0, 3302.0, 5184.0, 7866.0, 12227.0, 19250.0, 29949.0, 46050.0, 68624.0, 98431.0, 128239.0, 145103.0, 136508.0, 109619.0, 79156.0, 53735.0, 35082.0, 22505.0, 14467.0, 9318.0, 5921.0, 3951.0, 2463.0, 1700.0, 1086.0, 735.0, 479.0, 341.0, 248.0, 167.0, 100.0, 85.0, 40.0, 24.0, 18.0, 11.0, 14.0, 10.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328125, -5.14862060546875, -4.9691162109375, -4.78961181640625, -4.610107421875, -4.43060302734375, -4.2510986328125, -4.07159423828125, -3.89208984375, -3.71258544921875, -3.5330810546875, -3.35357666015625, -3.174072265625, -2.99456787109375, -2.8150634765625, -2.63555908203125, -2.4560546875, -2.27655029296875, -2.0970458984375, -1.91754150390625, -1.738037109375, -1.55853271484375, -1.3790283203125, -1.19952392578125, -1.02001953125, -0.84051513671875, -0.6610107421875, -0.48150634765625, -0.302001953125, -0.12249755859375, 0.0570068359375, 0.23651123046875, 0.416015625, 0.59552001953125, 0.7750244140625, 0.95452880859375, 1.134033203125, 1.31353759765625, 1.4930419921875, 1.67254638671875, 1.85205078125, 2.03155517578125, 2.2110595703125, 2.39056396484375, 2.570068359375, 2.74957275390625, 2.9290771484375, 3.10858154296875, 3.2880859375, 3.46759033203125, 3.6470947265625, 3.82659912109375, 4.006103515625, 4.18560791015625, 4.3651123046875, 4.54461669921875, 4.72412109375, 4.90362548828125, 5.0831298828125, 5.26263427734375, 5.442138671875, 5.62164306640625, 5.8011474609375, 5.98065185546875, 6.16015625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 8.0, 8.0, 6.0, 10.0, 7.0, 12.0, 18.0, 18.0, 19.0, 17.0, 26.0, 29.0, 41.0, 34.0, 31.0, 35.0, 36.0, 42.0, 39.0, 41.0, 36.0, 51.0, 34.0, 36.0, 35.0, 43.0, 33.0, 30.0, 24.0, 38.0, 19.0, 17.0, 25.0, 17.0, 14.0, 15.0, 12.0, 11.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.3323974609375, -4.192138671875, -4.0518798828125, -3.91162109375, -3.7713623046875, -3.631103515625, -3.4908447265625, -3.3505859375, -3.2103271484375, -3.070068359375, -2.9298095703125, -2.78955078125, -2.6492919921875, -2.509033203125, -2.3687744140625, -2.228515625, -2.0882568359375, -1.947998046875, -1.8077392578125, -1.66748046875, -1.5272216796875, -1.386962890625, -1.2467041015625, -1.1064453125, -0.9661865234375, -0.825927734375, -0.6856689453125, -0.54541015625, -0.4051513671875, -0.264892578125, -0.1246337890625, 0.015625, 0.1558837890625, 0.296142578125, 0.4364013671875, 0.57666015625, 0.7169189453125, 0.857177734375, 0.9974365234375, 1.1376953125, 1.2779541015625, 1.418212890625, 1.5584716796875, 1.69873046875, 1.8389892578125, 1.979248046875, 2.1195068359375, 2.259765625, 2.4000244140625, 2.540283203125, 2.6805419921875, 2.82080078125, 2.9610595703125, 3.101318359375, 3.2415771484375, 3.3818359375, 3.5220947265625, 3.662353515625, 3.8026123046875, 3.94287109375, 4.0831298828125, 4.223388671875, 4.3636474609375, 4.50390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 10.0, 12.0, 18.0, 28.0, 28.0, 39.0, 65.0, 79.0, 110.0, 161.0, 235.0, 338.0, 537.0, 653.0, 973.0, 1398.0, 2070.0, 3149.0, 4784.0, 7725.0, 12581.0, 21090.0, 36836.0, 64199.0, 110624.0, 169812.0, 200953.0, 161962.0, 102158.0, 59540.0, 33901.0, 19669.0, 11783.0, 7211.0, 4509.0, 2941.0, 1916.0, 1345.0, 917.0, 644.0, 442.0, 313.0, 217.0, 165.0, 113.0, 74.0, 61.0, 45.0, 42.0, 16.0, 22.0, 19.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0], "bins": [-4.87890625, -4.72845458984375, -4.5780029296875, -4.42755126953125, -4.277099609375, -4.12664794921875, -3.9761962890625, -3.82574462890625, -3.67529296875, -3.52484130859375, -3.3743896484375, -3.22393798828125, -3.073486328125, -2.92303466796875, -2.7725830078125, -2.62213134765625, -2.4716796875, -2.32122802734375, -2.1707763671875, -2.02032470703125, -1.869873046875, -1.71942138671875, -1.5689697265625, -1.41851806640625, -1.26806640625, -1.11761474609375, -0.9671630859375, -0.81671142578125, -0.666259765625, -0.51580810546875, -0.3653564453125, -0.21490478515625, -0.064453125, 0.08599853515625, 0.2364501953125, 0.38690185546875, 0.537353515625, 0.68780517578125, 0.8382568359375, 0.98870849609375, 1.13916015625, 1.28961181640625, 1.4400634765625, 1.59051513671875, 1.740966796875, 1.89141845703125, 2.0418701171875, 2.19232177734375, 2.3427734375, 2.49322509765625, 2.6436767578125, 2.79412841796875, 2.944580078125, 3.09503173828125, 3.2454833984375, 3.39593505859375, 3.54638671875, 3.69683837890625, 3.8472900390625, 3.99774169921875, 4.148193359375, 4.29864501953125, 4.4490966796875, 4.59954833984375, 4.75]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 8.0, 13.0, 15.0, 18.0, 18.0, 22.0, 23.0, 35.0, 25.0, 37.0, 43.0, 47.0, 57.0, 58.0, 68.0, 64.0, 54.0, 53.0, 50.0, 37.0, 36.0, 28.0, 25.0, 21.0, 23.0, 23.0, 9.0, 7.0, 10.0, 8.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003960132598876953, -0.0003835149109363556, -0.00037101656198501587, -0.00035851821303367615, -0.0003460198640823364, -0.0003335215151309967, -0.000321023166179657, -0.00030852481722831726, -0.00029602646827697754, -0.0002835281193256378, -0.0002710297703742981, -0.0002585314214229584, -0.00024603307247161865, -0.00023353472352027893, -0.0002210363745689392, -0.0002085380256175995, -0.00019603967666625977, -0.00018354132771492004, -0.00017104297876358032, -0.0001585446298122406, -0.00014604628086090088, -0.00013354793190956116, -0.00012104958295822144, -0.00010855123400688171, -9.605288505554199e-05, -8.355453610420227e-05, -7.105618715286255e-05, -5.855783820152283e-05, -4.6059489250183105e-05, -3.3561140298843384e-05, -2.1062791347503662e-05, -8.56444239616394e-06, 3.933906555175781e-06, 1.6432255506515503e-05, 2.8930604457855225e-05, 4.1428953409194946e-05, 5.392730236053467e-05, 6.642565131187439e-05, 7.892400026321411e-05, 9.142234921455383e-05, 0.00010392069816589355, 0.00011641904711723328, 0.000128917396068573, 0.00014141574501991272, 0.00015391409397125244, 0.00016641244292259216, 0.00017891079187393188, 0.0001914091408252716, 0.00020390748977661133, 0.00021640583872795105, 0.00022890418767929077, 0.0002414025366306305, 0.0002539008855819702, 0.00026639923453330994, 0.00027889758348464966, 0.0002913959324359894, 0.0003038942813873291, 0.0003163926303386688, 0.00032889097929000854, 0.00034138932824134827, 0.000353887677192688, 0.0003663860261440277, 0.00037888437509536743, 0.00039138272404670715, 0.0004038810729980469]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 9.0, 14.0, 9.0, 16.0, 27.0, 52.0, 49.0, 109.0, 162.0, 247.0, 416.0, 613.0, 959.0, 1587.0, 2757.0, 4683.0, 8157.0, 14526.0, 26184.0, 47364.0, 83781.0, 136577.0, 186301.0, 189288.0, 142305.0, 88481.0, 50250.0, 27656.0, 15152.0, 8515.0, 4955.0, 2844.0, 1674.0, 1064.0, 619.0, 387.0, 245.0, 161.0, 117.0, 69.0, 52.0, 41.0, 28.0, 21.0, 13.0, 12.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.7734375, -4.63323974609375, -4.4930419921875, -4.35284423828125, -4.212646484375, -4.07244873046875, -3.9322509765625, -3.79205322265625, -3.65185546875, -3.51165771484375, -3.3714599609375, -3.23126220703125, -3.091064453125, -2.95086669921875, -2.8106689453125, -2.67047119140625, -2.5302734375, -2.39007568359375, -2.2498779296875, -2.10968017578125, -1.969482421875, -1.82928466796875, -1.6890869140625, -1.54888916015625, -1.40869140625, -1.26849365234375, -1.1282958984375, -0.98809814453125, -0.847900390625, -0.70770263671875, -0.5675048828125, -0.42730712890625, -0.287109375, -0.14691162109375, -0.0067138671875, 0.13348388671875, 0.273681640625, 0.41387939453125, 0.5540771484375, 0.69427490234375, 0.83447265625, 0.97467041015625, 1.1148681640625, 1.25506591796875, 1.395263671875, 1.53546142578125, 1.6756591796875, 1.81585693359375, 1.9560546875, 2.09625244140625, 2.2364501953125, 2.37664794921875, 2.516845703125, 2.65704345703125, 2.7972412109375, 2.93743896484375, 3.07763671875, 3.21783447265625, 3.3580322265625, 3.49822998046875, 3.638427734375, 3.77862548828125, 3.9188232421875, 4.05902099609375, 4.19921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 5.0, 9.0, 9.0, 18.0, 23.0, 22.0, 27.0, 18.0, 27.0, 31.0, 34.0, 37.0, 48.0, 49.0, 69.0, 59.0, 63.0, 53.0, 47.0, 49.0, 38.0, 39.0, 37.0, 28.0, 21.0, 24.0, 21.0, 12.0, 14.0, 10.0, 8.0, 8.0, 7.0, 4.0, 3.0, 9.0, 1.0, 0.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.380859375, -1.335662841796875, -1.29046630859375, -1.245269775390625, -1.2000732421875, -1.154876708984375, -1.10968017578125, -1.064483642578125, -1.019287109375, -0.974090576171875, -0.92889404296875, -0.883697509765625, -0.8385009765625, -0.793304443359375, -0.74810791015625, -0.702911376953125, -0.65771484375, -0.612518310546875, -0.56732177734375, -0.522125244140625, -0.4769287109375, -0.431732177734375, -0.38653564453125, -0.341339111328125, -0.296142578125, -0.250946044921875, -0.20574951171875, -0.160552978515625, -0.1153564453125, -0.070159912109375, -0.02496337890625, 0.020233154296875, 0.0654296875, 0.110626220703125, 0.15582275390625, 0.201019287109375, 0.2462158203125, 0.291412353515625, 0.33660888671875, 0.381805419921875, 0.427001953125, 0.472198486328125, 0.51739501953125, 0.562591552734375, 0.6077880859375, 0.652984619140625, 0.69818115234375, 0.743377685546875, 0.78857421875, 0.833770751953125, 0.87896728515625, 0.924163818359375, 0.9693603515625, 1.014556884765625, 1.05975341796875, 1.104949951171875, 1.150146484375, 1.195343017578125, 1.24053955078125, 1.285736083984375, 1.3309326171875, 1.376129150390625, 1.42132568359375, 1.466522216796875, 1.51171875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 8.0, 7.0, 16.0, 12.0, 19.0, 23.0, 22.0, 33.0, 39.0, 37.0, 51.0, 57.0, 64.0, 62.0, 68.0, 74.0, 50.0, 43.0, 46.0, 43.0, 38.0, 34.0, 22.0, 33.0, 18.0, 15.0, 18.0, 8.0, 5.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26020622253418, -5.975907325744629, -5.691608428955078, -5.407309532165527, -5.123010158538818, -4.838711261749268, -4.554412364959717, -4.270113468170166, -3.985814332962036, -3.7015154361724854, -3.4172163009643555, -3.1329174041748047, -2.848618507385254, -2.564319372177124, -2.2800204753875732, -1.995721459388733, -1.7114224433898926, -1.4271234273910522, -1.142824411392212, -0.8585255146026611, -0.5742264986038208, -0.28992748260498047, -0.0056285858154296875, 0.27867043018341064, 0.562969446182251, 0.8472684621810913, 1.1315674781799316, 1.4158663749694824, 1.7001653909683228, 1.984464406967163, 2.268763303756714, 2.5530624389648438, 2.8373613357543945, 3.1216602325439453, 3.405959367752075, 3.690258264541626, 3.974557399749756, 4.258856296539307, 4.543155193328857, 4.827454090118408, 5.111753463745117, 5.396052360534668, 5.680351257324219, 5.9646501541137695, 6.2489495277404785, 6.533248424530029, 6.81754732131958, 7.101846218109131, 7.386145114898682, 7.670444011688232, 7.954742908477783, 8.239042282104492, 8.523341178894043, 8.807640075683594, 9.091938972473145, 9.376237869262695, 9.660536766052246, 9.944835662841797, 10.229134559631348, 10.513433456420898, 10.79773235321045, 11.08203125, 11.366331100463867, 11.650629997253418, 11.934928894042969]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 13.0, 13.0, 14.0, 17.0, 21.0, 15.0, 24.0, 32.0, 33.0, 18.0, 30.0, 32.0, 27.0, 41.0, 45.0, 47.0, 43.0, 40.0, 46.0, 36.0, 51.0, 30.0, 23.0, 37.0, 29.0, 30.0, 25.0, 21.0, 24.0, 25.0, 14.0, 14.0, 10.0, 8.0, 7.0, 10.0, 7.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.785921096801758, -6.569186687469482, -6.352452754974365, -6.13571834564209, -5.918984413146973, -5.702250003814697, -5.485515594482422, -5.268781661987305, -5.052047252655029, -4.835312843322754, -4.618578910827637, -4.401844501495361, -4.185110092163086, -3.9683761596679688, -3.7516417503356934, -3.534907579421997, -3.318173408508301, -3.1014392375946045, -2.884705066680908, -2.667970657348633, -2.4512364864349365, -2.2345023155212402, -2.017767906188965, -1.8010337352752686, -1.5842995643615723, -1.367565393447876, -1.1508311033248901, -0.9340968728065491, -0.717362642288208, -0.5006284713745117, -0.2838941812515259, -0.06715989112854004, 0.14957427978515625, 0.3663085103034973, 0.5830427408218384, 0.7997769713401794, 1.0165112018585205, 1.2332453727722168, 1.4499796628952026, 1.6667139530181885, 1.8834481239318848, 2.100182294845581, 2.3169164657592773, 2.5336508750915527, 2.750385046005249, 2.9671192169189453, 3.1838536262512207, 3.400587797164917, 3.6173219680786133, 3.8340561389923096, 4.050790309906006, 4.267524719238281, 4.484258651733398, 4.700993061065674, 4.917727470397949, 5.134461402893066, 5.351195812225342, 5.567930221557617, 5.784664154052734, 6.00139856338501, 6.218132972717285, 6.434866905212402, 6.651601314544678, 6.868335723876953, 7.08506965637207]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 7.0, 9.0, 9.0, 15.0, 26.0, 53.0, 59.0, 127.0, 175.0, 316.0, 533.0, 1062.0, 1954.0, 3741.0, 7660.0, 16261.0, 37905.0, 96872.0, 290774.0, 920702.0, 1561171.0, 840570.0, 258946.0, 88447.0, 35426.0, 15913.0, 7497.0, 3824.0, 1929.0, 1033.0, 537.0, 318.0, 160.0, 111.0, 60.0, 26.0, 18.0, 11.0, 10.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.46875, -13.1185302734375, -12.768310546875, -12.4180908203125, -12.06787109375, -11.7176513671875, -11.367431640625, -11.0172119140625, -10.6669921875, -10.3167724609375, -9.966552734375, -9.6163330078125, -9.26611328125, -8.9158935546875, -8.565673828125, -8.2154541015625, -7.865234375, -7.5150146484375, -7.164794921875, -6.8145751953125, -6.46435546875, -6.1141357421875, -5.763916015625, -5.4136962890625, -5.0634765625, -4.7132568359375, -4.363037109375, -4.0128173828125, -3.66259765625, -3.3123779296875, -2.962158203125, -2.6119384765625, -2.26171875, -1.9114990234375, -1.561279296875, -1.2110595703125, -0.86083984375, -0.5106201171875, -0.160400390625, 0.1898193359375, 0.5400390625, 0.8902587890625, 1.240478515625, 1.5906982421875, 1.94091796875, 2.2911376953125, 2.641357421875, 2.9915771484375, 3.341796875, 3.6920166015625, 4.042236328125, 4.3924560546875, 4.74267578125, 5.0928955078125, 5.443115234375, 5.7933349609375, 6.1435546875, 6.4937744140625, 6.843994140625, 7.1942138671875, 7.54443359375, 7.8946533203125, 8.244873046875, 8.5950927734375, 8.9453125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 19.0, 22.0, 28.0, 27.0, 25.0, 40.0, 31.0, 33.0, 42.0, 37.0, 45.0, 52.0, 50.0, 47.0, 34.0, 55.0, 38.0, 39.0, 29.0, 29.0, 44.0, 27.0, 27.0, 24.0, 20.0, 14.0, 17.0, 13.0, 10.0, 7.0, 4.0, 6.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.6796875, -5.51416015625, -5.3486328125, -5.18310546875, -5.017578125, -4.85205078125, -4.6865234375, -4.52099609375, -4.35546875, -4.18994140625, -4.0244140625, -3.85888671875, -3.693359375, -3.52783203125, -3.3623046875, -3.19677734375, -3.03125, -2.86572265625, -2.7001953125, -2.53466796875, -2.369140625, -2.20361328125, -2.0380859375, -1.87255859375, -1.70703125, -1.54150390625, -1.3759765625, -1.21044921875, -1.044921875, -0.87939453125, -0.7138671875, -0.54833984375, -0.3828125, -0.21728515625, -0.0517578125, 0.11376953125, 0.279296875, 0.44482421875, 0.6103515625, 0.77587890625, 0.94140625, 1.10693359375, 1.2724609375, 1.43798828125, 1.603515625, 1.76904296875, 1.9345703125, 2.10009765625, 2.265625, 2.43115234375, 2.5966796875, 2.76220703125, 2.927734375, 3.09326171875, 3.2587890625, 3.42431640625, 3.58984375, 3.75537109375, 3.9208984375, 4.08642578125, 4.251953125, 4.41748046875, 4.5830078125, 4.74853515625, 4.9140625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 6.0, 13.0, 19.0, 21.0, 47.0, 44.0, 97.0, 130.0, 199.0, 269.0, 392.0, 556.0, 905.0, 1334.0, 2121.0, 3252.0, 5131.0, 8299.0, 13392.0, 21868.0, 36958.0, 64008.0, 114200.0, 211567.0, 395823.0, 698741.0, 928098.0, 738724.0, 426639.0, 228475.0, 123953.0, 68368.0, 39149.0, 23319.0, 14027.0, 8777.0, 5388.0, 3359.0, 2238.0, 1491.0, 948.0, 656.0, 419.0, 290.0, 200.0, 140.0, 72.0, 47.0, 37.0, 24.0, 24.0, 13.0, 12.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-6.296875, -6.0838623046875, -5.870849609375, -5.6578369140625, -5.44482421875, -5.2318115234375, -5.018798828125, -4.8057861328125, -4.5927734375, -4.3797607421875, -4.166748046875, -3.9537353515625, -3.74072265625, -3.5277099609375, -3.314697265625, -3.1016845703125, -2.888671875, -2.6756591796875, -2.462646484375, -2.2496337890625, -2.03662109375, -1.8236083984375, -1.610595703125, -1.3975830078125, -1.1845703125, -0.9715576171875, -0.758544921875, -0.5455322265625, -0.33251953125, -0.1195068359375, 0.093505859375, 0.3065185546875, 0.51953125, 0.7325439453125, 0.945556640625, 1.1585693359375, 1.37158203125, 1.5845947265625, 1.797607421875, 2.0106201171875, 2.2236328125, 2.4366455078125, 2.649658203125, 2.8626708984375, 3.07568359375, 3.2886962890625, 3.501708984375, 3.7147216796875, 3.927734375, 4.1407470703125, 4.353759765625, 4.5667724609375, 4.77978515625, 4.9927978515625, 5.205810546875, 5.4188232421875, 5.6318359375, 5.8448486328125, 6.057861328125, 6.2708740234375, 6.48388671875, 6.6968994140625, 6.909912109375, 7.1229248046875, 7.3359375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 8.0, 12.0, 15.0, 18.0, 28.0, 31.0, 25.0, 48.0, 47.0, 61.0, 87.0, 108.0, 131.0, 161.0, 176.0, 233.0, 258.0, 290.0, 296.0, 296.0, 293.0, 201.0, 236.0, 166.0, 148.0, 123.0, 113.0, 101.0, 78.0, 59.0, 33.0, 38.0, 25.0, 30.0, 24.0, 14.0, 9.0, 8.0, 9.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.4840087890625, -2.403564453125, -2.3231201171875, -2.24267578125, -2.1622314453125, -2.081787109375, -2.0013427734375, -1.9208984375, -1.8404541015625, -1.760009765625, -1.6795654296875, -1.59912109375, -1.5186767578125, -1.438232421875, -1.3577880859375, -1.27734375, -1.1968994140625, -1.116455078125, -1.0360107421875, -0.95556640625, -0.8751220703125, -0.794677734375, -0.7142333984375, -0.6337890625, -0.5533447265625, -0.472900390625, -0.3924560546875, -0.31201171875, -0.2315673828125, -0.151123046875, -0.0706787109375, 0.009765625, 0.0902099609375, 0.170654296875, 0.2510986328125, 0.33154296875, 0.4119873046875, 0.492431640625, 0.5728759765625, 0.6533203125, 0.7337646484375, 0.814208984375, 0.8946533203125, 0.97509765625, 1.0555419921875, 1.135986328125, 1.2164306640625, 1.296875, 1.3773193359375, 1.457763671875, 1.5382080078125, 1.61865234375, 1.6990966796875, 1.779541015625, 1.8599853515625, 1.9404296875, 2.0208740234375, 2.101318359375, 2.1817626953125, 2.26220703125, 2.3426513671875, 2.423095703125, 2.5035400390625, 2.583984375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 7.0, 12.0, 11.0, 20.0, 23.0, 20.0, 32.0, 35.0, 49.0, 65.0, 48.0, 79.0, 72.0, 75.0, 73.0, 58.0, 52.0, 47.0, 44.0, 34.0, 29.0, 24.0, 14.0, 14.0, 7.0, 15.0, 3.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.479434013366699, -7.182035446166992, -6.884636878967285, -6.587238311767578, -6.289839267730713, -5.992440700531006, -5.695042133331299, -5.397643089294434, -5.100244522094727, -4.8028459548950195, -4.5054473876953125, -4.2080488204956055, -3.9106497764587402, -3.613251209259033, -3.315852642059326, -3.01845383644104, -2.721055507659912, -2.423656940460205, -2.126258134841919, -1.828859567642212, -1.5314608812332153, -1.2340621948242188, -0.9366636276245117, -0.6392648220062256, -0.34186625480651855, -0.04446759819984436, 0.25293105840682983, 0.5503296852111816, 0.8477283716201782, 1.1451270580291748, 1.4425256252288818, 1.739924430847168, 2.037322998046875, 2.334721565246582, 2.632120370864868, 2.929518938064575, 3.2269177436828613, 3.5243163108825684, 3.8217148780822754, 4.119113922119141, 4.416512489318848, 4.713911056518555, 5.011309623718262, 5.308708190917969, 5.606107234954834, 5.903505802154541, 6.200904369354248, 6.498303413391113, 6.795701503753662, 7.093100070953369, 7.390498638153076, 7.687897682189941, 7.985296249389648, 8.282694816589355, 8.580093383789062, 8.87749195098877, 9.174890518188477, 9.472289085388184, 9.76968765258789, 10.067086219787598, 10.364484786987305, 10.661884307861328, 10.959281921386719, 11.256681442260742, 11.55408000946045]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 5.0, 8.0, 10.0, 8.0, 11.0, 12.0, 19.0, 19.0, 23.0, 25.0, 30.0, 27.0, 27.0, 39.0, 39.0, 42.0, 35.0, 38.0, 35.0, 39.0, 35.0, 32.0, 40.0, 33.0, 37.0, 31.0, 43.0, 39.0, 24.0, 22.0, 25.0, 13.0, 21.0, 11.0, 14.0, 15.0, 10.0, 9.0, 12.0, 5.0, 4.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-5.8547821044921875, -5.6723103523254395, -5.489838600158691, -5.307366847991943, -5.124895095825195, -4.942423343658447, -4.759951591491699, -4.577480316162109, -4.395008087158203, -4.212536334991455, -4.030064582824707, -3.847592830657959, -3.665121078491211, -3.482649326324463, -3.300177812576294, -3.117706060409546, -2.935234546661377, -2.752762794494629, -2.570291042327881, -2.387819290161133, -2.2053475379943848, -2.0228757858276367, -1.8404042720794678, -1.6579325199127197, -1.4754607677459717, -1.2929890155792236, -1.1105172634124756, -0.9280456304550171, -0.745573878288269, -0.563102126121521, -0.3806304931640625, -0.19815874099731445, -0.01568746566772461, 0.16678425669670105, 0.3492559790611267, 0.53172767162323, 0.714199423789978, 0.8966711759567261, 1.0791428089141846, 1.2616145610809326, 1.4440863132476807, 1.6265580654144287, 1.8090298175811768, 1.9915014505386353, 2.1739730834960938, 2.356444835662842, 2.53891658782959, 2.721388339996338, 2.903860092163086, 3.086331844329834, 3.268803596496582, 3.45127534866333, 3.633747100830078, 3.816218852996826, 3.998690366744995, 4.181161880493164, 4.36363410949707, 4.546105861663818, 4.728577613830566, 4.9110493659973145, 5.0935211181640625, 5.2759928703308105, 5.458464622497559, 5.640935897827148, 5.8234076499938965]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 14.0, 11.0, 20.0, 27.0, 48.0, 59.0, 106.0, 196.0, 304.0, 588.0, 956.0, 1676.0, 3083.0, 5876.0, 11240.0, 22308.0, 45656.0, 89605.0, 161325.0, 225680.0, 207241.0, 131084.0, 70094.0, 35232.0, 17351.0, 8687.0, 4442.0, 2380.0, 1402.0, 709.0, 455.0, 241.0, 170.0, 107.0, 65.0, 46.0, 23.0, 10.0, 9.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.78363037109375, -5.5828857421875, -5.38214111328125, -5.181396484375, -4.98065185546875, -4.7799072265625, -4.57916259765625, -4.37841796875, -4.17767333984375, -3.9769287109375, -3.77618408203125, -3.575439453125, -3.37469482421875, -3.1739501953125, -2.97320556640625, -2.7724609375, -2.57171630859375, -2.3709716796875, -2.17022705078125, -1.969482421875, -1.76873779296875, -1.5679931640625, -1.36724853515625, -1.16650390625, -0.96575927734375, -0.7650146484375, -0.56427001953125, -0.363525390625, -0.16278076171875, 0.0379638671875, 0.23870849609375, 0.439453125, 0.64019775390625, 0.8409423828125, 1.04168701171875, 1.242431640625, 1.44317626953125, 1.6439208984375, 1.84466552734375, 2.04541015625, 2.24615478515625, 2.4468994140625, 2.64764404296875, 2.848388671875, 3.04913330078125, 3.2498779296875, 3.45062255859375, 3.6513671875, 3.85211181640625, 4.0528564453125, 4.25360107421875, 4.454345703125, 4.65509033203125, 4.8558349609375, 5.05657958984375, 5.25732421875, 5.45806884765625, 5.6588134765625, 5.85955810546875, 6.060302734375, 6.26104736328125, 6.4617919921875, 6.66253662109375, 6.86328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 6.0, 7.0, 9.0, 13.0, 11.0, 13.0, 20.0, 23.0, 25.0, 24.0, 35.0, 25.0, 31.0, 37.0, 36.0, 38.0, 40.0, 36.0, 33.0, 39.0, 48.0, 50.0, 38.0, 32.0, 47.0, 36.0, 20.0, 29.0, 26.0, 27.0, 20.0, 16.0, 14.0, 14.0, 12.0, 13.0, 11.0, 10.0, 5.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.30859375, -6.1151123046875, -5.921630859375, -5.7281494140625, -5.53466796875, -5.3411865234375, -5.147705078125, -4.9542236328125, -4.7607421875, -4.5672607421875, -4.373779296875, -4.1802978515625, -3.98681640625, -3.7933349609375, -3.599853515625, -3.4063720703125, -3.212890625, -3.0194091796875, -2.825927734375, -2.6324462890625, -2.43896484375, -2.2454833984375, -2.052001953125, -1.8585205078125, -1.6650390625, -1.4715576171875, -1.278076171875, -1.0845947265625, -0.89111328125, -0.6976318359375, -0.504150390625, -0.3106689453125, -0.1171875, 0.0762939453125, 0.269775390625, 0.4632568359375, 0.65673828125, 0.8502197265625, 1.043701171875, 1.2371826171875, 1.4306640625, 1.6241455078125, 1.817626953125, 2.0111083984375, 2.20458984375, 2.3980712890625, 2.591552734375, 2.7850341796875, 2.978515625, 3.1719970703125, 3.365478515625, 3.5589599609375, 3.75244140625, 3.9459228515625, 4.139404296875, 4.3328857421875, 4.5263671875, 4.7198486328125, 4.913330078125, 5.1068115234375, 5.30029296875, 5.4937744140625, 5.687255859375, 5.8807373046875, 6.07421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 14.0, 8.0, 19.0, 20.0, 28.0, 62.0, 78.0, 114.0, 158.0, 263.0, 404.0, 638.0, 983.0, 1679.0, 2887.0, 5251.0, 9801.0, 19160.0, 38799.0, 80136.0, 159174.0, 257868.0, 224914.0, 123679.0, 60283.0, 29338.0, 14796.0, 7572.0, 4255.0, 2303.0, 1455.0, 873.0, 513.0, 316.0, 240.0, 141.0, 116.0, 75.0, 31.0, 27.0, 30.0, 17.0, 10.0, 6.0, 7.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2894287109375, -6.063232421875, -5.8370361328125, -5.61083984375, -5.3846435546875, -5.158447265625, -4.9322509765625, -4.7060546875, -4.4798583984375, -4.253662109375, -4.0274658203125, -3.80126953125, -3.5750732421875, -3.348876953125, -3.1226806640625, -2.896484375, -2.6702880859375, -2.444091796875, -2.2178955078125, -1.99169921875, -1.7655029296875, -1.539306640625, -1.3131103515625, -1.0869140625, -0.8607177734375, -0.634521484375, -0.4083251953125, -0.18212890625, 0.0440673828125, 0.270263671875, 0.4964599609375, 0.72265625, 0.9488525390625, 1.175048828125, 1.4012451171875, 1.62744140625, 1.8536376953125, 2.079833984375, 2.3060302734375, 2.5322265625, 2.7584228515625, 2.984619140625, 3.2108154296875, 3.43701171875, 3.6632080078125, 3.889404296875, 4.1156005859375, 4.341796875, 4.5679931640625, 4.794189453125, 5.0203857421875, 5.24658203125, 5.4727783203125, 5.698974609375, 5.9251708984375, 6.1513671875, 6.3775634765625, 6.603759765625, 6.8299560546875, 7.05615234375, 7.2823486328125, 7.508544921875, 7.7347412109375, 7.9609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 16.0, 10.0, 13.0, 16.0, 19.0, 23.0, 27.0, 24.0, 27.0, 28.0, 40.0, 42.0, 24.0, 42.0, 41.0, 53.0, 43.0, 28.0, 45.0, 50.0, 35.0, 37.0, 42.0, 22.0, 28.0, 26.0, 24.0, 23.0, 23.0, 15.0, 17.0, 13.0, 13.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.1640625, -4.0474853515625, -3.930908203125, -3.8143310546875, -3.69775390625, -3.5811767578125, -3.464599609375, -3.3480224609375, -3.2314453125, -3.1148681640625, -2.998291015625, -2.8817138671875, -2.76513671875, -2.6485595703125, -2.531982421875, -2.4154052734375, -2.298828125, -2.1822509765625, -2.065673828125, -1.9490966796875, -1.83251953125, -1.7159423828125, -1.599365234375, -1.4827880859375, -1.3662109375, -1.2496337890625, -1.133056640625, -1.0164794921875, -0.89990234375, -0.7833251953125, -0.666748046875, -0.5501708984375, -0.43359375, -0.3170166015625, -0.200439453125, -0.0838623046875, 0.03271484375, 0.1492919921875, 0.265869140625, 0.3824462890625, 0.4990234375, 0.6156005859375, 0.732177734375, 0.8487548828125, 0.96533203125, 1.0819091796875, 1.198486328125, 1.3150634765625, 1.431640625, 1.5482177734375, 1.664794921875, 1.7813720703125, 1.89794921875, 2.0145263671875, 2.131103515625, 2.2476806640625, 2.3642578125, 2.4808349609375, 2.597412109375, 2.7139892578125, 2.83056640625, 2.9471435546875, 3.063720703125, 3.1802978515625, 3.296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 14.0, 14.0, 13.0, 18.0, 29.0, 43.0, 45.0, 76.0, 104.0, 124.0, 192.0, 256.0, 385.0, 626.0, 972.0, 1701.0, 2796.0, 5186.0, 10172.0, 21018.0, 47832.0, 114257.0, 266461.0, 314793.0, 147540.0, 60591.0, 26449.0, 12318.0, 6088.0, 3251.0, 1866.0, 1077.0, 677.0, 484.0, 295.0, 229.0, 153.0, 106.0, 93.0, 56.0, 35.0, 26.0, 32.0, 10.0, 12.0, 11.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.98046875, -4.8345947265625, -4.688720703125, -4.5428466796875, -4.39697265625, -4.2510986328125, -4.105224609375, -3.9593505859375, -3.8134765625, -3.6676025390625, -3.521728515625, -3.3758544921875, -3.22998046875, -3.0841064453125, -2.938232421875, -2.7923583984375, -2.646484375, -2.5006103515625, -2.354736328125, -2.2088623046875, -2.06298828125, -1.9171142578125, -1.771240234375, -1.6253662109375, -1.4794921875, -1.3336181640625, -1.187744140625, -1.0418701171875, -0.89599609375, -0.7501220703125, -0.604248046875, -0.4583740234375, -0.3125, -0.1666259765625, -0.020751953125, 0.1251220703125, 0.27099609375, 0.4168701171875, 0.562744140625, 0.7086181640625, 0.8544921875, 1.0003662109375, 1.146240234375, 1.2921142578125, 1.43798828125, 1.5838623046875, 1.729736328125, 1.8756103515625, 2.021484375, 2.1673583984375, 2.313232421875, 2.4591064453125, 2.60498046875, 2.7508544921875, 2.896728515625, 3.0426025390625, 3.1884765625, 3.3343505859375, 3.480224609375, 3.6260986328125, 3.77197265625, 3.9178466796875, 4.063720703125, 4.2095947265625, 4.35546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 7.0, 11.0, 13.0, 15.0, 18.0, 22.0, 28.0, 40.0, 43.0, 66.0, 52.0, 70.0, 65.0, 80.0, 76.0, 74.0, 71.0, 51.0, 52.0, 35.0, 20.0, 20.0, 11.0, 10.0, 9.0, 8.0, 11.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017976760864257812, -0.00017384812235832214, -0.00016792863607406616, -0.00016200914978981018, -0.0001560896635055542, -0.00015017017722129822, -0.00014425069093704224, -0.00013833120465278625, -0.00013241171836853027, -0.0001264922320842743, -0.00012057274580001831, -0.00011465325951576233, -0.00010873377323150635, -0.00010281428694725037, -9.689480066299438e-05, -9.09753143787384e-05, -8.505582809448242e-05, -7.913634181022644e-05, -7.321685552597046e-05, -6.729736924171448e-05, -6.13778829574585e-05, -5.5458396673202515e-05, -4.953891038894653e-05, -4.361942410469055e-05, -3.769993782043457e-05, -3.178045153617859e-05, -2.5860965251922607e-05, -1.9941478967666626e-05, -1.4021992683410645e-05, -8.102506399154663e-06, -2.1830201148986816e-06, 3.7364661693573e-06, 9.655952453613281e-06, 1.5575438737869263e-05, 2.1494925022125244e-05, 2.7414411306381226e-05, 3.333389759063721e-05, 3.925338387489319e-05, 4.517287015914917e-05, 5.109235644340515e-05, 5.701184272766113e-05, 6.293132901191711e-05, 6.88508152961731e-05, 7.477030158042908e-05, 8.068978786468506e-05, 8.660927414894104e-05, 9.252876043319702e-05, 9.8448246717453e-05, 0.00010436773300170898, 0.00011028721928596497, 0.00011620670557022095, 0.00012212619185447693, 0.0001280456781387329, 0.0001339651644229889, 0.00013988465070724487, 0.00014580413699150085, 0.00015172362327575684, 0.00015764310956001282, 0.0001635625958442688, 0.00016948208212852478, 0.00017540156841278076, 0.00018132105469703674, 0.00018724054098129272, 0.0001931600272655487, 0.0001990795135498047]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 14.0, 13.0, 23.0, 35.0, 59.0, 64.0, 119.0, 153.0, 246.0, 321.0, 516.0, 758.0, 1160.0, 1980.0, 3472.0, 6167.0, 11455.0, 22056.0, 44227.0, 89037.0, 165569.0, 235190.0, 209041.0, 125437.0, 63443.0, 31701.0, 16227.0, 8357.0, 4686.0, 2684.0, 1549.0, 939.0, 598.0, 392.0, 257.0, 183.0, 113.0, 87.0, 62.0, 38.0, 36.0, 20.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0], "bins": [-3.3828125, -3.285491943359375, -3.18817138671875, -3.090850830078125, -2.9935302734375, -2.896209716796875, -2.79888916015625, -2.701568603515625, -2.604248046875, -2.506927490234375, -2.40960693359375, -2.312286376953125, -2.2149658203125, -2.117645263671875, -2.02032470703125, -1.923004150390625, -1.82568359375, -1.728363037109375, -1.63104248046875, -1.533721923828125, -1.4364013671875, -1.339080810546875, -1.24176025390625, -1.144439697265625, -1.047119140625, -0.949798583984375, -0.85247802734375, -0.755157470703125, -0.6578369140625, -0.560516357421875, -0.46319580078125, -0.365875244140625, -0.2685546875, -0.171234130859375, -0.07391357421875, 0.023406982421875, 0.1207275390625, 0.218048095703125, 0.31536865234375, 0.412689208984375, 0.510009765625, 0.607330322265625, 0.70465087890625, 0.801971435546875, 0.8992919921875, 0.996612548828125, 1.09393310546875, 1.191253662109375, 1.28857421875, 1.385894775390625, 1.48321533203125, 1.580535888671875, 1.6778564453125, 1.775177001953125, 1.87249755859375, 1.969818115234375, 2.067138671875, 2.164459228515625, 2.26177978515625, 2.359100341796875, 2.4564208984375, 2.553741455078125, 2.65106201171875, 2.748382568359375, 2.845703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 13.0, 8.0, 10.0, 12.0, 29.0, 36.0, 30.0, 45.0, 51.0, 60.0, 72.0, 71.0, 80.0, 70.0, 59.0, 60.0, 63.0, 40.0, 39.0, 29.0, 25.0, 17.0, 11.0, 15.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0888671875, -1.055572509765625, -1.02227783203125, -0.988983154296875, -0.9556884765625, -0.922393798828125, -0.88909912109375, -0.855804443359375, -0.822509765625, -0.789215087890625, -0.75592041015625, -0.722625732421875, -0.6893310546875, -0.656036376953125, -0.62274169921875, -0.589447021484375, -0.55615234375, -0.522857666015625, -0.48956298828125, -0.456268310546875, -0.4229736328125, -0.389678955078125, -0.35638427734375, -0.323089599609375, -0.289794921875, -0.256500244140625, -0.22320556640625, -0.189910888671875, -0.1566162109375, -0.123321533203125, -0.09002685546875, -0.056732177734375, -0.0234375, 0.009857177734375, 0.04315185546875, 0.076446533203125, 0.1097412109375, 0.143035888671875, 0.17633056640625, 0.209625244140625, 0.242919921875, 0.276214599609375, 0.30950927734375, 0.342803955078125, 0.3760986328125, 0.409393310546875, 0.44268798828125, 0.475982666015625, 0.50927734375, 0.542572021484375, 0.57586669921875, 0.609161376953125, 0.6424560546875, 0.675750732421875, 0.70904541015625, 0.742340087890625, 0.775634765625, 0.808929443359375, 0.84222412109375, 0.875518798828125, 0.9088134765625, 0.942108154296875, 0.97540283203125, 1.008697509765625, 1.0419921875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 11.0, 12.0, 27.0, 15.0, 22.0, 28.0, 41.0, 60.0, 58.0, 62.0, 76.0, 60.0, 62.0, 71.0, 79.0, 52.0, 47.0, 32.0, 29.0, 30.0, 21.0, 14.0, 18.0, 3.0, 10.0, 9.0, 7.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.090021133422852, -7.80002498626709, -7.510028839111328, -7.220032215118408, -6.9300360679626465, -6.640039920806885, -6.350043296813965, -6.060047149658203, -5.770051002502441, -5.48005485534668, -5.190058708190918, -4.900062084197998, -4.610065937042236, -4.320069789886475, -4.030073165893555, -3.740077018737793, -3.4500808715820312, -3.1600847244262695, -2.8700883388519287, -2.580091953277588, -2.290095806121826, -2.0000996589660645, -1.7101032733917236, -1.4201068878173828, -1.130110740661621, -0.8401144742965698, -0.5501182079315186, -0.2601219415664673, 0.029874324798583984, 0.31987059116363525, 0.6098668575286865, 0.8998632431030273, 1.189859390258789, 1.4798556566238403, 1.7698519229888916, 2.0598483085632324, 2.349844455718994, 2.639840602874756, 2.9298369884490967, 3.2198333740234375, 3.509829521179199, 3.799825668334961, 4.089821815490723, 4.379818439483643, 4.669814586639404, 4.959810733795166, 5.249807357788086, 5.539803504943848, 5.829799652099609, 6.119795799255371, 6.409791946411133, 6.699788570404053, 6.9897847175598145, 7.279780864715576, 7.569777488708496, 7.859773635864258, 8.14976978302002, 8.439765930175781, 8.729762077331543, 9.019758224487305, 9.309755325317383, 9.599751472473145, 9.889747619628906, 10.179743766784668, 10.46973991394043]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 7.0, 8.0, 9.0, 11.0, 12.0, 16.0, 15.0, 23.0, 31.0, 20.0, 31.0, 26.0, 26.0, 41.0, 39.0, 41.0, 39.0, 43.0, 39.0, 36.0, 28.0, 38.0, 32.0, 37.0, 32.0, 45.0, 34.0, 29.0, 30.0, 21.0, 21.0, 17.0, 14.0, 11.0, 19.0, 11.0, 9.0, 7.0, 8.0, 10.0, 2.0, 3.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-5.845791339874268, -5.666573524475098, -5.487356185913086, -5.308138370513916, -5.128920555114746, -4.949702739715576, -4.770484924316406, -4.5912675857543945, -4.412049770355225, -4.232831954956055, -4.053614616394043, -3.874396800994873, -3.695178985595703, -3.515961170196533, -3.3367435932159424, -3.1575260162353516, -2.9783082008361816, -2.7990903854370117, -2.619872808456421, -2.44065523147583, -2.26143741607666, -2.0822196006774902, -1.9030020236968994, -1.723784327507019, -1.5445666313171387, -1.3653489351272583, -1.186131238937378, -1.0069135427474976, -0.8276958465576172, -0.6484781503677368, -0.46926045417785645, -0.2900427579879761, -0.1108255386352539, 0.06839215755462646, 0.24760985374450684, 0.4268275499343872, 0.6060452461242676, 0.785262942314148, 0.9644806385040283, 1.1436983346939087, 1.322916030883789, 1.5021337270736694, 1.6813514232635498, 1.8605691194534302, 2.0397868156433105, 2.2190046310424805, 2.3982222080230713, 2.577439785003662, 2.756657600402832, 2.935875415802002, 3.1150929927825928, 3.2943105697631836, 3.4735283851623535, 3.6527462005615234, 3.8319637775421143, 4.011181354522705, 4.190399169921875, 4.369616985321045, 4.548834800720215, 4.728052139282227, 4.9072699546813965, 5.086487770080566, 5.265705108642578, 5.444922924041748, 5.624140739440918]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 11.0, 13.0, 21.0, 28.0, 51.0, 86.0, 98.0, 159.0, 273.0, 436.0, 746.0, 1178.0, 2075.0, 3472.0, 6050.0, 10546.0, 17882.0, 31022.0, 52922.0, 87187.0, 130490.0, 167371.0, 169675.0, 136651.0, 92931.0, 56890.0, 33397.0, 19484.0, 11200.0, 6640.0, 3878.0, 2182.0, 1368.0, 806.0, 492.0, 301.0, 214.0, 117.0, 66.0, 40.0, 37.0, 25.0, 19.0, 10.0, 5.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0234375, -5.84130859375, -5.6591796875, -5.47705078125, -5.294921875, -5.11279296875, -4.9306640625, -4.74853515625, -4.56640625, -4.38427734375, -4.2021484375, -4.02001953125, -3.837890625, -3.65576171875, -3.4736328125, -3.29150390625, -3.109375, -2.92724609375, -2.7451171875, -2.56298828125, -2.380859375, -2.19873046875, -2.0166015625, -1.83447265625, -1.65234375, -1.47021484375, -1.2880859375, -1.10595703125, -0.923828125, -0.74169921875, -0.5595703125, -0.37744140625, -0.1953125, -0.01318359375, 0.1689453125, 0.35107421875, 0.533203125, 0.71533203125, 0.8974609375, 1.07958984375, 1.26171875, 1.44384765625, 1.6259765625, 1.80810546875, 1.990234375, 2.17236328125, 2.3544921875, 2.53662109375, 2.71875, 2.90087890625, 3.0830078125, 3.26513671875, 3.447265625, 3.62939453125, 3.8115234375, 3.99365234375, 4.17578125, 4.35791015625, 4.5400390625, 4.72216796875, 4.904296875, 5.08642578125, 5.2685546875, 5.45068359375, 5.6328125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 9.0, 4.0, 11.0, 11.0, 15.0, 16.0, 26.0, 25.0, 36.0, 29.0, 33.0, 40.0, 46.0, 52.0, 53.0, 50.0, 51.0, 46.0, 40.0, 56.0, 36.0, 37.0, 39.0, 39.0, 31.0, 27.0, 20.0, 26.0, 15.0, 14.0, 16.0, 9.0, 12.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.1015625, -7.87701416015625, -7.6524658203125, -7.42791748046875, -7.203369140625, -6.97882080078125, -6.7542724609375, -6.52972412109375, -6.30517578125, -6.08062744140625, -5.8560791015625, -5.63153076171875, -5.406982421875, -5.18243408203125, -4.9578857421875, -4.73333740234375, -4.5087890625, -4.28424072265625, -4.0596923828125, -3.83514404296875, -3.610595703125, -3.38604736328125, -3.1614990234375, -2.93695068359375, -2.71240234375, -2.48785400390625, -2.2633056640625, -2.03875732421875, -1.814208984375, -1.58966064453125, -1.3651123046875, -1.14056396484375, -0.916015625, -0.69146728515625, -0.4669189453125, -0.24237060546875, -0.017822265625, 0.20672607421875, 0.4312744140625, 0.65582275390625, 0.88037109375, 1.10491943359375, 1.3294677734375, 1.55401611328125, 1.778564453125, 2.00311279296875, 2.2276611328125, 2.45220947265625, 2.6767578125, 2.90130615234375, 3.1258544921875, 3.35040283203125, 3.574951171875, 3.79949951171875, 4.0240478515625, 4.24859619140625, 4.47314453125, 4.69769287109375, 4.9222412109375, 5.14678955078125, 5.371337890625, 5.59588623046875, 5.8204345703125, 6.04498291015625, 6.26953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 17.0, 10.0, 22.0, 33.0, 45.0, 64.0, 85.0, 141.0, 185.0, 243.0, 409.0, 560.0, 867.0, 1373.0, 2004.0, 3197.0, 5038.0, 8207.0, 12791.0, 21069.0, 33839.0, 54867.0, 84779.0, 122928.0, 153863.0, 156992.0, 130744.0, 92869.0, 60677.0, 38071.0, 23524.0, 14474.0, 8930.0, 5399.0, 3549.0, 2214.0, 1448.0, 980.0, 594.0, 461.0, 312.0, 178.0, 146.0, 92.0, 79.0, 51.0, 32.0, 28.0, 22.0, 18.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-5.05859375, -4.90106201171875, -4.7435302734375, -4.58599853515625, -4.428466796875, -4.27093505859375, -4.1134033203125, -3.95587158203125, -3.79833984375, -3.64080810546875, -3.4832763671875, -3.32574462890625, -3.168212890625, -3.01068115234375, -2.8531494140625, -2.69561767578125, -2.5380859375, -2.38055419921875, -2.2230224609375, -2.06549072265625, -1.907958984375, -1.75042724609375, -1.5928955078125, -1.43536376953125, -1.27783203125, -1.12030029296875, -0.9627685546875, -0.80523681640625, -0.647705078125, -0.49017333984375, -0.3326416015625, -0.17510986328125, -0.017578125, 0.13995361328125, 0.2974853515625, 0.45501708984375, 0.612548828125, 0.77008056640625, 0.9276123046875, 1.08514404296875, 1.24267578125, 1.40020751953125, 1.5577392578125, 1.71527099609375, 1.872802734375, 2.03033447265625, 2.1878662109375, 2.34539794921875, 2.5029296875, 2.66046142578125, 2.8179931640625, 2.97552490234375, 3.133056640625, 3.29058837890625, 3.4481201171875, 3.60565185546875, 3.76318359375, 3.92071533203125, 4.0782470703125, 4.23577880859375, 4.393310546875, 4.55084228515625, 4.7083740234375, 4.86590576171875, 5.0234375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 14.0, 11.0, 12.0, 13.0, 12.0, 25.0, 26.0, 22.0, 28.0, 32.0, 32.0, 33.0, 28.0, 30.0, 35.0, 45.0, 43.0, 31.0, 35.0, 39.0, 44.0, 29.0, 29.0, 38.0, 35.0, 29.0, 27.0, 27.0, 27.0, 22.0, 20.0, 20.0, 14.0, 14.0, 7.0, 9.0, 7.0, 5.0, 10.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.240234375, -3.129302978515625, -3.01837158203125, -2.907440185546875, -2.7965087890625, -2.685577392578125, -2.57464599609375, -2.463714599609375, -2.352783203125, -2.241851806640625, -2.13092041015625, -2.019989013671875, -1.9090576171875, -1.798126220703125, -1.68719482421875, -1.576263427734375, -1.46533203125, -1.354400634765625, -1.24346923828125, -1.132537841796875, -1.0216064453125, -0.910675048828125, -0.79974365234375, -0.688812255859375, -0.577880859375, -0.466949462890625, -0.35601806640625, -0.245086669921875, -0.1341552734375, -0.023223876953125, 0.08770751953125, 0.198638916015625, 0.3095703125, 0.420501708984375, 0.53143310546875, 0.642364501953125, 0.7532958984375, 0.864227294921875, 0.97515869140625, 1.086090087890625, 1.197021484375, 1.307952880859375, 1.41888427734375, 1.529815673828125, 1.6407470703125, 1.751678466796875, 1.86260986328125, 1.973541259765625, 2.08447265625, 2.195404052734375, 2.30633544921875, 2.417266845703125, 2.5281982421875, 2.639129638671875, 2.75006103515625, 2.860992431640625, 2.971923828125, 3.082855224609375, 3.19378662109375, 3.304718017578125, 3.4156494140625, 3.526580810546875, 3.63751220703125, 3.748443603515625, 3.859375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 10.0, 12.0, 22.0, 29.0, 63.0, 76.0, 118.0, 192.0, 244.0, 338.0, 608.0, 829.0, 1395.0, 2188.0, 3496.0, 5842.0, 10267.0, 18981.0, 36425.0, 71389.0, 135845.0, 215448.0, 225095.0, 149906.0, 79882.0, 40471.0, 21196.0, 11313.0, 6433.0, 3890.0, 2313.0, 1473.0, 929.0, 576.0, 407.0, 290.0, 191.0, 118.0, 85.0, 55.0, 43.0, 22.0, 17.0, 10.0, 10.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.23046875, -4.08984375, -3.94921875, -3.80859375, -3.66796875, -3.52734375, -3.38671875, -3.24609375, -3.10546875, -2.96484375, -2.82421875, -2.68359375, -2.54296875, -2.40234375, -2.26171875, -2.12109375, -1.98046875, -1.83984375, -1.69921875, -1.55859375, -1.41796875, -1.27734375, -1.13671875, -0.99609375, -0.85546875, -0.71484375, -0.57421875, -0.43359375, -0.29296875, -0.15234375, -0.01171875, 0.12890625, 0.26953125, 0.41015625, 0.55078125, 0.69140625, 0.83203125, 0.97265625, 1.11328125, 1.25390625, 1.39453125, 1.53515625, 1.67578125, 1.81640625, 1.95703125, 2.09765625, 2.23828125, 2.37890625, 2.51953125, 2.66015625, 2.80078125, 2.94140625, 3.08203125, 3.22265625, 3.36328125, 3.50390625, 3.64453125, 3.78515625, 3.92578125, 4.06640625, 4.20703125, 4.34765625, 4.48828125, 4.62890625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 7.0, 12.0, 10.0, 11.0, 16.0, 20.0, 19.0, 28.0, 49.0, 47.0, 45.0, 60.0, 66.0, 75.0, 84.0, 82.0, 69.0, 54.0, 49.0, 47.0, 41.0, 25.0, 15.0, 14.0, 10.0, 12.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003941059112548828, -0.00038155168294906616, -0.0003689974546432495, -0.00035644322633743286, -0.0003438889980316162, -0.00033133476972579956, -0.0003187805414199829, -0.00030622631311416626, -0.0002936720848083496, -0.00028111785650253296, -0.0002685636281967163, -0.00025600939989089966, -0.000243455171585083, -0.00023090094327926636, -0.0002183467149734497, -0.00020579248666763306, -0.0001932382583618164, -0.00018068403005599976, -0.0001681298017501831, -0.00015557557344436646, -0.0001430213451385498, -0.00013046711683273315, -0.0001179128885269165, -0.00010535866022109985, -9.28044319152832e-05, -8.025020360946655e-05, -6.76959753036499e-05, -5.514174699783325e-05, -4.25875186920166e-05, -3.003329038619995e-05, -1.74790620803833e-05, -4.92483377456665e-06, 7.62939453125e-06, 2.018362283706665e-05, 3.27378511428833e-05, 4.529207944869995e-05, 5.78463077545166e-05, 7.040053606033325e-05, 8.29547643661499e-05, 9.550899267196655e-05, 0.0001080632209777832, 0.00012061744928359985, 0.0001331716775894165, 0.00014572590589523315, 0.0001582801342010498, 0.00017083436250686646, 0.0001833885908126831, 0.00019594281911849976, 0.0002084970474243164, 0.00022105127573013306, 0.0002336055040359497, 0.00024615973234176636, 0.000258713960647583, 0.00027126818895339966, 0.0002838224172592163, 0.00029637664556503296, 0.0003089308738708496, 0.00032148510217666626, 0.0003340393304824829, 0.00034659355878829956, 0.0003591477870941162, 0.00037170201539993286, 0.0003842562437057495, 0.00039681047201156616, 0.0004093647003173828]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 19.0, 37.0, 48.0, 77.0, 117.0, 165.0, 180.0, 289.0, 446.0, 612.0, 980.0, 1443.0, 2305.0, 3448.0, 5500.0, 8800.0, 14409.0, 24316.0, 40800.0, 68997.0, 111942.0, 162570.0, 183932.0, 154360.0, 103907.0, 63001.0, 37474.0, 22131.0, 13499.0, 8101.0, 5097.0, 3323.0, 2106.0, 1330.0, 907.0, 556.0, 415.0, 286.0, 186.0, 143.0, 94.0, 58.0, 37.0, 34.0, 21.0, 12.0, 10.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.2578125, -3.15411376953125, -3.0504150390625, -2.94671630859375, -2.843017578125, -2.73931884765625, -2.6356201171875, -2.53192138671875, -2.42822265625, -2.32452392578125, -2.2208251953125, -2.11712646484375, -2.013427734375, -1.90972900390625, -1.8060302734375, -1.70233154296875, -1.5986328125, -1.49493408203125, -1.3912353515625, -1.28753662109375, -1.183837890625, -1.08013916015625, -0.9764404296875, -0.87274169921875, -0.76904296875, -0.66534423828125, -0.5616455078125, -0.45794677734375, -0.354248046875, -0.25054931640625, -0.1468505859375, -0.04315185546875, 0.060546875, 0.16424560546875, 0.2679443359375, 0.37164306640625, 0.475341796875, 0.57904052734375, 0.6827392578125, 0.78643798828125, 0.89013671875, 0.99383544921875, 1.0975341796875, 1.20123291015625, 1.304931640625, 1.40863037109375, 1.5123291015625, 1.61602783203125, 1.7197265625, 1.82342529296875, 1.9271240234375, 2.03082275390625, 2.134521484375, 2.23822021484375, 2.3419189453125, 2.44561767578125, 2.54931640625, 2.65301513671875, 2.7567138671875, 2.86041259765625, 2.964111328125, 3.06781005859375, 3.1715087890625, 3.27520751953125, 3.37890625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 18.0, 26.0, 26.0, 35.0, 37.0, 43.0, 46.0, 46.0, 62.0, 53.0, 51.0, 58.0, 59.0, 59.0, 70.0, 47.0, 57.0, 32.0, 26.0, 23.0, 34.0, 18.0, 11.0, 10.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.42578125, -1.3802490234375, -1.334716796875, -1.2891845703125, -1.24365234375, -1.1981201171875, -1.152587890625, -1.1070556640625, -1.0615234375, -1.0159912109375, -0.970458984375, -0.9249267578125, -0.87939453125, -0.8338623046875, -0.788330078125, -0.7427978515625, -0.697265625, -0.6517333984375, -0.606201171875, -0.5606689453125, -0.51513671875, -0.4696044921875, -0.424072265625, -0.3785400390625, -0.3330078125, -0.2874755859375, -0.241943359375, -0.1964111328125, -0.15087890625, -0.1053466796875, -0.059814453125, -0.0142822265625, 0.03125, 0.0767822265625, 0.122314453125, 0.1678466796875, 0.21337890625, 0.2589111328125, 0.304443359375, 0.3499755859375, 0.3955078125, 0.4410400390625, 0.486572265625, 0.5321044921875, 0.57763671875, 0.6231689453125, 0.668701171875, 0.7142333984375, 0.759765625, 0.8052978515625, 0.850830078125, 0.8963623046875, 0.94189453125, 0.9874267578125, 1.032958984375, 1.0784912109375, 1.1240234375, 1.1695556640625, 1.215087890625, 1.2606201171875, 1.30615234375, 1.3516845703125, 1.397216796875, 1.4427490234375, 1.48828125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 11.0, 15.0, 15.0, 19.0, 18.0, 37.0, 31.0, 46.0, 64.0, 71.0, 76.0, 76.0, 72.0, 77.0, 60.0, 66.0, 53.0, 31.0, 36.0, 24.0, 31.0, 13.0, 10.0, 6.0, 12.0, 9.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.653032302856445, -8.334821701049805, -8.016611099243164, -7.698400497436523, -7.380189895629883, -7.061979293823242, -6.74376916885376, -6.425558567047119, -6.1073479652404785, -5.789137363433838, -5.470926761627197, -5.152716159820557, -4.834506034851074, -4.516295433044434, -4.198084831237793, -3.8798742294311523, -3.5616636276245117, -3.243453025817871, -2.9252424240112305, -2.607032060623169, -2.2888214588165283, -1.9706108570098877, -1.6524003744125366, -1.3341898918151855, -1.015979290008545, -0.6977687478065491, -0.3795582056045532, -0.06134766340255737, 0.2568628787994385, 0.5750734806060791, 0.8932839632034302, 1.2114944458007812, 1.5297060012817383, 1.847916603088379, 2.1661272048950195, 2.484337568283081, 2.8025481700897217, 3.1207587718963623, 3.438969135284424, 3.7571797370910645, 4.075390338897705, 4.393600940704346, 4.711811542510986, 5.030022144317627, 5.348232269287109, 5.66644287109375, 5.984653472900391, 6.302864074707031, 6.621074676513672, 6.9392852783203125, 7.257495880126953, 7.575706481933594, 7.893917083740234, 8.212127685546875, 8.530338287353516, 8.848548889160156, 9.166759490966797, 9.484970092773438, 9.803180694580078, 10.121391296386719, 10.43960189819336, 10.7578125, 11.07602310180664, 11.394233703613281, 11.712443351745605]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 8.0, 8.0, 13.0, 17.0, 12.0, 25.0, 18.0, 27.0, 23.0, 23.0, 29.0, 37.0, 40.0, 30.0, 30.0, 44.0, 39.0, 48.0, 41.0, 30.0, 38.0, 35.0, 36.0, 41.0, 50.0, 29.0, 33.0, 28.0, 20.0, 19.0, 24.0, 15.0, 9.0, 12.0, 13.0, 14.0, 6.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.179008960723877, -5.988417148590088, -5.797824859619141, -5.607233047485352, -5.4166412353515625, -5.226048946380615, -5.035457134246826, -4.844864845275879, -4.65427303314209, -4.463681221008301, -4.2730889320373535, -4.0824971199035645, -3.8919050693511963, -3.701313018798828, -3.510721206665039, -3.320129156112671, -3.1295371055603027, -2.9389450550079346, -2.7483530044555664, -2.5577611923217773, -2.367169141769409, -2.176577091217041, -1.9859851598739624, -1.7953932285308838, -1.6048011779785156, -1.4142091274261475, -1.2236171960830688, -1.0330252647399902, -0.8424332141876221, -0.6518412232398987, -0.4612492322921753, -0.2706573009490967, -0.08006477355957031, 0.11052721738815308, 0.30111920833587646, 0.49171119928359985, 0.6823031902313232, 0.8728951811790466, 1.06348717212677, 1.2540791034698486, 1.4446711540222168, 1.635263204574585, 1.8258551359176636, 2.016447067260742, 2.2070391178131104, 2.3976311683654785, 2.5882229804992676, 2.7788150310516357, 2.969407081604004, 3.159999132156372, 3.3505911827087402, 3.5411829948425293, 3.7317750453948975, 3.9223670959472656, 4.112958908081055, 4.303550720214844, 4.494143009185791, 4.68473482131958, 4.875327110290527, 5.065918922424316, 5.2565107345581055, 5.447103023529053, 5.637694835662842, 5.828287124633789, 6.018878936767578]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 5.0, 3.0, 11.0, 10.0, 11.0, 16.0, 23.0, 41.0, 48.0, 50.0, 99.0, 131.0, 191.0, 287.0, 398.0, 552.0, 871.0, 1292.0, 1966.0, 2912.0, 4685.0, 7397.0, 12123.0, 21308.0, 37995.0, 75213.0, 163150.0, 387008.0, 834973.0, 1149320.0, 805344.0, 366738.0, 156895.0, 72823.0, 37631.0, 20732.0, 11879.0, 7295.0, 4402.0, 2884.0, 1797.0, 1214.0, 838.0, 558.0, 360.0, 252.0, 190.0, 126.0, 76.0, 60.0, 41.0, 18.0, 17.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-7.140625, -6.92071533203125, -6.7008056640625, -6.48089599609375, -6.260986328125, -6.04107666015625, -5.8211669921875, -5.60125732421875, -5.38134765625, -5.16143798828125, -4.9415283203125, -4.72161865234375, -4.501708984375, -4.28179931640625, -4.0618896484375, -3.84197998046875, -3.6220703125, -3.40216064453125, -3.1822509765625, -2.96234130859375, -2.742431640625, -2.52252197265625, -2.3026123046875, -2.08270263671875, -1.86279296875, -1.64288330078125, -1.4229736328125, -1.20306396484375, -0.983154296875, -0.76324462890625, -0.5433349609375, -0.32342529296875, -0.103515625, 0.11639404296875, 0.3363037109375, 0.55621337890625, 0.776123046875, 0.99603271484375, 1.2159423828125, 1.43585205078125, 1.65576171875, 1.87567138671875, 2.0955810546875, 2.31549072265625, 2.535400390625, 2.75531005859375, 2.9752197265625, 3.19512939453125, 3.4150390625, 3.63494873046875, 3.8548583984375, 4.07476806640625, 4.294677734375, 4.51458740234375, 4.7344970703125, 4.95440673828125, 5.17431640625, 5.39422607421875, 5.6141357421875, 5.83404541015625, 6.053955078125, 6.27386474609375, 6.4937744140625, 6.71368408203125, 6.93359375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 3.0, 10.0, 14.0, 16.0, 12.0, 14.0, 21.0, 19.0, 27.0, 34.0, 28.0, 41.0, 36.0, 41.0, 35.0, 50.0, 50.0, 54.0, 50.0, 34.0, 36.0, 38.0, 41.0, 40.0, 28.0, 36.0, 25.0, 22.0, 27.0, 21.0, 15.0, 8.0, 15.0, 12.0, 7.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.65625, -4.5142822265625, -4.372314453125, -4.2303466796875, -4.08837890625, -3.9464111328125, -3.804443359375, -3.6624755859375, -3.5205078125, -3.3785400390625, -3.236572265625, -3.0946044921875, -2.95263671875, -2.8106689453125, -2.668701171875, -2.5267333984375, -2.384765625, -2.2427978515625, -2.100830078125, -1.9588623046875, -1.81689453125, -1.6749267578125, -1.532958984375, -1.3909912109375, -1.2490234375, -1.1070556640625, -0.965087890625, -0.8231201171875, -0.68115234375, -0.5391845703125, -0.397216796875, -0.2552490234375, -0.11328125, 0.0286865234375, 0.170654296875, 0.3126220703125, 0.45458984375, 0.5965576171875, 0.738525390625, 0.8804931640625, 1.0224609375, 1.1644287109375, 1.306396484375, 1.4483642578125, 1.59033203125, 1.7322998046875, 1.874267578125, 2.0162353515625, 2.158203125, 2.3001708984375, 2.442138671875, 2.5841064453125, 2.72607421875, 2.8680419921875, 3.010009765625, 3.1519775390625, 3.2939453125, 3.4359130859375, 3.577880859375, 3.7198486328125, 3.86181640625, 4.0037841796875, 4.145751953125, 4.2877197265625, 4.4296875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 9.0, 8.0, 14.0, 12.0, 22.0, 24.0, 36.0, 69.0, 85.0, 153.0, 204.0, 301.0, 404.0, 616.0, 940.0, 1451.0, 2264.0, 3438.0, 5376.0, 8986.0, 15345.0, 26337.0, 48166.0, 89287.0, 177177.0, 368219.0, 752002.0, 1106528.0, 791674.0, 392154.0, 188155.0, 94624.0, 50298.0, 28037.0, 16159.0, 9528.0, 5723.0, 3655.0, 2305.0, 1526.0, 954.0, 657.0, 438.0, 292.0, 195.0, 139.0, 79.0, 54.0, 50.0, 38.0, 28.0, 19.0, 11.0, 9.0, 7.0, 7.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.0078125, -6.78564453125, -6.5634765625, -6.34130859375, -6.119140625, -5.89697265625, -5.6748046875, -5.45263671875, -5.23046875, -5.00830078125, -4.7861328125, -4.56396484375, -4.341796875, -4.11962890625, -3.8974609375, -3.67529296875, -3.453125, -3.23095703125, -3.0087890625, -2.78662109375, -2.564453125, -2.34228515625, -2.1201171875, -1.89794921875, -1.67578125, -1.45361328125, -1.2314453125, -1.00927734375, -0.787109375, -0.56494140625, -0.3427734375, -0.12060546875, 0.1015625, 0.32373046875, 0.5458984375, 0.76806640625, 0.990234375, 1.21240234375, 1.4345703125, 1.65673828125, 1.87890625, 2.10107421875, 2.3232421875, 2.54541015625, 2.767578125, 2.98974609375, 3.2119140625, 3.43408203125, 3.65625, 3.87841796875, 4.1005859375, 4.32275390625, 4.544921875, 4.76708984375, 4.9892578125, 5.21142578125, 5.43359375, 5.65576171875, 5.8779296875, 6.10009765625, 6.322265625, 6.54443359375, 6.7666015625, 6.98876953125, 7.2109375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 9.0, 13.0, 18.0, 24.0, 28.0, 31.0, 38.0, 37.0, 79.0, 104.0, 130.0, 146.0, 206.0, 218.0, 273.0, 322.0, 358.0, 346.0, 308.0, 294.0, 220.0, 189.0, 145.0, 128.0, 90.0, 69.0, 54.0, 50.0, 31.0, 21.0, 21.0, 24.0, 10.0, 9.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.166015625, -3.082489013671875, -2.99896240234375, -2.915435791015625, -2.8319091796875, -2.748382568359375, -2.66485595703125, -2.581329345703125, -2.497802734375, -2.414276123046875, -2.33074951171875, -2.247222900390625, -2.1636962890625, -2.080169677734375, -1.99664306640625, -1.913116455078125, -1.82958984375, -1.746063232421875, -1.66253662109375, -1.579010009765625, -1.4954833984375, -1.411956787109375, -1.32843017578125, -1.244903564453125, -1.161376953125, -1.077850341796875, -0.99432373046875, -0.910797119140625, -0.8272705078125, -0.743743896484375, -0.66021728515625, -0.576690673828125, -0.4931640625, -0.409637451171875, -0.32611083984375, -0.242584228515625, -0.1590576171875, -0.075531005859375, 0.00799560546875, 0.091522216796875, 0.175048828125, 0.258575439453125, 0.34210205078125, 0.425628662109375, 0.5091552734375, 0.592681884765625, 0.67620849609375, 0.759735107421875, 0.84326171875, 0.926788330078125, 1.01031494140625, 1.093841552734375, 1.1773681640625, 1.260894775390625, 1.34442138671875, 1.427947998046875, 1.511474609375, 1.595001220703125, 1.67852783203125, 1.762054443359375, 1.8455810546875, 1.929107666015625, 2.01263427734375, 2.096160888671875, 2.1796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 13.0, 7.0, 24.0, 29.0, 43.0, 63.0, 52.0, 94.0, 83.0, 101.0, 81.0, 97.0, 63.0, 53.0, 48.0, 37.0, 26.0, 12.0, 15.0, 16.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.35332202911377, -10.997031211853027, -10.640740394592285, -10.28445053100586, -9.928159713745117, -9.571868896484375, -9.215578079223633, -8.85928726196289, -8.502996444702148, -8.146705627441406, -7.790415287017822, -7.43412446975708, -7.077833652496338, -6.721543312072754, -6.365252494812012, -6.0089616775512695, -5.6526713371276855, -5.296380519866943, -4.940090179443359, -4.583799362182617, -4.227508544921875, -3.871217966079712, -3.514927387237549, -3.1586365699768066, -2.8023459911346436, -2.4460554122924805, -2.0897645950317383, -1.7334740161895752, -1.3771833181381226, -1.02089262008667, -0.6646020412445068, -0.30831122398376465, 0.04797935485839844, 0.4042700231075287, 0.7605606913566589, 1.1168513298034668, 1.4731420278549194, 1.829432725906372, 2.185723304748535, 2.5420141220092773, 2.8983047008514404, 3.2545952796936035, 3.6108860969543457, 3.967176675796509, 4.323467254638672, 4.679758071899414, 5.036048889160156, 5.392339706420898, 5.748630046844482, 6.104920864105225, 6.461211204528809, 6.817502021789551, 7.173792839050293, 7.530083656311035, 7.886373996734619, 8.242664337158203, 8.598955154418945, 8.955245971679688, 9.31153678894043, 9.667827606201172, 10.024117469787598, 10.38040828704834, 10.736699104309082, 11.092989921569824, 11.449280738830566]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 7.0, 15.0, 14.0, 14.0, 13.0, 18.0, 25.0, 17.0, 27.0, 28.0, 23.0, 24.0, 33.0, 39.0, 36.0, 38.0, 40.0, 42.0, 40.0, 45.0, 46.0, 31.0, 37.0, 44.0, 36.0, 34.0, 19.0, 22.0, 30.0, 23.0, 13.0, 19.0, 17.0, 16.0, 13.0, 15.0, 6.0, 11.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.965344429016113, -4.798496246337891, -4.631648063659668, -4.464799880981445, -4.297951698303223, -4.131103992462158, -3.9642558097839355, -3.797407627105713, -3.6305594444274902, -3.4637112617492676, -3.296863079071045, -3.1300151348114014, -2.9631669521331787, -2.796318769454956, -2.6294708251953125, -2.46262264251709, -2.295774459838867, -2.1289262771606445, -1.9620782136917114, -1.7952301502227783, -1.6283819675445557, -1.461533784866333, -1.2946857213974, -1.1278376579284668, -0.9609894752502441, -0.7941413521766663, -0.6272932291030884, -0.4604451060295105, -0.2935969829559326, -0.12674885988235474, 0.040099263191223145, 0.20694732666015625, 0.3737959861755371, 0.540644109249115, 0.7074922323226929, 0.8743403553962708, 1.0411884784698486, 1.2080366611480713, 1.3748847246170044, 1.5417327880859375, 1.7085809707641602, 1.8754291534423828, 2.0422773361206055, 2.209125280380249, 2.3759734630584717, 2.5428216457366943, 2.709669589996338, 2.8765177726745605, 3.043365955352783, 3.210214138031006, 3.3770623207092285, 3.543910264968872, 3.7107584476470947, 3.8776066303253174, 4.044454574584961, 4.211302757263184, 4.378150939941406, 4.544999122619629, 4.711847305297852, 4.878695487976074, 5.045543670654297, 5.212391376495361, 5.379239559173584, 5.546087741851807, 5.712935924530029]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 11.0, 7.0, 9.0, 26.0, 34.0, 41.0, 59.0, 98.0, 153.0, 262.0, 414.0, 738.0, 1435.0, 2678.0, 5398.0, 11237.0, 24063.0, 52833.0, 112758.0, 211222.0, 264683.0, 185031.0, 93333.0, 43034.0, 19975.0, 9438.0, 4558.0, 2245.0, 1165.0, 635.0, 347.0, 236.0, 120.0, 93.0, 59.0, 45.0, 21.0, 11.0, 16.0, 10.0, 10.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.55859375, -5.35552978515625, -5.1524658203125, -4.94940185546875, -4.746337890625, -4.54327392578125, -4.3402099609375, -4.13714599609375, -3.93408203125, -3.73101806640625, -3.5279541015625, -3.32489013671875, -3.121826171875, -2.91876220703125, -2.7156982421875, -2.51263427734375, -2.3095703125, -2.10650634765625, -1.9034423828125, -1.70037841796875, -1.497314453125, -1.29425048828125, -1.0911865234375, -0.88812255859375, -0.68505859375, -0.48199462890625, -0.2789306640625, -0.07586669921875, 0.127197265625, 0.33026123046875, 0.5333251953125, 0.73638916015625, 0.939453125, 1.14251708984375, 1.3455810546875, 1.54864501953125, 1.751708984375, 1.95477294921875, 2.1578369140625, 2.36090087890625, 2.56396484375, 2.76702880859375, 2.9700927734375, 3.17315673828125, 3.376220703125, 3.57928466796875, 3.7823486328125, 3.98541259765625, 4.1884765625, 4.39154052734375, 4.5946044921875, 4.79766845703125, 5.000732421875, 5.20379638671875, 5.4068603515625, 5.60992431640625, 5.81298828125, 6.01605224609375, 6.2191162109375, 6.42218017578125, 6.625244140625, 6.82830810546875, 7.0313720703125, 7.23443603515625, 7.4375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 7.0, 11.0, 9.0, 17.0, 18.0, 26.0, 25.0, 31.0, 18.0, 16.0, 35.0, 31.0, 37.0, 30.0, 46.0, 36.0, 34.0, 36.0, 51.0, 44.0, 39.0, 46.0, 36.0, 41.0, 40.0, 18.0, 24.0, 34.0, 16.0, 17.0, 22.0, 14.0, 17.0, 18.0, 4.0, 4.0, 7.0, 9.0, 6.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.16796875, -4.99029541015625, -4.8126220703125, -4.63494873046875, -4.457275390625, -4.27960205078125, -4.1019287109375, -3.92425537109375, -3.74658203125, -3.56890869140625, -3.3912353515625, -3.21356201171875, -3.035888671875, -2.85821533203125, -2.6805419921875, -2.50286865234375, -2.3251953125, -2.14752197265625, -1.9698486328125, -1.79217529296875, -1.614501953125, -1.43682861328125, -1.2591552734375, -1.08148193359375, -0.90380859375, -0.72613525390625, -0.5484619140625, -0.37078857421875, -0.193115234375, -0.01544189453125, 0.1622314453125, 0.33990478515625, 0.517578125, 0.69525146484375, 0.8729248046875, 1.05059814453125, 1.228271484375, 1.40594482421875, 1.5836181640625, 1.76129150390625, 1.93896484375, 2.11663818359375, 2.2943115234375, 2.47198486328125, 2.649658203125, 2.82733154296875, 3.0050048828125, 3.18267822265625, 3.3603515625, 3.53802490234375, 3.7156982421875, 3.89337158203125, 4.071044921875, 4.24871826171875, 4.4263916015625, 4.60406494140625, 4.78173828125, 4.95941162109375, 5.1370849609375, 5.31475830078125, 5.492431640625, 5.67010498046875, 5.8477783203125, 6.02545166015625, 6.203125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 12.0, 13.0, 14.0, 23.0, 36.0, 44.0, 55.0, 69.0, 94.0, 121.0, 162.0, 234.0, 354.0, 458.0, 843.0, 1207.0, 1883.0, 3030.0, 5213.0, 9305.0, 16645.0, 31907.0, 62399.0, 122016.0, 211682.0, 242193.0, 159300.0, 84444.0, 43070.0, 22223.0, 11963.0, 6869.0, 3791.0, 2382.0, 1495.0, 927.0, 624.0, 431.0, 295.0, 207.0, 124.0, 116.0, 70.0, 40.0, 45.0, 33.0, 25.0, 18.0, 20.0, 11.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.28125, -6.0863037109375, -5.891357421875, -5.6964111328125, -5.50146484375, -5.3065185546875, -5.111572265625, -4.9166259765625, -4.7216796875, -4.5267333984375, -4.331787109375, -4.1368408203125, -3.94189453125, -3.7469482421875, -3.552001953125, -3.3570556640625, -3.162109375, -2.9671630859375, -2.772216796875, -2.5772705078125, -2.38232421875, -2.1873779296875, -1.992431640625, -1.7974853515625, -1.6025390625, -1.4075927734375, -1.212646484375, -1.0177001953125, -0.82275390625, -0.6278076171875, -0.432861328125, -0.2379150390625, -0.04296875, 0.1519775390625, 0.346923828125, 0.5418701171875, 0.73681640625, 0.9317626953125, 1.126708984375, 1.3216552734375, 1.5166015625, 1.7115478515625, 1.906494140625, 2.1014404296875, 2.29638671875, 2.4913330078125, 2.686279296875, 2.8812255859375, 3.076171875, 3.2711181640625, 3.466064453125, 3.6610107421875, 3.85595703125, 4.0509033203125, 4.245849609375, 4.4407958984375, 4.6357421875, 4.8306884765625, 5.025634765625, 5.2205810546875, 5.41552734375, 5.6104736328125, 5.805419921875, 6.0003662109375, 6.1953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 15.0, 3.0, 13.0, 19.0, 16.0, 13.0, 25.0, 25.0, 27.0, 36.0, 24.0, 27.0, 42.0, 45.0, 44.0, 47.0, 31.0, 38.0, 45.0, 28.0, 25.0, 38.0, 48.0, 31.0, 29.0, 38.0, 25.0, 18.0, 27.0, 31.0, 25.0, 18.0, 8.0, 13.0, 10.0, 13.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.26348876953125, -3.1558837890625, -3.04827880859375, -2.940673828125, -2.83306884765625, -2.7254638671875, -2.61785888671875, -2.51025390625, -2.40264892578125, -2.2950439453125, -2.18743896484375, -2.079833984375, -1.97222900390625, -1.8646240234375, -1.75701904296875, -1.6494140625, -1.54180908203125, -1.4342041015625, -1.32659912109375, -1.218994140625, -1.11138916015625, -1.0037841796875, -0.89617919921875, -0.78857421875, -0.68096923828125, -0.5733642578125, -0.46575927734375, -0.358154296875, -0.25054931640625, -0.1429443359375, -0.03533935546875, 0.072265625, 0.17987060546875, 0.2874755859375, 0.39508056640625, 0.502685546875, 0.61029052734375, 0.7178955078125, 0.82550048828125, 0.93310546875, 1.04071044921875, 1.1483154296875, 1.25592041015625, 1.363525390625, 1.47113037109375, 1.5787353515625, 1.68634033203125, 1.7939453125, 1.90155029296875, 2.0091552734375, 2.11676025390625, 2.224365234375, 2.33197021484375, 2.4395751953125, 2.54718017578125, 2.65478515625, 2.76239013671875, 2.8699951171875, 2.97760009765625, 3.085205078125, 3.19281005859375, 3.3004150390625, 3.40802001953125, 3.515625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 3.0, 5.0, 6.0, 19.0, 19.0, 22.0, 27.0, 47.0, 75.0, 103.0, 126.0, 193.0, 315.0, 460.0, 798.0, 1357.0, 2511.0, 4915.0, 10111.0, 23398.0, 58628.0, 162834.0, 364598.0, 257811.0, 94789.0, 35857.0, 14686.0, 6847.0, 3307.0, 1760.0, 1038.0, 634.0, 382.0, 268.0, 180.0, 125.0, 86.0, 60.0, 54.0, 26.0, 21.0, 20.0, 6.0, 4.0, 11.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.96875, -4.82147216796875, -4.6741943359375, -4.52691650390625, -4.379638671875, -4.23236083984375, -4.0850830078125, -3.93780517578125, -3.79052734375, -3.64324951171875, -3.4959716796875, -3.34869384765625, -3.201416015625, -3.05413818359375, -2.9068603515625, -2.75958251953125, -2.6123046875, -2.46502685546875, -2.3177490234375, -2.17047119140625, -2.023193359375, -1.87591552734375, -1.7286376953125, -1.58135986328125, -1.43408203125, -1.28680419921875, -1.1395263671875, -0.99224853515625, -0.844970703125, -0.69769287109375, -0.5504150390625, -0.40313720703125, -0.255859375, -0.10858154296875, 0.0386962890625, 0.18597412109375, 0.333251953125, 0.48052978515625, 0.6278076171875, 0.77508544921875, 0.92236328125, 1.06964111328125, 1.2169189453125, 1.36419677734375, 1.511474609375, 1.65875244140625, 1.8060302734375, 1.95330810546875, 2.1005859375, 2.24786376953125, 2.3951416015625, 2.54241943359375, 2.689697265625, 2.83697509765625, 2.9842529296875, 3.13153076171875, 3.27880859375, 3.42608642578125, 3.5733642578125, 3.72064208984375, 3.867919921875, 4.01519775390625, 4.1624755859375, 4.30975341796875, 4.45703125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 11.0, 19.0, 15.0, 15.0, 31.0, 39.0, 55.0, 59.0, 77.0, 77.0, 77.0, 96.0, 73.0, 61.0, 43.0, 59.0, 54.0, 25.0, 22.0, 16.0, 19.0, 11.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020837783813476562, -0.00020242482423782349, -0.00019647181034088135, -0.0001905187964439392, -0.00018456578254699707, -0.00017861276865005493, -0.0001726597547531128, -0.00016670674085617065, -0.00016075372695922852, -0.00015480071306228638, -0.00014884769916534424, -0.0001428946852684021, -0.00013694167137145996, -0.00013098865747451782, -0.00012503564357757568, -0.00011908262968063354, -0.0001131296157836914, -0.00010717660188674927, -0.00010122358798980713, -9.527057409286499e-05, -8.931756019592285e-05, -8.336454629898071e-05, -7.741153240203857e-05, -7.145851850509644e-05, -6.55055046081543e-05, -5.955249071121216e-05, -5.359947681427002e-05, -4.764646291732788e-05, -4.169344902038574e-05, -3.5740435123443604e-05, -2.9787421226501465e-05, -2.3834407329559326e-05, -1.7881393432617188e-05, -1.1928379535675049e-05, -5.97536563873291e-06, -2.2351741790771484e-08, 5.930662155151367e-06, 1.1883676052093506e-05, 1.7836689949035645e-05, 2.3789703845977783e-05, 2.9742717742919922e-05, 3.569573163986206e-05, 4.16487455368042e-05, 4.760175943374634e-05, 5.3554773330688477e-05, 5.9507787227630615e-05, 6.546080112457275e-05, 7.141381502151489e-05, 7.736682891845703e-05, 8.331984281539917e-05, 8.927285671234131e-05, 9.522587060928345e-05, 0.00010117888450622559, 0.00010713189840316772, 0.00011308491230010986, 0.000119037926197052, 0.00012499094009399414, 0.00013094395399093628, 0.00013689696788787842, 0.00014284998178482056, 0.0001488029956817627, 0.00015475600957870483, 0.00016070902347564697, 0.0001666620373725891, 0.00017261505126953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 12.0, 16.0, 34.0, 31.0, 52.0, 93.0, 128.0, 191.0, 314.0, 636.0, 983.0, 1890.0, 3654.0, 7222.0, 15090.0, 32484.0, 71996.0, 153791.0, 257673.0, 245041.0, 138046.0, 63374.0, 28703.0, 13218.0, 6491.0, 3347.0, 1707.0, 959.0, 520.0, 298.0, 202.0, 126.0, 61.0, 54.0, 33.0, 23.0, 22.0, 13.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1640625, -3.061737060546875, -2.95941162109375, -2.857086181640625, -2.7547607421875, -2.652435302734375, -2.55010986328125, -2.447784423828125, -2.345458984375, -2.243133544921875, -2.14080810546875, -2.038482666015625, -1.9361572265625, -1.833831787109375, -1.73150634765625, -1.629180908203125, -1.52685546875, -1.424530029296875, -1.32220458984375, -1.219879150390625, -1.1175537109375, -1.015228271484375, -0.91290283203125, -0.810577392578125, -0.708251953125, -0.605926513671875, -0.50360107421875, -0.401275634765625, -0.2989501953125, -0.196624755859375, -0.09429931640625, 0.008026123046875, 0.1103515625, 0.212677001953125, 0.31500244140625, 0.417327880859375, 0.5196533203125, 0.621978759765625, 0.72430419921875, 0.826629638671875, 0.928955078125, 1.031280517578125, 1.13360595703125, 1.235931396484375, 1.3382568359375, 1.440582275390625, 1.54290771484375, 1.645233154296875, 1.74755859375, 1.849884033203125, 1.95220947265625, 2.054534912109375, 2.1568603515625, 2.259185791015625, 2.36151123046875, 2.463836669921875, 2.566162109375, 2.668487548828125, 2.77081298828125, 2.873138427734375, 2.9754638671875, 3.077789306640625, 3.18011474609375, 3.282440185546875, 3.384765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 6.0, 5.0, 4.0, 16.0, 17.0, 24.0, 25.0, 28.0, 36.0, 43.0, 75.0, 61.0, 64.0, 75.0, 71.0, 73.0, 65.0, 59.0, 43.0, 41.0, 39.0, 20.0, 23.0, 14.0, 17.0, 11.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90283203125, -0.8705215454101562, -0.8382110595703125, -0.8059005737304688, -0.773590087890625, -0.7412796020507812, -0.7089691162109375, -0.6766586303710938, -0.64434814453125, -0.6120376586914062, -0.5797271728515625, -0.5474166870117188, -0.515106201171875, -0.48279571533203125, -0.4504852294921875, -0.41817474365234375, -0.3858642578125, -0.35355377197265625, -0.3212432861328125, -0.28893280029296875, -0.256622314453125, -0.22431182861328125, -0.1920013427734375, -0.15969085693359375, -0.12738037109375, -0.09506988525390625, -0.0627593994140625, -0.03044891357421875, 0.001861572265625, 0.03417205810546875, 0.0664825439453125, 0.09879302978515625, 0.131103515625, 0.16341400146484375, 0.1957244873046875, 0.22803497314453125, 0.260345458984375, 0.29265594482421875, 0.3249664306640625, 0.35727691650390625, 0.38958740234375, 0.42189788818359375, 0.4542083740234375, 0.48651885986328125, 0.518829345703125, 0.5511398315429688, 0.5834503173828125, 0.6157608032226562, 0.6480712890625, 0.6803817749023438, 0.7126922607421875, 0.7450027465820312, 0.777313232421875, 0.8096237182617188, 0.8419342041015625, 0.8742446899414062, 0.90655517578125, 0.9388656616210938, 0.9711761474609375, 1.0034866333007812, 1.035797119140625, 1.0681076049804688, 1.1004180908203125, 1.1327285766601562, 1.1650390625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 8.0, 19.0, 25.0, 27.0, 55.0, 59.0, 74.0, 82.0, 103.0, 101.0, 80.0, 68.0, 69.0, 52.0, 40.0, 28.0, 22.0, 14.0, 12.0, 15.0, 6.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.238876342773438, -9.889521598815918, -9.540165901184082, -9.190811157226562, -8.841455459594727, -8.492100715637207, -8.142745971679688, -7.79339075088501, -7.444035530090332, -7.094680309295654, -6.745325088500977, -6.395970344543457, -6.046615123748779, -5.697259902954102, -5.347905158996582, -4.998549938201904, -4.649194717407227, -4.299839496612549, -3.95048451423645, -3.6011295318603516, -3.251774311065674, -2.902419090270996, -2.5530641078948975, -2.203709125518799, -1.854353904724121, -1.504998803138733, -1.1556437015533447, -0.8062885999679565, -0.45693349838256836, -0.10757839679718018, 0.241776704788208, 0.5911316871643066, 0.940485954284668, 1.2898410558700562, 1.6391961574554443, 1.9885512590408325, 2.3379063606262207, 2.6872615814208984, 3.036616563796997, 3.3859715461730957, 3.7353267669677734, 4.084681987762451, 4.434037208557129, 4.783391952514648, 5.132747173309326, 5.482102394104004, 5.831457138061523, 6.180812358856201, 6.530167579650879, 6.879522800445557, 7.228878021240234, 7.578232765197754, 7.927587985992432, 8.27694320678711, 8.626297950744629, 8.975652694702148, 9.325008392333984, 9.674363136291504, 10.02371883392334, 10.37307357788086, 10.722429275512695, 11.071784019470215, 11.421138763427734, 11.77049446105957, 12.11984920501709]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 9.0, 1.0, 14.0, 10.0, 10.0, 16.0, 6.0, 18.0, 22.0, 21.0, 21.0, 30.0, 27.0, 33.0, 30.0, 32.0, 29.0, 41.0, 41.0, 46.0, 36.0, 39.0, 52.0, 32.0, 40.0, 39.0, 37.0, 41.0, 19.0, 27.0, 21.0, 26.0, 14.0, 28.0, 13.0, 16.0, 17.0, 13.0, 14.0, 3.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.970677852630615, -4.806047439575195, -4.641416549682617, -4.476786136627197, -4.312155723571777, -4.147525310516357, -3.9828946590423584, -3.8182640075683594, -3.6536335945129395, -3.4890031814575195, -3.3243725299835205, -3.1597418785095215, -2.9951114654541016, -2.8304810523986816, -2.6658504009246826, -2.5012197494506836, -2.3365893363952637, -2.1719589233398438, -2.0073282718658447, -1.8426977396011353, -1.6780672073364258, -1.5134366750717163, -1.3488061428070068, -1.1841756105422974, -1.019545078277588, -0.8549145460128784, -0.690284013748169, -0.5256534814834595, -0.36102294921875, -0.19639241695404053, -0.031761884689331055, 0.13286864757537842, 0.2974987030029297, 0.46212923526763916, 0.6267597675323486, 0.7913902997970581, 0.9560208320617676, 1.120651364326477, 1.2852818965911865, 1.449912428855896, 1.6145429611206055, 1.779173493385315, 1.9438040256500244, 2.1084346771240234, 2.2730650901794434, 2.4376955032348633, 2.6023261547088623, 2.7669568061828613, 2.9315872192382812, 3.096217632293701, 3.2608482837677, 3.425478935241699, 3.590109348297119, 3.754739761352539, 3.919370412826538, 4.084001064300537, 4.248631477355957, 4.413261890411377, 4.577892303466797, 4.742523193359375, 4.907153606414795, 5.071784019470215, 5.236414909362793, 5.401045322418213, 5.565675735473633]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 8.0, 9.0, 7.0, 12.0, 18.0, 34.0, 48.0, 68.0, 109.0, 188.0, 295.0, 437.0, 647.0, 1048.0, 1814.0, 2768.0, 4438.0, 7205.0, 11768.0, 18826.0, 30167.0, 48267.0, 73299.0, 104791.0, 135463.0, 149044.0, 137799.0, 108862.0, 76713.0, 50375.0, 32094.0, 19609.0, 12357.0, 7420.0, 4696.0, 2900.0, 1757.0, 1125.0, 730.0, 481.0, 317.0, 190.0, 114.0, 80.0, 65.0, 30.0, 20.0, 15.0, 15.0, 11.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0], "bins": [-4.68359375, -4.54400634765625, -4.4044189453125, -4.26483154296875, -4.125244140625, -3.98565673828125, -3.8460693359375, -3.70648193359375, -3.56689453125, -3.42730712890625, -3.2877197265625, -3.14813232421875, -3.008544921875, -2.86895751953125, -2.7293701171875, -2.58978271484375, -2.4501953125, -2.31060791015625, -2.1710205078125, -2.03143310546875, -1.891845703125, -1.75225830078125, -1.6126708984375, -1.47308349609375, -1.33349609375, -1.19390869140625, -1.0543212890625, -0.91473388671875, -0.775146484375, -0.63555908203125, -0.4959716796875, -0.35638427734375, -0.216796875, -0.07720947265625, 0.0623779296875, 0.20196533203125, 0.341552734375, 0.48114013671875, 0.6207275390625, 0.76031494140625, 0.89990234375, 1.03948974609375, 1.1790771484375, 1.31866455078125, 1.458251953125, 1.59783935546875, 1.7374267578125, 1.87701416015625, 2.0166015625, 2.15618896484375, 2.2957763671875, 2.43536376953125, 2.574951171875, 2.71453857421875, 2.8541259765625, 2.99371337890625, 3.13330078125, 3.27288818359375, 3.4124755859375, 3.55206298828125, 3.691650390625, 3.83123779296875, 3.9708251953125, 4.11041259765625, 4.25]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 10.0, 8.0, 14.0, 12.0, 8.0, 15.0, 18.0, 18.0, 15.0, 16.0, 24.0, 27.0, 30.0, 31.0, 42.0, 29.0, 35.0, 34.0, 39.0, 34.0, 39.0, 40.0, 44.0, 41.0, 37.0, 28.0, 35.0, 44.0, 26.0, 29.0, 25.0, 18.0, 14.0, 18.0, 22.0, 11.0, 11.0, 6.0, 12.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.5465087890625, -4.382080078125, -4.2176513671875, -4.05322265625, -3.8887939453125, -3.724365234375, -3.5599365234375, -3.3955078125, -3.2310791015625, -3.066650390625, -2.9022216796875, -2.73779296875, -2.5733642578125, -2.408935546875, -2.2445068359375, -2.080078125, -1.9156494140625, -1.751220703125, -1.5867919921875, -1.42236328125, -1.2579345703125, -1.093505859375, -0.9290771484375, -0.7646484375, -0.6002197265625, -0.435791015625, -0.2713623046875, -0.10693359375, 0.0574951171875, 0.221923828125, 0.3863525390625, 0.55078125, 0.7152099609375, 0.879638671875, 1.0440673828125, 1.20849609375, 1.3729248046875, 1.537353515625, 1.7017822265625, 1.8662109375, 2.0306396484375, 2.195068359375, 2.3594970703125, 2.52392578125, 2.6883544921875, 2.852783203125, 3.0172119140625, 3.181640625, 3.3460693359375, 3.510498046875, 3.6749267578125, 3.83935546875, 4.0037841796875, 4.168212890625, 4.3326416015625, 4.4970703125, 4.6614990234375, 4.825927734375, 4.9903564453125, 5.15478515625, 5.3192138671875, 5.483642578125, 5.6480712890625, 5.8125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 12.0, 16.0, 20.0, 25.0, 33.0, 61.0, 90.0, 118.0, 194.0, 311.0, 428.0, 717.0, 1018.0, 1530.0, 2403.0, 3618.0, 5698.0, 9040.0, 13638.0, 21098.0, 32312.0, 48700.0, 69294.0, 96327.0, 121142.0, 135058.0, 129288.0, 107641.0, 81225.0, 56809.0, 38351.0, 25101.0, 16599.0, 10889.0, 6875.0, 4434.0, 2856.0, 1977.0, 1238.0, 844.0, 484.0, 332.0, 220.0, 177.0, 90.0, 64.0, 52.0, 33.0, 28.0, 12.0, 12.0, 8.0, 7.0, 2.0, 3.0], "bins": [-4.2578125, -4.135162353515625, -4.01251220703125, -3.889862060546875, -3.7672119140625, -3.644561767578125, -3.52191162109375, -3.399261474609375, -3.276611328125, -3.153961181640625, -3.03131103515625, -2.908660888671875, -2.7860107421875, -2.663360595703125, -2.54071044921875, -2.418060302734375, -2.29541015625, -2.172760009765625, -2.05010986328125, -1.927459716796875, -1.8048095703125, -1.682159423828125, -1.55950927734375, -1.436859130859375, -1.314208984375, -1.191558837890625, -1.06890869140625, -0.946258544921875, -0.8236083984375, -0.700958251953125, -0.57830810546875, -0.455657958984375, -0.3330078125, -0.210357666015625, -0.08770751953125, 0.034942626953125, 0.1575927734375, 0.280242919921875, 0.40289306640625, 0.525543212890625, 0.648193359375, 0.770843505859375, 0.89349365234375, 1.016143798828125, 1.1387939453125, 1.261444091796875, 1.38409423828125, 1.506744384765625, 1.62939453125, 1.752044677734375, 1.87469482421875, 1.997344970703125, 2.1199951171875, 2.242645263671875, 2.36529541015625, 2.487945556640625, 2.610595703125, 2.733245849609375, 2.85589599609375, 2.978546142578125, 3.1011962890625, 3.223846435546875, 3.34649658203125, 3.469146728515625, 3.591796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 8.0, 7.0, 6.0, 13.0, 7.0, 15.0, 19.0, 18.0, 14.0, 15.0, 27.0, 21.0, 27.0, 31.0, 29.0, 41.0, 50.0, 43.0, 47.0, 32.0, 41.0, 44.0, 37.0, 37.0, 38.0, 33.0, 26.0, 32.0, 27.0, 36.0, 23.0, 28.0, 21.0, 21.0, 15.0, 20.0, 8.0, 20.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.025390625, -2.91668701171875, -2.8079833984375, -2.69927978515625, -2.590576171875, -2.48187255859375, -2.3731689453125, -2.26446533203125, -2.15576171875, -2.04705810546875, -1.9383544921875, -1.82965087890625, -1.720947265625, -1.61224365234375, -1.5035400390625, -1.39483642578125, -1.2861328125, -1.17742919921875, -1.0687255859375, -0.96002197265625, -0.851318359375, -0.74261474609375, -0.6339111328125, -0.52520751953125, -0.41650390625, -0.30780029296875, -0.1990966796875, -0.09039306640625, 0.018310546875, 0.12701416015625, 0.2357177734375, 0.34442138671875, 0.453125, 0.56182861328125, 0.6705322265625, 0.77923583984375, 0.887939453125, 0.99664306640625, 1.1053466796875, 1.21405029296875, 1.32275390625, 1.43145751953125, 1.5401611328125, 1.64886474609375, 1.757568359375, 1.86627197265625, 1.9749755859375, 2.08367919921875, 2.1923828125, 2.30108642578125, 2.4097900390625, 2.51849365234375, 2.627197265625, 2.73590087890625, 2.8446044921875, 2.95330810546875, 3.06201171875, 3.17071533203125, 3.2794189453125, 3.38812255859375, 3.496826171875, 3.60552978515625, 3.7142333984375, 3.82293701171875, 3.931640625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 12.0, 18.0, 20.0, 31.0, 63.0, 87.0, 130.0, 225.0, 348.0, 645.0, 1042.0, 1767.0, 3056.0, 5428.0, 9644.0, 18146.0, 33171.0, 62210.0, 109828.0, 172745.0, 207121.0, 173834.0, 111156.0, 62676.0, 34025.0, 18245.0, 9861.0, 5452.0, 3168.0, 1765.0, 1027.0, 630.0, 350.0, 230.0, 123.0, 92.0, 64.0, 35.0, 28.0, 14.0, 10.0, 11.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.87109375, -2.7738037109375, -2.676513671875, -2.5792236328125, -2.48193359375, -2.3846435546875, -2.287353515625, -2.1900634765625, -2.0927734375, -1.9954833984375, -1.898193359375, -1.8009033203125, -1.70361328125, -1.6063232421875, -1.509033203125, -1.4117431640625, -1.314453125, -1.2171630859375, -1.119873046875, -1.0225830078125, -0.92529296875, -0.8280029296875, -0.730712890625, -0.6334228515625, -0.5361328125, -0.4388427734375, -0.341552734375, -0.2442626953125, -0.14697265625, -0.0496826171875, 0.047607421875, 0.1448974609375, 0.2421875, 0.3394775390625, 0.436767578125, 0.5340576171875, 0.63134765625, 0.7286376953125, 0.825927734375, 0.9232177734375, 1.0205078125, 1.1177978515625, 1.215087890625, 1.3123779296875, 1.40966796875, 1.5069580078125, 1.604248046875, 1.7015380859375, 1.798828125, 1.8961181640625, 1.993408203125, 2.0906982421875, 2.18798828125, 2.2852783203125, 2.382568359375, 2.4798583984375, 2.5771484375, 2.6744384765625, 2.771728515625, 2.8690185546875, 2.96630859375, 3.0635986328125, 3.160888671875, 3.2581787109375, 3.35546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 5.0, 10.0, 9.0, 5.0, 8.0, 16.0, 16.0, 20.0, 32.0, 32.0, 28.0, 44.0, 56.0, 53.0, 54.0, 57.0, 65.0, 64.0, 59.0, 62.0, 39.0, 43.0, 36.0, 31.0, 39.0, 26.0, 15.0, 13.0, 8.0, 17.0, 7.0, 7.0, 7.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024306774139404297, -0.000235067680478096, -0.00022706761956214905, -0.0002190675586462021, -0.00021106749773025513, -0.00020306743681430817, -0.0001950673758983612, -0.00018706731498241425, -0.00017906725406646729, -0.00017106719315052032, -0.00016306713223457336, -0.0001550670713186264, -0.00014706701040267944, -0.00013906694948673248, -0.00013106688857078552, -0.00012306682765483856, -0.0001150667667388916, -0.00010706670582294464, -9.906664490699768e-05, -9.106658399105072e-05, -8.306652307510376e-05, -7.50664621591568e-05, -6.706640124320984e-05, -5.906634032726288e-05, -5.106627941131592e-05, -4.306621849536896e-05, -3.5066157579422e-05, -2.7066096663475037e-05, -1.9066035747528076e-05, -1.1065974831581116e-05, -3.0659139156341553e-06, 4.934147000312805e-06, 1.2934207916259766e-05, 2.0934268832206726e-05, 2.8934329748153687e-05, 3.693439066410065e-05, 4.493445158004761e-05, 5.293451249599457e-05, 6.093457341194153e-05, 6.893463432788849e-05, 7.693469524383545e-05, 8.493475615978241e-05, 9.293481707572937e-05, 0.00010093487799167633, 0.00010893493890762329, 0.00011693499982357025, 0.0001249350607395172, 0.00013293512165546417, 0.00014093518257141113, 0.0001489352434873581, 0.00015693530440330505, 0.00016493536531925201, 0.00017293542623519897, 0.00018093548715114594, 0.0001889355480670929, 0.00019693560898303986, 0.00020493566989898682, 0.00021293573081493378, 0.00022093579173088074, 0.0002289358526468277, 0.00023693591356277466, 0.0002449359744787216, 0.0002529360353946686, 0.00026093609631061554, 0.0002689361572265625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 13.0, 18.0, 39.0, 42.0, 45.0, 78.0, 107.0, 180.0, 279.0, 429.0, 653.0, 1026.0, 1625.0, 2516.0, 3996.0, 6781.0, 10837.0, 17945.0, 30323.0, 50293.0, 80770.0, 122299.0, 160389.0, 168370.0, 139118.0, 95818.0, 61077.0, 37114.0, 22011.0, 12996.0, 7903.0, 4918.0, 2993.0, 1980.0, 1230.0, 767.0, 517.0, 368.0, 227.0, 163.0, 116.0, 64.0, 41.0, 30.0, 22.0, 22.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.603515625, -2.52508544921875, -2.4466552734375, -2.36822509765625, -2.289794921875, -2.21136474609375, -2.1329345703125, -2.05450439453125, -1.97607421875, -1.89764404296875, -1.8192138671875, -1.74078369140625, -1.662353515625, -1.58392333984375, -1.5054931640625, -1.42706298828125, -1.3486328125, -1.27020263671875, -1.1917724609375, -1.11334228515625, -1.034912109375, -0.95648193359375, -0.8780517578125, -0.79962158203125, -0.72119140625, -0.64276123046875, -0.5643310546875, -0.48590087890625, -0.407470703125, -0.32904052734375, -0.2506103515625, -0.17218017578125, -0.09375, -0.01531982421875, 0.0631103515625, 0.14154052734375, 0.219970703125, 0.29840087890625, 0.3768310546875, 0.45526123046875, 0.53369140625, 0.61212158203125, 0.6905517578125, 0.76898193359375, 0.847412109375, 0.92584228515625, 1.0042724609375, 1.08270263671875, 1.1611328125, 1.23956298828125, 1.3179931640625, 1.39642333984375, 1.474853515625, 1.55328369140625, 1.6317138671875, 1.71014404296875, 1.78857421875, 1.86700439453125, 1.9454345703125, 2.02386474609375, 2.102294921875, 2.18072509765625, 2.2591552734375, 2.33758544921875, 2.416015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 18.0, 11.0, 12.0, 18.0, 22.0, 36.0, 29.0, 28.0, 30.0, 43.0, 40.0, 44.0, 51.0, 48.0, 60.0, 54.0, 53.0, 50.0, 55.0, 39.0, 35.0, 42.0, 31.0, 22.0, 24.0, 21.0, 22.0, 6.0, 12.0, 12.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.04296875, -1.0161056518554688, -0.9892425537109375, -0.9623794555664062, -0.935516357421875, -0.9086532592773438, -0.8817901611328125, -0.8549270629882812, -0.82806396484375, -0.8012008666992188, -0.7743377685546875, -0.7474746704101562, -0.720611572265625, -0.6937484741210938, -0.6668853759765625, -0.6400222778320312, -0.6131591796875, -0.5862960815429688, -0.5594329833984375, -0.5325698852539062, -0.505706787109375, -0.47884368896484375, -0.4519805908203125, -0.42511749267578125, -0.39825439453125, -0.37139129638671875, -0.3445281982421875, -0.31766510009765625, -0.290802001953125, -0.26393890380859375, -0.2370758056640625, -0.21021270751953125, -0.183349609375, -0.15648651123046875, -0.1296234130859375, -0.10276031494140625, -0.075897216796875, -0.04903411865234375, -0.0221710205078125, 0.00469207763671875, 0.03155517578125, 0.05841827392578125, 0.0852813720703125, 0.11214447021484375, 0.139007568359375, 0.16587066650390625, 0.1927337646484375, 0.21959686279296875, 0.2464599609375, 0.27332305908203125, 0.3001861572265625, 0.32704925537109375, 0.353912353515625, 0.38077545166015625, 0.4076385498046875, 0.43450164794921875, 0.46136474609375, 0.48822784423828125, 0.5150909423828125, 0.5419540405273438, 0.568817138671875, 0.5956802368164062, 0.6225433349609375, 0.6494064331054688, 0.67626953125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 12.0, 15.0, 23.0, 38.0, 47.0, 53.0, 61.0, 87.0, 92.0, 86.0, 84.0, 89.0, 64.0, 51.0, 44.0, 28.0, 27.0, 20.0, 8.0, 17.0, 8.0, 6.0, 7.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.054876327514648, -8.726757049560547, -8.398637771606445, -8.070518493652344, -7.742399215698242, -7.414279937744141, -7.086161136627197, -6.758041858673096, -6.429922580718994, -6.101803302764893, -5.773684024810791, -5.4455647468566895, -5.117445945739746, -4.7893266677856445, -4.461207389831543, -4.133088111877441, -3.80496883392334, -3.4768495559692383, -3.1487302780151367, -2.8206112384796143, -2.4924919605255127, -2.164372682571411, -1.8362535238265991, -1.508134365081787, -1.1800150871276855, -0.8518958687782288, -0.523776650428772, -0.19565743207931519, 0.1324617862701416, 0.46058106422424316, 0.7887002229690552, 1.1168193817138672, 1.4449377059936523, 1.773056983947754, 2.1011762619018555, 2.429295301437378, 2.7574145793914795, 3.085533857345581, 3.4136528968811035, 3.741772174835205, 4.069891452789307, 4.398010730743408, 4.72613000869751, 5.054249286651611, 5.382368087768555, 5.710487365722656, 6.038606643676758, 6.366725921630859, 6.694845199584961, 7.0229644775390625, 7.351083755493164, 7.679203033447266, 8.007322311401367, 8.335441589355469, 8.66356086730957, 8.991680145263672, 9.319799423217773, 9.647918701171875, 9.976037979125977, 10.304157257080078, 10.63227653503418, 10.960395812988281, 11.288515090942383, 11.616634368896484, 11.94475269317627]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 4.0, 8.0, 4.0, 8.0, 8.0, 15.0, 15.0, 14.0, 21.0, 18.0, 17.0, 28.0, 28.0, 21.0, 27.0, 39.0, 42.0, 38.0, 30.0, 46.0, 37.0, 31.0, 43.0, 37.0, 37.0, 39.0, 25.0, 39.0, 30.0, 24.0, 37.0, 26.0, 16.0, 25.0, 14.0, 25.0, 8.0, 8.0, 9.0, 9.0, 8.0, 13.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.073388576507568, -4.918100357055664, -4.762812614440918, -4.607524871826172, -4.452236652374268, -4.296948432922363, -4.141660690307617, -3.986372709274292, -3.831084728240967, -3.6757967472076416, -3.5205087661743164, -3.365220785140991, -3.209932804107666, -3.054644823074341, -2.8993568420410156, -2.7440688610076904, -2.5887808799743652, -2.43349289894104, -2.278204917907715, -2.1229169368743896, -1.9676289558410645, -1.8123409748077393, -1.657052993774414, -1.5017650127410889, -1.3464770317077637, -1.1911890506744385, -1.0359010696411133, -0.8806130886077881, -0.7253251075744629, -0.5700371265411377, -0.4147491455078125, -0.2594611644744873, -0.10417366027832031, 0.05111432075500488, 0.20640230178833008, 0.3616902828216553, 0.5169782638549805, 0.6722662448883057, 0.8275542259216309, 0.982842206954956, 1.1381301879882812, 1.2934181690216064, 1.4487061500549316, 1.6039941310882568, 1.759282112121582, 1.9145700931549072, 2.0698580741882324, 2.2251460552215576, 2.380434036254883, 2.535722017288208, 2.691009998321533, 2.8462979793548584, 3.0015859603881836, 3.156873941421509, 3.312161922454834, 3.467449903488159, 3.6227378845214844, 3.7780258655548096, 3.9333138465881348, 4.088602066040039, 4.243889808654785, 4.399177551269531, 4.5544657707214355, 4.70975399017334, 4.865041732788086]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 18.0, 17.0, 15.0, 35.0, 47.0, 76.0, 133.0, 183.0, 274.0, 426.0, 763.0, 1244.0, 1984.0, 3281.0, 5769.0, 10413.0, 20228.0, 40328.0, 88191.0, 224046.0, 611448.0, 1261866.0, 1115483.0, 483081.0, 179061.0, 73297.0, 33661.0, 17078.0, 9191.0, 5100.0, 2895.0, 1732.0, 1074.0, 632.0, 425.0, 229.0, 173.0, 137.0, 70.0, 38.0, 41.0, 32.0, 15.0, 17.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.34375, -8.10455322265625, -7.8653564453125, -7.62615966796875, -7.386962890625, -7.14776611328125, -6.9085693359375, -6.66937255859375, -6.43017578125, -6.19097900390625, -5.9517822265625, -5.71258544921875, -5.473388671875, -5.23419189453125, -4.9949951171875, -4.75579833984375, -4.5166015625, -4.27740478515625, -4.0382080078125, -3.79901123046875, -3.559814453125, -3.32061767578125, -3.0814208984375, -2.84222412109375, -2.60302734375, -2.36383056640625, -2.1246337890625, -1.88543701171875, -1.646240234375, -1.40704345703125, -1.1678466796875, -0.92864990234375, -0.689453125, -0.45025634765625, -0.2110595703125, 0.02813720703125, 0.267333984375, 0.50653076171875, 0.7457275390625, 0.98492431640625, 1.22412109375, 1.46331787109375, 1.7025146484375, 1.94171142578125, 2.180908203125, 2.42010498046875, 2.6593017578125, 2.89849853515625, 3.1376953125, 3.37689208984375, 3.6160888671875, 3.85528564453125, 4.094482421875, 4.33367919921875, 4.5728759765625, 4.81207275390625, 5.05126953125, 5.29046630859375, 5.5296630859375, 5.76885986328125, 6.008056640625, 6.24725341796875, 6.4864501953125, 6.72564697265625, 6.96484375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 10.0, 8.0, 12.0, 12.0, 9.0, 19.0, 30.0, 19.0, 35.0, 23.0, 27.0, 24.0, 26.0, 32.0, 33.0, 42.0, 49.0, 52.0, 41.0, 36.0, 45.0, 35.0, 44.0, 36.0, 36.0, 33.0, 27.0, 35.0, 22.0, 15.0, 19.0, 10.0, 13.0, 16.0, 7.0, 10.0, 6.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6796875, -3.56591796875, -3.4521484375, -3.33837890625, -3.224609375, -3.11083984375, -2.9970703125, -2.88330078125, -2.76953125, -2.65576171875, -2.5419921875, -2.42822265625, -2.314453125, -2.20068359375, -2.0869140625, -1.97314453125, -1.859375, -1.74560546875, -1.6318359375, -1.51806640625, -1.404296875, -1.29052734375, -1.1767578125, -1.06298828125, -0.94921875, -0.83544921875, -0.7216796875, -0.60791015625, -0.494140625, -0.38037109375, -0.2666015625, -0.15283203125, -0.0390625, 0.07470703125, 0.1884765625, 0.30224609375, 0.416015625, 0.52978515625, 0.6435546875, 0.75732421875, 0.87109375, 0.98486328125, 1.0986328125, 1.21240234375, 1.326171875, 1.43994140625, 1.5537109375, 1.66748046875, 1.78125, 1.89501953125, 2.0087890625, 2.12255859375, 2.236328125, 2.35009765625, 2.4638671875, 2.57763671875, 2.69140625, 2.80517578125, 2.9189453125, 3.03271484375, 3.146484375, 3.26025390625, 3.3740234375, 3.48779296875, 3.6015625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 7.0, 12.0, 17.0, 27.0, 45.0, 74.0, 85.0, 130.0, 215.0, 302.0, 454.0, 682.0, 1054.0, 1643.0, 2574.0, 4124.0, 6613.0, 11132.0, 19174.0, 34521.0, 64041.0, 126148.0, 262576.0, 570948.0, 1070342.0, 1011462.0, 516261.0, 237239.0, 115471.0, 59349.0, 32247.0, 17779.0, 10432.0, 6315.0, 3863.0, 2429.0, 1519.0, 940.0, 723.0, 413.0, 286.0, 188.0, 135.0, 93.0, 71.0, 42.0, 31.0, 17.0, 12.0, 10.0, 8.0, 6.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.21875, -6.99957275390625, -6.7803955078125, -6.56121826171875, -6.342041015625, -6.12286376953125, -5.9036865234375, -5.68450927734375, -5.46533203125, -5.24615478515625, -5.0269775390625, -4.80780029296875, -4.588623046875, -4.36944580078125, -4.1502685546875, -3.93109130859375, -3.7119140625, -3.49273681640625, -3.2735595703125, -3.05438232421875, -2.835205078125, -2.61602783203125, -2.3968505859375, -2.17767333984375, -1.95849609375, -1.73931884765625, -1.5201416015625, -1.30096435546875, -1.081787109375, -0.86260986328125, -0.6434326171875, -0.42425537109375, -0.205078125, 0.01409912109375, 0.2332763671875, 0.45245361328125, 0.671630859375, 0.89080810546875, 1.1099853515625, 1.32916259765625, 1.54833984375, 1.76751708984375, 1.9866943359375, 2.20587158203125, 2.425048828125, 2.64422607421875, 2.8634033203125, 3.08258056640625, 3.3017578125, 3.52093505859375, 3.7401123046875, 3.95928955078125, 4.178466796875, 4.39764404296875, 4.6168212890625, 4.83599853515625, 5.05517578125, 5.27435302734375, 5.4935302734375, 5.71270751953125, 5.931884765625, 6.15106201171875, 6.3702392578125, 6.58941650390625, 6.80859375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 3.0, 9.0, 10.0, 10.0, 6.0, 23.0, 25.0, 25.0, 34.0, 47.0, 58.0, 84.0, 102.0, 121.0, 158.0, 203.0, 215.0, 251.0, 276.0, 301.0, 320.0, 308.0, 280.0, 241.0, 194.0, 148.0, 129.0, 109.0, 84.0, 79.0, 42.0, 36.0, 30.0, 28.0, 13.0, 12.0, 9.0, 6.0, 12.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.517578125, -2.4479217529296875, -2.378265380859375, -2.3086090087890625, -2.23895263671875, -2.1692962646484375, -2.099639892578125, -2.0299835205078125, -1.9603271484375, -1.8906707763671875, -1.821014404296875, -1.7513580322265625, -1.68170166015625, -1.6120452880859375, -1.542388916015625, -1.4727325439453125, -1.403076171875, -1.3334197998046875, -1.263763427734375, -1.1941070556640625, -1.12445068359375, -1.0547943115234375, -0.985137939453125, -0.9154815673828125, -0.8458251953125, -0.7761688232421875, -0.706512451171875, -0.6368560791015625, -0.56719970703125, -0.4975433349609375, -0.427886962890625, -0.3582305908203125, -0.28857421875, -0.2189178466796875, -0.149261474609375, -0.0796051025390625, -0.00994873046875, 0.0597076416015625, 0.129364013671875, 0.1990203857421875, 0.2686767578125, 0.3383331298828125, 0.407989501953125, 0.4776458740234375, 0.54730224609375, 0.6169586181640625, 0.686614990234375, 0.7562713623046875, 0.825927734375, 0.8955841064453125, 0.965240478515625, 1.0348968505859375, 1.10455322265625, 1.1742095947265625, 1.243865966796875, 1.3135223388671875, 1.3831787109375, 1.4528350830078125, 1.522491455078125, 1.5921478271484375, 1.66180419921875, 1.7314605712890625, 1.801116943359375, 1.8707733154296875, 1.9404296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 8.0, 14.0, 13.0, 17.0, 29.0, 34.0, 39.0, 54.0, 56.0, 98.0, 117.0, 86.0, 98.0, 79.0, 74.0, 55.0, 25.0, 22.0, 17.0, 15.0, 6.0, 14.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.846148490905762, -8.509147644042969, -8.172146797180176, -7.835146427154541, -7.498146057128906, -7.161145210266113, -6.82414436340332, -6.487143516540527, -6.150143146514893, -5.8131422996521, -5.476141929626465, -5.139141082763672, -4.802140235900879, -4.465139865875244, -4.128139019012451, -3.7911384105682373, -3.4541378021240234, -3.1171371936798096, -2.7801365852355957, -2.4431357383728027, -2.106135129928589, -1.769134521484375, -1.432133674621582, -1.0951330661773682, -0.7581324577331543, -0.42113178968429565, -0.08413112163543701, 0.2528696060180664, 0.5898702144622803, 0.9268708229064941, 1.263871669769287, 1.600872278213501, 1.9378719329833984, 2.2748725414276123, 2.611873149871826, 2.948873996734619, 3.285874605178833, 3.622875213623047, 3.95987606048584, 4.296876907348633, 4.633877277374268, 4.9708781242370605, 5.307878494262695, 5.644879341125488, 5.981880187988281, 6.318880558013916, 6.655881404876709, 6.992881774902344, 7.329882621765137, 7.66688346862793, 8.003884315490723, 8.340885162353516, 8.677885055541992, 9.014885902404785, 9.351886749267578, 9.688887596130371, 10.025888442993164, 10.362889289855957, 10.69989013671875, 11.036890029907227, 11.37389087677002, 11.710891723632812, 12.047892570495605, 12.384893417358398, 12.721893310546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 10.0, 12.0, 11.0, 15.0, 11.0, 12.0, 28.0, 23.0, 21.0, 28.0, 47.0, 38.0, 37.0, 33.0, 51.0, 40.0, 41.0, 54.0, 48.0, 40.0, 43.0, 33.0, 42.0, 41.0, 30.0, 37.0, 19.0, 25.0, 20.0, 16.0, 16.0, 13.0, 13.0, 9.0, 11.0, 8.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0195159912109375, -4.8498053550720215, -4.6800947189331055, -4.510384559631348, -4.340673923492432, -4.170963287353516, -4.0012526512146, -3.8315422534942627, -3.661831855773926, -3.4921212196350098, -3.322410821914673, -3.152700185775757, -2.98298978805542, -2.813279151916504, -2.643568515777588, -2.473858118057251, -2.304147481918335, -2.134436845779419, -1.964726448059082, -1.795015811920166, -1.625305414199829, -1.455594778060913, -1.2858842611312866, -1.1161737442016602, -0.9464632272720337, -0.7767527103424072, -0.6070421934127808, -0.4373316168785095, -0.26762109994888306, -0.09791058301925659, 0.07179999351501465, 0.2415105104446411, 0.4112210273742676, 0.580931544303894, 0.7506420612335205, 0.9203526377677917, 1.0900630950927734, 1.2597737312316895, 1.429484248161316, 1.5991947650909424, 1.7689052820205688, 1.9386157989501953, 2.1083264350891113, 2.2780368328094482, 2.4477474689483643, 2.617457866668701, 2.787168502807617, 2.956879138946533, 3.12658953666687, 3.296300172805786, 3.466010570526123, 3.635721206665039, 3.805431604385376, 3.975142240524292, 4.144852638244629, 4.314563274383545, 4.484273910522461, 4.653984546661377, 4.823695182800293, 4.993405342102051, 5.163115978240967, 5.332826614379883, 5.502537250518799, 5.672247886657715, 5.841958045959473]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 14.0, 16.0, 22.0, 27.0, 64.0, 73.0, 97.0, 158.0, 239.0, 462.0, 680.0, 1105.0, 1933.0, 3325.0, 5924.0, 10689.0, 19111.0, 35316.0, 63349.0, 108570.0, 169819.0, 205485.0, 169383.0, 109258.0, 63428.0, 35616.0, 19432.0, 10651.0, 5989.0, 3302.0, 1986.0, 1143.0, 685.0, 448.0, 280.0, 186.0, 95.0, 57.0, 45.0, 30.0, 19.0, 18.0, 8.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.890625, -4.75286865234375, -4.6151123046875, -4.47735595703125, -4.339599609375, -4.20184326171875, -4.0640869140625, -3.92633056640625, -3.78857421875, -3.65081787109375, -3.5130615234375, -3.37530517578125, -3.237548828125, -3.09979248046875, -2.9620361328125, -2.82427978515625, -2.6865234375, -2.54876708984375, -2.4110107421875, -2.27325439453125, -2.135498046875, -1.99774169921875, -1.8599853515625, -1.72222900390625, -1.58447265625, -1.44671630859375, -1.3089599609375, -1.17120361328125, -1.033447265625, -0.89569091796875, -0.7579345703125, -0.62017822265625, -0.482421875, -0.34466552734375, -0.2069091796875, -0.06915283203125, 0.068603515625, 0.20635986328125, 0.3441162109375, 0.48187255859375, 0.61962890625, 0.75738525390625, 0.8951416015625, 1.03289794921875, 1.170654296875, 1.30841064453125, 1.4461669921875, 1.58392333984375, 1.7216796875, 1.85943603515625, 1.9971923828125, 2.13494873046875, 2.272705078125, 2.41046142578125, 2.5482177734375, 2.68597412109375, 2.82373046875, 2.96148681640625, 3.0992431640625, 3.23699951171875, 3.374755859375, 3.51251220703125, 3.6502685546875, 3.78802490234375, 3.92578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 1.0, 6.0, 11.0, 12.0, 12.0, 11.0, 18.0, 15.0, 25.0, 26.0, 25.0, 32.0, 41.0, 34.0, 38.0, 45.0, 31.0, 44.0, 52.0, 51.0, 57.0, 45.0, 28.0, 38.0, 36.0, 34.0, 41.0, 23.0, 28.0, 30.0, 18.0, 14.0, 13.0, 14.0, 11.0, 10.0, 10.0, 9.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.2816162109375, -5.102294921875, -4.9229736328125, -4.74365234375, -4.5643310546875, -4.385009765625, -4.2056884765625, -4.0263671875, -3.8470458984375, -3.667724609375, -3.4884033203125, -3.30908203125, -3.1297607421875, -2.950439453125, -2.7711181640625, -2.591796875, -2.4124755859375, -2.233154296875, -2.0538330078125, -1.87451171875, -1.6951904296875, -1.515869140625, -1.3365478515625, -1.1572265625, -0.9779052734375, -0.798583984375, -0.6192626953125, -0.43994140625, -0.2606201171875, -0.081298828125, 0.0980224609375, 0.27734375, 0.4566650390625, 0.635986328125, 0.8153076171875, 0.99462890625, 1.1739501953125, 1.353271484375, 1.5325927734375, 1.7119140625, 1.8912353515625, 2.070556640625, 2.2498779296875, 2.42919921875, 2.6085205078125, 2.787841796875, 2.9671630859375, 3.146484375, 3.3258056640625, 3.505126953125, 3.6844482421875, 3.86376953125, 4.0430908203125, 4.222412109375, 4.4017333984375, 4.5810546875, 4.7603759765625, 4.939697265625, 5.1190185546875, 5.29833984375, 5.4776611328125, 5.656982421875, 5.8363037109375, 6.015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 9.0, 24.0, 27.0, 35.0, 56.0, 93.0, 154.0, 281.0, 421.0, 712.0, 1146.0, 1880.0, 3376.0, 6020.0, 11109.0, 21647.0, 42601.0, 84881.0, 161221.0, 248038.0, 214957.0, 121408.0, 61841.0, 31003.0, 16119.0, 8345.0, 4638.0, 2629.0, 1501.0, 859.0, 512.0, 368.0, 225.0, 118.0, 93.0, 67.0, 45.0, 28.0, 19.0, 19.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.5, -5.326904296875, -5.15380859375, -4.980712890625, -4.8076171875, -4.634521484375, -4.46142578125, -4.288330078125, -4.115234375, -3.942138671875, -3.76904296875, -3.595947265625, -3.4228515625, -3.249755859375, -3.07666015625, -2.903564453125, -2.73046875, -2.557373046875, -2.38427734375, -2.211181640625, -2.0380859375, -1.864990234375, -1.69189453125, -1.518798828125, -1.345703125, -1.172607421875, -0.99951171875, -0.826416015625, -0.6533203125, -0.480224609375, -0.30712890625, -0.134033203125, 0.0390625, 0.212158203125, 0.38525390625, 0.558349609375, 0.7314453125, 0.904541015625, 1.07763671875, 1.250732421875, 1.423828125, 1.596923828125, 1.77001953125, 1.943115234375, 2.1162109375, 2.289306640625, 2.46240234375, 2.635498046875, 2.80859375, 2.981689453125, 3.15478515625, 3.327880859375, 3.5009765625, 3.674072265625, 3.84716796875, 4.020263671875, 4.193359375, 4.366455078125, 4.53955078125, 4.712646484375, 4.8857421875, 5.058837890625, 5.23193359375, 5.405029296875, 5.578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 0.0, 8.0, 7.0, 6.0, 11.0, 14.0, 12.0, 11.0, 16.0, 28.0, 23.0, 24.0, 37.0, 34.0, 33.0, 33.0, 27.0, 39.0, 42.0, 42.0, 44.0, 29.0, 31.0, 41.0, 47.0, 37.0, 32.0, 34.0, 40.0, 21.0, 25.0, 25.0, 20.0, 18.0, 12.0, 13.0, 13.0, 10.0, 11.0, 7.0, 8.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.966796875, -2.8758544921875, -2.784912109375, -2.6939697265625, -2.60302734375, -2.5120849609375, -2.421142578125, -2.3302001953125, -2.2392578125, -2.1483154296875, -2.057373046875, -1.9664306640625, -1.87548828125, -1.7845458984375, -1.693603515625, -1.6026611328125, -1.51171875, -1.4207763671875, -1.329833984375, -1.2388916015625, -1.14794921875, -1.0570068359375, -0.966064453125, -0.8751220703125, -0.7841796875, -0.6932373046875, -0.602294921875, -0.5113525390625, -0.42041015625, -0.3294677734375, -0.238525390625, -0.1475830078125, -0.056640625, 0.0343017578125, 0.125244140625, 0.2161865234375, 0.30712890625, 0.3980712890625, 0.489013671875, 0.5799560546875, 0.6708984375, 0.7618408203125, 0.852783203125, 0.9437255859375, 1.03466796875, 1.1256103515625, 1.216552734375, 1.3074951171875, 1.3984375, 1.4893798828125, 1.580322265625, 1.6712646484375, 1.76220703125, 1.8531494140625, 1.944091796875, 2.0350341796875, 2.1259765625, 2.2169189453125, 2.307861328125, 2.3988037109375, 2.48974609375, 2.5806884765625, 2.671630859375, 2.7625732421875, 2.853515625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 11.0, 20.0, 21.0, 44.0, 63.0, 100.0, 167.0, 272.0, 416.0, 635.0, 1092.0, 1824.0, 3151.0, 5566.0, 9747.0, 18545.0, 35798.0, 73760.0, 155091.0, 271516.0, 233064.0, 118409.0, 56859.0, 28297.0, 14770.0, 8114.0, 4528.0, 2622.0, 1528.0, 957.0, 587.0, 341.0, 228.0, 139.0, 91.0, 60.0, 45.0, 33.0, 14.0, 10.0, 11.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.669921875, -2.590972900390625, -2.51202392578125, -2.433074951171875, -2.3541259765625, -2.275177001953125, -2.19622802734375, -2.117279052734375, -2.038330078125, -1.959381103515625, -1.88043212890625, -1.801483154296875, -1.7225341796875, -1.643585205078125, -1.56463623046875, -1.485687255859375, -1.40673828125, -1.327789306640625, -1.24884033203125, -1.169891357421875, -1.0909423828125, -1.011993408203125, -0.93304443359375, -0.854095458984375, -0.775146484375, -0.696197509765625, -0.61724853515625, -0.538299560546875, -0.4593505859375, -0.380401611328125, -0.30145263671875, -0.222503662109375, -0.1435546875, -0.064605712890625, 0.01434326171875, 0.093292236328125, 0.1722412109375, 0.251190185546875, 0.33013916015625, 0.409088134765625, 0.488037109375, 0.566986083984375, 0.64593505859375, 0.724884033203125, 0.8038330078125, 0.882781982421875, 0.96173095703125, 1.040679931640625, 1.11962890625, 1.198577880859375, 1.27752685546875, 1.356475830078125, 1.4354248046875, 1.514373779296875, 1.59332275390625, 1.672271728515625, 1.751220703125, 1.830169677734375, 1.90911865234375, 1.988067626953125, 2.0670166015625, 2.145965576171875, 2.22491455078125, 2.303863525390625, 2.3828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 6.0, 6.0, 14.0, 11.0, 18.0, 28.0, 25.0, 43.0, 52.0, 53.0, 74.0, 85.0, 98.0, 73.0, 72.0, 77.0, 57.0, 36.0, 37.0, 34.0, 21.0, 26.0, 6.0, 7.0, 10.0, 6.0, 4.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011140108108520508, -0.00010639335960149765, -0.00010138563811779022, -9.63779166340828e-05, -9.137019515037537e-05, -8.636247366666794e-05, -8.135475218296051e-05, -7.634703069925308e-05, -7.133930921554565e-05, -6.633158773183823e-05, -6.13238662481308e-05, -5.631614476442337e-05, -5.130842328071594e-05, -4.6300701797008514e-05, -4.1292980313301086e-05, -3.628525882959366e-05, -3.127753734588623e-05, -2.6269815862178802e-05, -2.1262094378471375e-05, -1.6254372894763947e-05, -1.1246651411056519e-05, -6.2389299273490906e-06, -1.2312084436416626e-06, 3.7765130400657654e-06, 8.784234523773193e-06, 1.3791956007480621e-05, 1.879967749118805e-05, 2.3807398974895477e-05, 2.8815120458602905e-05, 3.382284194231033e-05, 3.883056342601776e-05, 4.383828490972519e-05, 4.884600639343262e-05, 5.3853727877140045e-05, 5.886144936084747e-05, 6.38691708445549e-05, 6.887689232826233e-05, 7.388461381196976e-05, 7.889233529567719e-05, 8.390005677938461e-05, 8.890777826309204e-05, 9.391549974679947e-05, 9.89232212305069e-05, 0.00010393094271421432, 0.00010893866419792175, 0.00011394638568162918, 0.00011895410716533661, 0.00012396182864904404, 0.00012896955013275146, 0.0001339772716164589, 0.00013898499310016632, 0.00014399271458387375, 0.00014900043606758118, 0.0001540081575512886, 0.00015901587903499603, 0.00016402360051870346, 0.0001690313220024109, 0.00017403904348611832, 0.00017904676496982574, 0.00018405448645353317, 0.0001890622079372406, 0.00019406992942094803, 0.00019907765090465546, 0.00020408537238836288, 0.0002090930938720703]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 8.0, 14.0, 19.0, 26.0, 39.0, 34.0, 60.0, 94.0, 131.0, 192.0, 252.0, 401.0, 531.0, 875.0, 1323.0, 2152.0, 3498.0, 6014.0, 10853.0, 20057.0, 38468.0, 76284.0, 141733.0, 213074.0, 216667.0, 146625.0, 79865.0, 40999.0, 20899.0, 11206.0, 6221.0, 3640.0, 2138.0, 1419.0, 864.0, 562.0, 390.0, 233.0, 206.0, 154.0, 95.0, 71.0, 47.0, 33.0, 27.0, 23.0, 15.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.22265625, -2.1573486328125, -2.092041015625, -2.0267333984375, -1.96142578125, -1.8961181640625, -1.830810546875, -1.7655029296875, -1.7001953125, -1.6348876953125, -1.569580078125, -1.5042724609375, -1.43896484375, -1.3736572265625, -1.308349609375, -1.2430419921875, -1.177734375, -1.1124267578125, -1.047119140625, -0.9818115234375, -0.91650390625, -0.8511962890625, -0.785888671875, -0.7205810546875, -0.6552734375, -0.5899658203125, -0.524658203125, -0.4593505859375, -0.39404296875, -0.3287353515625, -0.263427734375, -0.1981201171875, -0.1328125, -0.0675048828125, -0.002197265625, 0.0631103515625, 0.12841796875, 0.1937255859375, 0.259033203125, 0.3243408203125, 0.3896484375, 0.4549560546875, 0.520263671875, 0.5855712890625, 0.65087890625, 0.7161865234375, 0.781494140625, 0.8468017578125, 0.912109375, 0.9774169921875, 1.042724609375, 1.1080322265625, 1.17333984375, 1.2386474609375, 1.303955078125, 1.3692626953125, 1.4345703125, 1.4998779296875, 1.565185546875, 1.6304931640625, 1.69580078125, 1.7611083984375, 1.826416015625, 1.8917236328125, 1.95703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 5.0, 10.0, 8.0, 18.0, 19.0, 20.0, 36.0, 51.0, 62.0, 49.0, 70.0, 62.0, 71.0, 69.0, 64.0, 57.0, 47.0, 43.0, 53.0, 37.0, 33.0, 23.0, 21.0, 14.0, 16.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76513671875, -0.739593505859375, -0.71405029296875, -0.688507080078125, -0.6629638671875, -0.637420654296875, -0.61187744140625, -0.586334228515625, -0.560791015625, -0.535247802734375, -0.50970458984375, -0.484161376953125, -0.4586181640625, -0.433074951171875, -0.40753173828125, -0.381988525390625, -0.3564453125, -0.330902099609375, -0.30535888671875, -0.279815673828125, -0.2542724609375, -0.228729248046875, -0.20318603515625, -0.177642822265625, -0.152099609375, -0.126556396484375, -0.10101318359375, -0.075469970703125, -0.0499267578125, -0.024383544921875, 0.00115966796875, 0.026702880859375, 0.05224609375, 0.077789306640625, 0.10333251953125, 0.128875732421875, 0.1544189453125, 0.179962158203125, 0.20550537109375, 0.231048583984375, 0.256591796875, 0.282135009765625, 0.30767822265625, 0.333221435546875, 0.3587646484375, 0.384307861328125, 0.40985107421875, 0.435394287109375, 0.4609375, 0.486480712890625, 0.51202392578125, 0.537567138671875, 0.5631103515625, 0.588653564453125, 0.61419677734375, 0.639739990234375, 0.665283203125, 0.690826416015625, 0.71636962890625, 0.741912841796875, 0.7674560546875, 0.792999267578125, 0.81854248046875, 0.844085693359375, 0.86962890625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 8.0, 7.0, 12.0, 20.0, 28.0, 29.0, 43.0, 49.0, 68.0, 99.0, 112.0, 97.0, 104.0, 65.0, 82.0, 41.0, 33.0, 24.0, 11.0, 16.0, 11.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.14549732208252, -8.808816909790039, -8.472137451171875, -8.135457038879395, -7.7987775802612305, -7.462097644805908, -7.125417709350586, -6.7887372970581055, -6.452057838439941, -6.115377902984619, -5.778697967529297, -5.442018032073975, -5.105338096618652, -4.76865816116333, -4.431978225708008, -4.095297813415527, -3.758617877960205, -3.421937942504883, -3.0852580070495605, -2.7485780715942383, -2.411898136138916, -2.0752182006835938, -1.7385380268096924, -1.4018580913543701, -1.0651781558990479, -0.7284982204437256, -0.39181822538375854, -0.055138230323791504, 0.28154170513153076, 0.618221640586853, 0.9549016952514648, 1.291581630706787, 1.6282615661621094, 1.9649415016174316, 2.301621437072754, 2.638301372528076, 2.9749813079833984, 3.3116612434387207, 3.648341417312622, 3.9850213527679443, 4.3217010498046875, 4.65838098526001, 4.995060920715332, 5.331740856170654, 5.668420791625977, 6.005100727081299, 6.341780662536621, 6.678461074829102, 7.015141010284424, 7.351820945739746, 7.688500881195068, 8.02518081665039, 8.361861228942871, 8.698540687561035, 9.035221099853516, 9.37190055847168, 9.70858097076416, 10.04526138305664, 10.381940841674805, 10.718621253967285, 11.05530071258545, 11.39198112487793, 11.728660583496094, 12.065340995788574, 12.402020454406738]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 1.0, 6.0, 4.0, 10.0, 13.0, 14.0, 9.0, 16.0, 15.0, 22.0, 23.0, 16.0, 42.0, 41.0, 41.0, 34.0, 39.0, 46.0, 45.0, 42.0, 56.0, 40.0, 44.0, 39.0, 38.0, 40.0, 38.0, 38.0, 24.0, 29.0, 21.0, 21.0, 13.0, 16.0, 14.0, 12.0, 12.0, 7.0, 2.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.905910015106201, -4.7390899658203125, -4.572269916534424, -4.405449867248535, -4.2386298179626465, -4.071809768676758, -3.90498948097229, -3.7381694316864014, -3.5713493824005127, -3.404529333114624, -3.2377092838287354, -3.0708889961242676, -2.904068946838379, -2.7372488975524902, -2.5704288482666016, -2.403608798980713, -2.236788749694824, -2.0699687004089355, -1.9031486511230469, -1.7363284826278687, -1.56950843334198, -1.4026883840560913, -1.235868215560913, -1.0690481662750244, -0.9022281169891357, -0.7354080677032471, -0.5685879588127136, -0.4017678499221802, -0.2349478006362915, -0.06812775135040283, 0.09869241714477539, 0.26551246643066406, 0.43233299255371094, 0.5991530418395996, 0.7659731507301331, 0.9327932596206665, 1.0996133089065552, 1.2664333581924438, 1.433253526687622, 1.6000735759735107, 1.7668936252593994, 1.933713674545288, 2.1005337238311768, 2.2673540115356445, 2.434174060821533, 2.600994110107422, 2.7678141593933105, 2.934634208679199, 3.101454257965088, 3.2682743072509766, 3.4350943565368652, 3.601914405822754, 3.7687344551086426, 3.9355545043945312, 4.102375030517578, 4.269194602966309, 4.4360151290893555, 4.602835178375244, 4.769655227661133, 4.9364752769470215, 5.10329532623291, 5.270115375518799, 5.4369354248046875, 5.603755950927734, 5.770575523376465]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 13.0, 9.0, 16.0, 22.0, 45.0, 70.0, 97.0, 154.0, 218.0, 317.0, 517.0, 803.0, 1264.0, 1921.0, 3104.0, 5068.0, 8230.0, 13678.0, 22937.0, 37799.0, 62602.0, 100420.0, 143767.0, 173493.0, 159503.0, 117742.0, 76950.0, 46680.0, 27826.0, 16852.0, 9905.0, 6213.0, 3725.0, 2383.0, 1504.0, 935.0, 621.0, 416.0, 242.0, 175.0, 114.0, 57.0, 55.0, 32.0, 24.0, 16.0, 7.0, 6.0, 6.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.7562255859375, -4.606201171875, -4.4561767578125, -4.30615234375, -4.1561279296875, -4.006103515625, -3.8560791015625, -3.7060546875, -3.5560302734375, -3.406005859375, -3.2559814453125, -3.10595703125, -2.9559326171875, -2.805908203125, -2.6558837890625, -2.505859375, -2.3558349609375, -2.205810546875, -2.0557861328125, -1.90576171875, -1.7557373046875, -1.605712890625, -1.4556884765625, -1.3056640625, -1.1556396484375, -1.005615234375, -0.8555908203125, -0.70556640625, -0.5555419921875, -0.405517578125, -0.2554931640625, -0.10546875, 0.0445556640625, 0.194580078125, 0.3446044921875, 0.49462890625, 0.6446533203125, 0.794677734375, 0.9447021484375, 1.0947265625, 1.2447509765625, 1.394775390625, 1.5447998046875, 1.69482421875, 1.8448486328125, 1.994873046875, 2.1448974609375, 2.294921875, 2.4449462890625, 2.594970703125, 2.7449951171875, 2.89501953125, 3.0450439453125, 3.195068359375, 3.3450927734375, 3.4951171875, 3.6451416015625, 3.795166015625, 3.9451904296875, 4.09521484375, 4.2452392578125, 4.395263671875, 4.5452880859375, 4.6953125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 5.0, 13.0, 14.0, 16.0, 19.0, 13.0, 29.0, 29.0, 32.0, 30.0, 38.0, 36.0, 42.0, 52.0, 53.0, 47.0, 30.0, 48.0, 49.0, 37.0, 48.0, 37.0, 35.0, 33.0, 27.0, 27.0, 21.0, 21.0, 21.0, 11.0, 11.0, 11.0, 5.0, 6.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34375, -5.16766357421875, -4.9915771484375, -4.81549072265625, -4.639404296875, -4.46331787109375, -4.2872314453125, -4.11114501953125, -3.93505859375, -3.75897216796875, -3.5828857421875, -3.40679931640625, -3.230712890625, -3.05462646484375, -2.8785400390625, -2.70245361328125, -2.5263671875, -2.35028076171875, -2.1741943359375, -1.99810791015625, -1.822021484375, -1.64593505859375, -1.4698486328125, -1.29376220703125, -1.11767578125, -0.94158935546875, -0.7655029296875, -0.58941650390625, -0.413330078125, -0.23724365234375, -0.0611572265625, 0.11492919921875, 0.291015625, 0.46710205078125, 0.6431884765625, 0.81927490234375, 0.995361328125, 1.17144775390625, 1.3475341796875, 1.52362060546875, 1.69970703125, 1.87579345703125, 2.0518798828125, 2.22796630859375, 2.404052734375, 2.58013916015625, 2.7562255859375, 2.93231201171875, 3.1083984375, 3.28448486328125, 3.4605712890625, 3.63665771484375, 3.812744140625, 3.98883056640625, 4.1649169921875, 4.34100341796875, 4.51708984375, 4.69317626953125, 4.8692626953125, 5.04534912109375, 5.221435546875, 5.39752197265625, 5.5736083984375, 5.74969482421875, 5.92578125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 2.0, 4.0, 4.0, 10.0, 10.0, 8.0, 14.0, 23.0, 29.0, 43.0, 52.0, 64.0, 92.0, 135.0, 159.0, 243.0, 344.0, 504.0, 799.0, 1355.0, 2272.0, 3991.0, 7518.0, 14920.0, 31423.0, 66426.0, 134683.0, 221750.0, 238393.0, 161022.0, 83082.0, 39592.0, 18598.0, 9314.0, 4912.0, 2523.0, 1392.0, 896.0, 584.0, 370.0, 277.0, 189.0, 117.0, 106.0, 89.0, 52.0, 44.0, 31.0, 29.0, 19.0, 17.0, 13.0, 8.0, 7.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0], "bins": [-6.64453125, -6.43121337890625, -6.2178955078125, -6.00457763671875, -5.791259765625, -5.57794189453125, -5.3646240234375, -5.15130615234375, -4.93798828125, -4.72467041015625, -4.5113525390625, -4.29803466796875, -4.084716796875, -3.87139892578125, -3.6580810546875, -3.44476318359375, -3.2314453125, -3.01812744140625, -2.8048095703125, -2.59149169921875, -2.378173828125, -2.16485595703125, -1.9515380859375, -1.73822021484375, -1.52490234375, -1.31158447265625, -1.0982666015625, -0.88494873046875, -0.671630859375, -0.45831298828125, -0.2449951171875, -0.03167724609375, 0.181640625, 0.39495849609375, 0.6082763671875, 0.82159423828125, 1.034912109375, 1.24822998046875, 1.4615478515625, 1.67486572265625, 1.88818359375, 2.10150146484375, 2.3148193359375, 2.52813720703125, 2.741455078125, 2.95477294921875, 3.1680908203125, 3.38140869140625, 3.5947265625, 3.80804443359375, 4.0213623046875, 4.23468017578125, 4.447998046875, 4.66131591796875, 4.8746337890625, 5.08795166015625, 5.30126953125, 5.51458740234375, 5.7279052734375, 5.94122314453125, 6.154541015625, 6.36785888671875, 6.5811767578125, 6.79449462890625, 7.0078125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 4.0, 11.0, 8.0, 4.0, 9.0, 11.0, 10.0, 12.0, 15.0, 28.0, 19.0, 46.0, 25.0, 30.0, 43.0, 29.0, 33.0, 38.0, 37.0, 32.0, 37.0, 45.0, 52.0, 46.0, 45.0, 36.0, 35.0, 28.0, 26.0, 34.0, 32.0, 27.0, 16.0, 19.0, 9.0, 16.0, 7.0, 5.0, 3.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.981231689453125, -2.88238525390625, -2.783538818359375, -2.6846923828125, -2.585845947265625, -2.48699951171875, -2.388153076171875, -2.289306640625, -2.190460205078125, -2.09161376953125, -1.992767333984375, -1.8939208984375, -1.795074462890625, -1.69622802734375, -1.597381591796875, -1.49853515625, -1.399688720703125, -1.30084228515625, -1.201995849609375, -1.1031494140625, -1.004302978515625, -0.90545654296875, -0.806610107421875, -0.707763671875, -0.608917236328125, -0.51007080078125, -0.411224365234375, -0.3123779296875, -0.213531494140625, -0.11468505859375, -0.015838623046875, 0.0830078125, 0.181854248046875, 0.28070068359375, 0.379547119140625, 0.4783935546875, 0.577239990234375, 0.67608642578125, 0.774932861328125, 0.873779296875, 0.972625732421875, 1.07147216796875, 1.170318603515625, 1.2691650390625, 1.368011474609375, 1.46685791015625, 1.565704345703125, 1.66455078125, 1.763397216796875, 1.86224365234375, 1.961090087890625, 2.0599365234375, 2.158782958984375, 2.25762939453125, 2.356475830078125, 2.455322265625, 2.554168701171875, 2.65301513671875, 2.751861572265625, 2.8507080078125, 2.949554443359375, 3.04840087890625, 3.147247314453125, 3.24609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 6.0, 8.0, 11.0, 17.0, 24.0, 32.0, 49.0, 80.0, 99.0, 127.0, 186.0, 292.0, 428.0, 618.0, 978.0, 1464.0, 2632.0, 4459.0, 8337.0, 15813.0, 32806.0, 68461.0, 137617.0, 223869.0, 236050.0, 155632.0, 79248.0, 38233.0, 18596.0, 9495.0, 5047.0, 2887.0, 1718.0, 1134.0, 660.0, 437.0, 322.0, 201.0, 134.0, 92.0, 71.0, 53.0, 38.0, 18.0, 23.0, 12.0, 7.0, 6.0, 6.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.05078125, -2.95574951171875, -2.8607177734375, -2.76568603515625, -2.670654296875, -2.57562255859375, -2.4805908203125, -2.38555908203125, -2.29052734375, -2.19549560546875, -2.1004638671875, -2.00543212890625, -1.910400390625, -1.81536865234375, -1.7203369140625, -1.62530517578125, -1.5302734375, -1.43524169921875, -1.3402099609375, -1.24517822265625, -1.150146484375, -1.05511474609375, -0.9600830078125, -0.86505126953125, -0.77001953125, -0.67498779296875, -0.5799560546875, -0.48492431640625, -0.389892578125, -0.29486083984375, -0.1998291015625, -0.10479736328125, -0.009765625, 0.08526611328125, 0.1802978515625, 0.27532958984375, 0.370361328125, 0.46539306640625, 0.5604248046875, 0.65545654296875, 0.75048828125, 0.84552001953125, 0.9405517578125, 1.03558349609375, 1.130615234375, 1.22564697265625, 1.3206787109375, 1.41571044921875, 1.5107421875, 1.60577392578125, 1.7008056640625, 1.79583740234375, 1.890869140625, 1.98590087890625, 2.0809326171875, 2.17596435546875, 2.27099609375, 2.36602783203125, 2.4610595703125, 2.55609130859375, 2.651123046875, 2.74615478515625, 2.8411865234375, 2.93621826171875, 3.03125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 2.0, 7.0, 7.0, 15.0, 8.0, 15.0, 13.0, 21.0, 27.0, 22.0, 37.0, 48.0, 65.0, 49.0, 66.0, 57.0, 63.0, 73.0, 66.0, 51.0, 43.0, 52.0, 36.0, 31.0, 33.0, 19.0, 18.0, 7.0, 8.0, 9.0, 7.0, 3.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.0002105608582496643, -0.0002032071352005005, -0.00019585341215133667, -0.00018849968910217285, -0.00018114596605300903, -0.00017379224300384521, -0.0001664385199546814, -0.00015908479690551758, -0.00015173107385635376, -0.00014437735080718994, -0.00013702362775802612, -0.0001296699047088623, -0.00012231618165969849, -0.00011496245861053467, -0.00010760873556137085, -0.00010025501251220703, -9.290128946304321e-05, -8.55475664138794e-05, -7.819384336471558e-05, -7.084012031555176e-05, -6.348639726638794e-05, -5.613267421722412e-05, -4.87789511680603e-05, -4.1425228118896484e-05, -3.4071505069732666e-05, -2.6717782020568848e-05, -1.936405897140503e-05, -1.2010335922241211e-05, -4.656612873077393e-06, 2.6971101760864258e-06, 1.0050833225250244e-05, 1.7404556274414062e-05, 2.475827932357788e-05, 3.21120023727417e-05, 3.946572542190552e-05, 4.6819448471069336e-05, 5.4173171520233154e-05, 6.152689456939697e-05, 6.888061761856079e-05, 7.623434066772461e-05, 8.358806371688843e-05, 9.094178676605225e-05, 9.829550981521606e-05, 0.00010564923286437988, 0.0001130029559135437, 0.00012035667896270752, 0.00012771040201187134, 0.00013506412506103516, 0.00014241784811019897, 0.0001497715711593628, 0.0001571252942085266, 0.00016447901725769043, 0.00017183274030685425, 0.00017918646335601807, 0.00018654018640518188, 0.0001938939094543457, 0.00020124763250350952, 0.00020860135555267334, 0.00021595507860183716, 0.00022330880165100098, 0.0002306625247001648, 0.0002380162477493286, 0.00024536997079849243, 0.00025272369384765625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 8.0, 4.0, 13.0, 12.0, 19.0, 29.0, 58.0, 48.0, 80.0, 140.0, 187.0, 266.0, 402.0, 644.0, 982.0, 1752.0, 3108.0, 6077.0, 12981.0, 29850.0, 73451.0, 176039.0, 299294.0, 244461.0, 114464.0, 46038.0, 19367.0, 8609.0, 4313.0, 2199.0, 1280.0, 805.0, 509.0, 324.0, 240.0, 161.0, 94.0, 78.0, 39.0, 45.0, 26.0, 21.0, 15.0, 8.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.560546875, -3.444732666015625, -3.32891845703125, -3.213104248046875, -3.0972900390625, -2.981475830078125, -2.86566162109375, -2.749847412109375, -2.634033203125, -2.518218994140625, -2.40240478515625, -2.286590576171875, -2.1707763671875, -2.054962158203125, -1.93914794921875, -1.823333740234375, -1.70751953125, -1.591705322265625, -1.47589111328125, -1.360076904296875, -1.2442626953125, -1.128448486328125, -1.01263427734375, -0.896820068359375, -0.781005859375, -0.665191650390625, -0.54937744140625, -0.433563232421875, -0.3177490234375, -0.201934814453125, -0.08612060546875, 0.029693603515625, 0.1455078125, 0.261322021484375, 0.37713623046875, 0.492950439453125, 0.6087646484375, 0.724578857421875, 0.84039306640625, 0.956207275390625, 1.072021484375, 1.187835693359375, 1.30364990234375, 1.419464111328125, 1.5352783203125, 1.651092529296875, 1.76690673828125, 1.882720947265625, 1.99853515625, 2.114349365234375, 2.23016357421875, 2.345977783203125, 2.4617919921875, 2.577606201171875, 2.69342041015625, 2.809234619140625, 2.925048828125, 3.040863037109375, 3.15667724609375, 3.272491455078125, 3.3883056640625, 3.504119873046875, 3.61993408203125, 3.735748291015625, 3.8515625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 18.0, 11.0, 13.0, 25.0, 23.0, 49.0, 41.0, 63.0, 72.0, 71.0, 90.0, 88.0, 80.0, 73.0, 60.0, 49.0, 43.0, 35.0, 19.0, 15.0, 15.0, 8.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.9903106689453125, -0.957183837890625, -0.9240570068359375, -0.89093017578125, -0.8578033447265625, -0.824676513671875, -0.7915496826171875, -0.7584228515625, -0.7252960205078125, -0.692169189453125, -0.6590423583984375, -0.62591552734375, -0.5927886962890625, -0.559661865234375, -0.5265350341796875, -0.493408203125, -0.4602813720703125, -0.427154541015625, -0.3940277099609375, -0.36090087890625, -0.3277740478515625, -0.294647216796875, -0.2615203857421875, -0.2283935546875, -0.1952667236328125, -0.162139892578125, -0.1290130615234375, -0.09588623046875, -0.0627593994140625, -0.029632568359375, 0.0034942626953125, 0.03662109375, 0.0697479248046875, 0.102874755859375, 0.1360015869140625, 0.16912841796875, 0.2022552490234375, 0.235382080078125, 0.2685089111328125, 0.3016357421875, 0.3347625732421875, 0.367889404296875, 0.4010162353515625, 0.43414306640625, 0.4672698974609375, 0.500396728515625, 0.5335235595703125, 0.566650390625, 0.5997772216796875, 0.632904052734375, 0.6660308837890625, 0.69915771484375, 0.7322845458984375, 0.765411376953125, 0.7985382080078125, 0.8316650390625, 0.8647918701171875, 0.897918701171875, 0.9310455322265625, 0.96417236328125, 0.9972991943359375, 1.030426025390625, 1.0635528564453125, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 9.0, 16.0, 8.0, 18.0, 24.0, 29.0, 37.0, 51.0, 57.0, 84.0, 98.0, 98.0, 93.0, 75.0, 72.0, 57.0, 35.0, 37.0, 21.0, 14.0, 12.0, 10.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.431387901306152, -8.125255584716797, -7.819123268127441, -7.512991428375244, -7.206859111785889, -6.900726795196533, -6.594594955444336, -6.2884626388549805, -5.982330322265625, -5.6761980056762695, -5.370065689086914, -5.063933849334717, -4.757801532745361, -4.451669216156006, -4.145537376403809, -3.839405059814453, -3.5332727432250977, -3.227140426635742, -2.921008348464966, -2.6148762702941895, -2.308743953704834, -2.0026116371154785, -1.6964795589447021, -1.3903474807739258, -1.0842151641845703, -0.7780829668045044, -0.4719507694244385, -0.16581857204437256, 0.14031362533569336, 0.4464458227157593, 0.7525780200958252, 1.0587100982666016, 1.3648433685302734, 1.6709755659103394, 1.9771077632904053, 2.2832398414611816, 2.589372158050537, 2.8955044746398926, 3.201636552810669, 3.5077686309814453, 3.813900947570801, 4.120033264160156, 4.426165580749512, 4.732297420501709, 5.0384297370910645, 5.34456205368042, 5.650693893432617, 5.956826210021973, 6.262958526611328, 6.569090843200684, 6.875223159790039, 7.181354999542236, 7.487487316131592, 7.793619632720947, 8.099751472473145, 8.4058837890625, 8.712016105651855, 9.018148422241211, 9.324280738830566, 9.630413055419922, 9.936544418334961, 10.242676734924316, 10.548809051513672, 10.854941368103027, 11.161073684692383]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 12.0, 10.0, 7.0, 13.0, 22.0, 21.0, 22.0, 20.0, 25.0, 31.0, 32.0, 38.0, 38.0, 37.0, 55.0, 33.0, 46.0, 48.0, 52.0, 47.0, 42.0, 37.0, 46.0, 44.0, 30.0, 27.0, 18.0, 16.0, 20.0, 20.0, 21.0, 11.0, 14.0, 6.0, 7.0, 5.0, 6.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.728944778442383, -4.568073749542236, -4.407203197479248, -4.246332168579102, -4.085461616516113, -3.924590826034546, -3.7637200355529785, -3.602849006652832, -3.4419784545898438, -3.2811076641082764, -3.120236873626709, -2.9593660831451416, -2.798495292663574, -2.637624502182007, -2.4767537117004395, -2.315882682800293, -2.1550118923187256, -1.9941411018371582, -1.8332703113555908, -1.6723995208740234, -1.511528730392456, -1.3506579399108887, -1.1897870302200317, -1.0289162397384644, -0.868045449256897, -0.7071746587753296, -0.5463038682937622, -0.38543301820755005, -0.22456222772598267, -0.06369143724441528, 0.09717941284179688, 0.25805020332336426, 0.41892099380493164, 0.579791784286499, 0.7406625747680664, 0.9015334248542786, 1.0624041557312012, 1.2232749462127686, 1.3841458559036255, 1.5450166463851929, 1.7058874368667603, 1.8667582273483276, 2.0276291370391846, 2.188499927520752, 2.3493707180023193, 2.5102415084838867, 2.671112298965454, 2.8319830894470215, 2.992853879928589, 3.1537246704101562, 3.3145954608917236, 3.475466251373291, 3.6363370418548584, 3.797207832336426, 3.9580788612365723, 4.1189494132995605, 4.279820442199707, 4.4406914710998535, 4.601562023162842, 4.762433052062988, 4.923303604125977, 5.084174633026123, 5.245045185089111, 5.405916213989258, 5.566786766052246]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 9.0, 13.0, 6.0, 22.0, 29.0, 24.0, 51.0, 83.0, 163.0, 230.0, 332.0, 632.0, 1098.0, 1913.0, 3490.0, 6683.0, 13854.0, 31073.0, 80035.0, 254327.0, 909314.0, 1694677.0, 829262.0, 232124.0, 76069.0, 29755.0, 13491.0, 6776.0, 3694.0, 2003.0, 1195.0, 692.0, 441.0, 269.0, 159.0, 113.0, 67.0, 31.0, 24.0, 21.0, 16.0, 9.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5625, -9.2679443359375, -8.973388671875, -8.6788330078125, -8.38427734375, -8.0897216796875, -7.795166015625, -7.5006103515625, -7.2060546875, -6.9114990234375, -6.616943359375, -6.3223876953125, -6.02783203125, -5.7332763671875, -5.438720703125, -5.1441650390625, -4.849609375, -4.5550537109375, -4.260498046875, -3.9659423828125, -3.67138671875, -3.3768310546875, -3.082275390625, -2.7877197265625, -2.4931640625, -2.1986083984375, -1.904052734375, -1.6094970703125, -1.31494140625, -1.0203857421875, -0.725830078125, -0.4312744140625, -0.13671875, 0.1578369140625, 0.452392578125, 0.7469482421875, 1.04150390625, 1.3360595703125, 1.630615234375, 1.9251708984375, 2.2197265625, 2.5142822265625, 2.808837890625, 3.1033935546875, 3.39794921875, 3.6925048828125, 3.987060546875, 4.2816162109375, 4.576171875, 4.8707275390625, 5.165283203125, 5.4598388671875, 5.75439453125, 6.0489501953125, 6.343505859375, 6.6380615234375, 6.9326171875, 7.2271728515625, 7.521728515625, 7.8162841796875, 8.11083984375, 8.4053955078125, 8.699951171875, 8.9945068359375, 9.2890625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 11.0, 15.0, 9.0, 18.0, 28.0, 29.0, 34.0, 21.0, 40.0, 37.0, 46.0, 39.0, 54.0, 41.0, 60.0, 52.0, 51.0, 61.0, 37.0, 55.0, 51.0, 31.0, 30.0, 19.0, 16.0, 21.0, 17.0, 17.0, 17.0, 13.0, 4.0, 3.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.750213623046875, -3.61566162109375, -3.481109619140625, -3.3465576171875, -3.212005615234375, -3.07745361328125, -2.942901611328125, -2.808349609375, -2.673797607421875, -2.53924560546875, -2.404693603515625, -2.2701416015625, -2.135589599609375, -2.00103759765625, -1.866485595703125, -1.73193359375, -1.597381591796875, -1.46282958984375, -1.328277587890625, -1.1937255859375, -1.059173583984375, -0.92462158203125, -0.790069580078125, -0.655517578125, -0.520965576171875, -0.38641357421875, -0.251861572265625, -0.1173095703125, 0.017242431640625, 0.15179443359375, 0.286346435546875, 0.4208984375, 0.555450439453125, 0.69000244140625, 0.824554443359375, 0.9591064453125, 1.093658447265625, 1.22821044921875, 1.362762451171875, 1.497314453125, 1.631866455078125, 1.76641845703125, 1.900970458984375, 2.0355224609375, 2.170074462890625, 2.30462646484375, 2.439178466796875, 2.57373046875, 2.708282470703125, 2.84283447265625, 2.977386474609375, 3.1119384765625, 3.246490478515625, 3.38104248046875, 3.515594482421875, 3.650146484375, 3.784698486328125, 3.91925048828125, 4.053802490234375, 4.1883544921875, 4.322906494140625, 4.45745849609375, 4.592010498046875, 4.7265625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 5.0, 1.0, 6.0, 5.0, 11.0, 11.0, 16.0, 22.0, 46.0, 60.0, 58.0, 103.0, 158.0, 206.0, 332.0, 550.0, 802.0, 1285.0, 2076.0, 3260.0, 5605.0, 9486.0, 17163.0, 31322.0, 59331.0, 121401.0, 261273.0, 581822.0, 1104003.0, 1027741.0, 512074.0, 229198.0, 106581.0, 52945.0, 27771.0, 15269.0, 8681.0, 5085.0, 3103.0, 1917.0, 1251.0, 765.0, 485.0, 330.0, 215.0, 149.0, 95.0, 76.0, 40.0, 24.0, 25.0, 17.0, 18.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-7.3671875, -7.14337158203125, -6.9195556640625, -6.69573974609375, -6.471923828125, -6.24810791015625, -6.0242919921875, -5.80047607421875, -5.57666015625, -5.35284423828125, -5.1290283203125, -4.90521240234375, -4.681396484375, -4.45758056640625, -4.2337646484375, -4.00994873046875, -3.7861328125, -3.56231689453125, -3.3385009765625, -3.11468505859375, -2.890869140625, -2.66705322265625, -2.4432373046875, -2.21942138671875, -1.99560546875, -1.77178955078125, -1.5479736328125, -1.32415771484375, -1.100341796875, -0.87652587890625, -0.6527099609375, -0.42889404296875, -0.205078125, 0.01873779296875, 0.2425537109375, 0.46636962890625, 0.690185546875, 0.91400146484375, 1.1378173828125, 1.36163330078125, 1.58544921875, 1.80926513671875, 2.0330810546875, 2.25689697265625, 2.480712890625, 2.70452880859375, 2.9283447265625, 3.15216064453125, 3.3759765625, 3.59979248046875, 3.8236083984375, 4.04742431640625, 4.271240234375, 4.49505615234375, 4.7188720703125, 4.94268798828125, 5.16650390625, 5.39031982421875, 5.6141357421875, 5.83795166015625, 6.061767578125, 6.28558349609375, 6.5093994140625, 6.73321533203125, 6.95703125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 6.0, 4.0, 6.0, 4.0, 10.0, 13.0, 20.0, 9.0, 26.0, 35.0, 48.0, 71.0, 99.0, 106.0, 124.0, 145.0, 183.0, 237.0, 303.0, 313.0, 330.0, 314.0, 339.0, 284.0, 240.0, 180.0, 152.0, 110.0, 79.0, 63.0, 48.0, 36.0, 38.0, 17.0, 23.0, 12.0, 7.0, 11.0, 6.0, 11.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.544921875, -2.4739227294921875, -2.402923583984375, -2.3319244384765625, -2.26092529296875, -2.1899261474609375, -2.118927001953125, -2.0479278564453125, -1.9769287109375, -1.9059295654296875, -1.834930419921875, -1.7639312744140625, -1.69293212890625, -1.6219329833984375, -1.550933837890625, -1.4799346923828125, -1.408935546875, -1.3379364013671875, -1.266937255859375, -1.1959381103515625, -1.12493896484375, -1.0539398193359375, -0.982940673828125, -0.9119415283203125, -0.8409423828125, -0.7699432373046875, -0.698944091796875, -0.6279449462890625, -0.55694580078125, -0.4859466552734375, -0.414947509765625, -0.3439483642578125, -0.27294921875, -0.2019500732421875, -0.130950927734375, -0.0599517822265625, 0.01104736328125, 0.0820465087890625, 0.153045654296875, 0.2240447998046875, 0.2950439453125, 0.3660430908203125, 0.437042236328125, 0.5080413818359375, 0.57904052734375, 0.6500396728515625, 0.721038818359375, 0.7920379638671875, 0.863037109375, 0.9340362548828125, 1.005035400390625, 1.0760345458984375, 1.14703369140625, 1.2180328369140625, 1.289031982421875, 1.3600311279296875, 1.4310302734375, 1.5020294189453125, 1.573028564453125, 1.6440277099609375, 1.71502685546875, 1.7860260009765625, 1.857025146484375, 1.9280242919921875, 1.9990234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 9.0, 4.0, 4.0, 9.0, 14.0, 19.0, 18.0, 30.0, 33.0, 35.0, 58.0, 64.0, 82.0, 86.0, 110.0, 94.0, 79.0, 63.0, 52.0, 30.0, 31.0, 24.0, 12.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.282023429870605, -7.975139617919922, -7.66825532913208, -7.3613715171813965, -7.054487228393555, -6.747603416442871, -6.4407196044921875, -6.133835792541504, -5.826951503753662, -5.5200676918029785, -5.213183403015137, -4.906299591064453, -4.5994157791137695, -4.292531490325928, -3.985647678375244, -3.6787636280059814, -3.3718795776367188, -3.064995527267456, -2.7581114768981934, -2.4512276649475098, -2.144343614578247, -1.8374595642089844, -1.5305756330490112, -1.223691701889038, -0.9168076515197754, -0.6099236607551575, -0.30303966999053955, 0.003844320774078369, 0.3107283115386963, 0.617612361907959, 0.9244962930679321, 1.2313802242279053, 1.538264274597168, 1.8451483249664307, 2.1520323753356934, 2.458916187286377, 2.7658002376556396, 3.0726842880249023, 3.379568099975586, 3.6864521503448486, 3.9933362007141113, 4.300220012664795, 4.607104301452637, 4.91398811340332, 5.220871925354004, 5.527756214141846, 5.834640026092529, 6.141524314880371, 6.448408126831055, 6.755291938781738, 7.06217622756958, 7.369060039520264, 7.6759443283081055, 7.982828140258789, 8.289711952209473, 8.596595764160156, 8.903480529785156, 9.21036434173584, 9.517248153686523, 9.824132919311523, 10.131016731262207, 10.43790054321289, 10.744784355163574, 11.051668167114258, 11.358551979064941]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 8.0, 11.0, 15.0, 15.0, 21.0, 17.0, 23.0, 39.0, 28.0, 27.0, 42.0, 37.0, 51.0, 38.0, 38.0, 44.0, 52.0, 38.0, 58.0, 65.0, 33.0, 39.0, 31.0, 29.0, 34.0, 25.0, 22.0, 12.0, 26.0, 17.0, 14.0, 8.0, 10.0, 9.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.997282028198242, -4.833381175994873, -4.669480800628662, -4.505579948425293, -4.341679096221924, -4.177778244018555, -4.013877868652344, -3.8499770164489746, -3.6860764026641846, -3.5221757888793945, -3.3582749366760254, -3.1943743228912354, -3.0304737091064453, -2.866572856903076, -2.702672243118286, -2.538771629333496, -2.374870777130127, -2.210970163345337, -2.0470693111419678, -1.8831686973571777, -1.7192679643630981, -1.5553672313690186, -1.3914666175842285, -1.227565884590149, -1.0636651515960693, -0.8997644186019897, -0.7358637452125549, -0.5719630718231201, -0.4080623388290405, -0.24416160583496094, -0.08026093244552612, 0.08363974094390869, 0.24754095077514648, 0.4114416539669037, 0.5753423571586609, 0.7392430305480957, 0.9031437635421753, 1.0670444965362549, 1.230945110321045, 1.3948458433151245, 1.558746576309204, 1.7226473093032837, 1.8865480422973633, 2.0504486560821533, 2.2143492698669434, 2.3782501220703125, 2.5421507358551025, 2.7060513496398926, 2.8699522018432617, 3.0338528156280518, 3.197753667831421, 3.361654281616211, 3.52555513381958, 3.68945574760437, 3.85335636138916, 4.017257213592529, 4.181158065795898, 4.345058917999268, 4.5089592933654785, 4.672860145568848, 4.836760997772217, 5.000661849975586, 5.164562225341797, 5.328463077545166, 5.492363452911377]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 14.0, 15.0, 24.0, 28.0, 66.0, 92.0, 143.0, 225.0, 361.0, 488.0, 933.0, 1514.0, 2849.0, 5372.0, 11398.0, 25401.0, 59095.0, 134977.0, 255785.0, 272573.0, 153238.0, 68114.0, 29305.0, 13112.0, 6046.0, 3061.0, 1736.0, 1002.0, 562.0, 341.0, 234.0, 121.0, 112.0, 61.0, 43.0, 31.0, 30.0, 12.0, 6.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.32421875, -6.138671875, -5.953125, -5.767578125, -5.58203125, -5.396484375, -5.2109375, -5.025390625, -4.83984375, -4.654296875, -4.46875, -4.283203125, -4.09765625, -3.912109375, -3.7265625, -3.541015625, -3.35546875, -3.169921875, -2.984375, -2.798828125, -2.61328125, -2.427734375, -2.2421875, -2.056640625, -1.87109375, -1.685546875, -1.5, -1.314453125, -1.12890625, -0.943359375, -0.7578125, -0.572265625, -0.38671875, -0.201171875, -0.015625, 0.169921875, 0.35546875, 0.541015625, 0.7265625, 0.912109375, 1.09765625, 1.283203125, 1.46875, 1.654296875, 1.83984375, 2.025390625, 2.2109375, 2.396484375, 2.58203125, 2.767578125, 2.953125, 3.138671875, 3.32421875, 3.509765625, 3.6953125, 3.880859375, 4.06640625, 4.251953125, 4.4375, 4.623046875, 4.80859375, 4.994140625, 5.1796875, 5.365234375, 5.55078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 7.0, 13.0, 6.0, 15.0, 17.0, 19.0, 24.0, 27.0, 32.0, 34.0, 29.0, 37.0, 36.0, 42.0, 57.0, 32.0, 54.0, 43.0, 38.0, 55.0, 42.0, 54.0, 49.0, 31.0, 20.0, 35.0, 25.0, 28.0, 15.0, 16.0, 18.0, 9.0, 10.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.52935791015625, -4.3555908203125, -4.18182373046875, -4.008056640625, -3.83428955078125, -3.6605224609375, -3.48675537109375, -3.31298828125, -3.13922119140625, -2.9654541015625, -2.79168701171875, -2.617919921875, -2.44415283203125, -2.2703857421875, -2.09661865234375, -1.9228515625, -1.74908447265625, -1.5753173828125, -1.40155029296875, -1.227783203125, -1.05401611328125, -0.8802490234375, -0.70648193359375, -0.53271484375, -0.35894775390625, -0.1851806640625, -0.01141357421875, 0.162353515625, 0.33612060546875, 0.5098876953125, 0.68365478515625, 0.857421875, 1.03118896484375, 1.2049560546875, 1.37872314453125, 1.552490234375, 1.72625732421875, 1.9000244140625, 2.07379150390625, 2.24755859375, 2.42132568359375, 2.5950927734375, 2.76885986328125, 2.942626953125, 3.11639404296875, 3.2901611328125, 3.46392822265625, 3.6376953125, 3.81146240234375, 3.9852294921875, 4.15899658203125, 4.332763671875, 4.50653076171875, 4.6802978515625, 4.85406494140625, 5.02783203125, 5.20159912109375, 5.3753662109375, 5.54913330078125, 5.722900390625, 5.89666748046875, 6.0704345703125, 6.24420166015625, 6.41796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 7.0, 5.0, 12.0, 12.0, 13.0, 25.0, 50.0, 70.0, 100.0, 118.0, 167.0, 260.0, 431.0, 644.0, 1126.0, 1887.0, 3628.0, 7202.0, 16276.0, 38847.0, 98307.0, 239479.0, 337173.0, 178185.0, 71461.0, 28311.0, 12231.0, 5620.0, 2802.0, 1594.0, 891.0, 550.0, 327.0, 213.0, 141.0, 106.0, 66.0, 42.0, 44.0, 37.0, 21.0, 16.0, 13.0, 14.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0], "bins": [-7.32421875, -7.10443115234375, -6.8846435546875, -6.66485595703125, -6.445068359375, -6.22528076171875, -6.0054931640625, -5.78570556640625, -5.56591796875, -5.34613037109375, -5.1263427734375, -4.90655517578125, -4.686767578125, -4.46697998046875, -4.2471923828125, -4.02740478515625, -3.8076171875, -3.58782958984375, -3.3680419921875, -3.14825439453125, -2.928466796875, -2.70867919921875, -2.4888916015625, -2.26910400390625, -2.04931640625, -1.82952880859375, -1.6097412109375, -1.38995361328125, -1.170166015625, -0.95037841796875, -0.7305908203125, -0.51080322265625, -0.291015625, -0.07122802734375, 0.1485595703125, 0.36834716796875, 0.588134765625, 0.80792236328125, 1.0277099609375, 1.24749755859375, 1.46728515625, 1.68707275390625, 1.9068603515625, 2.12664794921875, 2.346435546875, 2.56622314453125, 2.7860107421875, 3.00579833984375, 3.2255859375, 3.44537353515625, 3.6651611328125, 3.88494873046875, 4.104736328125, 4.32452392578125, 4.5443115234375, 4.76409912109375, 4.98388671875, 5.20367431640625, 5.4234619140625, 5.64324951171875, 5.863037109375, 6.08282470703125, 6.3026123046875, 6.52239990234375, 6.7421875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 18.0, 14.0, 22.0, 25.0, 28.0, 29.0, 25.0, 30.0, 31.0, 39.0, 38.0, 35.0, 41.0, 45.0, 49.0, 51.0, 48.0, 50.0, 47.0, 40.0, 34.0, 20.0, 34.0, 20.0, 28.0, 23.0, 17.0, 15.0, 14.0, 15.0, 8.0, 12.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83984375, -2.743743896484375, -2.64764404296875, -2.551544189453125, -2.4554443359375, -2.359344482421875, -2.26324462890625, -2.167144775390625, -2.071044921875, -1.974945068359375, -1.87884521484375, -1.782745361328125, -1.6866455078125, -1.590545654296875, -1.49444580078125, -1.398345947265625, -1.30224609375, -1.206146240234375, -1.11004638671875, -1.013946533203125, -0.9178466796875, -0.821746826171875, -0.72564697265625, -0.629547119140625, -0.533447265625, -0.437347412109375, -0.34124755859375, -0.245147705078125, -0.1490478515625, -0.052947998046875, 0.04315185546875, 0.139251708984375, 0.2353515625, 0.331451416015625, 0.42755126953125, 0.523651123046875, 0.6197509765625, 0.715850830078125, 0.81195068359375, 0.908050537109375, 1.004150390625, 1.100250244140625, 1.19635009765625, 1.292449951171875, 1.3885498046875, 1.484649658203125, 1.58074951171875, 1.676849365234375, 1.77294921875, 1.869049072265625, 1.96514892578125, 2.061248779296875, 2.1573486328125, 2.253448486328125, 2.34954833984375, 2.445648193359375, 2.541748046875, 2.637847900390625, 2.73394775390625, 2.830047607421875, 2.9261474609375, 3.022247314453125, 3.11834716796875, 3.214447021484375, 3.310546875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 5.0, 11.0, 11.0, 19.0, 16.0, 31.0, 38.0, 45.0, 58.0, 87.0, 131.0, 152.0, 216.0, 276.0, 392.0, 618.0, 844.0, 1211.0, 1909.0, 3309.0, 6407.0, 15072.0, 45105.0, 176874.0, 487075.0, 219297.0, 54889.0, 17234.0, 7086.0, 3650.0, 2029.0, 1378.0, 844.0, 586.0, 442.0, 300.0, 249.0, 160.0, 140.0, 84.0, 56.0, 56.0, 36.0, 33.0, 33.0, 18.0, 13.0, 9.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5703125, -4.42083740234375, -4.2713623046875, -4.12188720703125, -3.972412109375, -3.82293701171875, -3.6734619140625, -3.52398681640625, -3.37451171875, -3.22503662109375, -3.0755615234375, -2.92608642578125, -2.776611328125, -2.62713623046875, -2.4776611328125, -2.32818603515625, -2.1787109375, -2.02923583984375, -1.8797607421875, -1.73028564453125, -1.580810546875, -1.43133544921875, -1.2818603515625, -1.13238525390625, -0.98291015625, -0.83343505859375, -0.6839599609375, -0.53448486328125, -0.385009765625, -0.23553466796875, -0.0860595703125, 0.06341552734375, 0.212890625, 0.36236572265625, 0.5118408203125, 0.66131591796875, 0.810791015625, 0.96026611328125, 1.1097412109375, 1.25921630859375, 1.40869140625, 1.55816650390625, 1.7076416015625, 1.85711669921875, 2.006591796875, 2.15606689453125, 2.3055419921875, 2.45501708984375, 2.6044921875, 2.75396728515625, 2.9034423828125, 3.05291748046875, 3.202392578125, 3.35186767578125, 3.5013427734375, 3.65081787109375, 3.80029296875, 3.94976806640625, 4.0992431640625, 4.24871826171875, 4.398193359375, 4.54766845703125, 4.6971435546875, 4.84661865234375, 4.99609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 13.0, 15.0, 32.0, 39.0, 53.0, 72.0, 85.0, 107.0, 102.0, 113.0, 80.0, 72.0, 56.0, 45.0, 30.0, 23.0, 10.0, 11.0, 8.0, 5.0, 4.0, 0.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023245811462402344, -0.00022612139582633972, -0.000219784677028656, -0.0002134479582309723, -0.00020711123943328857, -0.00020077452063560486, -0.00019443780183792114, -0.00018810108304023743, -0.0001817643642425537, -0.00017542764544487, -0.00016909092664718628, -0.00016275420784950256, -0.00015641748905181885, -0.00015008077025413513, -0.00014374405145645142, -0.0001374073326587677, -0.00013107061386108398, -0.00012473389506340027, -0.00011839717626571655, -0.00011206045746803284, -0.00010572373867034912, -9.93870198726654e-05, -9.305030107498169e-05, -8.671358227729797e-05, -8.037686347961426e-05, -7.404014468193054e-05, -6.770342588424683e-05, -6.136670708656311e-05, -5.5029988288879395e-05, -4.869326949119568e-05, -4.235655069351196e-05, -3.601983189582825e-05, -2.968311309814453e-05, -2.3346394300460815e-05, -1.70096755027771e-05, -1.0672956705093384e-05, -4.336237907409668e-06, 2.000480890274048e-06, 8.337199687957764e-06, 1.467391848564148e-05, 2.1010637283325195e-05, 2.734735608100891e-05, 3.368407487869263e-05, 4.002079367637634e-05, 4.635751247406006e-05, 5.2694231271743774e-05, 5.903095006942749e-05, 6.53676688671112e-05, 7.170438766479492e-05, 7.804110646247864e-05, 8.437782526016235e-05, 9.071454405784607e-05, 9.705126285552979e-05, 0.0001033879816532135, 0.00010972470045089722, 0.00011606141924858093, 0.00012239813804626465, 0.00012873485684394836, 0.00013507157564163208, 0.0001414082944393158, 0.0001477450132369995, 0.00015408173203468323, 0.00016041845083236694, 0.00016675516963005066, 0.00017309188842773438]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 2.0, 4.0, 7.0, 19.0, 28.0, 39.0, 40.0, 45.0, 62.0, 87.0, 91.0, 148.0, 154.0, 218.0, 287.0, 370.0, 462.0, 705.0, 1116.0, 1623.0, 2771.0, 5723.0, 16118.0, 64709.0, 297005.0, 463328.0, 142954.0, 30955.0, 8942.0, 3854.0, 2078.0, 1330.0, 864.0, 576.0, 443.0, 287.0, 243.0, 200.0, 165.0, 120.0, 102.0, 79.0, 52.0, 41.0, 24.0, 25.0, 16.0, 13.0, 16.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.09765625, -4.9443359375, -4.791015625, -4.6376953125, -4.484375, -4.3310546875, -4.177734375, -4.0244140625, -3.87109375, -3.7177734375, -3.564453125, -3.4111328125, -3.2578125, -3.1044921875, -2.951171875, -2.7978515625, -2.64453125, -2.4912109375, -2.337890625, -2.1845703125, -2.03125, -1.8779296875, -1.724609375, -1.5712890625, -1.41796875, -1.2646484375, -1.111328125, -0.9580078125, -0.8046875, -0.6513671875, -0.498046875, -0.3447265625, -0.19140625, -0.0380859375, 0.115234375, 0.2685546875, 0.421875, 0.5751953125, 0.728515625, 0.8818359375, 1.03515625, 1.1884765625, 1.341796875, 1.4951171875, 1.6484375, 1.8017578125, 1.955078125, 2.1083984375, 2.26171875, 2.4150390625, 2.568359375, 2.7216796875, 2.875, 3.0283203125, 3.181640625, 3.3349609375, 3.48828125, 3.6416015625, 3.794921875, 3.9482421875, 4.1015625, 4.2548828125, 4.408203125, 4.5615234375, 4.71484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 24.0, 33.0, 79.0, 121.0, 172.0, 156.0, 149.0, 112.0, 67.0, 28.0, 18.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.74609375, -1.6920318603515625, -1.637969970703125, -1.5839080810546875, -1.52984619140625, -1.4757843017578125, -1.421722412109375, -1.3676605224609375, -1.3135986328125, -1.2595367431640625, -1.205474853515625, -1.1514129638671875, -1.09735107421875, -1.0432891845703125, -0.989227294921875, -0.9351654052734375, -0.881103515625, -0.8270416259765625, -0.772979736328125, -0.7189178466796875, -0.66485595703125, -0.6107940673828125, -0.556732177734375, -0.5026702880859375, -0.4486083984375, -0.3945465087890625, -0.340484619140625, -0.2864227294921875, -0.23236083984375, -0.1782989501953125, -0.124237060546875, -0.0701751708984375, -0.01611328125, 0.0379486083984375, 0.092010498046875, 0.1460723876953125, 0.20013427734375, 0.2541961669921875, 0.308258056640625, 0.3623199462890625, 0.4163818359375, 0.4704437255859375, 0.524505615234375, 0.5785675048828125, 0.63262939453125, 0.6866912841796875, 0.740753173828125, 0.7948150634765625, 0.848876953125, 0.9029388427734375, 0.957000732421875, 1.0110626220703125, 1.06512451171875, 1.1191864013671875, 1.173248291015625, 1.2273101806640625, 1.2813720703125, 1.3354339599609375, 1.389495849609375, 1.4435577392578125, 1.49761962890625, 1.5516815185546875, 1.605743408203125, 1.6598052978515625, 1.7138671875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 8.0, 13.0, 11.0, 16.0, 19.0, 20.0, 38.0, 41.0, 53.0, 68.0, 86.0, 102.0, 118.0, 85.0, 80.0, 56.0, 49.0, 27.0, 34.0, 19.0, 8.0, 11.0, 9.0, 5.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.044318199157715, -7.732737064361572, -7.42115592956543, -7.109575271606445, -6.797994136810303, -6.48641300201416, -6.174832344055176, -5.863251209259033, -5.551670074462891, -5.240088939666748, -4.9285078048706055, -4.616927146911621, -4.3053460121154785, -3.993764877319336, -3.6821839809417725, -3.370603084564209, -3.0590219497680664, -2.747440814971924, -2.4358599185943604, -2.124279022216797, -1.8126978874206543, -1.5011168718338013, -1.1895358562469482, -0.8779549598693848, -0.5663738250732422, -0.25479280948638916, 0.05678820610046387, 0.3683692216873169, 0.6799502372741699, 0.991531252861023, 1.303112268447876, 1.6146931648254395, 1.9262752532958984, 2.237856388092041, 2.5494372844696045, 2.861018180847168, 3.1725993156433105, 3.484180450439453, 3.7957613468170166, 4.10734224319458, 4.418923377990723, 4.730504512786865, 5.042085647583008, 5.353666305541992, 5.665247440338135, 5.976828575134277, 6.288409233093262, 6.599990367889404, 6.911571502685547, 7.2231526374816895, 7.534733772277832, 7.846314430236816, 8.157896041870117, 8.469476699829102, 8.781057357788086, 9.09263801574707, 9.404219627380371, 9.715800285339355, 10.027381896972656, 10.33896255493164, 10.650543212890625, 10.962124824523926, 11.27370548248291, 11.585287094116211, 11.896867752075195]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 5.0, 7.0, 9.0, 10.0, 11.0, 15.0, 19.0, 23.0, 32.0, 30.0, 30.0, 29.0, 43.0, 42.0, 45.0, 45.0, 40.0, 45.0, 44.0, 49.0, 56.0, 48.0, 39.0, 39.0, 27.0, 37.0, 30.0, 23.0, 17.0, 25.0, 18.0, 14.0, 18.0, 7.0, 12.0, 7.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.159510135650635, -4.9949188232421875, -4.83032751083374, -4.665735721588135, -4.5011444091796875, -4.33655309677124, -4.171961784362793, -4.0073699951171875, -3.8427786827087402, -3.678187370300293, -3.5135958194732666, -3.3490045070648193, -3.184412956237793, -3.0198216438293457, -2.8552303314208984, -2.690638780593872, -2.526047468185425, -2.3614561557769775, -2.196864604949951, -2.032273292541504, -1.8676817417144775, -1.7030904293060303, -1.5384989976882935, -1.3739075660705566, -1.2093161344528198, -1.044724702835083, -0.8801332712173462, -0.7155418992042542, -0.5509504675865173, -0.3863590359687805, -0.22176766395568848, -0.05717623233795166, 0.10741519927978516, 0.272006630897522, 0.4365980327129364, 0.6011894345283508, 0.7657808661460876, 0.9303722977638245, 1.0949636697769165, 1.2595551013946533, 1.4241465330123901, 1.588737964630127, 1.7533293962478638, 1.9179208278656006, 2.082512140274048, 2.247103691101074, 2.4116950035095215, 2.5762863159179688, 2.740877866744995, 2.9054691791534424, 3.0700607299804688, 3.234652042388916, 3.3992435932159424, 3.5638349056243896, 3.728426456451416, 3.8930177688598633, 4.0576090812683105, 4.222200393676758, 4.386791706085205, 4.5513834953308105, 4.715974807739258, 4.880566120147705, 5.045157432556152, 5.209749221801758, 5.374340534210205]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 12.0, 26.0, 14.0, 21.0, 44.0, 64.0, 98.0, 145.0, 228.0, 349.0, 524.0, 821.0, 1301.0, 2027.0, 3429.0, 5581.0, 9594.0, 16933.0, 28415.0, 48847.0, 83707.0, 133169.0, 177804.0, 181615.0, 138578.0, 88846.0, 52418.0, 30061.0, 17737.0, 10405.0, 6155.0, 3574.0, 2190.0, 1331.0, 834.0, 533.0, 348.0, 228.0, 154.0, 107.0, 79.0, 62.0, 38.0, 40.0, 17.0, 14.0, 10.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.89453125, -4.7369384765625, -4.579345703125, -4.4217529296875, -4.26416015625, -4.1065673828125, -3.948974609375, -3.7913818359375, -3.6337890625, -3.4761962890625, -3.318603515625, -3.1610107421875, -3.00341796875, -2.8458251953125, -2.688232421875, -2.5306396484375, -2.373046875, -2.2154541015625, -2.057861328125, -1.9002685546875, -1.74267578125, -1.5850830078125, -1.427490234375, -1.2698974609375, -1.1123046875, -0.9547119140625, -0.797119140625, -0.6395263671875, -0.48193359375, -0.3243408203125, -0.166748046875, -0.0091552734375, 0.1484375, 0.3060302734375, 0.463623046875, 0.6212158203125, 0.77880859375, 0.9364013671875, 1.093994140625, 1.2515869140625, 1.4091796875, 1.5667724609375, 1.724365234375, 1.8819580078125, 2.03955078125, 2.1971435546875, 2.354736328125, 2.5123291015625, 2.669921875, 2.8275146484375, 2.985107421875, 3.1427001953125, 3.30029296875, 3.4578857421875, 3.615478515625, 3.7730712890625, 3.9306640625, 4.0882568359375, 4.245849609375, 4.4034423828125, 4.56103515625, 4.7186279296875, 4.876220703125, 5.0338134765625, 5.19140625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 12.0, 8.0, 6.0, 5.0, 18.0, 25.0, 20.0, 26.0, 25.0, 28.0, 32.0, 43.0, 37.0, 38.0, 38.0, 45.0, 49.0, 47.0, 53.0, 49.0, 42.0, 46.0, 47.0, 38.0, 30.0, 35.0, 28.0, 20.0, 18.0, 13.0, 10.0, 18.0, 9.0, 9.0, 10.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.71575927734375, -5.5408935546875, -5.36602783203125, -5.191162109375, -5.01629638671875, -4.8414306640625, -4.66656494140625, -4.49169921875, -4.31683349609375, -4.1419677734375, -3.96710205078125, -3.792236328125, -3.61737060546875, -3.4425048828125, -3.26763916015625, -3.0927734375, -2.91790771484375, -2.7430419921875, -2.56817626953125, -2.393310546875, -2.21844482421875, -2.0435791015625, -1.86871337890625, -1.69384765625, -1.51898193359375, -1.3441162109375, -1.16925048828125, -0.994384765625, -0.81951904296875, -0.6446533203125, -0.46978759765625, -0.294921875, -0.12005615234375, 0.0548095703125, 0.22967529296875, 0.404541015625, 0.57940673828125, 0.7542724609375, 0.92913818359375, 1.10400390625, 1.27886962890625, 1.4537353515625, 1.62860107421875, 1.803466796875, 1.97833251953125, 2.1531982421875, 2.32806396484375, 2.5029296875, 2.67779541015625, 2.8526611328125, 3.02752685546875, 3.202392578125, 3.37725830078125, 3.5521240234375, 3.72698974609375, 3.90185546875, 4.07672119140625, 4.2515869140625, 4.42645263671875, 4.601318359375, 4.77618408203125, 4.9510498046875, 5.12591552734375, 5.30078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 5.0, 14.0, 19.0, 17.0, 38.0, 47.0, 71.0, 124.0, 174.0, 243.0, 376.0, 561.0, 838.0, 1379.0, 2106.0, 3291.0, 5355.0, 8968.0, 14782.0, 24706.0, 41422.0, 68798.0, 106277.0, 149366.0, 171206.0, 153061.0, 111880.0, 72370.0, 43935.0, 26086.0, 15777.0, 9479.0, 5852.0, 3572.0, 2157.0, 1451.0, 954.0, 603.0, 382.0, 262.0, 192.0, 103.0, 85.0, 35.0, 39.0, 23.0, 20.0, 11.0, 8.0, 7.0, 11.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.47088623046875, -4.3245849609375, -4.17828369140625, -4.031982421875, -3.88568115234375, -3.7393798828125, -3.59307861328125, -3.44677734375, -3.30047607421875, -3.1541748046875, -3.00787353515625, -2.861572265625, -2.71527099609375, -2.5689697265625, -2.42266845703125, -2.2763671875, -2.13006591796875, -1.9837646484375, -1.83746337890625, -1.691162109375, -1.54486083984375, -1.3985595703125, -1.25225830078125, -1.10595703125, -0.95965576171875, -0.8133544921875, -0.66705322265625, -0.520751953125, -0.37445068359375, -0.2281494140625, -0.08184814453125, 0.064453125, 0.21075439453125, 0.3570556640625, 0.50335693359375, 0.649658203125, 0.79595947265625, 0.9422607421875, 1.08856201171875, 1.23486328125, 1.38116455078125, 1.5274658203125, 1.67376708984375, 1.820068359375, 1.96636962890625, 2.1126708984375, 2.25897216796875, 2.4052734375, 2.55157470703125, 2.6978759765625, 2.84417724609375, 2.990478515625, 3.13677978515625, 3.2830810546875, 3.42938232421875, 3.57568359375, 3.72198486328125, 3.8682861328125, 4.01458740234375, 4.160888671875, 4.30718994140625, 4.4534912109375, 4.59979248046875, 4.74609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 3.0, 11.0, 14.0, 23.0, 27.0, 23.0, 24.0, 24.0, 24.0, 42.0, 34.0, 39.0, 34.0, 39.0, 38.0, 23.0, 44.0, 53.0, 37.0, 37.0, 44.0, 41.0, 29.0, 28.0, 27.0, 26.0, 28.0, 26.0, 29.0, 18.0, 15.0, 11.0, 10.0, 11.0, 12.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.96875, -2.8792724609375, -2.789794921875, -2.7003173828125, -2.61083984375, -2.5213623046875, -2.431884765625, -2.3424072265625, -2.2529296875, -2.1634521484375, -2.073974609375, -1.9844970703125, -1.89501953125, -1.8055419921875, -1.716064453125, -1.6265869140625, -1.537109375, -1.4476318359375, -1.358154296875, -1.2686767578125, -1.17919921875, -1.0897216796875, -1.000244140625, -0.9107666015625, -0.8212890625, -0.7318115234375, -0.642333984375, -0.5528564453125, -0.46337890625, -0.3739013671875, -0.284423828125, -0.1949462890625, -0.10546875, -0.0159912109375, 0.073486328125, 0.1629638671875, 0.25244140625, 0.3419189453125, 0.431396484375, 0.5208740234375, 0.6103515625, 0.6998291015625, 0.789306640625, 0.8787841796875, 0.96826171875, 1.0577392578125, 1.147216796875, 1.2366943359375, 1.326171875, 1.4156494140625, 1.505126953125, 1.5946044921875, 1.68408203125, 1.7735595703125, 1.863037109375, 1.9525146484375, 2.0419921875, 2.1314697265625, 2.220947265625, 2.3104248046875, 2.39990234375, 2.4893798828125, 2.578857421875, 2.6683349609375, 2.7578125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 8.0, 28.0, 20.0, 37.0, 45.0, 51.0, 57.0, 70.0, 90.0, 129.0, 160.0, 242.0, 344.0, 424.0, 573.0, 915.0, 1395.0, 2519.0, 4562.0, 8763.0, 18039.0, 38493.0, 81953.0, 161565.0, 245188.0, 224747.0, 132442.0, 64285.0, 30134.0, 14349.0, 7125.0, 3685.0, 2035.0, 1225.0, 800.0, 529.0, 361.0, 278.0, 200.0, 163.0, 110.0, 104.0, 54.0, 56.0, 56.0, 37.0, 36.0, 17.0, 18.0, 9.0, 11.0, 7.0, 2.0, 4.0, 0.0, 1.0], "bins": [-3.017578125, -2.925689697265625, -2.83380126953125, -2.741912841796875, -2.6500244140625, -2.558135986328125, -2.46624755859375, -2.374359130859375, -2.282470703125, -2.190582275390625, -2.09869384765625, -2.006805419921875, -1.9149169921875, -1.823028564453125, -1.73114013671875, -1.639251708984375, -1.54736328125, -1.455474853515625, -1.36358642578125, -1.271697998046875, -1.1798095703125, -1.087921142578125, -0.99603271484375, -0.904144287109375, -0.812255859375, -0.720367431640625, -0.62847900390625, -0.536590576171875, -0.4447021484375, -0.352813720703125, -0.26092529296875, -0.169036865234375, -0.0771484375, 0.014739990234375, 0.10662841796875, 0.198516845703125, 0.2904052734375, 0.382293701171875, 0.47418212890625, 0.566070556640625, 0.657958984375, 0.749847412109375, 0.84173583984375, 0.933624267578125, 1.0255126953125, 1.117401123046875, 1.20928955078125, 1.301177978515625, 1.39306640625, 1.484954833984375, 1.57684326171875, 1.668731689453125, 1.7606201171875, 1.852508544921875, 1.94439697265625, 2.036285400390625, 2.128173828125, 2.220062255859375, 2.31195068359375, 2.403839111328125, 2.4957275390625, 2.587615966796875, 2.67950439453125, 2.771392822265625, 2.86328125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 13.0, 11.0, 18.0, 20.0, 28.0, 46.0, 51.0, 63.0, 69.0, 82.0, 76.0, 83.0, 75.0, 67.0, 56.0, 58.0, 46.0, 30.0, 20.0, 12.0, 18.0, 5.0, 9.0, 4.0, 4.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00034880638122558594, -0.00034005753695964813, -0.00033130869269371033, -0.0003225598484277725, -0.0003138110041618347, -0.0003050621598958969, -0.0002963133156299591, -0.0002875644713640213, -0.0002788156270980835, -0.0002700667828321457, -0.0002613179385662079, -0.0002525690943002701, -0.00024382025003433228, -0.00023507140576839447, -0.00022632256150245667, -0.00021757371723651886, -0.00020882487297058105, -0.00020007602870464325, -0.00019132718443870544, -0.00018257834017276764, -0.00017382949590682983, -0.00016508065164089203, -0.00015633180737495422, -0.00014758296310901642, -0.0001388341188430786, -0.0001300852745771408, -0.000121336430311203, -0.0001125875860452652, -0.00010383874177932739, -9.508989751338959e-05, -8.634105324745178e-05, -7.759220898151398e-05, -6.884336471557617e-05, -6.009452044963837e-05, -5.134567618370056e-05, -4.2596831917762756e-05, -3.384798765182495e-05, -2.5099143385887146e-05, -1.635029911994934e-05, -7.601454854011536e-06, 1.1473894119262695e-06, 9.896233677864075e-06, 1.864507794380188e-05, 2.7393922209739685e-05, 3.614276647567749e-05, 4.4891610741615295e-05, 5.36404550075531e-05, 6.23892992734909e-05, 7.113814353942871e-05, 7.988698780536652e-05, 8.863583207130432e-05, 9.738467633724213e-05, 0.00010613352060317993, 0.00011488236486911774, 0.00012363120913505554, 0.00013238005340099335, 0.00014112889766693115, 0.00014987774193286896, 0.00015862658619880676, 0.00016737543046474457, 0.00017612427473068237, 0.00018487311899662018, 0.00019362196326255798, 0.0002023708075284958, 0.0002111196517944336]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 11.0, 16.0, 10.0, 18.0, 20.0, 28.0, 48.0, 73.0, 110.0, 168.0, 322.0, 623.0, 1271.0, 2799.0, 7273.0, 20867.0, 66427.0, 205613.0, 379688.0, 241629.0, 81092.0, 25380.0, 8725.0, 3253.0, 1402.0, 712.0, 381.0, 198.0, 119.0, 91.0, 43.0, 39.0, 16.0, 18.0, 19.0, 15.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.96484375, -4.8170166015625, -4.669189453125, -4.5213623046875, -4.37353515625, -4.2257080078125, -4.077880859375, -3.9300537109375, -3.7822265625, -3.6343994140625, -3.486572265625, -3.3387451171875, -3.19091796875, -3.0430908203125, -2.895263671875, -2.7474365234375, -2.599609375, -2.4517822265625, -2.303955078125, -2.1561279296875, -2.00830078125, -1.8604736328125, -1.712646484375, -1.5648193359375, -1.4169921875, -1.2691650390625, -1.121337890625, -0.9735107421875, -0.82568359375, -0.6778564453125, -0.530029296875, -0.3822021484375, -0.234375, -0.0865478515625, 0.061279296875, 0.2091064453125, 0.35693359375, 0.5047607421875, 0.652587890625, 0.8004150390625, 0.9482421875, 1.0960693359375, 1.243896484375, 1.3917236328125, 1.53955078125, 1.6873779296875, 1.835205078125, 1.9830322265625, 2.130859375, 2.2786865234375, 2.426513671875, 2.5743408203125, 2.72216796875, 2.8699951171875, 3.017822265625, 3.1656494140625, 3.3134765625, 3.4613037109375, 3.609130859375, 3.7569580078125, 3.90478515625, 4.0526123046875, 4.200439453125, 4.3482666015625, 4.49609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 15.0, 7.0, 17.0, 11.0, 27.0, 33.0, 33.0, 58.0, 52.0, 64.0, 68.0, 81.0, 77.0, 77.0, 80.0, 53.0, 59.0, 53.0, 41.0, 22.0, 22.0, 14.0, 11.0, 15.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2505264282226562, -1.2188262939453125, -1.1871261596679688, -1.155426025390625, -1.1237258911132812, -1.0920257568359375, -1.0603256225585938, -1.02862548828125, -0.9969253540039062, -0.9652252197265625, -0.9335250854492188, -0.901824951171875, -0.8701248168945312, -0.8384246826171875, -0.8067245483398438, -0.7750244140625, -0.7433242797851562, -0.7116241455078125, -0.6799240112304688, -0.648223876953125, -0.6165237426757812, -0.5848236083984375, -0.5531234741210938, -0.52142333984375, -0.48972320556640625, -0.4580230712890625, -0.42632293701171875, -0.394622802734375, -0.36292266845703125, -0.3312225341796875, -0.29952239990234375, -0.267822265625, -0.23612213134765625, -0.2044219970703125, -0.17272186279296875, -0.141021728515625, -0.10932159423828125, -0.0776214599609375, -0.04592132568359375, -0.01422119140625, 0.01747894287109375, 0.0491790771484375, 0.08087921142578125, 0.112579345703125, 0.14427947998046875, 0.1759796142578125, 0.20767974853515625, 0.2393798828125, 0.27108001708984375, 0.3027801513671875, 0.33448028564453125, 0.366180419921875, 0.39788055419921875, 0.4295806884765625, 0.46128082275390625, 0.49298095703125, 0.5246810913085938, 0.5563812255859375, 0.5880813598632812, 0.619781494140625, 0.6514816284179688, 0.6831817626953125, 0.7148818969726562, 0.74658203125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 13.0, 18.0, 18.0, 21.0, 22.0, 28.0, 49.0, 60.0, 68.0, 102.0, 92.0, 97.0, 113.0, 75.0, 52.0, 40.0, 31.0, 29.0, 15.0, 13.0, 11.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.124826431274414, -8.80727767944336, -8.489727973937988, -8.172179222106934, -7.8546295166015625, -7.53708028793335, -7.219531059265137, -6.901982307434082, -6.584432601928711, -6.266883373260498, -5.949334144592285, -5.631784915924072, -5.314235687255859, -4.9966864585876465, -4.679137229919434, -4.361588478088379, -4.044039249420166, -3.726490020751953, -3.4089407920837402, -3.0913915634155273, -2.7738423347473145, -2.4562931060791016, -2.1387441158294678, -1.8211948871612549, -1.503645658493042, -1.186096429824829, -0.868547260761261, -0.5509980916976929, -0.23344886302947998, 0.08410036563873291, 0.40164947509765625, 0.7191987037658691, 1.036747932434082, 1.354297161102295, 1.6718463897705078, 1.9893954992294312, 2.3069448471069336, 2.6244940757751465, 2.9420430660247803, 3.259592294692993, 3.577141523361206, 3.894690752029419, 4.212239742279053, 4.529788970947266, 4.8473381996154785, 5.164887428283691, 5.482436656951904, 5.799985885620117, 6.11753511428833, 6.435084342956543, 6.752633571624756, 7.070182800292969, 7.387732028961182, 7.7052812576293945, 8.02283000946045, 8.34037971496582, 8.657928466796875, 8.97547721862793, 9.2930269241333, 9.610575675964355, 9.928125381469727, 10.245674133300781, 10.563223838806152, 10.880772590637207, 11.198322296142578]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 5.0, 16.0, 14.0, 19.0, 18.0, 15.0, 21.0, 24.0, 34.0, 41.0, 43.0, 42.0, 38.0, 44.0, 43.0, 54.0, 50.0, 44.0, 46.0, 39.0, 52.0, 36.0, 29.0, 40.0, 22.0, 23.0, 23.0, 19.0, 24.0, 13.0, 8.0, 15.0, 15.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.089992046356201, -4.92699670791626, -4.764001846313477, -4.601006507873535, -4.438011169433594, -4.2750163078308105, -4.112020969390869, -3.949025869369507, -3.7860307693481445, -3.6230356693267822, -3.46004056930542, -3.2970452308654785, -3.134050130844116, -2.971055030822754, -2.8080596923828125, -2.64506459236145, -2.482069492340088, -2.3190743923187256, -2.1560792922973633, -1.9930839538574219, -1.8300888538360596, -1.6670937538146973, -1.5040985345840454, -1.3411033153533936, -1.1781082153320312, -1.015113115310669, -0.8521178960800171, -0.68912273645401, -0.5261275768280029, -0.36313241720199585, -0.20013725757598877, -0.037142038345336914, 0.1258525848388672, 0.28884774446487427, 0.45184290409088135, 0.6148380637168884, 0.7778332233428955, 0.9408283829689026, 1.1038235425949097, 1.2668187618255615, 1.4298138618469238, 1.5928089618682861, 1.755804181098938, 1.9187994003295898, 2.081794500350952, 2.2447896003723145, 2.407784938812256, 2.570780038833618, 2.7337751388549805, 2.8967702388763428, 3.059765338897705, 3.2227606773376465, 3.385755777359009, 3.548750877380371, 3.7117462158203125, 3.874741315841675, 4.037736415863037, 4.2007317543029785, 4.363726615905762, 4.526721954345703, 4.6897172927856445, 4.852712154388428, 5.015707492828369, 5.178702354431152, 5.341697692871094]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 2.0, 2.0, 11.0, 11.0, 24.0, 18.0, 33.0, 52.0, 81.0, 98.0, 139.0, 206.0, 295.0, 427.0, 655.0, 1028.0, 1634.0, 2527.0, 4306.0, 7350.0, 13389.0, 26268.0, 55055.0, 129156.0, 346722.0, 919553.0, 1379129.0, 796317.0, 292754.0, 111888.0, 49362.0, 24314.0, 12913.0, 7203.0, 4208.0, 2528.0, 1552.0, 1000.0, 706.0, 452.0, 293.0, 191.0, 124.0, 80.0, 69.0, 45.0, 33.0, 20.0, 19.0, 7.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0], "bins": [-7.62890625, -7.400634765625, -7.17236328125, -6.944091796875, -6.7158203125, -6.487548828125, -6.25927734375, -6.031005859375, -5.802734375, -5.574462890625, -5.34619140625, -5.117919921875, -4.8896484375, -4.661376953125, -4.43310546875, -4.204833984375, -3.9765625, -3.748291015625, -3.52001953125, -3.291748046875, -3.0634765625, -2.835205078125, -2.60693359375, -2.378662109375, -2.150390625, -1.922119140625, -1.69384765625, -1.465576171875, -1.2373046875, -1.009033203125, -0.78076171875, -0.552490234375, -0.32421875, -0.095947265625, 0.13232421875, 0.360595703125, 0.5888671875, 0.817138671875, 1.04541015625, 1.273681640625, 1.501953125, 1.730224609375, 1.95849609375, 2.186767578125, 2.4150390625, 2.643310546875, 2.87158203125, 3.099853515625, 3.328125, 3.556396484375, 3.78466796875, 4.012939453125, 4.2412109375, 4.469482421875, 4.69775390625, 4.926025390625, 5.154296875, 5.382568359375, 5.61083984375, 5.839111328125, 6.0673828125, 6.295654296875, 6.52392578125, 6.752197265625, 6.98046875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 13.0, 11.0, 13.0, 19.0, 16.0, 18.0, 19.0, 21.0, 29.0, 39.0, 42.0, 45.0, 45.0, 44.0, 62.0, 57.0, 55.0, 52.0, 58.0, 29.0, 37.0, 32.0, 27.0, 32.0, 24.0, 24.0, 31.0, 20.0, 16.0, 16.0, 13.0, 10.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9375, -3.8143310546875, -3.691162109375, -3.5679931640625, -3.44482421875, -3.3216552734375, -3.198486328125, -3.0753173828125, -2.9521484375, -2.8289794921875, -2.705810546875, -2.5826416015625, -2.45947265625, -2.3363037109375, -2.213134765625, -2.0899658203125, -1.966796875, -1.8436279296875, -1.720458984375, -1.5972900390625, -1.47412109375, -1.3509521484375, -1.227783203125, -1.1046142578125, -0.9814453125, -0.8582763671875, -0.735107421875, -0.6119384765625, -0.48876953125, -0.3656005859375, -0.242431640625, -0.1192626953125, 0.00390625, 0.1270751953125, 0.250244140625, 0.3734130859375, 0.49658203125, 0.6197509765625, 0.742919921875, 0.8660888671875, 0.9892578125, 1.1124267578125, 1.235595703125, 1.3587646484375, 1.48193359375, 1.6051025390625, 1.728271484375, 1.8514404296875, 1.974609375, 2.0977783203125, 2.220947265625, 2.3441162109375, 2.46728515625, 2.5904541015625, 2.713623046875, 2.8367919921875, 2.9599609375, 3.0831298828125, 3.206298828125, 3.3294677734375, 3.45263671875, 3.5758056640625, 3.698974609375, 3.8221435546875, 3.9453125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 8.0, 10.0, 24.0, 13.0, 34.0, 42.0, 68.0, 87.0, 149.0, 186.0, 276.0, 441.0, 644.0, 1060.0, 1728.0, 2733.0, 4567.0, 8082.0, 14428.0, 27094.0, 54775.0, 116687.0, 267303.0, 642831.0, 1253124.0, 1004653.0, 437803.0, 184706.0, 83017.0, 40224.0, 20479.0, 10942.0, 6201.0, 3696.0, 2274.0, 1373.0, 847.0, 550.0, 364.0, 243.0, 174.0, 121.0, 61.0, 54.0, 30.0, 24.0, 19.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.44921875, -7.20721435546875, -6.9652099609375, -6.72320556640625, -6.481201171875, -6.23919677734375, -5.9971923828125, -5.75518798828125, -5.51318359375, -5.27117919921875, -5.0291748046875, -4.78717041015625, -4.545166015625, -4.30316162109375, -4.0611572265625, -3.81915283203125, -3.5771484375, -3.33514404296875, -3.0931396484375, -2.85113525390625, -2.609130859375, -2.36712646484375, -2.1251220703125, -1.88311767578125, -1.64111328125, -1.39910888671875, -1.1571044921875, -0.91510009765625, -0.673095703125, -0.43109130859375, -0.1890869140625, 0.05291748046875, 0.294921875, 0.53692626953125, 0.7789306640625, 1.02093505859375, 1.262939453125, 1.50494384765625, 1.7469482421875, 1.98895263671875, 2.23095703125, 2.47296142578125, 2.7149658203125, 2.95697021484375, 3.198974609375, 3.44097900390625, 3.6829833984375, 3.92498779296875, 4.1669921875, 4.40899658203125, 4.6510009765625, 4.89300537109375, 5.135009765625, 5.37701416015625, 5.6190185546875, 5.86102294921875, 6.10302734375, 6.34503173828125, 6.5870361328125, 6.82904052734375, 7.071044921875, 7.31304931640625, 7.5550537109375, 7.79705810546875, 8.0390625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 5.0, 4.0, 10.0, 9.0, 15.0, 17.0, 23.0, 33.0, 36.0, 52.0, 47.0, 88.0, 118.0, 148.0, 192.0, 225.0, 283.0, 308.0, 334.0, 351.0, 307.0, 289.0, 275.0, 199.0, 180.0, 111.0, 113.0, 73.0, 62.0, 53.0, 31.0, 19.0, 14.0, 10.0, 5.0, 8.0, 4.0, 6.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.156524658203125, -2.08258056640625, -2.008636474609375, -1.9346923828125, -1.860748291015625, -1.78680419921875, -1.712860107421875, -1.638916015625, -1.564971923828125, -1.49102783203125, -1.417083740234375, -1.3431396484375, -1.269195556640625, -1.19525146484375, -1.121307373046875, -1.04736328125, -0.973419189453125, -0.89947509765625, -0.825531005859375, -0.7515869140625, -0.677642822265625, -0.60369873046875, -0.529754638671875, -0.455810546875, -0.381866455078125, -0.30792236328125, -0.233978271484375, -0.1600341796875, -0.086090087890625, -0.01214599609375, 0.061798095703125, 0.1357421875, 0.209686279296875, 0.28363037109375, 0.357574462890625, 0.4315185546875, 0.505462646484375, 0.57940673828125, 0.653350830078125, 0.727294921875, 0.801239013671875, 0.87518310546875, 0.949127197265625, 1.0230712890625, 1.097015380859375, 1.17095947265625, 1.244903564453125, 1.31884765625, 1.392791748046875, 1.46673583984375, 1.540679931640625, 1.6146240234375, 1.688568115234375, 1.76251220703125, 1.836456298828125, 1.910400390625, 1.984344482421875, 2.05828857421875, 2.132232666015625, 2.2061767578125, 2.280120849609375, 2.35406494140625, 2.428009033203125, 2.501953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 1.0, 3.0, 11.0, 10.0, 16.0, 12.0, 32.0, 24.0, 29.0, 48.0, 51.0, 56.0, 69.0, 90.0, 93.0, 77.0, 86.0, 66.0, 49.0, 49.0, 33.0, 21.0, 21.0, 15.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.17936897277832, -8.893779754638672, -8.60819149017334, -8.322602272033691, -8.03701400756836, -7.751424789428711, -7.465836048126221, -7.1802473068237305, -6.89465856552124, -6.60906982421875, -6.32348108291626, -6.0378923416137695, -5.752303123474121, -5.466714859008789, -5.181125640869141, -4.89553689956665, -4.60994815826416, -4.32435941696167, -4.03877067565918, -3.7531816959381104, -3.46759295463562, -3.18200421333313, -2.8964152336120605, -2.6108264923095703, -2.32523775100708, -2.03964900970459, -1.75406014919281, -1.4684712886810303, -1.18288254737854, -0.8972938060760498, -0.61170494556427, -0.32611608505249023, -0.040526390075683594, 0.24506241083145142, 0.5306512117385864, 0.8162400126457214, 1.1018288135528564, 1.3874175548553467, 1.6730064153671265, 1.9585952758789062, 2.2441840171813965, 2.5297727584838867, 2.815361499786377, 3.1009504795074463, 3.3865392208099365, 3.6721279621124268, 3.957716941833496, 4.243305683135986, 4.528894424438477, 4.814483165740967, 5.100071907043457, 5.385660648345947, 5.6712493896484375, 5.956838607788086, 6.242427349090576, 6.528016090393066, 6.813604831695557, 7.099193572998047, 7.384782314300537, 7.670371055603027, 7.955960273742676, 8.241548538208008, 8.527137756347656, 8.812726974487305, 9.098315238952637]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 9.0, 6.0, 7.0, 8.0, 11.0, 10.0, 22.0, 18.0, 30.0, 22.0, 28.0, 28.0, 43.0, 41.0, 53.0, 46.0, 46.0, 38.0, 49.0, 49.0, 46.0, 49.0, 32.0, 40.0, 41.0, 34.0, 23.0, 36.0, 20.0, 24.0, 23.0, 14.0, 13.0, 15.0, 8.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3765716552734375, -4.217191219329834, -4.057810306549072, -3.8984296321868896, -3.739048957824707, -3.5796685218811035, -3.420287847518921, -3.2609071731567383, -3.1015264987945557, -2.942145824432373, -2.7827651500701904, -2.623384475708008, -2.4640040397644043, -2.3046231269836426, -2.145242691040039, -1.9858620166778564, -1.8264813423156738, -1.6671006679534912, -1.5077199935913086, -1.3483394384384155, -1.188958764076233, -1.0295780897140503, -0.8701974749565125, -0.7108168601989746, -0.551436185836792, -0.39205554127693176, -0.23267489671707153, -0.0732942521572113, 0.08608639240264893, 0.24546706676483154, 0.4048476815223694, 0.5642282962799072, 0.7236084938049316, 0.8829891681671143, 1.0423698425292969, 1.20175039768219, 1.3611310720443726, 1.5205117464065552, 1.6798923015594482, 1.8392729759216309, 1.9986536502838135, 2.158034324645996, 2.3174149990081787, 2.4767956733703613, 2.636176109313965, 2.7955570220947266, 2.95493745803833, 3.1143181324005127, 3.2736988067626953, 3.433079481124878, 3.5924601554870605, 3.751840829849243, 3.911221504211426, 4.070601940155029, 4.229982852935791, 4.3893632888793945, 4.548744201660156, 4.70812463760376, 4.8675055503845215, 5.026885986328125, 5.186266899108887, 5.34564733505249, 5.505028247833252, 5.6644086837768555, 5.823789119720459]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 4.0, 11.0, 26.0, 36.0, 52.0, 73.0, 107.0, 195.0, 308.0, 527.0, 840.0, 1388.0, 2590.0, 4672.0, 8653.0, 17353.0, 37485.0, 81235.0, 174517.0, 283598.0, 225020.0, 111016.0, 50153.0, 23693.0, 11506.0, 5920.0, 3113.0, 1788.0, 1037.0, 600.0, 340.0, 229.0, 157.0, 111.0, 58.0, 38.0, 30.0, 23.0, 7.0, 13.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5703125, -5.38885498046875, -5.2073974609375, -5.02593994140625, -4.844482421875, -4.66302490234375, -4.4815673828125, -4.30010986328125, -4.11865234375, -3.93719482421875, -3.7557373046875, -3.57427978515625, -3.392822265625, -3.21136474609375, -3.0299072265625, -2.84844970703125, -2.6669921875, -2.48553466796875, -2.3040771484375, -2.12261962890625, -1.941162109375, -1.75970458984375, -1.5782470703125, -1.39678955078125, -1.21533203125, -1.03387451171875, -0.8524169921875, -0.67095947265625, -0.489501953125, -0.30804443359375, -0.1265869140625, 0.05487060546875, 0.236328125, 0.41778564453125, 0.5992431640625, 0.78070068359375, 0.962158203125, 1.14361572265625, 1.3250732421875, 1.50653076171875, 1.68798828125, 1.86944580078125, 2.0509033203125, 2.23236083984375, 2.413818359375, 2.59527587890625, 2.7767333984375, 2.95819091796875, 3.1396484375, 3.32110595703125, 3.5025634765625, 3.68402099609375, 3.865478515625, 4.04693603515625, 4.2283935546875, 4.40985107421875, 4.59130859375, 4.77276611328125, 4.9542236328125, 5.13568115234375, 5.317138671875, 5.49859619140625, 5.6800537109375, 5.86151123046875, 6.04296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 8.0, 8.0, 6.0, 7.0, 14.0, 18.0, 14.0, 18.0, 26.0, 32.0, 34.0, 30.0, 36.0, 38.0, 48.0, 45.0, 40.0, 46.0, 52.0, 48.0, 44.0, 51.0, 43.0, 40.0, 34.0, 25.0, 35.0, 28.0, 16.0, 17.0, 16.0, 14.0, 12.0, 9.0, 16.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91015625, -4.74749755859375, -4.5848388671875, -4.42218017578125, -4.259521484375, -4.09686279296875, -3.9342041015625, -3.77154541015625, -3.60888671875, -3.44622802734375, -3.2835693359375, -3.12091064453125, -2.958251953125, -2.79559326171875, -2.6329345703125, -2.47027587890625, -2.3076171875, -2.14495849609375, -1.9822998046875, -1.81964111328125, -1.656982421875, -1.49432373046875, -1.3316650390625, -1.16900634765625, -1.00634765625, -0.84368896484375, -0.6810302734375, -0.51837158203125, -0.355712890625, -0.19305419921875, -0.0303955078125, 0.13226318359375, 0.294921875, 0.45758056640625, 0.6202392578125, 0.78289794921875, 0.945556640625, 1.10821533203125, 1.2708740234375, 1.43353271484375, 1.59619140625, 1.75885009765625, 1.9215087890625, 2.08416748046875, 2.246826171875, 2.40948486328125, 2.5721435546875, 2.73480224609375, 2.8974609375, 3.06011962890625, 3.2227783203125, 3.38543701171875, 3.548095703125, 3.71075439453125, 3.8734130859375, 4.03607177734375, 4.19873046875, 4.36138916015625, 4.5240478515625, 4.68670654296875, 4.849365234375, 5.01202392578125, 5.1746826171875, 5.33734130859375, 5.5]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 8.0, 4.0, 19.0, 17.0, 26.0, 37.0, 64.0, 74.0, 125.0, 178.0, 273.0, 476.0, 711.0, 1052.0, 1814.0, 3031.0, 5308.0, 9890.0, 19538.0, 42190.0, 95148.0, 213504.0, 311963.0, 186617.0, 81804.0, 36646.0, 17078.0, 8867.0, 4867.0, 2753.0, 1575.0, 1037.0, 597.0, 444.0, 253.0, 174.0, 118.0, 79.0, 60.0, 48.0, 35.0, 15.0, 7.0, 10.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.62890625, -6.42437744140625, -6.2198486328125, -6.01531982421875, -5.810791015625, -5.60626220703125, -5.4017333984375, -5.19720458984375, -4.99267578125, -4.78814697265625, -4.5836181640625, -4.37908935546875, -4.174560546875, -3.97003173828125, -3.7655029296875, -3.56097412109375, -3.3564453125, -3.15191650390625, -2.9473876953125, -2.74285888671875, -2.538330078125, -2.33380126953125, -2.1292724609375, -1.92474365234375, -1.72021484375, -1.51568603515625, -1.3111572265625, -1.10662841796875, -0.902099609375, -0.69757080078125, -0.4930419921875, -0.28851318359375, -0.083984375, 0.12054443359375, 0.3250732421875, 0.52960205078125, 0.734130859375, 0.93865966796875, 1.1431884765625, 1.34771728515625, 1.55224609375, 1.75677490234375, 1.9613037109375, 2.16583251953125, 2.370361328125, 2.57489013671875, 2.7794189453125, 2.98394775390625, 3.1884765625, 3.39300537109375, 3.5975341796875, 3.80206298828125, 4.006591796875, 4.21112060546875, 4.4156494140625, 4.62017822265625, 4.82470703125, 5.02923583984375, 5.2337646484375, 5.43829345703125, 5.642822265625, 5.84735107421875, 6.0518798828125, 6.25640869140625, 6.4609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 4.0, 7.0, 8.0, 13.0, 17.0, 10.0, 15.0, 27.0, 26.0, 20.0, 29.0, 20.0, 26.0, 43.0, 36.0, 43.0, 47.0, 37.0, 43.0, 34.0, 34.0, 53.0, 36.0, 27.0, 29.0, 39.0, 33.0, 28.0, 29.0, 24.0, 19.0, 21.0, 22.0, 19.0, 16.0, 20.0, 10.0, 8.0, 5.0, 10.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.818359375, -2.733062744140625, -2.64776611328125, -2.562469482421875, -2.4771728515625, -2.391876220703125, -2.30657958984375, -2.221282958984375, -2.135986328125, -2.050689697265625, -1.96539306640625, -1.880096435546875, -1.7947998046875, -1.709503173828125, -1.62420654296875, -1.538909912109375, -1.45361328125, -1.368316650390625, -1.28302001953125, -1.197723388671875, -1.1124267578125, -1.027130126953125, -0.94183349609375, -0.856536865234375, -0.771240234375, -0.685943603515625, -0.60064697265625, -0.515350341796875, -0.4300537109375, -0.344757080078125, -0.25946044921875, -0.174163818359375, -0.0888671875, -0.003570556640625, 0.08172607421875, 0.167022705078125, 0.2523193359375, 0.337615966796875, 0.42291259765625, 0.508209228515625, 0.593505859375, 0.678802490234375, 0.76409912109375, 0.849395751953125, 0.9346923828125, 1.019989013671875, 1.10528564453125, 1.190582275390625, 1.27587890625, 1.361175537109375, 1.44647216796875, 1.531768798828125, 1.6170654296875, 1.702362060546875, 1.78765869140625, 1.872955322265625, 1.958251953125, 2.043548583984375, 2.12884521484375, 2.214141845703125, 2.2994384765625, 2.384735107421875, 2.47003173828125, 2.555328369140625, 2.640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 16.0, 11.0, 15.0, 24.0, 28.0, 34.0, 48.0, 74.0, 99.0, 113.0, 161.0, 232.0, 346.0, 449.0, 724.0, 988.0, 1464.0, 2270.0, 3751.0, 6367.0, 12169.0, 25872.0, 65131.0, 189061.0, 400142.0, 208083.0, 71418.0, 28157.0, 13115.0, 6851.0, 3884.0, 2420.0, 1599.0, 1061.0, 731.0, 446.0, 300.0, 233.0, 198.0, 142.0, 87.0, 82.0, 49.0, 25.0, 30.0, 17.0, 10.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.6171875, -3.498779296875, -3.38037109375, -3.261962890625, -3.1435546875, -3.025146484375, -2.90673828125, -2.788330078125, -2.669921875, -2.551513671875, -2.43310546875, -2.314697265625, -2.1962890625, -2.077880859375, -1.95947265625, -1.841064453125, -1.72265625, -1.604248046875, -1.48583984375, -1.367431640625, -1.2490234375, -1.130615234375, -1.01220703125, -0.893798828125, -0.775390625, -0.656982421875, -0.53857421875, -0.420166015625, -0.3017578125, -0.183349609375, -0.06494140625, 0.053466796875, 0.171875, 0.290283203125, 0.40869140625, 0.527099609375, 0.6455078125, 0.763916015625, 0.88232421875, 1.000732421875, 1.119140625, 1.237548828125, 1.35595703125, 1.474365234375, 1.5927734375, 1.711181640625, 1.82958984375, 1.947998046875, 2.06640625, 2.184814453125, 2.30322265625, 2.421630859375, 2.5400390625, 2.658447265625, 2.77685546875, 2.895263671875, 3.013671875, 3.132080078125, 3.25048828125, 3.368896484375, 3.4873046875, 3.605712890625, 3.72412109375, 3.842529296875, 3.9609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 8.0, 10.0, 24.0, 24.0, 30.0, 38.0, 41.0, 74.0, 79.0, 87.0, 101.0, 90.0, 75.0, 56.0, 61.0, 25.0, 34.0, 31.0, 19.0, 14.0, 14.0, 10.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014448165893554688, -0.00013866834342479706, -0.00013285502791404724, -0.00012704171240329742, -0.00012122839689254761, -0.00011541508138179779, -0.00010960176587104797, -0.00010378845036029816, -9.797513484954834e-05, -9.216181933879852e-05, -8.63485038280487e-05, -8.053518831729889e-05, -7.472187280654907e-05, -6.890855729579926e-05, -6.309524178504944e-05, -5.728192627429962e-05, -5.1468610763549805e-05, -4.565529525279999e-05, -3.984197974205017e-05, -3.4028664231300354e-05, -2.8215348720550537e-05, -2.240203320980072e-05, -1.6588717699050903e-05, -1.0775402188301086e-05, -4.9620866775512695e-06, 8.512288331985474e-07, 6.664544343948364e-06, 1.2477859854698181e-05, 1.8291175365447998e-05, 2.4104490876197815e-05, 2.9917806386947632e-05, 3.573112189769745e-05, 4.1544437408447266e-05, 4.735775291919708e-05, 5.31710684299469e-05, 5.8984383940696716e-05, 6.479769945144653e-05, 7.061101496219635e-05, 7.642433047294617e-05, 8.223764598369598e-05, 8.80509614944458e-05, 9.386427700519562e-05, 9.967759251594543e-05, 0.00010549090802669525, 0.00011130422353744507, 0.00011711753904819489, 0.0001229308545589447, 0.00012874417006969452, 0.00013455748558044434, 0.00014037080109119415, 0.00014618411660194397, 0.0001519974321126938, 0.0001578107476234436, 0.00016362406313419342, 0.00016943737864494324, 0.00017525069415569305, 0.00018106400966644287, 0.0001868773251771927, 0.0001926906406879425, 0.00019850395619869232, 0.00020431727170944214, 0.00021013058722019196, 0.00021594390273094177, 0.0002217572182416916, 0.0002275705337524414]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 4.0, 9.0, 16.0, 27.0, 33.0, 56.0, 66.0, 121.0, 160.0, 244.0, 339.0, 577.0, 839.0, 1352.0, 2100.0, 3521.0, 6047.0, 11851.0, 26875.0, 72533.0, 212363.0, 372850.0, 210786.0, 72010.0, 26498.0, 11859.0, 6092.0, 3500.0, 2014.0, 1300.0, 824.0, 550.0, 375.0, 253.0, 147.0, 118.0, 73.0, 40.0, 37.0, 31.0, 17.0, 13.0, 9.0, 8.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.188873291015625, -3.07696533203125, -2.965057373046875, -2.8531494140625, -2.741241455078125, -2.62933349609375, -2.517425537109375, -2.405517578125, -2.293609619140625, -2.18170166015625, -2.069793701171875, -1.9578857421875, -1.845977783203125, -1.73406982421875, -1.622161865234375, -1.51025390625, -1.398345947265625, -1.28643798828125, -1.174530029296875, -1.0626220703125, -0.950714111328125, -0.83880615234375, -0.726898193359375, -0.614990234375, -0.503082275390625, -0.39117431640625, -0.279266357421875, -0.1673583984375, -0.055450439453125, 0.05645751953125, 0.168365478515625, 0.2802734375, 0.392181396484375, 0.50408935546875, 0.615997314453125, 0.7279052734375, 0.839813232421875, 0.95172119140625, 1.063629150390625, 1.175537109375, 1.287445068359375, 1.39935302734375, 1.511260986328125, 1.6231689453125, 1.735076904296875, 1.84698486328125, 1.958892822265625, 2.07080078125, 2.182708740234375, 2.29461669921875, 2.406524658203125, 2.5184326171875, 2.630340576171875, 2.74224853515625, 2.854156494140625, 2.966064453125, 3.077972412109375, 3.18988037109375, 3.301788330078125, 3.4136962890625, 3.525604248046875, 3.63751220703125, 3.749420166015625, 3.861328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 10.0, 10.0, 20.0, 10.0, 21.0, 33.0, 45.0, 59.0, 72.0, 85.0, 96.0, 77.0, 73.0, 72.0, 87.0, 52.0, 52.0, 27.0, 31.0, 12.0, 5.0, 10.0, 6.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90625, -0.878387451171875, -0.85052490234375, -0.822662353515625, -0.7947998046875, -0.766937255859375, -0.73907470703125, -0.711212158203125, -0.683349609375, -0.655487060546875, -0.62762451171875, -0.599761962890625, -0.5718994140625, -0.544036865234375, -0.51617431640625, -0.488311767578125, -0.46044921875, -0.432586669921875, -0.40472412109375, -0.376861572265625, -0.3489990234375, -0.321136474609375, -0.29327392578125, -0.265411376953125, -0.237548828125, -0.209686279296875, -0.18182373046875, -0.153961181640625, -0.1260986328125, -0.098236083984375, -0.07037353515625, -0.042510986328125, -0.0146484375, 0.013214111328125, 0.04107666015625, 0.068939208984375, 0.0968017578125, 0.124664306640625, 0.15252685546875, 0.180389404296875, 0.208251953125, 0.236114501953125, 0.26397705078125, 0.291839599609375, 0.3197021484375, 0.347564697265625, 0.37542724609375, 0.403289794921875, 0.43115234375, 0.459014892578125, 0.48687744140625, 0.514739990234375, 0.5426025390625, 0.570465087890625, 0.59832763671875, 0.626190185546875, 0.654052734375, 0.681915283203125, 0.70977783203125, 0.737640380859375, 0.7655029296875, 0.793365478515625, 0.82122802734375, 0.849090576171875, 0.876953125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 3.0, 8.0, 13.0, 12.0, 16.0, 18.0, 20.0, 25.0, 44.0, 30.0, 43.0, 54.0, 73.0, 81.0, 95.0, 77.0, 77.0, 63.0, 45.0, 55.0, 38.0, 26.0, 17.0, 16.0, 14.0, 9.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.284247398376465, -8.018978118896484, -7.75370979309082, -7.48844051361084, -7.223171710968018, -6.957902908325195, -6.692633628845215, -6.427364826202393, -6.16209602355957, -5.896827220916748, -5.631558418273926, -5.366289138793945, -5.101020336151123, -4.835751533508301, -4.57048225402832, -4.305213451385498, -4.039944648742676, -3.7746758460998535, -3.509406805038452, -3.244137763977051, -2.9788689613342285, -2.7136001586914062, -2.448331117630005, -2.1830620765686035, -1.9177932739257812, -1.6525243520736694, -1.3872554302215576, -1.1219865083694458, -0.856717586517334, -0.5914486646652222, -0.32617974281311035, -0.060910820960998535, 0.20435714721679688, 0.4696260690689087, 0.7348949909210205, 1.0001639127731323, 1.2654328346252441, 1.530701756477356, 1.7959706783294678, 2.061239719390869, 2.3265085220336914, 2.5917773246765137, 2.857046365737915, 3.1223154067993164, 3.3875842094421387, 3.652853012084961, 3.9181220531463623, 4.183391094207764, 4.448659896850586, 4.713928699493408, 4.9791975021362305, 5.244466781616211, 5.509735584259033, 5.7750043869018555, 6.040273666381836, 6.305542469024658, 6.5708112716674805, 6.836080074310303, 7.101348876953125, 7.3666181564331055, 7.631886959075928, 7.89715576171875, 8.16242504119873, 8.427693367004395, 8.692962646484375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 9.0, 7.0, 10.0, 9.0, 18.0, 29.0, 21.0, 26.0, 23.0, 32.0, 38.0, 45.0, 63.0, 34.0, 44.0, 49.0, 43.0, 49.0, 54.0, 47.0, 42.0, 41.0, 34.0, 38.0, 21.0, 27.0, 29.0, 27.0, 20.0, 15.0, 10.0, 13.0, 11.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.414175987243652, -4.2537431716918945, -4.093310832977295, -3.932878017425537, -3.7724454402923584, -3.6120128631591797, -3.451580047607422, -3.291147470474243, -3.1307148933410645, -2.9702823162078857, -2.809849739074707, -2.649416923522949, -2.4889843463897705, -2.328551769256592, -2.168118953704834, -2.0076863765716553, -1.8472537994384766, -1.6868212223052979, -1.5263885259628296, -1.3659558296203613, -1.2055232524871826, -1.045090675354004, -0.8846579790115356, -0.7242252826690674, -0.5637927055358887, -0.4033600687980652, -0.2429274320602417, -0.08249479532241821, 0.07793784141540527, 0.23837047815322876, 0.39880311489105225, 0.5592358112335205, 0.719667911529541, 0.8801005482673645, 1.040533185005188, 1.2009658813476562, 1.361398458480835, 1.5218310356140137, 1.682263731956482, 1.8426964282989502, 2.003129005432129, 2.1635615825653076, 2.3239941596984863, 2.484426975250244, 2.644859552383423, 2.8052921295166016, 2.9657249450683594, 3.126157522201538, 3.286590099334717, 3.4470226764678955, 3.607455253601074, 3.767888069152832, 3.9283206462860107, 4.0887532234191895, 4.249186038970947, 4.409618377685547, 4.570051193237305, 4.7304840087890625, 4.890916347503662, 5.05134916305542, 5.2117815017700195, 5.372214317321777, 5.532647132873535, 5.693079948425293, 5.853512287139893]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 14.0, 26.0, 26.0, 44.0, 77.0, 87.0, 153.0, 208.0, 272.0, 513.0, 782.0, 1144.0, 1924.0, 3306.0, 5386.0, 9531.0, 16652.0, 29752.0, 53741.0, 93621.0, 148544.0, 192682.0, 182480.0, 128805.0, 77604.0, 43578.0, 24288.0, 13684.0, 7779.0, 4552.0, 2650.0, 1593.0, 1085.0, 664.0, 438.0, 283.0, 181.0, 137.0, 78.0, 57.0, 37.0, 23.0, 19.0, 17.0, 6.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.49151611328125, -5.3189697265625, -5.14642333984375, -4.973876953125, -4.80133056640625, -4.6287841796875, -4.45623779296875, -4.28369140625, -4.11114501953125, -3.9385986328125, -3.76605224609375, -3.593505859375, -3.42095947265625, -3.2484130859375, -3.07586669921875, -2.9033203125, -2.73077392578125, -2.5582275390625, -2.38568115234375, -2.213134765625, -2.04058837890625, -1.8680419921875, -1.69549560546875, -1.52294921875, -1.35040283203125, -1.1778564453125, -1.00531005859375, -0.832763671875, -0.66021728515625, -0.4876708984375, -0.31512451171875, -0.142578125, 0.02996826171875, 0.2025146484375, 0.37506103515625, 0.547607421875, 0.72015380859375, 0.8927001953125, 1.06524658203125, 1.23779296875, 1.41033935546875, 1.5828857421875, 1.75543212890625, 1.927978515625, 2.10052490234375, 2.2730712890625, 2.44561767578125, 2.6181640625, 2.79071044921875, 2.9632568359375, 3.13580322265625, 3.308349609375, 3.48089599609375, 3.6534423828125, 3.82598876953125, 3.99853515625, 4.17108154296875, 4.3436279296875, 4.51617431640625, 4.688720703125, 4.86126708984375, 5.0338134765625, 5.20635986328125, 5.37890625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 10.0, 9.0, 8.0, 17.0, 9.0, 14.0, 15.0, 18.0, 21.0, 23.0, 28.0, 22.0, 25.0, 31.0, 38.0, 42.0, 40.0, 37.0, 42.0, 33.0, 49.0, 42.0, 35.0, 47.0, 34.0, 36.0, 31.0, 37.0, 22.0, 32.0, 27.0, 18.0, 16.0, 15.0, 10.0, 15.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.83203125, -4.68865966796875, -4.5452880859375, -4.40191650390625, -4.258544921875, -4.11517333984375, -3.9718017578125, -3.82843017578125, -3.68505859375, -3.54168701171875, -3.3983154296875, -3.25494384765625, -3.111572265625, -2.96820068359375, -2.8248291015625, -2.68145751953125, -2.5380859375, -2.39471435546875, -2.2513427734375, -2.10797119140625, -1.964599609375, -1.82122802734375, -1.6778564453125, -1.53448486328125, -1.39111328125, -1.24774169921875, -1.1043701171875, -0.96099853515625, -0.817626953125, -0.67425537109375, -0.5308837890625, -0.38751220703125, -0.244140625, -0.10076904296875, 0.0426025390625, 0.18597412109375, 0.329345703125, 0.47271728515625, 0.6160888671875, 0.75946044921875, 0.90283203125, 1.04620361328125, 1.1895751953125, 1.33294677734375, 1.476318359375, 1.61968994140625, 1.7630615234375, 1.90643310546875, 2.0498046875, 2.19317626953125, 2.3365478515625, 2.47991943359375, 2.623291015625, 2.76666259765625, 2.9100341796875, 3.05340576171875, 3.19677734375, 3.34014892578125, 3.4835205078125, 3.62689208984375, 3.770263671875, 3.91363525390625, 4.0570068359375, 4.20037841796875, 4.34375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 15.0, 11.0, 26.0, 37.0, 32.0, 54.0, 89.0, 116.0, 212.0, 325.0, 546.0, 862.0, 1430.0, 2600.0, 4728.0, 8984.0, 17782.0, 35313.0, 70796.0, 134385.0, 211192.0, 225317.0, 158418.0, 85904.0, 43914.0, 21396.0, 11008.0, 5534.0, 3001.0, 1752.0, 1030.0, 615.0, 373.0, 281.0, 178.0, 114.0, 55.0, 43.0, 23.0, 23.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.14453125, -5.9337158203125, -5.722900390625, -5.5120849609375, -5.30126953125, -5.0904541015625, -4.879638671875, -4.6688232421875, -4.4580078125, -4.2471923828125, -4.036376953125, -3.8255615234375, -3.61474609375, -3.4039306640625, -3.193115234375, -2.9822998046875, -2.771484375, -2.5606689453125, -2.349853515625, -2.1390380859375, -1.92822265625, -1.7174072265625, -1.506591796875, -1.2957763671875, -1.0849609375, -0.8741455078125, -0.663330078125, -0.4525146484375, -0.24169921875, -0.0308837890625, 0.179931640625, 0.3907470703125, 0.6015625, 0.8123779296875, 1.023193359375, 1.2340087890625, 1.44482421875, 1.6556396484375, 1.866455078125, 2.0772705078125, 2.2880859375, 2.4989013671875, 2.709716796875, 2.9205322265625, 3.13134765625, 3.3421630859375, 3.552978515625, 3.7637939453125, 3.974609375, 4.1854248046875, 4.396240234375, 4.6070556640625, 4.81787109375, 5.0286865234375, 5.239501953125, 5.4503173828125, 5.6611328125, 5.8719482421875, 6.082763671875, 6.2935791015625, 6.50439453125, 6.7152099609375, 6.926025390625, 7.1368408203125, 7.34765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 12.0, 15.0, 16.0, 21.0, 14.0, 19.0, 28.0, 31.0, 24.0, 31.0, 34.0, 40.0, 37.0, 50.0, 34.0, 53.0, 43.0, 42.0, 30.0, 60.0, 34.0, 46.0, 42.0, 35.0, 34.0, 18.0, 26.0, 24.0, 22.0, 10.0, 15.0, 7.0, 11.0, 6.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.659088134765625, -2.56231689453125, -2.465545654296875, -2.3687744140625, -2.272003173828125, -2.17523193359375, -2.078460693359375, -1.981689453125, -1.884918212890625, -1.78814697265625, -1.691375732421875, -1.5946044921875, -1.497833251953125, -1.40106201171875, -1.304290771484375, -1.20751953125, -1.110748291015625, -1.01397705078125, -0.917205810546875, -0.8204345703125, -0.723663330078125, -0.62689208984375, -0.530120849609375, -0.433349609375, -0.336578369140625, -0.23980712890625, -0.143035888671875, -0.0462646484375, 0.050506591796875, 0.14727783203125, 0.244049072265625, 0.3408203125, 0.437591552734375, 0.53436279296875, 0.631134033203125, 0.7279052734375, 0.824676513671875, 0.92144775390625, 1.018218994140625, 1.114990234375, 1.211761474609375, 1.30853271484375, 1.405303955078125, 1.5020751953125, 1.598846435546875, 1.69561767578125, 1.792388916015625, 1.88916015625, 1.985931396484375, 2.08270263671875, 2.179473876953125, 2.2762451171875, 2.373016357421875, 2.46978759765625, 2.566558837890625, 2.663330078125, 2.760101318359375, 2.85687255859375, 2.953643798828125, 3.0504150390625, 3.147186279296875, 3.24395751953125, 3.340728759765625, 3.4375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 5.0, 6.0, 10.0, 24.0, 25.0, 34.0, 52.0, 89.0, 107.0, 157.0, 239.0, 402.0, 572.0, 843.0, 1314.0, 2019.0, 3111.0, 4797.0, 7717.0, 12498.0, 20550.0, 34477.0, 56616.0, 90757.0, 135053.0, 170768.0, 165373.0, 125921.0, 82728.0, 51313.0, 31127.0, 18627.0, 11410.0, 7208.0, 4418.0, 2849.0, 1798.0, 1168.0, 780.0, 523.0, 332.0, 250.0, 152.0, 102.0, 82.0, 54.0, 45.0, 23.0, 15.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.033203125, -1.971405029296875, -1.90960693359375, -1.847808837890625, -1.7860107421875, -1.724212646484375, -1.66241455078125, -1.600616455078125, -1.538818359375, -1.477020263671875, -1.41522216796875, -1.353424072265625, -1.2916259765625, -1.229827880859375, -1.16802978515625, -1.106231689453125, -1.04443359375, -0.982635498046875, -0.92083740234375, -0.859039306640625, -0.7972412109375, -0.735443115234375, -0.67364501953125, -0.611846923828125, -0.550048828125, -0.488250732421875, -0.42645263671875, -0.364654541015625, -0.3028564453125, -0.241058349609375, -0.17926025390625, -0.117462158203125, -0.0556640625, 0.006134033203125, 0.06793212890625, 0.129730224609375, 0.1915283203125, 0.253326416015625, 0.31512451171875, 0.376922607421875, 0.438720703125, 0.500518798828125, 0.56231689453125, 0.624114990234375, 0.6859130859375, 0.747711181640625, 0.80950927734375, 0.871307373046875, 0.93310546875, 0.994903564453125, 1.05670166015625, 1.118499755859375, 1.1802978515625, 1.242095947265625, 1.30389404296875, 1.365692138671875, 1.427490234375, 1.489288330078125, 1.55108642578125, 1.612884521484375, 1.6746826171875, 1.736480712890625, 1.79827880859375, 1.860076904296875, 1.921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 7.0, 11.0, 14.0, 18.0, 21.0, 34.0, 50.0, 61.0, 73.0, 71.0, 85.0, 87.0, 76.0, 72.0, 55.0, 49.0, 49.0, 30.0, 27.0, 14.0, 15.0, 12.0, 14.0, 10.0, 9.0, 5.0, 8.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003025531768798828, -0.0002929605543613434, -0.00028336793184280396, -0.0002737753093242645, -0.0002641826868057251, -0.00025459006428718567, -0.00024499744176864624, -0.0002354048192501068, -0.00022581219673156738, -0.00021621957421302795, -0.00020662695169448853, -0.0001970343291759491, -0.00018744170665740967, -0.00017784908413887024, -0.0001682564616203308, -0.00015866383910179138, -0.00014907121658325195, -0.00013947859406471252, -0.0001298859715461731, -0.00012029334902763367, -0.00011070072650909424, -0.00010110810399055481, -9.151548147201538e-05, -8.192285895347595e-05, -7.233023643493652e-05, -6.27376139163971e-05, -5.3144991397857666e-05, -4.355236887931824e-05, -3.395974636077881e-05, -2.436712384223938e-05, -1.4774501323699951e-05, -5.1818788051605225e-06, 4.410743713378906e-06, 1.4003366231918335e-05, 2.3595988750457764e-05, 3.318861126899719e-05, 4.278123378753662e-05, 5.237385630607605e-05, 6.196647882461548e-05, 7.155910134315491e-05, 8.115172386169434e-05, 9.074434638023376e-05, 0.0001003369688987732, 0.00010992959141731262, 0.00011952221393585205, 0.00012911483645439148, 0.0001387074589729309, 0.00014830008149147034, 0.00015789270401000977, 0.0001674853265285492, 0.00017707794904708862, 0.00018667057156562805, 0.00019626319408416748, 0.0002058558166027069, 0.00021544843912124634, 0.00022504106163978577, 0.0002346336841583252, 0.0002442263066768646, 0.00025381892919540405, 0.0002634115517139435, 0.0002730041742324829, 0.00028259679675102234, 0.00029218941926956177, 0.0003017820417881012, 0.0003113746643066406]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 9.0, 10.0, 21.0, 41.0, 39.0, 103.0, 135.0, 237.0, 427.0, 650.0, 1106.0, 2013.0, 3602.0, 6371.0, 11890.0, 22469.0, 42185.0, 79367.0, 139372.0, 202237.0, 205286.0, 147988.0, 84946.0, 45777.0, 23875.0, 12779.0, 6803.0, 3843.0, 2041.0, 1176.0, 691.0, 410.0, 236.0, 147.0, 95.0, 57.0, 39.0, 30.0, 21.0, 11.0, 5.0, 4.0, 2.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.514068603515625, -2.44024658203125, -2.366424560546875, -2.2926025390625, -2.218780517578125, -2.14495849609375, -2.071136474609375, -1.997314453125, -1.923492431640625, -1.84967041015625, -1.775848388671875, -1.7020263671875, -1.628204345703125, -1.55438232421875, -1.480560302734375, -1.40673828125, -1.332916259765625, -1.25909423828125, -1.185272216796875, -1.1114501953125, -1.037628173828125, -0.96380615234375, -0.889984130859375, -0.816162109375, -0.742340087890625, -0.66851806640625, -0.594696044921875, -0.5208740234375, -0.447052001953125, -0.37322998046875, -0.299407958984375, -0.2255859375, -0.151763916015625, -0.07794189453125, -0.004119873046875, 0.0697021484375, 0.143524169921875, 0.21734619140625, 0.291168212890625, 0.364990234375, 0.438812255859375, 0.51263427734375, 0.586456298828125, 0.6602783203125, 0.734100341796875, 0.80792236328125, 0.881744384765625, 0.95556640625, 1.029388427734375, 1.10321044921875, 1.177032470703125, 1.2508544921875, 1.324676513671875, 1.39849853515625, 1.472320556640625, 1.546142578125, 1.619964599609375, 1.69378662109375, 1.767608642578125, 1.8414306640625, 1.915252685546875, 1.98907470703125, 2.062896728515625, 2.13671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 10.0, 4.0, 11.0, 18.0, 25.0, 22.0, 12.0, 27.0, 35.0, 32.0, 33.0, 27.0, 36.0, 31.0, 41.0, 49.0, 42.0, 50.0, 51.0, 25.0, 48.0, 38.0, 37.0, 38.0, 29.0, 23.0, 25.0, 27.0, 16.0, 18.0, 16.0, 13.0, 16.0, 19.0, 6.0, 8.0, 4.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412353515625, -0.3975410461425781, -0.38272857666015625, -0.3679161071777344, -0.3531036376953125, -0.3382911682128906, -0.32347869873046875, -0.3086662292480469, -0.293853759765625, -0.2790412902832031, -0.26422882080078125, -0.24941635131835938, -0.2346038818359375, -0.21979141235351562, -0.20497894287109375, -0.19016647338867188, -0.17535400390625, -0.16054153442382812, -0.14572906494140625, -0.13091659545898438, -0.1161041259765625, -0.10129165649414062, -0.08647918701171875, -0.07166671752929688, -0.056854248046875, -0.042041778564453125, -0.02722930908203125, -0.012416839599609375, 0.0023956298828125, 0.017208099365234375, 0.03202056884765625, 0.046833038330078125, 0.0616455078125, 0.07645797729492188, 0.09127044677734375, 0.10608291625976562, 0.1208953857421875, 0.13570785522460938, 0.15052032470703125, 0.16533279418945312, 0.180145263671875, 0.19495773315429688, 0.20977020263671875, 0.22458267211914062, 0.2393951416015625, 0.2542076110839844, 0.26902008056640625, 0.2838325500488281, 0.29864501953125, 0.3134574890136719, 0.32826995849609375, 0.3430824279785156, 0.3578948974609375, 0.3727073669433594, 0.38751983642578125, 0.4023323059082031, 0.417144775390625, 0.4319572448730469, 0.44676971435546875, 0.4615821838378906, 0.4763946533203125, 0.4912071228027344, 0.5060195922851562, 0.5208320617675781, 0.53564453125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 4.0, 6.0, 4.0, 5.0, 14.0, 12.0, 19.0, 16.0, 33.0, 17.0, 25.0, 49.0, 53.0, 59.0, 68.0, 78.0, 95.0, 74.0, 75.0, 72.0, 55.0, 48.0, 37.0, 23.0, 17.0, 12.0, 11.0, 6.0, 0.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.282942771911621, -7.014131546020508, -6.745320796966553, -6.4765095710754395, -6.207698345184326, -5.938887596130371, -5.670076370239258, -5.4012651443481445, -5.132453918457031, -4.863642692565918, -4.594831943511963, -4.32602071762085, -4.057209491729736, -3.788398504257202, -3.519587516784668, -3.2507762908935547, -2.9819655418395996, -2.7131545543670654, -2.444343328475952, -2.175532341003418, -1.9067212343215942, -1.6379101276397705, -1.3690991401672363, -1.1002880334854126, -0.8314769268035889, -0.5626658201217651, -0.2938547730445862, -0.025043725967407227, 0.2437673807144165, 0.5125784873962402, 0.7813894748687744, 1.0502005815505981, 1.3190116882324219, 1.5878227949142456, 1.8566339015960693, 2.1254448890686035, 2.394256114959717, 2.663067102432251, 2.931878089904785, 3.2006893157958984, 3.4695003032684326, 3.738311290740967, 4.00712251663208, 4.275933265686035, 4.544744491577148, 4.813555717468262, 5.082366943359375, 5.35117769241333, 5.619988918304443, 5.888800144195557, 6.157610893249512, 6.426422119140625, 6.695233345031738, 6.964044570922852, 7.232855319976807, 7.50166654586792, 7.770477294921875, 8.039288520812988, 8.308099746704102, 8.576910018920898, 8.845721244812012, 9.114532470703125, 9.383343696594238, 9.652154922485352, 9.920966148376465]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 14.0, 20.0, 12.0, 17.0, 24.0, 25.0, 28.0, 26.0, 52.0, 40.0, 39.0, 55.0, 31.0, 57.0, 49.0, 53.0, 46.0, 46.0, 47.0, 39.0, 37.0, 25.0, 26.0, 25.0, 26.0, 20.0, 25.0, 17.0, 11.0, 13.0, 8.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.709172248840332, -4.549365997314453, -4.389560222625732, -4.2297539710998535, -4.069948196411133, -3.910141944885254, -3.750335931777954, -3.5905299186706543, -3.4307236671447754, -3.2709176540374756, -3.111111640930176, -2.951305389404297, -2.791499376296997, -2.6316933631896973, -2.4718873500823975, -2.3120813369750977, -2.152275323867798, -1.992469310760498, -1.8326631784439087, -1.6728571653366089, -1.5130510330200195, -1.3532450199127197, -1.19343900680542, -1.0336328744888306, -0.8738268613815308, -0.7140207886695862, -0.5542147159576416, -0.3944087028503418, -0.23460263013839722, -0.07479655742645264, 0.08500945568084717, 0.24481558799743652, 0.40462160110473633, 0.5644276738166809, 0.7242337465286255, 0.8840397596359253, 1.0438458919525146, 1.2036519050598145, 1.3634579181671143, 1.5232640504837036, 1.6830700635910034, 1.8428760766983032, 2.0026822090148926, 2.1624882221221924, 2.322294235229492, 2.482100486755371, 2.641906261444092, 2.8017125129699707, 2.9615185260772705, 3.1213245391845703, 3.28113055229187, 3.44093656539917, 3.600742816925049, 3.7605488300323486, 3.9203548431396484, 4.080161094665527, 4.239966869354248, 4.399773120880127, 4.559578895568848, 4.719385147094727, 4.879190921783447, 5.038997173309326, 5.198802947998047, 5.358609199523926, 5.518415451049805]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 7.0, 28.0, 27.0, 34.0, 58.0, 78.0, 113.0, 217.0, 278.0, 487.0, 808.0, 1325.0, 2236.0, 4183.0, 7942.0, 15336.0, 32063.0, 74477.0, 195248.0, 584754.0, 1401308.0, 1190817.0, 428741.0, 143166.0, 56825.0, 25567.0, 12574.0, 6591.0, 3632.0, 2078.0, 1215.0, 738.0, 467.0, 299.0, 197.0, 110.0, 84.0, 40.0, 42.0, 23.0, 17.0, 13.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.5078125, -8.2489013671875, -7.989990234375, -7.7310791015625, -7.47216796875, -7.2132568359375, -6.954345703125, -6.6954345703125, -6.4365234375, -6.1776123046875, -5.918701171875, -5.6597900390625, -5.40087890625, -5.1419677734375, -4.883056640625, -4.6241455078125, -4.365234375, -4.1063232421875, -3.847412109375, -3.5885009765625, -3.32958984375, -3.0706787109375, -2.811767578125, -2.5528564453125, -2.2939453125, -2.0350341796875, -1.776123046875, -1.5172119140625, -1.25830078125, -0.9993896484375, -0.740478515625, -0.4815673828125, -0.22265625, 0.0362548828125, 0.295166015625, 0.5540771484375, 0.81298828125, 1.0718994140625, 1.330810546875, 1.5897216796875, 1.8486328125, 2.1075439453125, 2.366455078125, 2.6253662109375, 2.88427734375, 3.1431884765625, 3.402099609375, 3.6610107421875, 3.919921875, 4.1788330078125, 4.437744140625, 4.6966552734375, 4.95556640625, 5.2144775390625, 5.473388671875, 5.7322998046875, 5.9912109375, 6.2501220703125, 6.509033203125, 6.7679443359375, 7.02685546875, 7.2857666015625, 7.544677734375, 7.8035888671875, 8.0625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 8.0, 11.0, 18.0, 14.0, 18.0, 32.0, 31.0, 32.0, 47.0, 46.0, 34.0, 44.0, 53.0, 48.0, 45.0, 51.0, 47.0, 51.0, 47.0, 46.0, 44.0, 24.0, 29.0, 31.0, 15.0, 27.0, 24.0, 16.0, 9.0, 7.0, 7.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.3780517578125, -3.256103515625, -3.1341552734375, -3.01220703125, -2.8902587890625, -2.768310546875, -2.6463623046875, -2.5244140625, -2.4024658203125, -2.280517578125, -2.1585693359375, -2.03662109375, -1.9146728515625, -1.792724609375, -1.6707763671875, -1.548828125, -1.4268798828125, -1.304931640625, -1.1829833984375, -1.06103515625, -0.9390869140625, -0.817138671875, -0.6951904296875, -0.5732421875, -0.4512939453125, -0.329345703125, -0.2073974609375, -0.08544921875, 0.0364990234375, 0.158447265625, 0.2803955078125, 0.40234375, 0.5242919921875, 0.646240234375, 0.7681884765625, 0.89013671875, 1.0120849609375, 1.134033203125, 1.2559814453125, 1.3779296875, 1.4998779296875, 1.621826171875, 1.7437744140625, 1.86572265625, 1.9876708984375, 2.109619140625, 2.2315673828125, 2.353515625, 2.4754638671875, 2.597412109375, 2.7193603515625, 2.84130859375, 2.9632568359375, 3.085205078125, 3.2071533203125, 3.3291015625, 3.4510498046875, 3.572998046875, 3.6949462890625, 3.81689453125, 3.9388427734375, 4.060791015625, 4.1827392578125, 4.3046875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 6.0, 10.0, 22.0, 26.0, 34.0, 63.0, 105.0, 148.0, 223.0, 357.0, 513.0, 839.0, 1327.0, 2195.0, 3781.0, 6404.0, 11704.0, 21178.0, 41416.0, 84851.0, 186143.0, 424970.0, 928754.0, 1211830.0, 694739.0, 304408.0, 134819.0, 63148.0, 31530.0, 16458.0, 9050.0, 5124.0, 3085.0, 1820.0, 1162.0, 711.0, 422.0, 297.0, 180.0, 117.0, 92.0, 70.0, 55.0, 30.0, 11.0, 22.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-8.0859375, -7.85687255859375, -7.6278076171875, -7.39874267578125, -7.169677734375, -6.94061279296875, -6.7115478515625, -6.48248291015625, -6.25341796875, -6.02435302734375, -5.7952880859375, -5.56622314453125, -5.337158203125, -5.10809326171875, -4.8790283203125, -4.64996337890625, -4.4208984375, -4.19183349609375, -3.9627685546875, -3.73370361328125, -3.504638671875, -3.27557373046875, -3.0465087890625, -2.81744384765625, -2.58837890625, -2.35931396484375, -2.1302490234375, -1.90118408203125, -1.672119140625, -1.44305419921875, -1.2139892578125, -0.98492431640625, -0.755859375, -0.52679443359375, -0.2977294921875, -0.06866455078125, 0.160400390625, 0.38946533203125, 0.6185302734375, 0.84759521484375, 1.07666015625, 1.30572509765625, 1.5347900390625, 1.76385498046875, 1.992919921875, 2.22198486328125, 2.4510498046875, 2.68011474609375, 2.9091796875, 3.13824462890625, 3.3673095703125, 3.59637451171875, 3.825439453125, 4.05450439453125, 4.2835693359375, 4.51263427734375, 4.74169921875, 4.97076416015625, 5.1998291015625, 5.42889404296875, 5.657958984375, 5.88702392578125, 6.1160888671875, 6.34515380859375, 6.57421875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 13.0, 14.0, 25.0, 26.0, 37.0, 45.0, 54.0, 65.0, 88.0, 127.0, 139.0, 194.0, 228.0, 245.0, 277.0, 299.0, 338.0, 274.0, 264.0, 294.0, 203.0, 162.0, 144.0, 115.0, 73.0, 54.0, 59.0, 41.0, 29.0, 26.0, 28.0, 14.0, 7.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0], "bins": [-2.478515625, -2.413665771484375, -2.34881591796875, -2.283966064453125, -2.2191162109375, -2.154266357421875, -2.08941650390625, -2.024566650390625, -1.959716796875, -1.894866943359375, -1.83001708984375, -1.765167236328125, -1.7003173828125, -1.635467529296875, -1.57061767578125, -1.505767822265625, -1.44091796875, -1.376068115234375, -1.31121826171875, -1.246368408203125, -1.1815185546875, -1.116668701171875, -1.05181884765625, -0.986968994140625, -0.922119140625, -0.857269287109375, -0.79241943359375, -0.727569580078125, -0.6627197265625, -0.597869873046875, -0.53302001953125, -0.468170166015625, -0.4033203125, -0.338470458984375, -0.27362060546875, -0.208770751953125, -0.1439208984375, -0.079071044921875, -0.01422119140625, 0.050628662109375, 0.115478515625, 0.180328369140625, 0.24517822265625, 0.310028076171875, 0.3748779296875, 0.439727783203125, 0.50457763671875, 0.569427490234375, 0.63427734375, 0.699127197265625, 0.76397705078125, 0.828826904296875, 0.8936767578125, 0.958526611328125, 1.02337646484375, 1.088226318359375, 1.153076171875, 1.217926025390625, 1.28277587890625, 1.347625732421875, 1.4124755859375, 1.477325439453125, 1.54217529296875, 1.607025146484375, 1.671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 6.0, 8.0, 8.0, 18.0, 14.0, 12.0, 21.0, 21.0, 17.0, 31.0, 41.0, 46.0, 57.0, 69.0, 65.0, 64.0, 80.0, 61.0, 52.0, 59.0, 53.0, 32.0, 39.0, 28.0, 22.0, 13.0, 16.0, 10.0, 13.0, 5.0, 3.0, 1.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.507089614868164, -7.277308464050293, -7.047527313232422, -6.817746162414551, -6.58796501159668, -6.358183860778809, -6.1284027099609375, -5.898621082305908, -5.668839931488037, -5.439058780670166, -5.209277629852295, -4.979496479034424, -4.749715328216553, -4.519933700561523, -4.290152549743652, -4.060371398925781, -3.8305904865264893, -3.600809335708618, -3.371028184890747, -3.141246795654297, -2.911465644836426, -2.6816844940185547, -2.4519033432006836, -2.2221221923828125, -1.9923409223556519, -1.7625597715377808, -1.5327785015106201, -1.302997350692749, -1.073216199874878, -0.8434349298477173, -0.6136537790298462, -0.38387250900268555, -0.15409135818481445, 0.07568983733654022, 0.3054710328578949, 0.5352522134780884, 0.7650334239006042, 0.9948146343231201, 1.2245957851409912, 1.4543770551681519, 1.684158205986023, 1.913939356803894, 2.1437206268310547, 2.373501777648926, 2.603282928466797, 2.833064079284668, 3.062845230102539, 3.2926266193389893, 3.5224077701568604, 3.7521889209747314, 3.9819700717926025, 4.211751461029053, 4.441532611846924, 4.671313762664795, 4.901094913482666, 5.130876064300537, 5.360657215118408, 5.590438365936279, 5.82021951675415, 6.0500006675720215, 6.279781818389893, 6.509563446044922, 6.739344596862793, 6.969125747680664, 7.198906898498535]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 7.0, 3.0, 10.0, 14.0, 16.0, 14.0, 18.0, 21.0, 31.0, 35.0, 21.0, 32.0, 44.0, 37.0, 53.0, 46.0, 59.0, 58.0, 54.0, 46.0, 44.0, 47.0, 42.0, 41.0, 29.0, 26.0, 34.0, 26.0, 19.0, 22.0, 17.0, 11.0, 9.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.126667022705078, -4.96545934677124, -4.804251194000244, -4.643043518066406, -4.48183536529541, -4.320627689361572, -4.159419536590576, -3.9982118606567383, -3.837003707885742, -3.675795793533325, -3.514587879180908, -3.353379964828491, -3.192172050476074, -3.0309641361236572, -2.8697562217712402, -2.7085485458374023, -2.5473406314849854, -2.3861327171325684, -2.2249248027801514, -2.0637168884277344, -1.9025089740753174, -1.7413010597229004, -1.580093264579773, -1.418885350227356, -1.257677435874939, -1.096469521522522, -0.935261607170105, -0.7740537524223328, -0.6128458380699158, -0.4516379237174988, -0.29043006896972656, -0.12922215461730957, 0.03198575973510742, 0.19319365918636322, 0.354401558637619, 0.5156094431877136, 0.6768173575401306, 0.8380252718925476, 0.9992331266403198, 1.1604410409927368, 1.3216489553451538, 1.4828568696975708, 1.6440647840499878, 1.8052725791931152, 1.9664804935455322, 2.127688407897949, 2.288896322250366, 2.450104236602783, 2.6113121509552, 2.772520065307617, 2.933727979660034, 3.094935894012451, 3.256143808364868, 3.417351722717285, 3.578559398651123, 3.739767551422119, 3.900975227355957, 4.062182903289795, 4.223391056060791, 4.384598731994629, 4.545806884765625, 4.707014560699463, 4.868222713470459, 5.029430389404297, 5.190638542175293]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 10.0, 13.0, 12.0, 25.0, 27.0, 32.0, 52.0, 77.0, 136.0, 186.0, 254.0, 395.0, 614.0, 898.0, 1363.0, 2144.0, 3294.0, 5103.0, 7855.0, 12713.0, 19966.0, 31888.0, 50468.0, 78631.0, 116158.0, 149502.0, 158849.0, 135279.0, 97655.0, 64180.0, 40806.0, 25512.0, 16109.0, 10134.0, 6402.0, 4094.0, 2660.0, 1686.0, 1079.0, 754.0, 513.0, 341.0, 211.0, 127.0, 116.0, 75.0, 50.0, 37.0, 21.0, 18.0, 15.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0], "bins": [-2.775390625, -2.69195556640625, -2.6085205078125, -2.52508544921875, -2.441650390625, -2.35821533203125, -2.2747802734375, -2.19134521484375, -2.10791015625, -2.02447509765625, -1.9410400390625, -1.85760498046875, -1.774169921875, -1.69073486328125, -1.6072998046875, -1.52386474609375, -1.4404296875, -1.35699462890625, -1.2735595703125, -1.19012451171875, -1.106689453125, -1.02325439453125, -0.9398193359375, -0.85638427734375, -0.77294921875, -0.68951416015625, -0.6060791015625, -0.52264404296875, -0.439208984375, -0.35577392578125, -0.2723388671875, -0.18890380859375, -0.10546875, -0.02203369140625, 0.0614013671875, 0.14483642578125, 0.228271484375, 0.31170654296875, 0.3951416015625, 0.47857666015625, 0.56201171875, 0.64544677734375, 0.7288818359375, 0.81231689453125, 0.895751953125, 0.97918701171875, 1.0626220703125, 1.14605712890625, 1.2294921875, 1.31292724609375, 1.3963623046875, 1.47979736328125, 1.563232421875, 1.64666748046875, 1.7301025390625, 1.81353759765625, 1.89697265625, 1.98040771484375, 2.0638427734375, 2.14727783203125, 2.230712890625, 2.31414794921875, 2.3975830078125, 2.48101806640625, 2.564453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 16.0, 11.0, 15.0, 23.0, 25.0, 35.0, 29.0, 36.0, 32.0, 43.0, 47.0, 50.0, 44.0, 56.0, 58.0, 60.0, 42.0, 53.0, 51.0, 34.0, 31.0, 40.0, 20.0, 28.0, 22.0, 17.0, 10.0, 15.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.671875, -5.495361328125, -5.31884765625, -5.142333984375, -4.9658203125, -4.789306640625, -4.61279296875, -4.436279296875, -4.259765625, -4.083251953125, -3.90673828125, -3.730224609375, -3.5537109375, -3.377197265625, -3.20068359375, -3.024169921875, -2.84765625, -2.671142578125, -2.49462890625, -2.318115234375, -2.1416015625, -1.965087890625, -1.78857421875, -1.612060546875, -1.435546875, -1.259033203125, -1.08251953125, -0.906005859375, -0.7294921875, -0.552978515625, -0.37646484375, -0.199951171875, -0.0234375, 0.153076171875, 0.32958984375, 0.506103515625, 0.6826171875, 0.859130859375, 1.03564453125, 1.212158203125, 1.388671875, 1.565185546875, 1.74169921875, 1.918212890625, 2.0947265625, 2.271240234375, 2.44775390625, 2.624267578125, 2.80078125, 2.977294921875, 3.15380859375, 3.330322265625, 3.5068359375, 3.683349609375, 3.85986328125, 4.036376953125, 4.212890625, 4.389404296875, 4.56591796875, 4.742431640625, 4.9189453125, 5.095458984375, 5.27197265625, 5.448486328125, 5.625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 15.0, 22.0, 20.0, 39.0, 43.0, 62.0, 67.0, 110.0, 163.0, 242.0, 381.0, 583.0, 905.0, 1481.0, 2225.0, 3795.0, 6512.0, 11163.0, 19950.0, 36031.0, 64842.0, 115528.0, 190734.0, 223372.0, 159773.0, 92420.0, 51042.0, 28218.0, 16088.0, 9086.0, 5239.0, 3169.0, 1901.0, 1138.0, 727.0, 507.0, 330.0, 188.0, 111.0, 97.0, 74.0, 40.0, 42.0, 20.0, 16.0, 14.0, 5.0, 6.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.99609375, -3.8760986328125, -3.756103515625, -3.6361083984375, -3.51611328125, -3.3961181640625, -3.276123046875, -3.1561279296875, -3.0361328125, -2.9161376953125, -2.796142578125, -2.6761474609375, -2.55615234375, -2.4361572265625, -2.316162109375, -2.1961669921875, -2.076171875, -1.9561767578125, -1.836181640625, -1.7161865234375, -1.59619140625, -1.4761962890625, -1.356201171875, -1.2362060546875, -1.1162109375, -0.9962158203125, -0.876220703125, -0.7562255859375, -0.63623046875, -0.5162353515625, -0.396240234375, -0.2762451171875, -0.15625, -0.0362548828125, 0.083740234375, 0.2037353515625, 0.32373046875, 0.4437255859375, 0.563720703125, 0.6837158203125, 0.8037109375, 0.9237060546875, 1.043701171875, 1.1636962890625, 1.28369140625, 1.4036865234375, 1.523681640625, 1.6436767578125, 1.763671875, 1.8836669921875, 2.003662109375, 2.1236572265625, 2.24365234375, 2.3636474609375, 2.483642578125, 2.6036376953125, 2.7236328125, 2.8436279296875, 2.963623046875, 3.0836181640625, 3.20361328125, 3.3236083984375, 3.443603515625, 3.5635986328125, 3.68359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 11.0, 10.0, 22.0, 16.0, 11.0, 14.0, 21.0, 24.0, 20.0, 37.0, 29.0, 28.0, 40.0, 43.0, 38.0, 39.0, 29.0, 51.0, 47.0, 49.0, 33.0, 43.0, 31.0, 29.0, 29.0, 26.0, 32.0, 26.0, 29.0, 28.0, 21.0, 14.0, 14.0, 9.0, 10.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.736328125, -2.6539306640625, -2.571533203125, -2.4891357421875, -2.40673828125, -2.3243408203125, -2.241943359375, -2.1595458984375, -2.0771484375, -1.9947509765625, -1.912353515625, -1.8299560546875, -1.74755859375, -1.6651611328125, -1.582763671875, -1.5003662109375, -1.41796875, -1.3355712890625, -1.253173828125, -1.1707763671875, -1.08837890625, -1.0059814453125, -0.923583984375, -0.8411865234375, -0.7587890625, -0.6763916015625, -0.593994140625, -0.5115966796875, -0.42919921875, -0.3468017578125, -0.264404296875, -0.1820068359375, -0.099609375, -0.0172119140625, 0.065185546875, 0.1475830078125, 0.22998046875, 0.3123779296875, 0.394775390625, 0.4771728515625, 0.5595703125, 0.6419677734375, 0.724365234375, 0.8067626953125, 0.88916015625, 0.9715576171875, 1.053955078125, 1.1363525390625, 1.21875, 1.3011474609375, 1.383544921875, 1.4659423828125, 1.54833984375, 1.6307373046875, 1.713134765625, 1.7955322265625, 1.8779296875, 1.9603271484375, 2.042724609375, 2.1251220703125, 2.20751953125, 2.2899169921875, 2.372314453125, 2.4547119140625, 2.537109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 9.0, 13.0, 16.0, 16.0, 36.0, 55.0, 78.0, 132.0, 197.0, 351.0, 561.0, 1025.0, 1766.0, 3226.0, 5481.0, 10718.0, 19835.0, 38534.0, 75970.0, 146521.0, 244633.0, 228375.0, 130393.0, 67404.0, 34073.0, 17938.0, 9293.0, 5061.0, 2849.0, 1605.0, 953.0, 544.0, 319.0, 218.0, 140.0, 70.0, 51.0, 25.0, 20.0, 14.0, 12.0, 7.0, 4.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.060546875, -1.9959716796875, -1.931396484375, -1.8668212890625, -1.80224609375, -1.7376708984375, -1.673095703125, -1.6085205078125, -1.5439453125, -1.4793701171875, -1.414794921875, -1.3502197265625, -1.28564453125, -1.2210693359375, -1.156494140625, -1.0919189453125, -1.02734375, -0.9627685546875, -0.898193359375, -0.8336181640625, -0.76904296875, -0.7044677734375, -0.639892578125, -0.5753173828125, -0.5107421875, -0.4461669921875, -0.381591796875, -0.3170166015625, -0.25244140625, -0.1878662109375, -0.123291015625, -0.0587158203125, 0.005859375, 0.0704345703125, 0.135009765625, 0.1995849609375, 0.26416015625, 0.3287353515625, 0.393310546875, 0.4578857421875, 0.5224609375, 0.5870361328125, 0.651611328125, 0.7161865234375, 0.78076171875, 0.8453369140625, 0.909912109375, 0.9744873046875, 1.0390625, 1.1036376953125, 1.168212890625, 1.2327880859375, 1.29736328125, 1.3619384765625, 1.426513671875, 1.4910888671875, 1.5556640625, 1.6202392578125, 1.684814453125, 1.7493896484375, 1.81396484375, 1.8785400390625, 1.943115234375, 2.0076904296875, 2.072265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 6.0, 10.0, 14.0, 14.0, 26.0, 20.0, 38.0, 23.0, 29.0, 46.0, 43.0, 49.0, 64.0, 63.0, 74.0, 58.0, 57.0, 46.0, 33.0, 49.0, 43.0, 32.0, 19.0, 21.0, 20.0, 12.0, 16.0, 7.0, 9.0, 4.0, 7.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.988380432128906e-05, -8.70702788233757e-05, -8.425675332546234e-05, -8.144322782754898e-05, -7.862970232963562e-05, -7.581617683172226e-05, -7.30026513338089e-05, -7.018912583589554e-05, -6.737560033798218e-05, -6.456207484006882e-05, -6.174854934215546e-05, -5.8935023844242096e-05, -5.6121498346328735e-05, -5.3307972848415375e-05, -5.0494447350502014e-05, -4.7680921852588654e-05, -4.486739635467529e-05, -4.205387085676193e-05, -3.924034535884857e-05, -3.642681986093521e-05, -3.361329436302185e-05, -3.079976886510849e-05, -2.798624336719513e-05, -2.517271786928177e-05, -2.2359192371368408e-05, -1.9545666873455048e-05, -1.6732141375541687e-05, -1.3918615877628326e-05, -1.1105090379714966e-05, -8.291564881801605e-06, -5.478039383888245e-06, -2.664513885974884e-06, 1.4901161193847656e-07, 2.962537109851837e-06, 5.776062607765198e-06, 8.589588105678558e-06, 1.1403113603591919e-05, 1.421663910150528e-05, 1.703016459941864e-05, 1.9843690097332e-05, 2.265721559524536e-05, 2.5470741093158722e-05, 2.8284266591072083e-05, 3.109779208898544e-05, 3.3911317586898804e-05, 3.6724843084812164e-05, 3.9538368582725525e-05, 4.2351894080638885e-05, 4.5165419578552246e-05, 4.797894507646561e-05, 5.079247057437897e-05, 5.360599607229233e-05, 5.641952157020569e-05, 5.923304706811905e-05, 6.204657256603241e-05, 6.486009806394577e-05, 6.767362356185913e-05, 7.048714905977249e-05, 7.330067455768585e-05, 7.611420005559921e-05, 7.892772555351257e-05, 8.174125105142593e-05, 8.45547765493393e-05, 8.736830204725266e-05, 9.018182754516602e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 7.0, 14.0, 15.0, 34.0, 36.0, 53.0, 69.0, 104.0, 144.0, 236.0, 333.0, 480.0, 826.0, 1165.0, 1858.0, 2983.0, 4781.0, 7621.0, 12202.0, 19621.0, 30967.0, 49042.0, 74254.0, 107321.0, 138018.0, 151043.0, 137209.0, 105671.0, 72962.0, 47975.0, 30075.0, 19009.0, 11921.0, 7410.0, 4665.0, 2908.0, 1939.0, 1204.0, 778.0, 515.0, 340.0, 237.0, 157.0, 105.0, 73.0, 51.0, 37.0, 23.0, 19.0, 11.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.2685546875, -1.2294921875, -1.1904296875, -1.1513671875, -1.1123046875, -1.0732421875, -1.0341796875, -0.9951171875, -0.9560546875, -0.9169921875, -0.8779296875, -0.8388671875, -0.7998046875, -0.7607421875, -0.7216796875, -0.6826171875, -0.6435546875, -0.6044921875, -0.5654296875, -0.5263671875, -0.4873046875, -0.4482421875, -0.4091796875, -0.3701171875, -0.3310546875, -0.2919921875, -0.2529296875, -0.2138671875, -0.1748046875, -0.1357421875, -0.0966796875, -0.0576171875, -0.0185546875, 0.0205078125, 0.0595703125, 0.0986328125, 0.1376953125, 0.1767578125, 0.2158203125, 0.2548828125, 0.2939453125, 0.3330078125, 0.3720703125, 0.4111328125, 0.4501953125, 0.4892578125, 0.5283203125, 0.5673828125, 0.6064453125, 0.6455078125, 0.6845703125, 0.7236328125, 0.7626953125, 0.8017578125, 0.8408203125, 0.8798828125, 0.9189453125, 0.9580078125, 0.9970703125, 1.0361328125, 1.0751953125, 1.1142578125, 1.1533203125, 1.1923828125, 1.2314453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 11.0, 14.0, 13.0, 15.0, 12.0, 14.0, 20.0, 25.0, 36.0, 34.0, 44.0, 42.0, 42.0, 52.0, 44.0, 44.0, 41.0, 46.0, 52.0, 42.0, 47.0, 43.0, 34.0, 29.0, 30.0, 26.0, 30.0, 26.0, 13.0, 16.0, 13.0, 10.0, 6.0, 11.0, 5.0, 7.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.462890625, -0.44986724853515625, -0.4368438720703125, -0.42382049560546875, -0.410797119140625, -0.39777374267578125, -0.3847503662109375, -0.37172698974609375, -0.35870361328125, -0.34568023681640625, -0.3326568603515625, -0.31963348388671875, -0.306610107421875, -0.29358673095703125, -0.2805633544921875, -0.26753997802734375, -0.2545166015625, -0.24149322509765625, -0.2284698486328125, -0.21544647216796875, -0.202423095703125, -0.18939971923828125, -0.1763763427734375, -0.16335296630859375, -0.15032958984375, -0.13730621337890625, -0.1242828369140625, -0.11125946044921875, -0.098236083984375, -0.08521270751953125, -0.0721893310546875, -0.05916595458984375, -0.046142578125, -0.03311920166015625, -0.0200958251953125, -0.00707244873046875, 0.005950927734375, 0.01897430419921875, 0.0319976806640625, 0.04502105712890625, 0.05804443359375, 0.07106781005859375, 0.0840911865234375, 0.09711456298828125, 0.110137939453125, 0.12316131591796875, 0.1361846923828125, 0.14920806884765625, 0.1622314453125, 0.17525482177734375, 0.1882781982421875, 0.20130157470703125, 0.214324951171875, 0.22734832763671875, 0.2403717041015625, 0.25339508056640625, 0.26641845703125, 0.27944183349609375, 0.2924652099609375, 0.30548858642578125, 0.318511962890625, 0.33153533935546875, 0.3445587158203125, 0.35758209228515625, 0.37060546875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 13.0, 17.0, 12.0, 17.0, 20.0, 18.0, 28.0, 40.0, 27.0, 52.0, 59.0, 76.0, 72.0, 51.0, 66.0, 59.0, 56.0, 67.0, 43.0, 38.0, 27.0, 21.0, 28.0, 13.0, 19.0, 4.0, 13.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.75745964050293, -6.534886360168457, -6.312313556671143, -6.08974027633667, -5.867166996002197, -5.644594192504883, -5.42202091217041, -5.1994476318359375, -4.976874351501465, -4.754301071166992, -4.531728267669678, -4.309154987335205, -4.086581707000732, -3.864008665084839, -3.6414356231689453, -3.4188623428344727, -3.196289539337158, -2.9737164974212646, -2.751143217086792, -2.5285701751708984, -2.305996894836426, -2.0834238529205322, -1.8608508110046387, -1.6382776498794556, -1.4157044887542725, -1.1931313276290894, -0.970558226108551, -0.7479851245880127, -0.5254119634628296, -0.3028388023376465, -0.08026576042175293, 0.14230740070343018, 0.3648800849914551, 0.5874532461166382, 0.8100263476371765, 1.0325994491577148, 1.255172610282898, 1.477745771408081, 1.7003188133239746, 1.9228919744491577, 2.145465135574341, 2.3680381774902344, 2.590611457824707, 2.8131844997406006, 3.035757541656494, 3.258330821990967, 3.4809038639068604, 3.703476905822754, 3.9260501861572266, 4.148623466491699, 4.371196269989014, 4.593769550323486, 4.816342830657959, 5.038915634155273, 5.261488914489746, 5.484062194824219, 5.706635475158691, 5.929208755493164, 6.1517815589904785, 6.374354839324951, 6.596928119659424, 6.819500923156738, 7.042074203491211, 7.264647483825684, 7.487220287322998]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 11.0, 14.0, 18.0, 12.0, 16.0, 26.0, 26.0, 34.0, 31.0, 34.0, 34.0, 45.0, 51.0, 44.0, 60.0, 57.0, 50.0, 40.0, 48.0, 54.0, 37.0, 32.0, 29.0, 28.0, 37.0, 18.0, 22.0, 24.0, 18.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.892008304595947, -4.736620903015137, -4.581233024597168, -4.425845623016357, -4.270457744598389, -4.115070343017578, -3.9596827030181885, -3.804295063018799, -3.648907423019409, -3.4935197830200195, -3.33813214302063, -3.1827445030212402, -3.0273571014404297, -2.871969223022461, -2.7165818214416504, -2.5611941814422607, -2.405806541442871, -2.2504189014434814, -2.095031261444092, -1.9396437406539917, -1.784256100654602, -1.6288684606552124, -1.4734809398651123, -1.3180932998657227, -1.162705659866333, -1.0073180198669434, -0.8519304394721985, -0.6965428590774536, -0.541155219078064, -0.3857675790786743, -0.23037999868392944, -0.07499241828918457, 0.08039522171020508, 0.23578283190727234, 0.3911704421043396, 0.5465580224990845, 0.7019456624984741, 0.8573333024978638, 1.0127208232879639, 1.1681084632873535, 1.3234961032867432, 1.4788837432861328, 1.6342713832855225, 1.7896589040756226, 1.9450465440750122, 2.1004343032836914, 2.255821704864502, 2.4112093448638916, 2.5665969848632812, 2.721984624862671, 2.8773722648620605, 3.03275990486145, 3.18814754486084, 3.3435349464416504, 3.49892258644104, 3.6543102264404297, 3.8096978664398193, 3.965085506439209, 4.1204729080200195, 4.275860786437988, 4.431248188018799, 4.586636066436768, 4.742023468017578, 4.897411346435547, 5.052798748016357]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 6.0, 18.0, 20.0, 33.0, 44.0, 78.0, 130.0, 225.0, 365.0, 562.0, 1117.0, 2158.0, 4691.0, 9717.0, 21331.0, 46683.0, 101242.0, 192673.0, 257286.0, 204917.0, 109961.0, 51048.0, 23299.0, 10674.0, 5051.0, 2374.0, 1253.0, 675.0, 358.0, 199.0, 125.0, 83.0, 55.0, 23.0, 24.0, 17.0, 10.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.44140625, -7.22607421875, -7.0107421875, -6.79541015625, -6.580078125, -6.36474609375, -6.1494140625, -5.93408203125, -5.71875, -5.50341796875, -5.2880859375, -5.07275390625, -4.857421875, -4.64208984375, -4.4267578125, -4.21142578125, -3.99609375, -3.78076171875, -3.5654296875, -3.35009765625, -3.134765625, -2.91943359375, -2.7041015625, -2.48876953125, -2.2734375, -2.05810546875, -1.8427734375, -1.62744140625, -1.412109375, -1.19677734375, -0.9814453125, -0.76611328125, -0.55078125, -0.33544921875, -0.1201171875, 0.09521484375, 0.310546875, 0.52587890625, 0.7412109375, 0.95654296875, 1.171875, 1.38720703125, 1.6025390625, 1.81787109375, 2.033203125, 2.24853515625, 2.4638671875, 2.67919921875, 2.89453125, 3.10986328125, 3.3251953125, 3.54052734375, 3.755859375, 3.97119140625, 4.1865234375, 4.40185546875, 4.6171875, 4.83251953125, 5.0478515625, 5.26318359375, 5.478515625, 5.69384765625, 5.9091796875, 6.12451171875, 6.33984375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 6.0, 12.0, 12.0, 10.0, 14.0, 22.0, 17.0, 22.0, 37.0, 21.0, 37.0, 38.0, 48.0, 41.0, 40.0, 59.0, 43.0, 55.0, 51.0, 50.0, 37.0, 36.0, 36.0, 28.0, 26.0, 38.0, 17.0, 25.0, 19.0, 17.0, 16.0, 12.0, 10.0, 11.0, 5.0, 3.0, 7.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76336669921875, -4.6087646484375, -4.45416259765625, -4.299560546875, -4.14495849609375, -3.9903564453125, -3.83575439453125, -3.68115234375, -3.52655029296875, -3.3719482421875, -3.21734619140625, -3.062744140625, -2.90814208984375, -2.7535400390625, -2.59893798828125, -2.4443359375, -2.28973388671875, -2.1351318359375, -1.98052978515625, -1.825927734375, -1.67132568359375, -1.5167236328125, -1.36212158203125, -1.20751953125, -1.05291748046875, -0.8983154296875, -0.74371337890625, -0.589111328125, -0.43450927734375, -0.2799072265625, -0.12530517578125, 0.029296875, 0.18389892578125, 0.3385009765625, 0.49310302734375, 0.647705078125, 0.80230712890625, 0.9569091796875, 1.11151123046875, 1.26611328125, 1.42071533203125, 1.5753173828125, 1.72991943359375, 1.884521484375, 2.03912353515625, 2.1937255859375, 2.34832763671875, 2.5029296875, 2.65753173828125, 2.8121337890625, 2.96673583984375, 3.121337890625, 3.27593994140625, 3.4305419921875, 3.58514404296875, 3.73974609375, 3.89434814453125, 4.0489501953125, 4.20355224609375, 4.358154296875, 4.51275634765625, 4.6673583984375, 4.82196044921875, 4.9765625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 8.0, 10.0, 14.0, 25.0, 45.0, 54.0, 105.0, 144.0, 210.0, 354.0, 531.0, 951.0, 1506.0, 2525.0, 4346.0, 7668.0, 13243.0, 23696.0, 42463.0, 74906.0, 123453.0, 172996.0, 188627.0, 153567.0, 101225.0, 59542.0, 33059.0, 18445.0, 10148.0, 5869.0, 3538.0, 2026.0, 1247.0, 740.0, 465.0, 266.0, 198.0, 111.0, 81.0, 58.0, 15.0, 21.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.77069091796875, -4.6077880859375, -4.44488525390625, -4.281982421875, -4.11907958984375, -3.9561767578125, -3.79327392578125, -3.63037109375, -3.46746826171875, -3.3045654296875, -3.14166259765625, -2.978759765625, -2.81585693359375, -2.6529541015625, -2.49005126953125, -2.3271484375, -2.16424560546875, -2.0013427734375, -1.83843994140625, -1.675537109375, -1.51263427734375, -1.3497314453125, -1.18682861328125, -1.02392578125, -0.86102294921875, -0.6981201171875, -0.53521728515625, -0.372314453125, -0.20941162109375, -0.0465087890625, 0.11639404296875, 0.279296875, 0.44219970703125, 0.6051025390625, 0.76800537109375, 0.930908203125, 1.09381103515625, 1.2567138671875, 1.41961669921875, 1.58251953125, 1.74542236328125, 1.9083251953125, 2.07122802734375, 2.234130859375, 2.39703369140625, 2.5599365234375, 2.72283935546875, 2.8857421875, 3.04864501953125, 3.2115478515625, 3.37445068359375, 3.537353515625, 3.70025634765625, 3.8631591796875, 4.02606201171875, 4.18896484375, 4.35186767578125, 4.5147705078125, 4.67767333984375, 4.840576171875, 5.00347900390625, 5.1663818359375, 5.32928466796875, 5.4921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 4.0, 5.0, 5.0, 2.0, 7.0, 9.0, 14.0, 9.0, 18.0, 5.0, 17.0, 21.0, 22.0, 32.0, 31.0, 25.0, 27.0, 32.0, 39.0, 38.0, 38.0, 49.0, 42.0, 28.0, 35.0, 40.0, 39.0, 37.0, 38.0, 33.0, 27.0, 25.0, 29.0, 38.0, 23.0, 15.0, 19.0, 15.0, 15.0, 12.0, 13.0, 8.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.78515625, -2.70452880859375, -2.6239013671875, -2.54327392578125, -2.462646484375, -2.38201904296875, -2.3013916015625, -2.22076416015625, -2.14013671875, -2.05950927734375, -1.9788818359375, -1.89825439453125, -1.817626953125, -1.73699951171875, -1.6563720703125, -1.57574462890625, -1.4951171875, -1.41448974609375, -1.3338623046875, -1.25323486328125, -1.172607421875, -1.09197998046875, -1.0113525390625, -0.93072509765625, -0.85009765625, -0.76947021484375, -0.6888427734375, -0.60821533203125, -0.527587890625, -0.44696044921875, -0.3663330078125, -0.28570556640625, -0.205078125, -0.12445068359375, -0.0438232421875, 0.03680419921875, 0.117431640625, 0.19805908203125, 0.2786865234375, 0.35931396484375, 0.43994140625, 0.52056884765625, 0.6011962890625, 0.68182373046875, 0.762451171875, 0.84307861328125, 0.9237060546875, 1.00433349609375, 1.0849609375, 1.16558837890625, 1.2462158203125, 1.32684326171875, 1.407470703125, 1.48809814453125, 1.5687255859375, 1.64935302734375, 1.72998046875, 1.81060791015625, 1.8912353515625, 1.97186279296875, 2.052490234375, 2.13311767578125, 2.2137451171875, 2.29437255859375, 2.375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 14.0, 14.0, 30.0, 35.0, 68.0, 81.0, 134.0, 164.0, 318.0, 502.0, 824.0, 1228.0, 1955.0, 3097.0, 5270.0, 8604.0, 14891.0, 25652.0, 44293.0, 76838.0, 123670.0, 175307.0, 187766.0, 147548.0, 94756.0, 56230.0, 32365.0, 18918.0, 10934.0, 6543.0, 4019.0, 2441.0, 1500.0, 922.0, 585.0, 360.0, 227.0, 158.0, 107.0, 47.0, 43.0, 27.0, 20.0, 12.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.056640625, -1.9927978515625, -1.928955078125, -1.8651123046875, -1.80126953125, -1.7374267578125, -1.673583984375, -1.6097412109375, -1.5458984375, -1.4820556640625, -1.418212890625, -1.3543701171875, -1.29052734375, -1.2266845703125, -1.162841796875, -1.0989990234375, -1.03515625, -0.9713134765625, -0.907470703125, -0.8436279296875, -0.77978515625, -0.7159423828125, -0.652099609375, -0.5882568359375, -0.5244140625, -0.4605712890625, -0.396728515625, -0.3328857421875, -0.26904296875, -0.2052001953125, -0.141357421875, -0.0775146484375, -0.013671875, 0.0501708984375, 0.114013671875, 0.1778564453125, 0.24169921875, 0.3055419921875, 0.369384765625, 0.4332275390625, 0.4970703125, 0.5609130859375, 0.624755859375, 0.6885986328125, 0.75244140625, 0.8162841796875, 0.880126953125, 0.9439697265625, 1.0078125, 1.0716552734375, 1.135498046875, 1.1993408203125, 1.26318359375, 1.3270263671875, 1.390869140625, 1.4547119140625, 1.5185546875, 1.5823974609375, 1.646240234375, 1.7100830078125, 1.77392578125, 1.8377685546875, 1.901611328125, 1.9654541015625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 4.0, 8.0, 8.0, 11.0, 20.0, 19.0, 36.0, 29.0, 37.0, 43.0, 69.0, 56.0, 53.0, 67.0, 63.0, 45.0, 62.0, 47.0, 53.0, 58.0, 43.0, 31.0, 27.0, 21.0, 14.0, 9.0, 18.0, 5.0, 2.0, 9.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000209808349609375, -0.00020316801965236664, -0.00019652768969535828, -0.00018988735973834991, -0.00018324702978134155, -0.0001766066998243332, -0.00016996636986732483, -0.00016332603991031647, -0.0001566857099533081, -0.00015004537999629974, -0.00014340505003929138, -0.00013676472008228302, -0.00013012439012527466, -0.0001234840601682663, -0.00011684373021125793, -0.00011020340025424957, -0.00010356307029724121, -9.692274034023285e-05, -9.028241038322449e-05, -8.364208042621613e-05, -7.700175046920776e-05, -7.03614205121994e-05, -6.372109055519104e-05, -5.708076059818268e-05, -5.0440430641174316e-05, -4.3800100684165955e-05, -3.715977072715759e-05, -3.051944077014923e-05, -2.387911081314087e-05, -1.7238780856132507e-05, -1.0598450899124146e-05, -3.958120942115784e-06, 2.682209014892578e-06, 9.32253897190094e-06, 1.5962868928909302e-05, 2.2603198885917664e-05, 2.9243528842926025e-05, 3.588385879993439e-05, 4.252418875694275e-05, 4.916451871395111e-05, 5.580484867095947e-05, 6.244517862796783e-05, 6.90855085849762e-05, 7.572583854198456e-05, 8.236616849899292e-05, 8.900649845600128e-05, 9.564682841300964e-05, 0.000102287158370018, 0.00010892748832702637, 0.00011556781828403473, 0.0001222081482410431, 0.00012884847819805145, 0.00013548880815505981, 0.00014212913811206818, 0.00014876946806907654, 0.0001554097980260849, 0.00016205012798309326, 0.00016869045794010162, 0.00017533078789710999, 0.00018197111785411835, 0.0001886114478111267, 0.00019525177776813507, 0.00020189210772514343, 0.0002085324376821518, 0.00021517276763916016]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 7.0, 15.0, 18.0, 22.0, 32.0, 54.0, 89.0, 152.0, 216.0, 315.0, 513.0, 913.0, 1566.0, 2483.0, 4612.0, 8381.0, 15286.0, 29767.0, 57955.0, 108770.0, 180719.0, 222041.0, 181300.0, 109791.0, 58357.0, 30130.0, 15771.0, 8448.0, 4509.0, 2481.0, 1434.0, 865.0, 574.0, 334.0, 216.0, 125.0, 105.0, 58.0, 47.0, 31.0, 14.0, 10.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.193359375, -2.1214599609375, -2.049560546875, -1.9776611328125, -1.90576171875, -1.8338623046875, -1.761962890625, -1.6900634765625, -1.6181640625, -1.5462646484375, -1.474365234375, -1.4024658203125, -1.33056640625, -1.2586669921875, -1.186767578125, -1.1148681640625, -1.04296875, -0.9710693359375, -0.899169921875, -0.8272705078125, -0.75537109375, -0.6834716796875, -0.611572265625, -0.5396728515625, -0.4677734375, -0.3958740234375, -0.323974609375, -0.2520751953125, -0.18017578125, -0.1082763671875, -0.036376953125, 0.0355224609375, 0.107421875, 0.1793212890625, 0.251220703125, 0.3231201171875, 0.39501953125, 0.4669189453125, 0.538818359375, 0.6107177734375, 0.6826171875, 0.7545166015625, 0.826416015625, 0.8983154296875, 0.97021484375, 1.0421142578125, 1.114013671875, 1.1859130859375, 1.2578125, 1.3297119140625, 1.401611328125, 1.4735107421875, 1.54541015625, 1.6173095703125, 1.689208984375, 1.7611083984375, 1.8330078125, 1.9049072265625, 1.976806640625, 2.0487060546875, 2.12060546875, 2.1925048828125, 2.264404296875, 2.3363037109375, 2.408203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 10.0, 8.0, 6.0, 18.0, 13.0, 25.0, 22.0, 28.0, 28.0, 30.0, 30.0, 28.0, 48.0, 45.0, 50.0, 40.0, 57.0, 57.0, 49.0, 43.0, 43.0, 52.0, 33.0, 31.0, 34.0, 22.0, 28.0, 25.0, 15.0, 9.0, 7.0, 13.0, 8.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58984375, -0.5725784301757812, -0.5553131103515625, -0.5380477905273438, -0.520782470703125, -0.5035171508789062, -0.4862518310546875, -0.46898651123046875, -0.45172119140625, -0.43445587158203125, -0.4171905517578125, -0.39992523193359375, -0.382659912109375, -0.36539459228515625, -0.3481292724609375, -0.33086395263671875, -0.3135986328125, -0.29633331298828125, -0.2790679931640625, -0.26180267333984375, -0.244537353515625, -0.22727203369140625, -0.2100067138671875, -0.19274139404296875, -0.17547607421875, -0.15821075439453125, -0.1409454345703125, -0.12368011474609375, -0.106414794921875, -0.08914947509765625, -0.0718841552734375, -0.05461883544921875, -0.037353515625, -0.02008819580078125, -0.0028228759765625, 0.01444244384765625, 0.031707763671875, 0.04897308349609375, 0.0662384033203125, 0.08350372314453125, 0.10076904296875, 0.11803436279296875, 0.1352996826171875, 0.15256500244140625, 0.169830322265625, 0.18709564208984375, 0.2043609619140625, 0.22162628173828125, 0.2388916015625, 0.25615692138671875, 0.2734222412109375, 0.29068756103515625, 0.307952880859375, 0.32521820068359375, 0.3424835205078125, 0.35974884033203125, 0.37701416015625, 0.39427947998046875, 0.4115447998046875, 0.42881011962890625, 0.446075439453125, 0.46334075927734375, 0.4806060791015625, 0.49787139892578125, 0.51513671875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 18.0, 17.0, 23.0, 13.0, 22.0, 23.0, 33.0, 49.0, 43.0, 63.0, 56.0, 58.0, 70.0, 59.0, 63.0, 62.0, 53.0, 37.0, 47.0, 27.0, 33.0, 19.0, 14.0, 17.0, 11.0, 8.0, 10.0, 9.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.388792514801025, -6.171700954437256, -5.954609394073486, -5.737517833709717, -5.520426273345947, -5.303334712982178, -5.086243152618408, -4.869151592254639, -4.652060031890869, -4.4349684715271, -4.21787691116333, -4.0007853507995605, -3.783693790435791, -3.5666022300720215, -3.349510669708252, -3.1324191093444824, -2.915327548980713, -2.6982359886169434, -2.481144428253174, -2.2640528678894043, -2.0469613075256348, -1.8298697471618652, -1.6127781867980957, -1.3956866264343262, -1.1785950660705566, -0.9615035057067871, -0.7444119453430176, -0.527320384979248, -0.3102288246154785, -0.09313726425170898, 0.12395429611206055, 0.3410458564758301, 0.5581374168395996, 0.7752289772033691, 0.9923205375671387, 1.2094120979309082, 1.4265036582946777, 1.6435952186584473, 1.8606867790222168, 2.0777783393859863, 2.294869899749756, 2.5119614601135254, 2.729053020477295, 2.9461445808410645, 3.163236141204834, 3.3803277015686035, 3.597419261932373, 3.8145108222961426, 4.031602382659912, 4.248693943023682, 4.465785503387451, 4.682877063751221, 4.89996862411499, 5.11706018447876, 5.334151744842529, 5.551243305206299, 5.768334865570068, 5.985426425933838, 6.202517986297607, 6.419609546661377, 6.6367011070251465, 6.853792667388916, 7.0708842277526855, 7.287975788116455, 7.505067348480225]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 7.0, 14.0, 7.0, 9.0, 21.0, 18.0, 26.0, 38.0, 24.0, 36.0, 33.0, 36.0, 54.0, 47.0, 44.0, 48.0, 56.0, 56.0, 60.0, 51.0, 45.0, 28.0, 41.0, 29.0, 31.0, 31.0, 24.0, 12.0, 12.0, 21.0, 11.0, 9.0, 3.0, 9.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.146744728088379, -4.987565040588379, -4.828384876251221, -4.6692047119140625, -4.5100250244140625, -4.3508453369140625, -4.191665172576904, -4.032485008239746, -3.873305320739746, -3.714125394821167, -3.554945468902588, -3.395765542984009, -3.2365856170654297, -3.0774056911468506, -2.9182257652282715, -2.7590458393096924, -2.5998659133911133, -2.440685987472534, -2.281506061553955, -2.122326135635376, -1.9631462097167969, -1.8039662837982178, -1.6447863578796387, -1.4856064319610596, -1.3264265060424805, -1.1672465801239014, -1.0080666542053223, -0.8488867282867432, -0.6897068023681641, -0.530526876449585, -0.37134695053100586, -0.21216702461242676, -0.05298662185668945, 0.10619330406188965, 0.26537322998046875, 0.42455315589904785, 0.583733081817627, 0.742913007736206, 0.9020929336547852, 1.0612728595733643, 1.2204527854919434, 1.3796327114105225, 1.5388126373291016, 1.6979925632476807, 1.8571724891662598, 2.016352415084839, 2.175532341003418, 2.334712266921997, 2.493892192840576, 2.6530721187591553, 2.8122520446777344, 2.9714319705963135, 3.1306118965148926, 3.2897918224334717, 3.448971748352051, 3.60815167427063, 3.767331600189209, 3.926511526107788, 4.085691452026367, 4.244871139526367, 4.404051303863525, 4.563231468200684, 4.722411155700684, 4.881590843200684, 5.040771007537842]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 5.0, 17.0, 21.0, 25.0, 36.0, 69.0, 82.0, 131.0, 231.0, 350.0, 568.0, 973.0, 1680.0, 2767.0, 5096.0, 9745.0, 20074.0, 45225.0, 116064.0, 341232.0, 1036173.0, 1541147.0, 707640.0, 222456.0, 78640.0, 32156.0, 14821.0, 7383.0, 3964.0, 2218.0, 1252.0, 726.0, 458.0, 296.0, 194.0, 99.0, 93.0, 45.0, 42.0, 26.0, 15.0, 11.0, 15.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.6796875, -8.41912841796875, -8.1585693359375, -7.89801025390625, -7.637451171875, -7.37689208984375, -7.1163330078125, -6.85577392578125, -6.59521484375, -6.33465576171875, -6.0740966796875, -5.81353759765625, -5.552978515625, -5.29241943359375, -5.0318603515625, -4.77130126953125, -4.5107421875, -4.25018310546875, -3.9896240234375, -3.72906494140625, -3.468505859375, -3.20794677734375, -2.9473876953125, -2.68682861328125, -2.42626953125, -2.16571044921875, -1.9051513671875, -1.64459228515625, -1.384033203125, -1.12347412109375, -0.8629150390625, -0.60235595703125, -0.341796875, -0.08123779296875, 0.1793212890625, 0.43988037109375, 0.700439453125, 0.96099853515625, 1.2215576171875, 1.48211669921875, 1.74267578125, 2.00323486328125, 2.2637939453125, 2.52435302734375, 2.784912109375, 3.04547119140625, 3.3060302734375, 3.56658935546875, 3.8271484375, 4.08770751953125, 4.3482666015625, 4.60882568359375, 4.869384765625, 5.12994384765625, 5.3905029296875, 5.65106201171875, 5.91162109375, 6.17218017578125, 6.4327392578125, 6.69329833984375, 6.953857421875, 7.21441650390625, 7.4749755859375, 7.73553466796875, 7.99609375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 11.0, 12.0, 18.0, 19.0, 17.0, 35.0, 32.0, 38.0, 36.0, 43.0, 39.0, 29.0, 43.0, 47.0, 47.0, 51.0, 62.0, 55.0, 46.0, 49.0, 41.0, 32.0, 28.0, 32.0, 20.0, 20.0, 15.0, 11.0, 12.0, 11.0, 12.0, 4.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.91796875, -3.799163818359375, -3.68035888671875, -3.561553955078125, -3.4427490234375, -3.323944091796875, -3.20513916015625, -3.086334228515625, -2.967529296875, -2.848724365234375, -2.72991943359375, -2.611114501953125, -2.4923095703125, -2.373504638671875, -2.25469970703125, -2.135894775390625, -2.01708984375, -1.898284912109375, -1.77947998046875, -1.660675048828125, -1.5418701171875, -1.423065185546875, -1.30426025390625, -1.185455322265625, -1.066650390625, -0.947845458984375, -0.82904052734375, -0.710235595703125, -0.5914306640625, -0.472625732421875, -0.35382080078125, -0.235015869140625, -0.1162109375, 0.002593994140625, 0.12139892578125, 0.240203857421875, 0.3590087890625, 0.477813720703125, 0.59661865234375, 0.715423583984375, 0.834228515625, 0.953033447265625, 1.07183837890625, 1.190643310546875, 1.3094482421875, 1.428253173828125, 1.54705810546875, 1.665863037109375, 1.78466796875, 1.903472900390625, 2.02227783203125, 2.141082763671875, 2.2598876953125, 2.378692626953125, 2.49749755859375, 2.616302490234375, 2.735107421875, 2.853912353515625, 2.97271728515625, 3.091522216796875, 3.2103271484375, 3.329132080078125, 3.44793701171875, 3.566741943359375, 3.685546875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 16.0, 14.0, 22.0, 24.0, 39.0, 55.0, 73.0, 124.0, 173.0, 282.0, 412.0, 674.0, 1025.0, 1711.0, 2626.0, 4494.0, 7675.0, 13561.0, 25259.0, 48642.0, 97089.0, 209106.0, 466660.0, 964655.0, 1150781.0, 640240.0, 288736.0, 132224.0, 63898.0, 32342.0, 17466.0, 9695.0, 5580.0, 3283.0, 2031.0, 1218.0, 820.0, 487.0, 347.0, 237.0, 159.0, 94.0, 69.0, 49.0, 34.0, 23.0, 22.0, 10.0, 4.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-7.13671875, -6.91510009765625, -6.6934814453125, -6.47186279296875, -6.250244140625, -6.02862548828125, -5.8070068359375, -5.58538818359375, -5.36376953125, -5.14215087890625, -4.9205322265625, -4.69891357421875, -4.477294921875, -4.25567626953125, -4.0340576171875, -3.81243896484375, -3.5908203125, -3.36920166015625, -3.1475830078125, -2.92596435546875, -2.704345703125, -2.48272705078125, -2.2611083984375, -2.03948974609375, -1.81787109375, -1.59625244140625, -1.3746337890625, -1.15301513671875, -0.931396484375, -0.70977783203125, -0.4881591796875, -0.26654052734375, -0.044921875, 0.17669677734375, 0.3983154296875, 0.61993408203125, 0.841552734375, 1.06317138671875, 1.2847900390625, 1.50640869140625, 1.72802734375, 1.94964599609375, 2.1712646484375, 2.39288330078125, 2.614501953125, 2.83612060546875, 3.0577392578125, 3.27935791015625, 3.5009765625, 3.72259521484375, 3.9442138671875, 4.16583251953125, 4.387451171875, 4.60906982421875, 4.8306884765625, 5.05230712890625, 5.27392578125, 5.49554443359375, 5.7171630859375, 5.93878173828125, 6.160400390625, 6.38201904296875, 6.6036376953125, 6.82525634765625, 7.046875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 5.0, 5.0, 7.0, 18.0, 12.0, 25.0, 44.0, 46.0, 49.0, 76.0, 102.0, 121.0, 143.0, 193.0, 257.0, 315.0, 331.0, 370.0, 346.0, 328.0, 260.0, 231.0, 176.0, 154.0, 109.0, 96.0, 64.0, 54.0, 27.0, 17.0, 20.0, 12.0, 12.0, 16.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.490875244140625, -2.41925048828125, -2.347625732421875, -2.2760009765625, -2.204376220703125, -2.13275146484375, -2.061126708984375, -1.989501953125, -1.917877197265625, -1.84625244140625, -1.774627685546875, -1.7030029296875, -1.631378173828125, -1.55975341796875, -1.488128662109375, -1.41650390625, -1.344879150390625, -1.27325439453125, -1.201629638671875, -1.1300048828125, -1.058380126953125, -0.98675537109375, -0.915130615234375, -0.843505859375, -0.771881103515625, -0.70025634765625, -0.628631591796875, -0.5570068359375, -0.485382080078125, -0.41375732421875, -0.342132568359375, -0.2705078125, -0.198883056640625, -0.12725830078125, -0.055633544921875, 0.0159912109375, 0.087615966796875, 0.15924072265625, 0.230865478515625, 0.302490234375, 0.374114990234375, 0.44573974609375, 0.517364501953125, 0.5889892578125, 0.660614013671875, 0.73223876953125, 0.803863525390625, 0.87548828125, 0.947113037109375, 1.01873779296875, 1.090362548828125, 1.1619873046875, 1.233612060546875, 1.30523681640625, 1.376861572265625, 1.448486328125, 1.520111083984375, 1.59173583984375, 1.663360595703125, 1.7349853515625, 1.806610107421875, 1.87823486328125, 1.949859619140625, 2.021484375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 7.0, 14.0, 10.0, 14.0, 24.0, 20.0, 41.0, 28.0, 41.0, 49.0, 72.0, 78.0, 65.0, 85.0, 67.0, 63.0, 55.0, 63.0, 39.0, 38.0, 26.0, 24.0, 13.0, 11.0, 14.0, 7.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.568060874938965, -8.318124771118164, -8.068188667297363, -7.8182525634765625, -7.568316459655762, -7.318380355834961, -7.06844425201416, -6.818508148193359, -6.568572044372559, -6.318635940551758, -6.068699836730957, -5.818763732910156, -5.5688276290893555, -5.318891525268555, -5.068955421447754, -4.819019317626953, -4.569083213806152, -4.319147109985352, -4.069211006164551, -3.81927490234375, -3.569338798522949, -3.3194026947021484, -3.0694665908813477, -2.819530487060547, -2.569594383239746, -2.3196582794189453, -2.0697221755981445, -1.8197860717773438, -1.569849967956543, -1.3199138641357422, -1.0699777603149414, -0.8200416564941406, -0.570106029510498, -0.32016992568969727, -0.07023382186889648, 0.1797022819519043, 0.4296383857727051, 0.6795744895935059, 0.9295105934143066, 1.1794466972351074, 1.4293828010559082, 1.679318904876709, 1.9292550086975098, 2.1791911125183105, 2.4291272163391113, 2.679063320159912, 2.928999423980713, 3.1789355278015137, 3.4288716316223145, 3.6788077354431152, 3.928743839263916, 4.178679943084717, 4.428616046905518, 4.678552150726318, 4.928488254547119, 5.17842435836792, 5.428360462188721, 5.6782965660095215, 5.928232669830322, 6.178168773651123, 6.428104877471924, 6.678040981292725, 6.927977085113525, 7.177913188934326, 7.427849292755127]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 6.0, 10.0, 17.0, 20.0, 26.0, 14.0, 20.0, 18.0, 27.0, 35.0, 30.0, 29.0, 41.0, 31.0, 31.0, 40.0, 45.0, 46.0, 43.0, 38.0, 41.0, 30.0, 53.0, 24.0, 29.0, 29.0, 32.0, 21.0, 20.0, 21.0, 21.0, 22.0, 17.0, 8.0, 8.0, 5.0, 7.0, 6.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.169615268707275, -4.043285369873047, -3.91695499420166, -3.7906248569488525, -3.664294719696045, -3.5379648208618164, -3.411634683609009, -3.285304546356201, -3.1589744091033936, -3.032644271850586, -2.9063141345977783, -2.7799839973449707, -2.653654098510742, -2.5273237228393555, -2.400993824005127, -2.2746636867523193, -2.1483335494995117, -2.022003412246704, -1.8956732749938965, -1.7693432569503784, -1.6430131196975708, -1.5166829824447632, -1.3903529644012451, -1.2640228271484375, -1.1376926898956299, -1.0113625526428223, -0.8850324749946594, -0.7587023973464966, -0.632372260093689, -0.5060421228408813, -0.3797120451927185, -0.25338196754455566, -0.12705206871032715, -0.0007219612598419189, 0.1256081461906433, 0.25193825364112854, 0.37826836109161377, 0.5045984983444214, 0.6309285759925842, 0.7572586536407471, 0.8835887908935547, 1.0099189281463623, 1.13624906539917, 1.262579083442688, 1.3889092206954956, 1.5152393579483032, 1.6415693759918213, 1.767899513244629, 1.8942296504974365, 2.020559787750244, 2.1468899250030518, 2.2732200622558594, 2.399549961090088, 2.5258803367614746, 2.652210235595703, 2.7785403728485107, 2.9048705101013184, 3.031200647354126, 3.1575307846069336, 3.283860921859741, 3.410191059112549, 3.5365209579467773, 3.662851095199585, 3.7891812324523926, 3.9155113697052]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 6.0, 10.0, 9.0, 15.0, 23.0, 36.0, 46.0, 89.0, 111.0, 206.0, 330.0, 526.0, 857.0, 1401.0, 2417.0, 3984.0, 6840.0, 11726.0, 20661.0, 36311.0, 64651.0, 109280.0, 165406.0, 196061.0, 166764.0, 109992.0, 64538.0, 36784.0, 20802.0, 11691.0, 6968.0, 3946.0, 2398.0, 1454.0, 843.0, 499.0, 309.0, 203.0, 127.0, 89.0, 55.0, 31.0, 23.0, 14.0, 12.0, 4.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.4296875, -3.330291748046875, -3.23089599609375, -3.131500244140625, -3.0321044921875, -2.932708740234375, -2.83331298828125, -2.733917236328125, -2.634521484375, -2.535125732421875, -2.43572998046875, -2.336334228515625, -2.2369384765625, -2.137542724609375, -2.03814697265625, -1.938751220703125, -1.83935546875, -1.739959716796875, -1.64056396484375, -1.541168212890625, -1.4417724609375, -1.342376708984375, -1.24298095703125, -1.143585205078125, -1.044189453125, -0.944793701171875, -0.84539794921875, -0.746002197265625, -0.6466064453125, -0.547210693359375, -0.44781494140625, -0.348419189453125, -0.2490234375, -0.149627685546875, -0.05023193359375, 0.049163818359375, 0.1485595703125, 0.247955322265625, 0.34735107421875, 0.446746826171875, 0.546142578125, 0.645538330078125, 0.74493408203125, 0.844329833984375, 0.9437255859375, 1.043121337890625, 1.14251708984375, 1.241912841796875, 1.34130859375, 1.440704345703125, 1.54010009765625, 1.639495849609375, 1.7388916015625, 1.838287353515625, 1.93768310546875, 2.037078857421875, 2.136474609375, 2.235870361328125, 2.33526611328125, 2.434661865234375, 2.5340576171875, 2.633453369140625, 2.73284912109375, 2.832244873046875, 2.931640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 8.0, 10.0, 10.0, 12.0, 20.0, 18.0, 18.0, 23.0, 16.0, 28.0, 29.0, 35.0, 28.0, 36.0, 41.0, 42.0, 41.0, 49.0, 58.0, 37.0, 39.0, 47.0, 27.0, 26.0, 33.0, 36.0, 23.0, 32.0, 24.0, 24.0, 18.0, 20.0, 17.0, 12.0, 9.0, 13.0, 8.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15234375, -4.01324462890625, -3.8741455078125, -3.73504638671875, -3.595947265625, -3.45684814453125, -3.3177490234375, -3.17864990234375, -3.03955078125, -2.90045166015625, -2.7613525390625, -2.62225341796875, -2.483154296875, -2.34405517578125, -2.2049560546875, -2.06585693359375, -1.9267578125, -1.78765869140625, -1.6485595703125, -1.50946044921875, -1.370361328125, -1.23126220703125, -1.0921630859375, -0.95306396484375, -0.81396484375, -0.67486572265625, -0.5357666015625, -0.39666748046875, -0.257568359375, -0.11846923828125, 0.0206298828125, 0.15972900390625, 0.298828125, 0.43792724609375, 0.5770263671875, 0.71612548828125, 0.855224609375, 0.99432373046875, 1.1334228515625, 1.27252197265625, 1.41162109375, 1.55072021484375, 1.6898193359375, 1.82891845703125, 1.968017578125, 2.10711669921875, 2.2462158203125, 2.38531494140625, 2.5244140625, 2.66351318359375, 2.8026123046875, 2.94171142578125, 3.080810546875, 3.21990966796875, 3.3590087890625, 3.49810791015625, 3.63720703125, 3.77630615234375, 3.9154052734375, 4.05450439453125, 4.193603515625, 4.33270263671875, 4.4718017578125, 4.61090087890625, 4.75]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 22.0, 18.0, 34.0, 40.0, 64.0, 81.0, 139.0, 180.0, 268.0, 385.0, 554.0, 792.0, 1191.0, 1771.0, 2712.0, 4077.0, 6220.0, 9655.0, 15069.0, 24007.0, 38049.0, 60442.0, 93929.0, 138190.0, 171804.0, 157934.0, 114283.0, 74934.0, 47821.0, 30127.0, 18878.0, 12010.0, 7750.0, 5038.0, 3240.0, 2185.0, 1457.0, 980.0, 684.0, 434.0, 327.0, 223.0, 182.0, 123.0, 87.0, 47.0, 31.0, 30.0, 12.0, 11.0, 5.0, 11.0, 7.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.890625, -2.799560546875, -2.70849609375, -2.617431640625, -2.5263671875, -2.435302734375, -2.34423828125, -2.253173828125, -2.162109375, -2.071044921875, -1.97998046875, -1.888916015625, -1.7978515625, -1.706787109375, -1.61572265625, -1.524658203125, -1.43359375, -1.342529296875, -1.25146484375, -1.160400390625, -1.0693359375, -0.978271484375, -0.88720703125, -0.796142578125, -0.705078125, -0.614013671875, -0.52294921875, -0.431884765625, -0.3408203125, -0.249755859375, -0.15869140625, -0.067626953125, 0.0234375, 0.114501953125, 0.20556640625, 0.296630859375, 0.3876953125, 0.478759765625, 0.56982421875, 0.660888671875, 0.751953125, 0.843017578125, 0.93408203125, 1.025146484375, 1.1162109375, 1.207275390625, 1.29833984375, 1.389404296875, 1.48046875, 1.571533203125, 1.66259765625, 1.753662109375, 1.8447265625, 1.935791015625, 2.02685546875, 2.117919921875, 2.208984375, 2.300048828125, 2.39111328125, 2.482177734375, 2.5732421875, 2.664306640625, 2.75537109375, 2.846435546875, 2.9375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 5.0, 13.0, 13.0, 17.0, 19.0, 25.0, 23.0, 25.0, 19.0, 27.0, 23.0, 40.0, 25.0, 38.0, 31.0, 34.0, 28.0, 38.0, 38.0, 53.0, 49.0, 39.0, 35.0, 32.0, 30.0, 34.0, 23.0, 21.0, 31.0, 25.0, 15.0, 17.0, 20.0, 15.0, 14.0, 9.0, 6.0, 10.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.423828125, -2.34619140625, -2.2685546875, -2.19091796875, -2.11328125, -2.03564453125, -1.9580078125, -1.88037109375, -1.802734375, -1.72509765625, -1.6474609375, -1.56982421875, -1.4921875, -1.41455078125, -1.3369140625, -1.25927734375, -1.181640625, -1.10400390625, -1.0263671875, -0.94873046875, -0.87109375, -0.79345703125, -0.7158203125, -0.63818359375, -0.560546875, -0.48291015625, -0.4052734375, -0.32763671875, -0.25, -0.17236328125, -0.0947265625, -0.01708984375, 0.060546875, 0.13818359375, 0.2158203125, 0.29345703125, 0.37109375, 0.44873046875, 0.5263671875, 0.60400390625, 0.681640625, 0.75927734375, 0.8369140625, 0.91455078125, 0.9921875, 1.06982421875, 1.1474609375, 1.22509765625, 1.302734375, 1.38037109375, 1.4580078125, 1.53564453125, 1.61328125, 1.69091796875, 1.7685546875, 1.84619140625, 1.923828125, 2.00146484375, 2.0791015625, 2.15673828125, 2.234375, 2.31201171875, 2.3896484375, 2.46728515625, 2.544921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 7.0, 17.0, 20.0, 26.0, 29.0, 42.0, 68.0, 114.0, 164.0, 251.0, 377.0, 589.0, 868.0, 1438.0, 2415.0, 4198.0, 7487.0, 13915.0, 27382.0, 55300.0, 115547.0, 226909.0, 274043.0, 160821.0, 76977.0, 37435.0, 18689.0, 9961.0, 5480.0, 3052.0, 1744.0, 1118.0, 680.0, 440.0, 312.0, 177.0, 134.0, 96.0, 57.0, 52.0, 29.0, 21.0, 18.0, 11.0, 8.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8344268798828125, -1.769439697265625, -1.7044525146484375, -1.63946533203125, -1.5744781494140625, -1.509490966796875, -1.4445037841796875, -1.3795166015625, -1.3145294189453125, -1.249542236328125, -1.1845550537109375, -1.11956787109375, -1.0545806884765625, -0.989593505859375, -0.9246063232421875, -0.859619140625, -0.7946319580078125, -0.729644775390625, -0.6646575927734375, -0.59967041015625, -0.5346832275390625, -0.469696044921875, -0.4047088623046875, -0.3397216796875, -0.2747344970703125, -0.209747314453125, -0.1447601318359375, -0.07977294921875, -0.0147857666015625, 0.050201416015625, 0.1151885986328125, 0.18017578125, 0.2451629638671875, 0.310150146484375, 0.3751373291015625, 0.44012451171875, 0.5051116943359375, 0.570098876953125, 0.6350860595703125, 0.7000732421875, 0.7650604248046875, 0.830047607421875, 0.8950347900390625, 0.96002197265625, 1.0250091552734375, 1.089996337890625, 1.1549835205078125, 1.219970703125, 1.2849578857421875, 1.349945068359375, 1.4149322509765625, 1.47991943359375, 1.5449066162109375, 1.609893798828125, 1.6748809814453125, 1.7398681640625, 1.8048553466796875, 1.869842529296875, 1.9348297119140625, 1.99981689453125, 2.0648040771484375, 2.129791259765625, 2.1947784423828125, 2.259765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 7.0, 12.0, 12.0, 15.0, 16.0, 31.0, 30.0, 44.0, 58.0, 56.0, 64.0, 75.0, 76.0, 88.0, 71.0, 53.0, 52.0, 50.0, 39.0, 28.0, 19.0, 22.0, 23.0, 11.0, 13.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00015425682067871094, -0.00014993548393249512, -0.0001456141471862793, -0.00014129281044006348, -0.00013697147369384766, -0.00013265013694763184, -0.00012832880020141602, -0.0001240074634552002, -0.00011968612670898438, -0.00011536478996276855, -0.00011104345321655273, -0.00010672211647033691, -0.0001024007797241211, -9.807944297790527e-05, -9.375810623168945e-05, -8.943676948547363e-05, -8.511543273925781e-05, -8.079409599304199e-05, -7.647275924682617e-05, -7.215142250061035e-05, -6.783008575439453e-05, -6.350874900817871e-05, -5.918741226196289e-05, -5.486607551574707e-05, -5.054473876953125e-05, -4.622340202331543e-05, -4.190206527709961e-05, -3.758072853088379e-05, -3.325939178466797e-05, -2.893805503845215e-05, -2.4616718292236328e-05, -2.0295381546020508e-05, -1.5974044799804688e-05, -1.1652708053588867e-05, -7.331371307373047e-06, -3.0100345611572266e-06, 1.3113021850585938e-06, 5.632638931274414e-06, 9.953975677490234e-06, 1.4275312423706055e-05, 1.8596649169921875e-05, 2.2917985916137695e-05, 2.7239322662353516e-05, 3.1560659408569336e-05, 3.5881996154785156e-05, 4.0203332901000977e-05, 4.45246696472168e-05, 4.884600639343262e-05, 5.316734313964844e-05, 5.748867988586426e-05, 6.181001663208008e-05, 6.61313533782959e-05, 7.045269012451172e-05, 7.477402687072754e-05, 7.909536361694336e-05, 8.341670036315918e-05, 8.7738037109375e-05, 9.205937385559082e-05, 9.638071060180664e-05, 0.00010070204734802246, 0.00010502338409423828, 0.0001093447208404541, 0.00011366605758666992, 0.00011798739433288574, 0.00012230873107910156]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 19.0, 38.0, 55.0, 63.0, 109.0, 199.0, 301.0, 513.0, 822.0, 1470.0, 2615.0, 4874.0, 9375.0, 19144.0, 41029.0, 88232.0, 176137.0, 257422.0, 217186.0, 119724.0, 56605.0, 26062.0, 12400.0, 6315.0, 3330.0, 1826.0, 1063.0, 606.0, 369.0, 231.0, 138.0, 104.0, 63.0, 38.0, 24.0, 8.0, 11.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1328125, -2.0695343017578125, -2.006256103515625, -1.9429779052734375, -1.87969970703125, -1.8164215087890625, -1.753143310546875, -1.6898651123046875, -1.6265869140625, -1.5633087158203125, -1.500030517578125, -1.4367523193359375, -1.37347412109375, -1.3101959228515625, -1.246917724609375, -1.1836395263671875, -1.120361328125, -1.0570831298828125, -0.993804931640625, -0.9305267333984375, -0.86724853515625, -0.8039703369140625, -0.740692138671875, -0.6774139404296875, -0.6141357421875, -0.5508575439453125, -0.487579345703125, -0.4243011474609375, -0.36102294921875, -0.2977447509765625, -0.234466552734375, -0.1711883544921875, -0.10791015625, -0.0446319580078125, 0.018646240234375, 0.0819244384765625, 0.14520263671875, 0.2084808349609375, 0.271759033203125, 0.3350372314453125, 0.3983154296875, 0.4615936279296875, 0.524871826171875, 0.5881500244140625, 0.65142822265625, 0.7147064208984375, 0.777984619140625, 0.8412628173828125, 0.904541015625, 0.9678192138671875, 1.031097412109375, 1.0943756103515625, 1.15765380859375, 1.2209320068359375, 1.284210205078125, 1.3474884033203125, 1.4107666015625, 1.4740447998046875, 1.537322998046875, 1.6006011962890625, 1.66387939453125, 1.7271575927734375, 1.790435791015625, 1.8537139892578125, 1.9169921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 14.0, 8.0, 9.0, 10.0, 13.0, 20.0, 23.0, 21.0, 36.0, 26.0, 40.0, 38.0, 55.0, 45.0, 56.0, 65.0, 73.0, 51.0, 57.0, 50.0, 44.0, 43.0, 37.0, 36.0, 22.0, 17.0, 15.0, 16.0, 16.0, 13.0, 6.0, 4.0, 7.0, 5.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3710136413574219, -0.35701751708984375, -0.3430213928222656, -0.3290252685546875, -0.3150291442871094, -0.30103302001953125, -0.2870368957519531, -0.273040771484375, -0.2590446472167969, -0.24504852294921875, -0.23105239868164062, -0.2170562744140625, -0.20306015014648438, -0.18906402587890625, -0.17506790161132812, -0.16107177734375, -0.14707565307617188, -0.13307952880859375, -0.11908340454101562, -0.1050872802734375, -0.09109115600585938, -0.07709503173828125, -0.06309890747070312, -0.049102783203125, -0.035106658935546875, -0.02111053466796875, -0.007114410400390625, 0.0068817138671875, 0.020877838134765625, 0.03487396240234375, 0.048870086669921875, 0.0628662109375, 0.07686233520507812, 0.09085845947265625, 0.10485458374023438, 0.1188507080078125, 0.13284683227539062, 0.14684295654296875, 0.16083908081054688, 0.174835205078125, 0.18883132934570312, 0.20282745361328125, 0.21682357788085938, 0.2308197021484375, 0.24481582641601562, 0.25881195068359375, 0.2728080749511719, 0.28680419921875, 0.3008003234863281, 0.31479644775390625, 0.3287925720214844, 0.3427886962890625, 0.3567848205566406, 0.37078094482421875, 0.3847770690917969, 0.398773193359375, 0.4127693176269531, 0.42676544189453125, 0.4407615661621094, 0.4547576904296875, 0.4687538146972656, 0.48274993896484375, 0.4967460632324219, 0.5107421875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 3.0, 16.0, 13.0, 14.0, 24.0, 21.0, 39.0, 35.0, 40.0, 51.0, 73.0, 76.0, 63.0, 85.0, 78.0, 60.0, 54.0, 54.0, 41.0, 35.0, 31.0, 15.0, 15.0, 14.0, 10.0, 5.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.66557502746582, -8.418362617492676, -8.171150207519531, -7.9239373207092285, -7.676724433898926, -7.429512023925781, -7.182299613952637, -6.935086727142334, -6.687873840332031, -6.440661430358887, -6.193448543548584, -5.9462361335754395, -5.699023246765137, -5.451810836791992, -5.204598426818848, -4.957385540008545, -4.7101731300354, -4.462960720062256, -4.215747833251953, -3.9685354232788086, -3.721322536468506, -3.4741101264953613, -3.2268974781036377, -2.979684829711914, -2.7324721813201904, -2.485259532928467, -2.238046884536743, -1.990834355354309, -1.7436217069625854, -1.4964090585708618, -1.2491965293884277, -1.001983880996704, -0.7547707557678223, -0.5075581073760986, -0.2603455185890198, -0.013132929801940918, 0.23407971858978271, 0.48129236698150635, 0.7285048961639404, 0.9757175445556641, 1.2229301929473877, 1.4701428413391113, 1.717355489730835, 1.964568018913269, 2.211780548095703, 2.458993434906006, 2.7062058448791504, 2.953418493270874, 3.2006311416625977, 3.4478437900543213, 3.695056438446045, 3.9422688484191895, 4.189481735229492, 4.436694145202637, 4.683906555175781, 4.931119441986084, 5.178332328796387, 5.425544738769531, 5.672757625579834, 5.9199700355529785, 6.167182922363281, 6.414395332336426, 6.66160774230957, 6.908820629119873, 7.156033039093018]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 2.0, 4.0, 11.0, 12.0, 20.0, 28.0, 17.0, 14.0, 22.0, 30.0, 29.0, 32.0, 35.0, 32.0, 36.0, 38.0, 35.0, 50.0, 49.0, 38.0, 44.0, 42.0, 31.0, 46.0, 32.0, 20.0, 42.0, 29.0, 15.0, 26.0, 22.0, 19.0, 19.0, 9.0, 14.0, 7.0, 2.0, 10.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.1894402503967285, -4.062045574188232, -3.9346511363983154, -3.8072564601898193, -3.6798620223999023, -3.5524673461914062, -3.42507266998291, -3.297678232192993, -3.170283794403076, -3.04288911819458, -2.915494680404663, -2.788100004196167, -2.66070556640625, -2.533310890197754, -2.405916213989258, -2.278521776199341, -2.1511270999908447, -2.0237324237823486, -1.8963379859924316, -1.7689433097839355, -1.6415488719940186, -1.5141541957855225, -1.386759638786316, -1.2593650817871094, -1.1319705247879028, -1.0045759677886963, -0.8771814107894897, -0.7497867941856384, -0.6223922371864319, -0.49499768018722534, -0.367603063583374, -0.24020850658416748, -0.11281371116638184, 0.014580860733985901, 0.14197543263435364, 0.26937001943588257, 0.3967645764350891, 0.5241591334342957, 0.651553750038147, 0.7789483070373535, 0.9063428640365601, 1.0337374210357666, 1.1611319780349731, 1.2885265350341797, 1.4159212112426758, 1.5433156490325928, 1.6707103252410889, 1.7981048822402954, 1.925499439239502, 2.052894115447998, 2.180288553237915, 2.307683229446411, 2.435077667236328, 2.562472343444824, 2.6898670196533203, 2.8172614574432373, 2.9446558952331543, 3.0720505714416504, 3.1994450092315674, 3.3268396854400635, 3.4542341232299805, 3.5816287994384766, 3.7090234756469727, 3.8364179134368896, 3.9638125896453857]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 20.0, 20.0, 32.0, 46.0, 79.0, 104.0, 167.0, 297.0, 446.0, 687.0, 1067.0, 1818.0, 3035.0, 5196.0, 9205.0, 16322.0, 28885.0, 51791.0, 90325.0, 144065.0, 190691.0, 183706.0, 133115.0, 81232.0, 45868.0, 25950.0, 14528.0, 8080.0, 4615.0, 2732.0, 1636.0, 1027.0, 611.0, 418.0, 269.0, 145.0, 112.0, 72.0, 48.0, 25.0, 17.0, 7.0, 9.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.484375, -5.306884765625, -5.12939453125, -4.951904296875, -4.7744140625, -4.596923828125, -4.41943359375, -4.241943359375, -4.064453125, -3.886962890625, -3.70947265625, -3.531982421875, -3.3544921875, -3.177001953125, -2.99951171875, -2.822021484375, -2.64453125, -2.467041015625, -2.28955078125, -2.112060546875, -1.9345703125, -1.757080078125, -1.57958984375, -1.402099609375, -1.224609375, -1.047119140625, -0.86962890625, -0.692138671875, -0.5146484375, -0.337158203125, -0.15966796875, 0.017822265625, 0.1953125, 0.372802734375, 0.55029296875, 0.727783203125, 0.9052734375, 1.082763671875, 1.26025390625, 1.437744140625, 1.615234375, 1.792724609375, 1.97021484375, 2.147705078125, 2.3251953125, 2.502685546875, 2.68017578125, 2.857666015625, 3.03515625, 3.212646484375, 3.39013671875, 3.567626953125, 3.7451171875, 3.922607421875, 4.10009765625, 4.277587890625, 4.455078125, 4.632568359375, 4.81005859375, 4.987548828125, 5.1650390625, 5.342529296875, 5.52001953125, 5.697509765625, 5.875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 12.0, 19.0, 11.0, 15.0, 15.0, 27.0, 31.0, 25.0, 33.0, 34.0, 27.0, 32.0, 36.0, 45.0, 48.0, 38.0, 50.0, 45.0, 45.0, 55.0, 43.0, 37.0, 38.0, 29.0, 26.0, 25.0, 17.0, 28.0, 17.0, 18.0, 11.0, 17.0, 6.0, 8.0, 8.0, 1.0, 4.0, 2.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01953125, -4.8702392578125, -4.720947265625, -4.5716552734375, -4.42236328125, -4.2730712890625, -4.123779296875, -3.9744873046875, -3.8251953125, -3.6759033203125, -3.526611328125, -3.3773193359375, -3.22802734375, -3.0787353515625, -2.929443359375, -2.7801513671875, -2.630859375, -2.4815673828125, -2.332275390625, -2.1829833984375, -2.03369140625, -1.8843994140625, -1.735107421875, -1.5858154296875, -1.4365234375, -1.2872314453125, -1.137939453125, -0.9886474609375, -0.83935546875, -0.6900634765625, -0.540771484375, -0.3914794921875, -0.2421875, -0.0928955078125, 0.056396484375, 0.2056884765625, 0.35498046875, 0.5042724609375, 0.653564453125, 0.8028564453125, 0.9521484375, 1.1014404296875, 1.250732421875, 1.4000244140625, 1.54931640625, 1.6986083984375, 1.847900390625, 1.9971923828125, 2.146484375, 2.2957763671875, 2.445068359375, 2.5943603515625, 2.74365234375, 2.8929443359375, 3.042236328125, 3.1915283203125, 3.3408203125, 3.4901123046875, 3.639404296875, 3.7886962890625, 3.93798828125, 4.0872802734375, 4.236572265625, 4.3858642578125, 4.53515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 14.0, 19.0, 36.0, 54.0, 78.0, 83.0, 119.0, 203.0, 268.0, 406.0, 630.0, 903.0, 1364.0, 2071.0, 3225.0, 4776.0, 7571.0, 12188.0, 19247.0, 30649.0, 47907.0, 73980.0, 106532.0, 138380.0, 150542.0, 137991.0, 105519.0, 72940.0, 47833.0, 30269.0, 19102.0, 12109.0, 7521.0, 4860.0, 3004.0, 1980.0, 1368.0, 915.0, 588.0, 428.0, 298.0, 154.0, 147.0, 86.0, 45.0, 40.0, 36.0, 26.0, 18.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0], "bins": [-4.6171875, -4.47930908203125, -4.3414306640625, -4.20355224609375, -4.065673828125, -3.92779541015625, -3.7899169921875, -3.65203857421875, -3.51416015625, -3.37628173828125, -3.2384033203125, -3.10052490234375, -2.962646484375, -2.82476806640625, -2.6868896484375, -2.54901123046875, -2.4111328125, -2.27325439453125, -2.1353759765625, -1.99749755859375, -1.859619140625, -1.72174072265625, -1.5838623046875, -1.44598388671875, -1.30810546875, -1.17022705078125, -1.0323486328125, -0.89447021484375, -0.756591796875, -0.61871337890625, -0.4808349609375, -0.34295654296875, -0.205078125, -0.06719970703125, 0.0706787109375, 0.20855712890625, 0.346435546875, 0.48431396484375, 0.6221923828125, 0.76007080078125, 0.89794921875, 1.03582763671875, 1.1737060546875, 1.31158447265625, 1.449462890625, 1.58734130859375, 1.7252197265625, 1.86309814453125, 2.0009765625, 2.13885498046875, 2.2767333984375, 2.41461181640625, 2.552490234375, 2.69036865234375, 2.8282470703125, 2.96612548828125, 3.10400390625, 3.24188232421875, 3.3797607421875, 3.51763916015625, 3.655517578125, 3.79339599609375, 3.9312744140625, 4.06915283203125, 4.20703125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 10.0, 13.0, 12.0, 13.0, 17.0, 27.0, 28.0, 27.0, 30.0, 35.0, 31.0, 29.0, 44.0, 42.0, 45.0, 43.0, 39.0, 29.0, 38.0, 47.0, 36.0, 35.0, 42.0, 35.0, 41.0, 31.0, 21.0, 23.0, 22.0, 19.0, 19.0, 19.0, 9.0, 12.0, 5.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.917327880859375, -2.83074951171875, -2.744171142578125, -2.6575927734375, -2.571014404296875, -2.48443603515625, -2.397857666015625, -2.311279296875, -2.224700927734375, -2.13812255859375, -2.051544189453125, -1.9649658203125, -1.878387451171875, -1.79180908203125, -1.705230712890625, -1.61865234375, -1.532073974609375, -1.44549560546875, -1.358917236328125, -1.2723388671875, -1.185760498046875, -1.09918212890625, -1.012603759765625, -0.926025390625, -0.839447021484375, -0.75286865234375, -0.666290283203125, -0.5797119140625, -0.493133544921875, -0.40655517578125, -0.319976806640625, -0.2333984375, -0.146820068359375, -0.06024169921875, 0.026336669921875, 0.1129150390625, 0.199493408203125, 0.28607177734375, 0.372650146484375, 0.459228515625, 0.545806884765625, 0.63238525390625, 0.718963623046875, 0.8055419921875, 0.892120361328125, 0.97869873046875, 1.065277099609375, 1.15185546875, 1.238433837890625, 1.32501220703125, 1.411590576171875, 1.4981689453125, 1.584747314453125, 1.67132568359375, 1.757904052734375, 1.844482421875, 1.931060791015625, 2.01763916015625, 2.104217529296875, 2.1907958984375, 2.277374267578125, 2.36395263671875, 2.450531005859375, 2.537109375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 19.0, 20.0, 37.0, 50.0, 65.0, 112.0, 132.0, 173.0, 248.0, 378.0, 545.0, 777.0, 1268.0, 1879.0, 3177.0, 5505.0, 9817.0, 18416.0, 36199.0, 72541.0, 139870.0, 218760.0, 226060.0, 149274.0, 78977.0, 38957.0, 19696.0, 10447.0, 5826.0, 3285.0, 2040.0, 1298.0, 818.0, 559.0, 376.0, 271.0, 197.0, 125.0, 99.0, 69.0, 53.0, 35.0, 38.0, 10.0, 14.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.701171875, -2.621856689453125, -2.54254150390625, -2.463226318359375, -2.3839111328125, -2.304595947265625, -2.22528076171875, -2.145965576171875, -2.066650390625, -1.987335205078125, -1.90802001953125, -1.828704833984375, -1.7493896484375, -1.670074462890625, -1.59075927734375, -1.511444091796875, -1.43212890625, -1.352813720703125, -1.27349853515625, -1.194183349609375, -1.1148681640625, -1.035552978515625, -0.95623779296875, -0.876922607421875, -0.797607421875, -0.718292236328125, -0.63897705078125, -0.559661865234375, -0.4803466796875, -0.401031494140625, -0.32171630859375, -0.242401123046875, -0.1630859375, -0.083770751953125, -0.00445556640625, 0.074859619140625, 0.1541748046875, 0.233489990234375, 0.31280517578125, 0.392120361328125, 0.471435546875, 0.550750732421875, 0.63006591796875, 0.709381103515625, 0.7886962890625, 0.868011474609375, 0.94732666015625, 1.026641845703125, 1.10595703125, 1.185272216796875, 1.26458740234375, 1.343902587890625, 1.4232177734375, 1.502532958984375, 1.58184814453125, 1.661163330078125, 1.740478515625, 1.819793701171875, 1.89910888671875, 1.978424072265625, 2.0577392578125, 2.137054443359375, 2.21636962890625, 2.295684814453125, 2.375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 4.0, 22.0, 19.0, 27.0, 27.0, 46.0, 43.0, 57.0, 92.0, 86.0, 98.0, 93.0, 79.0, 53.0, 57.0, 50.0, 34.0, 21.0, 21.0, 15.0, 9.0, 10.0, 13.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00041484832763671875, -0.0004055984318256378, -0.0003963485360145569, -0.00038709864020347595, -0.000377848744392395, -0.0003685988485813141, -0.00035934895277023315, -0.0003500990569591522, -0.0003408491611480713, -0.00033159926533699036, -0.0003223493695259094, -0.0003130994737148285, -0.00030384957790374756, -0.0002945996820926666, -0.0002853497862815857, -0.00027609989047050476, -0.00026684999465942383, -0.0002576000988483429, -0.00024835020303726196, -0.00023910030722618103, -0.0002298504114151001, -0.00022060051560401917, -0.00021135061979293823, -0.0002021007239818573, -0.00019285082817077637, -0.00018360093235969543, -0.0001743510365486145, -0.00016510114073753357, -0.00015585124492645264, -0.0001466013491153717, -0.00013735145330429077, -0.00012810155749320984, -0.0001188516616821289, -0.00010960176587104797, -0.00010035187005996704, -9.110197424888611e-05, -8.185207843780518e-05, -7.260218262672424e-05, -6.335228681564331e-05, -5.410239100456238e-05, -4.4852495193481445e-05, -3.560259938240051e-05, -2.635270357131958e-05, -1.7102807760238647e-05, -7.852911949157715e-06, 1.3969838619232178e-06, 1.064687967300415e-05, 1.9896775484085083e-05, 2.9146671295166016e-05, 3.839656710624695e-05, 4.764646291732788e-05, 5.6896358728408813e-05, 6.614625453948975e-05, 7.539615035057068e-05, 8.464604616165161e-05, 9.389594197273254e-05, 0.00010314583778381348, 0.00011239573359489441, 0.00012164562940597534, 0.00013089552521705627, 0.0001401454210281372, 0.00014939531683921814, 0.00015864521265029907, 0.00016789510846138, 0.00017714500427246094]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 17.0, 12.0, 24.0, 34.0, 58.0, 67.0, 118.0, 175.0, 257.0, 414.0, 682.0, 1100.0, 1814.0, 3103.0, 5359.0, 9845.0, 19189.0, 39908.0, 83058.0, 160295.0, 239258.0, 220849.0, 131592.0, 65142.0, 31210.0, 15762.0, 8195.0, 4443.0, 2524.0, 1544.0, 898.0, 538.0, 356.0, 239.0, 146.0, 95.0, 76.0, 48.0, 30.0, 19.0, 11.0, 14.0, 4.0, 3.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5, -2.421478271484375, -2.34295654296875, -2.264434814453125, -2.1859130859375, -2.107391357421875, -2.02886962890625, -1.950347900390625, -1.871826171875, -1.793304443359375, -1.71478271484375, -1.636260986328125, -1.5577392578125, -1.479217529296875, -1.40069580078125, -1.322174072265625, -1.24365234375, -1.165130615234375, -1.08660888671875, -1.008087158203125, -0.9295654296875, -0.851043701171875, -0.77252197265625, -0.694000244140625, -0.615478515625, -0.536956787109375, -0.45843505859375, -0.379913330078125, -0.3013916015625, -0.222869873046875, -0.14434814453125, -0.065826416015625, 0.0126953125, 0.091217041015625, 0.16973876953125, 0.248260498046875, 0.3267822265625, 0.405303955078125, 0.48382568359375, 0.562347412109375, 0.640869140625, 0.719390869140625, 0.79791259765625, 0.876434326171875, 0.9549560546875, 1.033477783203125, 1.11199951171875, 1.190521240234375, 1.26904296875, 1.347564697265625, 1.42608642578125, 1.504608154296875, 1.5831298828125, 1.661651611328125, 1.74017333984375, 1.818695068359375, 1.897216796875, 1.975738525390625, 2.05426025390625, 2.132781982421875, 2.2113037109375, 2.289825439453125, 2.36834716796875, 2.446868896484375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 14.0, 8.0, 8.0, 12.0, 12.0, 14.0, 22.0, 23.0, 25.0, 33.0, 32.0, 44.0, 46.0, 42.0, 66.0, 49.0, 57.0, 54.0, 51.0, 43.0, 49.0, 41.0, 27.0, 34.0, 41.0, 30.0, 21.0, 19.0, 16.0, 11.0, 8.0, 4.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46240234375, -0.444915771484375, -0.42742919921875, -0.409942626953125, -0.3924560546875, -0.374969482421875, -0.35748291015625, -0.339996337890625, -0.322509765625, -0.305023193359375, -0.28753662109375, -0.270050048828125, -0.2525634765625, -0.235076904296875, -0.21759033203125, -0.200103759765625, -0.1826171875, -0.165130615234375, -0.14764404296875, -0.130157470703125, -0.1126708984375, -0.095184326171875, -0.07769775390625, -0.060211181640625, -0.042724609375, -0.025238037109375, -0.00775146484375, 0.009735107421875, 0.0272216796875, 0.044708251953125, 0.06219482421875, 0.079681396484375, 0.09716796875, 0.114654541015625, 0.13214111328125, 0.149627685546875, 0.1671142578125, 0.184600830078125, 0.20208740234375, 0.219573974609375, 0.237060546875, 0.254547119140625, 0.27203369140625, 0.289520263671875, 0.3070068359375, 0.324493408203125, 0.34197998046875, 0.359466552734375, 0.376953125, 0.394439697265625, 0.41192626953125, 0.429412841796875, 0.4468994140625, 0.464385986328125, 0.48187255859375, 0.499359130859375, 0.516845703125, 0.534332275390625, 0.55181884765625, 0.569305419921875, 0.5867919921875, 0.604278564453125, 0.62176513671875, 0.639251708984375, 0.65673828125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 9.0, 7.0, 10.0, 12.0, 19.0, 19.0, 35.0, 41.0, 42.0, 49.0, 69.0, 64.0, 74.0, 93.0, 81.0, 67.0, 68.0, 48.0, 46.0, 32.0, 25.0, 30.0, 12.0, 9.0, 5.0, 14.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.590655326843262, -10.321578979492188, -10.052502632141113, -9.783426284790039, -9.514350891113281, -9.245274543762207, -8.976198196411133, -8.707121849060059, -8.438045501708984, -8.16896915435791, -7.899892807006836, -7.63081693649292, -7.361740589141846, -7.0926642417907715, -6.8235883712768555, -6.554512023925781, -6.285435676574707, -6.016359329223633, -5.747282981872559, -5.478207111358643, -5.209130764007568, -4.940054416656494, -4.670978546142578, -4.401902198791504, -4.13282585144043, -3.8637495040893555, -3.5946733951568604, -3.3255972862243652, -3.056520938873291, -2.787444591522217, -2.5183684825897217, -2.2492923736572266, -1.9802160263061523, -1.7111397981643677, -1.442063570022583, -1.1729873418807983, -0.9039111137390137, -0.634834885597229, -0.36575865745544434, -0.09668242931365967, 0.172393798828125, 0.44147002696990967, 0.7105462551116943, 0.979622483253479, 1.2486987113952637, 1.5177749395370483, 1.786851167678833, 2.055927276611328, 2.3250036239624023, 2.5940799713134766, 2.8631560802459717, 3.132232189178467, 3.401308536529541, 3.6703848838806152, 3.9394609928131104, 4.2085371017456055, 4.47761344909668, 4.746689796447754, 5.015766143798828, 5.284842014312744, 5.553918361663818, 5.822994709014893, 6.092070579528809, 6.361146926879883, 6.630223274230957]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 7.0, 6.0, 13.0, 13.0, 12.0, 18.0, 7.0, 18.0, 26.0, 23.0, 41.0, 34.0, 46.0, 35.0, 34.0, 26.0, 28.0, 40.0, 42.0, 42.0, 48.0, 39.0, 33.0, 42.0, 33.0, 43.0, 25.0, 25.0, 30.0, 25.0, 18.0, 23.0, 17.0, 11.0, 9.0, 9.0, 6.0, 8.0, 13.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.17221736907959, -4.0430169105529785, -3.9138166904449463, -3.784616470336914, -3.6554160118103027, -3.5262157917022705, -3.3970155715942383, -3.267815113067627, -3.1386148929595947, -3.0094146728515625, -2.880214214324951, -2.751013994216919, -2.6218137741088867, -2.4926133155822754, -2.363413095474243, -2.234212875366211, -2.1050124168395996, -1.9758120775222778, -1.846611738204956, -1.7174115180969238, -1.588211178779602, -1.4590108394622803, -1.329810619354248, -1.2006102800369263, -1.0714099407196045, -0.9422096014022827, -0.8130093216896057, -0.6838090419769287, -0.5546087026596069, -0.42540836334228516, -0.29620808362960815, -0.16700780391693115, -0.03780698776245117, 0.09139332175254822, 0.2205936312675476, 0.349793940782547, 0.4789942502975464, 0.6081945896148682, 0.7373948693275452, 0.8665951490402222, 0.995795488357544, 1.1249958276748657, 1.2541961669921875, 1.3833963871002197, 1.5125967264175415, 1.6417970657348633, 1.7709972858428955, 1.9001976251602173, 2.029397964477539, 2.1585981845855713, 2.2877986431121826, 2.416998863220215, 2.546199321746826, 2.6753995418548584, 2.8045997619628906, 2.933800220489502, 3.063000440597534, 3.1922006607055664, 3.3214011192321777, 3.45060133934021, 3.579801559448242, 3.7090020179748535, 3.8382022380828857, 3.967402458190918, 4.096602916717529]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 6.0, 8.0, 15.0, 15.0, 19.0, 43.0, 60.0, 77.0, 138.0, 221.0, 388.0, 665.0, 1221.0, 2207.0, 4004.0, 7323.0, 14534.0, 30164.0, 71018.0, 195507.0, 623944.0, 1506508.0, 1140742.0, 380077.0, 124164.0, 47775.0, 21203.0, 10337.0, 5215.0, 2831.0, 1536.0, 928.0, 551.0, 314.0, 210.0, 105.0, 77.0, 50.0, 34.0, 18.0, 12.0, 11.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.3006591796875, -8.031005859375, -7.7613525390625, -7.49169921875, -7.2220458984375, -6.952392578125, -6.6827392578125, -6.4130859375, -6.1434326171875, -5.873779296875, -5.6041259765625, -5.33447265625, -5.0648193359375, -4.795166015625, -4.5255126953125, -4.255859375, -3.9862060546875, -3.716552734375, -3.4468994140625, -3.17724609375, -2.9075927734375, -2.637939453125, -2.3682861328125, -2.0986328125, -1.8289794921875, -1.559326171875, -1.2896728515625, -1.02001953125, -0.7503662109375, -0.480712890625, -0.2110595703125, 0.05859375, 0.3282470703125, 0.597900390625, 0.8675537109375, 1.13720703125, 1.4068603515625, 1.676513671875, 1.9461669921875, 2.2158203125, 2.4854736328125, 2.755126953125, 3.0247802734375, 3.29443359375, 3.5640869140625, 3.833740234375, 4.1033935546875, 4.373046875, 4.6427001953125, 4.912353515625, 5.1820068359375, 5.45166015625, 5.7213134765625, 5.990966796875, 6.2606201171875, 6.5302734375, 6.7999267578125, 7.069580078125, 7.3392333984375, 7.60888671875, 7.8785400390625, 8.148193359375, 8.4178466796875, 8.6875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 12.0, 5.0, 10.0, 19.0, 9.0, 18.0, 23.0, 21.0, 34.0, 38.0, 34.0, 31.0, 26.0, 43.0, 37.0, 50.0, 55.0, 44.0, 45.0, 36.0, 42.0, 46.0, 37.0, 32.0, 38.0, 35.0, 32.0, 18.0, 23.0, 17.0, 14.0, 10.0, 9.0, 8.0, 8.0, 6.0, 11.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.599609375, -3.4892578125, -3.37890625, -3.2685546875, -3.158203125, -3.0478515625, -2.9375, -2.8271484375, -2.716796875, -2.6064453125, -2.49609375, -2.3857421875, -2.275390625, -2.1650390625, -2.0546875, -1.9443359375, -1.833984375, -1.7236328125, -1.61328125, -1.5029296875, -1.392578125, -1.2822265625, -1.171875, -1.0615234375, -0.951171875, -0.8408203125, -0.73046875, -0.6201171875, -0.509765625, -0.3994140625, -0.2890625, -0.1787109375, -0.068359375, 0.0419921875, 0.15234375, 0.2626953125, 0.373046875, 0.4833984375, 0.59375, 0.7041015625, 0.814453125, 0.9248046875, 1.03515625, 1.1455078125, 1.255859375, 1.3662109375, 1.4765625, 1.5869140625, 1.697265625, 1.8076171875, 1.91796875, 2.0283203125, 2.138671875, 2.2490234375, 2.359375, 2.4697265625, 2.580078125, 2.6904296875, 2.80078125, 2.9111328125, 3.021484375, 3.1318359375, 3.2421875, 3.3525390625, 3.462890625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 12.0, 23.0, 26.0, 28.0, 54.0, 95.0, 126.0, 223.0, 392.0, 702.0, 1212.0, 2310.0, 4645.0, 9439.0, 20666.0, 47499.0, 118977.0, 331640.0, 959137.0, 1546169.0, 734860.0, 252007.0, 93027.0, 38010.0, 16767.0, 7855.0, 3824.0, 1984.0, 1063.0, 586.0, 359.0, 229.0, 115.0, 76.0, 45.0, 30.0, 20.0, 10.0, 10.0, 9.0, 2.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.59375, -10.2855224609375, -9.977294921875, -9.6690673828125, -9.36083984375, -9.0526123046875, -8.744384765625, -8.4361572265625, -8.1279296875, -7.8197021484375, -7.511474609375, -7.2032470703125, -6.89501953125, -6.5867919921875, -6.278564453125, -5.9703369140625, -5.662109375, -5.3538818359375, -5.045654296875, -4.7374267578125, -4.42919921875, -4.1209716796875, -3.812744140625, -3.5045166015625, -3.1962890625, -2.8880615234375, -2.579833984375, -2.2716064453125, -1.96337890625, -1.6551513671875, -1.346923828125, -1.0386962890625, -0.73046875, -0.4222412109375, -0.114013671875, 0.1942138671875, 0.50244140625, 0.8106689453125, 1.118896484375, 1.4271240234375, 1.7353515625, 2.0435791015625, 2.351806640625, 2.6600341796875, 2.96826171875, 3.2764892578125, 3.584716796875, 3.8929443359375, 4.201171875, 4.5093994140625, 4.817626953125, 5.1258544921875, 5.43408203125, 5.7423095703125, 6.050537109375, 6.3587646484375, 6.6669921875, 6.9752197265625, 7.283447265625, 7.5916748046875, 7.89990234375, 8.2081298828125, 8.516357421875, 8.8245849609375, 9.1328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 6.0, 9.0, 10.0, 10.0, 10.0, 19.0, 28.0, 26.0, 45.0, 57.0, 65.0, 83.0, 97.0, 118.0, 155.0, 194.0, 253.0, 295.0, 327.0, 337.0, 333.0, 296.0, 269.0, 226.0, 164.0, 137.0, 118.0, 79.0, 72.0, 63.0, 43.0, 29.0, 25.0, 21.0, 16.0, 10.0, 10.0, 6.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.03125, -1.962677001953125, -1.89410400390625, -1.825531005859375, -1.7569580078125, -1.688385009765625, -1.61981201171875, -1.551239013671875, -1.482666015625, -1.414093017578125, -1.34552001953125, -1.276947021484375, -1.2083740234375, -1.139801025390625, -1.07122802734375, -1.002655029296875, -0.93408203125, -0.865509033203125, -0.79693603515625, -0.728363037109375, -0.6597900390625, -0.591217041015625, -0.52264404296875, -0.454071044921875, -0.385498046875, -0.316925048828125, -0.24835205078125, -0.179779052734375, -0.1112060546875, -0.042633056640625, 0.02593994140625, 0.094512939453125, 0.1630859375, 0.231658935546875, 0.30023193359375, 0.368804931640625, 0.4373779296875, 0.505950927734375, 0.57452392578125, 0.643096923828125, 0.711669921875, 0.780242919921875, 0.84881591796875, 0.917388916015625, 0.9859619140625, 1.054534912109375, 1.12310791015625, 1.191680908203125, 1.26025390625, 1.328826904296875, 1.39739990234375, 1.465972900390625, 1.5345458984375, 1.603118896484375, 1.67169189453125, 1.740264892578125, 1.808837890625, 1.877410888671875, 1.94598388671875, 2.014556884765625, 2.0831298828125, 2.151702880859375, 2.22027587890625, 2.288848876953125, 2.357421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 10.0, 12.0, 8.0, 20.0, 17.0, 18.0, 37.0, 29.0, 54.0, 42.0, 49.0, 55.0, 59.0, 64.0, 71.0, 74.0, 56.0, 53.0, 50.0, 43.0, 35.0, 24.0, 15.0, 19.0, 13.0, 13.0, 10.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.342803001403809, -8.111039161682129, -7.879275321960449, -7.6475114822387695, -7.415748119354248, -7.183984279632568, -6.952220439910889, -6.720456600189209, -6.488692760467529, -6.25692892074585, -6.02516508102417, -5.793401718139648, -5.561637878417969, -5.329874038696289, -5.098110198974609, -4.86634635925293, -4.63458251953125, -4.40281867980957, -4.171054840087891, -3.93929123878479, -3.7075273990631104, -3.4757637977600098, -3.24399995803833, -3.0122361183166504, -2.780472755432129, -2.548708915710449, -2.3169453144073486, -2.085181474685669, -1.8534176349639893, -1.6216539144515991, -1.389890193939209, -1.1581263542175293, -0.9263625144958496, -0.6945987343788147, -0.4628349840641022, -0.23107123374938965, 0.0006925463676452637, 0.23245632648468018, 0.4642200469970703, 0.69598388671875, 0.9277476072311401, 1.1595113277435303, 1.39127516746521, 1.6230388879776, 1.8548026084899902, 2.08656644821167, 2.3183302879333496, 2.5500941276550293, 2.78185772895813, 3.0136215686798096, 3.24538516998291, 3.47714900970459, 3.7089128494262695, 3.940676689147949, 4.172440528869629, 4.404204368591309, 4.63596773147583, 4.86773157119751, 5.0994954109191895, 5.331258773803711, 5.563022613525391, 5.79478645324707, 6.02655029296875, 6.25831413269043, 6.490077972412109]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 10.0, 5.0, 11.0, 11.0, 17.0, 19.0, 15.0, 17.0, 23.0, 18.0, 17.0, 28.0, 38.0, 26.0, 35.0, 36.0, 29.0, 29.0, 42.0, 32.0, 45.0, 39.0, 40.0, 35.0, 40.0, 28.0, 39.0, 37.0, 24.0, 23.0, 17.0, 20.0, 26.0, 16.0, 14.0, 12.0, 8.0, 7.0, 14.0, 8.0, 8.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.578434467315674, -3.460970163345337, -3.343505859375, -3.226041555404663, -3.108577251434326, -2.9911129474639893, -2.8736486434936523, -2.7561841011047363, -2.6387200355529785, -2.5212557315826416, -2.4037914276123047, -2.2863271236419678, -2.168862819671631, -2.051398515701294, -1.9339340925216675, -1.8164697885513306, -1.699005365371704, -1.5815410614013672, -1.4640767574310303, -1.3466124534606934, -1.2291481494903564, -1.1116838455200195, -0.9942194223403931, -0.8767551183700562, -0.7592908143997192, -0.6418265104293823, -0.5243622064590454, -0.4068978428840637, -0.2894335389137268, -0.1719692349433899, -0.0545048713684082, 0.06295943260192871, 0.18042397499084473, 0.29788827896118164, 0.41535261273384094, 0.5328169465065002, 0.6502812504768372, 0.7677455544471741, 0.8852099180221558, 1.0026742219924927, 1.1201385259628296, 1.2376028299331665, 1.3550671339035034, 1.4725315570831299, 1.5899958610534668, 1.7074601650238037, 1.8249244689941406, 1.9423887729644775, 2.0598530769348145, 2.1773173809051514, 2.2947816848754883, 2.412245988845825, 2.529710292816162, 2.647174596786499, 2.764638900756836, 2.882103443145752, 2.9995675086975098, 3.1170318126678467, 3.2344961166381836, 3.3519604206085205, 3.4694247245788574, 3.5868890285491943, 3.7043533325195312, 3.8218178749084473, 3.939282178878784]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 10.0, 9.0, 10.0, 21.0, 36.0, 55.0, 63.0, 113.0, 166.0, 250.0, 388.0, 550.0, 779.0, 1291.0, 2181.0, 3958.0, 7851.0, 17993.0, 46803.0, 132439.0, 316747.0, 309460.0, 127531.0, 45139.0, 17178.0, 7766.0, 3780.0, 2220.0, 1293.0, 780.0, 566.0, 360.0, 280.0, 175.0, 110.0, 66.0, 47.0, 39.0, 16.0, 11.0, 9.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.83984375, -7.609130859375, -7.37841796875, -7.147705078125, -6.9169921875, -6.686279296875, -6.45556640625, -6.224853515625, -5.994140625, -5.763427734375, -5.53271484375, -5.302001953125, -5.0712890625, -4.840576171875, -4.60986328125, -4.379150390625, -4.1484375, -3.917724609375, -3.68701171875, -3.456298828125, -3.2255859375, -2.994873046875, -2.76416015625, -2.533447265625, -2.302734375, -2.072021484375, -1.84130859375, -1.610595703125, -1.3798828125, -1.149169921875, -0.91845703125, -0.687744140625, -0.45703125, -0.226318359375, 0.00439453125, 0.235107421875, 0.4658203125, 0.696533203125, 0.92724609375, 1.157958984375, 1.388671875, 1.619384765625, 1.85009765625, 2.080810546875, 2.3115234375, 2.542236328125, 2.77294921875, 3.003662109375, 3.234375, 3.465087890625, 3.69580078125, 3.926513671875, 4.1572265625, 4.387939453125, 4.61865234375, 4.849365234375, 5.080078125, 5.310791015625, 5.54150390625, 5.772216796875, 6.0029296875, 6.233642578125, 6.46435546875, 6.695068359375, 6.92578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 9.0, 7.0, 15.0, 9.0, 10.0, 15.0, 18.0, 25.0, 16.0, 25.0, 20.0, 26.0, 31.0, 33.0, 41.0, 45.0, 45.0, 49.0, 46.0, 39.0, 43.0, 49.0, 39.0, 27.0, 39.0, 31.0, 35.0, 30.0, 35.0, 25.0, 17.0, 13.0, 14.0, 13.0, 6.0, 12.0, 11.0, 5.0, 7.0, 7.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.48828125, -4.345703125, -4.203125, -4.060546875, -3.91796875, -3.775390625, -3.6328125, -3.490234375, -3.34765625, -3.205078125, -3.0625, -2.919921875, -2.77734375, -2.634765625, -2.4921875, -2.349609375, -2.20703125, -2.064453125, -1.921875, -1.779296875, -1.63671875, -1.494140625, -1.3515625, -1.208984375, -1.06640625, -0.923828125, -0.78125, -0.638671875, -0.49609375, -0.353515625, -0.2109375, -0.068359375, 0.07421875, 0.216796875, 0.359375, 0.501953125, 0.64453125, 0.787109375, 0.9296875, 1.072265625, 1.21484375, 1.357421875, 1.5, 1.642578125, 1.78515625, 1.927734375, 2.0703125, 2.212890625, 2.35546875, 2.498046875, 2.640625, 2.783203125, 2.92578125, 3.068359375, 3.2109375, 3.353515625, 3.49609375, 3.638671875, 3.78125, 3.923828125, 4.06640625, 4.208984375, 4.3515625, 4.494140625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 15.0, 15.0, 21.0, 22.0, 41.0, 41.0, 65.0, 92.0, 129.0, 210.0, 282.0, 495.0, 825.0, 1398.0, 2826.0, 6695.0, 20826.0, 91770.0, 436171.0, 380208.0, 76389.0, 17874.0, 5985.0, 2638.0, 1378.0, 781.0, 444.0, 279.0, 177.0, 117.0, 97.0, 63.0, 58.0, 22.0, 32.0, 15.0, 9.0, 11.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6328125, -13.24267578125, -12.8525390625, -12.46240234375, -12.072265625, -11.68212890625, -11.2919921875, -10.90185546875, -10.51171875, -10.12158203125, -9.7314453125, -9.34130859375, -8.951171875, -8.56103515625, -8.1708984375, -7.78076171875, -7.390625, -7.00048828125, -6.6103515625, -6.22021484375, -5.830078125, -5.43994140625, -5.0498046875, -4.65966796875, -4.26953125, -3.87939453125, -3.4892578125, -3.09912109375, -2.708984375, -2.31884765625, -1.9287109375, -1.53857421875, -1.1484375, -0.75830078125, -0.3681640625, 0.02197265625, 0.412109375, 0.80224609375, 1.1923828125, 1.58251953125, 1.97265625, 2.36279296875, 2.7529296875, 3.14306640625, 3.533203125, 3.92333984375, 4.3134765625, 4.70361328125, 5.09375, 5.48388671875, 5.8740234375, 6.26416015625, 6.654296875, 7.04443359375, 7.4345703125, 7.82470703125, 8.21484375, 8.60498046875, 8.9951171875, 9.38525390625, 9.775390625, 10.16552734375, 10.5556640625, 10.94580078125, 11.3359375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 11.0, 10.0, 14.0, 10.0, 23.0, 33.0, 22.0, 34.0, 36.0, 32.0, 45.0, 50.0, 40.0, 63.0, 43.0, 47.0, 46.0, 40.0, 49.0, 41.0, 37.0, 44.0, 39.0, 40.0, 22.0, 24.0, 16.0, 13.0, 21.0, 11.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.623046875, -3.518707275390625, -3.41436767578125, -3.310028076171875, -3.2056884765625, -3.101348876953125, -2.99700927734375, -2.892669677734375, -2.788330078125, -2.683990478515625, -2.57965087890625, -2.475311279296875, -2.3709716796875, -2.266632080078125, -2.16229248046875, -2.057952880859375, -1.95361328125, -1.849273681640625, -1.74493408203125, -1.640594482421875, -1.5362548828125, -1.431915283203125, -1.32757568359375, -1.223236083984375, -1.118896484375, -1.014556884765625, -0.91021728515625, -0.805877685546875, -0.7015380859375, -0.597198486328125, -0.49285888671875, -0.388519287109375, -0.2841796875, -0.179840087890625, -0.07550048828125, 0.028839111328125, 0.1331787109375, 0.237518310546875, 0.34185791015625, 0.446197509765625, 0.550537109375, 0.654876708984375, 0.75921630859375, 0.863555908203125, 0.9678955078125, 1.072235107421875, 1.17657470703125, 1.280914306640625, 1.38525390625, 1.489593505859375, 1.59393310546875, 1.698272705078125, 1.8026123046875, 1.906951904296875, 2.01129150390625, 2.115631103515625, 2.219970703125, 2.324310302734375, 2.42864990234375, 2.532989501953125, 2.6373291015625, 2.741668701171875, 2.84600830078125, 2.950347900390625, 3.0546875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 12.0, 26.0, 34.0, 34.0, 53.0, 66.0, 96.0, 126.0, 187.0, 312.0, 444.0, 680.0, 1168.0, 2129.0, 4057.0, 9225.0, 24669.0, 79881.0, 297960.0, 431619.0, 132823.0, 37923.0, 13080.0, 5456.0, 2644.0, 1413.0, 821.0, 493.0, 311.0, 226.0, 140.0, 111.0, 85.0, 70.0, 42.0, 38.0, 26.0, 17.0, 14.0, 4.0, 3.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.91015625, -4.75762939453125, -4.6051025390625, -4.45257568359375, -4.300048828125, -4.14752197265625, -3.9949951171875, -3.84246826171875, -3.68994140625, -3.53741455078125, -3.3848876953125, -3.23236083984375, -3.079833984375, -2.92730712890625, -2.7747802734375, -2.62225341796875, -2.4697265625, -2.31719970703125, -2.1646728515625, -2.01214599609375, -1.859619140625, -1.70709228515625, -1.5545654296875, -1.40203857421875, -1.24951171875, -1.09698486328125, -0.9444580078125, -0.79193115234375, -0.639404296875, -0.48687744140625, -0.3343505859375, -0.18182373046875, -0.029296875, 0.12322998046875, 0.2757568359375, 0.42828369140625, 0.580810546875, 0.73333740234375, 0.8858642578125, 1.03839111328125, 1.19091796875, 1.34344482421875, 1.4959716796875, 1.64849853515625, 1.801025390625, 1.95355224609375, 2.1060791015625, 2.25860595703125, 2.4111328125, 2.56365966796875, 2.7161865234375, 2.86871337890625, 3.021240234375, 3.17376708984375, 3.3262939453125, 3.47882080078125, 3.63134765625, 3.78387451171875, 3.9364013671875, 4.08892822265625, 4.241455078125, 4.39398193359375, 4.5465087890625, 4.69903564453125, 4.8515625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 22.0, 23.0, 38.0, 76.0, 91.0, 128.0, 143.0, 129.0, 110.0, 69.0, 45.0, 35.0, 24.0, 13.0, 12.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002982616424560547, -0.0002888627350330353, -0.00027946382761001587, -0.00027006492018699646, -0.00026066601276397705, -0.00025126710534095764, -0.00024186819791793823, -0.00023246929049491882, -0.00022307038307189941, -0.00021367147564888, -0.0002042725682258606, -0.0001948736608028412, -0.00018547475337982178, -0.00017607584595680237, -0.00016667693853378296, -0.00015727803111076355, -0.00014787912368774414, -0.00013848021626472473, -0.00012908130884170532, -0.00011968240141868591, -0.0001102834939956665, -0.0001008845865726471, -9.148567914962769e-05, -8.208677172660828e-05, -7.268786430358887e-05, -6.328895688056946e-05, -5.389004945755005e-05, -4.449114203453064e-05, -3.509223461151123e-05, -2.569332718849182e-05, -1.6294419765472412e-05, -6.895512342453003e-06, 2.5033950805664062e-06, 1.1902302503585815e-05, 2.1301209926605225e-05, 3.0700117349624634e-05, 4.009902477264404e-05, 4.949793219566345e-05, 5.889683961868286e-05, 6.829574704170227e-05, 7.769465446472168e-05, 8.709356188774109e-05, 9.64924693107605e-05, 0.00010589137673377991, 0.00011529028415679932, 0.00012468919157981873, 0.00013408809900283813, 0.00014348700642585754, 0.00015288591384887695, 0.00016228482127189636, 0.00017168372869491577, 0.00018108263611793518, 0.0001904815435409546, 0.000199880450963974, 0.0002092793583869934, 0.00021867826581001282, 0.00022807717323303223, 0.00023747608065605164, 0.00024687498807907104, 0.00025627389550209045, 0.00026567280292510986, 0.00027507171034812927, 0.0002844706177711487, 0.0002938695251941681, 0.0003032684326171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 18.0, 17.0, 26.0, 39.0, 59.0, 74.0, 120.0, 159.0, 253.0, 320.0, 490.0, 709.0, 901.0, 1371.0, 2056.0, 3183.0, 5742.0, 13686.0, 41265.0, 143240.0, 377627.0, 306688.0, 97728.0, 28923.0, 10412.0, 4776.0, 2793.0, 1788.0, 1173.0, 831.0, 576.0, 448.0, 310.0, 218.0, 155.0, 107.0, 74.0, 51.0, 39.0, 33.0, 13.0, 12.0, 8.0, 6.0, 6.0, 7.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.234375, -4.10546875, -3.9765625, -3.84765625, -3.71875, -3.58984375, -3.4609375, -3.33203125, -3.203125, -3.07421875, -2.9453125, -2.81640625, -2.6875, -2.55859375, -2.4296875, -2.30078125, -2.171875, -2.04296875, -1.9140625, -1.78515625, -1.65625, -1.52734375, -1.3984375, -1.26953125, -1.140625, -1.01171875, -0.8828125, -0.75390625, -0.625, -0.49609375, -0.3671875, -0.23828125, -0.109375, 0.01953125, 0.1484375, 0.27734375, 0.40625, 0.53515625, 0.6640625, 0.79296875, 0.921875, 1.05078125, 1.1796875, 1.30859375, 1.4375, 1.56640625, 1.6953125, 1.82421875, 1.953125, 2.08203125, 2.2109375, 2.33984375, 2.46875, 2.59765625, 2.7265625, 2.85546875, 2.984375, 3.11328125, 3.2421875, 3.37109375, 3.5, 3.62890625, 3.7578125, 3.88671875, 4.015625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 12.0, 3.0, 11.0, 40.0, 79.0, 107.0, 163.0, 164.0, 153.0, 100.0, 73.0, 48.0, 20.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5341796875, -1.483734130859375, -1.43328857421875, -1.382843017578125, -1.3323974609375, -1.281951904296875, -1.23150634765625, -1.181060791015625, -1.130615234375, -1.080169677734375, -1.02972412109375, -0.979278564453125, -0.9288330078125, -0.878387451171875, -0.82794189453125, -0.777496337890625, -0.72705078125, -0.676605224609375, -0.62615966796875, -0.575714111328125, -0.5252685546875, -0.474822998046875, -0.42437744140625, -0.373931884765625, -0.323486328125, -0.273040771484375, -0.22259521484375, -0.172149658203125, -0.1217041015625, -0.071258544921875, -0.02081298828125, 0.029632568359375, 0.080078125, 0.130523681640625, 0.18096923828125, 0.231414794921875, 0.2818603515625, 0.332305908203125, 0.38275146484375, 0.433197021484375, 0.483642578125, 0.534088134765625, 0.58453369140625, 0.634979248046875, 0.6854248046875, 0.735870361328125, 0.78631591796875, 0.836761474609375, 0.88720703125, 0.937652587890625, 0.98809814453125, 1.038543701171875, 1.0889892578125, 1.139434814453125, 1.18988037109375, 1.240325927734375, 1.290771484375, 1.341217041015625, 1.39166259765625, 1.442108154296875, 1.4925537109375, 1.542999267578125, 1.59344482421875, 1.643890380859375, 1.6943359375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 8.0, 2.0, 8.0, 5.0, 13.0, 14.0, 14.0, 24.0, 23.0, 33.0, 38.0, 43.0, 43.0, 48.0, 56.0, 66.0, 65.0, 71.0, 65.0, 59.0, 62.0, 38.0, 41.0, 35.0, 20.0, 20.0, 13.0, 11.0, 13.0, 15.0, 3.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.847781181335449, -7.621734619140625, -7.395688056945801, -7.169641017913818, -6.943594455718994, -6.71754789352417, -6.4915008544921875, -6.265454292297363, -6.039407730102539, -5.813361167907715, -5.587314605712891, -5.361267566680908, -5.135221004486084, -4.90917444229126, -4.683127403259277, -4.457080841064453, -4.231034278869629, -4.004987716674805, -3.7789409160614014, -3.552894115447998, -3.326847553253174, -3.1008009910583496, -2.8747541904449463, -2.648707389831543, -2.4226608276367188, -2.1966142654418945, -1.9705674648284912, -1.7445207834243774, -1.5184741020202637, -1.29242742061615, -1.0663807392120361, -0.8403340578079224, -0.6142868995666504, -0.3882402181625366, -0.16219353675842285, 0.06385314464569092, 0.2898998260498047, 0.5159465074539185, 0.7419931888580322, 0.968039870262146, 1.1940865516662598, 1.4201332330703735, 1.6461799144744873, 1.872226595878601, 2.098273277282715, 2.324319839477539, 2.5503666400909424, 2.7764134407043457, 3.00246000289917, 3.228506565093994, 3.4545533657073975, 3.680600166320801, 3.906646728515625, 4.132693290710449, 4.358739852905273, 4.584786891937256, 4.81083345413208, 5.036880016326904, 5.262927055358887, 5.488973617553711, 5.715020179748535, 5.941066741943359, 6.167113304138184, 6.393160343170166, 6.61920690536499]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 9.0, 9.0, 16.0, 14.0, 27.0, 24.0, 12.0, 28.0, 21.0, 31.0, 24.0, 41.0, 38.0, 35.0, 28.0, 35.0, 41.0, 37.0, 43.0, 37.0, 49.0, 36.0, 34.0, 37.0, 35.0, 28.0, 19.0, 21.0, 26.0, 19.0, 18.0, 14.0, 8.0, 8.0, 16.0, 13.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.6926181316375732, -3.572848081588745, -3.453077793121338, -3.3333077430725098, -3.2135376930236816, -3.0937674045562744, -2.9739973545074463, -2.854227066040039, -2.734457015991211, -2.614686965942383, -2.4949166774749756, -2.3751466274261475, -2.2553763389587402, -2.135606288909912, -2.015836238861084, -1.8960660696029663, -1.7762959003448486, -1.656525731086731, -1.5367555618286133, -1.4169855117797852, -1.2972153425216675, -1.1774451732635498, -1.0576751232147217, -0.937904953956604, -0.8181347846984863, -0.6983646154403687, -0.5785945057868958, -0.45882436633110046, -0.3390542268753052, -0.2192840576171875, -0.0995139479637146, 0.0202561616897583, 0.14002633094787598, 0.25979647040367126, 0.37956660985946655, 0.49933674931526184, 0.6191068887710571, 0.7388770580291748, 0.8586471676826477, 0.9784172773361206, 1.0981874465942383, 1.217957615852356, 1.3377277851104736, 1.4574978351593018, 1.5772680044174194, 1.697038173675537, 1.8168082237243652, 1.936578392982483, 2.0563485622406006, 2.1761186122894287, 2.295888900756836, 2.415658950805664, 2.535429000854492, 2.6551992893218994, 2.7749693393707275, 2.8947396278381348, 3.014509677886963, 3.134279727935791, 3.2540500164031982, 3.3738200664520264, 3.4935903549194336, 3.6133604049682617, 3.73313045501709, 3.852900505065918, 3.972670793533325]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 22.0, 18.0, 24.0, 49.0, 67.0, 108.0, 199.0, 348.0, 595.0, 1084.0, 2030.0, 3974.0, 8197.0, 16959.0, 37287.0, 84823.0, 176687.0, 267605.0, 227071.0, 120141.0, 54072.0, 23883.0, 11425.0, 5512.0, 2812.0, 1532.0, 812.0, 497.0, 263.0, 155.0, 75.0, 66.0, 59.0, 24.0, 24.0, 17.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.1175537109375, -7.844482421875, -7.5714111328125, -7.29833984375, -7.0252685546875, -6.752197265625, -6.4791259765625, -6.2060546875, -5.9329833984375, -5.659912109375, -5.3868408203125, -5.11376953125, -4.8406982421875, -4.567626953125, -4.2945556640625, -4.021484375, -3.7484130859375, -3.475341796875, -3.2022705078125, -2.92919921875, -2.6561279296875, -2.383056640625, -2.1099853515625, -1.8369140625, -1.5638427734375, -1.290771484375, -1.0177001953125, -0.74462890625, -0.4715576171875, -0.198486328125, 0.0745849609375, 0.34765625, 0.6207275390625, 0.893798828125, 1.1668701171875, 1.43994140625, 1.7130126953125, 1.986083984375, 2.2591552734375, 2.5322265625, 2.8052978515625, 3.078369140625, 3.3514404296875, 3.62451171875, 3.8975830078125, 4.170654296875, 4.4437255859375, 4.716796875, 4.9898681640625, 5.262939453125, 5.5360107421875, 5.80908203125, 6.0821533203125, 6.355224609375, 6.6282958984375, 6.9013671875, 7.1744384765625, 7.447509765625, 7.7205810546875, 7.99365234375, 8.2667236328125, 8.539794921875, 8.8128662109375, 9.0859375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 3.0, 11.0, 12.0, 10.0, 11.0, 14.0, 23.0, 30.0, 27.0, 18.0, 22.0, 35.0, 34.0, 34.0, 37.0, 25.0, 54.0, 36.0, 39.0, 41.0, 41.0, 47.0, 34.0, 36.0, 44.0, 38.0, 31.0, 29.0, 27.0, 21.0, 18.0, 15.0, 21.0, 20.0, 10.0, 5.0, 6.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.43212890625, -4.2900390625, -4.14794921875, -4.005859375, -3.86376953125, -3.7216796875, -3.57958984375, -3.4375, -3.29541015625, -3.1533203125, -3.01123046875, -2.869140625, -2.72705078125, -2.5849609375, -2.44287109375, -2.30078125, -2.15869140625, -2.0166015625, -1.87451171875, -1.732421875, -1.59033203125, -1.4482421875, -1.30615234375, -1.1640625, -1.02197265625, -0.8798828125, -0.73779296875, -0.595703125, -0.45361328125, -0.3115234375, -0.16943359375, -0.02734375, 0.11474609375, 0.2568359375, 0.39892578125, 0.541015625, 0.68310546875, 0.8251953125, 0.96728515625, 1.109375, 1.25146484375, 1.3935546875, 1.53564453125, 1.677734375, 1.81982421875, 1.9619140625, 2.10400390625, 2.24609375, 2.38818359375, 2.5302734375, 2.67236328125, 2.814453125, 2.95654296875, 3.0986328125, 3.24072265625, 3.3828125, 3.52490234375, 3.6669921875, 3.80908203125, 3.951171875, 4.09326171875, 4.2353515625, 4.37744140625, 4.51953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 17.0, 11.0, 26.0, 33.0, 47.0, 76.0, 116.0, 172.0, 257.0, 357.0, 553.0, 800.0, 1193.0, 1898.0, 2887.0, 4443.0, 7007.0, 11174.0, 18142.0, 29103.0, 46486.0, 72115.0, 106570.0, 141297.0, 158299.0, 141930.0, 106388.0, 72593.0, 46229.0, 29140.0, 18062.0, 11105.0, 7290.0, 4474.0, 2794.0, 1774.0, 1220.0, 818.0, 544.0, 367.0, 228.0, 161.0, 114.0, 81.0, 68.0, 32.0, 19.0, 22.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0], "bins": [-5.578125, -5.41644287109375, -5.2547607421875, -5.09307861328125, -4.931396484375, -4.76971435546875, -4.6080322265625, -4.44635009765625, -4.28466796875, -4.12298583984375, -3.9613037109375, -3.79962158203125, -3.637939453125, -3.47625732421875, -3.3145751953125, -3.15289306640625, -2.9912109375, -2.82952880859375, -2.6678466796875, -2.50616455078125, -2.344482421875, -2.18280029296875, -2.0211181640625, -1.85943603515625, -1.69775390625, -1.53607177734375, -1.3743896484375, -1.21270751953125, -1.051025390625, -0.88934326171875, -0.7276611328125, -0.56597900390625, -0.404296875, -0.24261474609375, -0.0809326171875, 0.08074951171875, 0.242431640625, 0.40411376953125, 0.5657958984375, 0.72747802734375, 0.88916015625, 1.05084228515625, 1.2125244140625, 1.37420654296875, 1.535888671875, 1.69757080078125, 1.8592529296875, 2.02093505859375, 2.1826171875, 2.34429931640625, 2.5059814453125, 2.66766357421875, 2.829345703125, 2.99102783203125, 3.1527099609375, 3.31439208984375, 3.47607421875, 3.63775634765625, 3.7994384765625, 3.96112060546875, 4.122802734375, 4.28448486328125, 4.4461669921875, 4.60784912109375, 4.76953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 11.0, 4.0, 11.0, 11.0, 19.0, 20.0, 20.0, 26.0, 18.0, 32.0, 34.0, 33.0, 30.0, 35.0, 32.0, 43.0, 39.0, 50.0, 46.0, 48.0, 42.0, 38.0, 37.0, 48.0, 33.0, 29.0, 38.0, 40.0, 18.0, 17.0, 18.0, 15.0, 14.0, 13.0, 15.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.275390625, -3.18011474609375, -3.0848388671875, -2.98956298828125, -2.894287109375, -2.79901123046875, -2.7037353515625, -2.60845947265625, -2.51318359375, -2.41790771484375, -2.3226318359375, -2.22735595703125, -2.132080078125, -2.03680419921875, -1.9415283203125, -1.84625244140625, -1.7509765625, -1.65570068359375, -1.5604248046875, -1.46514892578125, -1.369873046875, -1.27459716796875, -1.1793212890625, -1.08404541015625, -0.98876953125, -0.89349365234375, -0.7982177734375, -0.70294189453125, -0.607666015625, -0.51239013671875, -0.4171142578125, -0.32183837890625, -0.2265625, -0.13128662109375, -0.0360107421875, 0.05926513671875, 0.154541015625, 0.24981689453125, 0.3450927734375, 0.44036865234375, 0.53564453125, 0.63092041015625, 0.7261962890625, 0.82147216796875, 0.916748046875, 1.01202392578125, 1.1072998046875, 1.20257568359375, 1.2978515625, 1.39312744140625, 1.4884033203125, 1.58367919921875, 1.678955078125, 1.77423095703125, 1.8695068359375, 1.96478271484375, 2.06005859375, 2.15533447265625, 2.2506103515625, 2.34588623046875, 2.441162109375, 2.53643798828125, 2.6317138671875, 2.72698974609375, 2.822265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 11.0, 8.0, 8.0, 17.0, 18.0, 24.0, 42.0, 50.0, 73.0, 139.0, 184.0, 248.0, 339.0, 475.0, 773.0, 1081.0, 1645.0, 2582.0, 4085.0, 7062.0, 13398.0, 27502.0, 64829.0, 174434.0, 339687.0, 240116.0, 93075.0, 36729.0, 17014.0, 8741.0, 5128.0, 3079.0, 1955.0, 1231.0, 810.0, 624.0, 413.0, 251.0, 189.0, 152.0, 99.0, 60.0, 38.0, 40.0, 31.0, 17.0, 17.0, 12.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2421875, -5.081787109375, -4.92138671875, -4.760986328125, -4.6005859375, -4.440185546875, -4.27978515625, -4.119384765625, -3.958984375, -3.798583984375, -3.63818359375, -3.477783203125, -3.3173828125, -3.156982421875, -2.99658203125, -2.836181640625, -2.67578125, -2.515380859375, -2.35498046875, -2.194580078125, -2.0341796875, -1.873779296875, -1.71337890625, -1.552978515625, -1.392578125, -1.232177734375, -1.07177734375, -0.911376953125, -0.7509765625, -0.590576171875, -0.43017578125, -0.269775390625, -0.109375, 0.051025390625, 0.21142578125, 0.371826171875, 0.5322265625, 0.692626953125, 0.85302734375, 1.013427734375, 1.173828125, 1.334228515625, 1.49462890625, 1.655029296875, 1.8154296875, 1.975830078125, 2.13623046875, 2.296630859375, 2.45703125, 2.617431640625, 2.77783203125, 2.938232421875, 3.0986328125, 3.259033203125, 3.41943359375, 3.579833984375, 3.740234375, 3.900634765625, 4.06103515625, 4.221435546875, 4.3818359375, 4.542236328125, 4.70263671875, 4.863037109375, 5.0234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 4.0, 16.0, 10.0, 23.0, 29.0, 46.0, 61.0, 97.0, 120.0, 156.0, 139.0, 89.0, 70.0, 50.0, 29.0, 11.0, 10.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008454322814941406, -0.0008250437676906586, -0.0008046552538871765, -0.0007842667400836945, -0.0007638782262802124, -0.0007434897124767303, -0.0007231011986732483, -0.0007027126848697662, -0.0006823241710662842, -0.0006619356572628021, -0.0006415471434593201, -0.000621158629655838, -0.000600770115852356, -0.0005803816020488739, -0.0005599930882453918, -0.0005396045744419098, -0.0005192160606384277, -0.0004988275468349457, -0.0004784390330314636, -0.00045805051922798157, -0.0004376620054244995, -0.00041727349162101746, -0.0003968849778175354, -0.00037649646401405334, -0.0003561079502105713, -0.00033571943640708923, -0.0003153309226036072, -0.0002949424088001251, -0.00027455389499664307, -0.000254165381193161, -0.00023377686738967896, -0.0002133883535861969, -0.00019299983978271484, -0.0001726113259792328, -0.00015222281217575073, -0.00013183429837226868, -0.00011144578456878662, -9.105727076530457e-05, -7.066875696182251e-05, -5.0280243158340454e-05, -2.98917293548584e-05, -9.503215551376343e-06, 1.0885298252105713e-05, 3.127381205558777e-05, 5.1662325859069824e-05, 7.205083966255188e-05, 9.243935346603394e-05, 0.00011282786726951599, 0.00013321638107299805, 0.0001536048948764801, 0.00017399340867996216, 0.00019438192248344421, 0.00021477043628692627, 0.00023515895009040833, 0.0002555474638938904, 0.00027593597769737244, 0.0002963244915008545, 0.00031671300530433655, 0.0003371015191078186, 0.00035749003291130066, 0.0003778785467147827, 0.00039826706051826477, 0.0004186555743217468, 0.0004390440881252289, 0.00045943260192871094]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 10.0, 10.0, 13.0, 28.0, 29.0, 45.0, 76.0, 96.0, 174.0, 263.0, 394.0, 624.0, 887.0, 1439.0, 2201.0, 3497.0, 5693.0, 9670.0, 17202.0, 32204.0, 65876.0, 137498.0, 238489.0, 243914.0, 142511.0, 68248.0, 33824.0, 17706.0, 9891.0, 5894.0, 3687.0, 2313.0, 1468.0, 967.0, 620.0, 367.0, 235.0, 161.0, 132.0, 69.0, 47.0, 28.0, 25.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.40234375, -3.296112060546875, -3.18988037109375, -3.083648681640625, -2.9774169921875, -2.871185302734375, -2.76495361328125, -2.658721923828125, -2.552490234375, -2.446258544921875, -2.34002685546875, -2.233795166015625, -2.1275634765625, -2.021331787109375, -1.91510009765625, -1.808868408203125, -1.70263671875, -1.596405029296875, -1.49017333984375, -1.383941650390625, -1.2777099609375, -1.171478271484375, -1.06524658203125, -0.959014892578125, -0.852783203125, -0.746551513671875, -0.64031982421875, -0.534088134765625, -0.4278564453125, -0.321624755859375, -0.21539306640625, -0.109161376953125, -0.0029296875, 0.103302001953125, 0.20953369140625, 0.315765380859375, 0.4219970703125, 0.528228759765625, 0.63446044921875, 0.740692138671875, 0.846923828125, 0.953155517578125, 1.05938720703125, 1.165618896484375, 1.2718505859375, 1.378082275390625, 1.48431396484375, 1.590545654296875, 1.69677734375, 1.803009033203125, 1.90924072265625, 2.015472412109375, 2.1217041015625, 2.227935791015625, 2.33416748046875, 2.440399169921875, 2.546630859375, 2.652862548828125, 2.75909423828125, 2.865325927734375, 2.9715576171875, 3.077789306640625, 3.18402099609375, 3.290252685546875, 3.396484375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 10.0, 18.0, 18.0, 22.0, 19.0, 23.0, 47.0, 64.0, 41.0, 56.0, 56.0, 67.0, 67.0, 64.0, 61.0, 56.0, 42.0, 30.0, 30.0, 40.0, 25.0, 25.0, 15.0, 12.0, 14.0, 6.0, 9.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.81640625, -0.790283203125, -0.76416015625, -0.738037109375, -0.7119140625, -0.685791015625, -0.65966796875, -0.633544921875, -0.607421875, -0.581298828125, -0.55517578125, -0.529052734375, -0.5029296875, -0.476806640625, -0.45068359375, -0.424560546875, -0.3984375, -0.372314453125, -0.34619140625, -0.320068359375, -0.2939453125, -0.267822265625, -0.24169921875, -0.215576171875, -0.189453125, -0.163330078125, -0.13720703125, -0.111083984375, -0.0849609375, -0.058837890625, -0.03271484375, -0.006591796875, 0.01953125, 0.045654296875, 0.07177734375, 0.097900390625, 0.1240234375, 0.150146484375, 0.17626953125, 0.202392578125, 0.228515625, 0.254638671875, 0.28076171875, 0.306884765625, 0.3330078125, 0.359130859375, 0.38525390625, 0.411376953125, 0.4375, 0.463623046875, 0.48974609375, 0.515869140625, 0.5419921875, 0.568115234375, 0.59423828125, 0.620361328125, 0.646484375, 0.672607421875, 0.69873046875, 0.724853515625, 0.7509765625, 0.777099609375, 0.80322265625, 0.829345703125, 0.85546875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 5.0, 11.0, 7.0, 12.0, 11.0, 13.0, 16.0, 20.0, 30.0, 25.0, 31.0, 28.0, 40.0, 34.0, 39.0, 62.0, 67.0, 64.0, 57.0, 64.0, 54.0, 47.0, 52.0, 29.0, 29.0, 13.0, 26.0, 20.0, 14.0, 9.0, 10.0, 11.0, 11.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.40284538269043, -6.201117038726807, -5.999388694763184, -5.797659873962402, -5.595931529998779, -5.394203186035156, -5.192474365234375, -4.990746021270752, -4.789017677307129, -4.587289333343506, -4.385560989379883, -4.183832168579102, -3.9821038246154785, -3.7803754806518555, -3.5786468982696533, -3.376918315887451, -3.175189971923828, -2.973461627960205, -2.771733045578003, -2.570004463195801, -2.3682761192321777, -2.1665477752685547, -1.9648191928863525, -1.76309072971344, -1.5613622665405273, -1.3596338033676147, -1.1579053401947021, -0.9561768770217896, -0.754448413848877, -0.5527199506759644, -0.35099148750305176, -0.14926302433013916, 0.05246591567993164, 0.25419437885284424, 0.45592284202575684, 0.6576513051986694, 0.859379768371582, 1.0611082315444946, 1.2628366947174072, 1.4645651578903198, 1.6662936210632324, 1.868022084236145, 2.0697505474090576, 2.2714791297912598, 2.473207473754883, 2.674935817718506, 2.876664400100708, 3.07839298248291, 3.280121326446533, 3.4818496704101562, 3.6835782527923584, 3.8853068351745605, 4.087035179138184, 4.288763523101807, 4.49049186706543, 4.692220687866211, 4.893949031829834, 5.095677375793457, 5.297406196594238, 5.499134540557861, 5.700862884521484, 5.902591228485107, 6.1043195724487305, 6.306048393249512, 6.507776737213135]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 11.0, 5.0, 17.0, 13.0, 22.0, 19.0, 28.0, 26.0, 20.0, 28.0, 25.0, 33.0, 41.0, 42.0, 32.0, 41.0, 48.0, 37.0, 49.0, 45.0, 38.0, 38.0, 27.0, 43.0, 33.0, 28.0, 34.0, 34.0, 27.0, 17.0, 10.0, 12.0, 8.0, 8.0, 8.0, 8.0, 8.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.52749490737915, -4.39070463180542, -4.2539143562316895, -4.117124557495117, -3.9803342819213867, -3.8435440063476562, -3.706753730773926, -3.5699634552001953, -3.433173418045044, -3.2963831424713135, -3.159593105316162, -3.0228028297424316, -2.886012554168701, -2.74922251701355, -2.6124322414398193, -2.475642204284668, -2.3388519287109375, -2.202061653137207, -2.0652716159820557, -1.9284813404083252, -1.7916911840438843, -1.6549010276794434, -1.518110752105713, -1.381320595741272, -1.244530439376831, -1.1077402830123901, -0.9709500670433044, -0.8341598510742188, -0.6973696947097778, -0.5605795383453369, -0.4237893223762512, -0.2869991064071655, -0.1502084732055664, -0.0134182870388031, 0.1233718991279602, 0.2601620852947235, 0.3969522714614868, 0.5337424278259277, 0.6705326437950134, 0.8073228597640991, 0.94411301612854, 1.080903172492981, 1.2176933288574219, 1.3544836044311523, 1.4912737607955933, 1.6280639171600342, 1.7648541927337646, 1.9016443490982056, 2.0384345054626465, 2.175224781036377, 2.3120148181915283, 2.448805093765259, 2.58559513092041, 2.7223854064941406, 2.859175682067871, 2.9959659576416016, 3.132755994796753, 3.2695462703704834, 3.4063363075256348, 3.5431265830993652, 3.6799168586730957, 3.816706895828247, 3.9534971714019775, 4.090287208557129, 4.227077484130859]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 12.0, 15.0, 21.0, 31.0, 47.0, 63.0, 112.0, 181.0, 252.0, 452.0, 750.0, 1388.0, 2432.0, 4699.0, 9699.0, 21073.0, 49377.0, 129991.0, 404757.0, 1294012.0, 1497458.0, 520023.0, 156567.0, 56460.0, 23088.0, 10428.0, 5008.0, 2514.0, 1378.0, 803.0, 445.0, 273.0, 174.0, 102.0, 66.0, 50.0, 28.0, 19.0, 9.0, 5.0, 7.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.496826171875, -10.18896484375, -9.881103515625, -9.5732421875, -9.265380859375, -8.95751953125, -8.649658203125, -8.341796875, -8.033935546875, -7.72607421875, -7.418212890625, -7.1103515625, -6.802490234375, -6.49462890625, -6.186767578125, -5.87890625, -5.571044921875, -5.26318359375, -4.955322265625, -4.6474609375, -4.339599609375, -4.03173828125, -3.723876953125, -3.416015625, -3.108154296875, -2.80029296875, -2.492431640625, -2.1845703125, -1.876708984375, -1.56884765625, -1.260986328125, -0.953125, -0.645263671875, -0.33740234375, -0.029541015625, 0.2783203125, 0.586181640625, 0.89404296875, 1.201904296875, 1.509765625, 1.817626953125, 2.12548828125, 2.433349609375, 2.7412109375, 3.049072265625, 3.35693359375, 3.664794921875, 3.97265625, 4.280517578125, 4.58837890625, 4.896240234375, 5.2041015625, 5.511962890625, 5.81982421875, 6.127685546875, 6.435546875, 6.743408203125, 7.05126953125, 7.359130859375, 7.6669921875, 7.974853515625, 8.28271484375, 8.590576171875, 8.8984375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 0.0, 7.0, 4.0, 9.0, 7.0, 14.0, 11.0, 6.0, 7.0, 17.0, 25.0, 29.0, 28.0, 19.0, 34.0, 37.0, 27.0, 30.0, 28.0, 31.0, 40.0, 32.0, 39.0, 33.0, 36.0, 36.0, 37.0, 36.0, 42.0, 35.0, 30.0, 32.0, 27.0, 30.0, 26.0, 21.0, 20.0, 12.0, 11.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-3.224609375, -3.12750244140625, -3.0303955078125, -2.93328857421875, -2.836181640625, -2.73907470703125, -2.6419677734375, -2.54486083984375, -2.44775390625, -2.35064697265625, -2.2535400390625, -2.15643310546875, -2.059326171875, -1.96221923828125, -1.8651123046875, -1.76800537109375, -1.6708984375, -1.57379150390625, -1.4766845703125, -1.37957763671875, -1.282470703125, -1.18536376953125, -1.0882568359375, -0.99114990234375, -0.89404296875, -0.79693603515625, -0.6998291015625, -0.60272216796875, -0.505615234375, -0.40850830078125, -0.3114013671875, -0.21429443359375, -0.1171875, -0.02008056640625, 0.0770263671875, 0.17413330078125, 0.271240234375, 0.36834716796875, 0.4654541015625, 0.56256103515625, 0.65966796875, 0.75677490234375, 0.8538818359375, 0.95098876953125, 1.048095703125, 1.14520263671875, 1.2423095703125, 1.33941650390625, 1.4365234375, 1.53363037109375, 1.6307373046875, 1.72784423828125, 1.824951171875, 1.92205810546875, 2.0191650390625, 2.11627197265625, 2.21337890625, 2.31048583984375, 2.4075927734375, 2.50469970703125, 2.601806640625, 2.69891357421875, 2.7960205078125, 2.89312744140625, 2.990234375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 13.0, 14.0, 24.0, 35.0, 34.0, 65.0, 109.0, 138.0, 217.0, 311.0, 474.0, 716.0, 1120.0, 1799.0, 2953.0, 4976.0, 8432.0, 15062.0, 28188.0, 55741.0, 114211.0, 248538.0, 546234.0, 1058596.0, 1064039.0, 552250.0, 251805.0, 116231.0, 56396.0, 28846.0, 15343.0, 8423.0, 4908.0, 2951.0, 1847.0, 1104.0, 671.0, 474.0, 338.0, 224.0, 138.0, 93.0, 57.0, 38.0, 42.0, 17.0, 13.0, 11.0, 8.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.6796875, -7.43975830078125, -7.1998291015625, -6.95989990234375, -6.719970703125, -6.48004150390625, -6.2401123046875, -6.00018310546875, -5.76025390625, -5.52032470703125, -5.2803955078125, -5.04046630859375, -4.800537109375, -4.56060791015625, -4.3206787109375, -4.08074951171875, -3.8408203125, -3.60089111328125, -3.3609619140625, -3.12103271484375, -2.881103515625, -2.64117431640625, -2.4012451171875, -2.16131591796875, -1.92138671875, -1.68145751953125, -1.4415283203125, -1.20159912109375, -0.961669921875, -0.72174072265625, -0.4818115234375, -0.24188232421875, -0.001953125, 0.23797607421875, 0.4779052734375, 0.71783447265625, 0.957763671875, 1.19769287109375, 1.4376220703125, 1.67755126953125, 1.91748046875, 2.15740966796875, 2.3973388671875, 2.63726806640625, 2.877197265625, 3.11712646484375, 3.3570556640625, 3.59698486328125, 3.8369140625, 4.07684326171875, 4.3167724609375, 4.55670166015625, 4.796630859375, 5.03656005859375, 5.2764892578125, 5.51641845703125, 5.75634765625, 5.99627685546875, 6.2362060546875, 6.47613525390625, 6.716064453125, 6.95599365234375, 7.1959228515625, 7.43585205078125, 7.67578125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 14.0, 15.0, 22.0, 29.0, 53.0, 40.0, 60.0, 64.0, 107.0, 137.0, 176.0, 197.0, 285.0, 284.0, 303.0, 304.0, 352.0, 299.0, 270.0, 227.0, 182.0, 152.0, 128.0, 94.0, 61.0, 54.0, 31.0, 23.0, 22.0, 12.0, 15.0, 12.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.187957763671875, -2.11419677734375, -2.040435791015625, -1.9666748046875, -1.892913818359375, -1.81915283203125, -1.745391845703125, -1.671630859375, -1.597869873046875, -1.52410888671875, -1.450347900390625, -1.3765869140625, -1.302825927734375, -1.22906494140625, -1.155303955078125, -1.08154296875, -1.007781982421875, -0.93402099609375, -0.860260009765625, -0.7864990234375, -0.712738037109375, -0.63897705078125, -0.565216064453125, -0.491455078125, -0.417694091796875, -0.34393310546875, -0.270172119140625, -0.1964111328125, -0.122650146484375, -0.04888916015625, 0.024871826171875, 0.0986328125, 0.172393798828125, 0.24615478515625, 0.319915771484375, 0.3936767578125, 0.467437744140625, 0.54119873046875, 0.614959716796875, 0.688720703125, 0.762481689453125, 0.83624267578125, 0.910003662109375, 0.9837646484375, 1.057525634765625, 1.13128662109375, 1.205047607421875, 1.27880859375, 1.352569580078125, 1.42633056640625, 1.500091552734375, 1.5738525390625, 1.647613525390625, 1.72137451171875, 1.795135498046875, 1.868896484375, 1.942657470703125, 2.01641845703125, 2.090179443359375, 2.1639404296875, 2.237701416015625, 2.31146240234375, 2.385223388671875, 2.458984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 5.0, 8.0, 9.0, 8.0, 19.0, 13.0, 24.0, 24.0, 23.0, 24.0, 41.0, 53.0, 62.0, 71.0, 58.0, 52.0, 72.0, 64.0, 62.0, 58.0, 26.0, 41.0, 36.0, 29.0, 19.0, 26.0, 15.0, 7.0, 6.0, 3.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.171698570251465, -6.946063995361328, -6.72042989730835, -6.494795799255371, -6.269161224365234, -6.043526649475098, -5.817892551422119, -5.592258453369141, -5.366623878479004, -5.140989303588867, -4.915355205535889, -4.68972110748291, -4.464086532592773, -4.238451957702637, -4.012817859649658, -3.7871835231781006, -3.561549186706543, -3.3359148502349854, -3.1102805137634277, -2.88464617729187, -2.6590118408203125, -2.433377504348755, -2.2077431678771973, -1.9821088314056396, -1.756474494934082, -1.5308401584625244, -1.3052058219909668, -1.0795714855194092, -0.8539371490478516, -0.628302812576294, -0.40266847610473633, -0.1770341396331787, 0.048600196838378906, 0.2742345333099365, 0.49986886978149414, 0.7255032062530518, 0.9511375427246094, 1.176771879196167, 1.4024062156677246, 1.6280405521392822, 1.8536748886108398, 2.0793092250823975, 2.304943561553955, 2.5305778980255127, 2.7562122344970703, 2.981846570968628, 3.2074809074401855, 3.433115243911743, 3.658749580383301, 3.8843839168548584, 4.110018253326416, 4.3356523513793945, 4.561286926269531, 4.786921501159668, 5.0125555992126465, 5.238189697265625, 5.463824272155762, 5.689458847045898, 5.915092945098877, 6.1407270431518555, 6.366361618041992, 6.591996192932129, 6.817630290985107, 7.043264389038086, 7.268898963928223]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 7.0, 6.0, 11.0, 16.0, 14.0, 15.0, 22.0, 25.0, 24.0, 32.0, 31.0, 33.0, 46.0, 41.0, 50.0, 36.0, 45.0, 46.0, 45.0, 35.0, 48.0, 37.0, 29.0, 38.0, 36.0, 38.0, 30.0, 22.0, 19.0, 20.0, 19.0, 12.0, 13.0, 6.0, 5.0, 6.0, 6.0, 2.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1419172286987305, -4.007763862609863, -3.873610496520996, -3.739457130432129, -3.6053037643432617, -3.4711503982543945, -3.3369970321655273, -3.20284366607666, -3.068690299987793, -2.934536933898926, -2.8003835678100586, -2.6662302017211914, -2.532076835632324, -2.397923469543457, -2.26377010345459, -2.1296167373657227, -1.9954633712768555, -1.8613100051879883, -1.727156639099121, -1.593003273010254, -1.4588499069213867, -1.3246965408325195, -1.1905431747436523, -1.0563898086547852, -0.922236442565918, -0.7880830764770508, -0.6539297103881836, -0.5197763442993164, -0.3856229782104492, -0.25146961212158203, -0.11731624603271484, 0.016837120056152344, 0.15099000930786133, 0.2851433753967285, 0.4192967414855957, 0.5534501075744629, 0.6876034736633301, 0.8217568397521973, 0.9559102058410645, 1.0900635719299316, 1.2242169380187988, 1.358370304107666, 1.4925236701965332, 1.6266770362854004, 1.7608304023742676, 1.8949837684631348, 2.029137134552002, 2.163290500640869, 2.2974438667297363, 2.4315972328186035, 2.5657505989074707, 2.699903964996338, 2.834057331085205, 2.9682106971740723, 3.1023640632629395, 3.2365174293518066, 3.370670795440674, 3.504824161529541, 3.638977527618408, 3.7731308937072754, 3.9072842597961426, 4.04143762588501, 4.175590991973877, 4.309744358062744, 4.443897724151611]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 15.0, 15.0, 9.0, 32.0, 38.0, 62.0, 97.0, 133.0, 211.0, 370.0, 559.0, 1114.0, 2046.0, 3951.0, 8041.0, 16915.0, 37131.0, 80593.0, 163113.0, 253932.0, 230815.0, 131526.0, 62725.0, 28431.0, 13253.0, 6327.0, 3294.0, 1609.0, 896.0, 528.0, 267.0, 187.0, 108.0, 68.0, 45.0, 31.0, 28.0, 18.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.78515625, -5.62371826171875, -5.4622802734375, -5.30084228515625, -5.139404296875, -4.97796630859375, -4.8165283203125, -4.65509033203125, -4.49365234375, -4.33221435546875, -4.1707763671875, -4.00933837890625, -3.847900390625, -3.68646240234375, -3.5250244140625, -3.36358642578125, -3.2021484375, -3.04071044921875, -2.8792724609375, -2.71783447265625, -2.556396484375, -2.39495849609375, -2.2335205078125, -2.07208251953125, -1.91064453125, -1.74920654296875, -1.5877685546875, -1.42633056640625, -1.264892578125, -1.10345458984375, -0.9420166015625, -0.78057861328125, -0.619140625, -0.45770263671875, -0.2962646484375, -0.13482666015625, 0.026611328125, 0.18804931640625, 0.3494873046875, 0.51092529296875, 0.67236328125, 0.83380126953125, 0.9952392578125, 1.15667724609375, 1.318115234375, 1.47955322265625, 1.6409912109375, 1.80242919921875, 1.9638671875, 2.12530517578125, 2.2867431640625, 2.44818115234375, 2.609619140625, 2.77105712890625, 2.9324951171875, 3.09393310546875, 3.25537109375, 3.41680908203125, 3.5782470703125, 3.73968505859375, 3.901123046875, 4.06256103515625, 4.2239990234375, 4.38543701171875, 4.546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 10.0, 13.0, 14.0, 7.0, 15.0, 12.0, 11.0, 17.0, 28.0, 22.0, 27.0, 38.0, 29.0, 39.0, 49.0, 50.0, 46.0, 44.0, 43.0, 37.0, 48.0, 39.0, 29.0, 49.0, 38.0, 44.0, 25.0, 29.0, 22.0, 19.0, 23.0, 22.0, 11.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.72265625, -4.57403564453125, -4.4254150390625, -4.27679443359375, -4.128173828125, -3.97955322265625, -3.8309326171875, -3.68231201171875, -3.53369140625, -3.38507080078125, -3.2364501953125, -3.08782958984375, -2.939208984375, -2.79058837890625, -2.6419677734375, -2.49334716796875, -2.3447265625, -2.19610595703125, -2.0474853515625, -1.89886474609375, -1.750244140625, -1.60162353515625, -1.4530029296875, -1.30438232421875, -1.15576171875, -1.00714111328125, -0.8585205078125, -0.70989990234375, -0.561279296875, -0.41265869140625, -0.2640380859375, -0.11541748046875, 0.033203125, 0.18182373046875, 0.3304443359375, 0.47906494140625, 0.627685546875, 0.77630615234375, 0.9249267578125, 1.07354736328125, 1.22216796875, 1.37078857421875, 1.5194091796875, 1.66802978515625, 1.816650390625, 1.96527099609375, 2.1138916015625, 2.26251220703125, 2.4111328125, 2.55975341796875, 2.7083740234375, 2.85699462890625, 3.005615234375, 3.15423583984375, 3.3028564453125, 3.45147705078125, 3.60009765625, 3.74871826171875, 3.8973388671875, 4.04595947265625, 4.194580078125, 4.34320068359375, 4.4918212890625, 4.64044189453125, 4.7890625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 10.0, 9.0, 10.0, 16.0, 24.0, 14.0, 40.0, 53.0, 71.0, 105.0, 147.0, 242.0, 432.0, 640.0, 1134.0, 1978.0, 3832.0, 7859.0, 17155.0, 39680.0, 94290.0, 214437.0, 317632.0, 196749.0, 85308.0, 35541.0, 15570.0, 7352.0, 3557.0, 1875.0, 1085.0, 653.0, 374.0, 238.0, 152.0, 93.0, 64.0, 36.0, 32.0, 14.0, 16.0, 12.0, 9.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.71978759765625, -5.5255126953125, -5.33123779296875, -5.136962890625, -4.94268798828125, -4.7484130859375, -4.55413818359375, -4.35986328125, -4.16558837890625, -3.9713134765625, -3.77703857421875, -3.582763671875, -3.38848876953125, -3.1942138671875, -2.99993896484375, -2.8056640625, -2.61138916015625, -2.4171142578125, -2.22283935546875, -2.028564453125, -1.83428955078125, -1.6400146484375, -1.44573974609375, -1.25146484375, -1.05718994140625, -0.8629150390625, -0.66864013671875, -0.474365234375, -0.28009033203125, -0.0858154296875, 0.10845947265625, 0.302734375, 0.49700927734375, 0.6912841796875, 0.88555908203125, 1.079833984375, 1.27410888671875, 1.4683837890625, 1.66265869140625, 1.85693359375, 2.05120849609375, 2.2454833984375, 2.43975830078125, 2.634033203125, 2.82830810546875, 3.0225830078125, 3.21685791015625, 3.4111328125, 3.60540771484375, 3.7996826171875, 3.99395751953125, 4.188232421875, 4.38250732421875, 4.5767822265625, 4.77105712890625, 4.96533203125, 5.15960693359375, 5.3538818359375, 5.54815673828125, 5.742431640625, 5.93670654296875, 6.1309814453125, 6.32525634765625, 6.51953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 11.0, 7.0, 17.0, 11.0, 22.0, 15.0, 20.0, 13.0, 32.0, 24.0, 27.0, 26.0, 27.0, 34.0, 41.0, 38.0, 54.0, 40.0, 43.0, 34.0, 48.0, 47.0, 28.0, 40.0, 34.0, 22.0, 27.0, 18.0, 28.0, 25.0, 12.0, 20.0, 20.0, 13.0, 8.0, 9.0, 12.0, 5.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.15594482421875, -2.0794677734375, -2.00299072265625, -1.926513671875, -1.85003662109375, -1.7735595703125, -1.69708251953125, -1.62060546875, -1.54412841796875, -1.4676513671875, -1.39117431640625, -1.314697265625, -1.23822021484375, -1.1617431640625, -1.08526611328125, -1.0087890625, -0.93231201171875, -0.8558349609375, -0.77935791015625, -0.702880859375, -0.62640380859375, -0.5499267578125, -0.47344970703125, -0.39697265625, -0.32049560546875, -0.2440185546875, -0.16754150390625, -0.091064453125, -0.01458740234375, 0.0618896484375, 0.13836669921875, 0.21484375, 0.29132080078125, 0.3677978515625, 0.44427490234375, 0.520751953125, 0.59722900390625, 0.6737060546875, 0.75018310546875, 0.82666015625, 0.90313720703125, 0.9796142578125, 1.05609130859375, 1.132568359375, 1.20904541015625, 1.2855224609375, 1.36199951171875, 1.4384765625, 1.51495361328125, 1.5914306640625, 1.66790771484375, 1.744384765625, 1.82086181640625, 1.8973388671875, 1.97381591796875, 2.05029296875, 2.12677001953125, 2.2032470703125, 2.27972412109375, 2.356201171875, 2.43267822265625, 2.5091552734375, 2.58563232421875, 2.662109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 12.0, 32.0, 25.0, 19.0, 54.0, 102.0, 136.0, 218.0, 354.0, 600.0, 1112.0, 2267.0, 4441.0, 9464.0, 21324.0, 52917.0, 139139.0, 330258.0, 291309.0, 115918.0, 44011.0, 18425.0, 8206.0, 3883.0, 1905.0, 971.0, 581.0, 320.0, 190.0, 111.0, 74.0, 48.0, 43.0, 20.0, 17.0, 11.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2734375, -3.17083740234375, -3.0682373046875, -2.96563720703125, -2.863037109375, -2.76043701171875, -2.6578369140625, -2.55523681640625, -2.45263671875, -2.35003662109375, -2.2474365234375, -2.14483642578125, -2.042236328125, -1.93963623046875, -1.8370361328125, -1.73443603515625, -1.6318359375, -1.52923583984375, -1.4266357421875, -1.32403564453125, -1.221435546875, -1.11883544921875, -1.0162353515625, -0.91363525390625, -0.81103515625, -0.70843505859375, -0.6058349609375, -0.50323486328125, -0.400634765625, -0.29803466796875, -0.1954345703125, -0.09283447265625, 0.009765625, 0.11236572265625, 0.2149658203125, 0.31756591796875, 0.420166015625, 0.52276611328125, 0.6253662109375, 0.72796630859375, 0.83056640625, 0.93316650390625, 1.0357666015625, 1.13836669921875, 1.240966796875, 1.34356689453125, 1.4461669921875, 1.54876708984375, 1.6513671875, 1.75396728515625, 1.8565673828125, 1.95916748046875, 2.061767578125, 2.16436767578125, 2.2669677734375, 2.36956787109375, 2.47216796875, 2.57476806640625, 2.6773681640625, 2.77996826171875, 2.882568359375, 2.98516845703125, 3.0877685546875, 3.19036865234375, 3.29296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 13.0, 17.0, 12.0, 27.0, 36.0, 54.0, 61.0, 67.0, 79.0, 84.0, 78.0, 80.0, 78.0, 59.0, 32.0, 44.0, 35.0, 32.0, 20.0, 14.0, 7.0, 10.0, 5.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016772747039794922, -0.0001629665493965149, -0.00015820562839508057, -0.00015344470739364624, -0.00014868378639221191, -0.0001439228653907776, -0.00013916194438934326, -0.00013440102338790894, -0.0001296401023864746, -0.00012487918138504028, -0.00012011826038360596, -0.00011535733938217163, -0.0001105964183807373, -0.00010583549737930298, -0.00010107457637786865, -9.631365537643433e-05, -9.1552734375e-05, -8.679181337356567e-05, -8.203089237213135e-05, -7.726997137069702e-05, -7.25090503692627e-05, -6.774812936782837e-05, -6.298720836639404e-05, -5.822628736495972e-05, -5.346536636352539e-05, -4.8704445362091064e-05, -4.394352436065674e-05, -3.918260335922241e-05, -3.4421682357788086e-05, -2.966076135635376e-05, -2.4899840354919434e-05, -2.0138919353485107e-05, -1.537799835205078e-05, -1.0617077350616455e-05, -5.856156349182129e-06, -1.0952353477478027e-06, 3.6656856536865234e-06, 8.42660665512085e-06, 1.3187527656555176e-05, 1.7948448657989502e-05, 2.2709369659423828e-05, 2.7470290660858154e-05, 3.223121166229248e-05, 3.699213266372681e-05, 4.175305366516113e-05, 4.651397466659546e-05, 5.1274895668029785e-05, 5.603581666946411e-05, 6.079673767089844e-05, 6.555765867233276e-05, 7.031857967376709e-05, 7.507950067520142e-05, 7.984042167663574e-05, 8.460134267807007e-05, 8.93622636795044e-05, 9.412318468093872e-05, 9.888410568237305e-05, 0.00010364502668380737, 0.0001084059476852417, 0.00011316686868667603, 0.00011792778968811035, 0.00012268871068954468, 0.000127449631690979, 0.00013221055269241333, 0.00013697147369384766]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 7.0, 19.0, 17.0, 37.0, 53.0, 83.0, 120.0, 185.0, 279.0, 415.0, 650.0, 1046.0, 1658.0, 2696.0, 4464.0, 7565.0, 12817.0, 22438.0, 39646.0, 70663.0, 119475.0, 177096.0, 198157.0, 156994.0, 98795.0, 56967.0, 31767.0, 17847.0, 10520.0, 6217.0, 3566.0, 2308.0, 1421.0, 852.0, 609.0, 389.0, 247.0, 156.0, 101.0, 73.0, 40.0, 38.0, 22.0, 11.0, 4.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.861328125, -1.805450439453125, -1.74957275390625, -1.693695068359375, -1.6378173828125, -1.581939697265625, -1.52606201171875, -1.470184326171875, -1.414306640625, -1.358428955078125, -1.30255126953125, -1.246673583984375, -1.1907958984375, -1.134918212890625, -1.07904052734375, -1.023162841796875, -0.96728515625, -0.911407470703125, -0.85552978515625, -0.799652099609375, -0.7437744140625, -0.687896728515625, -0.63201904296875, -0.576141357421875, -0.520263671875, -0.464385986328125, -0.40850830078125, -0.352630615234375, -0.2967529296875, -0.240875244140625, -0.18499755859375, -0.129119873046875, -0.0732421875, -0.017364501953125, 0.03851318359375, 0.094390869140625, 0.1502685546875, 0.206146240234375, 0.26202392578125, 0.317901611328125, 0.373779296875, 0.429656982421875, 0.48553466796875, 0.541412353515625, 0.5972900390625, 0.653167724609375, 0.70904541015625, 0.764923095703125, 0.82080078125, 0.876678466796875, 0.93255615234375, 0.988433837890625, 1.0443115234375, 1.100189208984375, 1.15606689453125, 1.211944580078125, 1.267822265625, 1.323699951171875, 1.37957763671875, 1.435455322265625, 1.4913330078125, 1.547210693359375, 1.60308837890625, 1.658966064453125, 1.71484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 11.0, 7.0, 11.0, 13.0, 11.0, 21.0, 26.0, 29.0, 28.0, 28.0, 43.0, 52.0, 56.0, 36.0, 49.0, 56.0, 70.0, 68.0, 35.0, 68.0, 42.0, 37.0, 35.0, 30.0, 33.0, 21.0, 16.0, 17.0, 15.0, 5.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.583984375, -0.5670890808105469, -0.5501937866210938, -0.5332984924316406, -0.5164031982421875, -0.4995079040527344, -0.48261260986328125, -0.4657173156738281, -0.448822021484375, -0.4319267272949219, -0.41503143310546875, -0.3981361389160156, -0.3812408447265625, -0.3643455505371094, -0.34745025634765625, -0.3305549621582031, -0.31365966796875, -0.2967643737792969, -0.27986907958984375, -0.2629737854003906, -0.2460784912109375, -0.22918319702148438, -0.21228790283203125, -0.19539260864257812, -0.178497314453125, -0.16160202026367188, -0.14470672607421875, -0.12781143188476562, -0.1109161376953125, -0.09402084350585938, -0.07712554931640625, -0.060230255126953125, -0.0433349609375, -0.026439666748046875, -0.00954437255859375, 0.007350921630859375, 0.0242462158203125, 0.041141510009765625, 0.05803680419921875, 0.07493209838867188, 0.091827392578125, 0.10872268676757812, 0.12561798095703125, 0.14251327514648438, 0.1594085693359375, 0.17630386352539062, 0.19319915771484375, 0.21009445190429688, 0.22698974609375, 0.24388504028320312, 0.26078033447265625, 0.2776756286621094, 0.2945709228515625, 0.3114662170410156, 0.32836151123046875, 0.3452568054199219, 0.362152099609375, 0.3790473937988281, 0.39594268798828125, 0.4128379821777344, 0.4297332763671875, 0.4466285705566406, 0.46352386474609375, 0.4804191589355469, 0.497314453125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 9.0, 5.0, 6.0, 7.0, 11.0, 8.0, 14.0, 11.0, 25.0, 22.0, 28.0, 35.0, 33.0, 56.0, 56.0, 58.0, 57.0, 73.0, 47.0, 68.0, 68.0, 42.0, 48.0, 46.0, 31.0, 24.0, 24.0, 21.0, 18.0, 7.0, 5.0, 8.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.995565414428711, -6.775362014770508, -6.555158615112305, -6.334955215454102, -6.114751815795898, -5.894548416137695, -5.674345016479492, -5.454141616821289, -5.233938217163086, -5.013734817504883, -4.79353141784668, -4.573328018188477, -4.353124618530273, -4.13292121887207, -3.912717819213867, -3.692514419555664, -3.472310781478882, -3.2521073818206787, -3.0319039821624756, -2.8117005825042725, -2.5914971828460693, -2.371293544769287, -2.151090145111084, -1.9308868646621704, -1.7106834650039673, -1.4904800653457642, -1.270276665687561, -1.0500731468200684, -0.82986980676651, -0.6096663475036621, -0.389462947845459, -0.16925954818725586, 0.050943851470947266, 0.2711472511291504, 0.4913506805896759, 0.7115541100502014, 0.9317575097084045, 1.1519609689712524, 1.3721643686294556, 1.5923677682876587, 1.8125711679458618, 2.0327746868133545, 2.2529780864715576, 2.4731814861297607, 2.693384885787964, 2.913588285446167, 3.13379168510437, 3.3539950847625732, 3.5741984844207764, 3.7944018840789795, 4.014605522155762, 4.234808921813965, 4.455012321472168, 4.675215721130371, 4.895419120788574, 5.115622520446777, 5.3358259201049805, 5.556029319763184, 5.776232719421387, 5.99643611907959, 6.216639518737793, 6.436842918395996, 6.657046318054199, 6.877249717712402, 7.0974531173706055]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 3.0, 3.0, 8.0, 14.0, 10.0, 12.0, 15.0, 20.0, 26.0, 28.0, 26.0, 22.0, 34.0, 47.0, 37.0, 47.0, 36.0, 45.0, 46.0, 41.0, 42.0, 40.0, 42.0, 39.0, 32.0, 33.0, 44.0, 25.0, 31.0, 20.0, 26.0, 16.0, 16.0, 16.0, 6.0, 7.0, 5.0, 10.0, 3.0, 1.0, 3.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.998119592666626, -3.8669707775115967, -3.7358222007751465, -3.604673385620117, -3.473524570465088, -3.3423757553100586, -3.2112271785736084, -3.080078363418579, -2.948929786682129, -2.8177809715270996, -2.6866323947906494, -2.55548357963562, -2.424334764480591, -2.2931861877441406, -2.1620373725891113, -2.030888557434082, -1.8997397422790527, -1.768591046333313, -1.6374422311782837, -1.506293535232544, -1.3751447200775146, -1.243996024131775, -1.1128473281860352, -0.9816985726356506, -0.8505498170852661, -0.7194010615348816, -0.5882523059844971, -0.4571036100387573, -0.3259548544883728, -0.19480609893798828, -0.06365740299224854, 0.06749135255813599, 0.1986398696899414, 0.3297886252403259, 0.46093735098838806, 0.5920860767364502, 0.7232348322868347, 0.8543835878372192, 0.985532283782959, 1.1166810989379883, 1.247829794883728, 1.3789784908294678, 1.510127305984497, 1.6412760019302368, 1.7724246978759766, 1.9035735130310059, 2.034722328186035, 2.1658709049224854, 2.2970197200775146, 2.428168535232544, 2.559317111968994, 2.6904659271240234, 2.8216147422790527, 2.952763557434082, 3.0839121341705322, 3.2150609493255615, 3.3462095260620117, 3.477358341217041, 3.608506917953491, 3.7396557331085205, 3.87080454826355, 4.001953125, 4.133101940155029, 4.264250755310059, 4.395399570465088]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 17.0, 8.0, 30.0, 25.0, 45.0, 72.0, 103.0, 144.0, 227.0, 382.0, 577.0, 886.0, 1267.0, 2016.0, 3310.0, 5151.0, 7774.0, 12516.0, 19544.0, 30489.0, 47213.0, 70196.0, 99032.0, 126640.0, 142569.0, 134835.0, 109991.0, 80119.0, 54187.0, 35927.0, 23041.0, 14651.0, 9267.0, 5899.0, 3739.0, 2342.0, 1502.0, 1005.0, 628.0, 380.0, 292.0, 179.0, 102.0, 79.0, 50.0, 40.0, 14.0, 25.0, 13.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.59765625, -4.4525146484375, -4.307373046875, -4.1622314453125, -4.01708984375, -3.8719482421875, -3.726806640625, -3.5816650390625, -3.4365234375, -3.2913818359375, -3.146240234375, -3.0010986328125, -2.85595703125, -2.7108154296875, -2.565673828125, -2.4205322265625, -2.275390625, -2.1302490234375, -1.985107421875, -1.8399658203125, -1.69482421875, -1.5496826171875, -1.404541015625, -1.2593994140625, -1.1142578125, -0.9691162109375, -0.823974609375, -0.6788330078125, -0.53369140625, -0.3885498046875, -0.243408203125, -0.0982666015625, 0.046875, 0.1920166015625, 0.337158203125, 0.4822998046875, 0.62744140625, 0.7725830078125, 0.917724609375, 1.0628662109375, 1.2080078125, 1.3531494140625, 1.498291015625, 1.6434326171875, 1.78857421875, 1.9337158203125, 2.078857421875, 2.2239990234375, 2.369140625, 2.5142822265625, 2.659423828125, 2.8045654296875, 2.94970703125, 3.0948486328125, 3.239990234375, 3.3851318359375, 3.5302734375, 3.6754150390625, 3.820556640625, 3.9656982421875, 4.11083984375, 4.2559814453125, 4.401123046875, 4.5462646484375, 4.69140625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 8.0, 12.0, 19.0, 24.0, 20.0, 26.0, 18.0, 38.0, 41.0, 35.0, 34.0, 49.0, 51.0, 50.0, 46.0, 51.0, 45.0, 42.0, 44.0, 43.0, 42.0, 42.0, 28.0, 27.0, 23.0, 18.0, 16.0, 14.0, 13.0, 17.0, 4.0, 6.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.0703125, -4.9176025390625, -4.764892578125, -4.6121826171875, -4.45947265625, -4.3067626953125, -4.154052734375, -4.0013427734375, -3.8486328125, -3.6959228515625, -3.543212890625, -3.3905029296875, -3.23779296875, -3.0850830078125, -2.932373046875, -2.7796630859375, -2.626953125, -2.4742431640625, -2.321533203125, -2.1688232421875, -2.01611328125, -1.8634033203125, -1.710693359375, -1.5579833984375, -1.4052734375, -1.2525634765625, -1.099853515625, -0.9471435546875, -0.79443359375, -0.6417236328125, -0.489013671875, -0.3363037109375, -0.18359375, -0.0308837890625, 0.121826171875, 0.2745361328125, 0.42724609375, 0.5799560546875, 0.732666015625, 0.8853759765625, 1.0380859375, 1.1907958984375, 1.343505859375, 1.4962158203125, 1.64892578125, 1.8016357421875, 1.954345703125, 2.1070556640625, 2.259765625, 2.4124755859375, 2.565185546875, 2.7178955078125, 2.87060546875, 3.0233154296875, 3.176025390625, 3.3287353515625, 3.4814453125, 3.6341552734375, 3.786865234375, 3.9395751953125, 4.09228515625, 4.2449951171875, 4.397705078125, 4.5504150390625, 4.703125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 11.0, 21.0, 30.0, 38.0, 60.0, 91.0, 127.0, 242.0, 411.0, 733.0, 1287.0, 1987.0, 3634.0, 6374.0, 11023.0, 18968.0, 33205.0, 55015.0, 87945.0, 128898.0, 162973.0, 165380.0, 134110.0, 93334.0, 58655.0, 35422.0, 20646.0, 11814.0, 6874.0, 3891.0, 2210.0, 1295.0, 718.0, 463.0, 223.0, 176.0, 92.0, 59.0, 38.0, 26.0, 16.0, 13.0, 10.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.642578125, -5.4609375, -5.279296875, -5.09765625, -4.916015625, -4.734375, -4.552734375, -4.37109375, -4.189453125, -4.0078125, -3.826171875, -3.64453125, -3.462890625, -3.28125, -3.099609375, -2.91796875, -2.736328125, -2.5546875, -2.373046875, -2.19140625, -2.009765625, -1.828125, -1.646484375, -1.46484375, -1.283203125, -1.1015625, -0.919921875, -0.73828125, -0.556640625, -0.375, -0.193359375, -0.01171875, 0.169921875, 0.3515625, 0.533203125, 0.71484375, 0.896484375, 1.078125, 1.259765625, 1.44140625, 1.623046875, 1.8046875, 1.986328125, 2.16796875, 2.349609375, 2.53125, 2.712890625, 2.89453125, 3.076171875, 3.2578125, 3.439453125, 3.62109375, 3.802734375, 3.984375, 4.166015625, 4.34765625, 4.529296875, 4.7109375, 4.892578125, 5.07421875, 5.255859375, 5.4375, 5.619140625, 5.80078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 10.0, 9.0, 11.0, 5.0, 9.0, 8.0, 14.0, 18.0, 23.0, 23.0, 33.0, 35.0, 34.0, 34.0, 38.0, 33.0, 44.0, 43.0, 35.0, 51.0, 34.0, 42.0, 44.0, 34.0, 41.0, 51.0, 32.0, 36.0, 28.0, 20.0, 20.0, 23.0, 19.0, 15.0, 13.0, 12.0, 14.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.878662109375, -2.79052734375, -2.702392578125, -2.6142578125, -2.526123046875, -2.43798828125, -2.349853515625, -2.26171875, -2.173583984375, -2.08544921875, -1.997314453125, -1.9091796875, -1.821044921875, -1.73291015625, -1.644775390625, -1.556640625, -1.468505859375, -1.38037109375, -1.292236328125, -1.2041015625, -1.115966796875, -1.02783203125, -0.939697265625, -0.8515625, -0.763427734375, -0.67529296875, -0.587158203125, -0.4990234375, -0.410888671875, -0.32275390625, -0.234619140625, -0.146484375, -0.058349609375, 0.02978515625, 0.117919921875, 0.2060546875, 0.294189453125, 0.38232421875, 0.470458984375, 0.55859375, 0.646728515625, 0.73486328125, 0.822998046875, 0.9111328125, 0.999267578125, 1.08740234375, 1.175537109375, 1.263671875, 1.351806640625, 1.43994140625, 1.528076171875, 1.6162109375, 1.704345703125, 1.79248046875, 1.880615234375, 1.96875, 2.056884765625, 2.14501953125, 2.233154296875, 2.3212890625, 2.409423828125, 2.49755859375, 2.585693359375, 2.673828125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 11.0, 12.0, 26.0, 33.0, 37.0, 53.0, 72.0, 88.0, 122.0, 171.0, 216.0, 385.0, 515.0, 823.0, 1213.0, 2021.0, 3590.0, 6950.0, 15074.0, 39506.0, 123322.0, 327456.0, 330261.0, 125109.0, 39905.0, 15240.0, 6799.0, 3588.0, 2125.0, 1249.0, 818.0, 495.0, 371.0, 230.0, 172.0, 145.0, 97.0, 55.0, 52.0, 38.0, 27.0, 31.0, 13.0, 8.0, 10.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.41796875, -7.1998291015625, -6.981689453125, -6.7635498046875, -6.54541015625, -6.3272705078125, -6.109130859375, -5.8909912109375, -5.6728515625, -5.4547119140625, -5.236572265625, -5.0184326171875, -4.80029296875, -4.5821533203125, -4.364013671875, -4.1458740234375, -3.927734375, -3.7095947265625, -3.491455078125, -3.2733154296875, -3.05517578125, -2.8370361328125, -2.618896484375, -2.4007568359375, -2.1826171875, -1.9644775390625, -1.746337890625, -1.5281982421875, -1.31005859375, -1.0919189453125, -0.873779296875, -0.6556396484375, -0.4375, -0.2193603515625, -0.001220703125, 0.2169189453125, 0.43505859375, 0.6531982421875, 0.871337890625, 1.0894775390625, 1.3076171875, 1.5257568359375, 1.743896484375, 1.9620361328125, 2.18017578125, 2.3983154296875, 2.616455078125, 2.8345947265625, 3.052734375, 3.2708740234375, 3.489013671875, 3.7071533203125, 3.92529296875, 4.1434326171875, 4.361572265625, 4.5797119140625, 4.7978515625, 5.0159912109375, 5.234130859375, 5.4522705078125, 5.67041015625, 5.8885498046875, 6.106689453125, 6.3248291015625, 6.54296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 13.0, 32.0, 67.0, 127.0, 174.0, 211.0, 158.0, 96.0, 35.0, 25.0, 12.0, 9.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0013246536254882812, -0.001286044716835022, -0.0012474358081817627, -0.0012088268995285034, -0.0011702179908752441, -0.0011316090822219849, -0.0010930001735687256, -0.0010543912649154663, -0.001015782356262207, -0.0009771734476089478, -0.0009385645389556885, -0.0008999556303024292, -0.0008613467216491699, -0.0008227378129959106, -0.0007841289043426514, -0.0007455199956893921, -0.0007069110870361328, -0.0006683021783828735, -0.0006296932697296143, -0.000591084361076355, -0.0005524754524230957, -0.0005138665437698364, -0.00047525763511657715, -0.00043664872646331787, -0.0003980398178100586, -0.0003594309091567993, -0.00032082200050354004, -0.00028221309185028076, -0.00024360418319702148, -0.0002049952745437622, -0.00016638636589050293, -0.00012777745723724365, -8.916854858398438e-05, -5.05596399307251e-05, -1.195073127746582e-05, 2.6658177375793457e-05, 6.526708602905273e-05, 0.00010387599468231201, 0.0001424849033355713, 0.00018109381198883057, 0.00021970272064208984, 0.0002583116292953491, 0.0002969205379486084, 0.0003355294466018677, 0.00037413835525512695, 0.00041274726390838623, 0.0004513561725616455, 0.0004899650812149048, 0.0005285739898681641, 0.0005671828985214233, 0.0006057918071746826, 0.0006444007158279419, 0.0006830096244812012, 0.0007216185331344604, 0.0007602274417877197, 0.000798836350440979, 0.0008374452590942383, 0.0008760541677474976, 0.0009146630764007568, 0.0009532719850540161, 0.0009918808937072754, 0.0010304898023605347, 0.001069098711013794, 0.0011077076196670532, 0.0011463165283203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 14.0, 21.0, 23.0, 31.0, 53.0, 88.0, 120.0, 195.0, 332.0, 523.0, 805.0, 1343.0, 2381.0, 4528.0, 8953.0, 18876.0, 42280.0, 97736.0, 204359.0, 281303.0, 205287.0, 98029.0, 42658.0, 19067.0, 9087.0, 4514.0, 2380.0, 1408.0, 817.0, 479.0, 277.0, 187.0, 122.0, 87.0, 59.0, 32.0, 22.0, 21.0, 17.0, 6.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.0810546875, -3.947265625, -3.8134765625, -3.6796875, -3.5458984375, -3.412109375, -3.2783203125, -3.14453125, -3.0107421875, -2.876953125, -2.7431640625, -2.609375, -2.4755859375, -2.341796875, -2.2080078125, -2.07421875, -1.9404296875, -1.806640625, -1.6728515625, -1.5390625, -1.4052734375, -1.271484375, -1.1376953125, -1.00390625, -0.8701171875, -0.736328125, -0.6025390625, -0.46875, -0.3349609375, -0.201171875, -0.0673828125, 0.06640625, 0.2001953125, 0.333984375, 0.4677734375, 0.6015625, 0.7353515625, 0.869140625, 1.0029296875, 1.13671875, 1.2705078125, 1.404296875, 1.5380859375, 1.671875, 1.8056640625, 1.939453125, 2.0732421875, 2.20703125, 2.3408203125, 2.474609375, 2.6083984375, 2.7421875, 2.8759765625, 3.009765625, 3.1435546875, 3.27734375, 3.4111328125, 3.544921875, 3.6787109375, 3.8125, 3.9462890625, 4.080078125, 4.2138671875, 4.34765625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 10.0, 8.0, 14.0, 15.0, 12.0, 29.0, 33.0, 36.0, 34.0, 45.0, 56.0, 54.0, 67.0, 56.0, 95.0, 68.0, 56.0, 51.0, 42.0, 33.0, 35.0, 25.0, 27.0, 12.0, 10.0, 11.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.978515625, -0.9477615356445312, -0.9170074462890625, -0.8862533569335938, -0.855499267578125, -0.8247451782226562, -0.7939910888671875, -0.7632369995117188, -0.73248291015625, -0.7017288208007812, -0.6709747314453125, -0.6402206420898438, -0.609466552734375, -0.5787124633789062, -0.5479583740234375, -0.5172042846679688, -0.4864501953125, -0.45569610595703125, -0.4249420166015625, -0.39418792724609375, -0.363433837890625, -0.33267974853515625, -0.3019256591796875, -0.27117156982421875, -0.24041748046875, -0.20966339111328125, -0.1789093017578125, -0.14815521240234375, -0.117401123046875, -0.08664703369140625, -0.0558929443359375, -0.02513885498046875, 0.005615234375, 0.03636932373046875, 0.0671234130859375, 0.09787750244140625, 0.128631591796875, 0.15938568115234375, 0.1901397705078125, 0.22089385986328125, 0.25164794921875, 0.28240203857421875, 0.3131561279296875, 0.34391021728515625, 0.374664306640625, 0.40541839599609375, 0.4361724853515625, 0.46692657470703125, 0.4976806640625, 0.5284347534179688, 0.5591888427734375, 0.5899429321289062, 0.620697021484375, 0.6514511108398438, 0.6822052001953125, 0.7129592895507812, 0.74371337890625, 0.7744674682617188, 0.8052215576171875, 0.8359756469726562, 0.866729736328125, 0.8974838256835938, 0.9282379150390625, 0.9589920043945312, 0.98974609375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 9.0, 3.0, 12.0, 10.0, 17.0, 12.0, 23.0, 24.0, 14.0, 38.0, 44.0, 53.0, 47.0, 57.0, 58.0, 70.0, 52.0, 67.0, 54.0, 68.0, 42.0, 41.0, 34.0, 27.0, 23.0, 19.0, 15.0, 16.0, 7.0, 6.0, 10.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.33606481552124, -7.108825206756592, -6.881585597991943, -6.654345989227295, -6.4271063804626465, -6.199866771697998, -5.97262716293335, -5.745387554168701, -5.518147945404053, -5.290908336639404, -5.063668727874756, -4.836429119110107, -4.609189510345459, -4.3819499015808105, -4.154710292816162, -3.9274706840515137, -3.7002310752868652, -3.472991466522217, -3.2457518577575684, -3.01851224899292, -2.7912726402282715, -2.564033031463623, -2.3367934226989746, -2.109553813934326, -1.8823142051696777, -1.6550745964050293, -1.4278349876403809, -1.2005953788757324, -0.973355770111084, -0.7461161613464355, -0.5188765525817871, -0.29163694381713867, -0.06439781188964844, 0.162841796875, 0.39008140563964844, 0.6173210144042969, 0.8445606231689453, 1.0718002319335938, 1.2990398406982422, 1.5262794494628906, 1.753519058227539, 1.9807586669921875, 2.207998275756836, 2.4352378845214844, 2.662477493286133, 2.8897171020507812, 3.1169567108154297, 3.344196319580078, 3.5714359283447266, 3.798675537109375, 4.025915145874023, 4.253154754638672, 4.48039436340332, 4.707633972167969, 4.934873580932617, 5.162113189697266, 5.389352798461914, 5.6165924072265625, 5.843832015991211, 6.071071624755859, 6.298311233520508, 6.525550842285156, 6.752790451049805, 6.980030059814453, 7.207269668579102]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 7.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 9.0, 13.0, 12.0, 16.0, 15.0, 19.0, 28.0, 22.0, 33.0, 33.0, 43.0, 34.0, 48.0, 45.0, 31.0, 39.0, 39.0, 36.0, 51.0, 54.0, 35.0, 42.0, 33.0, 50.0, 28.0, 25.0, 24.0, 22.0, 18.0, 9.0, 14.0, 10.0, 10.0, 7.0, 9.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09138822555542, -3.952510356903076, -3.8136324882507324, -3.6747546195983887, -3.535876750946045, -3.396998882293701, -3.2581212520599365, -3.1192433834075928, -2.980365514755249, -2.8414876461029053, -2.7026097774505615, -2.5637319087982178, -2.424854278564453, -2.2859764099121094, -2.1470985412597656, -2.008220672607422, -1.8693428039550781, -1.7304649353027344, -1.5915870666503906, -1.4527093172073364, -1.3138314485549927, -1.174953579902649, -1.0360758304595947, -0.897197961807251, -0.7583200931549072, -0.6194422245025635, -0.4805644154548645, -0.34168657660484314, -0.20280873775482178, -0.06393086910247803, 0.07494693994522095, 0.21382474899291992, 0.35270261764526367, 0.49158045649528503, 0.6304582953453064, 0.7693361043930054, 0.9082139730453491, 1.0470918416976929, 1.185969591140747, 1.3248474597930908, 1.4637253284454346, 1.6026031970977783, 1.741481065750122, 1.8803588151931763, 2.0192365646362305, 2.158114433288574, 2.296992301940918, 2.4358701705932617, 2.5747480392456055, 2.713625907897949, 2.852503776550293, 2.9913816452026367, 3.1302595138549805, 3.269137382507324, 3.408015012741089, 3.5468928813934326, 3.6857707500457764, 3.82464861869812, 3.963526487350464, 4.1024041175842285, 4.241281986236572, 4.380159854888916, 4.51903772354126, 4.6579155921936035, 4.796793460845947]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 9.0, 8.0, 7.0, 17.0, 20.0, 38.0, 58.0, 85.0, 113.0, 197.0, 351.0, 599.0, 986.0, 1737.0, 3114.0, 5682.0, 11209.0, 23273.0, 51247.0, 126649.0, 351821.0, 998785.0, 1463241.0, 732206.0, 250883.0, 94245.0, 39266.0, 18295.0, 9040.0, 4723.0, 2602.0, 1521.0, 875.0, 534.0, 319.0, 203.0, 114.0, 62.0, 44.0, 41.0, 18.0, 21.0, 9.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7877197265625, -7.512939453125, -7.2381591796875, -6.96337890625, -6.6885986328125, -6.413818359375, -6.1390380859375, -5.8642578125, -5.5894775390625, -5.314697265625, -5.0399169921875, -4.76513671875, -4.4903564453125, -4.215576171875, -3.9407958984375, -3.666015625, -3.3912353515625, -3.116455078125, -2.8416748046875, -2.56689453125, -2.2921142578125, -2.017333984375, -1.7425537109375, -1.4677734375, -1.1929931640625, -0.918212890625, -0.6434326171875, -0.36865234375, -0.0938720703125, 0.180908203125, 0.4556884765625, 0.73046875, 1.0052490234375, 1.280029296875, 1.5548095703125, 1.82958984375, 2.1043701171875, 2.379150390625, 2.6539306640625, 2.9287109375, 3.2034912109375, 3.478271484375, 3.7530517578125, 4.02783203125, 4.3026123046875, 4.577392578125, 4.8521728515625, 5.126953125, 5.4017333984375, 5.676513671875, 5.9512939453125, 6.22607421875, 6.5008544921875, 6.775634765625, 7.0504150390625, 7.3251953125, 7.5999755859375, 7.874755859375, 8.1495361328125, 8.42431640625, 8.6990966796875, 8.973876953125, 9.2486572265625, 9.5234375]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 11.0, 10.0, 12.0, 18.0, 30.0, 19.0, 22.0, 32.0, 32.0, 29.0, 44.0, 49.0, 35.0, 56.0, 39.0, 38.0, 37.0, 57.0, 42.0, 43.0, 42.0, 46.0, 33.0, 33.0, 26.0, 30.0, 16.0, 13.0, 16.0, 7.0, 8.0, 6.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.537109375, -3.42144775390625, -3.3057861328125, -3.19012451171875, -3.074462890625, -2.95880126953125, -2.8431396484375, -2.72747802734375, -2.61181640625, -2.49615478515625, -2.3804931640625, -2.26483154296875, -2.149169921875, -2.03350830078125, -1.9178466796875, -1.80218505859375, -1.6865234375, -1.57086181640625, -1.4552001953125, -1.33953857421875, -1.223876953125, -1.10821533203125, -0.9925537109375, -0.87689208984375, -0.76123046875, -0.64556884765625, -0.5299072265625, -0.41424560546875, -0.298583984375, -0.18292236328125, -0.0672607421875, 0.04840087890625, 0.1640625, 0.27972412109375, 0.3953857421875, 0.51104736328125, 0.626708984375, 0.74237060546875, 0.8580322265625, 0.97369384765625, 1.08935546875, 1.20501708984375, 1.3206787109375, 1.43634033203125, 1.552001953125, 1.66766357421875, 1.7833251953125, 1.89898681640625, 2.0146484375, 2.13031005859375, 2.2459716796875, 2.36163330078125, 2.477294921875, 2.59295654296875, 2.7086181640625, 2.82427978515625, 2.93994140625, 3.05560302734375, 3.1712646484375, 3.28692626953125, 3.402587890625, 3.51824951171875, 3.6339111328125, 3.74957275390625, 3.865234375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 13.0, 18.0, 27.0, 40.0, 57.0, 97.0, 144.0, 205.0, 367.0, 485.0, 786.0, 1259.0, 2056.0, 3430.0, 5569.0, 9677.0, 16949.0, 30777.0, 57183.0, 110769.0, 221618.0, 451364.0, 859243.0, 1060757.0, 674265.0, 336138.0, 165477.0, 84389.0, 43980.0, 24157.0, 13261.0, 7725.0, 4569.0, 2757.0, 1755.0, 1062.0, 647.0, 433.0, 258.0, 174.0, 114.0, 81.0, 54.0, 25.0, 26.0, 16.0, 8.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.082275390625, -6.85595703125, -6.629638671875, -6.4033203125, -6.177001953125, -5.95068359375, -5.724365234375, -5.498046875, -5.271728515625, -5.04541015625, -4.819091796875, -4.5927734375, -4.366455078125, -4.14013671875, -3.913818359375, -3.6875, -3.461181640625, -3.23486328125, -3.008544921875, -2.7822265625, -2.555908203125, -2.32958984375, -2.103271484375, -1.876953125, -1.650634765625, -1.42431640625, -1.197998046875, -0.9716796875, -0.745361328125, -0.51904296875, -0.292724609375, -0.06640625, 0.159912109375, 0.38623046875, 0.612548828125, 0.8388671875, 1.065185546875, 1.29150390625, 1.517822265625, 1.744140625, 1.970458984375, 2.19677734375, 2.423095703125, 2.6494140625, 2.875732421875, 3.10205078125, 3.328369140625, 3.5546875, 3.781005859375, 4.00732421875, 4.233642578125, 4.4599609375, 4.686279296875, 4.91259765625, 5.138916015625, 5.365234375, 5.591552734375, 5.81787109375, 6.044189453125, 6.2705078125, 6.496826171875, 6.72314453125, 6.949462890625, 7.17578125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 2.0, 10.0, 8.0, 16.0, 12.0, 21.0, 38.0, 46.0, 54.0, 70.0, 79.0, 103.0, 129.0, 173.0, 213.0, 265.0, 304.0, 335.0, 350.0, 334.0, 307.0, 253.0, 219.0, 139.0, 130.0, 108.0, 85.0, 62.0, 65.0, 36.0, 23.0, 27.0, 9.0, 14.0, 7.0, 9.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.64178466796875, -2.5667724609375, -2.49176025390625, -2.416748046875, -2.34173583984375, -2.2667236328125, -2.19171142578125, -2.11669921875, -2.04168701171875, -1.9666748046875, -1.89166259765625, -1.816650390625, -1.74163818359375, -1.6666259765625, -1.59161376953125, -1.5166015625, -1.44158935546875, -1.3665771484375, -1.29156494140625, -1.216552734375, -1.14154052734375, -1.0665283203125, -0.99151611328125, -0.91650390625, -0.84149169921875, -0.7664794921875, -0.69146728515625, -0.616455078125, -0.54144287109375, -0.4664306640625, -0.39141845703125, -0.31640625, -0.24139404296875, -0.1663818359375, -0.09136962890625, -0.016357421875, 0.05865478515625, 0.1336669921875, 0.20867919921875, 0.28369140625, 0.35870361328125, 0.4337158203125, 0.50872802734375, 0.583740234375, 0.65875244140625, 0.7337646484375, 0.80877685546875, 0.8837890625, 0.95880126953125, 1.0338134765625, 1.10882568359375, 1.183837890625, 1.25885009765625, 1.3338623046875, 1.40887451171875, 1.48388671875, 1.55889892578125, 1.6339111328125, 1.70892333984375, 1.783935546875, 1.85894775390625, 1.9339599609375, 2.00897216796875, 2.083984375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 15.0, 10.0, 10.0, 12.0, 11.0, 16.0, 22.0, 30.0, 42.0, 45.0, 53.0, 66.0, 62.0, 51.0, 83.0, 60.0, 76.0, 57.0, 47.0, 37.0, 39.0, 31.0, 21.0, 18.0, 16.0, 14.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.556941986083984, -9.307881355285645, -9.058820724487305, -8.809761047363281, -8.560700416564941, -8.311639785766602, -8.062579154968262, -7.81351900100708, -7.564458847045898, -7.315398216247559, -7.066338062286377, -6.817277431488037, -6.5682172775268555, -6.319156646728516, -6.070096015930176, -5.821035861968994, -5.571975231170654, -5.3229146003723145, -5.073854446411133, -4.824793815612793, -4.575733661651611, -4.3266730308532715, -4.07761287689209, -3.82855224609375, -3.5794918537139893, -3.3304314613342285, -3.0813710689544678, -2.832310676574707, -2.583250045776367, -2.3341898918151855, -2.0851292610168457, -1.836068868637085, -1.5870084762573242, -1.3379480838775635, -1.0888876914978027, -0.8398271799087524, -0.5907667875289917, -0.34170639514923096, -0.09264588356018066, 0.15641450881958008, 0.4054749011993408, 0.6545352935791016, 0.9035957455635071, 1.1526561975479126, 1.4017165899276733, 1.650776982307434, 1.8998374938964844, 2.148897886276245, 2.397958278656006, 2.6470186710357666, 2.8960790634155273, 3.145139694213867, 3.394199848175049, 3.6432604789733887, 3.8923208713531494, 4.14138126373291, 4.39044189453125, 4.63950252532959, 4.8885626792907715, 5.137623310089111, 5.386683464050293, 5.635744094848633, 5.884804725646973, 6.133864879608154, 6.382925033569336]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 10.0, 14.0, 6.0, 11.0, 15.0, 16.0, 16.0, 25.0, 32.0, 29.0, 36.0, 42.0, 28.0, 34.0, 53.0, 53.0, 37.0, 48.0, 53.0, 46.0, 34.0, 43.0, 47.0, 44.0, 28.0, 29.0, 34.0, 22.0, 20.0, 16.0, 14.0, 15.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.054889678955078, -4.903929710388184, -4.752969741821289, -4.6020097732543945, -4.4510498046875, -4.3000898361206055, -4.149129867553711, -3.9981696605682373, -3.8472096920013428, -3.6962497234344482, -3.5452897548675537, -3.394329786300659, -3.2433695793151855, -3.092409610748291, -2.9414496421813965, -2.790489673614502, -2.6395297050476074, -2.488569736480713, -2.3376097679138184, -2.186649799346924, -2.0356898307800293, -1.8847297430038452, -1.7337696552276611, -1.5828096866607666, -1.431849718093872, -1.2808897495269775, -1.129929780960083, -0.9789696931838989, -0.8280097246170044, -0.6770497560501099, -0.5260897278785706, -0.37512969970703125, -0.22416925430297852, -0.0732092559337616, 0.07775074243545532, 0.22871074080467224, 0.37967073917388916, 0.5306307077407837, 0.681590735912323, 0.8325507640838623, 0.9835107326507568, 1.1344707012176514, 1.285430669784546, 1.43639075756073, 1.5873507261276245, 1.738310694694519, 1.8892707824707031, 2.0402307510375977, 2.191190719604492, 2.3421506881713867, 2.4931106567382812, 2.644070625305176, 2.7950305938720703, 2.945990562438965, 3.0969507694244385, 3.247910737991333, 3.3988707065582275, 3.549830675125122, 3.7007906436920166, 3.851750612258911, 4.002710819244385, 4.153670787811279, 4.304630756378174, 4.455590724945068, 4.606550693511963]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 17.0, 20.0, 26.0, 55.0, 97.0, 138.0, 209.0, 346.0, 544.0, 954.0, 1622.0, 3017.0, 6498.0, 16393.0, 48724.0, 155216.0, 346434.0, 296861.0, 112238.0, 35457.0, 12366.0, 5225.0, 2544.0, 1430.0, 856.0, 501.0, 328.0, 157.0, 112.0, 59.0, 41.0, 16.0, 17.0, 14.0, 6.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.5975341796875, -7.351318359375, -7.1051025390625, -6.85888671875, -6.6126708984375, -6.366455078125, -6.1202392578125, -5.8740234375, -5.6278076171875, -5.381591796875, -5.1353759765625, -4.88916015625, -4.6429443359375, -4.396728515625, -4.1505126953125, -3.904296875, -3.6580810546875, -3.411865234375, -3.1656494140625, -2.91943359375, -2.6732177734375, -2.427001953125, -2.1807861328125, -1.9345703125, -1.6883544921875, -1.442138671875, -1.1959228515625, -0.94970703125, -0.7034912109375, -0.457275390625, -0.2110595703125, 0.03515625, 0.2813720703125, 0.527587890625, 0.7738037109375, 1.02001953125, 1.2662353515625, 1.512451171875, 1.7586669921875, 2.0048828125, 2.2510986328125, 2.497314453125, 2.7435302734375, 2.98974609375, 3.2359619140625, 3.482177734375, 3.7283935546875, 3.974609375, 4.2208251953125, 4.467041015625, 4.7132568359375, 4.95947265625, 5.2056884765625, 5.451904296875, 5.6981201171875, 5.9443359375, 6.1905517578125, 6.436767578125, 6.6829833984375, 6.92919921875, 7.1754150390625, 7.421630859375, 7.6678466796875, 7.9140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 12.0, 17.0, 18.0, 9.0, 15.0, 20.0, 28.0, 28.0, 29.0, 31.0, 28.0, 36.0, 35.0, 54.0, 44.0, 39.0, 35.0, 41.0, 55.0, 48.0, 39.0, 34.0, 36.0, 37.0, 32.0, 28.0, 27.0, 19.0, 12.0, 13.0, 17.0, 11.0, 9.0, 6.0, 12.0, 4.0, 11.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.23046875, -5.07958984375, -4.9287109375, -4.77783203125, -4.626953125, -4.47607421875, -4.3251953125, -4.17431640625, -4.0234375, -3.87255859375, -3.7216796875, -3.57080078125, -3.419921875, -3.26904296875, -3.1181640625, -2.96728515625, -2.81640625, -2.66552734375, -2.5146484375, -2.36376953125, -2.212890625, -2.06201171875, -1.9111328125, -1.76025390625, -1.609375, -1.45849609375, -1.3076171875, -1.15673828125, -1.005859375, -0.85498046875, -0.7041015625, -0.55322265625, -0.40234375, -0.25146484375, -0.1005859375, 0.05029296875, 0.201171875, 0.35205078125, 0.5029296875, 0.65380859375, 0.8046875, 0.95556640625, 1.1064453125, 1.25732421875, 1.408203125, 1.55908203125, 1.7099609375, 1.86083984375, 2.01171875, 2.16259765625, 2.3134765625, 2.46435546875, 2.615234375, 2.76611328125, 2.9169921875, 3.06787109375, 3.21875, 3.36962890625, 3.5205078125, 3.67138671875, 3.822265625, 3.97314453125, 4.1240234375, 4.27490234375, 4.42578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 6.0, 7.0, 10.0, 13.0, 14.0, 16.0, 26.0, 41.0, 45.0, 69.0, 93.0, 160.0, 218.0, 292.0, 526.0, 862.0, 1589.0, 3207.0, 7835.0, 27139.0, 129984.0, 494454.0, 297917.0, 59293.0, 14359.0, 5019.0, 2154.0, 1176.0, 678.0, 430.0, 270.0, 209.0, 133.0, 83.0, 50.0, 46.0, 31.0, 24.0, 19.0, 13.0, 15.0, 3.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.5086669921875, -11.134521484375, -10.7603759765625, -10.38623046875, -10.0120849609375, -9.637939453125, -9.2637939453125, -8.8896484375, -8.5155029296875, -8.141357421875, -7.7672119140625, -7.39306640625, -7.0189208984375, -6.644775390625, -6.2706298828125, -5.896484375, -5.5223388671875, -5.148193359375, -4.7740478515625, -4.39990234375, -4.0257568359375, -3.651611328125, -3.2774658203125, -2.9033203125, -2.5291748046875, -2.155029296875, -1.7808837890625, -1.40673828125, -1.0325927734375, -0.658447265625, -0.2843017578125, 0.08984375, 0.4639892578125, 0.838134765625, 1.2122802734375, 1.58642578125, 1.9605712890625, 2.334716796875, 2.7088623046875, 3.0830078125, 3.4571533203125, 3.831298828125, 4.2054443359375, 4.57958984375, 4.9537353515625, 5.327880859375, 5.7020263671875, 6.076171875, 6.4503173828125, 6.824462890625, 7.1986083984375, 7.57275390625, 7.9468994140625, 8.321044921875, 8.6951904296875, 9.0693359375, 9.4434814453125, 9.817626953125, 10.1917724609375, 10.56591796875, 10.9400634765625, 11.314208984375, 11.6883544921875, 12.0625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 3.0, 7.0, 10.0, 3.0, 14.0, 15.0, 21.0, 16.0, 24.0, 28.0, 23.0, 26.0, 37.0, 30.0, 30.0, 51.0, 40.0, 39.0, 32.0, 46.0, 40.0, 42.0, 46.0, 38.0, 34.0, 33.0, 33.0, 29.0, 32.0, 26.0, 22.0, 23.0, 23.0, 17.0, 11.0, 15.0, 11.0, 3.0, 2.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.849609375, -2.76300048828125, -2.6763916015625, -2.58978271484375, -2.503173828125, -2.41656494140625, -2.3299560546875, -2.24334716796875, -2.15673828125, -2.07012939453125, -1.9835205078125, -1.89691162109375, -1.810302734375, -1.72369384765625, -1.6370849609375, -1.55047607421875, -1.4638671875, -1.37725830078125, -1.2906494140625, -1.20404052734375, -1.117431640625, -1.03082275390625, -0.9442138671875, -0.85760498046875, -0.77099609375, -0.68438720703125, -0.5977783203125, -0.51116943359375, -0.424560546875, -0.33795166015625, -0.2513427734375, -0.16473388671875, -0.078125, 0.00848388671875, 0.0950927734375, 0.18170166015625, 0.268310546875, 0.35491943359375, 0.4415283203125, 0.52813720703125, 0.61474609375, 0.70135498046875, 0.7879638671875, 0.87457275390625, 0.961181640625, 1.04779052734375, 1.1343994140625, 1.22100830078125, 1.3076171875, 1.39422607421875, 1.4808349609375, 1.56744384765625, 1.654052734375, 1.74066162109375, 1.8272705078125, 1.91387939453125, 2.00048828125, 2.08709716796875, 2.1737060546875, 2.26031494140625, 2.346923828125, 2.43353271484375, 2.5201416015625, 2.60675048828125, 2.693359375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 13.0, 21.0, 20.0, 49.0, 51.0, 90.0, 122.0, 174.0, 237.0, 318.0, 418.0, 602.0, 884.0, 1235.0, 1923.0, 3001.0, 5226.0, 10858.0, 29419.0, 107388.0, 398762.0, 349485.0, 89227.0, 25670.0, 9736.0, 4894.0, 2743.0, 1846.0, 1216.0, 817.0, 601.0, 429.0, 322.0, 192.0, 153.0, 117.0, 89.0, 56.0, 40.0, 24.0, 25.0, 19.0, 11.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-6.20703125, -6.02935791015625, -5.8516845703125, -5.67401123046875, -5.496337890625, -5.31866455078125, -5.1409912109375, -4.96331787109375, -4.78564453125, -4.60797119140625, -4.4302978515625, -4.25262451171875, -4.074951171875, -3.89727783203125, -3.7196044921875, -3.54193115234375, -3.3642578125, -3.18658447265625, -3.0089111328125, -2.83123779296875, -2.653564453125, -2.47589111328125, -2.2982177734375, -2.12054443359375, -1.94287109375, -1.76519775390625, -1.5875244140625, -1.40985107421875, -1.232177734375, -1.05450439453125, -0.8768310546875, -0.69915771484375, -0.521484375, -0.34381103515625, -0.1661376953125, 0.01153564453125, 0.189208984375, 0.36688232421875, 0.5445556640625, 0.72222900390625, 0.89990234375, 1.07757568359375, 1.2552490234375, 1.43292236328125, 1.610595703125, 1.78826904296875, 1.9659423828125, 2.14361572265625, 2.3212890625, 2.49896240234375, 2.6766357421875, 2.85430908203125, 3.031982421875, 3.20965576171875, 3.3873291015625, 3.56500244140625, 3.74267578125, 3.92034912109375, 4.0980224609375, 4.27569580078125, 4.453369140625, 4.63104248046875, 4.8087158203125, 4.98638916015625, 5.1640625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 7.0, 15.0, 19.0, 33.0, 39.0, 54.0, 89.0, 110.0, 132.0, 118.0, 105.0, 81.0, 64.0, 32.0, 26.0, 15.0, 14.0, 7.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00034308433532714844, -0.0003342684358358383, -0.0003254525363445282, -0.0003166366368532181, -0.00030782073736190796, -0.00029900483787059784, -0.0002901889383792877, -0.0002813730388879776, -0.0002725571393966675, -0.00026374123990535736, -0.00025492534041404724, -0.0002461094409227371, -0.000237293541431427, -0.00022847764194011688, -0.00021966174244880676, -0.00021084584295749664, -0.00020202994346618652, -0.0001932140439748764, -0.00018439814448356628, -0.00017558224499225616, -0.00016676634550094604, -0.00015795044600963593, -0.0001491345465183258, -0.00014031864702701569, -0.00013150274753570557, -0.00012268684804439545, -0.00011387094855308533, -0.00010505504906177521, -9.623914957046509e-05, -8.742325007915497e-05, -7.860735058784485e-05, -6.979145109653473e-05, -6.097555160522461e-05, -5.215965211391449e-05, -4.334375262260437e-05, -3.452785313129425e-05, -2.571195363998413e-05, -1.689605414867401e-05, -8.080154657363892e-06, 7.35744833946228e-07, 9.551644325256348e-06, 1.8367543816566467e-05, 2.7183443307876587e-05, 3.5999342799186707e-05, 4.4815242290496826e-05, 5.3631141781806946e-05, 6.244704127311707e-05, 7.126294076442719e-05, 8.00788402557373e-05, 8.889473974704742e-05, 9.771063923835754e-05, 0.00010652653872966766, 0.00011534243822097778, 0.0001241583377122879, 0.00013297423720359802, 0.00014179013669490814, 0.00015060603618621826, 0.00015942193567752838, 0.0001682378351688385, 0.00017705373466014862, 0.00018586963415145874, 0.00019468553364276886, 0.00020350143313407898, 0.0002123173326253891, 0.00022113323211669922]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 13.0, 10.0, 15.0, 18.0, 44.0, 37.0, 59.0, 84.0, 113.0, 165.0, 213.0, 301.0, 434.0, 634.0, 1002.0, 1339.0, 2153.0, 3734.0, 6883.0, 16796.0, 59535.0, 241888.0, 449083.0, 188816.0, 45819.0, 13897.0, 5975.0, 3303.0, 2034.0, 1297.0, 836.0, 599.0, 420.0, 289.0, 206.0, 123.0, 99.0, 85.0, 47.0, 33.0, 34.0, 18.0, 21.0, 17.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.25, -5.08282470703125, -4.9156494140625, -4.74847412109375, -4.581298828125, -4.41412353515625, -4.2469482421875, -4.07977294921875, -3.91259765625, -3.74542236328125, -3.5782470703125, -3.41107177734375, -3.243896484375, -3.07672119140625, -2.9095458984375, -2.74237060546875, -2.5751953125, -2.40802001953125, -2.2408447265625, -2.07366943359375, -1.906494140625, -1.73931884765625, -1.5721435546875, -1.40496826171875, -1.23779296875, -1.07061767578125, -0.9034423828125, -0.73626708984375, -0.569091796875, -0.40191650390625, -0.2347412109375, -0.06756591796875, 0.099609375, 0.26678466796875, 0.4339599609375, 0.60113525390625, 0.768310546875, 0.93548583984375, 1.1026611328125, 1.26983642578125, 1.43701171875, 1.60418701171875, 1.7713623046875, 1.93853759765625, 2.105712890625, 2.27288818359375, 2.4400634765625, 2.60723876953125, 2.7744140625, 2.94158935546875, 3.1087646484375, 3.27593994140625, 3.443115234375, 3.61029052734375, 3.7774658203125, 3.94464111328125, 4.11181640625, 4.27899169921875, 4.4461669921875, 4.61334228515625, 4.780517578125, 4.94769287109375, 5.1148681640625, 5.28204345703125, 5.44921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 8.0, 24.0, 41.0, 65.0, 121.0, 142.0, 161.0, 124.0, 110.0, 76.0, 42.0, 27.0, 19.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.296051025390625, -1.24542236328125, -1.194793701171875, -1.1441650390625, -1.093536376953125, -1.04290771484375, -0.992279052734375, -0.941650390625, -0.891021728515625, -0.84039306640625, -0.789764404296875, -0.7391357421875, -0.688507080078125, -0.63787841796875, -0.587249755859375, -0.53662109375, -0.485992431640625, -0.43536376953125, -0.384735107421875, -0.3341064453125, -0.283477783203125, -0.23284912109375, -0.182220458984375, -0.131591796875, -0.080963134765625, -0.03033447265625, 0.020294189453125, 0.0709228515625, 0.121551513671875, 0.17218017578125, 0.222808837890625, 0.2734375, 0.324066162109375, 0.37469482421875, 0.425323486328125, 0.4759521484375, 0.526580810546875, 0.57720947265625, 0.627838134765625, 0.678466796875, 0.729095458984375, 0.77972412109375, 0.830352783203125, 0.8809814453125, 0.931610107421875, 0.98223876953125, 1.032867431640625, 1.08349609375, 1.134124755859375, 1.18475341796875, 1.235382080078125, 1.2860107421875, 1.336639404296875, 1.38726806640625, 1.437896728515625, 1.488525390625, 1.539154052734375, 1.58978271484375, 1.640411376953125, 1.6910400390625, 1.741668701171875, 1.79229736328125, 1.842926025390625, 1.8935546875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 13.0, 9.0, 9.0, 14.0, 7.0, 8.0, 24.0, 20.0, 34.0, 41.0, 59.0, 49.0, 52.0, 68.0, 65.0, 69.0, 73.0, 72.0, 55.0, 47.0, 40.0, 31.0, 25.0, 26.0, 17.0, 17.0, 13.0, 11.0, 14.0, 3.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.574878692626953, -9.324416160583496, -9.073952674865723, -8.823490142822266, -8.573026657104492, -8.322564125061035, -8.072100639343262, -7.821638107299805, -7.5711750984191895, -7.320712089538574, -7.070249080657959, -6.819786071777344, -6.569323539733887, -6.318860054016113, -6.068397521972656, -5.817934513092041, -5.567471504211426, -5.3170084953308105, -5.066545486450195, -4.81608247756958, -4.565619468688965, -4.315156936645508, -4.064693927764893, -3.8142309188842773, -3.563767910003662, -3.313304901123047, -3.0628418922424316, -2.8123791217803955, -2.5619161128997803, -2.311453104019165, -2.060990333557129, -1.8105273246765137, -1.560063362121582, -1.3096003532409668, -1.0591374635696411, -0.8086745142936707, -0.5582115650177002, -0.30774855613708496, -0.05728566646575928, 0.1931772232055664, 0.44364023208618164, 0.6941031813621521, 0.9445661306381226, 1.1950290203094482, 1.4454920291900635, 1.6959550380706787, 1.9464179277420044, 2.19688081741333, 2.4473438262939453, 2.6978068351745605, 2.948269844055176, 3.198732614517212, 3.449195623397827, 3.6996586322784424, 3.9501214027404785, 4.200584411621094, 4.451047420501709, 4.701510429382324, 4.9519734382629395, 5.202436447143555, 5.452898979187012, 5.703362464904785, 5.953824996948242, 6.204288005828857, 6.454751014709473]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 14.0, 9.0, 15.0, 18.0, 24.0, 25.0, 27.0, 40.0, 28.0, 29.0, 32.0, 50.0, 40.0, 56.0, 47.0, 47.0, 46.0, 38.0, 40.0, 40.0, 45.0, 29.0, 37.0, 34.0, 24.0, 25.0, 18.0, 18.0, 13.0, 13.0, 10.0, 11.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.813549041748047, -4.668715476989746, -4.523881912231445, -4.379047870635986, -4.2342143058776855, -4.089380741119385, -3.944546937942505, -3.799713134765625, -3.654879570007324, -3.5100460052490234, -3.3652122020721436, -3.2203783988952637, -3.075544834136963, -2.930711269378662, -2.7858774662017822, -2.6410436630249023, -2.4962100982666016, -2.351376533508301, -2.206542730331421, -2.061708927154541, -1.9168753623962402, -1.77204167842865, -1.6272079944610596, -1.4823743104934692, -1.337540626525879, -1.1927069425582886, -1.0478732585906982, -0.9030395746231079, -0.7582058906555176, -0.6133722066879272, -0.4685385227203369, -0.3237048387527466, -0.17887163162231445, -0.03403794765472412, 0.11079573631286621, 0.25562942028045654, 0.4004631042480469, 0.5452967882156372, 0.6901304721832275, 0.8349641561508179, 0.9797978401184082, 1.1246315240859985, 1.2694652080535889, 1.4142988920211792, 1.5591325759887695, 1.7039662599563599, 1.8487999439239502, 1.9936336278915405, 2.138467311859131, 2.2833008766174316, 2.4281346797943115, 2.5729684829711914, 2.717802047729492, 2.862635612487793, 3.007469415664673, 3.1523032188415527, 3.2971367835998535, 3.4419703483581543, 3.586804151535034, 3.731637954711914, 3.876471519470215, 4.021305084228516, 4.166138648986816, 4.310972690582275, 4.455806255340576]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 13.0, 19.0, 23.0, 42.0, 59.0, 88.0, 151.0, 216.0, 388.0, 632.0, 1102.0, 1817.0, 3176.0, 5523.0, 9538.0, 16531.0, 28602.0, 48671.0, 79318.0, 119164.0, 156694.0, 167841.0, 144587.0, 103323.0, 66071.0, 39855.0, 23049.0, 13260.0, 7693.0, 4528.0, 2624.0, 1533.0, 941.0, 585.0, 343.0, 197.0, 140.0, 75.0, 48.0, 34.0, 16.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.92578125, -5.73651123046875, -5.5472412109375, -5.35797119140625, -5.168701171875, -4.97943115234375, -4.7901611328125, -4.60089111328125, -4.41162109375, -4.22235107421875, -4.0330810546875, -3.84381103515625, -3.654541015625, -3.46527099609375, -3.2760009765625, -3.08673095703125, -2.8974609375, -2.70819091796875, -2.5189208984375, -2.32965087890625, -2.140380859375, -1.95111083984375, -1.7618408203125, -1.57257080078125, -1.38330078125, -1.19403076171875, -1.0047607421875, -0.81549072265625, -0.626220703125, -0.43695068359375, -0.2476806640625, -0.05841064453125, 0.130859375, 0.32012939453125, 0.5093994140625, 0.69866943359375, 0.887939453125, 1.07720947265625, 1.2664794921875, 1.45574951171875, 1.64501953125, 1.83428955078125, 2.0235595703125, 2.21282958984375, 2.402099609375, 2.59136962890625, 2.7806396484375, 2.96990966796875, 3.1591796875, 3.34844970703125, 3.5377197265625, 3.72698974609375, 3.916259765625, 4.10552978515625, 4.2947998046875, 4.48406982421875, 4.67333984375, 4.86260986328125, 5.0518798828125, 5.24114990234375, 5.430419921875, 5.61968994140625, 5.8089599609375, 5.99822998046875, 6.1875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 6.0, 9.0, 12.0, 13.0, 14.0, 19.0, 20.0, 26.0, 47.0, 47.0, 30.0, 41.0, 49.0, 43.0, 46.0, 37.0, 51.0, 48.0, 48.0, 39.0, 49.0, 46.0, 37.0, 38.0, 41.0, 21.0, 16.0, 10.0, 16.0, 15.0, 8.0, 12.0, 7.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0390625, -5.871826171875, -5.70458984375, -5.537353515625, -5.3701171875, -5.202880859375, -5.03564453125, -4.868408203125, -4.701171875, -4.533935546875, -4.36669921875, -4.199462890625, -4.0322265625, -3.864990234375, -3.69775390625, -3.530517578125, -3.36328125, -3.196044921875, -3.02880859375, -2.861572265625, -2.6943359375, -2.527099609375, -2.35986328125, -2.192626953125, -2.025390625, -1.858154296875, -1.69091796875, -1.523681640625, -1.3564453125, -1.189208984375, -1.02197265625, -0.854736328125, -0.6875, -0.520263671875, -0.35302734375, -0.185791015625, -0.0185546875, 0.148681640625, 0.31591796875, 0.483154296875, 0.650390625, 0.817626953125, 0.98486328125, 1.152099609375, 1.3193359375, 1.486572265625, 1.65380859375, 1.821044921875, 1.98828125, 2.155517578125, 2.32275390625, 2.489990234375, 2.6572265625, 2.824462890625, 2.99169921875, 3.158935546875, 3.326171875, 3.493408203125, 3.66064453125, 3.827880859375, 3.9951171875, 4.162353515625, 4.32958984375, 4.496826171875, 4.6640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 20.0, 19.0, 31.0, 59.0, 87.0, 148.0, 206.0, 308.0, 525.0, 827.0, 1272.0, 2216.0, 3550.0, 5508.0, 9165.0, 15202.0, 24330.0, 39645.0, 61824.0, 91586.0, 125363.0, 148392.0, 147086.0, 123055.0, 89135.0, 59672.0, 37857.0, 23730.0, 14406.0, 8977.0, 5401.0, 3365.0, 2047.0, 1318.0, 825.0, 484.0, 313.0, 216.0, 137.0, 95.0, 41.0, 30.0, 19.0, 16.0, 11.0, 9.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.23828125, -5.069091796875, -4.89990234375, -4.730712890625, -4.5615234375, -4.392333984375, -4.22314453125, -4.053955078125, -3.884765625, -3.715576171875, -3.54638671875, -3.377197265625, -3.2080078125, -3.038818359375, -2.86962890625, -2.700439453125, -2.53125, -2.362060546875, -2.19287109375, -2.023681640625, -1.8544921875, -1.685302734375, -1.51611328125, -1.346923828125, -1.177734375, -1.008544921875, -0.83935546875, -0.670166015625, -0.5009765625, -0.331787109375, -0.16259765625, 0.006591796875, 0.17578125, 0.344970703125, 0.51416015625, 0.683349609375, 0.8525390625, 1.021728515625, 1.19091796875, 1.360107421875, 1.529296875, 1.698486328125, 1.86767578125, 2.036865234375, 2.2060546875, 2.375244140625, 2.54443359375, 2.713623046875, 2.8828125, 3.052001953125, 3.22119140625, 3.390380859375, 3.5595703125, 3.728759765625, 3.89794921875, 4.067138671875, 4.236328125, 4.405517578125, 4.57470703125, 4.743896484375, 4.9130859375, 5.082275390625, 5.25146484375, 5.420654296875, 5.58984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 10.0, 7.0, 7.0, 6.0, 11.0, 10.0, 20.0, 19.0, 17.0, 31.0, 16.0, 28.0, 37.0, 33.0, 35.0, 30.0, 39.0, 18.0, 58.0, 43.0, 51.0, 46.0, 42.0, 25.0, 33.0, 45.0, 28.0, 28.0, 25.0, 26.0, 28.0, 21.0, 27.0, 11.0, 21.0, 12.0, 12.0, 14.0, 13.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.317108154296875, -2.22991943359375, -2.142730712890625, -2.0555419921875, -1.968353271484375, -1.88116455078125, -1.793975830078125, -1.706787109375, -1.619598388671875, -1.53240966796875, -1.445220947265625, -1.3580322265625, -1.270843505859375, -1.18365478515625, -1.096466064453125, -1.00927734375, -0.922088623046875, -0.83489990234375, -0.747711181640625, -0.6605224609375, -0.573333740234375, -0.48614501953125, -0.398956298828125, -0.311767578125, -0.224578857421875, -0.13739013671875, -0.050201416015625, 0.0369873046875, 0.124176025390625, 0.21136474609375, 0.298553466796875, 0.3857421875, 0.472930908203125, 0.56011962890625, 0.647308349609375, 0.7344970703125, 0.821685791015625, 0.90887451171875, 0.996063232421875, 1.083251953125, 1.170440673828125, 1.25762939453125, 1.344818115234375, 1.4320068359375, 1.519195556640625, 1.60638427734375, 1.693572998046875, 1.78076171875, 1.867950439453125, 1.95513916015625, 2.042327880859375, 2.1295166015625, 2.216705322265625, 2.30389404296875, 2.391082763671875, 2.478271484375, 2.565460205078125, 2.65264892578125, 2.739837646484375, 2.8270263671875, 2.914215087890625, 3.00140380859375, 3.088592529296875, 3.17578125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 11.0, 16.0, 29.0, 36.0, 46.0, 54.0, 96.0, 126.0, 159.0, 264.0, 307.0, 502.0, 831.0, 1214.0, 1787.0, 2866.0, 4474.0, 7094.0, 11728.0, 20014.0, 33681.0, 58642.0, 100761.0, 161113.0, 202817.0, 171347.0, 110476.0, 64326.0, 37089.0, 21792.0, 12988.0, 7878.0, 4964.0, 3129.0, 1977.0, 1266.0, 832.0, 578.0, 384.0, 241.0, 170.0, 141.0, 80.0, 67.0, 46.0, 31.0, 24.0, 18.0, 8.0, 9.0, 7.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-3.78515625, -3.66900634765625, -3.5528564453125, -3.43670654296875, -3.320556640625, -3.20440673828125, -3.0882568359375, -2.97210693359375, -2.85595703125, -2.73980712890625, -2.6236572265625, -2.50750732421875, -2.391357421875, -2.27520751953125, -2.1590576171875, -2.04290771484375, -1.9267578125, -1.81060791015625, -1.6944580078125, -1.57830810546875, -1.462158203125, -1.34600830078125, -1.2298583984375, -1.11370849609375, -0.99755859375, -0.88140869140625, -0.7652587890625, -0.64910888671875, -0.532958984375, -0.41680908203125, -0.3006591796875, -0.18450927734375, -0.068359375, 0.04779052734375, 0.1639404296875, 0.28009033203125, 0.396240234375, 0.51239013671875, 0.6285400390625, 0.74468994140625, 0.86083984375, 0.97698974609375, 1.0931396484375, 1.20928955078125, 1.325439453125, 1.44158935546875, 1.5577392578125, 1.67388916015625, 1.7900390625, 1.90618896484375, 2.0223388671875, 2.13848876953125, 2.254638671875, 2.37078857421875, 2.4869384765625, 2.60308837890625, 2.71923828125, 2.83538818359375, 2.9515380859375, 3.06768798828125, 3.183837890625, 3.29998779296875, 3.4161376953125, 3.53228759765625, 3.6484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 4.0, 6.0, 1.0, 11.0, 7.0, 14.0, 21.0, 26.0, 33.0, 40.0, 40.0, 53.0, 85.0, 78.0, 93.0, 98.0, 83.0, 66.0, 51.0, 33.0, 43.0, 28.0, 18.0, 11.0, 7.0, 10.0, 13.0, 6.0, 6.0, 0.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005068778991699219, -0.0004900619387626648, -0.0004732459783554077, -0.00045643001794815063, -0.00043961405754089355, -0.0004227980971336365, -0.0004059821367263794, -0.0003891661763191223, -0.00037235021591186523, -0.00035553425550460815, -0.0003387182950973511, -0.000321902334690094, -0.0003050863742828369, -0.00028827041387557983, -0.00027145445346832275, -0.0002546384930610657, -0.0002378225326538086, -0.00022100657224655151, -0.00020419061183929443, -0.00018737465143203735, -0.00017055869102478027, -0.0001537427306175232, -0.0001369267702102661, -0.00012011080980300903, -0.00010329484939575195, -8.647888898849487e-05, -6.966292858123779e-05, -5.284696817398071e-05, -3.603100776672363e-05, -1.9215047359466553e-05, -2.3990869522094727e-06, 1.4416873455047607e-05, 3.123283386230469e-05, 4.804879426956177e-05, 6.486475467681885e-05, 8.168071508407593e-05, 9.849667549133301e-05, 0.00011531263589859009, 0.00013212859630584717, 0.00014894455671310425, 0.00016576051712036133, 0.0001825764775276184, 0.0001993924379348755, 0.00021620839834213257, 0.00023302435874938965, 0.00024984031915664673, 0.0002666562795639038, 0.0002834722399711609, 0.00030028820037841797, 0.00031710416078567505, 0.00033392012119293213, 0.0003507360816001892, 0.0003675520420074463, 0.00038436800241470337, 0.00040118396282196045, 0.00041799992322921753, 0.0004348158836364746, 0.0004516318440437317, 0.00046844780445098877, 0.00048526376485824585, 0.0005020797252655029, 0.00051889568567276, 0.0005357116460800171, 0.0005525276064872742, 0.0005693435668945312]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 13.0, 24.0, 27.0, 44.0, 69.0, 87.0, 129.0, 184.0, 276.0, 417.0, 609.0, 866.0, 1274.0, 2065.0, 3136.0, 4814.0, 7663.0, 11909.0, 18932.0, 30810.0, 49512.0, 78120.0, 117995.0, 156701.0, 166455.0, 136771.0, 95694.0, 61203.0, 38085.0, 23580.0, 14794.0, 9219.0, 5823.0, 3700.0, 2502.0, 1580.0, 1103.0, 781.0, 479.0, 315.0, 245.0, 175.0, 101.0, 80.0, 56.0, 41.0, 23.0, 22.0, 15.0, 14.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.765625, -2.6798095703125, -2.593994140625, -2.5081787109375, -2.42236328125, -2.3365478515625, -2.250732421875, -2.1649169921875, -2.0791015625, -1.9932861328125, -1.907470703125, -1.8216552734375, -1.73583984375, -1.6500244140625, -1.564208984375, -1.4783935546875, -1.392578125, -1.3067626953125, -1.220947265625, -1.1351318359375, -1.04931640625, -0.9635009765625, -0.877685546875, -0.7918701171875, -0.7060546875, -0.6202392578125, -0.534423828125, -0.4486083984375, -0.36279296875, -0.2769775390625, -0.191162109375, -0.1053466796875, -0.01953125, 0.0662841796875, 0.152099609375, 0.2379150390625, 0.32373046875, 0.4095458984375, 0.495361328125, 0.5811767578125, 0.6669921875, 0.7528076171875, 0.838623046875, 0.9244384765625, 1.01025390625, 1.0960693359375, 1.181884765625, 1.2677001953125, 1.353515625, 1.4393310546875, 1.525146484375, 1.6109619140625, 1.69677734375, 1.7825927734375, 1.868408203125, 1.9542236328125, 2.0400390625, 2.1258544921875, 2.211669921875, 2.2974853515625, 2.38330078125, 2.4691162109375, 2.554931640625, 2.6407470703125, 2.7265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 12.0, 13.0, 14.0, 10.0, 14.0, 16.0, 21.0, 21.0, 25.0, 32.0, 32.0, 21.0, 51.0, 59.0, 61.0, 54.0, 57.0, 56.0, 47.0, 50.0, 51.0, 49.0, 38.0, 32.0, 21.0, 18.0, 13.0, 21.0, 18.0, 14.0, 10.0, 10.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98486328125, -0.956817626953125, -0.92877197265625, -0.900726318359375, -0.8726806640625, -0.844635009765625, -0.81658935546875, -0.788543701171875, -0.760498046875, -0.732452392578125, -0.70440673828125, -0.676361083984375, -0.6483154296875, -0.620269775390625, -0.59222412109375, -0.564178466796875, -0.5361328125, -0.508087158203125, -0.48004150390625, -0.451995849609375, -0.4239501953125, -0.395904541015625, -0.36785888671875, -0.339813232421875, -0.311767578125, -0.283721923828125, -0.25567626953125, -0.227630615234375, -0.1995849609375, -0.171539306640625, -0.14349365234375, -0.115447998046875, -0.08740234375, -0.059356689453125, -0.03131103515625, -0.003265380859375, 0.0247802734375, 0.052825927734375, 0.08087158203125, 0.108917236328125, 0.136962890625, 0.165008544921875, 0.19305419921875, 0.221099853515625, 0.2491455078125, 0.277191162109375, 0.30523681640625, 0.333282470703125, 0.361328125, 0.389373779296875, 0.41741943359375, 0.445465087890625, 0.4735107421875, 0.501556396484375, 0.52960205078125, 0.557647705078125, 0.585693359375, 0.613739013671875, 0.64178466796875, 0.669830322265625, 0.6978759765625, 0.725921630859375, 0.75396728515625, 0.782012939453125, 0.81005859375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 1.0, 6.0, 5.0, 8.0, 14.0, 11.0, 25.0, 17.0, 32.0, 28.0, 42.0, 42.0, 76.0, 69.0, 66.0, 78.0, 68.0, 65.0, 73.0, 50.0, 41.0, 43.0, 27.0, 28.0, 15.0, 16.0, 16.0, 10.0, 12.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.663951873779297, -9.392720222473145, -9.121489524841309, -8.850257873535156, -8.57902717590332, -8.307795524597168, -8.036564826965332, -7.76533317565918, -7.4941020011901855, -7.222870826721191, -6.951639652252197, -6.680408477783203, -6.409176826477051, -6.137946128845215, -5.8667144775390625, -5.595483303070068, -5.324252128601074, -5.05302095413208, -4.781789779663086, -4.510558605194092, -4.239327430725098, -3.9680960178375244, -3.696864604949951, -3.425633430480957, -3.154402256011963, -2.8831710815429688, -2.6119399070739746, -2.3407084941864014, -2.0694773197174072, -1.798246145248413, -1.5270148515701294, -1.2557835578918457, -0.9845523834228516, -0.7133211493492126, -0.44208991527557373, -0.17085868120193481, 0.1003725528717041, 0.37160372734069824, 0.6428350210189819, 0.9140663146972656, 1.1852974891662598, 1.456528663635254, 1.7277599573135376, 1.9989912509918213, 2.2702224254608154, 2.5414535999298096, 2.812685012817383, 3.083916187286377, 3.355147361755371, 3.6263785362243652, 3.8976097106933594, 4.1688408851623535, 4.440072059631348, 4.7113037109375, 4.982534885406494, 5.253766059875488, 5.524997234344482, 5.796228408813477, 6.067459583282471, 6.338690757751465, 6.609922409057617, 6.881153106689453, 7.1523847579956055, 7.4236159324646, 7.694847106933594]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 4.0, 6.0, 9.0, 7.0, 9.0, 11.0, 13.0, 14.0, 20.0, 16.0, 28.0, 28.0, 19.0, 29.0, 25.0, 29.0, 24.0, 46.0, 33.0, 33.0, 47.0, 53.0, 48.0, 34.0, 43.0, 48.0, 37.0, 37.0, 44.0, 20.0, 30.0, 30.0, 22.0, 13.0, 19.0, 8.0, 13.0, 11.0, 5.0, 5.0, 8.0, 3.0, 2.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.654512405395508, -4.511689186096191, -4.368866443634033, -4.226043701171875, -4.083220481872559, -3.9403975009918213, -3.797574520111084, -3.6547515392303467, -3.5119285583496094, -3.369105577468872, -3.2262825965881348, -3.0834596157073975, -2.94063663482666, -2.797813653945923, -2.6549906730651855, -2.5121676921844482, -2.369344711303711, -2.2265217304229736, -2.0836987495422363, -1.940875768661499, -1.7980527877807617, -1.6552298069000244, -1.512406826019287, -1.3695838451385498, -1.2267608642578125, -1.0839378833770752, -0.9411149024963379, -0.7982919216156006, -0.6554689407348633, -0.512645959854126, -0.36982297897338867, -0.22699999809265137, -0.08417701721191406, 0.05864596366882324, 0.20146894454956055, 0.34429192543029785, 0.48711490631103516, 0.6299378871917725, 0.7727608680725098, 0.9155838489532471, 1.0584068298339844, 1.2012298107147217, 1.344052791595459, 1.4868757724761963, 1.6296987533569336, 1.772521734237671, 1.9153447151184082, 2.0581676959991455, 2.200990676879883, 2.34381365776062, 2.4866366386413574, 2.6294596195220947, 2.772282600402832, 2.9151055812835693, 3.0579285621643066, 3.200751543045044, 3.3435745239257812, 3.4863975048065186, 3.629220485687256, 3.772043466567993, 3.9148664474487305, 4.057689666748047, 4.200512409210205, 4.343335151672363, 4.48615837097168]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 13.0, 14.0, 14.0, 13.0, 25.0, 23.0, 44.0, 69.0, 103.0, 145.0, 241.0, 360.0, 555.0, 869.0, 1363.0, 2071.0, 3452.0, 6011.0, 10622.0, 19694.0, 38070.0, 80232.0, 181578.0, 438830.0, 983108.0, 1217101.0, 691316.0, 283790.0, 119806.0, 54357.0, 27003.0, 13981.0, 7842.0, 4333.0, 2708.0, 1544.0, 1049.0, 667.0, 435.0, 287.0, 188.0, 118.0, 74.0, 59.0, 37.0, 30.0, 15.0, 10.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.5078125, -8.2664794921875, -8.025146484375, -7.7838134765625, -7.54248046875, -7.3011474609375, -7.059814453125, -6.8184814453125, -6.5771484375, -6.3358154296875, -6.094482421875, -5.8531494140625, -5.61181640625, -5.3704833984375, -5.129150390625, -4.8878173828125, -4.646484375, -4.4051513671875, -4.163818359375, -3.9224853515625, -3.68115234375, -3.4398193359375, -3.198486328125, -2.9571533203125, -2.7158203125, -2.4744873046875, -2.233154296875, -1.9918212890625, -1.75048828125, -1.5091552734375, -1.267822265625, -1.0264892578125, -0.78515625, -0.5438232421875, -0.302490234375, -0.0611572265625, 0.18017578125, 0.4215087890625, 0.662841796875, 0.9041748046875, 1.1455078125, 1.3868408203125, 1.628173828125, 1.8695068359375, 2.11083984375, 2.3521728515625, 2.593505859375, 2.8348388671875, 3.076171875, 3.3175048828125, 3.558837890625, 3.8001708984375, 4.04150390625, 4.2828369140625, 4.524169921875, 4.7655029296875, 5.0068359375, 5.2481689453125, 5.489501953125, 5.7308349609375, 5.97216796875, 6.2135009765625, 6.454833984375, 6.6961669921875, 6.9375]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 9.0, 6.0, 9.0, 12.0, 14.0, 12.0, 9.0, 21.0, 25.0, 20.0, 30.0, 23.0, 33.0, 38.0, 28.0, 42.0, 38.0, 46.0, 40.0, 37.0, 47.0, 45.0, 41.0, 49.0, 41.0, 41.0, 32.0, 34.0, 32.0, 19.0, 22.0, 20.0, 16.0, 17.0, 7.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.859375, -3.742156982421875, -3.62493896484375, -3.507720947265625, -3.3905029296875, -3.273284912109375, -3.15606689453125, -3.038848876953125, -2.921630859375, -2.804412841796875, -2.68719482421875, -2.569976806640625, -2.4527587890625, -2.335540771484375, -2.21832275390625, -2.101104736328125, -1.98388671875, -1.866668701171875, -1.74945068359375, -1.632232666015625, -1.5150146484375, -1.397796630859375, -1.28057861328125, -1.163360595703125, -1.046142578125, -0.928924560546875, -0.81170654296875, -0.694488525390625, -0.5772705078125, -0.460052490234375, -0.34283447265625, -0.225616455078125, -0.1083984375, 0.008819580078125, 0.12603759765625, 0.243255615234375, 0.3604736328125, 0.477691650390625, 0.59490966796875, 0.712127685546875, 0.829345703125, 0.946563720703125, 1.06378173828125, 1.180999755859375, 1.2982177734375, 1.415435791015625, 1.53265380859375, 1.649871826171875, 1.76708984375, 1.884307861328125, 2.00152587890625, 2.118743896484375, 2.2359619140625, 2.353179931640625, 2.47039794921875, 2.587615966796875, 2.704833984375, 2.822052001953125, 2.93927001953125, 3.056488037109375, 3.1737060546875, 3.290924072265625, 3.40814208984375, 3.525360107421875, 3.642578125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 12.0, 18.0, 33.0, 50.0, 53.0, 86.0, 136.0, 176.0, 321.0, 443.0, 712.0, 1053.0, 1654.0, 2668.0, 4565.0, 7420.0, 12637.0, 22416.0, 40549.0, 74570.0, 142518.0, 280222.0, 551928.0, 940688.0, 945837.0, 560994.0, 285820.0, 145229.0, 75427.0, 40962.0, 22483.0, 12798.0, 7743.0, 4575.0, 2733.0, 1712.0, 1074.0, 668.0, 443.0, 278.0, 163.0, 135.0, 89.0, 64.0, 32.0, 35.0, 16.0, 17.0, 2.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8984375, -6.6685791015625, -6.438720703125, -6.2088623046875, -5.97900390625, -5.7491455078125, -5.519287109375, -5.2894287109375, -5.0595703125, -4.8297119140625, -4.599853515625, -4.3699951171875, -4.14013671875, -3.9102783203125, -3.680419921875, -3.4505615234375, -3.220703125, -2.9908447265625, -2.760986328125, -2.5311279296875, -2.30126953125, -2.0714111328125, -1.841552734375, -1.6116943359375, -1.3818359375, -1.1519775390625, -0.922119140625, -0.6922607421875, -0.46240234375, -0.2325439453125, -0.002685546875, 0.2271728515625, 0.45703125, 0.6868896484375, 0.916748046875, 1.1466064453125, 1.37646484375, 1.6063232421875, 1.836181640625, 2.0660400390625, 2.2958984375, 2.5257568359375, 2.755615234375, 2.9854736328125, 3.21533203125, 3.4451904296875, 3.675048828125, 3.9049072265625, 4.134765625, 4.3646240234375, 4.594482421875, 4.8243408203125, 5.05419921875, 5.2840576171875, 5.513916015625, 5.7437744140625, 5.9736328125, 6.2034912109375, 6.433349609375, 6.6632080078125, 6.89306640625, 7.1229248046875, 7.352783203125, 7.5826416015625, 7.8125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 10.0, 13.0, 13.0, 32.0, 29.0, 36.0, 53.0, 68.0, 86.0, 101.0, 125.0, 160.0, 190.0, 247.0, 252.0, 272.0, 315.0, 312.0, 300.0, 255.0, 216.0, 232.0, 165.0, 114.0, 102.0, 92.0, 61.0, 46.0, 30.0, 26.0, 21.0, 17.0, 16.0, 11.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.728515625, -2.654571533203125, -2.58062744140625, -2.506683349609375, -2.4327392578125, -2.358795166015625, -2.28485107421875, -2.210906982421875, -2.136962890625, -2.063018798828125, -1.98907470703125, -1.915130615234375, -1.8411865234375, -1.767242431640625, -1.69329833984375, -1.619354248046875, -1.54541015625, -1.471466064453125, -1.39752197265625, -1.323577880859375, -1.2496337890625, -1.175689697265625, -1.10174560546875, -1.027801513671875, -0.953857421875, -0.879913330078125, -0.80596923828125, -0.732025146484375, -0.6580810546875, -0.584136962890625, -0.51019287109375, -0.436248779296875, -0.3623046875, -0.288360595703125, -0.21441650390625, -0.140472412109375, -0.0665283203125, 0.007415771484375, 0.08135986328125, 0.155303955078125, 0.229248046875, 0.303192138671875, 0.37713623046875, 0.451080322265625, 0.5250244140625, 0.598968505859375, 0.67291259765625, 0.746856689453125, 0.82080078125, 0.894744873046875, 0.96868896484375, 1.042633056640625, 1.1165771484375, 1.190521240234375, 1.26446533203125, 1.338409423828125, 1.412353515625, 1.486297607421875, 1.56024169921875, 1.634185791015625, 1.7081298828125, 1.782073974609375, 1.85601806640625, 1.929962158203125, 2.00390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 9.0, 9.0, 10.0, 9.0, 17.0, 18.0, 17.0, 30.0, 30.0, 36.0, 38.0, 49.0, 67.0, 63.0, 66.0, 56.0, 68.0, 62.0, 58.0, 46.0, 40.0, 37.0, 41.0, 22.0, 22.0, 17.0, 13.0, 15.0, 12.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.27569580078125, -8.019668579101562, -7.763640880584717, -7.507613182067871, -7.251585960388184, -6.995558261871338, -6.739530563354492, -6.483503341674805, -6.227475643157959, -5.971447944641113, -5.715420722961426, -5.45939302444458, -5.203365325927734, -4.947338104248047, -4.691310405731201, -4.4352827072143555, -4.179255485534668, -3.9232280254364014, -3.6672005653381348, -3.411172866821289, -3.1551454067230225, -2.899117946624756, -2.64309024810791, -2.3870627880096436, -2.131035327911377, -1.8750078678131104, -1.6189802885055542, -1.362952709197998, -1.1069252490997314, -0.8508977890014648, -0.5948702096939087, -0.33884263038635254, -0.08281517028808594, 0.17321234941482544, 0.4292398691177368, 0.6852673888206482, 0.9412949085235596, 1.1973223686218262, 1.4533499479293823, 1.7093775272369385, 1.965404987335205, 2.2214324474334717, 2.4774599075317383, 2.733487606048584, 2.9895150661468506, 3.245542526245117, 3.501570224761963, 3.7575976848602295, 4.013625144958496, 4.269652843475342, 4.525680065155029, 4.781707763671875, 5.0377349853515625, 5.293762683868408, 5.549790382385254, 5.805817604064941, 6.061845302581787, 6.317873001098633, 6.57390022277832, 6.829927921295166, 7.085955619812012, 7.341982841491699, 7.598010540008545, 7.854038238525391, 8.110065460205078]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 1.0, 11.0, 8.0, 6.0, 8.0, 22.0, 15.0, 13.0, 25.0, 23.0, 27.0, 32.0, 30.0, 32.0, 28.0, 35.0, 48.0, 35.0, 41.0, 40.0, 51.0, 53.0, 45.0, 48.0, 36.0, 34.0, 33.0, 28.0, 36.0, 26.0, 18.0, 19.0, 13.0, 15.0, 12.0, 11.0, 12.0, 5.0, 5.0, 10.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.571853160858154, -4.4191575050354, -4.266462326049805, -4.113766670227051, -3.961071252822876, -3.808375835418701, -3.6556801795959473, -3.5029847621917725, -3.3502893447875977, -3.197593927383423, -3.044898509979248, -2.892202854156494, -2.7395074367523193, -2.5868120193481445, -2.4341163635253906, -2.281420946121216, -2.128725528717041, -1.9760301113128662, -1.8233345746994019, -1.6706390380859375, -1.5179436206817627, -1.365248203277588, -1.2125526666641235, -1.0598571300506592, -0.9071617126464844, -0.7544662356376648, -0.6017707586288452, -0.44907528162002563, -0.29637980461120605, -0.14368432760238647, 0.009011149406433105, 0.16170668601989746, 0.31440258026123047, 0.46709805727005005, 0.6197935342788696, 0.7724890112876892, 0.9251844882965088, 1.0778799057006836, 1.230575442314148, 1.3832709789276123, 1.535966396331787, 1.688661813735962, 1.8413573503494263, 1.9940528869628906, 2.1467483043670654, 2.2994437217712402, 2.452139377593994, 2.604834794998169, 2.7575302124023438, 2.9102256298065186, 3.0629210472106934, 3.2156167030334473, 3.368312120437622, 3.521007537841797, 3.673703193664551, 3.8263986110687256, 3.9790940284729004, 4.131789684295654, 4.28448486328125, 4.437180519104004, 4.589876174926758, 4.7425713539123535, 4.895267009735107, 5.047962188720703, 5.200657844543457]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 13.0, 15.0, 22.0, 40.0, 49.0, 58.0, 92.0, 167.0, 270.0, 420.0, 628.0, 957.0, 1567.0, 2494.0, 3882.0, 6499.0, 11057.0, 18145.0, 30641.0, 51060.0, 81917.0, 123701.0, 161614.0, 167993.0, 138177.0, 95608.0, 60284.0, 36460.0, 21583.0, 13006.0, 7619.0, 4753.0, 2874.0, 1745.0, 1089.0, 679.0, 450.0, 306.0, 195.0, 125.0, 103.0, 59.0, 54.0, 21.0, 21.0, 14.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0], "bins": [-3.705078125, -3.5997314453125, -3.494384765625, -3.3890380859375, -3.28369140625, -3.1783447265625, -3.072998046875, -2.9676513671875, -2.8623046875, -2.7569580078125, -2.651611328125, -2.5462646484375, -2.44091796875, -2.3355712890625, -2.230224609375, -2.1248779296875, -2.01953125, -1.9141845703125, -1.808837890625, -1.7034912109375, -1.59814453125, -1.4927978515625, -1.387451171875, -1.2821044921875, -1.1767578125, -1.0714111328125, -0.966064453125, -0.8607177734375, -0.75537109375, -0.6500244140625, -0.544677734375, -0.4393310546875, -0.333984375, -0.2286376953125, -0.123291015625, -0.0179443359375, 0.08740234375, 0.1927490234375, 0.298095703125, 0.4034423828125, 0.5087890625, 0.6141357421875, 0.719482421875, 0.8248291015625, 0.93017578125, 1.0355224609375, 1.140869140625, 1.2462158203125, 1.3515625, 1.4569091796875, 1.562255859375, 1.6676025390625, 1.77294921875, 1.8782958984375, 1.983642578125, 2.0889892578125, 2.1943359375, 2.2996826171875, 2.405029296875, 2.5103759765625, 2.61572265625, 2.7210693359375, 2.826416015625, 2.9317626953125, 3.037109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 7.0, 8.0, 11.0, 10.0, 14.0, 14.0, 22.0, 20.0, 24.0, 30.0, 35.0, 30.0, 37.0, 45.0, 43.0, 42.0, 49.0, 49.0, 39.0, 40.0, 48.0, 47.0, 45.0, 42.0, 21.0, 33.0, 28.0, 30.0, 26.0, 24.0, 24.0, 9.0, 15.0, 6.0, 9.0, 9.0, 2.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.7054443359375, -4.528076171875, -4.3507080078125, -4.17333984375, -3.9959716796875, -3.818603515625, -3.6412353515625, -3.4638671875, -3.2864990234375, -3.109130859375, -2.9317626953125, -2.75439453125, -2.5770263671875, -2.399658203125, -2.2222900390625, -2.044921875, -1.8675537109375, -1.690185546875, -1.5128173828125, -1.33544921875, -1.1580810546875, -0.980712890625, -0.8033447265625, -0.6259765625, -0.4486083984375, -0.271240234375, -0.0938720703125, 0.08349609375, 0.2608642578125, 0.438232421875, 0.6156005859375, 0.79296875, 0.9703369140625, 1.147705078125, 1.3250732421875, 1.50244140625, 1.6798095703125, 1.857177734375, 2.0345458984375, 2.2119140625, 2.3892822265625, 2.566650390625, 2.7440185546875, 2.92138671875, 3.0987548828125, 3.276123046875, 3.4534912109375, 3.630859375, 3.8082275390625, 3.985595703125, 4.1629638671875, 4.34033203125, 4.5177001953125, 4.695068359375, 4.8724365234375, 5.0498046875, 5.2271728515625, 5.404541015625, 5.5819091796875, 5.75927734375, 5.9366455078125, 6.114013671875, 6.2913818359375, 6.46875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 9.0, 13.0, 22.0, 20.0, 48.0, 53.0, 102.0, 121.0, 209.0, 307.0, 413.0, 652.0, 966.0, 1525.0, 2410.0, 3514.0, 5595.0, 9024.0, 14958.0, 24534.0, 40937.0, 67142.0, 110060.0, 165226.0, 191959.0, 153053.0, 99883.0, 61102.0, 36244.0, 21931.0, 13478.0, 8269.0, 5239.0, 3367.0, 2083.0, 1398.0, 894.0, 617.0, 390.0, 277.0, 164.0, 109.0, 87.0, 52.0, 37.0, 23.0, 20.0, 11.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.97265625, -3.85369873046875, -3.7347412109375, -3.61578369140625, -3.496826171875, -3.37786865234375, -3.2589111328125, -3.13995361328125, -3.02099609375, -2.90203857421875, -2.7830810546875, -2.66412353515625, -2.545166015625, -2.42620849609375, -2.3072509765625, -2.18829345703125, -2.0693359375, -1.95037841796875, -1.8314208984375, -1.71246337890625, -1.593505859375, -1.47454833984375, -1.3555908203125, -1.23663330078125, -1.11767578125, -0.99871826171875, -0.8797607421875, -0.76080322265625, -0.641845703125, -0.52288818359375, -0.4039306640625, -0.28497314453125, -0.166015625, -0.04705810546875, 0.0718994140625, 0.19085693359375, 0.309814453125, 0.42877197265625, 0.5477294921875, 0.66668701171875, 0.78564453125, 0.90460205078125, 1.0235595703125, 1.14251708984375, 1.261474609375, 1.38043212890625, 1.4993896484375, 1.61834716796875, 1.7373046875, 1.85626220703125, 1.9752197265625, 2.09417724609375, 2.213134765625, 2.33209228515625, 2.4510498046875, 2.57000732421875, 2.68896484375, 2.80792236328125, 2.9268798828125, 3.04583740234375, 3.164794921875, 3.28375244140625, 3.4027099609375, 3.52166748046875, 3.640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 6.0, 19.0, 9.0, 10.0, 17.0, 8.0, 18.0, 34.0, 28.0, 38.0, 30.0, 46.0, 39.0, 41.0, 44.0, 42.0, 47.0, 36.0, 45.0, 54.0, 38.0, 55.0, 31.0, 40.0, 32.0, 28.0, 29.0, 24.0, 16.0, 15.0, 12.0, 8.0, 10.0, 9.0, 14.0, 1.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.96612548828125, -2.8638916015625, -2.76165771484375, -2.659423828125, -2.55718994140625, -2.4549560546875, -2.35272216796875, -2.25048828125, -2.14825439453125, -2.0460205078125, -1.94378662109375, -1.841552734375, -1.73931884765625, -1.6370849609375, -1.53485107421875, -1.4326171875, -1.33038330078125, -1.2281494140625, -1.12591552734375, -1.023681640625, -0.92144775390625, -0.8192138671875, -0.71697998046875, -0.61474609375, -0.51251220703125, -0.4102783203125, -0.30804443359375, -0.205810546875, -0.10357666015625, -0.0013427734375, 0.10089111328125, 0.203125, 0.30535888671875, 0.4075927734375, 0.50982666015625, 0.612060546875, 0.71429443359375, 0.8165283203125, 0.91876220703125, 1.02099609375, 1.12322998046875, 1.2254638671875, 1.32769775390625, 1.429931640625, 1.53216552734375, 1.6343994140625, 1.73663330078125, 1.8388671875, 1.94110107421875, 2.0433349609375, 2.14556884765625, 2.247802734375, 2.35003662109375, 2.4522705078125, 2.55450439453125, 2.65673828125, 2.75897216796875, 2.8612060546875, 2.96343994140625, 3.065673828125, 3.16790771484375, 3.2701416015625, 3.37237548828125, 3.474609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 3.0, 10.0, 12.0, 16.0, 23.0, 24.0, 43.0, 55.0, 93.0, 146.0, 184.0, 298.0, 490.0, 729.0, 1107.0, 1737.0, 2975.0, 5097.0, 9182.0, 17139.0, 33595.0, 67557.0, 135720.0, 238815.0, 245294.0, 141273.0, 71002.0, 35255.0, 18033.0, 9504.0, 5172.0, 3009.0, 1806.0, 1072.0, 697.0, 472.0, 335.0, 180.0, 128.0, 74.0, 63.0, 46.0, 32.0, 17.0, 14.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.27734375, -2.19610595703125, -2.1148681640625, -2.03363037109375, -1.952392578125, -1.87115478515625, -1.7899169921875, -1.70867919921875, -1.62744140625, -1.54620361328125, -1.4649658203125, -1.38372802734375, -1.302490234375, -1.22125244140625, -1.1400146484375, -1.05877685546875, -0.9775390625, -0.89630126953125, -0.8150634765625, -0.73382568359375, -0.652587890625, -0.57135009765625, -0.4901123046875, -0.40887451171875, -0.32763671875, -0.24639892578125, -0.1651611328125, -0.08392333984375, -0.002685546875, 0.07855224609375, 0.1597900390625, 0.24102783203125, 0.322265625, 0.40350341796875, 0.4847412109375, 0.56597900390625, 0.647216796875, 0.72845458984375, 0.8096923828125, 0.89093017578125, 0.97216796875, 1.05340576171875, 1.1346435546875, 1.21588134765625, 1.297119140625, 1.37835693359375, 1.4595947265625, 1.54083251953125, 1.6220703125, 1.70330810546875, 1.7845458984375, 1.86578369140625, 1.947021484375, 2.02825927734375, 2.1094970703125, 2.19073486328125, 2.27197265625, 2.35321044921875, 2.4344482421875, 2.51568603515625, 2.596923828125, 2.67816162109375, 2.7593994140625, 2.84063720703125, 2.921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 12.0, 12.0, 11.0, 26.0, 28.0, 22.0, 39.0, 55.0, 63.0, 74.0, 74.0, 75.0, 75.0, 58.0, 50.0, 55.0, 47.0, 34.0, 32.0, 34.0, 24.0, 16.0, 12.0, 11.0, 8.0, 12.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013267993927001953, -0.00012789294123649597, -0.0001231059432029724, -0.00011831894516944885, -0.00011353194713592529, -0.00010874494910240173, -0.00010395795106887817, -9.917095303535461e-05, -9.438395500183105e-05, -8.95969569683075e-05, -8.480995893478394e-05, -8.002296090126038e-05, -7.523596286773682e-05, -7.044896483421326e-05, -6.56619668006897e-05, -6.087496876716614e-05, -5.608797073364258e-05, -5.130097270011902e-05, -4.651397466659546e-05, -4.17269766330719e-05, -3.693997859954834e-05, -3.215298056602478e-05, -2.736598253250122e-05, -2.257898449897766e-05, -1.77919864654541e-05, -1.3004988431930542e-05, -8.217990398406982e-06, -3.430992364883423e-06, 1.3560056686401367e-06, 6.143003702163696e-06, 1.0930001735687256e-05, 1.5716999769210815e-05, 2.0503997802734375e-05, 2.5290995836257935e-05, 3.0077993869781494e-05, 3.4864991903305054e-05, 3.965198993682861e-05, 4.443898797035217e-05, 4.922598600387573e-05, 5.401298403739929e-05, 5.879998207092285e-05, 6.358698010444641e-05, 6.837397813796997e-05, 7.316097617149353e-05, 7.794797420501709e-05, 8.273497223854065e-05, 8.752197027206421e-05, 9.230896830558777e-05, 9.709596633911133e-05, 0.00010188296437263489, 0.00010666996240615845, 0.00011145696043968201, 0.00011624395847320557, 0.00012103095650672913, 0.00012581795454025269, 0.00013060495257377625, 0.0001353919506072998, 0.00014017894864082336, 0.00014496594667434692, 0.00014975294470787048, 0.00015453994274139404, 0.0001593269407749176, 0.00016411393880844116, 0.00016890093684196472, 0.00017368793487548828]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 2.0, 7.0, 10.0, 17.0, 12.0, 29.0, 36.0, 42.0, 64.0, 93.0, 144.0, 168.0, 276.0, 383.0, 549.0, 853.0, 1226.0, 1873.0, 2643.0, 4191.0, 6610.0, 10626.0, 17140.0, 27704.0, 44665.0, 70140.0, 104546.0, 138210.0, 155042.0, 142816.0, 111204.0, 76369.0, 49083.0, 30480.0, 18779.0, 11618.0, 7274.0, 4494.0, 2913.0, 2002.0, 1335.0, 842.0, 592.0, 449.0, 303.0, 218.0, 149.0, 121.0, 71.0, 44.0, 31.0, 18.0, 16.0, 13.0, 9.0, 9.0, 6.0, 2.0, 1.0, 1.0, 4.0], "bins": [-1.6044921875, -1.5537109375, -1.5029296875, -1.4521484375, -1.4013671875, -1.3505859375, -1.2998046875, -1.2490234375, -1.1982421875, -1.1474609375, -1.0966796875, -1.0458984375, -0.9951171875, -0.9443359375, -0.8935546875, -0.8427734375, -0.7919921875, -0.7412109375, -0.6904296875, -0.6396484375, -0.5888671875, -0.5380859375, -0.4873046875, -0.4365234375, -0.3857421875, -0.3349609375, -0.2841796875, -0.2333984375, -0.1826171875, -0.1318359375, -0.0810546875, -0.0302734375, 0.0205078125, 0.0712890625, 0.1220703125, 0.1728515625, 0.2236328125, 0.2744140625, 0.3251953125, 0.3759765625, 0.4267578125, 0.4775390625, 0.5283203125, 0.5791015625, 0.6298828125, 0.6806640625, 0.7314453125, 0.7822265625, 0.8330078125, 0.8837890625, 0.9345703125, 0.9853515625, 1.0361328125, 1.0869140625, 1.1376953125, 1.1884765625, 1.2392578125, 1.2900390625, 1.3408203125, 1.3916015625, 1.4423828125, 1.4931640625, 1.5439453125, 1.5947265625, 1.6455078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 7.0, 5.0, 10.0, 15.0, 21.0, 27.0, 27.0, 42.0, 47.0, 48.0, 59.0, 52.0, 78.0, 75.0, 84.0, 51.0, 65.0, 58.0, 54.0, 29.0, 31.0, 27.0, 23.0, 15.0, 11.0, 10.0, 8.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.76025390625, -0.7388153076171875, -0.717376708984375, -0.6959381103515625, -0.67449951171875, -0.6530609130859375, -0.631622314453125, -0.6101837158203125, -0.5887451171875, -0.5673065185546875, -0.545867919921875, -0.5244293212890625, -0.50299072265625, -0.4815521240234375, -0.460113525390625, -0.4386749267578125, -0.417236328125, -0.3957977294921875, -0.374359130859375, -0.3529205322265625, -0.33148193359375, -0.3100433349609375, -0.288604736328125, -0.2671661376953125, -0.2457275390625, -0.2242889404296875, -0.202850341796875, -0.1814117431640625, -0.15997314453125, -0.1385345458984375, -0.117095947265625, -0.0956573486328125, -0.07421875, -0.0527801513671875, -0.031341552734375, -0.0099029541015625, 0.01153564453125, 0.0329742431640625, 0.054412841796875, 0.0758514404296875, 0.0972900390625, 0.1187286376953125, 0.140167236328125, 0.1616058349609375, 0.18304443359375, 0.2044830322265625, 0.225921630859375, 0.2473602294921875, 0.268798828125, 0.2902374267578125, 0.311676025390625, 0.3331146240234375, 0.35455322265625, 0.3759918212890625, 0.397430419921875, 0.4188690185546875, 0.4403076171875, 0.4617462158203125, 0.483184814453125, 0.5046234130859375, 0.52606201171875, 0.5475006103515625, 0.568939208984375, 0.5903778076171875, 0.61181640625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 9.0, 8.0, 23.0, 9.0, 21.0, 22.0, 26.0, 33.0, 41.0, 55.0, 53.0, 61.0, 54.0, 73.0, 61.0, 68.0, 66.0, 53.0, 46.0, 29.0, 31.0, 33.0, 21.0, 25.0, 11.0, 14.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.051548957824707, -7.797083854675293, -7.542618751525879, -7.288154125213623, -7.033689022064209, -6.779223918914795, -6.524759292602539, -6.270294189453125, -6.015829086303711, -5.761363983154297, -5.506898880004883, -5.252434253692627, -4.997969150543213, -4.743504047393799, -4.489039421081543, -4.234574317932129, -3.980109214782715, -3.725644111633301, -3.471179246902466, -3.216714382171631, -2.962249279022217, -2.7077841758728027, -2.4533193111419678, -2.198854446411133, -1.9443893432617188, -1.6899243593215942, -1.4354593753814697, -1.1809943914413452, -0.9265294075012207, -0.6720644235610962, -0.4175994396209717, -0.16313445568084717, 0.09133052825927734, 0.34579551219940186, 0.6002604961395264, 0.8547254800796509, 1.1091904640197754, 1.3636554479599, 1.6181204319000244, 1.872585415840149, 2.1270503997802734, 2.3815155029296875, 2.6359803676605225, 2.8904452323913574, 3.1449103355407715, 3.3993754386901855, 3.6538403034210205, 3.9083051681518555, 4.1627702713012695, 4.417235374450684, 4.671700477600098, 4.9261651039123535, 5.180630207061768, 5.435095310211182, 5.6895599365234375, 5.944025039672852, 6.198490142822266, 6.45295524597168, 6.707420349121094, 6.96188497543335, 7.216350078582764, 7.470815181732178, 7.725279808044434, 7.979744911193848, 8.234210014343262]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 6.0, 7.0, 9.0, 8.0, 12.0, 19.0, 14.0, 22.0, 26.0, 26.0, 25.0, 26.0, 30.0, 36.0, 27.0, 41.0, 40.0, 37.0, 40.0, 49.0, 46.0, 48.0, 53.0, 36.0, 34.0, 33.0, 31.0, 31.0, 31.0, 26.0, 16.0, 20.0, 14.0, 12.0, 11.0, 14.0, 9.0, 5.0, 5.0, 7.0, 8.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.356161594390869, -4.208642482757568, -4.061123847961426, -3.913604736328125, -3.766085624694824, -3.6185667514801025, -3.471047878265381, -3.32352876663208, -3.1760098934173584, -3.0284910202026367, -2.880971908569336, -2.7334530353546143, -2.5859341621398926, -2.438415050506592, -2.29089617729187, -2.1433773040771484, -1.9958581924438477, -1.8483392000198364, -1.7008202075958252, -1.5533013343811035, -1.4057823419570923, -1.258263349533081, -1.1107444763183594, -0.9632254838943481, -0.8157064914703369, -0.6681874990463257, -0.5206685662269592, -0.3731496036052704, -0.22563064098358154, -0.07811164855957031, 0.06940728425979614, 0.2169262170791626, 0.36444568634033203, 0.5119646787643433, 0.6594836115837097, 0.8070025444030762, 0.9545215368270874, 1.1020405292510986, 1.2495594024658203, 1.3970783948898315, 1.5445973873138428, 1.692116379737854, 1.8396353721618652, 1.987154245376587, 2.1346731185913086, 2.2821922302246094, 2.429711103439331, 2.5772299766540527, 2.7247490882873535, 2.872267961502075, 3.019787073135376, 3.1673059463500977, 3.3148250579833984, 3.46234393119812, 3.609862804412842, 3.7573819160461426, 3.9049007892608643, 4.052419662475586, 4.199938774108887, 4.3474578857421875, 4.49497652053833, 4.642495632171631, 4.790014743804932, 4.937533378601074, 5.085052490234375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 1.0, 9.0, 4.0, 10.0, 9.0, 15.0, 13.0, 31.0, 49.0, 56.0, 81.0, 103.0, 180.0, 215.0, 359.0, 471.0, 779.0, 1204.0, 1893.0, 2928.0, 4426.0, 7108.0, 11364.0, 18111.0, 29140.0, 45789.0, 70188.0, 101531.0, 133697.0, 149619.0, 139720.0, 109719.0, 78354.0, 52143.0, 33138.0, 20623.0, 13134.0, 8074.0, 5006.0, 3202.0, 2061.0, 1271.0, 887.0, 568.0, 417.0, 248.0, 190.0, 128.0, 89.0, 68.0, 41.0, 28.0, 23.0, 9.0, 14.0, 10.0, 5.0, 8.0, 3.0, 3.0], "bins": [-5.69921875, -5.52978515625, -5.3603515625, -5.19091796875, -5.021484375, -4.85205078125, -4.6826171875, -4.51318359375, -4.34375, -4.17431640625, -4.0048828125, -3.83544921875, -3.666015625, -3.49658203125, -3.3271484375, -3.15771484375, -2.98828125, -2.81884765625, -2.6494140625, -2.47998046875, -2.310546875, -2.14111328125, -1.9716796875, -1.80224609375, -1.6328125, -1.46337890625, -1.2939453125, -1.12451171875, -0.955078125, -0.78564453125, -0.6162109375, -0.44677734375, -0.27734375, -0.10791015625, 0.0615234375, 0.23095703125, 0.400390625, 0.56982421875, 0.7392578125, 0.90869140625, 1.078125, 1.24755859375, 1.4169921875, 1.58642578125, 1.755859375, 1.92529296875, 2.0947265625, 2.26416015625, 2.43359375, 2.60302734375, 2.7724609375, 2.94189453125, 3.111328125, 3.28076171875, 3.4501953125, 3.61962890625, 3.7890625, 3.95849609375, 4.1279296875, 4.29736328125, 4.466796875, 4.63623046875, 4.8056640625, 4.97509765625, 5.14453125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 10.0, 7.0, 3.0, 13.0, 9.0, 24.0, 14.0, 23.0, 25.0, 31.0, 21.0, 31.0, 46.0, 42.0, 39.0, 48.0, 39.0, 55.0, 51.0, 55.0, 38.0, 40.0, 51.0, 37.0, 39.0, 27.0, 28.0, 27.0, 30.0, 19.0, 14.0, 14.0, 13.0, 4.0, 8.0, 6.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.961181640625, -4.78564453125, -4.610107421875, -4.4345703125, -4.259033203125, -4.08349609375, -3.907958984375, -3.732421875, -3.556884765625, -3.38134765625, -3.205810546875, -3.0302734375, -2.854736328125, -2.67919921875, -2.503662109375, -2.328125, -2.152587890625, -1.97705078125, -1.801513671875, -1.6259765625, -1.450439453125, -1.27490234375, -1.099365234375, -0.923828125, -0.748291015625, -0.57275390625, -0.397216796875, -0.2216796875, -0.046142578125, 0.12939453125, 0.304931640625, 0.48046875, 0.656005859375, 0.83154296875, 1.007080078125, 1.1826171875, 1.358154296875, 1.53369140625, 1.709228515625, 1.884765625, 2.060302734375, 2.23583984375, 2.411376953125, 2.5869140625, 2.762451171875, 2.93798828125, 3.113525390625, 3.2890625, 3.464599609375, 3.64013671875, 3.815673828125, 3.9912109375, 4.166748046875, 4.34228515625, 4.517822265625, 4.693359375, 4.868896484375, 5.04443359375, 5.219970703125, 5.3955078125, 5.571044921875, 5.74658203125, 5.922119140625, 6.09765625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 10.0, 20.0, 23.0, 40.0, 57.0, 84.0, 128.0, 167.0, 240.0, 380.0, 527.0, 819.0, 1302.0, 2015.0, 3237.0, 5202.0, 8228.0, 13724.0, 22218.0, 36377.0, 58258.0, 89542.0, 126907.0, 154503.0, 154224.0, 126667.0, 90235.0, 58372.0, 36324.0, 22340.0, 13677.0, 8393.0, 5175.0, 3251.0, 2072.0, 1279.0, 852.0, 575.0, 347.0, 223.0, 175.0, 106.0, 80.0, 51.0, 43.0, 21.0, 22.0, 15.0, 7.0, 3.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.52734375, -5.34906005859375, -5.1707763671875, -4.99249267578125, -4.814208984375, -4.63592529296875, -4.4576416015625, -4.27935791015625, -4.10107421875, -3.92279052734375, -3.7445068359375, -3.56622314453125, -3.387939453125, -3.20965576171875, -3.0313720703125, -2.85308837890625, -2.6748046875, -2.49652099609375, -2.3182373046875, -2.13995361328125, -1.961669921875, -1.78338623046875, -1.6051025390625, -1.42681884765625, -1.24853515625, -1.07025146484375, -0.8919677734375, -0.71368408203125, -0.535400390625, -0.35711669921875, -0.1788330078125, -0.00054931640625, 0.177734375, 0.35601806640625, 0.5343017578125, 0.71258544921875, 0.890869140625, 1.06915283203125, 1.2474365234375, 1.42572021484375, 1.60400390625, 1.78228759765625, 1.9605712890625, 2.13885498046875, 2.317138671875, 2.49542236328125, 2.6737060546875, 2.85198974609375, 3.0302734375, 3.20855712890625, 3.3868408203125, 3.56512451171875, 3.743408203125, 3.92169189453125, 4.0999755859375, 4.27825927734375, 4.45654296875, 4.63482666015625, 4.8131103515625, 4.99139404296875, 5.169677734375, 5.34796142578125, 5.5262451171875, 5.70452880859375, 5.8828125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 5.0, 17.0, 22.0, 21.0, 20.0, 17.0, 15.0, 20.0, 23.0, 40.0, 48.0, 42.0, 37.0, 43.0, 71.0, 52.0, 43.0, 36.0, 35.0, 47.0, 27.0, 41.0, 41.0, 32.0, 25.0, 32.0, 22.0, 18.0, 20.0, 17.0, 11.0, 6.0, 12.0, 7.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.45703125, -3.3521728515625, -3.247314453125, -3.1424560546875, -3.03759765625, -2.9327392578125, -2.827880859375, -2.7230224609375, -2.6181640625, -2.5133056640625, -2.408447265625, -2.3035888671875, -2.19873046875, -2.0938720703125, -1.989013671875, -1.8841552734375, -1.779296875, -1.6744384765625, -1.569580078125, -1.4647216796875, -1.35986328125, -1.2550048828125, -1.150146484375, -1.0452880859375, -0.9404296875, -0.8355712890625, -0.730712890625, -0.6258544921875, -0.52099609375, -0.4161376953125, -0.311279296875, -0.2064208984375, -0.1015625, 0.0032958984375, 0.108154296875, 0.2130126953125, 0.31787109375, 0.4227294921875, 0.527587890625, 0.6324462890625, 0.7373046875, 0.8421630859375, 0.947021484375, 1.0518798828125, 1.15673828125, 1.2615966796875, 1.366455078125, 1.4713134765625, 1.576171875, 1.6810302734375, 1.785888671875, 1.8907470703125, 1.99560546875, 2.1004638671875, 2.205322265625, 2.3101806640625, 2.4150390625, 2.5198974609375, 2.624755859375, 2.7296142578125, 2.83447265625, 2.9393310546875, 3.044189453125, 3.1490478515625, 3.25390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 5.0, 6.0, 6.0, 7.0, 23.0, 18.0, 40.0, 39.0, 68.0, 112.0, 153.0, 234.0, 340.0, 556.0, 757.0, 1182.0, 1697.0, 2705.0, 4522.0, 7439.0, 12501.0, 22847.0, 43174.0, 86191.0, 171175.0, 255637.0, 206442.0, 109675.0, 54241.0, 27843.0, 15530.0, 8740.0, 5320.0, 3312.0, 2048.0, 1356.0, 878.0, 562.0, 393.0, 259.0, 177.0, 113.0, 71.0, 52.0, 35.0, 28.0, 14.0, 10.0, 10.0, 3.0, 6.0, 2.0, 3.0, 5.0], "bins": [-5.0703125, -4.92816162109375, -4.7860107421875, -4.64385986328125, -4.501708984375, -4.35955810546875, -4.2174072265625, -4.07525634765625, -3.93310546875, -3.79095458984375, -3.6488037109375, -3.50665283203125, -3.364501953125, -3.22235107421875, -3.0802001953125, -2.93804931640625, -2.7958984375, -2.65374755859375, -2.5115966796875, -2.36944580078125, -2.227294921875, -2.08514404296875, -1.9429931640625, -1.80084228515625, -1.65869140625, -1.51654052734375, -1.3743896484375, -1.23223876953125, -1.090087890625, -0.94793701171875, -0.8057861328125, -0.66363525390625, -0.521484375, -0.37933349609375, -0.2371826171875, -0.09503173828125, 0.047119140625, 0.18927001953125, 0.3314208984375, 0.47357177734375, 0.61572265625, 0.75787353515625, 0.9000244140625, 1.04217529296875, 1.184326171875, 1.32647705078125, 1.4686279296875, 1.61077880859375, 1.7529296875, 1.89508056640625, 2.0372314453125, 2.17938232421875, 2.321533203125, 2.46368408203125, 2.6058349609375, 2.74798583984375, 2.89013671875, 3.03228759765625, 3.1744384765625, 3.31658935546875, 3.458740234375, 3.60089111328125, 3.7430419921875, 3.88519287109375, 4.02734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 10.0, 11.0, 11.0, 18.0, 13.0, 14.0, 29.0, 35.0, 36.0, 52.0, 64.0, 63.0, 81.0, 94.0, 65.0, 83.0, 57.0, 56.0, 48.0, 34.0, 27.0, 18.0, 11.0, 11.0, 17.0, 8.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.000507354736328125, -0.0004931129515171051, -0.0004788711667060852, -0.0004646293818950653, -0.0004503875970840454, -0.0004361458122730255, -0.0004219040274620056, -0.0004076622426509857, -0.0003934204578399658, -0.0003791786730289459, -0.000364936888217926, -0.00035069510340690613, -0.00033645331859588623, -0.00032221153378486633, -0.00030796974897384644, -0.00029372796416282654, -0.00027948617935180664, -0.00026524439454078674, -0.00025100260972976685, -0.00023676082491874695, -0.00022251904010772705, -0.00020827725529670715, -0.00019403547048568726, -0.00017979368567466736, -0.00016555190086364746, -0.00015131011605262756, -0.00013706833124160767, -0.00012282654643058777, -0.00010858476161956787, -9.434297680854797e-05, -8.010119199752808e-05, -6.585940718650818e-05, -5.161762237548828e-05, -3.7375837564468384e-05, -2.3134052753448486e-05, -8.892267942428589e-06, 5.349516868591309e-06, 1.9591301679611206e-05, 3.3833086490631104e-05, 4.8074871301651e-05, 6.23166561126709e-05, 7.65584409236908e-05, 9.08002257347107e-05, 0.00010504201054573059, 0.00011928379535675049, 0.00013352558016777039, 0.00014776736497879028, 0.00016200914978981018, 0.00017625093460083008, 0.00019049271941184998, 0.00020473450422286987, 0.00021897628903388977, 0.00023321807384490967, 0.00024745985865592957, 0.00026170164346694946, 0.00027594342827796936, 0.00029018521308898926, 0.00030442699790000916, 0.00031866878271102905, 0.00033291056752204895, 0.00034715235233306885, 0.00036139413714408875, 0.00037563592195510864, 0.00038987770676612854, 0.00040411949157714844]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 9.0, 9.0, 14.0, 21.0, 25.0, 38.0, 54.0, 73.0, 130.0, 217.0, 382.0, 633.0, 1079.0, 2206.0, 4115.0, 8426.0, 17680.0, 39087.0, 86957.0, 188363.0, 287504.0, 217941.0, 105260.0, 46801.0, 21205.0, 9765.0, 4925.0, 2477.0, 1308.0, 724.0, 457.0, 251.0, 142.0, 85.0, 56.0, 40.0, 19.0, 21.0, 15.0, 9.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.8671875, -4.71795654296875, -4.5687255859375, -4.41949462890625, -4.270263671875, -4.12103271484375, -3.9718017578125, -3.82257080078125, -3.67333984375, -3.52410888671875, -3.3748779296875, -3.22564697265625, -3.076416015625, -2.92718505859375, -2.7779541015625, -2.62872314453125, -2.4794921875, -2.33026123046875, -2.1810302734375, -2.03179931640625, -1.882568359375, -1.73333740234375, -1.5841064453125, -1.43487548828125, -1.28564453125, -1.13641357421875, -0.9871826171875, -0.83795166015625, -0.688720703125, -0.53948974609375, -0.3902587890625, -0.24102783203125, -0.091796875, 0.05743408203125, 0.2066650390625, 0.35589599609375, 0.505126953125, 0.65435791015625, 0.8035888671875, 0.95281982421875, 1.10205078125, 1.25128173828125, 1.4005126953125, 1.54974365234375, 1.698974609375, 1.84820556640625, 1.9974365234375, 2.14666748046875, 2.2958984375, 2.44512939453125, 2.5943603515625, 2.74359130859375, 2.892822265625, 3.04205322265625, 3.1912841796875, 3.34051513671875, 3.48974609375, 3.63897705078125, 3.7882080078125, 3.93743896484375, 4.086669921875, 4.23590087890625, 4.3851318359375, 4.53436279296875, 4.68359375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 11.0, 10.0, 23.0, 32.0, 37.0, 42.0, 54.0, 68.0, 67.0, 89.0, 82.0, 99.0, 78.0, 72.0, 64.0, 30.0, 30.0, 21.0, 17.0, 17.0, 13.0, 13.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.953125, -1.9080047607421875, -1.862884521484375, -1.8177642822265625, -1.77264404296875, -1.7275238037109375, -1.682403564453125, -1.6372833251953125, -1.5921630859375, -1.5470428466796875, -1.501922607421875, -1.4568023681640625, -1.41168212890625, -1.3665618896484375, -1.321441650390625, -1.2763214111328125, -1.231201171875, -1.1860809326171875, -1.140960693359375, -1.0958404541015625, -1.05072021484375, -1.0055999755859375, -0.960479736328125, -0.9153594970703125, -0.8702392578125, -0.8251190185546875, -0.779998779296875, -0.7348785400390625, -0.68975830078125, -0.6446380615234375, -0.599517822265625, -0.5543975830078125, -0.50927734375, -0.4641571044921875, -0.419036865234375, -0.3739166259765625, -0.32879638671875, -0.2836761474609375, -0.238555908203125, -0.1934356689453125, -0.1483154296875, -0.1031951904296875, -0.058074951171875, -0.0129547119140625, 0.03216552734375, 0.0772857666015625, 0.122406005859375, 0.1675262451171875, 0.212646484375, 0.2577667236328125, 0.302886962890625, 0.3480072021484375, 0.39312744140625, 0.4382476806640625, 0.483367919921875, 0.5284881591796875, 0.5736083984375, 0.6187286376953125, 0.663848876953125, 0.7089691162109375, 0.75408935546875, 0.7992095947265625, 0.844329833984375, 0.8894500732421875, 0.9345703125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 6.0, 15.0, 15.0, 11.0, 23.0, 30.0, 19.0, 27.0, 40.0, 42.0, 51.0, 55.0, 53.0, 55.0, 43.0, 57.0, 40.0, 60.0, 48.0, 57.0, 43.0, 29.0, 33.0, 18.0, 13.0, 20.0, 16.0, 15.0, 7.0, 9.0, 6.0, 7.0, 9.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.334050178527832, -7.109960556030273, -6.885870933532715, -6.661780834197998, -6.4376912117004395, -6.213601589202881, -5.989511966705322, -5.7654218673706055, -5.541332244873047, -5.317242622375488, -5.09315299987793, -4.869062900543213, -4.644973278045654, -4.420883655548096, -4.196794033050537, -3.9727041721343994, -3.748614549636841, -3.5245249271392822, -3.3004350662231445, -3.076345443725586, -2.8522555828094482, -2.6281659603118896, -2.404076099395752, -2.1799864768981934, -1.9558967351913452, -1.731806993484497, -1.507717251777649, -1.2836275100708008, -1.0595378875732422, -0.835448145866394, -0.6113584041595459, -0.38726866245269775, -0.1631789207458496, 0.06091080605983734, 0.2850005328655243, 0.50909024477005, 0.7331799864768982, 0.9572696685791016, 1.1813594102859497, 1.4054491519927979, 1.629538893699646, 1.8536286354064941, 2.0777182579040527, 2.3018081188201904, 2.525897741317749, 2.7499876022338867, 2.9740772247314453, 3.198166847229004, 3.4222567081451416, 3.6463463306427, 3.870436191558838, 4.0945258140563965, 4.318615436553955, 4.542705535888672, 4.7667951583862305, 4.990884780883789, 5.214974403381348, 5.439064025878906, 5.663153648376465, 5.887243747711182, 6.11133337020874, 6.335422992706299, 6.559512615203857, 6.783602714538574, 7.007692337036133]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 12.0, 9.0, 14.0, 14.0, 17.0, 27.0, 24.0, 30.0, 29.0, 29.0, 38.0, 29.0, 38.0, 35.0, 36.0, 34.0, 32.0, 42.0, 38.0, 25.0, 36.0, 26.0, 42.0, 26.0, 28.0, 32.0, 31.0, 32.0, 25.0, 19.0, 25.0, 17.0, 19.0, 10.0, 8.0, 10.0, 6.0, 8.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.351051330566406, -4.2086663246154785, -4.066281795501709, -3.9238967895507812, -3.7815117835998535, -3.639127016067505, -3.4967422485351562, -3.3543572425842285, -3.21197247505188, -3.0695877075195312, -2.9272027015686035, -2.784817934036255, -2.6424331665039062, -2.5000481605529785, -2.35766339302063, -2.2152786254882812, -2.0728936195373535, -1.9305087327957153, -1.7881238460540771, -1.6457390785217285, -1.5033541917800903, -1.3609693050384521, -1.2185845375061035, -1.0761996507644653, -0.9338147640228271, -0.791429877281189, -0.6490450501441956, -0.5066602230072021, -0.36427533626556396, -0.22189044952392578, -0.07950562238693237, 0.06287920475006104, 0.20526361465454102, 0.3476484715938568, 0.4900333285331726, 0.632418155670166, 0.7748030424118042, 0.9171879291534424, 1.059572696685791, 1.2019575834274292, 1.3443424701690674, 1.4867273569107056, 1.6291122436523438, 1.7714970111846924, 1.9138818979263306, 2.0562667846679688, 2.1986515522003174, 2.341036319732666, 2.4834213256835938, 2.6258060932159424, 2.76819109916687, 2.9105758666992188, 3.0529608726501465, 3.195345640182495, 3.3377304077148438, 3.4801154136657715, 3.62250018119812, 3.7648849487304688, 3.9072699546813965, 4.049654960632324, 4.192039489746094, 4.3344244956970215, 4.476809501647949, 4.619194030761719, 4.7615790367126465]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 9.0, 22.0, 29.0, 47.0, 57.0, 94.0, 138.0, 202.0, 341.0, 446.0, 711.0, 1128.0, 1748.0, 2856.0, 4546.0, 7858.0, 13728.0, 25106.0, 47634.0, 96610.0, 207904.0, 468327.0, 935488.0, 1110558.0, 678973.0, 306855.0, 138017.0, 65604.0, 33459.0, 18515.0, 10595.0, 6229.0, 3715.0, 2378.0, 1526.0, 955.0, 614.0, 405.0, 273.0, 187.0, 138.0, 89.0, 50.0, 37.0, 33.0, 14.0, 10.0, 5.0, 4.0, 1.0, 0.0, 2.0], "bins": [-8.6875, -8.44097900390625, -8.1944580078125, -7.94793701171875, -7.701416015625, -7.45489501953125, -7.2083740234375, -6.96185302734375, -6.71533203125, -6.46881103515625, -6.2222900390625, -5.97576904296875, -5.729248046875, -5.48272705078125, -5.2362060546875, -4.98968505859375, -4.7431640625, -4.49664306640625, -4.2501220703125, -4.00360107421875, -3.757080078125, -3.51055908203125, -3.2640380859375, -3.01751708984375, -2.77099609375, -2.52447509765625, -2.2779541015625, -2.03143310546875, -1.784912109375, -1.53839111328125, -1.2918701171875, -1.04534912109375, -0.798828125, -0.55230712890625, -0.3057861328125, -0.05926513671875, 0.187255859375, 0.43377685546875, 0.6802978515625, 0.92681884765625, 1.17333984375, 1.41986083984375, 1.6663818359375, 1.91290283203125, 2.159423828125, 2.40594482421875, 2.6524658203125, 2.89898681640625, 3.1455078125, 3.39202880859375, 3.6385498046875, 3.88507080078125, 4.131591796875, 4.37811279296875, 4.6246337890625, 4.87115478515625, 5.11767578125, 5.36419677734375, 5.6107177734375, 5.85723876953125, 6.103759765625, 6.35028076171875, 6.5968017578125, 6.84332275390625, 7.08984375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 12.0, 8.0, 14.0, 9.0, 13.0, 14.0, 16.0, 32.0, 34.0, 25.0, 22.0, 37.0, 34.0, 36.0, 45.0, 31.0, 32.0, 42.0, 47.0, 41.0, 32.0, 32.0, 35.0, 32.0, 34.0, 22.0, 33.0, 35.0, 22.0, 23.0, 25.0, 22.0, 27.0, 17.0, 11.0, 7.0, 9.0, 4.0, 3.0, 4.0, 0.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.541015625, -3.425140380859375, -3.30926513671875, -3.193389892578125, -3.0775146484375, -2.961639404296875, -2.84576416015625, -2.729888916015625, -2.614013671875, -2.498138427734375, -2.38226318359375, -2.266387939453125, -2.1505126953125, -2.034637451171875, -1.91876220703125, -1.802886962890625, -1.68701171875, -1.571136474609375, -1.45526123046875, -1.339385986328125, -1.2235107421875, -1.107635498046875, -0.99176025390625, -0.875885009765625, -0.760009765625, -0.644134521484375, -0.52825927734375, -0.412384033203125, -0.2965087890625, -0.180633544921875, -0.06475830078125, 0.051116943359375, 0.1669921875, 0.282867431640625, 0.39874267578125, 0.514617919921875, 0.6304931640625, 0.746368408203125, 0.86224365234375, 0.978118896484375, 1.093994140625, 1.209869384765625, 1.32574462890625, 1.441619873046875, 1.5574951171875, 1.673370361328125, 1.78924560546875, 1.905120849609375, 2.02099609375, 2.136871337890625, 2.25274658203125, 2.368621826171875, 2.4844970703125, 2.600372314453125, 2.71624755859375, 2.832122802734375, 2.947998046875, 3.063873291015625, 3.17974853515625, 3.295623779296875, 3.4114990234375, 3.527374267578125, 3.64324951171875, 3.759124755859375, 3.875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 13.0, 19.0, 31.0, 46.0, 62.0, 98.0, 153.0, 231.0, 336.0, 528.0, 813.0, 1304.0, 2159.0, 3647.0, 5961.0, 10324.0, 19014.0, 34706.0, 66860.0, 135621.0, 283078.0, 585841.0, 1007598.0, 970445.0, 543495.0, 261064.0, 124868.0, 62369.0, 31984.0, 17584.0, 9712.0, 5638.0, 3306.0, 1949.0, 1225.0, 780.0, 497.0, 338.0, 210.0, 127.0, 82.0, 45.0, 40.0, 30.0, 20.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.559326171875, -8.28271484375, -8.006103515625, -7.7294921875, -7.452880859375, -7.17626953125, -6.899658203125, -6.623046875, -6.346435546875, -6.06982421875, -5.793212890625, -5.5166015625, -5.239990234375, -4.96337890625, -4.686767578125, -4.41015625, -4.133544921875, -3.85693359375, -3.580322265625, -3.3037109375, -3.027099609375, -2.75048828125, -2.473876953125, -2.197265625, -1.920654296875, -1.64404296875, -1.367431640625, -1.0908203125, -0.814208984375, -0.53759765625, -0.260986328125, 0.015625, 0.292236328125, 0.56884765625, 0.845458984375, 1.1220703125, 1.398681640625, 1.67529296875, 1.951904296875, 2.228515625, 2.505126953125, 2.78173828125, 3.058349609375, 3.3349609375, 3.611572265625, 3.88818359375, 4.164794921875, 4.44140625, 4.718017578125, 4.99462890625, 5.271240234375, 5.5478515625, 5.824462890625, 6.10107421875, 6.377685546875, 6.654296875, 6.930908203125, 7.20751953125, 7.484130859375, 7.7607421875, 8.037353515625, 8.31396484375, 8.590576171875, 8.8671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 8.0, 11.0, 14.0, 18.0, 22.0, 20.0, 45.0, 56.0, 76.0, 71.0, 98.0, 145.0, 200.0, 195.0, 269.0, 319.0, 329.0, 355.0, 324.0, 286.0, 266.0, 214.0, 177.0, 142.0, 104.0, 91.0, 53.0, 45.0, 40.0, 24.0, 10.0, 13.0, 5.0, 7.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.501953125, -3.410186767578125, -3.31842041015625, -3.226654052734375, -3.1348876953125, -3.043121337890625, -2.95135498046875, -2.859588623046875, -2.767822265625, -2.676055908203125, -2.58428955078125, -2.492523193359375, -2.4007568359375, -2.308990478515625, -2.21722412109375, -2.125457763671875, -2.03369140625, -1.941925048828125, -1.85015869140625, -1.758392333984375, -1.6666259765625, -1.574859619140625, -1.48309326171875, -1.391326904296875, -1.299560546875, -1.207794189453125, -1.11602783203125, -1.024261474609375, -0.9324951171875, -0.840728759765625, -0.74896240234375, -0.657196044921875, -0.5654296875, -0.473663330078125, -0.38189697265625, -0.290130615234375, -0.1983642578125, -0.106597900390625, -0.01483154296875, 0.076934814453125, 0.168701171875, 0.260467529296875, 0.35223388671875, 0.444000244140625, 0.5357666015625, 0.627532958984375, 0.71929931640625, 0.811065673828125, 0.90283203125, 0.994598388671875, 1.08636474609375, 1.178131103515625, 1.2698974609375, 1.361663818359375, 1.45343017578125, 1.545196533203125, 1.636962890625, 1.728729248046875, 1.82049560546875, 1.912261962890625, 2.0040283203125, 2.095794677734375, 2.18756103515625, 2.279327392578125, 2.37109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 4.0, 9.0, 11.0, 16.0, 17.0, 14.0, 26.0, 33.0, 34.0, 45.0, 51.0, 44.0, 68.0, 60.0, 68.0, 70.0, 56.0, 58.0, 45.0, 47.0, 30.0, 28.0, 24.0, 26.0, 25.0, 14.0, 13.0, 8.0, 15.0, 9.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6845011711120605, -7.41606330871582, -7.14762544631958, -6.87918758392334, -6.6107497215271, -6.342311859130859, -6.073873519897461, -5.805436134338379, -5.5369977951049805, -5.26855993270874, -5.0001220703125, -4.73168420791626, -4.4632463455200195, -4.194808483123779, -3.92637038230896, -3.6579325199127197, -3.3894948959350586, -3.1210570335388184, -2.852619171142578, -2.584181308746338, -2.3157434463500977, -2.0473055839538574, -1.778867483139038, -1.5104296207427979, -1.2419917583465576, -0.9735538959503174, -0.7051159739494324, -0.43667805194854736, -0.16824018955230713, 0.1001976728439331, 0.3686356544494629, 0.6370735168457031, 0.9055118560791016, 1.1739497184753418, 1.442387580871582, 1.7108255624771118, 1.979263424873352, 2.2477011680603027, 2.516139268875122, 2.7845771312713623, 3.0530149936676025, 3.3214528560638428, 3.589890718460083, 3.8583288192749023, 4.126766681671143, 4.395204544067383, 4.663642406463623, 4.932080268859863, 5.2005181312561035, 5.468955993652344, 5.737393856048584, 6.005831718444824, 6.2742695808410645, 6.542707443237305, 6.811145782470703, 7.079583168029785, 7.348021507263184, 7.616459369659424, 7.884897232055664, 8.153335571289062, 8.421772956848145, 8.690211296081543, 8.958648681640625, 9.227087020874023, 9.495524406433105]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 10.0, 7.0, 9.0, 5.0, 16.0, 19.0, 16.0, 26.0, 19.0, 23.0, 35.0, 50.0, 32.0, 28.0, 34.0, 40.0, 43.0, 36.0, 40.0, 33.0, 48.0, 44.0, 31.0, 32.0, 32.0, 40.0, 32.0, 37.0, 22.0, 24.0, 24.0, 20.0, 13.0, 18.0, 9.0, 13.0, 8.0, 6.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.958791732788086, -4.799306392669678, -4.639821529388428, -4.4803361892700195, -4.320850849151611, -4.161365509033203, -4.001880645751953, -3.842395305633545, -3.682910203933716, -3.5234251022338867, -3.3639397621154785, -3.2044546604156494, -3.0449695587158203, -2.885484218597412, -2.725999116897583, -2.566514015197754, -2.4070286750793457, -2.2475435733795166, -2.0880582332611084, -1.9285731315612793, -1.7690879106521606, -1.609602689743042, -1.450117588043213, -1.2906323671340942, -1.1311471462249756, -0.9716619253158569, -0.8121767640113831, -0.6526916027069092, -0.4932063817977905, -0.3337211608886719, -0.174235999584198, -0.014750838279724121, 0.14473390579223633, 0.3042190968990326, 0.46370428800582886, 0.6231894493103027, 0.7826746702194214, 0.94215989112854, 1.1016449928283691, 1.2611302137374878, 1.4206154346466064, 1.580100655555725, 1.7395858764648438, 1.8990709781646729, 2.058556079864502, 2.21804141998291, 2.3775265216827393, 2.5370116233825684, 2.6964969635009766, 2.8559820652008057, 3.015467405319214, 3.174952507019043, 3.334437847137451, 3.4939229488372803, 3.6534080505371094, 3.8128933906555176, 3.9723784923553467, 4.131863594055176, 4.291348934173584, 4.450834274291992, 4.610319137573242, 4.76980447769165, 4.929289817810059, 5.088774681091309, 5.248260021209717]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 14.0, 16.0, 23.0, 28.0, 35.0, 58.0, 96.0, 153.0, 233.0, 350.0, 525.0, 913.0, 1454.0, 2445.0, 4507.0, 8860.0, 20761.0, 55647.0, 160287.0, 341175.0, 275929.0, 107328.0, 37057.0, 14958.0, 6854.0, 3544.0, 2021.0, 1209.0, 722.0, 495.0, 294.0, 174.0, 131.0, 84.0, 65.0, 50.0, 19.0, 17.0, 5.0, 4.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.2890625, -10.9647216796875, -10.640380859375, -10.3160400390625, -9.99169921875, -9.6673583984375, -9.343017578125, -9.0186767578125, -8.6943359375, -8.3699951171875, -8.045654296875, -7.7213134765625, -7.39697265625, -7.0726318359375, -6.748291015625, -6.4239501953125, -6.099609375, -5.7752685546875, -5.450927734375, -5.1265869140625, -4.80224609375, -4.4779052734375, -4.153564453125, -3.8292236328125, -3.5048828125, -3.1805419921875, -2.856201171875, -2.5318603515625, -2.20751953125, -1.8831787109375, -1.558837890625, -1.2344970703125, -0.91015625, -0.5858154296875, -0.261474609375, 0.0628662109375, 0.38720703125, 0.7115478515625, 1.035888671875, 1.3602294921875, 1.6845703125, 2.0089111328125, 2.333251953125, 2.6575927734375, 2.98193359375, 3.3062744140625, 3.630615234375, 3.9549560546875, 4.279296875, 4.6036376953125, 4.927978515625, 5.2523193359375, 5.57666015625, 5.9010009765625, 6.225341796875, 6.5496826171875, 6.8740234375, 7.1983642578125, 7.522705078125, 7.8470458984375, 8.17138671875, 8.4957275390625, 8.820068359375, 9.1444091796875, 9.46875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 11.0, 6.0, 10.0, 15.0, 10.0, 11.0, 17.0, 19.0, 28.0, 28.0, 31.0, 32.0, 37.0, 31.0, 34.0, 37.0, 41.0, 42.0, 46.0, 37.0, 45.0, 50.0, 47.0, 33.0, 37.0, 43.0, 38.0, 27.0, 18.0, 28.0, 17.0, 16.0, 18.0, 11.0, 6.0, 5.0, 8.0, 8.0, 3.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.2689208984375, -5.088623046875, -4.9083251953125, -4.72802734375, -4.5477294921875, -4.367431640625, -4.1871337890625, -4.0068359375, -3.8265380859375, -3.646240234375, -3.4659423828125, -3.28564453125, -3.1053466796875, -2.925048828125, -2.7447509765625, -2.564453125, -2.3841552734375, -2.203857421875, -2.0235595703125, -1.84326171875, -1.6629638671875, -1.482666015625, -1.3023681640625, -1.1220703125, -0.9417724609375, -0.761474609375, -0.5811767578125, -0.40087890625, -0.2205810546875, -0.040283203125, 0.1400146484375, 0.3203125, 0.5006103515625, 0.680908203125, 0.8612060546875, 1.04150390625, 1.2218017578125, 1.402099609375, 1.5823974609375, 1.7626953125, 1.9429931640625, 2.123291015625, 2.3035888671875, 2.48388671875, 2.6641845703125, 2.844482421875, 3.0247802734375, 3.205078125, 3.3853759765625, 3.565673828125, 3.7459716796875, 3.92626953125, 4.1065673828125, 4.286865234375, 4.4671630859375, 4.6474609375, 4.8277587890625, 5.008056640625, 5.1883544921875, 5.36865234375, 5.5489501953125, 5.729248046875, 5.9095458984375, 6.08984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 17.0, 4.0, 12.0, 17.0, 21.0, 28.0, 40.0, 58.0, 70.0, 96.0, 162.0, 177.0, 263.0, 453.0, 598.0, 775.0, 1255.0, 1890.0, 3094.0, 5245.0, 9902.0, 21532.0, 55637.0, 161638.0, 374045.0, 257902.0, 89783.0, 32189.0, 13833.0, 6867.0, 3852.0, 2350.0, 1459.0, 1038.0, 718.0, 447.0, 337.0, 204.0, 160.0, 116.0, 71.0, 63.0, 40.0, 31.0, 21.0, 14.0, 13.0, 6.0, 7.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-11.4375, -11.0880126953125, -10.738525390625, -10.3890380859375, -10.03955078125, -9.6900634765625, -9.340576171875, -8.9910888671875, -8.6416015625, -8.2921142578125, -7.942626953125, -7.5931396484375, -7.24365234375, -6.8941650390625, -6.544677734375, -6.1951904296875, -5.845703125, -5.4962158203125, -5.146728515625, -4.7972412109375, -4.44775390625, -4.0982666015625, -3.748779296875, -3.3992919921875, -3.0498046875, -2.7003173828125, -2.350830078125, -2.0013427734375, -1.65185546875, -1.3023681640625, -0.952880859375, -0.6033935546875, -0.25390625, 0.0955810546875, 0.445068359375, 0.7945556640625, 1.14404296875, 1.4935302734375, 1.843017578125, 2.1925048828125, 2.5419921875, 2.8914794921875, 3.240966796875, 3.5904541015625, 3.93994140625, 4.2894287109375, 4.638916015625, 4.9884033203125, 5.337890625, 5.6873779296875, 6.036865234375, 6.3863525390625, 6.73583984375, 7.0853271484375, 7.434814453125, 7.7843017578125, 8.1337890625, 8.4832763671875, 8.832763671875, 9.1822509765625, 9.53173828125, 9.8812255859375, 10.230712890625, 10.5802001953125, 10.9296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 10.0, 8.0, 9.0, 9.0, 8.0, 20.0, 19.0, 21.0, 18.0, 21.0, 26.0, 34.0, 36.0, 37.0, 39.0, 43.0, 38.0, 44.0, 39.0, 42.0, 44.0, 30.0, 43.0, 40.0, 23.0, 39.0, 31.0, 31.0, 23.0, 22.0, 13.0, 20.0, 15.0, 15.0, 12.0, 7.0, 7.0, 12.0, 11.0, 7.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.19140625, -3.089447021484375, -2.98748779296875, -2.885528564453125, -2.7835693359375, -2.681610107421875, -2.57965087890625, -2.477691650390625, -2.375732421875, -2.273773193359375, -2.17181396484375, -2.069854736328125, -1.9678955078125, -1.865936279296875, -1.76397705078125, -1.662017822265625, -1.56005859375, -1.458099365234375, -1.35614013671875, -1.254180908203125, -1.1522216796875, -1.050262451171875, -0.94830322265625, -0.846343994140625, -0.744384765625, -0.642425537109375, -0.54046630859375, -0.438507080078125, -0.3365478515625, -0.234588623046875, -0.13262939453125, -0.030670166015625, 0.0712890625, 0.173248291015625, 0.27520751953125, 0.377166748046875, 0.4791259765625, 0.581085205078125, 0.68304443359375, 0.785003662109375, 0.886962890625, 0.988922119140625, 1.09088134765625, 1.192840576171875, 1.2947998046875, 1.396759033203125, 1.49871826171875, 1.600677490234375, 1.70263671875, 1.804595947265625, 1.90655517578125, 2.008514404296875, 2.1104736328125, 2.212432861328125, 2.31439208984375, 2.416351318359375, 2.518310546875, 2.620269775390625, 2.72222900390625, 2.824188232421875, 2.9261474609375, 3.028106689453125, 3.13006591796875, 3.232025146484375, 3.333984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 10.0, 13.0, 21.0, 27.0, 26.0, 35.0, 71.0, 81.0, 125.0, 187.0, 204.0, 351.0, 441.0, 630.0, 952.0, 1342.0, 2052.0, 3313.0, 5376.0, 9763.0, 19692.0, 47347.0, 140143.0, 383240.0, 277912.0, 88283.0, 32321.0, 14374.0, 7415.0, 4364.0, 2733.0, 1780.0, 1175.0, 761.0, 556.0, 420.0, 291.0, 213.0, 157.0, 114.0, 75.0, 55.0, 30.0, 20.0, 11.0, 10.0, 11.0, 4.0, 5.0, 6.0, 4.0, 4.0, 0.0, 0.0, 3.0], "bins": [-5.93359375, -5.752685546875, -5.57177734375, -5.390869140625, -5.2099609375, -5.029052734375, -4.84814453125, -4.667236328125, -4.486328125, -4.305419921875, -4.12451171875, -3.943603515625, -3.7626953125, -3.581787109375, -3.40087890625, -3.219970703125, -3.0390625, -2.858154296875, -2.67724609375, -2.496337890625, -2.3154296875, -2.134521484375, -1.95361328125, -1.772705078125, -1.591796875, -1.410888671875, -1.22998046875, -1.049072265625, -0.8681640625, -0.687255859375, -0.50634765625, -0.325439453125, -0.14453125, 0.036376953125, 0.21728515625, 0.398193359375, 0.5791015625, 0.760009765625, 0.94091796875, 1.121826171875, 1.302734375, 1.483642578125, 1.66455078125, 1.845458984375, 2.0263671875, 2.207275390625, 2.38818359375, 2.569091796875, 2.75, 2.930908203125, 3.11181640625, 3.292724609375, 3.4736328125, 3.654541015625, 3.83544921875, 4.016357421875, 4.197265625, 4.378173828125, 4.55908203125, 4.739990234375, 4.9208984375, 5.101806640625, 5.28271484375, 5.463623046875, 5.64453125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 11.0, 9.0, 17.0, 33.0, 32.0, 53.0, 81.0, 144.0, 151.0, 141.0, 116.0, 72.0, 54.0, 26.0, 19.0, 12.0, 9.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004987716674804688, -0.00048445165157318115, -0.00047013163566589355, -0.00045581161975860596, -0.00044149160385131836, -0.00042717158794403076, -0.00041285157203674316, -0.00039853155612945557, -0.00038421154022216797, -0.00036989152431488037, -0.0003555715084075928, -0.0003412514925003052, -0.0003269314765930176, -0.00031261146068573, -0.0002982914447784424, -0.0002839714288711548, -0.0002696514129638672, -0.0002553313970565796, -0.000241011381149292, -0.0002266913652420044, -0.0002123713493347168, -0.0001980513334274292, -0.0001837313175201416, -0.000169411301612854, -0.0001550912857055664, -0.0001407712697982788, -0.0001264512538909912, -0.00011213123798370361, -9.781122207641602e-05, -8.349120616912842e-05, -6.917119026184082e-05, -5.485117435455322e-05, -4.0531158447265625e-05, -2.6211142539978027e-05, -1.189112663269043e-05, 2.428889274597168e-06, 1.6748905181884766e-05, 3.106892108917236e-05, 4.538893699645996e-05, 5.970895290374756e-05, 7.402896881103516e-05, 8.834898471832275e-05, 0.00010266900062561035, 0.00011698901653289795, 0.00013130903244018555, 0.00014562904834747314, 0.00015994906425476074, 0.00017426908016204834, 0.00018858909606933594, 0.00020290911197662354, 0.00021722912788391113, 0.00023154914379119873, 0.00024586915969848633, 0.0002601891756057739, 0.0002745091915130615, 0.0002888292074203491, 0.0003031492233276367, 0.0003174692392349243, 0.0003317892551422119, 0.0003461092710494995, 0.0003604292869567871, 0.0003747493028640747, 0.0003890693187713623, 0.0004033893346786499, 0.0004177093505859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 11.0, 10.0, 11.0, 12.0, 12.0, 20.0, 33.0, 62.0, 73.0, 74.0, 107.0, 162.0, 217.0, 317.0, 414.0, 597.0, 898.0, 1281.0, 1960.0, 3116.0, 4969.0, 8034.0, 15431.0, 36008.0, 127885.0, 397060.0, 307750.0, 83420.0, 26727.0, 12438.0, 6976.0, 4152.0, 2712.0, 1743.0, 1111.0, 784.0, 571.0, 388.0, 281.0, 218.0, 146.0, 98.0, 71.0, 52.0, 43.0, 29.0, 19.0, 11.0, 16.0, 8.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 4.0], "bins": [-6.828125, -6.61370849609375, -6.3992919921875, -6.18487548828125, -5.970458984375, -5.75604248046875, -5.5416259765625, -5.32720947265625, -5.11279296875, -4.89837646484375, -4.6839599609375, -4.46954345703125, -4.255126953125, -4.04071044921875, -3.8262939453125, -3.61187744140625, -3.3974609375, -3.18304443359375, -2.9686279296875, -2.75421142578125, -2.539794921875, -2.32537841796875, -2.1109619140625, -1.89654541015625, -1.68212890625, -1.46771240234375, -1.2532958984375, -1.03887939453125, -0.824462890625, -0.61004638671875, -0.3956298828125, -0.18121337890625, 0.033203125, 0.24761962890625, 0.4620361328125, 0.67645263671875, 0.890869140625, 1.10528564453125, 1.3197021484375, 1.53411865234375, 1.74853515625, 1.96295166015625, 2.1773681640625, 2.39178466796875, 2.606201171875, 2.82061767578125, 3.0350341796875, 3.24945068359375, 3.4638671875, 3.67828369140625, 3.8927001953125, 4.10711669921875, 4.321533203125, 4.53594970703125, 4.7503662109375, 4.96478271484375, 5.17919921875, 5.39361572265625, 5.6080322265625, 5.82244873046875, 6.036865234375, 6.25128173828125, 6.4656982421875, 6.68011474609375, 6.89453125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 28.0, 53.0, 75.0, 110.0, 161.0, 157.0, 126.0, 93.0, 59.0, 23.0, 17.0, 9.0, 5.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.50390625, -2.428131103515625, -2.35235595703125, -2.276580810546875, -2.2008056640625, -2.125030517578125, -2.04925537109375, -1.973480224609375, -1.897705078125, -1.821929931640625, -1.74615478515625, -1.670379638671875, -1.5946044921875, -1.518829345703125, -1.44305419921875, -1.367279052734375, -1.29150390625, -1.215728759765625, -1.13995361328125, -1.064178466796875, -0.9884033203125, -0.912628173828125, -0.83685302734375, -0.761077880859375, -0.685302734375, -0.609527587890625, -0.53375244140625, -0.457977294921875, -0.3822021484375, -0.306427001953125, -0.23065185546875, -0.154876708984375, -0.0791015625, -0.003326416015625, 0.07244873046875, 0.148223876953125, 0.2239990234375, 0.299774169921875, 0.37554931640625, 0.451324462890625, 0.527099609375, 0.602874755859375, 0.67864990234375, 0.754425048828125, 0.8302001953125, 0.905975341796875, 0.98175048828125, 1.057525634765625, 1.13330078125, 1.209075927734375, 1.28485107421875, 1.360626220703125, 1.4364013671875, 1.512176513671875, 1.58795166015625, 1.663726806640625, 1.739501953125, 1.815277099609375, 1.89105224609375, 1.966827392578125, 2.0426025390625, 2.118377685546875, 2.19415283203125, 2.269927978515625, 2.345703125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 4.0, 5.0, 5.0, 15.0, 8.0, 12.0, 17.0, 16.0, 24.0, 32.0, 28.0, 52.0, 47.0, 63.0, 53.0, 66.0, 74.0, 67.0, 55.0, 53.0, 50.0, 38.0, 38.0, 24.0, 29.0, 18.0, 23.0, 18.0, 12.0, 11.0, 10.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.132872581481934, -7.867674827575684, -7.602477073669434, -7.337279319763184, -7.072081565856934, -6.806883811950684, -6.541686058044434, -6.276488304138184, -6.011290550231934, -5.746092796325684, -5.480895042419434, -5.215697288513184, -4.950499534606934, -4.685301780700684, -4.420104026794434, -4.154906272888184, -3.8897085189819336, -3.6245107650756836, -3.3593130111694336, -3.0941152572631836, -2.8289175033569336, -2.5637197494506836, -2.2985219955444336, -2.0333242416381836, -1.7681264877319336, -1.5029287338256836, -1.2377309799194336, -0.9725332260131836, -0.7073354721069336, -0.4421377182006836, -0.1769399642944336, 0.0882577896118164, 0.35345458984375, 0.61865234375, 0.88385009765625, 1.1490478515625, 1.41424560546875, 1.679443359375, 1.94464111328125, 2.2098388671875, 2.47503662109375, 2.740234375, 3.00543212890625, 3.2706298828125, 3.53582763671875, 3.801025390625, 4.06622314453125, 4.3314208984375, 4.59661865234375, 4.86181640625, 5.12701416015625, 5.3922119140625, 5.65740966796875, 5.922607421875, 6.18780517578125, 6.4530029296875, 6.71820068359375, 6.9833984375, 7.24859619140625, 7.5137939453125, 7.77899169921875, 8.044189453125, 8.30938720703125, 8.5745849609375, 8.83978271484375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 9.0, 5.0, 9.0, 5.0, 12.0, 10.0, 14.0, 19.0, 20.0, 34.0, 30.0, 39.0, 40.0, 28.0, 34.0, 48.0, 45.0, 36.0, 37.0, 51.0, 38.0, 34.0, 43.0, 35.0, 41.0, 38.0, 38.0, 36.0, 28.0, 24.0, 21.0, 20.0, 12.0, 21.0, 14.0, 9.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453555583953857, -5.281481742858887, -5.109408378601074, -4.9373345375061035, -4.765260696411133, -4.59318733215332, -4.42111349105835, -4.249039649963379, -4.076966285705566, -3.904892683029175, -3.732818841934204, -3.5607452392578125, -3.388671398162842, -3.21659779548645, -3.0445241928100586, -2.872450351715088, -2.700376510620117, -2.5283029079437256, -2.356229066848755, -2.1841554641723633, -2.0120816230773926, -1.840008020401001, -1.6679344177246094, -1.4958606958389282, -1.323786973953247, -1.151713252067566, -0.9796395897865295, -0.8075659275054932, -0.635492205619812, -0.46341848373413086, -0.29134488105773926, -0.1192711591720581, 0.052802085876464844, 0.2248757779598236, 0.3969494700431824, 0.5690231323242188, 0.7410968542098999, 0.913170576095581, 1.0852441787719727, 1.2573179006576538, 1.429391622543335, 1.6014653444290161, 1.7735390663146973, 1.9456126689910889, 2.1176862716674805, 2.289760112762451, 2.4618337154388428, 2.6339073181152344, 2.805981159210205, 2.9780547618865967, 3.1501286029815674, 3.322202205657959, 3.4942760467529297, 3.6663496494293213, 3.838423252105713, 4.010497093200684, 4.182570457458496, 4.354644298553467, 4.526717662811279, 4.69879150390625, 4.870865345001221, 5.042939186096191, 5.215012550354004, 5.387086391448975, 5.559160232543945]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 17.0, 25.0, 29.0, 57.0, 80.0, 128.0, 172.0, 262.0, 431.0, 680.0, 977.0, 1457.0, 2184.0, 3408.0, 5228.0, 8280.0, 12882.0, 19690.0, 30020.0, 45526.0, 66635.0, 92278.0, 118062.0, 133793.0, 131177.0, 111668.0, 85161.0, 60277.0, 40980.0, 27048.0, 17563.0, 11342.0, 7371.0, 4691.0, 3133.0, 1981.0, 1354.0, 849.0, 549.0, 366.0, 255.0, 168.0, 104.0, 66.0, 40.0, 38.0, 18.0, 12.0, 8.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0], "bins": [-4.65625, -4.51458740234375, -4.3729248046875, -4.23126220703125, -4.089599609375, -3.94793701171875, -3.8062744140625, -3.66461181640625, -3.52294921875, -3.38128662109375, -3.2396240234375, -3.09796142578125, -2.956298828125, -2.81463623046875, -2.6729736328125, -2.53131103515625, -2.3896484375, -2.24798583984375, -2.1063232421875, -1.96466064453125, -1.822998046875, -1.68133544921875, -1.5396728515625, -1.39801025390625, -1.25634765625, -1.11468505859375, -0.9730224609375, -0.83135986328125, -0.689697265625, -0.54803466796875, -0.4063720703125, -0.26470947265625, -0.123046875, 0.01861572265625, 0.1602783203125, 0.30194091796875, 0.443603515625, 0.58526611328125, 0.7269287109375, 0.86859130859375, 1.01025390625, 1.15191650390625, 1.2935791015625, 1.43524169921875, 1.576904296875, 1.71856689453125, 1.8602294921875, 2.00189208984375, 2.1435546875, 2.28521728515625, 2.4268798828125, 2.56854248046875, 2.710205078125, 2.85186767578125, 2.9935302734375, 3.13519287109375, 3.27685546875, 3.41851806640625, 3.5601806640625, 3.70184326171875, 3.843505859375, 3.98516845703125, 4.1268310546875, 4.26849365234375, 4.41015625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 13.0, 13.0, 15.0, 14.0, 20.0, 28.0, 32.0, 37.0, 28.0, 22.0, 34.0, 37.0, 36.0, 36.0, 43.0, 38.0, 43.0, 47.0, 37.0, 35.0, 37.0, 31.0, 48.0, 36.0, 36.0, 24.0, 31.0, 14.0, 16.0, 24.0, 13.0, 16.0, 8.0, 6.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.568603515625, -5.39111328125, -5.213623046875, -5.0361328125, -4.858642578125, -4.68115234375, -4.503662109375, -4.326171875, -4.148681640625, -3.97119140625, -3.793701171875, -3.6162109375, -3.438720703125, -3.26123046875, -3.083740234375, -2.90625, -2.728759765625, -2.55126953125, -2.373779296875, -2.1962890625, -2.018798828125, -1.84130859375, -1.663818359375, -1.486328125, -1.308837890625, -1.13134765625, -0.953857421875, -0.7763671875, -0.598876953125, -0.42138671875, -0.243896484375, -0.06640625, 0.111083984375, 0.28857421875, 0.466064453125, 0.6435546875, 0.821044921875, 0.99853515625, 1.176025390625, 1.353515625, 1.531005859375, 1.70849609375, 1.885986328125, 2.0634765625, 2.240966796875, 2.41845703125, 2.595947265625, 2.7734375, 2.950927734375, 3.12841796875, 3.305908203125, 3.4833984375, 3.660888671875, 3.83837890625, 4.015869140625, 4.193359375, 4.370849609375, 4.54833984375, 4.725830078125, 4.9033203125, 5.080810546875, 5.25830078125, 5.435791015625, 5.61328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 15.0, 22.0, 33.0, 40.0, 80.0, 124.0, 177.0, 316.0, 492.0, 802.0, 1291.0, 2049.0, 3342.0, 5220.0, 8876.0, 14198.0, 23525.0, 38527.0, 60949.0, 93313.0, 129610.0, 154645.0, 151654.0, 123304.0, 87577.0, 57186.0, 35251.0, 21445.0, 13308.0, 8075.0, 4936.0, 3091.0, 1984.0, 1175.0, 744.0, 469.0, 275.0, 159.0, 116.0, 69.0, 27.0, 24.0, 18.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.5859375, -5.42596435546875, -5.2659912109375, -5.10601806640625, -4.946044921875, -4.78607177734375, -4.6260986328125, -4.46612548828125, -4.30615234375, -4.14617919921875, -3.9862060546875, -3.82623291015625, -3.666259765625, -3.50628662109375, -3.3463134765625, -3.18634033203125, -3.0263671875, -2.86639404296875, -2.7064208984375, -2.54644775390625, -2.386474609375, -2.22650146484375, -2.0665283203125, -1.90655517578125, -1.74658203125, -1.58660888671875, -1.4266357421875, -1.26666259765625, -1.106689453125, -0.94671630859375, -0.7867431640625, -0.62677001953125, -0.466796875, -0.30682373046875, -0.1468505859375, 0.01312255859375, 0.173095703125, 0.33306884765625, 0.4930419921875, 0.65301513671875, 0.81298828125, 0.97296142578125, 1.1329345703125, 1.29290771484375, 1.452880859375, 1.61285400390625, 1.7728271484375, 1.93280029296875, 2.0927734375, 2.25274658203125, 2.4127197265625, 2.57269287109375, 2.732666015625, 2.89263916015625, 3.0526123046875, 3.21258544921875, 3.37255859375, 3.53253173828125, 3.6925048828125, 3.85247802734375, 4.012451171875, 4.17242431640625, 4.3323974609375, 4.49237060546875, 4.65234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 14.0, 13.0, 17.0, 17.0, 29.0, 26.0, 24.0, 28.0, 21.0, 31.0, 48.0, 50.0, 42.0, 51.0, 42.0, 39.0, 51.0, 51.0, 49.0, 35.0, 36.0, 37.0, 35.0, 33.0, 21.0, 16.0, 17.0, 15.0, 9.0, 14.0, 7.0, 3.0, 11.0, 6.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.546875, -3.442413330078125, -3.33795166015625, -3.233489990234375, -3.1290283203125, -3.024566650390625, -2.92010498046875, -2.815643310546875, -2.711181640625, -2.606719970703125, -2.50225830078125, -2.397796630859375, -2.2933349609375, -2.188873291015625, -2.08441162109375, -1.979949951171875, -1.87548828125, -1.771026611328125, -1.66656494140625, -1.562103271484375, -1.4576416015625, -1.353179931640625, -1.24871826171875, -1.144256591796875, -1.039794921875, -0.935333251953125, -0.83087158203125, -0.726409912109375, -0.6219482421875, -0.517486572265625, -0.41302490234375, -0.308563232421875, -0.2041015625, -0.099639892578125, 0.00482177734375, 0.109283447265625, 0.2137451171875, 0.318206787109375, 0.42266845703125, 0.527130126953125, 0.631591796875, 0.736053466796875, 0.84051513671875, 0.944976806640625, 1.0494384765625, 1.153900146484375, 1.25836181640625, 1.362823486328125, 1.46728515625, 1.571746826171875, 1.67620849609375, 1.780670166015625, 1.8851318359375, 1.989593505859375, 2.09405517578125, 2.198516845703125, 2.302978515625, 2.407440185546875, 2.51190185546875, 2.616363525390625, 2.7208251953125, 2.825286865234375, 2.92974853515625, 3.034210205078125, 3.138671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 13.0, 5.0, 15.0, 20.0, 38.0, 50.0, 83.0, 120.0, 204.0, 279.0, 458.0, 689.0, 1109.0, 1859.0, 3049.0, 4974.0, 8279.0, 14246.0, 24046.0, 40489.0, 66289.0, 103157.0, 144125.0, 167947.0, 154708.0, 116696.0, 77523.0, 47560.0, 28645.0, 16925.0, 9933.0, 5881.0, 3519.0, 2111.0, 1305.0, 828.0, 494.0, 331.0, 188.0, 133.0, 83.0, 56.0, 38.0, 33.0, 13.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0], "bins": [-2.98046875, -2.899169921875, -2.81787109375, -2.736572265625, -2.6552734375, -2.573974609375, -2.49267578125, -2.411376953125, -2.330078125, -2.248779296875, -2.16748046875, -2.086181640625, -2.0048828125, -1.923583984375, -1.84228515625, -1.760986328125, -1.6796875, -1.598388671875, -1.51708984375, -1.435791015625, -1.3544921875, -1.273193359375, -1.19189453125, -1.110595703125, -1.029296875, -0.947998046875, -0.86669921875, -0.785400390625, -0.7041015625, -0.622802734375, -0.54150390625, -0.460205078125, -0.37890625, -0.297607421875, -0.21630859375, -0.135009765625, -0.0537109375, 0.027587890625, 0.10888671875, 0.190185546875, 0.271484375, 0.352783203125, 0.43408203125, 0.515380859375, 0.5966796875, 0.677978515625, 0.75927734375, 0.840576171875, 0.921875, 1.003173828125, 1.08447265625, 1.165771484375, 1.2470703125, 1.328369140625, 1.40966796875, 1.490966796875, 1.572265625, 1.653564453125, 1.73486328125, 1.816162109375, 1.8974609375, 1.978759765625, 2.06005859375, 2.141357421875, 2.22265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 7.0, 9.0, 16.0, 14.0, 8.0, 18.0, 24.0, 28.0, 42.0, 32.0, 35.0, 52.0, 62.0, 50.0, 61.0, 56.0, 53.0, 58.0, 57.0, 55.0, 36.0, 40.0, 26.0, 35.0, 21.0, 20.0, 16.0, 12.0, 8.0, 8.0, 6.0, 5.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025463104248046875, -0.00024595484137535095, -0.00023727864027023315, -0.00022860243916511536, -0.00021992623805999756, -0.00021125003695487976, -0.00020257383584976196, -0.00019389763474464417, -0.00018522143363952637, -0.00017654523253440857, -0.00016786903142929077, -0.00015919283032417297, -0.00015051662921905518, -0.00014184042811393738, -0.00013316422700881958, -0.00012448802590370178, -0.00011581182479858398, -0.00010713562369346619, -9.845942258834839e-05, -8.978322148323059e-05, -8.110702037811279e-05, -7.2430819272995e-05, -6.37546181678772e-05, -5.50784170627594e-05, -4.64022159576416e-05, -3.7726014852523804e-05, -2.9049813747406006e-05, -2.0373612642288208e-05, -1.169741153717041e-05, -3.0212104320526123e-06, 5.6549906730651855e-06, 1.4331191778182983e-05, 2.300739288330078e-05, 3.168359398841858e-05, 4.035979509353638e-05, 4.9035996198654175e-05, 5.771219730377197e-05, 6.638839840888977e-05, 7.506459951400757e-05, 8.374080061912537e-05, 9.241700172424316e-05, 0.00010109320282936096, 0.00010976940393447876, 0.00011844560503959656, 0.00012712180614471436, 0.00013579800724983215, 0.00014447420835494995, 0.00015315040946006775, 0.00016182661056518555, 0.00017050281167030334, 0.00017917901277542114, 0.00018785521388053894, 0.00019653141498565674, 0.00020520761609077454, 0.00021388381719589233, 0.00022256001830101013, 0.00023123621940612793, 0.00023991242051124573, 0.0002485886216163635, 0.0002572648227214813, 0.0002659410238265991, 0.0002746172249317169, 0.0002832934260368347, 0.0002919696271419525, 0.0003006458282470703]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 13.0, 15.0, 21.0, 37.0, 44.0, 67.0, 85.0, 129.0, 211.0, 305.0, 458.0, 734.0, 1002.0, 1626.0, 2447.0, 3831.0, 5974.0, 9619.0, 14687.0, 23432.0, 36353.0, 56283.0, 83807.0, 115182.0, 141511.0, 145498.0, 126369.0, 94989.0, 65391.0, 42784.0, 27299.0, 17497.0, 11059.0, 7032.0, 4435.0, 2915.0, 1864.0, 1165.0, 823.0, 495.0, 331.0, 234.0, 163.0, 109.0, 72.0, 42.0, 39.0, 22.0, 15.0, 12.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.3046875, -2.233062744140625, -2.16143798828125, -2.089813232421875, -2.0181884765625, -1.946563720703125, -1.87493896484375, -1.803314208984375, -1.731689453125, -1.660064697265625, -1.58843994140625, -1.516815185546875, -1.4451904296875, -1.373565673828125, -1.30194091796875, -1.230316162109375, -1.15869140625, -1.087066650390625, -1.01544189453125, -0.943817138671875, -0.8721923828125, -0.800567626953125, -0.72894287109375, -0.657318115234375, -0.585693359375, -0.514068603515625, -0.44244384765625, -0.370819091796875, -0.2991943359375, -0.227569580078125, -0.15594482421875, -0.084320068359375, -0.0126953125, 0.058929443359375, 0.13055419921875, 0.202178955078125, 0.2738037109375, 0.345428466796875, 0.41705322265625, 0.488677978515625, 0.560302734375, 0.631927490234375, 0.70355224609375, 0.775177001953125, 0.8468017578125, 0.918426513671875, 0.99005126953125, 1.061676025390625, 1.13330078125, 1.204925537109375, 1.27655029296875, 1.348175048828125, 1.4197998046875, 1.491424560546875, 1.56304931640625, 1.634674072265625, 1.706298828125, 1.777923583984375, 1.84954833984375, 1.921173095703125, 1.9927978515625, 2.064422607421875, 2.13604736328125, 2.207672119140625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 3.0, 3.0, 9.0, 5.0, 4.0, 11.0, 13.0, 16.0, 7.0, 23.0, 32.0, 25.0, 34.0, 32.0, 39.0, 49.0, 41.0, 47.0, 55.0, 36.0, 40.0, 47.0, 50.0, 51.0, 49.0, 38.0, 29.0, 35.0, 30.0, 21.0, 28.0, 17.0, 12.0, 11.0, 11.0, 12.0, 8.0, 5.0, 3.0, 5.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63720703125, -0.615447998046875, -0.59368896484375, -0.571929931640625, -0.5501708984375, -0.528411865234375, -0.50665283203125, -0.484893798828125, -0.463134765625, -0.441375732421875, -0.41961669921875, -0.397857666015625, -0.3760986328125, -0.354339599609375, -0.33258056640625, -0.310821533203125, -0.2890625, -0.267303466796875, -0.24554443359375, -0.223785400390625, -0.2020263671875, -0.180267333984375, -0.15850830078125, -0.136749267578125, -0.114990234375, -0.093231201171875, -0.07147216796875, -0.049713134765625, -0.0279541015625, -0.006195068359375, 0.01556396484375, 0.037322998046875, 0.05908203125, 0.080841064453125, 0.10260009765625, 0.124359130859375, 0.1461181640625, 0.167877197265625, 0.18963623046875, 0.211395263671875, 0.233154296875, 0.254913330078125, 0.27667236328125, 0.298431396484375, 0.3201904296875, 0.341949462890625, 0.36370849609375, 0.385467529296875, 0.4072265625, 0.428985595703125, 0.45074462890625, 0.472503662109375, 0.4942626953125, 0.516021728515625, 0.53778076171875, 0.559539794921875, 0.581298828125, 0.603057861328125, 0.62481689453125, 0.646575927734375, 0.6683349609375, 0.690093994140625, 0.71185302734375, 0.733612060546875, 0.75537109375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 10.0, 9.0, 4.0, 18.0, 14.0, 31.0, 32.0, 34.0, 37.0, 47.0, 60.0, 64.0, 53.0, 75.0, 63.0, 47.0, 58.0, 48.0, 49.0, 35.0, 38.0, 33.0, 17.0, 14.0, 23.0, 10.0, 7.0, 7.0, 12.0, 6.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.54723072052002, -8.286473274230957, -8.025716781616211, -7.764959335327148, -7.504201889038086, -7.243444442749023, -6.982687473297119, -6.721930503845215, -6.461173057556152, -6.20041561126709, -5.9396586418151855, -5.678901672363281, -5.418144226074219, -5.157386779785156, -4.896629810333252, -4.635872840881348, -4.375115394592285, -4.114357948303223, -3.8536009788513184, -3.592843770980835, -3.3320865631103516, -3.071329355239868, -2.8105721473693848, -2.5498149394989014, -2.289057731628418, -2.0283005237579346, -1.7675433158874512, -1.5067861080169678, -1.2460289001464844, -0.985271692276001, -0.7245144844055176, -0.4637572765350342, -0.20299911499023438, 0.05775809288024902, 0.3185153007507324, 0.5792725086212158, 0.8400297164916992, 1.1007869243621826, 1.361544132232666, 1.6223013401031494, 1.8830585479736328, 2.143815755844116, 2.4045729637145996, 2.665330171585083, 2.9260873794555664, 3.18684458732605, 3.447601795196533, 3.7083590030670166, 3.9691162109375, 4.2298736572265625, 4.490630626678467, 4.751387596130371, 5.012145042419434, 5.272902488708496, 5.5336594581604, 5.794416427612305, 6.055173873901367, 6.31593132019043, 6.576688289642334, 6.837445259094238, 7.098202705383301, 7.358960151672363, 7.619717121124268, 7.880474090576172, 8.141231536865234]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 13.0, 10.0, 4.0, 13.0, 20.0, 8.0, 19.0, 28.0, 33.0, 29.0, 27.0, 38.0, 23.0, 41.0, 34.0, 33.0, 42.0, 43.0, 36.0, 41.0, 29.0, 39.0, 33.0, 47.0, 32.0, 37.0, 32.0, 20.0, 20.0, 25.0, 34.0, 17.0, 15.0, 15.0, 6.0, 15.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.270878791809082, -5.108799934387207, -4.946721076965332, -4.784642696380615, -4.62256383895874, -4.460484981536865, -4.29840612411499, -4.136327266693115, -3.9742486476898193, -3.8121697902679443, -3.6500911712646484, -3.4880123138427734, -3.3259334564208984, -3.1638548374176025, -3.0017759799957275, -2.8396973609924316, -2.6776185035705566, -2.5155396461486816, -2.3534610271453857, -2.1913821697235107, -2.029303550720215, -1.8672246932983398, -1.7051458358764648, -1.5430670976638794, -1.380988359451294, -1.2189096212387085, -1.056830883026123, -0.894752025604248, -0.7326732873916626, -0.5705945491790771, -0.4085157513618469, -0.2464369535446167, -0.08435773849487305, 0.07772102952003479, 0.23979979753494263, 0.40187856554985046, 0.5639573335647583, 0.7260360717773438, 0.888114869594574, 1.0501936674118042, 1.2122724056243896, 1.374351143836975, 1.5364298820495605, 1.6985087394714355, 1.860587477684021, 2.0226662158966064, 2.1847450733184814, 2.3468236923217773, 2.5089025497436523, 2.6709814071655273, 2.8330600261688232, 2.9951388835906982, 3.157217502593994, 3.319296360015869, 3.481375217437744, 3.643454074859619, 3.805532693862915, 3.96761155128479, 4.129690170288086, 4.291769027709961, 4.453847885131836, 4.615926742553711, 4.778005123138428, 4.940083980560303, 5.102162837982178]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 5.0, 7.0, 8.0, 11.0, 13.0, 34.0, 47.0, 66.0, 117.0, 163.0, 278.0, 393.0, 670.0, 1072.0, 1888.0, 3306.0, 5885.0, 10399.0, 20285.0, 41019.0, 90970.0, 218605.0, 553826.0, 1147926.0, 1151243.0, 556718.0, 216571.0, 88194.0, 40015.0, 19913.0, 10384.0, 5698.0, 3407.0, 1891.0, 1208.0, 756.0, 442.0, 302.0, 185.0, 123.0, 83.0, 59.0, 35.0, 25.0, 12.0, 11.0, 5.0, 4.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03125, -9.7177734375, -9.404296875, -9.0908203125, -8.77734375, -8.4638671875, -8.150390625, -7.8369140625, -7.5234375, -7.2099609375, -6.896484375, -6.5830078125, -6.26953125, -5.9560546875, -5.642578125, -5.3291015625, -5.015625, -4.7021484375, -4.388671875, -4.0751953125, -3.76171875, -3.4482421875, -3.134765625, -2.8212890625, -2.5078125, -2.1943359375, -1.880859375, -1.5673828125, -1.25390625, -0.9404296875, -0.626953125, -0.3134765625, 0.0, 0.3134765625, 0.626953125, 0.9404296875, 1.25390625, 1.5673828125, 1.880859375, 2.1943359375, 2.5078125, 2.8212890625, 3.134765625, 3.4482421875, 3.76171875, 4.0751953125, 4.388671875, 4.7021484375, 5.015625, 5.3291015625, 5.642578125, 5.9560546875, 6.26953125, 6.5830078125, 6.896484375, 7.2099609375, 7.5234375, 7.8369140625, 8.150390625, 8.4638671875, 8.77734375, 9.0908203125, 9.404296875, 9.7177734375, 10.03125]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 5.0, 5.0, 8.0, 10.0, 11.0, 18.0, 15.0, 18.0, 21.0, 25.0, 31.0, 26.0, 34.0, 32.0, 29.0, 42.0, 39.0, 33.0, 39.0, 41.0, 34.0, 35.0, 46.0, 34.0, 43.0, 27.0, 33.0, 36.0, 24.0, 29.0, 25.0, 21.0, 14.0, 21.0, 19.0, 15.0, 8.0, 11.0, 12.0, 7.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.33984375, -4.208984375, -4.078125, -3.947265625, -3.81640625, -3.685546875, -3.5546875, -3.423828125, -3.29296875, -3.162109375, -3.03125, -2.900390625, -2.76953125, -2.638671875, -2.5078125, -2.376953125, -2.24609375, -2.115234375, -1.984375, -1.853515625, -1.72265625, -1.591796875, -1.4609375, -1.330078125, -1.19921875, -1.068359375, -0.9375, -0.806640625, -0.67578125, -0.544921875, -0.4140625, -0.283203125, -0.15234375, -0.021484375, 0.109375, 0.240234375, 0.37109375, 0.501953125, 0.6328125, 0.763671875, 0.89453125, 1.025390625, 1.15625, 1.287109375, 1.41796875, 1.548828125, 1.6796875, 1.810546875, 1.94140625, 2.072265625, 2.203125, 2.333984375, 2.46484375, 2.595703125, 2.7265625, 2.857421875, 2.98828125, 3.119140625, 3.25, 3.380859375, 3.51171875, 3.642578125, 3.7734375, 3.904296875, 4.03515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 7.0, 15.0, 33.0, 49.0, 66.0, 113.0, 133.0, 203.0, 327.0, 499.0, 700.0, 1098.0, 1592.0, 2490.0, 3782.0, 6051.0, 9608.0, 15788.0, 25943.0, 43763.0, 75909.0, 136455.0, 251503.0, 458018.0, 747012.0, 881119.0, 663363.0, 383922.0, 209589.0, 114571.0, 64441.0, 36977.0, 22079.0, 13452.0, 8188.0, 5282.0, 3443.0, 2202.0, 1489.0, 937.0, 650.0, 485.0, 284.0, 225.0, 141.0, 91.0, 67.0, 29.0, 37.0, 19.0, 11.0, 11.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-8.0859375, -7.83599853515625, -7.5860595703125, -7.33612060546875, -7.086181640625, -6.83624267578125, -6.5863037109375, -6.33636474609375, -6.08642578125, -5.83648681640625, -5.5865478515625, -5.33660888671875, -5.086669921875, -4.83673095703125, -4.5867919921875, -4.33685302734375, -4.0869140625, -3.83697509765625, -3.5870361328125, -3.33709716796875, -3.087158203125, -2.83721923828125, -2.5872802734375, -2.33734130859375, -2.08740234375, -1.83746337890625, -1.5875244140625, -1.33758544921875, -1.087646484375, -0.83770751953125, -0.5877685546875, -0.33782958984375, -0.087890625, 0.16204833984375, 0.4119873046875, 0.66192626953125, 0.911865234375, 1.16180419921875, 1.4117431640625, 1.66168212890625, 1.91162109375, 2.16156005859375, 2.4114990234375, 2.66143798828125, 2.911376953125, 3.16131591796875, 3.4112548828125, 3.66119384765625, 3.9111328125, 4.16107177734375, 4.4110107421875, 4.66094970703125, 4.910888671875, 5.16082763671875, 5.4107666015625, 5.66070556640625, 5.91064453125, 6.16058349609375, 6.4105224609375, 6.66046142578125, 6.910400390625, 7.16033935546875, 7.4102783203125, 7.66021728515625, 7.91015625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 8.0, 9.0, 10.0, 21.0, 19.0, 24.0, 25.0, 31.0, 54.0, 61.0, 62.0, 89.0, 104.0, 142.0, 180.0, 216.0, 221.0, 256.0, 296.0, 288.0, 306.0, 259.0, 274.0, 199.0, 182.0, 159.0, 122.0, 98.0, 72.0, 67.0, 49.0, 39.0, 24.0, 25.0, 14.0, 19.0, 11.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.04296875, -2.954254150390625, -2.86553955078125, -2.776824951171875, -2.6881103515625, -2.599395751953125, -2.51068115234375, -2.421966552734375, -2.333251953125, -2.244537353515625, -2.15582275390625, -2.067108154296875, -1.9783935546875, -1.889678955078125, -1.80096435546875, -1.712249755859375, -1.62353515625, -1.534820556640625, -1.44610595703125, -1.357391357421875, -1.2686767578125, -1.179962158203125, -1.09124755859375, -1.002532958984375, -0.913818359375, -0.825103759765625, -0.73638916015625, -0.647674560546875, -0.5589599609375, -0.470245361328125, -0.38153076171875, -0.292816162109375, -0.2041015625, -0.115386962890625, -0.02667236328125, 0.062042236328125, 0.1507568359375, 0.239471435546875, 0.32818603515625, 0.416900634765625, 0.505615234375, 0.594329833984375, 0.68304443359375, 0.771759033203125, 0.8604736328125, 0.949188232421875, 1.03790283203125, 1.126617431640625, 1.21533203125, 1.304046630859375, 1.39276123046875, 1.481475830078125, 1.5701904296875, 1.658905029296875, 1.74761962890625, 1.836334228515625, 1.925048828125, 2.013763427734375, 2.10247802734375, 2.191192626953125, 2.2799072265625, 2.368621826171875, 2.45733642578125, 2.546051025390625, 2.634765625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 3.0, 10.0, 4.0, 15.0, 14.0, 17.0, 29.0, 17.0, 31.0, 41.0, 39.0, 76.0, 62.0, 75.0, 70.0, 74.0, 64.0, 57.0, 42.0, 57.0, 50.0, 28.0, 28.0, 14.0, 23.0, 11.0, 11.0, 9.0, 3.0, 9.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.641690254211426, -11.29724407196045, -10.952796936035156, -10.60835075378418, -10.263903617858887, -9.91945743560791, -9.575010299682617, -9.23056411743164, -8.886117935180664, -8.541671752929688, -8.197224617004395, -7.852778434753418, -7.508331298828125, -7.163885116577148, -6.819438457489014, -6.474991798400879, -6.130544662475586, -5.786098003387451, -5.441651344299316, -5.09720516204834, -4.752758026123047, -4.40831184387207, -4.0638651847839355, -3.719418525695801, -3.374971866607666, -3.0305252075195312, -2.6860785484313965, -2.341632127761841, -1.997185468673706, -1.6527388095855713, -1.3082923889160156, -0.9638457298278809, -0.6193981170654297, -0.2749515175819397, 0.06949508190155029, 0.4139416217803955, 0.7583882808685303, 1.102834939956665, 1.4472813606262207, 1.7917280197143555, 2.1361746788024902, 2.480621337890625, 2.8250679969787598, 3.1695144176483154, 3.51396107673645, 3.858407735824585, 4.202854156494141, 4.547300815582275, 4.89174747467041, 5.236194133758545, 5.58064079284668, 5.925086975097656, 6.269534111022949, 6.613980293273926, 6.9584269523620605, 7.302873611450195, 7.64732027053833, 7.991766929626465, 8.336213111877441, 8.680660247802734, 9.025106430053711, 9.369553565979004, 9.71399974822998, 10.058446884155273, 10.40289306640625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 12.0, 15.0, 10.0, 14.0, 18.0, 14.0, 29.0, 24.0, 29.0, 25.0, 31.0, 31.0, 39.0, 35.0, 37.0, 49.0, 47.0, 45.0, 35.0, 40.0, 30.0, 34.0, 36.0, 31.0, 40.0, 40.0, 29.0, 20.0, 20.0, 25.0, 20.0, 9.0, 14.0, 12.0, 13.0, 9.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.996007442474365, -5.813138484954834, -5.630269527435303, -5.447400093078613, -5.264531135559082, -5.081662178039551, -4.8987932205200195, -4.715924263000488, -4.533055305480957, -4.350186347961426, -4.1673173904418945, -3.984448194503784, -3.801579236984253, -3.6187100410461426, -3.4358410835266113, -3.25297212600708, -3.0701029300689697, -2.8872339725494385, -2.704364776611328, -2.521495819091797, -2.3386268615722656, -2.1557579040527344, -1.972888708114624, -1.7900197505950928, -1.607150673866272, -1.4242815971374512, -1.24141263961792, -1.0585435628890991, -0.8756745457649231, -0.6928055286407471, -0.5099364519119263, -0.327067494392395, -0.14419841766357422, 0.038670614361763, 0.22153964638710022, 0.40440869331359863, 0.5872777104377747, 0.7701467275619507, 0.9530158042907715, 1.1358847618103027, 1.3187538385391235, 1.5016229152679443, 1.6844918727874756, 1.8673609495162964, 2.050230026245117, 2.2330989837646484, 2.4159679412841797, 2.598836898803711, 2.7817060947418213, 2.9645750522613525, 3.147444248199463, 3.330313205718994, 3.5131821632385254, 3.6960511207580566, 3.878920316696167, 4.061789512634277, 4.244658470153809, 4.42752742767334, 4.610396385192871, 4.793265342712402, 4.976134777069092, 5.159003734588623, 5.341872692108154, 5.5247416496276855, 5.707610607147217]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 29.0, 16.0, 28.0, 59.0, 81.0, 132.0, 215.0, 283.0, 453.0, 687.0, 1127.0, 1780.0, 2699.0, 4572.0, 7536.0, 12563.0, 21458.0, 35885.0, 59743.0, 96527.0, 141020.0, 172421.0, 163778.0, 123172.0, 80934.0, 48651.0, 28903.0, 17122.0, 10405.0, 6106.0, 3736.0, 2368.0, 1418.0, 934.0, 561.0, 376.0, 267.0, 154.0, 105.0, 81.0, 56.0, 29.0, 28.0, 15.0, 6.0, 8.0, 4.0, 7.0, 5.0, 0.0, 2.0, 1.0], "bins": [-4.65625, -4.51849365234375, -4.3807373046875, -4.24298095703125, -4.105224609375, -3.96746826171875, -3.8297119140625, -3.69195556640625, -3.55419921875, -3.41644287109375, -3.2786865234375, -3.14093017578125, -3.003173828125, -2.86541748046875, -2.7276611328125, -2.58990478515625, -2.4521484375, -2.31439208984375, -2.1766357421875, -2.03887939453125, -1.901123046875, -1.76336669921875, -1.6256103515625, -1.48785400390625, -1.35009765625, -1.21234130859375, -1.0745849609375, -0.93682861328125, -0.799072265625, -0.66131591796875, -0.5235595703125, -0.38580322265625, -0.248046875, -0.11029052734375, 0.0274658203125, 0.16522216796875, 0.302978515625, 0.44073486328125, 0.5784912109375, 0.71624755859375, 0.85400390625, 0.99176025390625, 1.1295166015625, 1.26727294921875, 1.405029296875, 1.54278564453125, 1.6805419921875, 1.81829833984375, 1.9560546875, 2.09381103515625, 2.2315673828125, 2.36932373046875, 2.507080078125, 2.64483642578125, 2.7825927734375, 2.92034912109375, 3.05810546875, 3.19586181640625, 3.3336181640625, 3.47137451171875, 3.609130859375, 3.74688720703125, 3.8846435546875, 4.02239990234375, 4.16015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 10.0, 11.0, 11.0, 13.0, 18.0, 15.0, 17.0, 22.0, 16.0, 17.0, 21.0, 24.0, 23.0, 19.0, 39.0, 42.0, 41.0, 43.0, 40.0, 42.0, 32.0, 27.0, 35.0, 32.0, 34.0, 31.0, 30.0, 36.0, 30.0, 29.0, 18.0, 28.0, 21.0, 10.0, 18.0, 12.0, 10.0, 18.0, 9.0, 6.0, 9.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0], "bins": [-5.9453125, -5.7720947265625, -5.598876953125, -5.4256591796875, -5.25244140625, -5.0792236328125, -4.906005859375, -4.7327880859375, -4.5595703125, -4.3863525390625, -4.213134765625, -4.0399169921875, -3.86669921875, -3.6934814453125, -3.520263671875, -3.3470458984375, -3.173828125, -3.0006103515625, -2.827392578125, -2.6541748046875, -2.48095703125, -2.3077392578125, -2.134521484375, -1.9613037109375, -1.7880859375, -1.6148681640625, -1.441650390625, -1.2684326171875, -1.09521484375, -0.9219970703125, -0.748779296875, -0.5755615234375, -0.40234375, -0.2291259765625, -0.055908203125, 0.1173095703125, 0.29052734375, 0.4637451171875, 0.636962890625, 0.8101806640625, 0.9833984375, 1.1566162109375, 1.329833984375, 1.5030517578125, 1.67626953125, 1.8494873046875, 2.022705078125, 2.1959228515625, 2.369140625, 2.5423583984375, 2.715576171875, 2.8887939453125, 3.06201171875, 3.2352294921875, 3.408447265625, 3.5816650390625, 3.7548828125, 3.9281005859375, 4.101318359375, 4.2745361328125, 4.44775390625, 4.6209716796875, 4.794189453125, 4.9674072265625, 5.140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 10.0, 14.0, 9.0, 21.0, 29.0, 27.0, 43.0, 68.0, 95.0, 136.0, 233.0, 369.0, 516.0, 905.0, 1526.0, 2657.0, 4736.0, 9143.0, 18226.0, 37078.0, 77481.0, 155263.0, 251213.0, 231105.0, 130367.0, 64044.0, 30582.0, 15010.0, 7715.0, 4041.0, 2309.0, 1273.0, 804.0, 503.0, 308.0, 204.0, 159.0, 113.0, 57.0, 44.0, 27.0, 24.0, 18.0, 16.0, 9.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.57421875, -7.3505859375, -7.126953125, -6.9033203125, -6.6796875, -6.4560546875, -6.232421875, -6.0087890625, -5.78515625, -5.5615234375, -5.337890625, -5.1142578125, -4.890625, -4.6669921875, -4.443359375, -4.2197265625, -3.99609375, -3.7724609375, -3.548828125, -3.3251953125, -3.1015625, -2.8779296875, -2.654296875, -2.4306640625, -2.20703125, -1.9833984375, -1.759765625, -1.5361328125, -1.3125, -1.0888671875, -0.865234375, -0.6416015625, -0.41796875, -0.1943359375, 0.029296875, 0.2529296875, 0.4765625, 0.7001953125, 0.923828125, 1.1474609375, 1.37109375, 1.5947265625, 1.818359375, 2.0419921875, 2.265625, 2.4892578125, 2.712890625, 2.9365234375, 3.16015625, 3.3837890625, 3.607421875, 3.8310546875, 4.0546875, 4.2783203125, 4.501953125, 4.7255859375, 4.94921875, 5.1728515625, 5.396484375, 5.6201171875, 5.84375, 6.0673828125, 6.291015625, 6.5146484375, 6.73828125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 12.0, 5.0, 11.0, 16.0, 15.0, 13.0, 21.0, 25.0, 24.0, 35.0, 18.0, 23.0, 39.0, 30.0, 33.0, 34.0, 28.0, 36.0, 40.0, 39.0, 45.0, 32.0, 42.0, 36.0, 32.0, 29.0, 27.0, 19.0, 30.0, 34.0, 26.0, 19.0, 20.0, 19.0, 24.0, 12.0, 9.0, 10.0, 4.0, 7.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.16796875, -3.063690185546875, -2.95941162109375, -2.855133056640625, -2.7508544921875, -2.646575927734375, -2.54229736328125, -2.438018798828125, -2.333740234375, -2.229461669921875, -2.12518310546875, -2.020904541015625, -1.9166259765625, -1.812347412109375, -1.70806884765625, -1.603790283203125, -1.49951171875, -1.395233154296875, -1.29095458984375, -1.186676025390625, -1.0823974609375, -0.978118896484375, -0.87384033203125, -0.769561767578125, -0.665283203125, -0.561004638671875, -0.45672607421875, -0.352447509765625, -0.2481689453125, -0.143890380859375, -0.03961181640625, 0.064666748046875, 0.1689453125, 0.273223876953125, 0.37750244140625, 0.481781005859375, 0.5860595703125, 0.690338134765625, 0.79461669921875, 0.898895263671875, 1.003173828125, 1.107452392578125, 1.21173095703125, 1.316009521484375, 1.4202880859375, 1.524566650390625, 1.62884521484375, 1.733123779296875, 1.83740234375, 1.941680908203125, 2.04595947265625, 2.150238037109375, 2.2545166015625, 2.358795166015625, 2.46307373046875, 2.567352294921875, 2.671630859375, 2.775909423828125, 2.88018798828125, 2.984466552734375, 3.0887451171875, 3.193023681640625, 3.29730224609375, 3.401580810546875, 3.505859375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 12.0, 11.0, 10.0, 28.0, 38.0, 51.0, 76.0, 101.0, 165.0, 297.0, 477.0, 770.0, 1237.0, 2091.0, 3840.0, 7309.0, 14701.0, 30860.0, 69290.0, 160030.0, 300929.0, 246790.0, 113532.0, 49501.0, 22575.0, 10852.0, 5555.0, 3103.0, 1708.0, 991.0, 580.0, 365.0, 218.0, 172.0, 87.0, 70.0, 42.0, 22.0, 23.0, 18.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.51171875, -4.3741455078125, -4.236572265625, -4.0989990234375, -3.96142578125, -3.8238525390625, -3.686279296875, -3.5487060546875, -3.4111328125, -3.2735595703125, -3.135986328125, -2.9984130859375, -2.86083984375, -2.7232666015625, -2.585693359375, -2.4481201171875, -2.310546875, -2.1729736328125, -2.035400390625, -1.8978271484375, -1.76025390625, -1.6226806640625, -1.485107421875, -1.3475341796875, -1.2099609375, -1.0723876953125, -0.934814453125, -0.7972412109375, -0.65966796875, -0.5220947265625, -0.384521484375, -0.2469482421875, -0.109375, 0.0281982421875, 0.165771484375, 0.3033447265625, 0.44091796875, 0.5784912109375, 0.716064453125, 0.8536376953125, 0.9912109375, 1.1287841796875, 1.266357421875, 1.4039306640625, 1.54150390625, 1.6790771484375, 1.816650390625, 1.9542236328125, 2.091796875, 2.2293701171875, 2.366943359375, 2.5045166015625, 2.64208984375, 2.7796630859375, 2.917236328125, 3.0548095703125, 3.1923828125, 3.3299560546875, 3.467529296875, 3.6051025390625, 3.74267578125, 3.8802490234375, 4.017822265625, 4.1553955078125, 4.29296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 3.0, 12.0, 15.0, 34.0, 35.0, 61.0, 73.0, 104.0, 99.0, 129.0, 108.0, 76.0, 74.0, 47.0, 40.0, 29.0, 20.0, 11.0, 6.0, 11.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023627281188964844, -0.0002266019582748413, -0.00021693110466003418, -0.00020726025104522705, -0.00019758939743041992, -0.0001879185438156128, -0.00017824769020080566, -0.00016857683658599854, -0.0001589059829711914, -0.00014923512935638428, -0.00013956427574157715, -0.00012989342212677002, -0.00012022256851196289, -0.00011055171489715576, -0.00010088086128234863, -9.12100076675415e-05, -8.153915405273438e-05, -7.186830043792725e-05, -6.219744682312012e-05, -5.252659320831299e-05, -4.285573959350586e-05, -3.318488597869873e-05, -2.35140323638916e-05, -1.3843178749084473e-05, -4.172325134277344e-06, 5.498528480529785e-06, 1.5169382095336914e-05, 2.4840235710144043e-05, 3.451108932495117e-05, 4.41819429397583e-05, 5.385279655456543e-05, 6.352365016937256e-05, 7.319450378417969e-05, 8.286535739898682e-05, 9.253621101379395e-05, 0.00010220706462860107, 0.0001118779182434082, 0.00012154877185821533, 0.00013121962547302246, 0.0001408904790878296, 0.00015056133270263672, 0.00016023218631744385, 0.00016990303993225098, 0.0001795738935470581, 0.00018924474716186523, 0.00019891560077667236, 0.0002085864543914795, 0.00021825730800628662, 0.00022792816162109375, 0.00023759901523590088, 0.000247269868850708, 0.00025694072246551514, 0.00026661157608032227, 0.0002762824296951294, 0.0002859532833099365, 0.00029562413692474365, 0.0003052949905395508, 0.0003149658441543579, 0.00032463669776916504, 0.00033430755138397217, 0.0003439784049987793, 0.0003536492586135864, 0.00036332011222839355, 0.0003729909658432007, 0.0003826618194580078]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 27.0, 39.0, 56.0, 68.0, 107.0, 145.0, 232.0, 323.0, 571.0, 976.0, 1572.0, 2621.0, 4733.0, 8641.0, 16461.0, 31093.0, 61286.0, 117472.0, 195105.0, 230628.0, 172535.0, 97414.0, 50344.0, 25480.0, 13263.0, 7278.0, 4134.0, 2350.0, 1395.0, 761.0, 470.0, 320.0, 177.0, 121.0, 87.0, 74.0, 45.0, 26.0, 28.0, 21.0, 9.0, 10.0, 7.0, 3.0, 0.0, 6.0, 1.0, 1.0, 3.0], "bins": [-4.09375, -3.974578857421875, -3.85540771484375, -3.736236572265625, -3.6170654296875, -3.497894287109375, -3.37872314453125, -3.259552001953125, -3.140380859375, -3.021209716796875, -2.90203857421875, -2.782867431640625, -2.6636962890625, -2.544525146484375, -2.42535400390625, -2.306182861328125, -2.18701171875, -2.067840576171875, -1.94866943359375, -1.829498291015625, -1.7103271484375, -1.591156005859375, -1.47198486328125, -1.352813720703125, -1.233642578125, -1.114471435546875, -0.99530029296875, -0.876129150390625, -0.7569580078125, -0.637786865234375, -0.51861572265625, -0.399444580078125, -0.2802734375, -0.161102294921875, -0.04193115234375, 0.077239990234375, 0.1964111328125, 0.315582275390625, 0.43475341796875, 0.553924560546875, 0.673095703125, 0.792266845703125, 0.91143798828125, 1.030609130859375, 1.1497802734375, 1.268951416015625, 1.38812255859375, 1.507293701171875, 1.62646484375, 1.745635986328125, 1.86480712890625, 1.983978271484375, 2.1031494140625, 2.222320556640625, 2.34149169921875, 2.460662841796875, 2.579833984375, 2.699005126953125, 2.81817626953125, 2.937347412109375, 3.0565185546875, 3.175689697265625, 3.29486083984375, 3.414031982421875, 3.533203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 8.0, 6.0, 6.0, 20.0, 14.0, 19.0, 16.0, 32.0, 30.0, 31.0, 48.0, 57.0, 57.0, 53.0, 75.0, 66.0, 57.0, 63.0, 58.0, 52.0, 46.0, 37.0, 30.0, 20.0, 19.0, 13.0, 19.0, 12.0, 8.0, 9.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-1.1826171875, -1.1511459350585938, -1.1196746826171875, -1.0882034301757812, -1.056732177734375, -1.0252609252929688, -0.9937896728515625, -0.9623184204101562, -0.93084716796875, -0.8993759155273438, -0.8679046630859375, -0.8364334106445312, -0.804962158203125, -0.7734909057617188, -0.7420196533203125, -0.7105484008789062, -0.6790771484375, -0.6476058959960938, -0.6161346435546875, -0.5846633911132812, -0.553192138671875, -0.5217208862304688, -0.4902496337890625, -0.45877838134765625, -0.42730712890625, -0.39583587646484375, -0.3643646240234375, -0.33289337158203125, -0.301422119140625, -0.26995086669921875, -0.2384796142578125, -0.20700836181640625, -0.175537109375, -0.14406585693359375, -0.1125946044921875, -0.08112335205078125, -0.049652099609375, -0.01818084716796875, 0.0132904052734375, 0.04476165771484375, 0.07623291015625, 0.10770416259765625, 0.1391754150390625, 0.17064666748046875, 0.202117919921875, 0.23358917236328125, 0.2650604248046875, 0.29653167724609375, 0.3280029296875, 0.35947418212890625, 0.3909454345703125, 0.42241668701171875, 0.453887939453125, 0.48535919189453125, 0.5168304443359375, 0.5483016967773438, 0.57977294921875, 0.6112442016601562, 0.6427154541015625, 0.6741867065429688, 0.705657958984375, 0.7371292114257812, 0.7686004638671875, 0.8000717163085938, 0.83154296875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 6.0, 6.0, 11.0, 9.0, 12.0, 26.0, 20.0, 25.0, 38.0, 34.0, 49.0, 61.0, 71.0, 89.0, 78.0, 79.0, 59.0, 48.0, 50.0, 52.0, 40.0, 36.0, 20.0, 13.0, 13.0, 14.0, 7.0, 12.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.844240188598633, -11.490038871765137, -11.135836601257324, -10.781635284423828, -10.427433013916016, -10.07323169708252, -9.719030380249023, -9.364828109741211, -9.010625839233398, -8.656424522399902, -8.30222225189209, -7.948020935058594, -7.593818664550781, -7.239617347717285, -6.885415554046631, -6.531213760375977, -6.1770124435424805, -5.822810649871826, -5.468608856201172, -5.114407539367676, -4.760205268859863, -4.406003952026367, -4.051802158355713, -3.6976003646850586, -3.3433985710144043, -2.98919677734375, -2.6349949836730957, -2.2807934284210205, -1.9265916347503662, -1.572389841079712, -1.2181882858276367, -0.8639864921569824, -0.5097856521606445, -0.155583918094635, 0.1986178159713745, 0.5528194904327393, 0.9070212841033936, 1.2612230777740479, 1.615424633026123, 1.9696264266967773, 2.3238282203674316, 2.678030014038086, 3.0322318077087402, 3.3864333629608154, 3.7406351566314697, 4.094837188720703, 4.449038505554199, 4.8032402992248535, 5.157442092895508, 5.511643886566162, 5.865845680236816, 6.2200469970703125, 6.574249267578125, 6.928450584411621, 7.282652378082275, 7.63685417175293, 7.991055965423584, 8.345257759094238, 8.699459075927734, 9.053661346435547, 9.407862663269043, 9.762064933776855, 10.116266250610352, 10.470468521118164, 10.82466983795166]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 9.0, 18.0, 12.0, 8.0, 20.0, 15.0, 30.0, 28.0, 25.0, 27.0, 28.0, 30.0, 34.0, 34.0, 41.0, 50.0, 35.0, 59.0, 40.0, 29.0, 40.0, 26.0, 35.0, 39.0, 38.0, 34.0, 36.0, 19.0, 20.0, 19.0, 18.0, 20.0, 11.0, 16.0, 12.0, 11.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.831948280334473, -5.648662090301514, -5.4653754234313965, -5.2820892333984375, -5.09880256652832, -4.915516376495361, -4.732230186462402, -4.548943519592285, -4.365656852722168, -4.182370662689209, -3.999083995819092, -3.815797805786133, -3.6325111389160156, -3.4492249488830566, -3.2659385204315186, -3.0826520919799805, -2.8993659019470215, -2.7160794734954834, -2.5327930450439453, -2.3495068550109863, -2.166220188140869, -1.9829338788986206, -1.799647569656372, -1.616361141204834, -1.433074712753296, -1.2497882843017578, -1.0665018558502197, -0.8832155466079712, -0.6999291181564331, -0.516642689704895, -0.3333563804626465, -0.1500699520111084, 0.033215999603271484, 0.21650239825248718, 0.3997887969017029, 0.5830751657485962, 0.7663615942001343, 0.9496480226516724, 1.132934331893921, 1.316220760345459, 1.499507188796997, 1.6827936172485352, 1.8660800457000732, 2.0493664741516113, 2.2326526641845703, 2.4159393310546875, 2.5992255210876465, 2.7825119495391846, 2.9657983779907227, 3.1490848064422607, 3.332371234893799, 3.515657424926758, 3.698944091796875, 3.882230281829834, 4.065516471862793, 4.24880313873291, 4.432089805603027, 4.615375995635986, 4.7986626625061035, 4.9819488525390625, 5.16523551940918, 5.348521709442139, 5.531807899475098, 5.715094566345215, 5.898380756378174]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 9.0, 12.0, 22.0, 37.0, 42.0, 77.0, 118.0, 173.0, 241.0, 394.0, 620.0, 1013.0, 1602.0, 2787.0, 4515.0, 7272.0, 12239.0, 20649.0, 34321.0, 54779.0, 85272.0, 121978.0, 152267.0, 157236.0, 132279.0, 95638.0, 63164.0, 39182.0, 24161.0, 14363.0, 8644.0, 5179.0, 3030.0, 1978.0, 1182.0, 727.0, 492.0, 291.0, 203.0, 124.0, 86.0, 53.0, 36.0, 17.0, 19.0, 7.0, 7.0, 6.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-5.75, -5.5765380859375, -5.403076171875, -5.2296142578125, -5.05615234375, -4.8826904296875, -4.709228515625, -4.5357666015625, -4.3623046875, -4.1888427734375, -4.015380859375, -3.8419189453125, -3.66845703125, -3.4949951171875, -3.321533203125, -3.1480712890625, -2.974609375, -2.8011474609375, -2.627685546875, -2.4542236328125, -2.28076171875, -2.1072998046875, -1.933837890625, -1.7603759765625, -1.5869140625, -1.4134521484375, -1.239990234375, -1.0665283203125, -0.89306640625, -0.7196044921875, -0.546142578125, -0.3726806640625, -0.19921875, -0.0257568359375, 0.147705078125, 0.3211669921875, 0.49462890625, 0.6680908203125, 0.841552734375, 1.0150146484375, 1.1884765625, 1.3619384765625, 1.535400390625, 1.7088623046875, 1.88232421875, 2.0557861328125, 2.229248046875, 2.4027099609375, 2.576171875, 2.7496337890625, 2.923095703125, 3.0965576171875, 3.27001953125, 3.4434814453125, 3.616943359375, 3.7904052734375, 3.9638671875, 4.1373291015625, 4.310791015625, 4.4842529296875, 4.65771484375, 4.8311767578125, 5.004638671875, 5.1781005859375, 5.3515625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 3.0, 9.0, 4.0, 11.0, 14.0, 14.0, 14.0, 14.0, 19.0, 24.0, 28.0, 31.0, 24.0, 37.0, 36.0, 43.0, 39.0, 44.0, 46.0, 44.0, 39.0, 35.0, 34.0, 40.0, 33.0, 38.0, 31.0, 28.0, 25.0, 31.0, 13.0, 29.0, 24.0, 16.0, 13.0, 14.0, 12.0, 10.0, 3.0, 10.0, 4.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.30859375, -6.117431640625, -5.92626953125, -5.735107421875, -5.5439453125, -5.352783203125, -5.16162109375, -4.970458984375, -4.779296875, -4.588134765625, -4.39697265625, -4.205810546875, -4.0146484375, -3.823486328125, -3.63232421875, -3.441162109375, -3.25, -3.058837890625, -2.86767578125, -2.676513671875, -2.4853515625, -2.294189453125, -2.10302734375, -1.911865234375, -1.720703125, -1.529541015625, -1.33837890625, -1.147216796875, -0.9560546875, -0.764892578125, -0.57373046875, -0.382568359375, -0.19140625, -0.000244140625, 0.19091796875, 0.382080078125, 0.5732421875, 0.764404296875, 0.95556640625, 1.146728515625, 1.337890625, 1.529052734375, 1.72021484375, 1.911376953125, 2.1025390625, 2.293701171875, 2.48486328125, 2.676025390625, 2.8671875, 3.058349609375, 3.24951171875, 3.440673828125, 3.6318359375, 3.822998046875, 4.01416015625, 4.205322265625, 4.396484375, 4.587646484375, 4.77880859375, 4.969970703125, 5.1611328125, 5.352294921875, 5.54345703125, 5.734619140625, 5.92578125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 10.0, 18.0, 41.0, 63.0, 99.0, 149.0, 242.0, 383.0, 768.0, 1195.0, 2040.0, 3637.0, 6121.0, 10578.0, 18146.0, 30587.0, 51259.0, 80724.0, 118069.0, 150908.0, 161304.0, 139403.0, 103427.0, 67639.0, 41702.0, 24992.0, 14642.0, 8435.0, 5019.0, 2877.0, 1658.0, 1011.0, 566.0, 322.0, 205.0, 145.0, 71.0, 35.0, 32.0, 16.0, 7.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.40625, -6.219482421875, -6.03271484375, -5.845947265625, -5.6591796875, -5.472412109375, -5.28564453125, -5.098876953125, -4.912109375, -4.725341796875, -4.53857421875, -4.351806640625, -4.1650390625, -3.978271484375, -3.79150390625, -3.604736328125, -3.41796875, -3.231201171875, -3.04443359375, -2.857666015625, -2.6708984375, -2.484130859375, -2.29736328125, -2.110595703125, -1.923828125, -1.737060546875, -1.55029296875, -1.363525390625, -1.1767578125, -0.989990234375, -0.80322265625, -0.616455078125, -0.4296875, -0.242919921875, -0.05615234375, 0.130615234375, 0.3173828125, 0.504150390625, 0.69091796875, 0.877685546875, 1.064453125, 1.251220703125, 1.43798828125, 1.624755859375, 1.8115234375, 1.998291015625, 2.18505859375, 2.371826171875, 2.55859375, 2.745361328125, 2.93212890625, 3.118896484375, 3.3056640625, 3.492431640625, 3.67919921875, 3.865966796875, 4.052734375, 4.239501953125, 4.42626953125, 4.613037109375, 4.7998046875, 4.986572265625, 5.17333984375, 5.360107421875, 5.546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 13.0, 9.0, 17.0, 12.0, 15.0, 12.0, 18.0, 21.0, 26.0, 27.0, 32.0, 50.0, 54.0, 33.0, 37.0, 34.0, 33.0, 33.0, 46.0, 49.0, 40.0, 49.0, 36.0, 29.0, 34.0, 36.0, 36.0, 32.0, 25.0, 21.0, 15.0, 19.0, 18.0, 5.0, 9.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.55078125, -4.41961669921875, -4.2884521484375, -4.15728759765625, -4.026123046875, -3.89495849609375, -3.7637939453125, -3.63262939453125, -3.50146484375, -3.37030029296875, -3.2391357421875, -3.10797119140625, -2.976806640625, -2.84564208984375, -2.7144775390625, -2.58331298828125, -2.4521484375, -2.32098388671875, -2.1898193359375, -2.05865478515625, -1.927490234375, -1.79632568359375, -1.6651611328125, -1.53399658203125, -1.40283203125, -1.27166748046875, -1.1405029296875, -1.00933837890625, -0.878173828125, -0.74700927734375, -0.6158447265625, -0.48468017578125, -0.353515625, -0.22235107421875, -0.0911865234375, 0.03997802734375, 0.171142578125, 0.30230712890625, 0.4334716796875, 0.56463623046875, 0.69580078125, 0.82696533203125, 0.9581298828125, 1.08929443359375, 1.220458984375, 1.35162353515625, 1.4827880859375, 1.61395263671875, 1.7451171875, 1.87628173828125, 2.0074462890625, 2.13861083984375, 2.269775390625, 2.40093994140625, 2.5321044921875, 2.66326904296875, 2.79443359375, 2.92559814453125, 3.0567626953125, 3.18792724609375, 3.319091796875, 3.45025634765625, 3.5814208984375, 3.71258544921875, 3.84375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 8.0, 5.0, 8.0, 19.0, 35.0, 38.0, 58.0, 80.0, 127.0, 203.0, 283.0, 488.0, 722.0, 1037.0, 1604.0, 2572.0, 3905.0, 6243.0, 10024.0, 15712.0, 25242.0, 39452.0, 60695.0, 89752.0, 121665.0, 145975.0, 145479.0, 120830.0, 89059.0, 60220.0, 39241.0, 25060.0, 15801.0, 9978.0, 6187.0, 3707.0, 2456.0, 1574.0, 1017.0, 679.0, 414.0, 293.0, 194.0, 120.0, 96.0, 75.0, 36.0, 35.0, 21.0, 16.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.57421875, -2.496185302734375, -2.41815185546875, -2.340118408203125, -2.2620849609375, -2.184051513671875, -2.10601806640625, -2.027984619140625, -1.949951171875, -1.871917724609375, -1.79388427734375, -1.715850830078125, -1.6378173828125, -1.559783935546875, -1.48175048828125, -1.403717041015625, -1.32568359375, -1.247650146484375, -1.16961669921875, -1.091583251953125, -1.0135498046875, -0.935516357421875, -0.85748291015625, -0.779449462890625, -0.701416015625, -0.623382568359375, -0.54534912109375, -0.467315673828125, -0.3892822265625, -0.311248779296875, -0.23321533203125, -0.155181884765625, -0.0771484375, 0.000885009765625, 0.07891845703125, 0.156951904296875, 0.2349853515625, 0.313018798828125, 0.39105224609375, 0.469085693359375, 0.547119140625, 0.625152587890625, 0.70318603515625, 0.781219482421875, 0.8592529296875, 0.937286376953125, 1.01531982421875, 1.093353271484375, 1.17138671875, 1.249420166015625, 1.32745361328125, 1.405487060546875, 1.4835205078125, 1.561553955078125, 1.63958740234375, 1.717620849609375, 1.795654296875, 1.873687744140625, 1.95172119140625, 2.029754638671875, 2.1077880859375, 2.185821533203125, 2.26385498046875, 2.341888427734375, 2.419921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 5.0, 11.0, 8.0, 24.0, 22.0, 24.0, 21.0, 30.0, 29.0, 47.0, 50.0, 47.0, 55.0, 65.0, 54.0, 48.0, 57.0, 57.0, 37.0, 33.0, 42.0, 33.0, 32.0, 31.0, 25.0, 16.0, 17.0, 14.0, 8.0, 7.0, 7.0, 14.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024080276489257812, -0.00023199990391731262, -0.00022319704294204712, -0.00021439418196678162, -0.0002055913209915161, -0.0001967884600162506, -0.0001879855990409851, -0.0001791827380657196, -0.0001703798770904541, -0.0001615770161151886, -0.0001527741551399231, -0.0001439712941646576, -0.0001351684331893921, -0.0001263655722141266, -0.00011756271123886108, -0.00010875985026359558, -9.995698928833008e-05, -9.115412831306458e-05, -8.235126733779907e-05, -7.354840636253357e-05, -6.474554538726807e-05, -5.5942684412002563e-05, -4.713982343673706e-05, -3.833696246147156e-05, -2.9534101486206055e-05, -2.0731240510940552e-05, -1.1928379535675049e-05, -3.125518560409546e-06, 5.677342414855957e-06, 1.448020339012146e-05, 2.3283064365386963e-05, 3.2085925340652466e-05, 4.088878631591797e-05, 4.969164729118347e-05, 5.8494508266448975e-05, 6.729736924171448e-05, 7.610023021697998e-05, 8.490309119224548e-05, 9.370595216751099e-05, 0.00010250881314277649, 0.00011131167411804199, 0.0001201145350933075, 0.000128917396068573, 0.0001377202570438385, 0.000146523118019104, 0.0001553259789943695, 0.000164128839969635, 0.0001729317009449005, 0.00018173456192016602, 0.00019053742289543152, 0.00019934028387069702, 0.00020814314484596252, 0.00021694600582122803, 0.00022574886679649353, 0.00023455172777175903, 0.00024335458874702454, 0.00025215744972229004, 0.00026096031069755554, 0.00026976317167282104, 0.00027856603264808655, 0.00028736889362335205, 0.00029617175459861755, 0.00030497461557388306, 0.00031377747654914856, 0.00032258033752441406]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 12.0, 21.0, 30.0, 37.0, 54.0, 90.0, 144.0, 179.0, 290.0, 360.0, 594.0, 924.0, 1439.0, 2237.0, 3462.0, 5522.0, 8957.0, 14636.0, 24499.0, 40140.0, 65154.0, 101411.0, 139918.0, 164559.0, 153050.0, 116864.0, 78119.0, 48827.0, 29832.0, 17758.0, 11150.0, 6713.0, 4084.0, 2562.0, 1709.0, 1094.0, 723.0, 485.0, 294.0, 217.0, 110.0, 95.0, 60.0, 46.0, 36.0, 23.0, 15.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.064453125, -2.9735107421875, -2.882568359375, -2.7916259765625, -2.70068359375, -2.6097412109375, -2.518798828125, -2.4278564453125, -2.3369140625, -2.2459716796875, -2.155029296875, -2.0640869140625, -1.97314453125, -1.8822021484375, -1.791259765625, -1.7003173828125, -1.609375, -1.5184326171875, -1.427490234375, -1.3365478515625, -1.24560546875, -1.1546630859375, -1.063720703125, -0.9727783203125, -0.8818359375, -0.7908935546875, -0.699951171875, -0.6090087890625, -0.51806640625, -0.4271240234375, -0.336181640625, -0.2452392578125, -0.154296875, -0.0633544921875, 0.027587890625, 0.1185302734375, 0.20947265625, 0.3004150390625, 0.391357421875, 0.4822998046875, 0.5732421875, 0.6641845703125, 0.755126953125, 0.8460693359375, 0.93701171875, 1.0279541015625, 1.118896484375, 1.2098388671875, 1.30078125, 1.3917236328125, 1.482666015625, 1.5736083984375, 1.66455078125, 1.7554931640625, 1.846435546875, 1.9373779296875, 2.0283203125, 2.1192626953125, 2.210205078125, 2.3011474609375, 2.39208984375, 2.4830322265625, 2.573974609375, 2.6649169921875, 2.755859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 9.0, 5.0, 2.0, 11.0, 6.0, 12.0, 16.0, 18.0, 22.0, 28.0, 27.0, 25.0, 29.0, 41.0, 44.0, 45.0, 48.0, 46.0, 48.0, 47.0, 41.0, 51.0, 48.0, 48.0, 34.0, 24.0, 38.0, 21.0, 32.0, 26.0, 17.0, 14.0, 19.0, 15.0, 14.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.80126953125, -0.7725753784179688, -0.7438812255859375, -0.7151870727539062, -0.686492919921875, -0.6577987670898438, -0.6291046142578125, -0.6004104614257812, -0.57171630859375, -0.5430221557617188, -0.5143280029296875, -0.48563385009765625, -0.456939697265625, -0.42824554443359375, -0.3995513916015625, -0.37085723876953125, -0.3421630859375, -0.31346893310546875, -0.2847747802734375, -0.25608062744140625, -0.227386474609375, -0.19869232177734375, -0.1699981689453125, -0.14130401611328125, -0.11260986328125, -0.08391571044921875, -0.0552215576171875, -0.02652740478515625, 0.002166748046875, 0.03086090087890625, 0.0595550537109375, 0.08824920654296875, 0.116943359375, 0.14563751220703125, 0.1743316650390625, 0.20302581787109375, 0.231719970703125, 0.26041412353515625, 0.2891082763671875, 0.31780242919921875, 0.34649658203125, 0.37519073486328125, 0.4038848876953125, 0.43257904052734375, 0.461273193359375, 0.48996734619140625, 0.5186614990234375, 0.5473556518554688, 0.5760498046875, 0.6047439575195312, 0.6334381103515625, 0.6621322631835938, 0.690826416015625, 0.7195205688476562, 0.7482147216796875, 0.7769088745117188, 0.80560302734375, 0.8342971801757812, 0.8629913330078125, 0.8916854858398438, 0.920379638671875, 0.9490737915039062, 0.9777679443359375, 1.0064620971679688, 1.03515625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 2.0, 5.0, 6.0, 2.0, 8.0, 10.0, 9.0, 22.0, 27.0, 19.0, 32.0, 41.0, 45.0, 77.0, 61.0, 76.0, 81.0, 81.0, 65.0, 62.0, 60.0, 47.0, 38.0, 34.0, 32.0, 17.0, 11.0, 9.0, 7.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.307778358459473, -11.931976318359375, -11.556175231933594, -11.180374145507812, -10.804572105407715, -10.428770065307617, -10.052968978881836, -9.677167892456055, -9.301365852355957, -8.92556381225586, -8.549762725830078, -8.173961639404297, -7.798159599304199, -7.42235803604126, -7.04655647277832, -6.670754909515381, -6.294953346252441, -5.919151782989502, -5.5433502197265625, -5.167548656463623, -4.791747093200684, -4.415945529937744, -4.040143966674805, -3.6643424034118652, -3.288540840148926, -2.9127392768859863, -2.536937713623047, -2.1611361503601074, -1.785334587097168, -1.4095330238342285, -1.033731460571289, -0.6579298973083496, -0.28212928771972656, 0.09367227554321289, 0.46947383880615234, 0.8452754020690918, 1.2210769653320312, 1.5968785285949707, 1.9726800918579102, 2.3484816551208496, 2.724283218383789, 3.1000847816467285, 3.475886344909668, 3.8516879081726074, 4.227489471435547, 4.603291034698486, 4.979092597961426, 5.354894161224365, 5.730695724487305, 6.106497287750244, 6.482298851013184, 6.858100414276123, 7.2339019775390625, 7.609703540802002, 7.985505104064941, 8.361307144165039, 8.73710823059082, 9.112909317016602, 9.4887113571167, 9.864513397216797, 10.240314483642578, 10.61611557006836, 10.991917610168457, 11.367719650268555, 11.743520736694336]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 11.0, 9.0, 10.0, 16.0, 9.0, 18.0, 25.0, 27.0, 25.0, 29.0, 25.0, 26.0, 33.0, 38.0, 46.0, 38.0, 33.0, 52.0, 47.0, 39.0, 32.0, 48.0, 43.0, 38.0, 29.0, 34.0, 27.0, 26.0, 24.0, 21.0, 17.0, 17.0, 15.0, 13.0, 9.0, 8.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.901891231536865, -5.707763671875, -5.513636589050293, -5.319509029388428, -5.1253814697265625, -4.931253910064697, -4.737126350402832, -4.542999267578125, -4.34887170791626, -4.1547441482543945, -3.9606168270111084, -3.7664895057678223, -3.572361946105957, -3.378234386444092, -3.1841070652008057, -2.9899797439575195, -2.7958521842956543, -2.601724624633789, -2.407597303390503, -2.213469982147217, -2.0193424224853516, -1.8252149820327759, -1.6310875415802002, -1.4369601011276245, -1.2428326606750488, -1.0487052202224731, -0.8545777797698975, -0.6604503393173218, -0.4663228988647461, -0.2721954584121704, -0.07806801795959473, 0.11605942249298096, 0.31018686294555664, 0.5043143033981323, 0.698441743850708, 0.8925691843032837, 1.0866966247558594, 1.280824065208435, 1.4749515056610107, 1.6690789461135864, 1.863206386566162, 2.0573339462280273, 2.2514612674713135, 2.4455885887145996, 2.639716148376465, 2.83384370803833, 3.027971029281616, 3.2220983505249023, 3.4162259101867676, 3.610353469848633, 3.804480791091919, 3.998608112335205, 4.19273567199707, 4.3868632316589355, 4.580990791320801, 4.775117874145508, 4.969245433807373, 5.163372993469238, 5.357500076293945, 5.5516276359558105, 5.745755195617676, 5.939882755279541, 6.134010314941406, 6.328137397766113, 6.5222649574279785]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 24.0, 43.0, 61.0, 100.0, 159.0, 261.0, 381.0, 640.0, 1049.0, 1769.0, 2985.0, 5087.0, 9567.0, 18421.0, 37909.0, 83114.0, 205924.0, 530090.0, 1127762.0, 1185023.0, 581553.0, 226937.0, 91372.0, 40778.0, 19547.0, 10264.0, 5598.0, 3145.0, 1809.0, 1090.0, 669.0, 420.0, 271.0, 139.0, 108.0, 54.0, 44.0, 34.0, 16.0, 11.0, 12.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6015625, -9.2330322265625, -8.864501953125, -8.4959716796875, -8.12744140625, -7.7589111328125, -7.390380859375, -7.0218505859375, -6.6533203125, -6.2847900390625, -5.916259765625, -5.5477294921875, -5.17919921875, -4.8106689453125, -4.442138671875, -4.0736083984375, -3.705078125, -3.3365478515625, -2.968017578125, -2.5994873046875, -2.23095703125, -1.8624267578125, -1.493896484375, -1.1253662109375, -0.7568359375, -0.3883056640625, -0.019775390625, 0.3487548828125, 0.71728515625, 1.0858154296875, 1.454345703125, 1.8228759765625, 2.19140625, 2.5599365234375, 2.928466796875, 3.2969970703125, 3.66552734375, 4.0340576171875, 4.402587890625, 4.7711181640625, 5.1396484375, 5.5081787109375, 5.876708984375, 6.2452392578125, 6.61376953125, 6.9822998046875, 7.350830078125, 7.7193603515625, 8.087890625, 8.4564208984375, 8.824951171875, 9.1934814453125, 9.56201171875, 9.9305419921875, 10.299072265625, 10.6676025390625, 11.0361328125, 11.4046630859375, 11.773193359375, 12.1417236328125, 12.51025390625, 12.8787841796875, 13.247314453125, 13.6158447265625, 13.984375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 5.0, 11.0, 12.0, 7.0, 12.0, 20.0, 21.0, 24.0, 21.0, 25.0, 26.0, 29.0, 30.0, 32.0, 36.0, 32.0, 45.0, 43.0, 41.0, 40.0, 42.0, 40.0, 52.0, 31.0, 38.0, 32.0, 38.0, 30.0, 29.0, 18.0, 24.0, 17.0, 11.0, 14.0, 12.0, 7.0, 10.0, 8.0, 13.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.26953125, -5.1148681640625, -4.960205078125, -4.8055419921875, -4.65087890625, -4.4962158203125, -4.341552734375, -4.1868896484375, -4.0322265625, -3.8775634765625, -3.722900390625, -3.5682373046875, -3.41357421875, -3.2589111328125, -3.104248046875, -2.9495849609375, -2.794921875, -2.6402587890625, -2.485595703125, -2.3309326171875, -2.17626953125, -2.0216064453125, -1.866943359375, -1.7122802734375, -1.5576171875, -1.4029541015625, -1.248291015625, -1.0936279296875, -0.93896484375, -0.7843017578125, -0.629638671875, -0.4749755859375, -0.3203125, -0.1656494140625, -0.010986328125, 0.1436767578125, 0.29833984375, 0.4530029296875, 0.607666015625, 0.7623291015625, 0.9169921875, 1.0716552734375, 1.226318359375, 1.3809814453125, 1.53564453125, 1.6903076171875, 1.844970703125, 1.9996337890625, 2.154296875, 2.3089599609375, 2.463623046875, 2.6182861328125, 2.77294921875, 2.9276123046875, 3.082275390625, 3.2369384765625, 3.3916015625, 3.5462646484375, 3.700927734375, 3.8555908203125, 4.01025390625, 4.1649169921875, 4.319580078125, 4.4742431640625, 4.62890625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 12.0, 25.0, 22.0, 30.0, 60.0, 73.0, 113.0, 139.0, 230.0, 333.0, 499.0, 681.0, 1096.0, 1807.0, 2751.0, 4323.0, 7270.0, 12328.0, 21468.0, 38459.0, 71287.0, 136756.0, 272232.0, 532521.0, 888364.0, 941793.0, 604150.0, 313011.0, 157590.0, 81353.0, 43795.0, 24192.0, 13644.0, 8178.0, 5093.0, 3042.0, 1885.0, 1185.0, 787.0, 527.0, 362.0, 265.0, 167.0, 111.0, 72.0, 55.0, 42.0, 30.0, 21.0, 9.0, 14.0, 7.0, 5.0, 6.0, 3.0, 6.0, 4.0], "bins": [-10.8671875, -10.5286865234375, -10.190185546875, -9.8516845703125, -9.51318359375, -9.1746826171875, -8.836181640625, -8.4976806640625, -8.1591796875, -7.8206787109375, -7.482177734375, -7.1436767578125, -6.80517578125, -6.4666748046875, -6.128173828125, -5.7896728515625, -5.451171875, -5.1126708984375, -4.774169921875, -4.4356689453125, -4.09716796875, -3.7586669921875, -3.420166015625, -3.0816650390625, -2.7431640625, -2.4046630859375, -2.066162109375, -1.7276611328125, -1.38916015625, -1.0506591796875, -0.712158203125, -0.3736572265625, -0.03515625, 0.3033447265625, 0.641845703125, 0.9803466796875, 1.31884765625, 1.6573486328125, 1.995849609375, 2.3343505859375, 2.6728515625, 3.0113525390625, 3.349853515625, 3.6883544921875, 4.02685546875, 4.3653564453125, 4.703857421875, 5.0423583984375, 5.380859375, 5.7193603515625, 6.057861328125, 6.3963623046875, 6.73486328125, 7.0733642578125, 7.411865234375, 7.7503662109375, 8.0888671875, 8.4273681640625, 8.765869140625, 9.1043701171875, 9.44287109375, 9.7813720703125, 10.119873046875, 10.4583740234375, 10.796875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 10.0, 13.0, 14.0, 10.0, 15.0, 26.0, 40.0, 47.0, 55.0, 58.0, 81.0, 95.0, 131.0, 185.0, 211.0, 244.0, 279.0, 326.0, 308.0, 349.0, 315.0, 280.0, 208.0, 185.0, 133.0, 102.0, 98.0, 76.0, 43.0, 27.0, 35.0, 19.0, 15.0, 8.0, 14.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.719329833984375, -3.60076904296875, -3.482208251953125, -3.3636474609375, -3.245086669921875, -3.12652587890625, -3.007965087890625, -2.889404296875, -2.770843505859375, -2.65228271484375, -2.533721923828125, -2.4151611328125, -2.296600341796875, -2.17803955078125, -2.059478759765625, -1.94091796875, -1.822357177734375, -1.70379638671875, -1.585235595703125, -1.4666748046875, -1.348114013671875, -1.22955322265625, -1.110992431640625, -0.992431640625, -0.873870849609375, -0.75531005859375, -0.636749267578125, -0.5181884765625, -0.399627685546875, -0.28106689453125, -0.162506103515625, -0.0439453125, 0.074615478515625, 0.19317626953125, 0.311737060546875, 0.4302978515625, 0.548858642578125, 0.66741943359375, 0.785980224609375, 0.904541015625, 1.023101806640625, 1.14166259765625, 1.260223388671875, 1.3787841796875, 1.497344970703125, 1.61590576171875, 1.734466552734375, 1.85302734375, 1.971588134765625, 2.09014892578125, 2.208709716796875, 2.3272705078125, 2.445831298828125, 2.56439208984375, 2.682952880859375, 2.801513671875, 2.920074462890625, 3.03863525390625, 3.157196044921875, 3.2757568359375, 3.394317626953125, 3.51287841796875, 3.631439208984375, 3.75]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 5.0, 5.0, 12.0, 14.0, 18.0, 22.0, 31.0, 39.0, 41.0, 44.0, 53.0, 68.0, 68.0, 78.0, 93.0, 88.0, 60.0, 50.0, 46.0, 35.0, 31.0, 20.0, 12.0, 11.0, 11.0, 10.0, 4.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.259316444396973, -10.833648681640625, -10.407981872558594, -9.982314109802246, -9.556647300720215, -9.130979537963867, -8.705312728881836, -8.279644966125488, -7.853978157043457, -7.428310871124268, -7.002643585205078, -6.576976299285889, -6.151309013366699, -5.725641250610352, -5.29997444152832, -4.874306678771973, -4.448639392852783, -4.022972106933594, -3.5973048210144043, -3.171637535095215, -2.7459702491760254, -2.320302724838257, -1.8946354389190674, -1.468968152999878, -1.0433008670806885, -0.617633581161499, -0.1919662356376648, 0.23370110988616943, 0.6593683958053589, 1.085035800933838, 1.5107030868530273, 1.9363703727722168, 2.3620376586914062, 2.7877049446105957, 3.213372230529785, 3.6390395164489746, 4.064706802368164, 4.490374565124512, 4.916041374206543, 5.341709136962891, 5.767375946044922, 6.193043231964111, 6.618710517883301, 7.04437780380249, 7.47004508972168, 7.895712852478027, 8.321379661560059, 8.747047424316406, 9.172714233398438, 9.598381996154785, 10.024048805236816, 10.449716567993164, 10.875383377075195, 11.301051139831543, 11.726717948913574, 12.152385711669922, 12.57805347442627, 13.003721237182617, 13.429388046264648, 13.855055809020996, 14.280722618103027, 14.706390380859375, 15.132057189941406, 15.557724952697754, 15.983391761779785]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 1.0, 2.0, 3.0, 13.0, 9.0, 12.0, 15.0, 12.0, 19.0, 22.0, 20.0, 31.0, 16.0, 28.0, 41.0, 36.0, 37.0, 44.0, 44.0, 33.0, 37.0, 38.0, 50.0, 40.0, 34.0, 31.0, 37.0, 37.0, 33.0, 32.0, 26.0, 26.0, 29.0, 23.0, 13.0, 9.0, 15.0, 12.0, 11.0, 10.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.2488226890563965, -7.030524730682373, -6.812226295471191, -6.593928337097168, -6.375629901885986, -6.157331943511963, -5.939033508300781, -5.720735549926758, -5.502437591552734, -5.284139633178711, -5.065841197967529, -4.847543239593506, -4.629244804382324, -4.410946846008301, -4.192648887634277, -3.9743504524230957, -3.756052017211914, -3.5377538204193115, -3.319455623626709, -3.1011576652526855, -2.882859230041504, -2.6645612716674805, -2.446263074874878, -2.2279648780822754, -2.009666681289673, -1.7913684844970703, -1.5730702877044678, -1.3547722101211548, -1.1364740133285522, -0.9181758165359497, -0.6998777389526367, -0.4815795421600342, -0.26328182220458984, -0.04498365521430969, 0.17331451177597046, 0.3916126489639282, 0.6099108457565308, 0.8282090425491333, 1.0465071201324463, 1.2648053169250488, 1.4831035137176514, 1.701401710510254, 1.9196999073028564, 2.137998104095459, 2.3562960624694824, 2.574594497680664, 2.7928924560546875, 3.01119065284729, 3.2294888496398926, 3.447787046432495, 3.6660852432250977, 3.884383201599121, 4.102681636810303, 4.320979595184326, 4.539278030395508, 4.757575988769531, 4.975873947143555, 5.194171905517578, 5.41247034072876, 5.630768299102783, 5.849066734313965, 6.067364692687988, 6.285662651062012, 6.503961086273193, 6.722259521484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 7.0, 11.0, 20.0, 22.0, 35.0, 62.0, 87.0, 141.0, 223.0, 322.0, 563.0, 964.0, 1482.0, 2529.0, 4242.0, 7246.0, 12255.0, 21100.0, 36597.0, 61748.0, 99979.0, 144932.0, 174543.0, 163429.0, 121806.0, 79133.0, 47760.0, 28074.0, 16029.0, 9462.0, 5453.0, 3194.0, 1983.0, 1204.0, 731.0, 422.0, 275.0, 155.0, 117.0, 68.0, 48.0, 38.0, 21.0, 8.0, 12.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 4.0], "bins": [-5.87890625, -5.709716796875, -5.54052734375, -5.371337890625, -5.2021484375, -5.032958984375, -4.86376953125, -4.694580078125, -4.525390625, -4.356201171875, -4.18701171875, -4.017822265625, -3.8486328125, -3.679443359375, -3.51025390625, -3.341064453125, -3.171875, -3.002685546875, -2.83349609375, -2.664306640625, -2.4951171875, -2.325927734375, -2.15673828125, -1.987548828125, -1.818359375, -1.649169921875, -1.47998046875, -1.310791015625, -1.1416015625, -0.972412109375, -0.80322265625, -0.634033203125, -0.46484375, -0.295654296875, -0.12646484375, 0.042724609375, 0.2119140625, 0.381103515625, 0.55029296875, 0.719482421875, 0.888671875, 1.057861328125, 1.22705078125, 1.396240234375, 1.5654296875, 1.734619140625, 1.90380859375, 2.072998046875, 2.2421875, 2.411376953125, 2.58056640625, 2.749755859375, 2.9189453125, 3.088134765625, 3.25732421875, 3.426513671875, 3.595703125, 3.764892578125, 3.93408203125, 4.103271484375, 4.2724609375, 4.441650390625, 4.61083984375, 4.780029296875, 4.94921875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 8.0, 13.0, 8.0, 12.0, 10.0, 10.0, 16.0, 10.0, 30.0, 21.0, 19.0, 24.0, 36.0, 40.0, 34.0, 42.0, 28.0, 43.0, 50.0, 32.0, 39.0, 44.0, 47.0, 42.0, 41.0, 41.0, 37.0, 27.0, 25.0, 22.0, 20.0, 25.0, 20.0, 13.0, 12.0, 15.0, 7.0, 11.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.968994140625, -6.73486328125, -6.500732421875, -6.2666015625, -6.032470703125, -5.79833984375, -5.564208984375, -5.330078125, -5.095947265625, -4.86181640625, -4.627685546875, -4.3935546875, -4.159423828125, -3.92529296875, -3.691162109375, -3.45703125, -3.222900390625, -2.98876953125, -2.754638671875, -2.5205078125, -2.286376953125, -2.05224609375, -1.818115234375, -1.583984375, -1.349853515625, -1.11572265625, -0.881591796875, -0.6474609375, -0.413330078125, -0.17919921875, 0.054931640625, 0.2890625, 0.523193359375, 0.75732421875, 0.991455078125, 1.2255859375, 1.459716796875, 1.69384765625, 1.927978515625, 2.162109375, 2.396240234375, 2.63037109375, 2.864501953125, 3.0986328125, 3.332763671875, 3.56689453125, 3.801025390625, 4.03515625, 4.269287109375, 4.50341796875, 4.737548828125, 4.9716796875, 5.205810546875, 5.43994140625, 5.674072265625, 5.908203125, 6.142333984375, 6.37646484375, 6.610595703125, 6.8447265625, 7.078857421875, 7.31298828125, 7.547119140625, 7.78125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 7.0, 13.0, 17.0, 32.0, 45.0, 73.0, 111.0, 224.0, 421.0, 702.0, 1312.0, 2610.0, 5559.0, 13335.0, 33418.0, 90433.0, 234836.0, 354039.0, 192960.0, 71501.0, 26534.0, 10798.0, 4718.0, 2245.0, 1112.0, 610.0, 341.0, 219.0, 123.0, 74.0, 45.0, 22.0, 17.0, 15.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.7884521484375, -11.412841796875, -11.0372314453125, -10.66162109375, -10.2860107421875, -9.910400390625, -9.5347900390625, -9.1591796875, -8.7835693359375, -8.407958984375, -8.0323486328125, -7.65673828125, -7.2811279296875, -6.905517578125, -6.5299072265625, -6.154296875, -5.7786865234375, -5.403076171875, -5.0274658203125, -4.65185546875, -4.2762451171875, -3.900634765625, -3.5250244140625, -3.1494140625, -2.7738037109375, -2.398193359375, -2.0225830078125, -1.64697265625, -1.2713623046875, -0.895751953125, -0.5201416015625, -0.14453125, 0.2310791015625, 0.606689453125, 0.9822998046875, 1.35791015625, 1.7335205078125, 2.109130859375, 2.4847412109375, 2.8603515625, 3.2359619140625, 3.611572265625, 3.9871826171875, 4.36279296875, 4.7384033203125, 5.114013671875, 5.4896240234375, 5.865234375, 6.2408447265625, 6.616455078125, 6.9920654296875, 7.36767578125, 7.7432861328125, 8.118896484375, 8.4945068359375, 8.8701171875, 9.2457275390625, 9.621337890625, 9.9969482421875, 10.37255859375, 10.7481689453125, 11.123779296875, 11.4993896484375, 11.875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 12.0, 5.0, 16.0, 20.0, 18.0, 20.0, 24.0, 27.0, 30.0, 29.0, 34.0, 40.0, 35.0, 49.0, 41.0, 34.0, 38.0, 42.0, 57.0, 48.0, 47.0, 38.0, 25.0, 39.0, 38.0, 19.0, 28.0, 18.0, 22.0, 14.0, 19.0, 10.0, 6.0, 8.0, 17.0, 11.0, 4.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.3017578125, -4.154296875, -4.0068359375, -3.859375, -3.7119140625, -3.564453125, -3.4169921875, -3.26953125, -3.1220703125, -2.974609375, -2.8271484375, -2.6796875, -2.5322265625, -2.384765625, -2.2373046875, -2.08984375, -1.9423828125, -1.794921875, -1.6474609375, -1.5, -1.3525390625, -1.205078125, -1.0576171875, -0.91015625, -0.7626953125, -0.615234375, -0.4677734375, -0.3203125, -0.1728515625, -0.025390625, 0.1220703125, 0.26953125, 0.4169921875, 0.564453125, 0.7119140625, 0.859375, 1.0068359375, 1.154296875, 1.3017578125, 1.44921875, 1.5966796875, 1.744140625, 1.8916015625, 2.0390625, 2.1865234375, 2.333984375, 2.4814453125, 2.62890625, 2.7763671875, 2.923828125, 3.0712890625, 3.21875, 3.3662109375, 3.513671875, 3.6611328125, 3.80859375, 3.9560546875, 4.103515625, 4.2509765625, 4.3984375, 4.5458984375, 4.693359375, 4.8408203125, 4.98828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 2.0, 8.0, 11.0, 16.0, 37.0, 43.0, 45.0, 88.0, 137.0, 197.0, 258.0, 432.0, 649.0, 1049.0, 1509.0, 2620.0, 4333.0, 7538.0, 13213.0, 24600.0, 47617.0, 93880.0, 178856.0, 261632.0, 193948.0, 102004.0, 52155.0, 27041.0, 14465.0, 7872.0, 4742.0, 2763.0, 1700.0, 1057.0, 713.0, 423.0, 288.0, 195.0, 131.0, 102.0, 41.0, 36.0, 36.0, 18.0, 14.0, 18.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.5390625, -4.38555908203125, -4.2320556640625, -4.07855224609375, -3.925048828125, -3.77154541015625, -3.6180419921875, -3.46453857421875, -3.31103515625, -3.15753173828125, -3.0040283203125, -2.85052490234375, -2.697021484375, -2.54351806640625, -2.3900146484375, -2.23651123046875, -2.0830078125, -1.92950439453125, -1.7760009765625, -1.62249755859375, -1.468994140625, -1.31549072265625, -1.1619873046875, -1.00848388671875, -0.85498046875, -0.70147705078125, -0.5479736328125, -0.39447021484375, -0.240966796875, -0.08746337890625, 0.0660400390625, 0.21954345703125, 0.373046875, 0.52655029296875, 0.6800537109375, 0.83355712890625, 0.987060546875, 1.14056396484375, 1.2940673828125, 1.44757080078125, 1.60107421875, 1.75457763671875, 1.9080810546875, 2.06158447265625, 2.215087890625, 2.36859130859375, 2.5220947265625, 2.67559814453125, 2.8291015625, 2.98260498046875, 3.1361083984375, 3.28961181640625, 3.443115234375, 3.59661865234375, 3.7501220703125, 3.90362548828125, 4.05712890625, 4.21063232421875, 4.3641357421875, 4.51763916015625, 4.671142578125, 4.82464599609375, 4.9781494140625, 5.13165283203125, 5.28515625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 12.0, 10.0, 21.0, 24.0, 23.0, 32.0, 40.0, 68.0, 47.0, 56.0, 56.0, 84.0, 61.0, 66.0, 49.0, 55.0, 49.0, 45.0, 34.0, 29.0, 32.0, 18.0, 20.0, 10.0, 10.0, 3.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00023734569549560547, -0.000229736790060997, -0.00022212788462638855, -0.0002145189791917801, -0.00020691007375717163, -0.00019930116832256317, -0.0001916922628879547, -0.00018408335745334625, -0.0001764744520187378, -0.00016886554658412933, -0.00016125664114952087, -0.00015364773571491241, -0.00014603883028030396, -0.0001384299248456955, -0.00013082101941108704, -0.00012321211397647858, -0.00011560320854187012, -0.00010799430310726166, -0.0001003853976726532, -9.277649223804474e-05, -8.516758680343628e-05, -7.755868136882782e-05, -6.994977593421936e-05, -6.23408704996109e-05, -5.473196506500244e-05, -4.712305963039398e-05, -3.951415419578552e-05, -3.190524876117706e-05, -2.4296343326568604e-05, -1.6687437891960144e-05, -9.078532457351685e-06, -1.469627022743225e-06, 6.139278411865234e-06, 1.3748183846473694e-05, 2.1357089281082153e-05, 2.8965994715690613e-05, 3.657490015029907e-05, 4.418380558490753e-05, 5.179271101951599e-05, 5.940161645412445e-05, 6.701052188873291e-05, 7.461942732334137e-05, 8.222833275794983e-05, 8.983723819255829e-05, 9.744614362716675e-05, 0.00010505504906177521, 0.00011266395449638367, 0.00012027285993099213, 0.00012788176536560059, 0.00013549067080020905, 0.0001430995762348175, 0.00015070848166942596, 0.00015831738710403442, 0.00016592629253864288, 0.00017353519797325134, 0.0001811441034078598, 0.00018875300884246826, 0.00019636191427707672, 0.00020397081971168518, 0.00021157972514629364, 0.0002191886305809021, 0.00022679753601551056, 0.00023440644145011902, 0.00024201534688472748, 0.00024962425231933594]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 7.0, 11.0, 16.0, 18.0, 26.0, 26.0, 47.0, 65.0, 87.0, 148.0, 182.0, 293.0, 484.0, 773.0, 1259.0, 2098.0, 3562.0, 5931.0, 10574.0, 19179.0, 34697.0, 62326.0, 107824.0, 168342.0, 204030.0, 171236.0, 110049.0, 64093.0, 35204.0, 19673.0, 10925.0, 6121.0, 3654.0, 2074.0, 1264.0, 793.0, 510.0, 326.0, 215.0, 120.0, 96.0, 61.0, 45.0, 22.0, 18.0, 18.0, 14.0, 9.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.4921875, -4.34967041015625, -4.2071533203125, -4.06463623046875, -3.922119140625, -3.77960205078125, -3.6370849609375, -3.49456787109375, -3.35205078125, -3.20953369140625, -3.0670166015625, -2.92449951171875, -2.781982421875, -2.63946533203125, -2.4969482421875, -2.35443115234375, -2.2119140625, -2.06939697265625, -1.9268798828125, -1.78436279296875, -1.641845703125, -1.49932861328125, -1.3568115234375, -1.21429443359375, -1.07177734375, -0.92926025390625, -0.7867431640625, -0.64422607421875, -0.501708984375, -0.35919189453125, -0.2166748046875, -0.07415771484375, 0.068359375, 0.21087646484375, 0.3533935546875, 0.49591064453125, 0.638427734375, 0.78094482421875, 0.9234619140625, 1.06597900390625, 1.20849609375, 1.35101318359375, 1.4935302734375, 1.63604736328125, 1.778564453125, 1.92108154296875, 2.0635986328125, 2.20611572265625, 2.3486328125, 2.49114990234375, 2.6336669921875, 2.77618408203125, 2.918701171875, 3.06121826171875, 3.2037353515625, 3.34625244140625, 3.48876953125, 3.63128662109375, 3.7738037109375, 3.91632080078125, 4.058837890625, 4.20135498046875, 4.3438720703125, 4.48638916015625, 4.62890625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 11.0, 12.0, 19.0, 19.0, 27.0, 29.0, 48.0, 58.0, 86.0, 76.0, 93.0, 83.0, 76.0, 82.0, 72.0, 64.0, 40.0, 36.0, 32.0, 14.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.130859375, -2.065185546875, -1.99951171875, -1.933837890625, -1.8681640625, -1.802490234375, -1.73681640625, -1.671142578125, -1.60546875, -1.539794921875, -1.47412109375, -1.408447265625, -1.3427734375, -1.277099609375, -1.21142578125, -1.145751953125, -1.080078125, -1.014404296875, -0.94873046875, -0.883056640625, -0.8173828125, -0.751708984375, -0.68603515625, -0.620361328125, -0.5546875, -0.489013671875, -0.42333984375, -0.357666015625, -0.2919921875, -0.226318359375, -0.16064453125, -0.094970703125, -0.029296875, 0.036376953125, 0.10205078125, 0.167724609375, 0.2333984375, 0.299072265625, 0.36474609375, 0.430419921875, 0.49609375, 0.561767578125, 0.62744140625, 0.693115234375, 0.7587890625, 0.824462890625, 0.89013671875, 0.955810546875, 1.021484375, 1.087158203125, 1.15283203125, 1.218505859375, 1.2841796875, 1.349853515625, 1.41552734375, 1.481201171875, 1.546875, 1.612548828125, 1.67822265625, 1.743896484375, 1.8095703125, 1.875244140625, 1.94091796875, 2.006591796875, 2.072265625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 4.0, 7.0, 18.0, 11.0, 23.0, 25.0, 30.0, 39.0, 42.0, 53.0, 61.0, 71.0, 65.0, 96.0, 85.0, 87.0, 62.0, 36.0, 47.0, 37.0, 23.0, 14.0, 9.0, 13.0, 11.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.542037010192871, -11.099223136901855, -10.656408309936523, -10.213594436645508, -9.770779609680176, -9.32796573638916, -8.885150909423828, -8.442337036132812, -7.999522686004639, -7.556708335876465, -7.113893985748291, -6.671079635620117, -6.228265762329102, -5.7854509353637695, -5.342637062072754, -4.89982271194458, -4.457008361816406, -4.014194011688232, -3.5713796615600586, -3.128565549850464, -2.68575119972229, -2.242936849594116, -1.8001227378845215, -1.3573083877563477, -0.9144940376281738, -0.4716797471046448, -0.028865456581115723, 0.41394877433776855, 0.8567631244659424, 1.2995774745941162, 1.742391586303711, 2.1852059364318848, 2.628021240234375, 3.070835590362549, 3.5136499404907227, 3.9564640522003174, 4.39927864074707, 4.842092514038086, 5.28490686416626, 5.727721214294434, 6.170535564422607, 6.613349914550781, 7.056164264678955, 7.498978614807129, 7.9417924880981445, 8.384607315063477, 8.827421188354492, 9.270235061645508, 9.71304988861084, 10.155863761901855, 10.598678588867188, 11.041492462158203, 11.484307289123535, 11.92712116241455, 12.369935989379883, 12.812749862670898, 13.255563735961914, 13.69837760925293, 14.141192436218262, 14.584006309509277, 15.02682113647461, 15.469635009765625, 15.91244888305664, 16.355262756347656, 16.798078536987305]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 4.0, 13.0, 18.0, 10.0, 21.0, 14.0, 23.0, 17.0, 19.0, 27.0, 22.0, 32.0, 36.0, 44.0, 35.0, 44.0, 41.0, 42.0, 29.0, 45.0, 38.0, 47.0, 33.0, 39.0, 29.0, 27.0, 38.0, 29.0, 26.0, 29.0, 25.0, 17.0, 9.0, 19.0, 12.0, 16.0, 5.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.177400588989258, -6.958394527435303, -6.739388942718506, -6.520382881164551, -6.301377296447754, -6.082371234893799, -5.863365650177002, -5.644359588623047, -5.42535400390625, -5.206347942352295, -4.987342357635498, -4.768336296081543, -4.549330711364746, -4.330324649810791, -4.111319065093994, -3.892313003540039, -3.673307180404663, -3.454301357269287, -3.235295534133911, -3.016289710998535, -2.797283887863159, -2.578278064727783, -2.359272003173828, -2.1402664184570312, -1.9212604761123657, -1.7022546529769897, -1.4832488298416138, -1.2642428874969482, -1.0452370643615723, -0.8262312412261963, -0.6072254180908203, -0.38821959495544434, -0.16921377182006836, 0.04979206621646881, 0.268797904253006, 0.48780375719070435, 0.7068095803260803, 0.9258154630661011, 1.144821286201477, 1.363827109336853, 1.582832932472229, 1.801838755607605, 2.0208446979522705, 2.2398505210876465, 2.4588563442230225, 2.6778621673583984, 2.8968679904937744, 3.1158738136291504, 3.3348796367645264, 3.5538854598999023, 3.7728912830352783, 3.9918971061706543, 4.210903167724609, 4.429908752441406, 4.648914813995361, 4.867920398712158, 5.086926460266113, 5.305932521820068, 5.524938106536865, 5.74394416809082, 5.962949752807617, 6.181955814361572, 6.400961399078369, 6.619967460632324, 6.838973045349121]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 19.0, 28.0, 43.0, 66.0, 86.0, 162.0, 231.0, 398.0, 596.0, 1096.0, 1836.0, 3340.0, 5801.0, 10948.0, 20256.0, 37763.0, 69428.0, 117214.0, 170115.0, 193186.0, 164650.0, 110617.0, 64139.0, 34958.0, 18660.0, 10064.0, 5533.0, 2991.0, 1751.0, 1006.0, 601.0, 326.0, 223.0, 144.0, 82.0, 61.0, 37.0, 26.0, 20.0, 9.0, 13.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3671875, -8.116943359375, -7.86669921875, -7.616455078125, -7.3662109375, -7.115966796875, -6.86572265625, -6.615478515625, -6.365234375, -6.114990234375, -5.86474609375, -5.614501953125, -5.3642578125, -5.114013671875, -4.86376953125, -4.613525390625, -4.36328125, -4.113037109375, -3.86279296875, -3.612548828125, -3.3623046875, -3.112060546875, -2.86181640625, -2.611572265625, -2.361328125, -2.111083984375, -1.86083984375, -1.610595703125, -1.3603515625, -1.110107421875, -0.85986328125, -0.609619140625, -0.359375, -0.109130859375, 0.14111328125, 0.391357421875, 0.6416015625, 0.891845703125, 1.14208984375, 1.392333984375, 1.642578125, 1.892822265625, 2.14306640625, 2.393310546875, 2.6435546875, 2.893798828125, 3.14404296875, 3.394287109375, 3.64453125, 3.894775390625, 4.14501953125, 4.395263671875, 4.6455078125, 4.895751953125, 5.14599609375, 5.396240234375, 5.646484375, 5.896728515625, 6.14697265625, 6.397216796875, 6.6474609375, 6.897705078125, 7.14794921875, 7.398193359375, 7.6484375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 9.0, 18.0, 16.0, 13.0, 23.0, 21.0, 26.0, 27.0, 27.0, 36.0, 43.0, 26.0, 27.0, 40.0, 33.0, 57.0, 54.0, 59.0, 38.0, 35.0, 43.0, 39.0, 29.0, 24.0, 26.0, 19.0, 29.0, 16.0, 16.0, 27.0, 16.0, 12.0, 8.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0545654296875, -6.820068359375, -6.5855712890625, -6.35107421875, -6.1165771484375, -5.882080078125, -5.6475830078125, -5.4130859375, -5.1785888671875, -4.944091796875, -4.7095947265625, -4.47509765625, -4.2406005859375, -4.006103515625, -3.7716064453125, -3.537109375, -3.3026123046875, -3.068115234375, -2.8336181640625, -2.59912109375, -2.3646240234375, -2.130126953125, -1.8956298828125, -1.6611328125, -1.4266357421875, -1.192138671875, -0.9576416015625, -0.72314453125, -0.4886474609375, -0.254150390625, -0.0196533203125, 0.21484375, 0.4493408203125, 0.683837890625, 0.9183349609375, 1.15283203125, 1.3873291015625, 1.621826171875, 1.8563232421875, 2.0908203125, 2.3253173828125, 2.559814453125, 2.7943115234375, 3.02880859375, 3.2633056640625, 3.497802734375, 3.7322998046875, 3.966796875, 4.2012939453125, 4.435791015625, 4.6702880859375, 4.90478515625, 5.1392822265625, 5.373779296875, 5.6082763671875, 5.8427734375, 6.0772705078125, 6.311767578125, 6.5462646484375, 6.78076171875, 7.0152587890625, 7.249755859375, 7.4842529296875, 7.71875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 6.0, 8.0, 12.0, 16.0, 27.0, 27.0, 62.0, 70.0, 116.0, 173.0, 266.0, 362.0, 576.0, 824.0, 1247.0, 1896.0, 3022.0, 4640.0, 7211.0, 11128.0, 17493.0, 26946.0, 40706.0, 59588.0, 83335.0, 109600.0, 128889.0, 132564.0, 118090.0, 94292.0, 68292.0, 47107.0, 31419.0, 20851.0, 13329.0, 8509.0, 5473.0, 3559.0, 2334.0, 1511.0, 986.0, 650.0, 410.0, 306.0, 213.0, 131.0, 90.0, 66.0, 51.0, 35.0, 22.0, 15.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.33673095703125, -5.1539306640625, -4.97113037109375, -4.788330078125, -4.60552978515625, -4.4227294921875, -4.23992919921875, -4.05712890625, -3.87432861328125, -3.6915283203125, -3.50872802734375, -3.325927734375, -3.14312744140625, -2.9603271484375, -2.77752685546875, -2.5947265625, -2.41192626953125, -2.2291259765625, -2.04632568359375, -1.863525390625, -1.68072509765625, -1.4979248046875, -1.31512451171875, -1.13232421875, -0.94952392578125, -0.7667236328125, -0.58392333984375, -0.401123046875, -0.21832275390625, -0.0355224609375, 0.14727783203125, 0.330078125, 0.51287841796875, 0.6956787109375, 0.87847900390625, 1.061279296875, 1.24407958984375, 1.4268798828125, 1.60968017578125, 1.79248046875, 1.97528076171875, 2.1580810546875, 2.34088134765625, 2.523681640625, 2.70648193359375, 2.8892822265625, 3.07208251953125, 3.2548828125, 3.43768310546875, 3.6204833984375, 3.80328369140625, 3.986083984375, 4.16888427734375, 4.3516845703125, 4.53448486328125, 4.71728515625, 4.90008544921875, 5.0828857421875, 5.26568603515625, 5.448486328125, 5.63128662109375, 5.8140869140625, 5.99688720703125, 6.1796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 4.0, 9.0, 8.0, 14.0, 24.0, 12.0, 27.0, 22.0, 24.0, 27.0, 25.0, 28.0, 31.0, 37.0, 50.0, 37.0, 40.0, 35.0, 44.0, 52.0, 33.0, 41.0, 50.0, 43.0, 37.0, 28.0, 24.0, 33.0, 19.0, 26.0, 23.0, 18.0, 19.0, 11.0, 7.0, 14.0, 5.0, 1.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.34765625, -5.19378662109375, -5.0399169921875, -4.88604736328125, -4.732177734375, -4.57830810546875, -4.4244384765625, -4.27056884765625, -4.11669921875, -3.96282958984375, -3.8089599609375, -3.65509033203125, -3.501220703125, -3.34735107421875, -3.1934814453125, -3.03961181640625, -2.8857421875, -2.73187255859375, -2.5780029296875, -2.42413330078125, -2.270263671875, -2.11639404296875, -1.9625244140625, -1.80865478515625, -1.65478515625, -1.50091552734375, -1.3470458984375, -1.19317626953125, -1.039306640625, -0.88543701171875, -0.7315673828125, -0.57769775390625, -0.423828125, -0.26995849609375, -0.1160888671875, 0.03778076171875, 0.191650390625, 0.34552001953125, 0.4993896484375, 0.65325927734375, 0.80712890625, 0.96099853515625, 1.1148681640625, 1.26873779296875, 1.422607421875, 1.57647705078125, 1.7303466796875, 1.88421630859375, 2.0380859375, 2.19195556640625, 2.3458251953125, 2.49969482421875, 2.653564453125, 2.80743408203125, 2.9613037109375, 3.11517333984375, 3.26904296875, 3.42291259765625, 3.5767822265625, 3.73065185546875, 3.884521484375, 4.03839111328125, 4.1922607421875, 4.34613037109375, 4.5]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 7.0, 6.0, 8.0, 19.0, 22.0, 21.0, 35.0, 59.0, 86.0, 125.0, 175.0, 264.0, 438.0, 584.0, 970.0, 1532.0, 2652.0, 4272.0, 7632.0, 13321.0, 23713.0, 42913.0, 76230.0, 129399.0, 183105.0, 195849.0, 150093.0, 93301.0, 53373.0, 29082.0, 16446.0, 9183.0, 5382.0, 3203.0, 1935.0, 1106.0, 702.0, 437.0, 264.0, 195.0, 121.0, 100.0, 58.0, 34.0, 34.0, 20.0, 14.0, 14.0, 8.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.23046875, -4.10296630859375, -3.9754638671875, -3.84796142578125, -3.720458984375, -3.59295654296875, -3.4654541015625, -3.33795166015625, -3.21044921875, -3.08294677734375, -2.9554443359375, -2.82794189453125, -2.700439453125, -2.57293701171875, -2.4454345703125, -2.31793212890625, -2.1904296875, -2.06292724609375, -1.9354248046875, -1.80792236328125, -1.680419921875, -1.55291748046875, -1.4254150390625, -1.29791259765625, -1.17041015625, -1.04290771484375, -0.9154052734375, -0.78790283203125, -0.660400390625, -0.53289794921875, -0.4053955078125, -0.27789306640625, -0.150390625, -0.02288818359375, 0.1046142578125, 0.23211669921875, 0.359619140625, 0.48712158203125, 0.6146240234375, 0.74212646484375, 0.86962890625, 0.99713134765625, 1.1246337890625, 1.25213623046875, 1.379638671875, 1.50714111328125, 1.6346435546875, 1.76214599609375, 1.8896484375, 2.01715087890625, 2.1446533203125, 2.27215576171875, 2.399658203125, 2.52716064453125, 2.6546630859375, 2.78216552734375, 2.90966796875, 3.03717041015625, 3.1646728515625, 3.29217529296875, 3.419677734375, 3.54718017578125, 3.6746826171875, 3.80218505859375, 3.9296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 8.0, 11.0, 17.0, 15.0, 17.0, 19.0, 34.0, 30.0, 33.0, 54.0, 53.0, 67.0, 59.0, 56.0, 71.0, 76.0, 61.0, 50.0, 46.0, 46.0, 31.0, 28.0, 27.0, 20.0, 11.0, 10.0, 8.0, 7.0, 4.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0004611015319824219, -0.0004482269287109375, -0.0004353523254394531, -0.00042247772216796875, -0.0004096031188964844, -0.000396728515625, -0.0003838539123535156, -0.00037097930908203125, -0.0003581047058105469, -0.0003452301025390625, -0.0003323554992675781, -0.00031948089599609375, -0.0003066062927246094, -0.000293731689453125, -0.0002808570861816406, -0.00026798248291015625, -0.0002551078796386719, -0.0002422332763671875, -0.00022935867309570312, -0.00021648406982421875, -0.00020360946655273438, -0.00019073486328125, -0.00017786026000976562, -0.00016498565673828125, -0.00015211105346679688, -0.0001392364501953125, -0.00012636184692382812, -0.00011348724365234375, -0.00010061264038085938, -8.7738037109375e-05, -7.486343383789062e-05, -6.198883056640625e-05, -4.9114227294921875e-05, -3.62396240234375e-05, -2.3365020751953125e-05, -1.049041748046875e-05, 2.384185791015625e-06, 1.52587890625e-05, 2.8133392333984375e-05, 4.100799560546875e-05, 5.3882598876953125e-05, 6.67572021484375e-05, 7.963180541992188e-05, 9.250640869140625e-05, 0.00010538101196289062, 0.000118255615234375, 0.00013113021850585938, 0.00014400482177734375, 0.00015687942504882812, 0.0001697540283203125, 0.00018262863159179688, 0.00019550323486328125, 0.00020837783813476562, 0.00022125244140625, 0.00023412704467773438, 0.00024700164794921875, 0.0002598762512207031, 0.0002727508544921875, 0.0002856254577636719, 0.00029850006103515625, 0.0003113746643066406, 0.000324249267578125, 0.0003371238708496094, 0.00034999847412109375, 0.0003628730773925781]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 7.0, 17.0, 29.0, 38.0, 56.0, 81.0, 164.0, 239.0, 354.0, 574.0, 1017.0, 1624.0, 2774.0, 4682.0, 7992.0, 14269.0, 25248.0, 44975.0, 77732.0, 126985.0, 177567.0, 189559.0, 147692.0, 95119.0, 55922.0, 31587.0, 17922.0, 10088.0, 5691.0, 3307.0, 2011.0, 1234.0, 765.0, 461.0, 275.0, 172.0, 118.0, 78.0, 41.0, 26.0, 9.0, 17.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-4.45703125, -4.326690673828125, -4.19635009765625, -4.066009521484375, -3.9356689453125, -3.805328369140625, -3.67498779296875, -3.544647216796875, -3.414306640625, -3.283966064453125, -3.15362548828125, -3.023284912109375, -2.8929443359375, -2.762603759765625, -2.63226318359375, -2.501922607421875, -2.37158203125, -2.241241455078125, -2.11090087890625, -1.980560302734375, -1.8502197265625, -1.719879150390625, -1.58953857421875, -1.459197998046875, -1.328857421875, -1.198516845703125, -1.06817626953125, -0.937835693359375, -0.8074951171875, -0.677154541015625, -0.54681396484375, -0.416473388671875, -0.2861328125, -0.155792236328125, -0.02545166015625, 0.104888916015625, 0.2352294921875, 0.365570068359375, 0.49591064453125, 0.626251220703125, 0.756591796875, 0.886932373046875, 1.01727294921875, 1.147613525390625, 1.2779541015625, 1.408294677734375, 1.53863525390625, 1.668975830078125, 1.79931640625, 1.929656982421875, 2.05999755859375, 2.190338134765625, 2.3206787109375, 2.451019287109375, 2.58135986328125, 2.711700439453125, 2.842041015625, 2.972381591796875, 3.10272216796875, 3.233062744140625, 3.3634033203125, 3.493743896484375, 3.62408447265625, 3.754425048828125, 3.884765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 28.0, 26.0, 24.0, 23.0, 28.0, 41.0, 44.0, 47.0, 42.0, 51.0, 64.0, 52.0, 52.0, 49.0, 56.0, 43.0, 47.0, 32.0, 23.0, 31.0, 25.0, 17.0, 26.0, 12.0, 19.0, 7.0, 10.0, 9.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.341796875, -1.3036651611328125, -1.265533447265625, -1.2274017333984375, -1.18927001953125, -1.1511383056640625, -1.113006591796875, -1.0748748779296875, -1.0367431640625, -0.9986114501953125, -0.960479736328125, -0.9223480224609375, -0.88421630859375, -0.8460845947265625, -0.807952880859375, -0.7698211669921875, -0.731689453125, -0.6935577392578125, -0.655426025390625, -0.6172943115234375, -0.57916259765625, -0.5410308837890625, -0.502899169921875, -0.4647674560546875, -0.4266357421875, -0.3885040283203125, -0.350372314453125, -0.3122406005859375, -0.27410888671875, -0.2359771728515625, -0.197845458984375, -0.1597137451171875, -0.12158203125, -0.0834503173828125, -0.045318603515625, -0.0071868896484375, 0.03094482421875, 0.0690765380859375, 0.107208251953125, 0.1453399658203125, 0.1834716796875, 0.2216033935546875, 0.259735107421875, 0.2978668212890625, 0.33599853515625, 0.3741302490234375, 0.412261962890625, 0.4503936767578125, 0.488525390625, 0.5266571044921875, 0.564788818359375, 0.6029205322265625, 0.64105224609375, 0.6791839599609375, 0.717315673828125, 0.7554473876953125, 0.7935791015625, 0.8317108154296875, 0.869842529296875, 0.9079742431640625, 0.94610595703125, 0.9842376708984375, 1.022369384765625, 1.0605010986328125, 1.0986328125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 6.0, 8.0, 12.0, 16.0, 12.0, 20.0, 38.0, 35.0, 47.0, 53.0, 61.0, 73.0, 76.0, 84.0, 91.0, 76.0, 49.0, 59.0, 36.0, 38.0, 29.0, 18.0, 16.0, 14.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.42067813873291, -11.963934898376465, -11.507190704345703, -11.050447463989258, -10.593703269958496, -10.13696002960205, -9.680215835571289, -9.223472595214844, -8.766729354858398, -8.309986114501953, -7.853241920471191, -7.396498680114746, -6.939754486083984, -6.483011245727539, -6.0262675285339355, -5.569523811340332, -5.11277961730957, -4.656035900115967, -4.199292182922363, -3.742548704147339, -3.2858049869537354, -2.829061269760132, -2.3723177909851074, -1.915574073791504, -1.4588303565979004, -1.0020866394042969, -0.5453430414199829, -0.08859944343566895, 0.36814427375793457, 0.8248879909515381, 1.2816314697265625, 1.738375186920166, 2.195117950439453, 2.6518616676330566, 3.10860538482666, 3.5653488636016846, 4.022092819213867, 4.4788360595703125, 4.935579776763916, 5.3923234939575195, 5.849067211151123, 6.305810928344727, 6.76255464553833, 7.219298362731934, 7.676041603088379, 8.13278579711914, 8.589529037475586, 9.046272277832031, 9.503016471862793, 9.959759712219238, 10.41650390625, 10.873247146606445, 11.329991340637207, 11.786734580993652, 12.243478775024414, 12.70022201538086, 13.156965255737305, 13.61370849609375, 14.070452690124512, 14.527195930480957, 14.983940124511719, 15.440683364868164, 15.89742660522461, 16.354171752929688, 16.810914993286133]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 5.0, 12.0, 7.0, 5.0, 12.0, 16.0, 18.0, 19.0, 17.0, 18.0, 28.0, 28.0, 30.0, 34.0, 35.0, 34.0, 40.0, 39.0, 39.0, 46.0, 41.0, 28.0, 37.0, 43.0, 36.0, 36.0, 32.0, 33.0, 29.0, 18.0, 15.0, 19.0, 17.0, 24.0, 13.0, 10.0, 12.0, 11.0, 12.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.598753452301025, -6.39119291305542, -6.1836323738098145, -5.976071834564209, -5.7685112953186035, -5.560950756072998, -5.353390216827393, -5.145829677581787, -4.938269138336182, -4.730708599090576, -4.523148059844971, -4.315587520599365, -4.10802698135376, -3.9004664421081543, -3.692905902862549, -3.4853453636169434, -3.277784824371338, -3.0702242851257324, -2.862663745880127, -2.6551032066345215, -2.447542667388916, -2.2399821281433105, -2.032421588897705, -1.8248610496520996, -1.6173005104064941, -1.4097399711608887, -1.2021794319152832, -0.9946188926696777, -0.7870583534240723, -0.5794978141784668, -0.37193727493286133, -0.16437673568725586, 0.04318428039550781, 0.2507448196411133, 0.45830535888671875, 0.6658658981323242, 0.8734264373779297, 1.0809869766235352, 1.2885475158691406, 1.496108055114746, 1.7036685943603516, 1.911229133605957, 2.1187896728515625, 2.326350212097168, 2.5339107513427734, 2.741471290588379, 2.9490318298339844, 3.15659236907959, 3.3641529083251953, 3.571713447570801, 3.7792739868164062, 3.9868345260620117, 4.194395065307617, 4.401955604553223, 4.609516143798828, 4.817076683044434, 5.024637222290039, 5.2321977615356445, 5.43975830078125, 5.6473188400268555, 5.854879379272461, 6.062439918518066, 6.270000457763672, 6.477560997009277, 6.685121536254883]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 11.0, 11.0, 9.0, 12.0, 19.0, 28.0, 64.0, 64.0, 116.0, 143.0, 219.0, 369.0, 545.0, 848.0, 1339.0, 2163.0, 3636.0, 5952.0, 10694.0, 19535.0, 37997.0, 78719.0, 176883.0, 408992.0, 856629.0, 1145658.0, 780916.0, 362146.0, 157189.0, 70476.0, 33767.0, 17291.0, 9206.0, 5105.0, 2958.0, 1658.0, 1065.0, 678.0, 406.0, 255.0, 178.0, 127.0, 74.0, 49.0, 28.0, 21.0, 9.0, 10.0, 11.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.8828125, -12.4854736328125, -12.088134765625, -11.6907958984375, -11.29345703125, -10.8961181640625, -10.498779296875, -10.1014404296875, -9.7041015625, -9.3067626953125, -8.909423828125, -8.5120849609375, -8.11474609375, -7.7174072265625, -7.320068359375, -6.9227294921875, -6.525390625, -6.1280517578125, -5.730712890625, -5.3333740234375, -4.93603515625, -4.5386962890625, -4.141357421875, -3.7440185546875, -3.3466796875, -2.9493408203125, -2.552001953125, -2.1546630859375, -1.75732421875, -1.3599853515625, -0.962646484375, -0.5653076171875, -0.16796875, 0.2293701171875, 0.626708984375, 1.0240478515625, 1.42138671875, 1.8187255859375, 2.216064453125, 2.6134033203125, 3.0107421875, 3.4080810546875, 3.805419921875, 4.2027587890625, 4.60009765625, 4.9974365234375, 5.394775390625, 5.7921142578125, 6.189453125, 6.5867919921875, 6.984130859375, 7.3814697265625, 7.77880859375, 8.1761474609375, 8.573486328125, 8.9708251953125, 9.3681640625, 9.7655029296875, 10.162841796875, 10.5601806640625, 10.95751953125, 11.3548583984375, 11.752197265625, 12.1495361328125, 12.546875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 15.0, 11.0, 9.0, 12.0, 18.0, 16.0, 15.0, 16.0, 26.0, 30.0, 27.0, 23.0, 33.0, 28.0, 46.0, 52.0, 43.0, 35.0, 35.0, 31.0, 39.0, 46.0, 39.0, 33.0, 37.0, 30.0, 19.0, 25.0, 27.0, 16.0, 21.0, 17.0, 24.0, 15.0, 17.0, 5.0, 10.0, 7.0, 8.0, 4.0, 2.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.0767822265625, -5.895751953125, -5.7147216796875, -5.53369140625, -5.3526611328125, -5.171630859375, -4.9906005859375, -4.8095703125, -4.6285400390625, -4.447509765625, -4.2664794921875, -4.08544921875, -3.9044189453125, -3.723388671875, -3.5423583984375, -3.361328125, -3.1802978515625, -2.999267578125, -2.8182373046875, -2.63720703125, -2.4561767578125, -2.275146484375, -2.0941162109375, -1.9130859375, -1.7320556640625, -1.551025390625, -1.3699951171875, -1.18896484375, -1.0079345703125, -0.826904296875, -0.6458740234375, -0.46484375, -0.2838134765625, -0.102783203125, 0.0782470703125, 0.25927734375, 0.4403076171875, 0.621337890625, 0.8023681640625, 0.9833984375, 1.1644287109375, 1.345458984375, 1.5264892578125, 1.70751953125, 1.8885498046875, 2.069580078125, 2.2506103515625, 2.431640625, 2.6126708984375, 2.793701171875, 2.9747314453125, 3.15576171875, 3.3367919921875, 3.517822265625, 3.6988525390625, 3.8798828125, 4.0609130859375, 4.241943359375, 4.4229736328125, 4.60400390625, 4.7850341796875, 4.966064453125, 5.1470947265625, 5.328125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 11.0, 16.0, 33.0, 50.0, 78.0, 90.0, 171.0, 250.0, 389.0, 610.0, 1047.0, 1547.0, 2594.0, 4318.0, 7203.0, 12934.0, 22607.0, 41164.0, 78132.0, 151681.0, 303542.0, 590991.0, 942975.0, 908417.0, 545912.0, 277196.0, 139572.0, 72206.0, 38485.0, 20711.0, 11839.0, 6935.0, 3937.0, 2503.0, 1503.0, 943.0, 589.0, 396.0, 243.0, 153.0, 118.0, 89.0, 30.0, 16.0, 19.0, 12.0, 15.0, 6.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.8828125, -13.4481201171875, -13.013427734375, -12.5787353515625, -12.14404296875, -11.7093505859375, -11.274658203125, -10.8399658203125, -10.4052734375, -9.9705810546875, -9.535888671875, -9.1011962890625, -8.66650390625, -8.2318115234375, -7.797119140625, -7.3624267578125, -6.927734375, -6.4930419921875, -6.058349609375, -5.6236572265625, -5.18896484375, -4.7542724609375, -4.319580078125, -3.8848876953125, -3.4501953125, -3.0155029296875, -2.580810546875, -2.1461181640625, -1.71142578125, -1.2767333984375, -0.842041015625, -0.4073486328125, 0.02734375, 0.4620361328125, 0.896728515625, 1.3314208984375, 1.76611328125, 2.2008056640625, 2.635498046875, 3.0701904296875, 3.5048828125, 3.9395751953125, 4.374267578125, 4.8089599609375, 5.24365234375, 5.6783447265625, 6.113037109375, 6.5477294921875, 6.982421875, 7.4171142578125, 7.851806640625, 8.2864990234375, 8.72119140625, 9.1558837890625, 9.590576171875, 10.0252685546875, 10.4599609375, 10.8946533203125, 11.329345703125, 11.7640380859375, 12.19873046875, 12.6334228515625, 13.068115234375, 13.5028076171875, 13.9375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 1.0, 3.0, 2.0, 8.0, 13.0, 11.0, 10.0, 10.0, 19.0, 30.0, 39.0, 43.0, 48.0, 66.0, 79.0, 123.0, 145.0, 167.0, 225.0, 233.0, 308.0, 263.0, 296.0, 280.0, 282.0, 264.0, 213.0, 165.0, 164.0, 120.0, 92.0, 78.0, 59.0, 49.0, 42.0, 27.0, 23.0, 16.0, 13.0, 8.0, 10.0, 9.0, 2.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.69140625, -4.55560302734375, -4.4197998046875, -4.28399658203125, -4.148193359375, -4.01239013671875, -3.8765869140625, -3.74078369140625, -3.60498046875, -3.46917724609375, -3.3333740234375, -3.19757080078125, -3.061767578125, -2.92596435546875, -2.7901611328125, -2.65435791015625, -2.5185546875, -2.38275146484375, -2.2469482421875, -2.11114501953125, -1.975341796875, -1.83953857421875, -1.7037353515625, -1.56793212890625, -1.43212890625, -1.29632568359375, -1.1605224609375, -1.02471923828125, -0.888916015625, -0.75311279296875, -0.6173095703125, -0.48150634765625, -0.345703125, -0.20989990234375, -0.0740966796875, 0.06170654296875, 0.197509765625, 0.33331298828125, 0.4691162109375, 0.60491943359375, 0.74072265625, 0.87652587890625, 1.0123291015625, 1.14813232421875, 1.283935546875, 1.41973876953125, 1.5555419921875, 1.69134521484375, 1.8271484375, 1.96295166015625, 2.0987548828125, 2.23455810546875, 2.370361328125, 2.50616455078125, 2.6419677734375, 2.77777099609375, 2.91357421875, 3.04937744140625, 3.1851806640625, 3.32098388671875, 3.456787109375, 3.59259033203125, 3.7283935546875, 3.86419677734375, 4.0]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 7.0, 12.0, 18.0, 25.0, 26.0, 17.0, 36.0, 39.0, 34.0, 45.0, 61.0, 67.0, 56.0, 65.0, 62.0, 53.0, 62.0, 54.0, 43.0, 35.0, 22.0, 32.0, 35.0, 23.0, 15.0, 10.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.131260871887207, -11.676679611206055, -11.222098350524902, -10.76751708984375, -10.312935829162598, -9.858354568481445, -9.403772354125977, -8.94919204711914, -8.494609832763672, -8.04002857208252, -7.585447311401367, -7.130866050720215, -6.6762847900390625, -6.22170352935791, -5.7671217918396, -5.312540531158447, -4.857959747314453, -4.403378486633301, -3.9487972259521484, -3.494215726852417, -3.0396344661712646, -2.5850532054901123, -2.130471706390381, -1.6758904457092285, -1.2213091850280762, -0.766727864742279, -0.31214654445648193, 0.14243483543395996, 0.5970160961151123, 1.0515973567962646, 1.506178855895996, 1.9607601165771484, 2.415342330932617, 2.8699235916137695, 3.324504852294922, 3.7790863513946533, 4.233667373657227, 4.688248634338379, 5.1428303718566895, 5.597411632537842, 6.051992893218994, 6.5065741539001465, 6.961155414581299, 7.415737152099609, 7.870318412780762, 8.324899673461914, 8.779480934143066, 9.234062194824219, 9.688643455505371, 10.143224716186523, 10.597805976867676, 11.052387237548828, 11.50696849822998, 11.961549758911133, 12.416131973266602, 12.870712280273438, 13.325294494628906, 13.779875755310059, 14.234457015991211, 14.689038276672363, 15.143619537353516, 15.598200798034668, 16.05278205871582, 16.50736427307129, 16.961944580078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 17.0, 6.0, 16.0, 12.0, 16.0, 22.0, 18.0, 29.0, 36.0, 33.0, 38.0, 48.0, 41.0, 44.0, 44.0, 45.0, 33.0, 40.0, 54.0, 24.0, 46.0, 41.0, 24.0, 28.0, 40.0, 31.0, 22.0, 19.0, 18.0, 12.0, 13.0, 19.0, 13.0, 7.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.43345832824707, -9.149964332580566, -8.866470336914062, -8.582977294921875, -8.299483299255371, -8.015989303588867, -7.732495307922363, -7.449001312255859, -7.165507793426514, -6.88201379776001, -6.598520278930664, -6.31502628326416, -6.031532287597656, -5.7480387687683105, -5.464544773101807, -5.181051254272461, -4.897557258605957, -4.614063262939453, -4.330569744110107, -4.0470757484436035, -3.7635819911956787, -3.480088233947754, -3.19659423828125, -2.913100481033325, -2.6296067237854004, -2.3461129665374756, -2.062619209289551, -1.7791252136230469, -1.495631456375122, -1.2121376991271973, -0.9286438226699829, -0.6451499462127686, -0.36165618896484375, -0.07816237211227417, 0.2053314447402954, 0.488825261592865, 0.7723190784454346, 1.0558128356933594, 1.3393067121505737, 1.622800588607788, 1.906294345855713, 2.1897881031036377, 2.4732818603515625, 2.7567758560180664, 3.040269613265991, 3.323763370513916, 3.60725736618042, 3.8907511234283447, 4.1742448806762695, 4.457738876342773, 4.741232395172119, 5.024726390838623, 5.308219909667969, 5.591713905334473, 5.875207901000977, 6.1587018966674805, 6.442195415496826, 6.72568941116333, 7.009182929992676, 7.29267692565918, 7.576170921325684, 7.859664440155029, 8.143157958984375, 8.426651954650879, 8.710145950317383]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 5.0, 5.0, 12.0, 21.0, 24.0, 40.0, 64.0, 88.0, 110.0, 184.0, 255.0, 407.0, 590.0, 984.0, 1510.0, 2510.0, 3745.0, 6143.0, 10231.0, 16670.0, 28084.0, 46879.0, 77675.0, 122588.0, 167851.0, 178076.0, 142943.0, 94622.0, 57504.0, 34640.0, 21190.0, 12551.0, 7485.0, 4697.0, 3000.0, 1857.0, 1127.0, 745.0, 452.0, 306.0, 225.0, 138.0, 99.0, 73.0, 47.0, 37.0, 20.0, 17.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.76171875, -7.51300048828125, -7.2642822265625, -7.01556396484375, -6.766845703125, -6.51812744140625, -6.2694091796875, -6.02069091796875, -5.77197265625, -5.52325439453125, -5.2745361328125, -5.02581787109375, -4.777099609375, -4.52838134765625, -4.2796630859375, -4.03094482421875, -3.7822265625, -3.53350830078125, -3.2847900390625, -3.03607177734375, -2.787353515625, -2.53863525390625, -2.2899169921875, -2.04119873046875, -1.79248046875, -1.54376220703125, -1.2950439453125, -1.04632568359375, -0.797607421875, -0.54888916015625, -0.3001708984375, -0.05145263671875, 0.197265625, 0.44598388671875, 0.6947021484375, 0.94342041015625, 1.192138671875, 1.44085693359375, 1.6895751953125, 1.93829345703125, 2.18701171875, 2.43572998046875, 2.6844482421875, 2.93316650390625, 3.181884765625, 3.43060302734375, 3.6793212890625, 3.92803955078125, 4.1767578125, 4.42547607421875, 4.6741943359375, 4.92291259765625, 5.171630859375, 5.42034912109375, 5.6690673828125, 5.91778564453125, 6.16650390625, 6.41522216796875, 6.6639404296875, 6.91265869140625, 7.161376953125, 7.41009521484375, 7.6588134765625, 7.90753173828125, 8.15625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 6.0, 12.0, 4.0, 9.0, 14.0, 17.0, 11.0, 18.0, 21.0, 28.0, 20.0, 38.0, 41.0, 35.0, 42.0, 42.0, 48.0, 45.0, 44.0, 40.0, 52.0, 42.0, 31.0, 42.0, 37.0, 35.0, 36.0, 31.0, 19.0, 17.0, 23.0, 17.0, 14.0, 15.0, 10.0, 11.0, 4.0, 5.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6590576171875, -8.349365234375, -8.0396728515625, -7.72998046875, -7.4202880859375, -7.110595703125, -6.8009033203125, -6.4912109375, -6.1815185546875, -5.871826171875, -5.5621337890625, -5.25244140625, -4.9427490234375, -4.633056640625, -4.3233642578125, -4.013671875, -3.7039794921875, -3.394287109375, -3.0845947265625, -2.77490234375, -2.4652099609375, -2.155517578125, -1.8458251953125, -1.5361328125, -1.2264404296875, -0.916748046875, -0.6070556640625, -0.29736328125, 0.0123291015625, 0.322021484375, 0.6317138671875, 0.94140625, 1.2510986328125, 1.560791015625, 1.8704833984375, 2.18017578125, 2.4898681640625, 2.799560546875, 3.1092529296875, 3.4189453125, 3.7286376953125, 4.038330078125, 4.3480224609375, 4.65771484375, 4.9674072265625, 5.277099609375, 5.5867919921875, 5.896484375, 6.2061767578125, 6.515869140625, 6.8255615234375, 7.13525390625, 7.4449462890625, 7.754638671875, 8.0643310546875, 8.3740234375, 8.6837158203125, 8.993408203125, 9.3031005859375, 9.61279296875, 9.9224853515625, 10.232177734375, 10.5418701171875, 10.8515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 10.0, 10.0, 8.0, 14.0, 19.0, 27.0, 41.0, 47.0, 79.0, 114.0, 192.0, 276.0, 428.0, 669.0, 1233.0, 2074.0, 3807.0, 7820.0, 17326.0, 43573.0, 115734.0, 284676.0, 325558.0, 148159.0, 54883.0, 21754.0, 9537.0, 4580.0, 2395.0, 1323.0, 754.0, 496.0, 297.0, 192.0, 117.0, 94.0, 62.0, 49.0, 27.0, 24.0, 11.0, 12.0, 10.0, 9.0, 5.0, 2.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-17.515625, -16.98681640625, -16.4580078125, -15.92919921875, -15.400390625, -14.87158203125, -14.3427734375, -13.81396484375, -13.28515625, -12.75634765625, -12.2275390625, -11.69873046875, -11.169921875, -10.64111328125, -10.1123046875, -9.58349609375, -9.0546875, -8.52587890625, -7.9970703125, -7.46826171875, -6.939453125, -6.41064453125, -5.8818359375, -5.35302734375, -4.82421875, -4.29541015625, -3.7666015625, -3.23779296875, -2.708984375, -2.18017578125, -1.6513671875, -1.12255859375, -0.59375, -0.06494140625, 0.4638671875, 0.99267578125, 1.521484375, 2.05029296875, 2.5791015625, 3.10791015625, 3.63671875, 4.16552734375, 4.6943359375, 5.22314453125, 5.751953125, 6.28076171875, 6.8095703125, 7.33837890625, 7.8671875, 8.39599609375, 8.9248046875, 9.45361328125, 9.982421875, 10.51123046875, 11.0400390625, 11.56884765625, 12.09765625, 12.62646484375, 13.1552734375, 13.68408203125, 14.212890625, 14.74169921875, 15.2705078125, 15.79931640625, 16.328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 5.0, 12.0, 9.0, 6.0, 15.0, 19.0, 18.0, 18.0, 24.0, 26.0, 30.0, 28.0, 38.0, 20.0, 41.0, 37.0, 42.0, 38.0, 37.0, 48.0, 32.0, 45.0, 36.0, 38.0, 29.0, 28.0, 34.0, 30.0, 35.0, 22.0, 23.0, 12.0, 19.0, 19.0, 13.0, 14.0, 12.0, 4.0, 12.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.5234375, -5.3529052734375, -5.182373046875, -5.0118408203125, -4.84130859375, -4.6707763671875, -4.500244140625, -4.3297119140625, -4.1591796875, -3.9886474609375, -3.818115234375, -3.6475830078125, -3.47705078125, -3.3065185546875, -3.135986328125, -2.9654541015625, -2.794921875, -2.6243896484375, -2.453857421875, -2.2833251953125, -2.11279296875, -1.9422607421875, -1.771728515625, -1.6011962890625, -1.4306640625, -1.2601318359375, -1.089599609375, -0.9190673828125, -0.74853515625, -0.5780029296875, -0.407470703125, -0.2369384765625, -0.06640625, 0.1041259765625, 0.274658203125, 0.4451904296875, 0.61572265625, 0.7862548828125, 0.956787109375, 1.1273193359375, 1.2978515625, 1.4683837890625, 1.638916015625, 1.8094482421875, 1.97998046875, 2.1505126953125, 2.321044921875, 2.4915771484375, 2.662109375, 2.8326416015625, 3.003173828125, 3.1737060546875, 3.34423828125, 3.5147705078125, 3.685302734375, 3.8558349609375, 4.0263671875, 4.1968994140625, 4.367431640625, 4.5379638671875, 4.70849609375, 4.8790283203125, 5.049560546875, 5.2200927734375, 5.390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 22.0, 39.0, 61.0, 98.0, 161.0, 262.0, 458.0, 764.0, 1325.0, 2279.0, 4277.0, 8420.0, 17622.0, 40722.0, 102550.0, 260103.0, 340926.0, 158217.0, 60431.0, 25138.0, 11720.0, 5752.0, 3061.0, 1642.0, 968.0, 557.0, 383.0, 200.0, 139.0, 82.0, 47.0, 33.0, 21.0, 23.0, 5.0, 5.0, 8.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2884521484375, -8.990966796875, -8.6934814453125, -8.39599609375, -8.0985107421875, -7.801025390625, -7.5035400390625, -7.2060546875, -6.9085693359375, -6.611083984375, -6.3135986328125, -6.01611328125, -5.7186279296875, -5.421142578125, -5.1236572265625, -4.826171875, -4.5286865234375, -4.231201171875, -3.9337158203125, -3.63623046875, -3.3387451171875, -3.041259765625, -2.7437744140625, -2.4462890625, -2.1488037109375, -1.851318359375, -1.5538330078125, -1.25634765625, -0.9588623046875, -0.661376953125, -0.3638916015625, -0.06640625, 0.2310791015625, 0.528564453125, 0.8260498046875, 1.12353515625, 1.4210205078125, 1.718505859375, 2.0159912109375, 2.3134765625, 2.6109619140625, 2.908447265625, 3.2059326171875, 3.50341796875, 3.8009033203125, 4.098388671875, 4.3958740234375, 4.693359375, 4.9908447265625, 5.288330078125, 5.5858154296875, 5.88330078125, 6.1807861328125, 6.478271484375, 6.7757568359375, 7.0732421875, 7.3707275390625, 7.668212890625, 7.9656982421875, 8.26318359375, 8.5606689453125, 8.858154296875, 9.1556396484375, 9.453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 13.0, 11.0, 22.0, 14.0, 34.0, 30.0, 42.0, 52.0, 60.0, 61.0, 54.0, 71.0, 73.0, 66.0, 59.0, 54.0, 55.0, 39.0, 30.0, 28.0, 22.0, 20.0, 10.0, 11.0, 9.0, 8.0, 12.0, 8.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00039005279541015625, -0.0003794766962528229, -0.0003689005970954895, -0.00035832449793815613, -0.00034774839878082275, -0.0003371722996234894, -0.000326596200466156, -0.00031602010130882263, -0.00030544400215148926, -0.0002948679029941559, -0.0002842918038368225, -0.00027371570467948914, -0.00026313960552215576, -0.0002525635063648224, -0.00024198740720748901, -0.00023141130805015564, -0.00022083520889282227, -0.0002102591097354889, -0.00019968301057815552, -0.00018910691142082214, -0.00017853081226348877, -0.0001679547131061554, -0.00015737861394882202, -0.00014680251479148865, -0.00013622641563415527, -0.0001256503164768219, -0.00011507421731948853, -0.00010449811816215515, -9.392201900482178e-05, -8.33459198474884e-05, -7.276982069015503e-05, -6.219372153282166e-05, -5.161762237548828e-05, -4.104152321815491e-05, -3.0465424060821533e-05, -1.988932490348816e-05, -9.313225746154785e-06, 1.2628734111785889e-06, 1.1838972568511963e-05, 2.2415071725845337e-05, 3.299117088317871e-05, 4.3567270040512085e-05, 5.414336919784546e-05, 6.471946835517883e-05, 7.529556751251221e-05, 8.587166666984558e-05, 9.644776582717896e-05, 0.00010702386498451233, 0.0001175999641418457, 0.00012817606329917908, 0.00013875216245651245, 0.00014932826161384583, 0.0001599043607711792, 0.00017048045992851257, 0.00018105655908584595, 0.00019163265824317932, 0.0002022087574005127, 0.00021278485655784607, 0.00022336095571517944, 0.00023393705487251282, 0.0002445131540298462, 0.00025508925318717957, 0.00026566535234451294, 0.0002762414515018463, 0.0002868175506591797]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 20.0, 24.0, 25.0, 41.0, 54.0, 64.0, 96.0, 169.0, 224.0, 329.0, 475.0, 743.0, 1094.0, 1656.0, 2583.0, 3973.0, 6329.0, 9845.0, 16816.0, 28510.0, 49808.0, 87376.0, 143634.0, 196489.0, 186728.0, 128485.0, 75587.0, 42901.0, 24887.0, 14834.0, 8819.0, 5514.0, 3602.0, 2223.0, 1512.0, 1043.0, 636.0, 456.0, 280.0, 190.0, 127.0, 114.0, 60.0, 44.0, 28.0, 26.0, 18.0, 15.0, 9.0, 9.0, 5.0, 1.0, 7.0, 3.0, 1.0], "bins": [-6.921875, -6.7113037109375, -6.500732421875, -6.2901611328125, -6.07958984375, -5.8690185546875, -5.658447265625, -5.4478759765625, -5.2373046875, -5.0267333984375, -4.816162109375, -4.6055908203125, -4.39501953125, -4.1844482421875, -3.973876953125, -3.7633056640625, -3.552734375, -3.3421630859375, -3.131591796875, -2.9210205078125, -2.71044921875, -2.4998779296875, -2.289306640625, -2.0787353515625, -1.8681640625, -1.6575927734375, -1.447021484375, -1.2364501953125, -1.02587890625, -0.8153076171875, -0.604736328125, -0.3941650390625, -0.18359375, 0.0269775390625, 0.237548828125, 0.4481201171875, 0.65869140625, 0.8692626953125, 1.079833984375, 1.2904052734375, 1.5009765625, 1.7115478515625, 1.922119140625, 2.1326904296875, 2.34326171875, 2.5538330078125, 2.764404296875, 2.9749755859375, 3.185546875, 3.3961181640625, 3.606689453125, 3.8172607421875, 4.02783203125, 4.2384033203125, 4.448974609375, 4.6595458984375, 4.8701171875, 5.0806884765625, 5.291259765625, 5.5018310546875, 5.71240234375, 5.9229736328125, 6.133544921875, 6.3441162109375, 6.5546875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 6.0, 7.0, 5.0, 15.0, 11.0, 20.0, 23.0, 35.0, 40.0, 52.0, 72.0, 77.0, 91.0, 87.0, 92.0, 81.0, 69.0, 46.0, 44.0, 25.0, 19.0, 12.0, 13.0, 12.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.574920654296875, -2.47991943359375, -2.384918212890625, -2.2899169921875, -2.194915771484375, -2.09991455078125, -2.004913330078125, -1.909912109375, -1.814910888671875, -1.71990966796875, -1.624908447265625, -1.5299072265625, -1.434906005859375, -1.33990478515625, -1.244903564453125, -1.14990234375, -1.054901123046875, -0.95989990234375, -0.864898681640625, -0.7698974609375, -0.674896240234375, -0.57989501953125, -0.484893798828125, -0.389892578125, -0.294891357421875, -0.19989013671875, -0.104888916015625, -0.0098876953125, 0.085113525390625, 0.18011474609375, 0.275115966796875, 0.3701171875, 0.465118408203125, 0.56011962890625, 0.655120849609375, 0.7501220703125, 0.845123291015625, 0.94012451171875, 1.035125732421875, 1.130126953125, 1.225128173828125, 1.32012939453125, 1.415130615234375, 1.5101318359375, 1.605133056640625, 1.70013427734375, 1.795135498046875, 1.89013671875, 1.985137939453125, 2.08013916015625, 2.175140380859375, 2.2701416015625, 2.365142822265625, 2.46014404296875, 2.555145263671875, 2.650146484375, 2.745147705078125, 2.84014892578125, 2.935150146484375, 3.0301513671875, 3.125152587890625, 3.22015380859375, 3.315155029296875, 3.41015625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 4.0, 10.0, 21.0, 17.0, 23.0, 31.0, 22.0, 54.0, 42.0, 48.0, 71.0, 63.0, 52.0, 69.0, 68.0, 63.0, 67.0, 47.0, 42.0, 35.0, 29.0, 37.0, 20.0, 19.0, 4.0, 14.0, 5.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.911978721618652, -12.421529769897461, -11.93108081817627, -11.440631866455078, -10.950182914733887, -10.459733963012695, -9.96928596496582, -9.478836059570312, -8.988388061523438, -8.497939109802246, -8.007490158081055, -7.517041206359863, -7.026592254638672, -6.5361433029174805, -6.045694828033447, -5.555245876312256, -5.064796447753906, -4.574347496032715, -4.083898544311523, -3.593449831008911, -3.1030008792877197, -2.6125519275665283, -2.122103214263916, -1.6316542625427246, -1.1412053108215332, -0.6507564187049866, -0.16030752658843994, 0.3301413059234619, 0.8205902576446533, 1.3110392093658447, 1.801487922668457, 2.2919368743896484, 2.7823848724365234, 3.272833824157715, 3.7632827758789062, 4.253731727600098, 4.744180679321289, 5.2346296310424805, 5.725078105926514, 6.215527057647705, 6.7059760093688965, 7.196424961090088, 7.686873912811279, 8.177322387695312, 8.667771339416504, 9.158220291137695, 9.648669242858887, 10.139118194580078, 10.62956714630127, 11.120016098022461, 11.610465049743652, 12.100914001464844, 12.591362953186035, 13.081811904907227, 13.572259902954102, 14.06270980834961, 14.553157806396484, 15.043606758117676, 15.534055709838867, 16.024503707885742, 16.51495361328125, 17.005401611328125, 17.495851516723633, 17.986299514770508, 18.476749420166016]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 10.0, 7.0, 22.0, 18.0, 24.0, 20.0, 26.0, 41.0, 30.0, 39.0, 47.0, 41.0, 52.0, 48.0, 43.0, 41.0, 48.0, 41.0, 42.0, 33.0, 33.0, 38.0, 33.0, 27.0, 31.0, 26.0, 18.0, 15.0, 15.0, 13.0, 12.0, 14.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.819650650024414, -9.521260261535645, -9.222870826721191, -8.924480438232422, -8.626090049743652, -8.327699661254883, -8.02931022644043, -7.73091983795166, -7.432529926300049, -7.1341400146484375, -6.835749626159668, -6.537359714508057, -6.238969802856445, -5.940579414367676, -5.6421895027160645, -5.343799591064453, -5.045409202575684, -4.747019290924072, -4.448628902435303, -4.150238990783691, -3.851848840713501, -3.5534586906433105, -3.255068778991699, -2.956678628921509, -2.6582884788513184, -2.359898328781128, -2.0615081787109375, -1.7631182670593262, -1.4647281169891357, -1.1663379669189453, -0.8679479360580444, -0.5695579051971436, -0.2711668014526367, 0.027223289012908936, 0.3256133794784546, 0.6240034699440002, 0.9223935604095459, 1.2207837104797363, 1.5191737413406372, 1.817563772201538, 2.1159539222717285, 2.414344072341919, 2.7127342224121094, 3.0111241340637207, 3.309514284133911, 3.6079044342041016, 3.906294345855713, 4.204684257507324, 4.503074645996094, 4.801464557647705, 5.099854946136475, 5.398244857788086, 5.6966352462768555, 5.995025157928467, 6.293415069580078, 6.591805458068848, 6.890195369720459, 7.18858528137207, 7.48697566986084, 7.785365581512451, 8.083755493164062, 8.382145881652832, 8.680536270141602, 8.978925704956055, 9.277316093444824]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 20.0, 11.0, 25.0, 42.0, 54.0, 79.0, 148.0, 181.0, 317.0, 458.0, 674.0, 1081.0, 1595.0, 2605.0, 4193.0, 6472.0, 10389.0, 16519.0, 26047.0, 40650.0, 62421.0, 91461.0, 122403.0, 142722.0, 142144.0, 119889.0, 88653.0, 60291.0, 39058.0, 25007.0, 15830.0, 9821.0, 6225.0, 3886.0, 2608.0, 1578.0, 1081.0, 605.0, 424.0, 288.0, 201.0, 132.0, 98.0, 54.0, 38.0, 31.0, 22.0, 8.0, 6.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.11328125, -6.88348388671875, -6.6536865234375, -6.42388916015625, -6.194091796875, -5.96429443359375, -5.7344970703125, -5.50469970703125, -5.27490234375, -5.04510498046875, -4.8153076171875, -4.58551025390625, -4.355712890625, -4.12591552734375, -3.8961181640625, -3.66632080078125, -3.4365234375, -3.20672607421875, -2.9769287109375, -2.74713134765625, -2.517333984375, -2.28753662109375, -2.0577392578125, -1.82794189453125, -1.59814453125, -1.36834716796875, -1.1385498046875, -0.90875244140625, -0.678955078125, -0.44915771484375, -0.2193603515625, 0.01043701171875, 0.240234375, 0.47003173828125, 0.6998291015625, 0.92962646484375, 1.159423828125, 1.38922119140625, 1.6190185546875, 1.84881591796875, 2.07861328125, 2.30841064453125, 2.5382080078125, 2.76800537109375, 2.997802734375, 3.22760009765625, 3.4573974609375, 3.68719482421875, 3.9169921875, 4.14678955078125, 4.3765869140625, 4.60638427734375, 4.836181640625, 5.06597900390625, 5.2957763671875, 5.52557373046875, 5.75537109375, 5.98516845703125, 6.2149658203125, 6.44476318359375, 6.674560546875, 6.90435791015625, 7.1341552734375, 7.36395263671875, 7.59375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 4.0, 13.0, 19.0, 16.0, 16.0, 12.0, 21.0, 29.0, 37.0, 26.0, 21.0, 40.0, 47.0, 42.0, 45.0, 47.0, 45.0, 41.0, 30.0, 33.0, 37.0, 38.0, 38.0, 31.0, 27.0, 31.0, 25.0, 24.0, 20.0, 18.0, 20.0, 21.0, 9.0, 12.0, 5.0, 7.0, 5.0, 8.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2265625, -8.9312744140625, -8.635986328125, -8.3406982421875, -8.04541015625, -7.7501220703125, -7.454833984375, -7.1595458984375, -6.8642578125, -6.5689697265625, -6.273681640625, -5.9783935546875, -5.68310546875, -5.3878173828125, -5.092529296875, -4.7972412109375, -4.501953125, -4.2066650390625, -3.911376953125, -3.6160888671875, -3.32080078125, -3.0255126953125, -2.730224609375, -2.4349365234375, -2.1396484375, -1.8443603515625, -1.549072265625, -1.2537841796875, -0.95849609375, -0.6632080078125, -0.367919921875, -0.0726318359375, 0.22265625, 0.5179443359375, 0.813232421875, 1.1085205078125, 1.40380859375, 1.6990966796875, 1.994384765625, 2.2896728515625, 2.5849609375, 2.8802490234375, 3.175537109375, 3.4708251953125, 3.76611328125, 4.0614013671875, 4.356689453125, 4.6519775390625, 4.947265625, 5.2425537109375, 5.537841796875, 5.8331298828125, 6.12841796875, 6.4237060546875, 6.718994140625, 7.0142822265625, 7.3095703125, 7.6048583984375, 7.900146484375, 8.1954345703125, 8.49072265625, 8.7860107421875, 9.081298828125, 9.3765869140625, 9.671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 10.0, 6.0, 17.0, 20.0, 31.0, 65.0, 85.0, 128.0, 186.0, 277.0, 384.0, 621.0, 924.0, 1350.0, 2172.0, 3384.0, 5307.0, 8233.0, 13080.0, 20131.0, 31417.0, 47837.0, 70902.0, 99867.0, 126972.0, 142246.0, 132654.0, 107561.0, 78701.0, 53877.0, 36026.0, 23091.0, 14579.0, 9338.0, 6048.0, 3826.0, 2473.0, 1633.0, 1022.0, 706.0, 454.0, 304.0, 198.0, 142.0, 85.0, 58.0, 41.0, 42.0, 14.0, 16.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-7.640625, -7.399169921875, -7.15771484375, -6.916259765625, -6.6748046875, -6.433349609375, -6.19189453125, -5.950439453125, -5.708984375, -5.467529296875, -5.22607421875, -4.984619140625, -4.7431640625, -4.501708984375, -4.26025390625, -4.018798828125, -3.77734375, -3.535888671875, -3.29443359375, -3.052978515625, -2.8115234375, -2.570068359375, -2.32861328125, -2.087158203125, -1.845703125, -1.604248046875, -1.36279296875, -1.121337890625, -0.8798828125, -0.638427734375, -0.39697265625, -0.155517578125, 0.0859375, 0.327392578125, 0.56884765625, 0.810302734375, 1.0517578125, 1.293212890625, 1.53466796875, 1.776123046875, 2.017578125, 2.259033203125, 2.50048828125, 2.741943359375, 2.9833984375, 3.224853515625, 3.46630859375, 3.707763671875, 3.94921875, 4.190673828125, 4.43212890625, 4.673583984375, 4.9150390625, 5.156494140625, 5.39794921875, 5.639404296875, 5.880859375, 6.122314453125, 6.36376953125, 6.605224609375, 6.8466796875, 7.088134765625, 7.32958984375, 7.571044921875, 7.8125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 6.0, 8.0, 5.0, 12.0, 20.0, 12.0, 19.0, 21.0, 12.0, 32.0, 36.0, 33.0, 36.0, 43.0, 39.0, 42.0, 41.0, 29.0, 44.0, 46.0, 40.0, 27.0, 34.0, 35.0, 36.0, 30.0, 41.0, 31.0, 29.0, 19.0, 19.0, 22.0, 23.0, 24.0, 11.0, 10.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.33203125, -6.13580322265625, -5.9395751953125, -5.74334716796875, -5.547119140625, -5.35089111328125, -5.1546630859375, -4.95843505859375, -4.76220703125, -4.56597900390625, -4.3697509765625, -4.17352294921875, -3.977294921875, -3.78106689453125, -3.5848388671875, -3.38861083984375, -3.1923828125, -2.99615478515625, -2.7999267578125, -2.60369873046875, -2.407470703125, -2.21124267578125, -2.0150146484375, -1.81878662109375, -1.62255859375, -1.42633056640625, -1.2301025390625, -1.03387451171875, -0.837646484375, -0.64141845703125, -0.4451904296875, -0.24896240234375, -0.052734375, 0.14349365234375, 0.3397216796875, 0.53594970703125, 0.732177734375, 0.92840576171875, 1.1246337890625, 1.32086181640625, 1.51708984375, 1.71331787109375, 1.9095458984375, 2.10577392578125, 2.302001953125, 2.49822998046875, 2.6944580078125, 2.89068603515625, 3.0869140625, 3.28314208984375, 3.4793701171875, 3.67559814453125, 3.871826171875, 4.06805419921875, 4.2642822265625, 4.46051025390625, 4.65673828125, 4.85296630859375, 5.0491943359375, 5.24542236328125, 5.441650390625, 5.63787841796875, 5.8341064453125, 6.03033447265625, 6.2265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 11.0, 12.0, 17.0, 32.0, 38.0, 76.0, 103.0, 150.0, 249.0, 387.0, 583.0, 850.0, 1316.0, 2146.0, 3423.0, 5654.0, 10243.0, 18308.0, 36437.0, 72005.0, 139573.0, 217800.0, 224226.0, 149260.0, 79334.0, 39438.0, 20207.0, 10801.0, 6002.0, 3694.0, 2200.0, 1383.0, 897.0, 576.0, 384.0, 249.0, 161.0, 114.0, 66.0, 42.0, 34.0, 28.0, 17.0, 9.0, 10.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26953125, -6.06097412109375, -5.8524169921875, -5.64385986328125, -5.435302734375, -5.22674560546875, -5.0181884765625, -4.80963134765625, -4.60107421875, -4.39251708984375, -4.1839599609375, -3.97540283203125, -3.766845703125, -3.55828857421875, -3.3497314453125, -3.14117431640625, -2.9326171875, -2.72406005859375, -2.5155029296875, -2.30694580078125, -2.098388671875, -1.88983154296875, -1.6812744140625, -1.47271728515625, -1.26416015625, -1.05560302734375, -0.8470458984375, -0.63848876953125, -0.429931640625, -0.22137451171875, -0.0128173828125, 0.19573974609375, 0.404296875, 0.61285400390625, 0.8214111328125, 1.02996826171875, 1.238525390625, 1.44708251953125, 1.6556396484375, 1.86419677734375, 2.07275390625, 2.28131103515625, 2.4898681640625, 2.69842529296875, 2.906982421875, 3.11553955078125, 3.3240966796875, 3.53265380859375, 3.7412109375, 3.94976806640625, 4.1583251953125, 4.36688232421875, 4.575439453125, 4.78399658203125, 4.9925537109375, 5.20111083984375, 5.40966796875, 5.61822509765625, 5.8267822265625, 6.03533935546875, 6.243896484375, 6.45245361328125, 6.6610107421875, 6.86956787109375, 7.078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 10.0, 11.0, 20.0, 16.0, 37.0, 41.0, 49.0, 65.0, 107.0, 136.0, 121.0, 106.0, 77.0, 59.0, 45.0, 26.0, 20.0, 12.0, 8.0, 7.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007772445678710938, -0.0007472783327102661, -0.0007173120975494385, -0.0006873458623886108, -0.0006573796272277832, -0.0006274133920669556, -0.0005974471569061279, -0.0005674809217453003, -0.0005375146865844727, -0.000507548451423645, -0.0004775822162628174, -0.00044761598110198975, -0.0004176497459411621, -0.00038768351078033447, -0.00035771727561950684, -0.0003277510404586792, -0.00029778480529785156, -0.0002678185701370239, -0.0002378523349761963, -0.00020788609981536865, -0.00017791986465454102, -0.00014795362949371338, -0.00011798739433288574, -8.80211591720581e-05, -5.805492401123047e-05, -2.8088688850402832e-05, 1.8775463104248047e-06, 3.184378147125244e-05, 6.181001663208008e-05, 9.177625179290771e-05, 0.00012174248695373535, 0.000151708722114563, 0.00018167495727539062, 0.00021164119243621826, 0.0002416074275970459, 0.00027157366275787354, 0.00030153989791870117, 0.0003315061330795288, 0.00036147236824035645, 0.0003914386034011841, 0.0004214048385620117, 0.00045137107372283936, 0.000481337308883667, 0.0005113035440444946, 0.0005412697792053223, 0.0005712360143661499, 0.0006012022495269775, 0.0006311684846878052, 0.0006611347198486328, 0.0006911009550094604, 0.0007210671901702881, 0.0007510334253311157, 0.0007809996604919434, 0.000810965895652771, 0.0008409321308135986, 0.0008708983659744263, 0.0009008646011352539, 0.0009308308362960815, 0.0009607970714569092, 0.0009907633066177368, 0.0010207295417785645, 0.001050695776939392, 0.0010806620121002197, 0.0011106282472610474, 0.001140594482421875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 9.0, 9.0, 7.0, 21.0, 33.0, 40.0, 49.0, 89.0, 115.0, 170.0, 207.0, 278.0, 475.0, 642.0, 865.0, 1248.0, 1902.0, 2615.0, 4073.0, 6118.0, 9525.0, 14695.0, 23134.0, 37534.0, 59805.0, 93722.0, 134896.0, 161987.0, 155917.0, 119559.0, 80109.0, 50257.0, 31976.0, 19619.0, 12548.0, 7905.0, 5251.0, 3453.0, 2415.0, 1605.0, 1109.0, 744.0, 581.0, 379.0, 248.0, 181.0, 123.0, 98.0, 83.0, 43.0, 37.0, 14.0, 14.0, 14.0, 7.0, 2.0, 4.0, 5.0, 1.0, 3.0], "bins": [-4.7421875, -4.5931396484375, -4.444091796875, -4.2950439453125, -4.14599609375, -3.9969482421875, -3.847900390625, -3.6988525390625, -3.5498046875, -3.4007568359375, -3.251708984375, -3.1026611328125, -2.95361328125, -2.8045654296875, -2.655517578125, -2.5064697265625, -2.357421875, -2.2083740234375, -2.059326171875, -1.9102783203125, -1.76123046875, -1.6121826171875, -1.463134765625, -1.3140869140625, -1.1650390625, -1.0159912109375, -0.866943359375, -0.7178955078125, -0.56884765625, -0.4197998046875, -0.270751953125, -0.1217041015625, 0.02734375, 0.1763916015625, 0.325439453125, 0.4744873046875, 0.62353515625, 0.7725830078125, 0.921630859375, 1.0706787109375, 1.2197265625, 1.3687744140625, 1.517822265625, 1.6668701171875, 1.81591796875, 1.9649658203125, 2.114013671875, 2.2630615234375, 2.412109375, 2.5611572265625, 2.710205078125, 2.8592529296875, 3.00830078125, 3.1573486328125, 3.306396484375, 3.4554443359375, 3.6044921875, 3.7535400390625, 3.902587890625, 4.0516357421875, 4.20068359375, 4.3497314453125, 4.498779296875, 4.6478271484375, 4.796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 16.0, 16.0, 17.0, 20.0, 20.0, 29.0, 32.0, 36.0, 45.0, 57.0, 45.0, 56.0, 74.0, 70.0, 56.0, 59.0, 50.0, 39.0, 43.0, 28.0, 28.0, 28.0, 18.0, 17.0, 9.0, 12.0, 9.0, 11.0, 8.0, 12.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7685546875, -1.713287353515625, -1.65802001953125, -1.602752685546875, -1.5474853515625, -1.492218017578125, -1.43695068359375, -1.381683349609375, -1.326416015625, -1.271148681640625, -1.21588134765625, -1.160614013671875, -1.1053466796875, -1.050079345703125, -0.99481201171875, -0.939544677734375, -0.88427734375, -0.829010009765625, -0.77374267578125, -0.718475341796875, -0.6632080078125, -0.607940673828125, -0.55267333984375, -0.497406005859375, -0.442138671875, -0.386871337890625, -0.33160400390625, -0.276336669921875, -0.2210693359375, -0.165802001953125, -0.11053466796875, -0.055267333984375, 0.0, 0.055267333984375, 0.11053466796875, 0.165802001953125, 0.2210693359375, 0.276336669921875, 0.33160400390625, 0.386871337890625, 0.442138671875, 0.497406005859375, 0.55267333984375, 0.607940673828125, 0.6632080078125, 0.718475341796875, 0.77374267578125, 0.829010009765625, 0.88427734375, 0.939544677734375, 0.99481201171875, 1.050079345703125, 1.1053466796875, 1.160614013671875, 1.21588134765625, 1.271148681640625, 1.326416015625, 1.381683349609375, 1.43695068359375, 1.492218017578125, 1.5474853515625, 1.602752685546875, 1.65802001953125, 1.713287353515625, 1.7685546875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 7.0, 11.0, 13.0, 18.0, 21.0, 37.0, 21.0, 33.0, 40.0, 45.0, 48.0, 70.0, 53.0, 61.0, 55.0, 66.0, 63.0, 55.0, 46.0, 42.0, 34.0, 25.0, 23.0, 26.0, 21.0, 21.0, 9.0, 5.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75258731842041, -13.276729583740234, -12.800870895385742, -12.32501220703125, -11.849154472351074, -11.373296737670898, -10.897438049316406, -10.421579360961914, -9.945721626281738, -9.469863891601562, -8.99400520324707, -8.518146514892578, -8.042288780212402, -7.566430568695068, -7.090572357177734, -6.6147141456604, -6.138855934143066, -5.662997722625732, -5.187139511108398, -4.7112812995910645, -4.2354230880737305, -3.7595648765563965, -3.2837066650390625, -2.8078484535217285, -2.3319902420043945, -1.8561320304870605, -1.3802738189697266, -0.9044156074523926, -0.4285573959350586, 0.04730081558227539, 0.5231590270996094, 0.9990172386169434, 1.4748764038085938, 1.9507346153259277, 2.4265928268432617, 2.9024510383605957, 3.3783092498779297, 3.8541674613952637, 4.330025672912598, 4.805883884429932, 5.281742095947266, 5.7576003074646, 6.233458518981934, 6.709316730499268, 7.185174942016602, 7.6610331535339355, 8.13689136505127, 8.612749099731445, 9.088607788085938, 9.56446647644043, 10.040324211120605, 10.516181945800781, 10.992040634155273, 11.467899322509766, 11.943757057189941, 12.419614791870117, 12.89547348022461, 13.371332168579102, 13.847189903259277, 14.323047637939453, 14.798906326293945, 15.274765014648438, 15.750622749328613, 16.22648048400879, 16.70233917236328]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 7.0, 12.0, 11.0, 13.0, 16.0, 13.0, 24.0, 22.0, 21.0, 33.0, 37.0, 34.0, 37.0, 40.0, 34.0, 54.0, 35.0, 46.0, 59.0, 38.0, 36.0, 38.0, 43.0, 43.0, 34.0, 26.0, 22.0, 29.0, 23.0, 22.0, 14.0, 14.0, 12.0, 11.0, 5.0, 6.0, 10.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.46254825592041, -9.14201545715332, -8.82148265838623, -8.500950813293457, -8.180418014526367, -7.859885215759277, -7.5393524169921875, -7.218819618225098, -6.898287296295166, -6.577754497528076, -6.2572221755981445, -5.936689376831055, -5.616156578063965, -5.295624256134033, -4.975091457366943, -4.654559135437012, -4.334026336669922, -4.013493537902832, -3.6929612159729004, -3.3724284172058105, -3.0518958568573, -2.731363296508789, -2.410830497741699, -2.0902979373931885, -1.7697653770446777, -1.449232816696167, -1.1287001371383667, -0.8081675171852112, -0.48763489723205566, -0.16710233688354492, 0.15343034267425537, 0.47396302223205566, 0.7944965362548828, 1.1150290966033936, 1.4355617761611938, 1.7560944557189941, 2.076627016067505, 2.3971595764160156, 2.7176923751831055, 3.038224935531616, 3.358757495880127, 3.6792900562286377, 3.9998226165771484, 4.320355415344238, 4.640888214111328, 4.96142053604126, 5.28195333480835, 5.602485656738281, 5.923018455505371, 6.243551254272461, 6.564083576202393, 6.884616374969482, 7.205148696899414, 7.525681495666504, 7.846214294433594, 8.166747093200684, 8.487279891967773, 8.807812690734863, 9.128345489501953, 9.448877334594727, 9.769410133361816, 10.089942932128906, 10.410475730895996, 10.731008529663086, 11.05154037475586]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 8.0, 10.0, 12.0, 21.0, 30.0, 50.0, 84.0, 104.0, 164.0, 229.0, 383.0, 563.0, 849.0, 1345.0, 2115.0, 3398.0, 5708.0, 9424.0, 16976.0, 31351.0, 61446.0, 127985.0, 280279.0, 598047.0, 1006224.0, 980716.0, 563688.0, 262340.0, 118864.0, 56039.0, 28789.0, 15238.0, 8478.0, 4958.0, 2971.0, 1809.0, 1201.0, 747.0, 531.0, 362.0, 224.0, 152.0, 124.0, 72.0, 54.0, 38.0, 36.0, 17.0, 12.0, 9.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.5546875, -14.08447265625, -13.6142578125, -13.14404296875, -12.673828125, -12.20361328125, -11.7333984375, -11.26318359375, -10.79296875, -10.32275390625, -9.8525390625, -9.38232421875, -8.912109375, -8.44189453125, -7.9716796875, -7.50146484375, -7.03125, -6.56103515625, -6.0908203125, -5.62060546875, -5.150390625, -4.68017578125, -4.2099609375, -3.73974609375, -3.26953125, -2.79931640625, -2.3291015625, -1.85888671875, -1.388671875, -0.91845703125, -0.4482421875, 0.02197265625, 0.4921875, 0.96240234375, 1.4326171875, 1.90283203125, 2.373046875, 2.84326171875, 3.3134765625, 3.78369140625, 4.25390625, 4.72412109375, 5.1943359375, 5.66455078125, 6.134765625, 6.60498046875, 7.0751953125, 7.54541015625, 8.015625, 8.48583984375, 8.9560546875, 9.42626953125, 9.896484375, 10.36669921875, 10.8369140625, 11.30712890625, 11.77734375, 12.24755859375, 12.7177734375, 13.18798828125, 13.658203125, 14.12841796875, 14.5986328125, 15.06884765625, 15.5390625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 8.0, 8.0, 14.0, 9.0, 16.0, 19.0, 15.0, 18.0, 13.0, 29.0, 38.0, 37.0, 30.0, 33.0, 35.0, 48.0, 40.0, 56.0, 54.0, 49.0, 33.0, 41.0, 39.0, 44.0, 38.0, 37.0, 31.0, 22.0, 28.0, 20.0, 15.0, 14.0, 9.0, 13.0, 14.0, 6.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.2109375, -8.928466796875, -8.64599609375, -8.363525390625, -8.0810546875, -7.798583984375, -7.51611328125, -7.233642578125, -6.951171875, -6.668701171875, -6.38623046875, -6.103759765625, -5.8212890625, -5.538818359375, -5.25634765625, -4.973876953125, -4.69140625, -4.408935546875, -4.12646484375, -3.843994140625, -3.5615234375, -3.279052734375, -2.99658203125, -2.714111328125, -2.431640625, -2.149169921875, -1.86669921875, -1.584228515625, -1.3017578125, -1.019287109375, -0.73681640625, -0.454345703125, -0.171875, 0.110595703125, 0.39306640625, 0.675537109375, 0.9580078125, 1.240478515625, 1.52294921875, 1.805419921875, 2.087890625, 2.370361328125, 2.65283203125, 2.935302734375, 3.2177734375, 3.500244140625, 3.78271484375, 4.065185546875, 4.34765625, 4.630126953125, 4.91259765625, 5.195068359375, 5.4775390625, 5.760009765625, 6.04248046875, 6.324951171875, 6.607421875, 6.889892578125, 7.17236328125, 7.454833984375, 7.7373046875, 8.019775390625, 8.30224609375, 8.584716796875, 8.8671875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 5.0, 8.0, 23.0, 21.0, 28.0, 42.0, 63.0, 98.0, 136.0, 228.0, 287.0, 387.0, 654.0, 969.0, 1512.0, 2106.0, 3286.0, 4928.0, 7638.0, 12014.0, 19088.0, 30690.0, 50803.0, 83565.0, 141096.0, 238625.0, 394770.0, 605324.0, 758746.0, 672638.0, 459994.0, 282319.0, 167193.0, 98806.0, 58852.0, 35864.0, 22115.0, 13829.0, 8836.0, 5646.0, 3624.0, 2397.0, 1645.0, 1041.0, 718.0, 507.0, 354.0, 226.0, 180.0, 112.0, 82.0, 60.0, 43.0, 33.0, 10.0, 15.0, 9.0, 4.0, 2.0, 2.0], "bins": [-14.109375, -13.6773681640625, -13.245361328125, -12.8133544921875, -12.38134765625, -11.9493408203125, -11.517333984375, -11.0853271484375, -10.6533203125, -10.2213134765625, -9.789306640625, -9.3572998046875, -8.92529296875, -8.4932861328125, -8.061279296875, -7.6292724609375, -7.197265625, -6.7652587890625, -6.333251953125, -5.9012451171875, -5.46923828125, -5.0372314453125, -4.605224609375, -4.1732177734375, -3.7412109375, -3.3092041015625, -2.877197265625, -2.4451904296875, -2.01318359375, -1.5811767578125, -1.149169921875, -0.7171630859375, -0.28515625, 0.1468505859375, 0.578857421875, 1.0108642578125, 1.44287109375, 1.8748779296875, 2.306884765625, 2.7388916015625, 3.1708984375, 3.6029052734375, 4.034912109375, 4.4669189453125, 4.89892578125, 5.3309326171875, 5.762939453125, 6.1949462890625, 6.626953125, 7.0589599609375, 7.490966796875, 7.9229736328125, 8.35498046875, 8.7869873046875, 9.218994140625, 9.6510009765625, 10.0830078125, 10.5150146484375, 10.947021484375, 11.3790283203125, 11.81103515625, 12.2430419921875, 12.675048828125, 13.1070556640625, 13.5390625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 7.0, 10.0, 8.0, 7.0, 14.0, 16.0, 23.0, 29.0, 31.0, 43.0, 50.0, 68.0, 99.0, 99.0, 139.0, 112.0, 196.0, 223.0, 233.0, 256.0, 257.0, 262.0, 247.0, 244.0, 220.0, 208.0, 204.0, 154.0, 123.0, 97.0, 97.0, 68.0, 48.0, 45.0, 35.0, 17.0, 20.0, 17.0, 12.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3671875, -5.20074462890625, -5.0343017578125, -4.86785888671875, -4.701416015625, -4.53497314453125, -4.3685302734375, -4.20208740234375, -4.03564453125, -3.86920166015625, -3.7027587890625, -3.53631591796875, -3.369873046875, -3.20343017578125, -3.0369873046875, -2.87054443359375, -2.7041015625, -2.53765869140625, -2.3712158203125, -2.20477294921875, -2.038330078125, -1.87188720703125, -1.7054443359375, -1.53900146484375, -1.37255859375, -1.20611572265625, -1.0396728515625, -0.87322998046875, -0.706787109375, -0.54034423828125, -0.3739013671875, -0.20745849609375, -0.041015625, 0.12542724609375, 0.2918701171875, 0.45831298828125, 0.624755859375, 0.79119873046875, 0.9576416015625, 1.12408447265625, 1.29052734375, 1.45697021484375, 1.6234130859375, 1.78985595703125, 1.956298828125, 2.12274169921875, 2.2891845703125, 2.45562744140625, 2.6220703125, 2.78851318359375, 2.9549560546875, 3.12139892578125, 3.287841796875, 3.45428466796875, 3.6207275390625, 3.78717041015625, 3.95361328125, 4.12005615234375, 4.2864990234375, 4.45294189453125, 4.619384765625, 4.78582763671875, 4.9522705078125, 5.11871337890625, 5.28515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 9.0, 2.0, 4.0, 6.0, 11.0, 10.0, 10.0, 10.0, 18.0, 26.0, 32.0, 29.0, 35.0, 46.0, 50.0, 33.0, 57.0, 43.0, 53.0, 58.0, 41.0, 64.0, 53.0, 34.0, 31.0, 34.0, 27.0, 32.0, 25.0, 24.0, 18.0, 19.0, 13.0, 13.0, 7.0, 6.0, 8.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.737723350524902, -15.2180757522583, -14.698427200317383, -14.178779602050781, -13.65913200378418, -13.139483451843262, -12.61983585357666, -12.100187301635742, -11.58053970336914, -11.060892105102539, -10.541243553161621, -10.02159595489502, -9.501947402954102, -8.9822998046875, -8.462652206420898, -7.943004131317139, -7.423356056213379, -6.903707981109619, -6.384059906005859, -5.864412307739258, -5.344764232635498, -4.825116157531738, -4.305468559265137, -3.785820484161377, -3.266172409057617, -2.7465243339538574, -2.2268764972686768, -1.7072285413742065, -1.1875805854797363, -0.6679325103759766, -0.1482846736907959, 0.37136316299438477, 0.8910102844238281, 1.4106582403182983, 1.9303061962127686, 2.449954032897949, 2.969602108001709, 3.4892501831054688, 4.00889778137207, 4.52854585647583, 5.04819393157959, 5.56784200668335, 6.087490081787109, 6.607137680053711, 7.126785755157471, 7.6464338302612305, 8.166081428527832, 8.68572998046875, 9.205377578735352, 9.725025177001953, 10.244673728942871, 10.764321327209473, 11.28396987915039, 11.803617477416992, 12.323265075683594, 12.842912673950195, 13.362561225891113, 13.882208824157715, 14.401857376098633, 14.921504974365234, 15.441152572631836, 15.960801124572754, 16.480449676513672, 17.000097274780273, 17.519744873046875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 4.0, 5.0, 10.0, 9.0, 14.0, 16.0, 24.0, 22.0, 19.0, 26.0, 34.0, 20.0, 31.0, 28.0, 37.0, 37.0, 28.0, 55.0, 45.0, 47.0, 43.0, 45.0, 36.0, 32.0, 37.0, 41.0, 26.0, 21.0, 23.0, 33.0, 25.0, 28.0, 21.0, 11.0, 14.0, 11.0, 7.0, 11.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.929536819458008, -10.570655822753906, -10.211775779724121, -9.852895736694336, -9.494014739990234, -9.135133743286133, -8.776253700256348, -8.417373657226562, -8.058492660522461, -7.699612140655518, -7.340731620788574, -6.981851100921631, -6.6229705810546875, -6.264090061187744, -5.905209541320801, -5.546329021453857, -5.187448501586914, -4.828567981719971, -4.469687461853027, -4.110806941986084, -3.7519264221191406, -3.3930459022521973, -3.034165382385254, -2.6752848625183105, -2.316404342651367, -1.9575238227844238, -1.5986433029174805, -1.239762783050537, -0.8808822631835938, -0.5220017433166504, -0.16312122344970703, 0.19575929641723633, 0.5546388626098633, 0.9135193824768066, 1.27239990234375, 1.6312804222106934, 1.9901609420776367, 2.34904146194458, 2.7079219818115234, 3.066802501678467, 3.42568302154541, 3.7845635414123535, 4.143444061279297, 4.50232458114624, 4.861205101013184, 5.220085620880127, 5.57896614074707, 5.937846660614014, 6.296727180480957, 6.6556077003479, 7.014488220214844, 7.373368740081787, 7.7322492599487305, 8.091129302978516, 8.450010299682617, 8.808891296386719, 9.167771339416504, 9.526651382446289, 9.88553237915039, 10.244413375854492, 10.603293418884277, 10.962173461914062, 11.321054458618164, 11.679935455322266, 12.03881549835205]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 12.0, 12.0, 25.0, 27.0, 41.0, 68.0, 99.0, 122.0, 214.0, 324.0, 484.0, 756.0, 1237.0, 2129.0, 3589.0, 6114.0, 10877.0, 19935.0, 35607.0, 62420.0, 104786.0, 157879.0, 190791.0, 169648.0, 117184.0, 71038.0, 40797.0, 22650.0, 12516.0, 7133.0, 3886.0, 2297.0, 1403.0, 920.0, 518.0, 353.0, 219.0, 135.0, 85.0, 69.0, 48.0, 30.0, 22.0, 10.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.6796875, -9.363525390625, -9.04736328125, -8.731201171875, -8.4150390625, -8.098876953125, -7.78271484375, -7.466552734375, -7.150390625, -6.834228515625, -6.51806640625, -6.201904296875, -5.8857421875, -5.569580078125, -5.25341796875, -4.937255859375, -4.62109375, -4.304931640625, -3.98876953125, -3.672607421875, -3.3564453125, -3.040283203125, -2.72412109375, -2.407958984375, -2.091796875, -1.775634765625, -1.45947265625, -1.143310546875, -0.8271484375, -0.510986328125, -0.19482421875, 0.121337890625, 0.4375, 0.753662109375, 1.06982421875, 1.385986328125, 1.7021484375, 2.018310546875, 2.33447265625, 2.650634765625, 2.966796875, 3.282958984375, 3.59912109375, 3.915283203125, 4.2314453125, 4.547607421875, 4.86376953125, 5.179931640625, 5.49609375, 5.812255859375, 6.12841796875, 6.444580078125, 6.7607421875, 7.076904296875, 7.39306640625, 7.709228515625, 8.025390625, 8.341552734375, 8.65771484375, 8.973876953125, 9.2900390625, 9.606201171875, 9.92236328125, 10.238525390625, 10.5546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 6.0, 11.0, 16.0, 10.0, 14.0, 24.0, 22.0, 22.0, 28.0, 23.0, 32.0, 27.0, 33.0, 41.0, 47.0, 39.0, 52.0, 39.0, 29.0, 41.0, 43.0, 42.0, 45.0, 35.0, 46.0, 33.0, 23.0, 25.0, 20.0, 27.0, 22.0, 19.0, 12.0, 9.0, 7.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.96875, -11.5711669921875, -11.173583984375, -10.7760009765625, -10.37841796875, -9.9808349609375, -9.583251953125, -9.1856689453125, -8.7880859375, -8.3905029296875, -7.992919921875, -7.5953369140625, -7.19775390625, -6.8001708984375, -6.402587890625, -6.0050048828125, -5.607421875, -5.2098388671875, -4.812255859375, -4.4146728515625, -4.01708984375, -3.6195068359375, -3.221923828125, -2.8243408203125, -2.4267578125, -2.0291748046875, -1.631591796875, -1.2340087890625, -0.83642578125, -0.4388427734375, -0.041259765625, 0.3563232421875, 0.75390625, 1.1514892578125, 1.549072265625, 1.9466552734375, 2.34423828125, 2.7418212890625, 3.139404296875, 3.5369873046875, 3.9345703125, 4.3321533203125, 4.729736328125, 5.1273193359375, 5.52490234375, 5.9224853515625, 6.320068359375, 6.7176513671875, 7.115234375, 7.5128173828125, 7.910400390625, 8.3079833984375, 8.70556640625, 9.1031494140625, 9.500732421875, 9.8983154296875, 10.2958984375, 10.6934814453125, 11.091064453125, 11.4886474609375, 11.88623046875, 12.2838134765625, 12.681396484375, 13.0789794921875, 13.4765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 25.0, 29.0, 46.0, 57.0, 71.0, 94.0, 147.0, 199.0, 263.0, 397.0, 546.0, 895.0, 1376.0, 2256.0, 3742.0, 6904.0, 13263.0, 27013.0, 59433.0, 130989.0, 251628.0, 269468.0, 148486.0, 67273.0, 30415.0, 14717.0, 7671.0, 4248.0, 2354.0, 1555.0, 939.0, 635.0, 434.0, 272.0, 187.0, 153.0, 118.0, 72.0, 53.0, 37.0, 23.0, 18.0, 9.0, 4.0, 6.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.078125, -16.5618896484375, -16.045654296875, -15.5294189453125, -15.01318359375, -14.4969482421875, -13.980712890625, -13.4644775390625, -12.9482421875, -12.4320068359375, -11.915771484375, -11.3995361328125, -10.88330078125, -10.3670654296875, -9.850830078125, -9.3345947265625, -8.818359375, -8.3021240234375, -7.785888671875, -7.2696533203125, -6.75341796875, -6.2371826171875, -5.720947265625, -5.2047119140625, -4.6884765625, -4.1722412109375, -3.656005859375, -3.1397705078125, -2.62353515625, -2.1072998046875, -1.591064453125, -1.0748291015625, -0.55859375, -0.0423583984375, 0.473876953125, 0.9901123046875, 1.50634765625, 2.0225830078125, 2.538818359375, 3.0550537109375, 3.5712890625, 4.0875244140625, 4.603759765625, 5.1199951171875, 5.63623046875, 6.1524658203125, 6.668701171875, 7.1849365234375, 7.701171875, 8.2174072265625, 8.733642578125, 9.2498779296875, 9.76611328125, 10.2823486328125, 10.798583984375, 11.3148193359375, 11.8310546875, 12.3472900390625, 12.863525390625, 13.3797607421875, 13.89599609375, 14.4122314453125, 14.928466796875, 15.4447021484375, 15.9609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 4.0, 9.0, 10.0, 5.0, 8.0, 17.0, 14.0, 16.0, 18.0, 22.0, 33.0, 36.0, 27.0, 31.0, 26.0, 45.0, 29.0, 29.0, 49.0, 28.0, 44.0, 44.0, 42.0, 42.0, 34.0, 47.0, 27.0, 26.0, 39.0, 27.0, 23.0, 24.0, 19.0, 16.0, 17.0, 24.0, 11.0, 6.0, 5.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.1953125, -6.96746826171875, -6.7396240234375, -6.51177978515625, -6.283935546875, -6.05609130859375, -5.8282470703125, -5.60040283203125, -5.37255859375, -5.14471435546875, -4.9168701171875, -4.68902587890625, -4.461181640625, -4.23333740234375, -4.0054931640625, -3.77764892578125, -3.5498046875, -3.32196044921875, -3.0941162109375, -2.86627197265625, -2.638427734375, -2.41058349609375, -2.1827392578125, -1.95489501953125, -1.72705078125, -1.49920654296875, -1.2713623046875, -1.04351806640625, -0.815673828125, -0.58782958984375, -0.3599853515625, -0.13214111328125, 0.095703125, 0.32354736328125, 0.5513916015625, 0.77923583984375, 1.007080078125, 1.23492431640625, 1.4627685546875, 1.69061279296875, 1.91845703125, 2.14630126953125, 2.3741455078125, 2.60198974609375, 2.829833984375, 3.05767822265625, 3.2855224609375, 3.51336669921875, 3.7412109375, 3.96905517578125, 4.1968994140625, 4.42474365234375, 4.652587890625, 4.88043212890625, 5.1082763671875, 5.33612060546875, 5.56396484375, 5.79180908203125, 6.0196533203125, 6.24749755859375, 6.475341796875, 6.70318603515625, 6.9310302734375, 7.15887451171875, 7.38671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 15.0, 23.0, 33.0, 61.0, 87.0, 113.0, 153.0, 257.0, 370.0, 606.0, 899.0, 1450.0, 2319.0, 3905.0, 6788.0, 12162.0, 22542.0, 42815.0, 84211.0, 159953.0, 250112.0, 211567.0, 117733.0, 60276.0, 31072.0, 16448.0, 9134.0, 5256.0, 3073.0, 1831.0, 1219.0, 717.0, 450.0, 304.0, 193.0, 139.0, 65.0, 59.0, 43.0, 29.0, 26.0, 13.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8359375, -8.566162109375, -8.29638671875, -8.026611328125, -7.7568359375, -7.487060546875, -7.21728515625, -6.947509765625, -6.677734375, -6.407958984375, -6.13818359375, -5.868408203125, -5.5986328125, -5.328857421875, -5.05908203125, -4.789306640625, -4.51953125, -4.249755859375, -3.97998046875, -3.710205078125, -3.4404296875, -3.170654296875, -2.90087890625, -2.631103515625, -2.361328125, -2.091552734375, -1.82177734375, -1.552001953125, -1.2822265625, -1.012451171875, -0.74267578125, -0.472900390625, -0.203125, 0.066650390625, 0.33642578125, 0.606201171875, 0.8759765625, 1.145751953125, 1.41552734375, 1.685302734375, 1.955078125, 2.224853515625, 2.49462890625, 2.764404296875, 3.0341796875, 3.303955078125, 3.57373046875, 3.843505859375, 4.11328125, 4.383056640625, 4.65283203125, 4.922607421875, 5.1923828125, 5.462158203125, 5.73193359375, 6.001708984375, 6.271484375, 6.541259765625, 6.81103515625, 7.080810546875, 7.3505859375, 7.620361328125, 7.89013671875, 8.159912109375, 8.4296875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 11.0, 13.0, 13.0, 8.0, 20.0, 25.0, 28.0, 25.0, 41.0, 52.0, 58.0, 53.0, 56.0, 52.0, 57.0, 45.0, 60.0, 44.0, 51.0, 43.0, 27.0, 25.0, 30.0, 22.0, 30.0, 13.0, 8.0, 10.0, 7.0, 9.0, 8.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003669261932373047, -0.0003559477627277374, -0.00034496933221817017, -0.0003339909017086029, -0.00032301247119903564, -0.0003120340406894684, -0.0003010556101799011, -0.00029007717967033386, -0.0002790987491607666, -0.00026812031865119934, -0.0002571418881416321, -0.0002461634576320648, -0.00023518502712249756, -0.0002242065966129303, -0.00021322816610336304, -0.00020224973559379578, -0.00019127130508422852, -0.00018029287457466125, -0.000169314444065094, -0.00015833601355552673, -0.00014735758304595947, -0.0001363791525363922, -0.00012540072202682495, -0.00011442229151725769, -0.00010344386100769043, -9.246543049812317e-05, -8.148699998855591e-05, -7.050856947898865e-05, -5.953013896942139e-05, -4.8551708459854126e-05, -3.7573277950286865e-05, -2.6594847440719604e-05, -1.5616416931152344e-05, -4.637986421585083e-06, 6.340444087982178e-06, 1.731887459754944e-05, 2.82973051071167e-05, 3.927573561668396e-05, 5.025416612625122e-05, 6.123259663581848e-05, 7.221102714538574e-05, 8.3189457654953e-05, 9.416788816452026e-05, 0.00010514631867408752, 0.00011612474918365479, 0.00012710317969322205, 0.0001380816102027893, 0.00014906004071235657, 0.00016003847122192383, 0.0001710169017314911, 0.00018199533224105835, 0.0001929737627506256, 0.00020395219326019287, 0.00021493062376976013, 0.0002259090542793274, 0.00023688748478889465, 0.0002478659152984619, 0.0002588443458080292, 0.00026982277631759644, 0.0002808012068271637, 0.00029177963733673096, 0.0003027580678462982, 0.0003137364983558655, 0.00032471492886543274, 0.000335693359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 6.0, 12.0, 16.0, 28.0, 43.0, 48.0, 58.0, 98.0, 148.0, 251.0, 345.0, 511.0, 717.0, 1091.0, 1677.0, 2530.0, 3900.0, 6081.0, 9485.0, 14656.0, 22544.0, 35184.0, 54383.0, 81787.0, 115935.0, 146723.0, 152256.0, 127303.0, 92739.0, 62729.0, 40810.0, 26251.0, 16824.0, 10860.0, 7131.0, 4617.0, 2939.0, 2034.0, 1266.0, 783.0, 522.0, 368.0, 289.0, 171.0, 123.0, 93.0, 65.0, 45.0, 23.0, 17.0, 16.0, 8.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.7109375, -6.5023193359375, -6.293701171875, -6.0850830078125, -5.87646484375, -5.6678466796875, -5.459228515625, -5.2506103515625, -5.0419921875, -4.8333740234375, -4.624755859375, -4.4161376953125, -4.20751953125, -3.9989013671875, -3.790283203125, -3.5816650390625, -3.373046875, -3.1644287109375, -2.955810546875, -2.7471923828125, -2.53857421875, -2.3299560546875, -2.121337890625, -1.9127197265625, -1.7041015625, -1.4954833984375, -1.286865234375, -1.0782470703125, -0.86962890625, -0.6610107421875, -0.452392578125, -0.2437744140625, -0.03515625, 0.1734619140625, 0.382080078125, 0.5906982421875, 0.79931640625, 1.0079345703125, 1.216552734375, 1.4251708984375, 1.6337890625, 1.8424072265625, 2.051025390625, 2.2596435546875, 2.46826171875, 2.6768798828125, 2.885498046875, 3.0941162109375, 3.302734375, 3.5113525390625, 3.719970703125, 3.9285888671875, 4.13720703125, 4.3458251953125, 4.554443359375, 4.7630615234375, 4.9716796875, 5.1802978515625, 5.388916015625, 5.5975341796875, 5.80615234375, 6.0147705078125, 6.223388671875, 6.4320068359375, 6.640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 6.0, 12.0, 7.0, 20.0, 15.0, 18.0, 33.0, 37.0, 50.0, 49.0, 54.0, 81.0, 74.0, 75.0, 80.0, 71.0, 58.0, 54.0, 51.0, 30.0, 36.0, 23.0, 16.0, 17.0, 4.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7265625, -2.624664306640625, -2.52276611328125, -2.420867919921875, -2.3189697265625, -2.217071533203125, -2.11517333984375, -2.013275146484375, -1.911376953125, -1.809478759765625, -1.70758056640625, -1.605682373046875, -1.5037841796875, -1.401885986328125, -1.29998779296875, -1.198089599609375, -1.09619140625, -0.994293212890625, -0.89239501953125, -0.790496826171875, -0.6885986328125, -0.586700439453125, -0.48480224609375, -0.382904052734375, -0.281005859375, -0.179107666015625, -0.07720947265625, 0.024688720703125, 0.1265869140625, 0.228485107421875, 0.33038330078125, 0.432281494140625, 0.5341796875, 0.636077880859375, 0.73797607421875, 0.839874267578125, 0.9417724609375, 1.043670654296875, 1.14556884765625, 1.247467041015625, 1.349365234375, 1.451263427734375, 1.55316162109375, 1.655059814453125, 1.7569580078125, 1.858856201171875, 1.96075439453125, 2.062652587890625, 2.16455078125, 2.266448974609375, 2.36834716796875, 2.470245361328125, 2.5721435546875, 2.674041748046875, 2.77593994140625, 2.877838134765625, 2.979736328125, 3.081634521484375, 3.18353271484375, 3.285430908203125, 3.3873291015625, 3.489227294921875, 3.59112548828125, 3.693023681640625, 3.794921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 8.0, 16.0, 23.0, 25.0, 33.0, 38.0, 27.0, 43.0, 51.0, 48.0, 40.0, 64.0, 57.0, 57.0, 51.0, 63.0, 53.0, 33.0, 39.0, 21.0, 30.0, 27.0, 26.0, 22.0, 22.0, 15.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.555696487426758, -16.001737594604492, -15.44778060913086, -14.89382266998291, -14.339864730834961, -13.785905838012695, -13.231947898864746, -12.677989959716797, -12.124032020568848, -11.570074081420898, -11.01611614227295, -10.462158203125, -9.908199310302734, -9.354242324829102, -8.800283432006836, -8.246325492858887, -7.6923675537109375, -7.138409614562988, -6.584451675415039, -6.030493259429932, -5.476535320281982, -4.922577381134033, -4.368618965148926, -3.8146610260009766, -3.2607030868530273, -2.706745147705078, -2.15278697013855, -1.598828911781311, -1.0448708534240723, -0.49091291427612305, 0.06304526329040527, 0.6170034408569336, 1.1709613800048828, 1.7249194383621216, 2.2788774967193604, 2.8328356742858887, 3.386793613433838, 3.940751552581787, 4.4947099685668945, 5.048667907714844, 5.602625846862793, 6.156583786010742, 6.710541725158691, 7.264500141143799, 7.818458080291748, 8.372415542602539, 8.926374435424805, 9.480332374572754, 10.034290313720703, 10.588248252868652, 11.142206192016602, 11.69616413116455, 12.2501220703125, 12.804080963134766, 13.358038902282715, 13.911996841430664, 14.465954780578613, 15.019912719726562, 15.573870658874512, 16.12782859802246, 16.681787490844727, 17.23574447631836, 17.789703369140625, 18.34366226196289, 18.897619247436523]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 7.0, 5.0, 9.0, 17.0, 15.0, 12.0, 21.0, 23.0, 29.0, 23.0, 20.0, 33.0, 26.0, 36.0, 37.0, 25.0, 37.0, 47.0, 31.0, 48.0, 48.0, 40.0, 47.0, 27.0, 30.0, 47.0, 30.0, 17.0, 27.0, 20.0, 28.0, 27.0, 24.0, 15.0, 14.0, 9.0, 7.0, 10.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.247703552246094, -9.898707389831543, -9.549710273742676, -9.200714111328125, -8.851716995239258, -8.502720832824707, -8.153724670410156, -7.804727554321289, -7.45573091506958, -7.106734275817871, -6.757737636566162, -6.408740997314453, -6.059744834899902, -5.710747718811035, -5.361751556396484, -5.012754917144775, -4.663758277893066, -4.314761638641357, -3.9657649993896484, -3.6167685985565186, -3.2677719593048096, -2.9187753200531006, -2.5697789192199707, -2.2207822799682617, -1.8717856407165527, -1.5227890014648438, -1.1737924814224243, -0.8247959613800049, -0.4757993221282959, -0.12680268287658691, 0.22219371795654297, 0.571190357208252, 0.9201879501342773, 1.2691845893859863, 1.6181811094284058, 1.9671776294708252, 2.316174268722534, 2.665170907974243, 3.014167308807373, 3.363163948059082, 3.712160587310791, 4.0611572265625, 4.410153865814209, 4.759150505065918, 5.108146667480469, 5.457143783569336, 5.806139945983887, 6.155136585235596, 6.504133224487305, 6.853129863739014, 7.202126502990723, 7.551122665405273, 7.900119781494141, 8.249115943908691, 8.598112106323242, 8.94710922241211, 9.296106338500977, 9.645102500915527, 9.994099617004395, 10.343095779418945, 10.692092895507812, 11.041089057922363, 11.390085220336914, 11.739082336425781, 12.088078498840332]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 10.0, 20.0, 19.0, 34.0, 50.0, 74.0, 96.0, 164.0, 219.0, 329.0, 476.0, 666.0, 1045.0, 1485.0, 2261.0, 3399.0, 5284.0, 8337.0, 13116.0, 20766.0, 32776.0, 50739.0, 77192.0, 107672.0, 135619.0, 145180.0, 131824.0, 103735.0, 73095.0, 47753.0, 30643.0, 19375.0, 12319.0, 7819.0, 5022.0, 3309.0, 2133.0, 1519.0, 978.0, 596.0, 438.0, 309.0, 219.0, 122.0, 110.0, 64.0, 41.0, 34.0, 15.0, 12.0, 14.0, 15.0, 8.0, 4.0, 8.0, 2.0], "bins": [-9.953125, -9.6553955078125, -9.357666015625, -9.0599365234375, -8.76220703125, -8.4644775390625, -8.166748046875, -7.8690185546875, -7.5712890625, -7.2735595703125, -6.975830078125, -6.6781005859375, -6.38037109375, -6.0826416015625, -5.784912109375, -5.4871826171875, -5.189453125, -4.8917236328125, -4.593994140625, -4.2962646484375, -3.99853515625, -3.7008056640625, -3.403076171875, -3.1053466796875, -2.8076171875, -2.5098876953125, -2.212158203125, -1.9144287109375, -1.61669921875, -1.3189697265625, -1.021240234375, -0.7235107421875, -0.42578125, -0.1280517578125, 0.169677734375, 0.4674072265625, 0.76513671875, 1.0628662109375, 1.360595703125, 1.6583251953125, 1.9560546875, 2.2537841796875, 2.551513671875, 2.8492431640625, 3.14697265625, 3.4447021484375, 3.742431640625, 4.0401611328125, 4.337890625, 4.6356201171875, 4.933349609375, 5.2310791015625, 5.52880859375, 5.8265380859375, 6.124267578125, 6.4219970703125, 6.7197265625, 7.0174560546875, 7.315185546875, 7.6129150390625, 7.91064453125, 8.2083740234375, 8.506103515625, 8.8038330078125, 9.1015625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 2.0, 7.0, 4.0, 4.0, 11.0, 10.0, 13.0, 13.0, 13.0, 16.0, 24.0, 19.0, 20.0, 27.0, 29.0, 43.0, 31.0, 29.0, 37.0, 41.0, 44.0, 32.0, 47.0, 38.0, 44.0, 37.0, 43.0, 31.0, 34.0, 24.0, 30.0, 37.0, 21.0, 18.0, 34.0, 13.0, 17.0, 15.0, 8.0, 4.0, 12.0, 3.0, 5.0, 8.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4609375, -11.095458984375, -10.72998046875, -10.364501953125, -9.9990234375, -9.633544921875, -9.26806640625, -8.902587890625, -8.537109375, -8.171630859375, -7.80615234375, -7.440673828125, -7.0751953125, -6.709716796875, -6.34423828125, -5.978759765625, -5.61328125, -5.247802734375, -4.88232421875, -4.516845703125, -4.1513671875, -3.785888671875, -3.42041015625, -3.054931640625, -2.689453125, -2.323974609375, -1.95849609375, -1.593017578125, -1.2275390625, -0.862060546875, -0.49658203125, -0.131103515625, 0.234375, 0.599853515625, 0.96533203125, 1.330810546875, 1.6962890625, 2.061767578125, 2.42724609375, 2.792724609375, 3.158203125, 3.523681640625, 3.88916015625, 4.254638671875, 4.6201171875, 4.985595703125, 5.35107421875, 5.716552734375, 6.08203125, 6.447509765625, 6.81298828125, 7.178466796875, 7.5439453125, 7.909423828125, 8.27490234375, 8.640380859375, 9.005859375, 9.371337890625, 9.73681640625, 10.102294921875, 10.4677734375, 10.833251953125, 11.19873046875, 11.564208984375, 11.9296875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 15.0, 27.0, 31.0, 45.0, 46.0, 78.0, 101.0, 160.0, 232.0, 348.0, 477.0, 768.0, 1110.0, 1716.0, 2714.0, 4450.0, 7117.0, 12344.0, 20384.0, 34516.0, 58501.0, 93953.0, 138192.0, 169249.0, 163897.0, 126900.0, 84158.0, 51128.0, 30288.0, 17785.0, 10431.0, 6251.0, 3929.0, 2496.0, 1542.0, 1066.0, 690.0, 456.0, 295.0, 198.0, 146.0, 93.0, 81.0, 51.0, 34.0, 24.0, 11.0, 10.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8203125, -12.405029296875, -11.98974609375, -11.574462890625, -11.1591796875, -10.743896484375, -10.32861328125, -9.913330078125, -9.498046875, -9.082763671875, -8.66748046875, -8.252197265625, -7.8369140625, -7.421630859375, -7.00634765625, -6.591064453125, -6.17578125, -5.760498046875, -5.34521484375, -4.929931640625, -4.5146484375, -4.099365234375, -3.68408203125, -3.268798828125, -2.853515625, -2.438232421875, -2.02294921875, -1.607666015625, -1.1923828125, -0.777099609375, -0.36181640625, 0.053466796875, 0.46875, 0.884033203125, 1.29931640625, 1.714599609375, 2.1298828125, 2.545166015625, 2.96044921875, 3.375732421875, 3.791015625, 4.206298828125, 4.62158203125, 5.036865234375, 5.4521484375, 5.867431640625, 6.28271484375, 6.697998046875, 7.11328125, 7.528564453125, 7.94384765625, 8.359130859375, 8.7744140625, 9.189697265625, 9.60498046875, 10.020263671875, 10.435546875, 10.850830078125, 11.26611328125, 11.681396484375, 12.0966796875, 12.511962890625, 12.92724609375, 13.342529296875, 13.7578125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 7.0, 5.0, 7.0, 9.0, 13.0, 10.0, 13.0, 9.0, 22.0, 21.0, 20.0, 25.0, 24.0, 28.0, 28.0, 37.0, 33.0, 30.0, 35.0, 37.0, 41.0, 44.0, 37.0, 44.0, 36.0, 40.0, 47.0, 30.0, 28.0, 32.0, 29.0, 26.0, 19.0, 24.0, 14.0, 14.0, 11.0, 14.0, 10.0, 8.0, 9.0, 7.0, 4.0, 6.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-8.4609375, -8.2200927734375, -7.979248046875, -7.7384033203125, -7.49755859375, -7.2567138671875, -7.015869140625, -6.7750244140625, -6.5341796875, -6.2933349609375, -6.052490234375, -5.8116455078125, -5.57080078125, -5.3299560546875, -5.089111328125, -4.8482666015625, -4.607421875, -4.3665771484375, -4.125732421875, -3.8848876953125, -3.64404296875, -3.4031982421875, -3.162353515625, -2.9215087890625, -2.6806640625, -2.4398193359375, -2.198974609375, -1.9581298828125, -1.71728515625, -1.4764404296875, -1.235595703125, -0.9947509765625, -0.75390625, -0.5130615234375, -0.272216796875, -0.0313720703125, 0.20947265625, 0.4503173828125, 0.691162109375, 0.9320068359375, 1.1728515625, 1.4136962890625, 1.654541015625, 1.8953857421875, 2.13623046875, 2.3770751953125, 2.617919921875, 2.8587646484375, 3.099609375, 3.3404541015625, 3.581298828125, 3.8221435546875, 4.06298828125, 4.3038330078125, 4.544677734375, 4.7855224609375, 5.0263671875, 5.2672119140625, 5.508056640625, 5.7489013671875, 5.98974609375, 6.2305908203125, 6.471435546875, 6.7122802734375, 6.953125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 8.0, 10.0, 17.0, 22.0, 26.0, 42.0, 57.0, 87.0, 101.0, 172.0, 205.0, 399.0, 543.0, 831.0, 1358.0, 2066.0, 3471.0, 6099.0, 11566.0, 24178.0, 55334.0, 134284.0, 267148.0, 277911.0, 146796.0, 60966.0, 25854.0, 12401.0, 6531.0, 3805.0, 2380.0, 1369.0, 834.0, 570.0, 330.0, 242.0, 191.0, 121.0, 70.0, 49.0, 28.0, 22.0, 17.0, 9.0, 6.0, 8.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.09375, -11.7164306640625, -11.339111328125, -10.9617919921875, -10.58447265625, -10.2071533203125, -9.829833984375, -9.4525146484375, -9.0751953125, -8.6978759765625, -8.320556640625, -7.9432373046875, -7.56591796875, -7.1885986328125, -6.811279296875, -6.4339599609375, -6.056640625, -5.6793212890625, -5.302001953125, -4.9246826171875, -4.54736328125, -4.1700439453125, -3.792724609375, -3.4154052734375, -3.0380859375, -2.6607666015625, -2.283447265625, -1.9061279296875, -1.52880859375, -1.1514892578125, -0.774169921875, -0.3968505859375, -0.01953125, 0.3577880859375, 0.735107421875, 1.1124267578125, 1.48974609375, 1.8670654296875, 2.244384765625, 2.6217041015625, 2.9990234375, 3.3763427734375, 3.753662109375, 4.1309814453125, 4.50830078125, 4.8856201171875, 5.262939453125, 5.6402587890625, 6.017578125, 6.3948974609375, 6.772216796875, 7.1495361328125, 7.52685546875, 7.9041748046875, 8.281494140625, 8.6588134765625, 9.0361328125, 9.4134521484375, 9.790771484375, 10.1680908203125, 10.54541015625, 10.9227294921875, 11.300048828125, 11.6773681640625, 12.0546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 11.0, 27.0, 37.0, 73.0, 114.0, 150.0, 163.0, 127.0, 91.0, 67.0, 37.0, 21.0, 19.0, 11.0, 13.0, 4.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001922607421875, -0.0018632113933563232, -0.0018038153648376465, -0.0017444193363189697, -0.001685023307800293, -0.0016256272792816162, -0.0015662312507629395, -0.0015068352222442627, -0.001447439193725586, -0.0013880431652069092, -0.0013286471366882324, -0.0012692511081695557, -0.001209855079650879, -0.0011504590511322021, -0.0010910630226135254, -0.0010316669940948486, -0.0009722709655761719, -0.0009128749370574951, -0.0008534789085388184, -0.0007940828800201416, -0.0007346868515014648, -0.0006752908229827881, -0.0006158947944641113, -0.0005564987659454346, -0.0004971027374267578, -0.00043770670890808105, -0.0003783106803894043, -0.00031891465187072754, -0.0002595186233520508, -0.00020012259483337402, -0.00014072656631469727, -8.133053779602051e-05, -2.193450927734375e-05, 3.746151924133301e-05, 9.685754776000977e-05, 0.00015625357627868652, 0.00021564960479736328, 0.00027504563331604004, 0.0003344416618347168, 0.00039383769035339355, 0.0004532337188720703, 0.0005126297473907471, 0.0005720257759094238, 0.0006314218044281006, 0.0006908178329467773, 0.0007502138614654541, 0.0008096098899841309, 0.0008690059185028076, 0.0009284019470214844, 0.0009877979755401611, 0.0010471940040588379, 0.0011065900325775146, 0.0011659860610961914, 0.0012253820896148682, 0.001284778118133545, 0.0013441741466522217, 0.0014035701751708984, 0.0014629662036895752, 0.001522362232208252, 0.0015817582607269287, 0.0016411542892456055, 0.0017005503177642822, 0.001759946346282959, 0.0018193423748016357, 0.0018787384033203125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 22.0, 20.0, 40.0, 83.0, 116.0, 169.0, 267.0, 377.0, 586.0, 966.0, 1442.0, 2272.0, 3472.0, 5558.0, 9366.0, 16246.0, 30954.0, 63120.0, 129424.0, 220829.0, 240451.0, 157999.0, 78078.0, 38363.0, 19617.0, 10934.0, 6535.0, 3902.0, 2570.0, 1605.0, 1032.0, 747.0, 442.0, 328.0, 198.0, 148.0, 89.0, 60.0, 31.0, 31.0, 21.0, 8.0, 3.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.189208984375, -8.86279296875, -8.536376953125, -8.2099609375, -7.883544921875, -7.55712890625, -7.230712890625, -6.904296875, -6.577880859375, -6.25146484375, -5.925048828125, -5.5986328125, -5.272216796875, -4.94580078125, -4.619384765625, -4.29296875, -3.966552734375, -3.64013671875, -3.313720703125, -2.9873046875, -2.660888671875, -2.33447265625, -2.008056640625, -1.681640625, -1.355224609375, -1.02880859375, -0.702392578125, -0.3759765625, -0.049560546875, 0.27685546875, 0.603271484375, 0.9296875, 1.256103515625, 1.58251953125, 1.908935546875, 2.2353515625, 2.561767578125, 2.88818359375, 3.214599609375, 3.541015625, 3.867431640625, 4.19384765625, 4.520263671875, 4.8466796875, 5.173095703125, 5.49951171875, 5.825927734375, 6.15234375, 6.478759765625, 6.80517578125, 7.131591796875, 7.4580078125, 7.784423828125, 8.11083984375, 8.437255859375, 8.763671875, 9.090087890625, 9.41650390625, 9.742919921875, 10.0693359375, 10.395751953125, 10.72216796875, 11.048583984375, 11.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 12.0, 27.0, 17.0, 30.0, 20.0, 43.0, 63.0, 54.0, 68.0, 73.0, 71.0, 75.0, 90.0, 61.0, 54.0, 38.0, 39.0, 29.0, 13.0, 27.0, 13.0, 5.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.171875, -3.070404052734375, -2.96893310546875, -2.867462158203125, -2.7659912109375, -2.664520263671875, -2.56304931640625, -2.461578369140625, -2.360107421875, -2.258636474609375, -2.15716552734375, -2.055694580078125, -1.9542236328125, -1.852752685546875, -1.75128173828125, -1.649810791015625, -1.54833984375, -1.446868896484375, -1.34539794921875, -1.243927001953125, -1.1424560546875, -1.040985107421875, -0.93951416015625, -0.838043212890625, -0.736572265625, -0.635101318359375, -0.53363037109375, -0.432159423828125, -0.3306884765625, -0.229217529296875, -0.12774658203125, -0.026275634765625, 0.0751953125, 0.176666259765625, 0.27813720703125, 0.379608154296875, 0.4810791015625, 0.582550048828125, 0.68402099609375, 0.785491943359375, 0.886962890625, 0.988433837890625, 1.08990478515625, 1.191375732421875, 1.2928466796875, 1.394317626953125, 1.49578857421875, 1.597259521484375, 1.69873046875, 1.800201416015625, 1.90167236328125, 2.003143310546875, 2.1046142578125, 2.206085205078125, 2.30755615234375, 2.409027099609375, 2.510498046875, 2.611968994140625, 2.71343994140625, 2.814910888671875, 2.9163818359375, 3.017852783203125, 3.11932373046875, 3.220794677734375, 3.322265625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 3.0, 10.0, 8.0, 15.0, 14.0, 15.0, 20.0, 38.0, 23.0, 31.0, 45.0, 37.0, 58.0, 46.0, 42.0, 53.0, 55.0, 67.0, 62.0, 52.0, 42.0, 33.0, 32.0, 21.0, 34.0, 23.0, 24.0, 25.0, 18.0, 13.0, 6.0, 7.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.171552658081055, -17.60867691040039, -17.045801162719727, -16.48292350769043, -15.920047760009766, -15.357172012329102, -14.794296264648438, -14.231420516967773, -13.668543815612793, -13.105668067932129, -12.542791366577148, -11.979915618896484, -11.41703987121582, -10.85416316986084, -10.291287422180176, -9.728410720825195, -9.165534973144531, -8.602659225463867, -8.039782524108887, -7.476906776428223, -6.9140305519104, -6.351154327392578, -5.788278579711914, -5.225402355194092, -4.6625261306762695, -4.099649906158447, -3.536773920059204, -2.973897933959961, -2.4110217094421387, -1.8481454849243164, -1.2852694988250732, -0.7223935127258301, -0.159515380859375, 0.4033607244491577, 0.9662368297576904, 1.5291129350662231, 2.091989040374756, 2.654865264892578, 3.2177412509918213, 3.7806172370910645, 4.343493461608887, 4.906369686126709, 5.469245910644531, 6.032121658325195, 6.594997882843018, 7.15787410736084, 7.720749855041504, 8.283626556396484, 8.846502304077148, 9.409378051757812, 9.972254753112793, 10.535130500793457, 11.098007202148438, 11.660882949829102, 12.223758697509766, 12.78663444519043, 13.34951114654541, 13.912386894226074, 14.475263595581055, 15.038139343261719, 15.601015090942383, 16.163890838623047, 16.726768493652344, 17.289644241333008, 17.852519989013672]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 8.0, 14.0, 18.0, 25.0, 21.0, 19.0, 30.0, 29.0, 28.0, 27.0, 31.0, 34.0, 32.0, 34.0, 27.0, 45.0, 48.0, 28.0, 45.0, 41.0, 40.0, 30.0, 50.0, 29.0, 42.0, 23.0, 22.0, 19.0, 15.0, 18.0, 14.0, 17.0, 10.0, 19.0, 13.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.908498764038086, -11.512176513671875, -11.115854263305664, -10.719532012939453, -10.323209762573242, -9.926887512207031, -9.53056526184082, -9.13424301147461, -8.737920761108398, -8.341598510742188, -7.945276260375977, -7.548954010009766, -7.152631759643555, -6.756309509277344, -6.359987258911133, -5.963665008544922, -5.567342758178711, -5.1710205078125, -4.774698257446289, -4.378376007080078, -3.982053756713867, -3.5857315063476562, -3.1894092559814453, -2.7930870056152344, -2.3967647552490234, -2.0004425048828125, -1.6041202545166016, -1.2077980041503906, -0.8114757537841797, -0.41515350341796875, -0.018831253051757812, 0.3774909973144531, 0.7738142013549805, 1.1701364517211914, 1.5664587020874023, 1.9627809524536133, 2.359103202819824, 2.755425453186035, 3.151747703552246, 3.548069953918457, 3.944392204284668, 4.340714454650879, 4.73703670501709, 5.133358955383301, 5.529681205749512, 5.926003456115723, 6.322325706481934, 6.7186479568481445, 7.1149702072143555, 7.511292457580566, 7.907614707946777, 8.303936958312988, 8.7002592086792, 9.09658145904541, 9.492903709411621, 9.889225959777832, 10.285548210144043, 10.681870460510254, 11.078192710876465, 11.474514961242676, 11.870837211608887, 12.267159461975098, 12.663481712341309, 13.05980396270752, 13.45612621307373]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 14.0, 25.0, 30.0, 55.0, 68.0, 155.0, 196.0, 294.0, 429.0, 713.0, 1069.0, 1683.0, 2682.0, 4394.0, 7126.0, 12801.0, 22412.0, 41338.0, 80805.0, 164102.0, 343773.0, 683686.0, 1000824.0, 865037.0, 490337.0, 234620.0, 113411.0, 56122.0, 28498.0, 15488.0, 8759.0, 5179.0, 2945.0, 1799.0, 1182.0, 697.0, 461.0, 339.0, 237.0, 143.0, 112.0, 67.0, 51.0, 41.0, 33.0, 15.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.125, -16.529052734375, -15.93310546875, -15.337158203125, -14.7412109375, -14.145263671875, -13.54931640625, -12.953369140625, -12.357421875, -11.761474609375, -11.16552734375, -10.569580078125, -9.9736328125, -9.377685546875, -8.78173828125, -8.185791015625, -7.58984375, -6.993896484375, -6.39794921875, -5.802001953125, -5.2060546875, -4.610107421875, -4.01416015625, -3.418212890625, -2.822265625, -2.226318359375, -1.63037109375, -1.034423828125, -0.4384765625, 0.157470703125, 0.75341796875, 1.349365234375, 1.9453125, 2.541259765625, 3.13720703125, 3.733154296875, 4.3291015625, 4.925048828125, 5.52099609375, 6.116943359375, 6.712890625, 7.308837890625, 7.90478515625, 8.500732421875, 9.0966796875, 9.692626953125, 10.28857421875, 10.884521484375, 11.48046875, 12.076416015625, 12.67236328125, 13.268310546875, 13.8642578125, 14.460205078125, 15.05615234375, 15.652099609375, 16.248046875, 16.843994140625, 17.43994140625, 18.035888671875, 18.6318359375, 19.227783203125, 19.82373046875, 20.419677734375, 21.015625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 11.0, 9.0, 8.0, 3.0, 12.0, 9.0, 15.0, 19.0, 21.0, 19.0, 26.0, 19.0, 28.0, 20.0, 20.0, 34.0, 23.0, 31.0, 28.0, 34.0, 31.0, 25.0, 46.0, 35.0, 36.0, 45.0, 41.0, 31.0, 30.0, 30.0, 25.0, 32.0, 29.0, 19.0, 22.0, 10.0, 17.0, 19.0, 12.0, 11.0, 15.0, 10.0, 15.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-11.5, -11.157958984375, -10.81591796875, -10.473876953125, -10.1318359375, -9.789794921875, -9.44775390625, -9.105712890625, -8.763671875, -8.421630859375, -8.07958984375, -7.737548828125, -7.3955078125, -7.053466796875, -6.71142578125, -6.369384765625, -6.02734375, -5.685302734375, -5.34326171875, -5.001220703125, -4.6591796875, -4.317138671875, -3.97509765625, -3.633056640625, -3.291015625, -2.948974609375, -2.60693359375, -2.264892578125, -1.9228515625, -1.580810546875, -1.23876953125, -0.896728515625, -0.5546875, -0.212646484375, 0.12939453125, 0.471435546875, 0.8134765625, 1.155517578125, 1.49755859375, 1.839599609375, 2.181640625, 2.523681640625, 2.86572265625, 3.207763671875, 3.5498046875, 3.891845703125, 4.23388671875, 4.575927734375, 4.91796875, 5.260009765625, 5.60205078125, 5.944091796875, 6.2861328125, 6.628173828125, 6.97021484375, 7.312255859375, 7.654296875, 7.996337890625, 8.33837890625, 8.680419921875, 9.0224609375, 9.364501953125, 9.70654296875, 10.048583984375, 10.390625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 16.0, 19.0, 25.0, 38.0, 61.0, 86.0, 112.0, 156.0, 236.0, 371.0, 517.0, 733.0, 1106.0, 1642.0, 2596.0, 4040.0, 6301.0, 10265.0, 17178.0, 28939.0, 52278.0, 95136.0, 182114.0, 351225.0, 648021.0, 938282.0, 819632.0, 482482.0, 253379.0, 131293.0, 69913.0, 38614.0, 22114.0, 13019.0, 7988.0, 4921.0, 3176.0, 2064.0, 1361.0, 911.0, 613.0, 405.0, 289.0, 206.0, 119.0, 80.0, 67.0, 42.0, 35.0, 21.0, 17.0, 11.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0], "bins": [-24.625, -23.849365234375, -23.07373046875, -22.298095703125, -21.5224609375, -20.746826171875, -19.97119140625, -19.195556640625, -18.419921875, -17.644287109375, -16.86865234375, -16.093017578125, -15.3173828125, -14.541748046875, -13.76611328125, -12.990478515625, -12.21484375, -11.439208984375, -10.66357421875, -9.887939453125, -9.1123046875, -8.336669921875, -7.56103515625, -6.785400390625, -6.009765625, -5.234130859375, -4.45849609375, -3.682861328125, -2.9072265625, -2.131591796875, -1.35595703125, -0.580322265625, 0.1953125, 0.970947265625, 1.74658203125, 2.522216796875, 3.2978515625, 4.073486328125, 4.84912109375, 5.624755859375, 6.400390625, 7.176025390625, 7.95166015625, 8.727294921875, 9.5029296875, 10.278564453125, 11.05419921875, 11.829833984375, 12.60546875, 13.381103515625, 14.15673828125, 14.932373046875, 15.7080078125, 16.483642578125, 17.25927734375, 18.034912109375, 18.810546875, 19.586181640625, 20.36181640625, 21.137451171875, 21.9130859375, 22.688720703125, 23.46435546875, 24.239990234375, 25.015625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 10.0, 5.0, 13.0, 17.0, 23.0, 42.0, 30.0, 39.0, 47.0, 62.0, 78.0, 89.0, 108.0, 121.0, 157.0, 196.0, 211.0, 253.0, 279.0, 273.0, 301.0, 238.0, 211.0, 212.0, 201.0, 162.0, 137.0, 102.0, 72.0, 87.0, 60.0, 35.0, 33.0, 26.0, 25.0, 32.0, 18.0, 10.0, 9.0, 8.0, 7.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.6015625, -7.3621826171875, -7.122802734375, -6.8834228515625, -6.64404296875, -6.4046630859375, -6.165283203125, -5.9259033203125, -5.6865234375, -5.4471435546875, -5.207763671875, -4.9683837890625, -4.72900390625, -4.4896240234375, -4.250244140625, -4.0108642578125, -3.771484375, -3.5321044921875, -3.292724609375, -3.0533447265625, -2.81396484375, -2.5745849609375, -2.335205078125, -2.0958251953125, -1.8564453125, -1.6170654296875, -1.377685546875, -1.1383056640625, -0.89892578125, -0.6595458984375, -0.420166015625, -0.1807861328125, 0.05859375, 0.2979736328125, 0.537353515625, 0.7767333984375, 1.01611328125, 1.2554931640625, 1.494873046875, 1.7342529296875, 1.9736328125, 2.2130126953125, 2.452392578125, 2.6917724609375, 2.93115234375, 3.1705322265625, 3.409912109375, 3.6492919921875, 3.888671875, 4.1280517578125, 4.367431640625, 4.6068115234375, 4.84619140625, 5.0855712890625, 5.324951171875, 5.5643310546875, 5.8037109375, 6.0430908203125, 6.282470703125, 6.5218505859375, 6.76123046875, 7.0006103515625, 7.239990234375, 7.4793701171875, 7.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 6.0, 4.0, 6.0, 16.0, 5.0, 12.0, 17.0, 8.0, 21.0, 25.0, 32.0, 37.0, 31.0, 33.0, 53.0, 46.0, 44.0, 62.0, 56.0, 46.0, 66.0, 45.0, 43.0, 41.0, 34.0, 37.0, 31.0, 19.0, 26.0, 23.0, 16.0, 14.0, 9.0, 4.0, 6.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.721359252929688, -25.900625228881836, -25.079891204833984, -24.259157180786133, -23.43842315673828, -22.617687225341797, -21.796953201293945, -20.976219177246094, -20.155485153198242, -19.33475112915039, -18.51401710510254, -17.693283081054688, -16.872547149658203, -16.051815032958984, -15.2310791015625, -14.410345077514648, -13.589611053466797, -12.768877029418945, -11.948143005371094, -11.127408027648926, -10.306674003601074, -9.485939979553223, -8.665205001831055, -7.844470977783203, -7.023736953735352, -6.2030029296875, -5.38226842880249, -4.5615339279174805, -3.740799903869629, -2.9200658798217773, -2.0993313789367676, -1.2785968780517578, -0.45786285400390625, 0.3628714084625244, 1.183605670928955, 2.0043399333953857, 2.8250741958618164, 3.645808219909668, 4.466542720794678, 5.2872772216796875, 6.108011245727539, 6.928745269775391, 7.7494797706604, 8.57021427154541, 9.390948295593262, 10.211682319641113, 11.032417297363281, 11.853151321411133, 12.673885345458984, 13.494619369506836, 14.315353393554688, 15.136088371276855, 15.956822395324707, 16.777557373046875, 17.598291397094727, 18.419025421142578, 19.23975944519043, 20.06049346923828, 20.881227493286133, 21.701961517333984, 22.52269744873047, 23.343429565429688, 24.164165496826172, 24.984899520874023, 25.805633544921875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 12.0, 12.0, 14.0, 14.0, 10.0, 18.0, 18.0, 21.0, 27.0, 21.0, 37.0, 29.0, 38.0, 33.0, 41.0, 41.0, 40.0, 47.0, 36.0, 26.0, 47.0, 37.0, 35.0, 41.0, 32.0, 29.0, 31.0, 26.0, 31.0, 22.0, 13.0, 24.0, 14.0, 16.0, 12.0, 5.0, 10.0, 10.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-17.098608016967773, -16.550521850585938, -16.002437591552734, -15.454351425170898, -14.906265258789062, -14.358179092407227, -13.810093879699707, -13.262008666992188, -12.713922500610352, -12.165836334228516, -11.617751121520996, -11.069665908813477, -10.52157974243164, -9.973493576049805, -9.425408363342285, -8.877323150634766, -8.32923698425293, -7.781151294708252, -7.233065605163574, -6.6849799156188965, -6.136894226074219, -5.588808536529541, -5.040722846984863, -4.4926371574401855, -3.944551467895508, -3.39646577835083, -2.8483800888061523, -2.3002943992614746, -1.7522087097167969, -1.2041230201721191, -0.6560373306274414, -0.10795164108276367, 0.44013214111328125, 0.988217830657959, 1.5363035202026367, 2.0843892097473145, 2.632474899291992, 3.18056058883667, 3.7286462783813477, 4.276731967926025, 4.824817657470703, 5.372903347015381, 5.920989036560059, 6.469074726104736, 7.017160415649414, 7.565246105194092, 8.11333179473877, 8.661417007446289, 9.209503173828125, 9.757589340209961, 10.30567455291748, 10.853759765625, 11.401845932006836, 11.949932098388672, 12.498017311096191, 13.046102523803711, 13.594188690185547, 14.142274856567383, 14.690360069274902, 15.238445281982422, 15.786531448364258, 16.334617614746094, 16.882701873779297, 17.430788040161133, 17.97887420654297]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 14.0, 25.0, 26.0, 39.0, 71.0, 105.0, 154.0, 259.0, 389.0, 604.0, 976.0, 1442.0, 2207.0, 3323.0, 5461.0, 8373.0, 14036.0, 22228.0, 35270.0, 56033.0, 86307.0, 122638.0, 152794.0, 155249.0, 128102.0, 90629.0, 59992.0, 38055.0, 23512.0, 14734.0, 9241.0, 5808.0, 3751.0, 2413.0, 1525.0, 943.0, 612.0, 405.0, 284.0, 174.0, 112.0, 89.0, 61.0, 41.0, 15.0, 14.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.3416748046875, -10.988037109375, -10.6343994140625, -10.28076171875, -9.9271240234375, -9.573486328125, -9.2198486328125, -8.8662109375, -8.5125732421875, -8.158935546875, -7.8052978515625, -7.45166015625, -7.0980224609375, -6.744384765625, -6.3907470703125, -6.037109375, -5.6834716796875, -5.329833984375, -4.9761962890625, -4.62255859375, -4.2689208984375, -3.915283203125, -3.5616455078125, -3.2080078125, -2.8543701171875, -2.500732421875, -2.1470947265625, -1.79345703125, -1.4398193359375, -1.086181640625, -0.7325439453125, -0.37890625, -0.0252685546875, 0.328369140625, 0.6820068359375, 1.03564453125, 1.3892822265625, 1.742919921875, 2.0965576171875, 2.4501953125, 2.8038330078125, 3.157470703125, 3.5111083984375, 3.86474609375, 4.2183837890625, 4.572021484375, 4.9256591796875, 5.279296875, 5.6329345703125, 5.986572265625, 6.3402099609375, 6.69384765625, 7.0474853515625, 7.401123046875, 7.7547607421875, 8.1083984375, 8.4620361328125, 8.815673828125, 9.1693115234375, 9.52294921875, 9.8765869140625, 10.230224609375, 10.5838623046875, 10.9375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 10.0, 11.0, 15.0, 11.0, 8.0, 13.0, 27.0, 22.0, 30.0, 27.0, 35.0, 49.0, 35.0, 36.0, 40.0, 41.0, 48.0, 40.0, 40.0, 47.0, 40.0, 36.0, 44.0, 29.0, 43.0, 37.0, 26.0, 20.0, 25.0, 10.0, 26.0, 11.0, 13.0, 12.0, 9.0, 11.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.671875, -20.0234375, -19.375, -18.7265625, -18.078125, -17.4296875, -16.78125, -16.1328125, -15.484375, -14.8359375, -14.1875, -13.5390625, -12.890625, -12.2421875, -11.59375, -10.9453125, -10.296875, -9.6484375, -9.0, -8.3515625, -7.703125, -7.0546875, -6.40625, -5.7578125, -5.109375, -4.4609375, -3.8125, -3.1640625, -2.515625, -1.8671875, -1.21875, -0.5703125, 0.078125, 0.7265625, 1.375, 2.0234375, 2.671875, 3.3203125, 3.96875, 4.6171875, 5.265625, 5.9140625, 6.5625, 7.2109375, 7.859375, 8.5078125, 9.15625, 9.8046875, 10.453125, 11.1015625, 11.75, 12.3984375, 13.046875, 13.6953125, 14.34375, 14.9921875, 15.640625, 16.2890625, 16.9375, 17.5859375, 18.234375, 18.8828125, 19.53125, 20.1796875, 20.828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 1.0, 8.0, 8.0, 14.0, 32.0, 30.0, 44.0, 89.0, 110.0, 197.0, 266.0, 437.0, 630.0, 1031.0, 1642.0, 2553.0, 4254.0, 7335.0, 12598.0, 22364.0, 40679.0, 73417.0, 127462.0, 194710.0, 209206.0, 148469.0, 88331.0, 48846.0, 26923.0, 15050.0, 8636.0, 4999.0, 3035.0, 1823.0, 1120.0, 744.0, 508.0, 316.0, 231.0, 135.0, 90.0, 50.0, 39.0, 32.0, 26.0, 7.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.125, -15.62353515625, -15.1220703125, -14.62060546875, -14.119140625, -13.61767578125, -13.1162109375, -12.61474609375, -12.11328125, -11.61181640625, -11.1103515625, -10.60888671875, -10.107421875, -9.60595703125, -9.1044921875, -8.60302734375, -8.1015625, -7.60009765625, -7.0986328125, -6.59716796875, -6.095703125, -5.59423828125, -5.0927734375, -4.59130859375, -4.08984375, -3.58837890625, -3.0869140625, -2.58544921875, -2.083984375, -1.58251953125, -1.0810546875, -0.57958984375, -0.078125, 0.42333984375, 0.9248046875, 1.42626953125, 1.927734375, 2.42919921875, 2.9306640625, 3.43212890625, 3.93359375, 4.43505859375, 4.9365234375, 5.43798828125, 5.939453125, 6.44091796875, 6.9423828125, 7.44384765625, 7.9453125, 8.44677734375, 8.9482421875, 9.44970703125, 9.951171875, 10.45263671875, 10.9541015625, 11.45556640625, 11.95703125, 12.45849609375, 12.9599609375, 13.46142578125, 13.962890625, 14.46435546875, 14.9658203125, 15.46728515625, 15.96875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 9.0, 14.0, 13.0, 8.0, 17.0, 16.0, 21.0, 18.0, 27.0, 21.0, 34.0, 42.0, 44.0, 47.0, 43.0, 48.0, 47.0, 46.0, 51.0, 47.0, 39.0, 42.0, 43.0, 51.0, 32.0, 27.0, 26.0, 20.0, 13.0, 21.0, 18.0, 9.0, 10.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.2734375, -12.87109375, -12.46875, -12.06640625, -11.6640625, -11.26171875, -10.859375, -10.45703125, -10.0546875, -9.65234375, -9.25, -8.84765625, -8.4453125, -8.04296875, -7.640625, -7.23828125, -6.8359375, -6.43359375, -6.03125, -5.62890625, -5.2265625, -4.82421875, -4.421875, -4.01953125, -3.6171875, -3.21484375, -2.8125, -2.41015625, -2.0078125, -1.60546875, -1.203125, -0.80078125, -0.3984375, 0.00390625, 0.40625, 0.80859375, 1.2109375, 1.61328125, 2.015625, 2.41796875, 2.8203125, 3.22265625, 3.625, 4.02734375, 4.4296875, 4.83203125, 5.234375, 5.63671875, 6.0390625, 6.44140625, 6.84375, 7.24609375, 7.6484375, 8.05078125, 8.453125, 8.85546875, 9.2578125, 9.66015625, 10.0625, 10.46484375, 10.8671875, 11.26953125, 11.671875, 12.07421875, 12.4765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 10.0, 24.0, 29.0, 19.0, 43.0, 79.0, 67.0, 148.0, 230.0, 297.0, 551.0, 805.0, 1313.0, 2093.0, 3484.0, 6017.0, 10396.0, 18709.0, 35221.0, 65856.0, 122654.0, 202921.0, 229910.0, 156782.0, 87305.0, 46229.0, 24589.0, 13573.0, 7657.0, 4432.0, 2635.0, 1652.0, 1003.0, 640.0, 405.0, 273.0, 185.0, 112.0, 79.0, 40.0, 31.0, 18.0, 13.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-9.6328125, -9.351318359375, -9.06982421875, -8.788330078125, -8.5068359375, -8.225341796875, -7.94384765625, -7.662353515625, -7.380859375, -7.099365234375, -6.81787109375, -6.536376953125, -6.2548828125, -5.973388671875, -5.69189453125, -5.410400390625, -5.12890625, -4.847412109375, -4.56591796875, -4.284423828125, -4.0029296875, -3.721435546875, -3.43994140625, -3.158447265625, -2.876953125, -2.595458984375, -2.31396484375, -2.032470703125, -1.7509765625, -1.469482421875, -1.18798828125, -0.906494140625, -0.625, -0.343505859375, -0.06201171875, 0.219482421875, 0.5009765625, 0.782470703125, 1.06396484375, 1.345458984375, 1.626953125, 1.908447265625, 2.18994140625, 2.471435546875, 2.7529296875, 3.034423828125, 3.31591796875, 3.597412109375, 3.87890625, 4.160400390625, 4.44189453125, 4.723388671875, 5.0048828125, 5.286376953125, 5.56787109375, 5.849365234375, 6.130859375, 6.412353515625, 6.69384765625, 6.975341796875, 7.2568359375, 7.538330078125, 7.81982421875, 8.101318359375, 8.3828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 9.0, 7.0, 10.0, 16.0, 11.0, 17.0, 25.0, 27.0, 31.0, 36.0, 31.0, 59.0, 44.0, 47.0, 56.0, 59.0, 78.0, 54.0, 48.0, 47.0, 44.0, 34.0, 36.0, 34.0, 23.0, 23.0, 13.0, 12.0, 15.0, 13.0, 4.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003979206085205078, -0.00038359686732292175, -0.0003692731261253357, -0.00035494938492774963, -0.0003406256437301636, -0.0003263019025325775, -0.00031197816133499146, -0.0002976544201374054, -0.00028333067893981934, -0.0002690069377422333, -0.0002546831965446472, -0.00024035945534706116, -0.0002260357141494751, -0.00021171197295188904, -0.00019738823175430298, -0.00018306449055671692, -0.00016874074935913086, -0.0001544170081615448, -0.00014009326696395874, -0.00012576952576637268, -0.00011144578456878662, -9.712204337120056e-05, -8.27983021736145e-05, -6.847456097602844e-05, -5.415081977844238e-05, -3.982707858085632e-05, -2.5503337383270264e-05, -1.1179596185684204e-05, 3.1441450119018555e-06, 1.7467886209487915e-05, 3.1791627407073975e-05, 4.6115368604660034e-05, 6.0439109802246094e-05, 7.476285099983215e-05, 8.908659219741821e-05, 0.00010341033339500427, 0.00011773407459259033, 0.0001320578157901764, 0.00014638155698776245, 0.0001607052981853485, 0.00017502903938293457, 0.00018935278058052063, 0.0002036765217781067, 0.00021800026297569275, 0.0002323240041732788, 0.00024664774537086487, 0.00026097148656845093, 0.000275295227766037, 0.00028961896896362305, 0.0003039427101612091, 0.00031826645135879517, 0.0003325901925563812, 0.0003469139337539673, 0.00036123767495155334, 0.0003755614161491394, 0.00038988515734672546, 0.0004042088985443115, 0.0004185326397418976, 0.00043285638093948364, 0.0004471801221370697, 0.00046150386333465576, 0.0004758276045322418, 0.0004901513457298279, 0.0005044750869274139, 0.000518798828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 13.0, 7.0, 8.0, 18.0, 26.0, 38.0, 59.0, 90.0, 107.0, 193.0, 253.0, 366.0, 530.0, 823.0, 1203.0, 1880.0, 2895.0, 4636.0, 7194.0, 11724.0, 19485.0, 33313.0, 55735.0, 91587.0, 138687.0, 174663.0, 168636.0, 126644.0, 81877.0, 49852.0, 29701.0, 17675.0, 10609.0, 6437.0, 3928.0, 2534.0, 1666.0, 1115.0, 700.0, 504.0, 365.0, 256.0, 153.0, 111.0, 87.0, 59.0, 39.0, 25.0, 20.0, 7.0, 9.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0], "bins": [-8.7109375, -8.446044921875, -8.18115234375, -7.916259765625, -7.6513671875, -7.386474609375, -7.12158203125, -6.856689453125, -6.591796875, -6.326904296875, -6.06201171875, -5.797119140625, -5.5322265625, -5.267333984375, -5.00244140625, -4.737548828125, -4.47265625, -4.207763671875, -3.94287109375, -3.677978515625, -3.4130859375, -3.148193359375, -2.88330078125, -2.618408203125, -2.353515625, -2.088623046875, -1.82373046875, -1.558837890625, -1.2939453125, -1.029052734375, -0.76416015625, -0.499267578125, -0.234375, 0.030517578125, 0.29541015625, 0.560302734375, 0.8251953125, 1.090087890625, 1.35498046875, 1.619873046875, 1.884765625, 2.149658203125, 2.41455078125, 2.679443359375, 2.9443359375, 3.209228515625, 3.47412109375, 3.739013671875, 4.00390625, 4.268798828125, 4.53369140625, 4.798583984375, 5.0634765625, 5.328369140625, 5.59326171875, 5.858154296875, 6.123046875, 6.387939453125, 6.65283203125, 6.917724609375, 7.1826171875, 7.447509765625, 7.71240234375, 7.977294921875, 8.2421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 6.0, 9.0, 11.0, 14.0, 27.0, 35.0, 26.0, 29.0, 37.0, 43.0, 51.0, 60.0, 56.0, 67.0, 55.0, 56.0, 59.0, 60.0, 33.0, 34.0, 34.0, 33.0, 36.0, 19.0, 18.0, 17.0, 8.0, 6.0, 12.0, 11.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.36328125, -3.27142333984375, -3.1795654296875, -3.08770751953125, -2.995849609375, -2.90399169921875, -2.8121337890625, -2.72027587890625, -2.62841796875, -2.53656005859375, -2.4447021484375, -2.35284423828125, -2.260986328125, -2.16912841796875, -2.0772705078125, -1.98541259765625, -1.8935546875, -1.80169677734375, -1.7098388671875, -1.61798095703125, -1.526123046875, -1.43426513671875, -1.3424072265625, -1.25054931640625, -1.15869140625, -1.06683349609375, -0.9749755859375, -0.88311767578125, -0.791259765625, -0.69940185546875, -0.6075439453125, -0.51568603515625, -0.423828125, -0.33197021484375, -0.2401123046875, -0.14825439453125, -0.056396484375, 0.03546142578125, 0.1273193359375, 0.21917724609375, 0.31103515625, 0.40289306640625, 0.4947509765625, 0.58660888671875, 0.678466796875, 0.77032470703125, 0.8621826171875, 0.95404052734375, 1.0458984375, 1.13775634765625, 1.2296142578125, 1.32147216796875, 1.413330078125, 1.50518798828125, 1.5970458984375, 1.68890380859375, 1.78076171875, 1.87261962890625, 1.9644775390625, 2.05633544921875, 2.148193359375, 2.24005126953125, 2.3319091796875, 2.42376708984375, 2.515625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 5.0, 9.0, 7.0, 10.0, 9.0, 13.0, 12.0, 23.0, 23.0, 33.0, 29.0, 30.0, 41.0, 52.0, 43.0, 50.0, 58.0, 47.0, 66.0, 67.0, 46.0, 48.0, 29.0, 40.0, 39.0, 27.0, 35.0, 21.0, 16.0, 18.0, 8.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.771923065185547, -26.920028686523438, -26.06813621520996, -25.21624183654785, -24.364349365234375, -23.512454986572266, -22.660560607910156, -21.80866813659668, -20.95677375793457, -20.10487937927246, -19.252986907958984, -18.401092529296875, -17.5492000579834, -16.69730567932129, -15.845412254333496, -14.993518829345703, -14.14162540435791, -13.289731979370117, -12.437838554382324, -11.585945129394531, -10.734050750732422, -9.882157325744629, -9.030263900756836, -8.178369522094727, -7.326476573944092, -6.474583148956299, -5.622689247131348, -4.770795822143555, -3.9189021587371826, -3.0670084953308105, -2.2151150703430176, -1.3632211685180664, -0.5113277435302734, 0.34056586027145386, 1.1924594640731812, 2.0443530082702637, 2.8962466716766357, 3.748140335083008, 4.600033760070801, 5.451927661895752, 6.303821086883545, 7.155714511871338, 8.007608413696289, 8.859501838684082, 9.711395263671875, 10.563289642333984, 11.415182113647461, 12.26707649230957, 13.118969917297363, 13.970863342285156, 14.82275676727295, 15.674650192260742, 16.52654457092285, 17.378437042236328, 18.230331420898438, 19.082225799560547, 19.934118270874023, 20.786012649536133, 21.63790512084961, 22.48979949951172, 23.341691970825195, 24.193586349487305, 25.04547882080078, 25.89737319946289, 26.749267578125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 13.0, 10.0, 16.0, 15.0, 19.0, 21.0, 26.0, 20.0, 40.0, 24.0, 33.0, 40.0, 39.0, 39.0, 39.0, 44.0, 38.0, 42.0, 34.0, 41.0, 29.0, 34.0, 31.0, 41.0, 37.0, 23.0, 23.0, 28.0, 26.0, 17.0, 12.0, 17.0, 10.0, 8.0, 12.0, 12.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.176673889160156, -16.617765426635742, -16.058856964111328, -15.499948501586914, -14.941040992736816, -14.382132530212402, -13.823224067687988, -13.264315605163574, -12.705408096313477, -12.146499633789062, -11.587591171264648, -11.028682708740234, -10.469775199890137, -9.910866737365723, -9.351958274841309, -8.793049812316895, -8.23414134979248, -7.675232887268066, -7.1163249015808105, -6.5574164390563965, -5.998508453369141, -5.439599990844727, -4.8806915283203125, -4.321783065795898, -3.7628750801086426, -3.2039668560028076, -2.6450586318969727, -2.0861501693725586, -1.5272419452667236, -0.9683337211608887, -0.4094252586364746, 0.14948296546936035, 0.7083911895751953, 1.2672994136810303, 1.8262077569961548, 2.3851161003112793, 2.9440243244171143, 3.502932548522949, 4.061841011047363, 4.620749473571777, 5.179657459259033, 5.738565921783447, 6.297473907470703, 6.856382369995117, 7.415290832519531, 7.974198818206787, 8.53310775756836, 9.092015266418457, 9.650923728942871, 10.209832191467285, 10.7687406539917, 11.327648162841797, 11.886556625366211, 12.445465087890625, 13.004373550415039, 13.563282012939453, 14.122190475463867, 14.681098937988281, 15.240007400512695, 15.79891586303711, 16.357824325561523, 16.916732788085938, 17.47563934326172, 18.034547805786133, 18.593456268310547]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 10.0, 12.0, 7.0, 24.0, 35.0, 70.0, 87.0, 112.0, 186.0, 298.0, 421.0, 643.0, 909.0, 1384.0, 2307.0, 3504.0, 5569.0, 9011.0, 15083.0, 24990.0, 42396.0, 70714.0, 110640.0, 153094.0, 171329.0, 150873.0, 109606.0, 69854.0, 41583.0, 24764.0, 14577.0, 9020.0, 5501.0, 3477.0, 2264.0, 1383.0, 920.0, 635.0, 386.0, 338.0, 186.0, 136.0, 77.0, 49.0, 27.0, 29.0, 16.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.546875, -15.036865234375, -14.52685546875, -14.016845703125, -13.5068359375, -12.996826171875, -12.48681640625, -11.976806640625, -11.466796875, -10.956787109375, -10.44677734375, -9.936767578125, -9.4267578125, -8.916748046875, -8.40673828125, -7.896728515625, -7.38671875, -6.876708984375, -6.36669921875, -5.856689453125, -5.3466796875, -4.836669921875, -4.32666015625, -3.816650390625, -3.306640625, -2.796630859375, -2.28662109375, -1.776611328125, -1.2666015625, -0.756591796875, -0.24658203125, 0.263427734375, 0.7734375, 1.283447265625, 1.79345703125, 2.303466796875, 2.8134765625, 3.323486328125, 3.83349609375, 4.343505859375, 4.853515625, 5.363525390625, 5.87353515625, 6.383544921875, 6.8935546875, 7.403564453125, 7.91357421875, 8.423583984375, 8.93359375, 9.443603515625, 9.95361328125, 10.463623046875, 10.9736328125, 11.483642578125, 11.99365234375, 12.503662109375, 13.013671875, 13.523681640625, 14.03369140625, 14.543701171875, 15.0537109375, 15.563720703125, 16.07373046875, 16.583740234375, 17.09375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 12.0, 9.0, 12.0, 13.0, 23.0, 14.0, 19.0, 22.0, 25.0, 35.0, 32.0, 31.0, 39.0, 34.0, 48.0, 56.0, 37.0, 43.0, 41.0, 43.0, 45.0, 33.0, 46.0, 31.0, 29.0, 38.0, 29.0, 25.0, 29.0, 15.0, 12.0, 13.0, 14.0, 8.0, 14.0, 6.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.86083984375, -18.2216796875, -17.58251953125, -16.943359375, -16.30419921875, -15.6650390625, -15.02587890625, -14.38671875, -13.74755859375, -13.1083984375, -12.46923828125, -11.830078125, -11.19091796875, -10.5517578125, -9.91259765625, -9.2734375, -8.63427734375, -7.9951171875, -7.35595703125, -6.716796875, -6.07763671875, -5.4384765625, -4.79931640625, -4.16015625, -3.52099609375, -2.8818359375, -2.24267578125, -1.603515625, -0.96435546875, -0.3251953125, 0.31396484375, 0.953125, 1.59228515625, 2.2314453125, 2.87060546875, 3.509765625, 4.14892578125, 4.7880859375, 5.42724609375, 6.06640625, 6.70556640625, 7.3447265625, 7.98388671875, 8.623046875, 9.26220703125, 9.9013671875, 10.54052734375, 11.1796875, 11.81884765625, 12.4580078125, 13.09716796875, 13.736328125, 14.37548828125, 15.0146484375, 15.65380859375, 16.29296875, 16.93212890625, 17.5712890625, 18.21044921875, 18.849609375, 19.48876953125, 20.1279296875, 20.76708984375, 21.40625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 9.0, 15.0, 21.0, 32.0, 50.0, 67.0, 104.0, 154.0, 289.0, 402.0, 680.0, 1078.0, 1633.0, 2702.0, 4429.0, 7429.0, 12554.0, 21029.0, 36921.0, 65233.0, 112800.0, 173991.0, 203012.0, 162739.0, 101590.0, 58369.0, 33626.0, 19300.0, 11126.0, 6666.0, 3907.0, 2448.0, 1499.0, 901.0, 594.0, 414.0, 247.0, 168.0, 98.0, 78.0, 42.0, 31.0, 11.0, 14.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-27.515625, -26.639404296875, -25.76318359375, -24.886962890625, -24.0107421875, -23.134521484375, -22.25830078125, -21.382080078125, -20.505859375, -19.629638671875, -18.75341796875, -17.877197265625, -17.0009765625, -16.124755859375, -15.24853515625, -14.372314453125, -13.49609375, -12.619873046875, -11.74365234375, -10.867431640625, -9.9912109375, -9.114990234375, -8.23876953125, -7.362548828125, -6.486328125, -5.610107421875, -4.73388671875, -3.857666015625, -2.9814453125, -2.105224609375, -1.22900390625, -0.352783203125, 0.5234375, 1.399658203125, 2.27587890625, 3.152099609375, 4.0283203125, 4.904541015625, 5.78076171875, 6.656982421875, 7.533203125, 8.409423828125, 9.28564453125, 10.161865234375, 11.0380859375, 11.914306640625, 12.79052734375, 13.666748046875, 14.54296875, 15.419189453125, 16.29541015625, 17.171630859375, 18.0478515625, 18.924072265625, 19.80029296875, 20.676513671875, 21.552734375, 22.428955078125, 23.30517578125, 24.181396484375, 25.0576171875, 25.933837890625, 26.81005859375, 27.686279296875, 28.5625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 11.0, 8.0, 13.0, 11.0, 12.0, 12.0, 12.0, 23.0, 28.0, 28.0, 25.0, 31.0, 32.0, 36.0, 28.0, 38.0, 38.0, 48.0, 46.0, 58.0, 44.0, 35.0, 38.0, 36.0, 27.0, 35.0, 38.0, 34.0, 25.0, 28.0, 25.0, 19.0, 13.0, 9.0, 9.0, 17.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.53125, -13.11181640625, -12.6923828125, -12.27294921875, -11.853515625, -11.43408203125, -11.0146484375, -10.59521484375, -10.17578125, -9.75634765625, -9.3369140625, -8.91748046875, -8.498046875, -8.07861328125, -7.6591796875, -7.23974609375, -6.8203125, -6.40087890625, -5.9814453125, -5.56201171875, -5.142578125, -4.72314453125, -4.3037109375, -3.88427734375, -3.46484375, -3.04541015625, -2.6259765625, -2.20654296875, -1.787109375, -1.36767578125, -0.9482421875, -0.52880859375, -0.109375, 0.31005859375, 0.7294921875, 1.14892578125, 1.568359375, 1.98779296875, 2.4072265625, 2.82666015625, 3.24609375, 3.66552734375, 4.0849609375, 4.50439453125, 4.923828125, 5.34326171875, 5.7626953125, 6.18212890625, 6.6015625, 7.02099609375, 7.4404296875, 7.85986328125, 8.279296875, 8.69873046875, 9.1181640625, 9.53759765625, 9.95703125, 10.37646484375, 10.7958984375, 11.21533203125, 11.634765625, 12.05419921875, 12.4736328125, 12.89306640625, 13.3125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 15.0, 21.0, 42.0, 53.0, 78.0, 142.0, 184.0, 274.0, 496.0, 845.0, 1517.0, 2812.0, 5452.0, 12209.0, 28325.0, 66843.0, 149869.0, 260805.0, 257528.0, 145049.0, 65011.0, 27314.0, 11883.0, 5524.0, 2698.0, 1485.0, 777.0, 503.0, 272.0, 171.0, 107.0, 71.0, 56.0, 37.0, 24.0, 20.0, 12.0, 9.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.4375, -19.8695068359375, -19.301513671875, -18.7335205078125, -18.16552734375, -17.5975341796875, -17.029541015625, -16.4615478515625, -15.8935546875, -15.3255615234375, -14.757568359375, -14.1895751953125, -13.62158203125, -13.0535888671875, -12.485595703125, -11.9176025390625, -11.349609375, -10.7816162109375, -10.213623046875, -9.6456298828125, -9.07763671875, -8.5096435546875, -7.941650390625, -7.3736572265625, -6.8056640625, -6.2376708984375, -5.669677734375, -5.1016845703125, -4.53369140625, -3.9656982421875, -3.397705078125, -2.8297119140625, -2.26171875, -1.6937255859375, -1.125732421875, -0.5577392578125, 0.01025390625, 0.5782470703125, 1.146240234375, 1.7142333984375, 2.2822265625, 2.8502197265625, 3.418212890625, 3.9862060546875, 4.55419921875, 5.1221923828125, 5.690185546875, 6.2581787109375, 6.826171875, 7.3941650390625, 7.962158203125, 8.5301513671875, 9.09814453125, 9.6661376953125, 10.234130859375, 10.8021240234375, 11.3701171875, 11.9381103515625, 12.506103515625, 13.0740966796875, 13.64208984375, 14.2100830078125, 14.778076171875, 15.3460693359375, 15.9140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 16.0, 23.0, 29.0, 32.0, 37.0, 31.0, 50.0, 43.0, 65.0, 62.0, 83.0, 72.0, 52.0, 62.0, 50.0, 48.0, 48.0, 35.0, 25.0, 19.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001163482666015625, -0.0011239498853683472, -0.0010844171047210693, -0.0010448843240737915, -0.0010053515434265137, -0.0009658187627792358, -0.000926285982131958, -0.0008867532014846802, -0.0008472204208374023, -0.0008076876401901245, -0.0007681548595428467, -0.0007286220788955688, -0.000689089298248291, -0.0006495565176010132, -0.0006100237369537354, -0.0005704909563064575, -0.0005309581756591797, -0.0004914253950119019, -0.000451892614364624, -0.0004123598337173462, -0.00037282705307006836, -0.00033329427242279053, -0.0002937614917755127, -0.00025422871112823486, -0.00021469593048095703, -0.0001751631498336792, -0.00013563036918640137, -9.609758853912354e-05, -5.65648078918457e-05, -1.703202724456787e-05, 2.250075340270996e-05, 6.203353404998779e-05, 0.00010156631469726562, 0.00014109909534454346, 0.0001806318759918213, 0.00022016465663909912, 0.00025969743728637695, 0.0002992302179336548, 0.0003387629985809326, 0.00037829577922821045, 0.0004178285598754883, 0.0004573613405227661, 0.0004968941211700439, 0.0005364269018173218, 0.0005759596824645996, 0.0006154924631118774, 0.0006550252437591553, 0.0006945580244064331, 0.0007340908050537109, 0.0007736235857009888, 0.0008131563663482666, 0.0008526891469955444, 0.0008922219276428223, 0.0009317547082901001, 0.0009712874889373779, 0.0010108202695846558, 0.0010503530502319336, 0.0010898858308792114, 0.0011294186115264893, 0.001168951392173767, 0.001208484172821045, 0.0012480169534683228, 0.0012875497341156006, 0.0013270825147628784, 0.0013666152954101562]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 8.0, 9.0, 13.0, 9.0, 26.0, 32.0, 29.0, 54.0, 81.0, 89.0, 152.0, 242.0, 360.0, 521.0, 806.0, 1308.0, 2197.0, 3724.0, 6616.0, 12642.0, 24058.0, 47295.0, 89436.0, 154725.0, 211447.0, 200126.0, 134117.0, 74774.0, 39156.0, 20106.0, 10390.0, 5700.0, 3190.0, 1846.0, 1143.0, 705.0, 444.0, 296.0, 201.0, 139.0, 83.0, 78.0, 42.0, 41.0, 39.0, 16.0, 20.0, 10.0, 4.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.0546875, -12.6448974609375, -12.235107421875, -11.8253173828125, -11.41552734375, -11.0057373046875, -10.595947265625, -10.1861572265625, -9.7763671875, -9.3665771484375, -8.956787109375, -8.5469970703125, -8.13720703125, -7.7274169921875, -7.317626953125, -6.9078369140625, -6.498046875, -6.0882568359375, -5.678466796875, -5.2686767578125, -4.85888671875, -4.4490966796875, -4.039306640625, -3.6295166015625, -3.2197265625, -2.8099365234375, -2.400146484375, -1.9903564453125, -1.58056640625, -1.1707763671875, -0.760986328125, -0.3511962890625, 0.05859375, 0.4683837890625, 0.878173828125, 1.2879638671875, 1.69775390625, 2.1075439453125, 2.517333984375, 2.9271240234375, 3.3369140625, 3.7467041015625, 4.156494140625, 4.5662841796875, 4.97607421875, 5.3858642578125, 5.795654296875, 6.2054443359375, 6.615234375, 7.0250244140625, 7.434814453125, 7.8446044921875, 8.25439453125, 8.6641845703125, 9.073974609375, 9.4837646484375, 9.8935546875, 10.3033447265625, 10.713134765625, 11.1229248046875, 11.53271484375, 11.9425048828125, 12.352294921875, 12.7620849609375, 13.171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 12.0, 13.0, 17.0, 26.0, 16.0, 27.0, 36.0, 35.0, 34.0, 44.0, 70.0, 50.0, 48.0, 57.0, 69.0, 55.0, 57.0, 51.0, 35.0, 43.0, 36.0, 29.0, 17.0, 25.0, 13.0, 20.0, 12.0, 9.0, 6.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.09539794921875, -2.9876708984375, -2.87994384765625, -2.772216796875, -2.66448974609375, -2.5567626953125, -2.44903564453125, -2.34130859375, -2.23358154296875, -2.1258544921875, -2.01812744140625, -1.910400390625, -1.80267333984375, -1.6949462890625, -1.58721923828125, -1.4794921875, -1.37176513671875, -1.2640380859375, -1.15631103515625, -1.048583984375, -0.94085693359375, -0.8331298828125, -0.72540283203125, -0.61767578125, -0.50994873046875, -0.4022216796875, -0.29449462890625, -0.186767578125, -0.07904052734375, 0.0286865234375, 0.13641357421875, 0.244140625, 0.35186767578125, 0.4595947265625, 0.56732177734375, 0.675048828125, 0.78277587890625, 0.8905029296875, 0.99822998046875, 1.10595703125, 1.21368408203125, 1.3214111328125, 1.42913818359375, 1.536865234375, 1.64459228515625, 1.7523193359375, 1.86004638671875, 1.9677734375, 2.07550048828125, 2.1832275390625, 2.29095458984375, 2.398681640625, 2.50640869140625, 2.6141357421875, 2.72186279296875, 2.82958984375, 2.93731689453125, 3.0450439453125, 3.15277099609375, 3.260498046875, 3.36822509765625, 3.4759521484375, 3.58367919921875, 3.69140625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 7.0, 8.0, 8.0, 13.0, 20.0, 14.0, 20.0, 20.0, 30.0, 27.0, 47.0, 40.0, 45.0, 61.0, 61.0, 60.0, 58.0, 61.0, 53.0, 51.0, 41.0, 46.0, 27.0, 29.0, 39.0, 26.0, 22.0, 13.0, 5.0, 11.0, 2.0, 6.0, 5.0, 0.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.87222671508789, -30.914466857910156, -29.956707000732422, -28.998945236206055, -28.04118537902832, -27.083425521850586, -26.12566566467285, -25.167903900146484, -24.21014404296875, -23.252384185791016, -22.29462432861328, -21.336862564086914, -20.37910270690918, -19.421342849731445, -18.46358299255371, -17.505821228027344, -16.54806137084961, -15.590301513671875, -14.632540702819824, -13.67478084564209, -12.717020034790039, -11.759260177612305, -10.80150032043457, -9.84373950958252, -8.885980606079102, -7.928220272064209, -6.970459938049316, -6.012700080871582, -5.054939270019531, -4.097179412841797, -3.1394190788269043, -2.1816587448120117, -1.223897933959961, -0.26613765954971313, 0.6916226148605347, 1.6493828296661377, 2.6071431636810303, 3.5649032592773438, 4.522663593292236, 5.480423927307129, 6.4381842613220215, 7.395944595336914, 8.353704452514648, 9.3114652633667, 10.269225120544434, 11.226985931396484, 12.184745788574219, 13.142505645751953, 14.100266456604004, 15.058026313781738, 16.01578712463379, 16.973546981811523, 17.931306838989258, 18.889068603515625, 19.84682846069336, 20.804588317871094, 21.762348175048828, 22.720108032226562, 23.677867889404297, 24.635629653930664, 25.5933895111084, 26.551149368286133, 27.508909225463867, 28.466670989990234, 29.42443084716797]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 10.0, 7.0, 10.0, 12.0, 12.0, 24.0, 18.0, 23.0, 27.0, 42.0, 23.0, 36.0, 36.0, 41.0, 52.0, 46.0, 37.0, 39.0, 42.0, 46.0, 56.0, 50.0, 40.0, 37.0, 27.0, 36.0, 25.0, 22.0, 24.0, 27.0, 16.0, 14.0, 13.0, 12.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.52432632446289, -28.70242691040039, -27.880525588989258, -27.058624267578125, -26.236724853515625, -25.414825439453125, -24.592924118041992, -23.77102279663086, -22.94912338256836, -22.12722396850586, -21.305322647094727, -20.483421325683594, -19.661521911621094, -18.839622497558594, -18.01772117614746, -17.195819854736328, -16.373920440673828, -15.552020072937012, -14.730119705200195, -13.908219337463379, -13.086318969726562, -12.264418601989746, -11.44251823425293, -10.620617866516113, -9.798717498779297, -8.97681713104248, -8.154916763305664, -7.333016395568848, -6.511116027832031, -5.689215660095215, -4.867315292358398, -4.045414924621582, -3.2235145568847656, -2.401614189147949, -1.5797138214111328, -0.7578134536743164, 0.0640869140625, 0.8859872817993164, 1.7078876495361328, 2.529788017272949, 3.3516883850097656, 4.173588752746582, 4.995489120483398, 5.817389488220215, 6.639289855957031, 7.461190223693848, 8.283090591430664, 9.10499095916748, 9.926891326904297, 10.748791694641113, 11.57069206237793, 12.392592430114746, 13.214492797851562, 14.036393165588379, 14.858293533325195, 15.680193901062012, 16.502094268798828, 17.323993682861328, 18.14589500427246, 18.967796325683594, 19.789695739746094, 20.611595153808594, 21.433496475219727, 22.25539779663086, 23.07729721069336]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 14.0, 8.0, 5.0, 22.0, 19.0, 24.0, 39.0, 46.0, 64.0, 89.0, 123.0, 176.0, 275.0, 444.0, 837.0, 1605.0, 4089.0, 506287.0, 5432.0, 2087.0, 935.0, 572.0, 322.0, 201.0, 138.0, 95.0, 60.0, 50.0, 39.0, 28.0, 22.0, 10.0, 14.0, 17.0, 15.0, 6.0, 5.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0], "bins": [-618.67529296875, -600.8162841796875, -582.957275390625, -565.0983276367188, -547.2393188476562, -529.3803100585938, -511.52130126953125, -493.66229248046875, -475.8033142089844, -457.9443054199219, -440.0853271484375, -422.226318359375, -404.3673095703125, -386.5083312988281, -368.6493225097656, -350.79034423828125, -332.93133544921875, -315.07232666015625, -297.2133483886719, -279.3543395996094, -261.495361328125, -243.6363525390625, -225.77734375, -207.91835021972656, -190.05935668945312, -172.2003631591797, -154.34136962890625, -136.48236083984375, -118.62336730957031, -100.76437377929688, -82.9053726196289, -65.04637145996094, -47.18743896484375, -29.328441619873047, -11.469444274902344, 6.389553070068359, 24.248550415039062, 42.1075439453125, 59.96654510498047, 77.82554626464844, 95.68453979492188, 113.54353332519531, 131.40252685546875, 149.26153564453125, 167.1205291748047, 184.97952270507812, 202.83853149414062, 220.69752502441406, 238.5565185546875, 256.41552734375, 274.2745056152344, 292.1335144042969, 309.99249267578125, 327.85150146484375, 345.71051025390625, 363.56951904296875, 381.4284973144531, 399.2875061035156, 417.146484375, 435.0054931640625, 452.864501953125, 470.7234802246094, 488.5824890136719, 506.44146728515625, 524.3004760742188]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 9.0, 6.0, 9.0, 12.0, 9.0, 21.0, 21.0, 22.0, 19.0, 39.0, 36.0, 31.0, 30.0, 39.0, 48.0, 40.0, 50.0, 35.0, 1067.0, 41.0, 52.0, 51.0, 45.0, 40.0, 30.0, 34.0, 29.0, 25.0, 23.0, 27.0, 20.0, 16.0, 13.0, 14.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-949.3104248046875, -923.1917724609375, -897.0731201171875, -870.9544677734375, -844.8358154296875, -818.7171630859375, -792.5985107421875, -766.4797973632812, -740.3611450195312, -714.2424926757812, -688.1238403320312, -662.0051879882812, -635.8865356445312, -609.767822265625, -583.649169921875, -557.530517578125, -531.411865234375, -505.293212890625, -479.174560546875, -453.055908203125, -426.9372253417969, -400.8185729980469, -374.6999206542969, -348.58123779296875, -322.462646484375, -296.343994140625, -270.225341796875, -244.10667419433594, -217.98800659179688, -191.86935424804688, -165.75070190429688, -139.6320343017578, -113.51336669921875, -87.39470672607422, -61.27605056762695, -35.15739440917969, -9.038734436035156, 17.079925537109375, 43.198577880859375, 69.31724548339844, 95.43589782714844, 121.55455780029297, 147.6732177734375, 173.7918701171875, 199.9105224609375, 226.02919006347656, 252.14784240722656, 278.2665100097656, 304.3851623535156, 330.5038146972656, 356.6224670410156, 382.74114990234375, 408.85980224609375, 434.97845458984375, 461.09710693359375, 487.21575927734375, 513.3344116210938, 539.4530639648438, 565.5717163085938, 591.6903686523438, 617.8090209960938, 643.927734375, 670.04638671875, 696.1650390625, 722.28369140625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 16.0, 11.0, 26.0, 34.0, 35.0, 62.0, 68.0, 69.0, 83.0, 134.0, 165.0, 178.0, 259.0, 315.0, 344.0, 426.0, 494.0, 608.0, 713.0, 904.0, 1259.0, 1812.0, 2353.0, 3734.0, 16856.0, 31192476.0, 13317.0, 5525.0, 3383.0, 3105.0, 2660.0, 1672.0, 672.0, 314.0, 163.0, 79.0, 53.0, 38.0, 24.0, 19.0, 12.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1011.7003784179688, -986.0008544921875, -960.3013305664062, -934.601806640625, -908.9022827148438, -883.2027587890625, -857.5032958984375, -831.8037109375, -806.104248046875, -780.4047241210938, -754.7052001953125, -729.0056762695312, -703.30615234375, -677.6066284179688, -651.9071044921875, -626.2076416015625, -600.508056640625, -574.8085327148438, -549.1090087890625, -523.4094848632812, -497.7099609375, -472.01043701171875, -446.3109436035156, -420.6114196777344, -394.9118957519531, -369.2123718261719, -343.5128479003906, -317.8133544921875, -292.11383056640625, -266.414306640625, -240.71478271484375, -215.0152587890625, -189.315673828125, -163.61614990234375, -137.9166259765625, -112.21711730957031, -86.51759338378906, -60.81806945800781, -35.118560791015625, -9.419036865234375, 16.280487060546875, 41.98000717163086, 67.67952728271484, 93.37904357910156, 119.07856750488281, 144.77809143066406, 170.47760009765625, 196.1771240234375, 221.87664794921875, 247.576171875, 273.27569580078125, 298.9752197265625, 324.67474365234375, 350.374267578125, 376.0737609863281, 401.7732849121094, 427.4728088378906, 453.1723327636719, 478.8718566894531, 504.57135009765625, 530.2708740234375, 555.9703979492188, 581.669921875, 607.3694458007812, 633.0689697265625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 19.0, 33.0, 55.0, 93.0, 117.0, 179.0, 261.0, 507.0, 791.0, 1235.0, 2062.0, 3519.0, 6021.0, 10128.0, 17478.0, 31410.0, 57965.0, 108811.0, 213528.0, 449444.0, 1085266.0, 2149341.0, 1185804.0, 484018.0, 227976.0, 115907.0, 61278.0, 33579.0, 18518.0, 10496.0, 6203.0, 3607.0, 2156.0, 1297.0, 888.0, 507.0, 316.0, 225.0, 144.0, 76.0, 47.0, 44.0, 18.0, 19.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.25, -63.181640625, -61.11328125, -59.044921875, -56.9765625, -54.908203125, -52.83984375, -50.771484375, -48.703125, -46.634765625, -44.56640625, -42.498046875, -40.4296875, -38.361328125, -36.29296875, -34.224609375, -32.15625, -30.087890625, -28.01953125, -25.951171875, -23.8828125, -21.814453125, -19.74609375, -17.677734375, -15.609375, -13.541015625, -11.47265625, -9.404296875, -7.3359375, -5.267578125, -3.19921875, -1.130859375, 0.9375, 3.005859375, 5.07421875, 7.142578125, 9.2109375, 11.279296875, 13.34765625, 15.416015625, 17.484375, 19.552734375, 21.62109375, 23.689453125, 25.7578125, 27.826171875, 29.89453125, 31.962890625, 34.03125, 36.099609375, 38.16796875, 40.236328125, 42.3046875, 44.373046875, 46.44140625, 48.509765625, 50.578125, 52.646484375, 54.71484375, 56.783203125, 58.8515625, 60.919921875, 62.98828125, 65.056640625, 67.125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 7.0, 4.0, 6.0, 15.0, 10.0, 17.0, 29.0, 21.0, 30.0, 37.0, 56.0, 49.0, 92.0, 125.0, 141.0, 155.0, 191.0, 192.0, 190.0, 120.0, 103.0, 65.0, 75.0, 51.0, 41.0, 28.0, 27.0, 27.0, 17.0, 23.0, 12.0, 10.0, 11.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-26.921875, -26.02587890625, -25.1298828125, -24.23388671875, -23.337890625, -22.44189453125, -21.5458984375, -20.64990234375, -19.75390625, -18.85791015625, -17.9619140625, -17.06591796875, -16.169921875, -15.27392578125, -14.3779296875, -13.48193359375, -12.5859375, -11.68994140625, -10.7939453125, -9.89794921875, -9.001953125, -8.10595703125, -7.2099609375, -6.31396484375, -5.41796875, -4.52197265625, -3.6259765625, -2.72998046875, -1.833984375, -0.93798828125, -0.0419921875, 0.85400390625, 1.75, 2.64599609375, 3.5419921875, 4.43798828125, 5.333984375, 6.22998046875, 7.1259765625, 8.02197265625, 8.91796875, 9.81396484375, 10.7099609375, 11.60595703125, 12.501953125, 13.39794921875, 14.2939453125, 15.18994140625, 16.0859375, 16.98193359375, 17.8779296875, 18.77392578125, 19.669921875, 20.56591796875, 21.4619140625, 22.35791015625, 23.25390625, 24.14990234375, 25.0458984375, 25.94189453125, 26.837890625, 27.73388671875, 28.6298828125, 29.52587890625, 30.421875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 7.0, 17.0, 18.0, 43.0, 70.0, 126.0, 187.0, 291.0, 510.0, 767.0, 1178.0, 1864.0, 2819.0, 4536.0, 7286.0, 11707.0, 18704.0, 30457.0, 49536.0, 79766.0, 128317.0, 214897.0, 377048.0, 785860.0, 1770570.0, 1421950.0, 602614.0, 309151.0, 181198.0, 110968.0, 68525.0, 41935.0, 25781.0, 16005.0, 10111.0, 6179.0, 3767.0, 2527.0, 1558.0, 1011.0, 599.0, 397.0, 208.0, 133.0, 77.0, 54.0, 35.0, 31.0, 18.0, 12.0, 9.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.301513671875, -27.35302734375, -26.404541015625, -25.4560546875, -24.507568359375, -23.55908203125, -22.610595703125, -21.662109375, -20.713623046875, -19.76513671875, -18.816650390625, -17.8681640625, -16.919677734375, -15.97119140625, -15.022705078125, -14.07421875, -13.125732421875, -12.17724609375, -11.228759765625, -10.2802734375, -9.331787109375, -8.38330078125, -7.434814453125, -6.486328125, -5.537841796875, -4.58935546875, -3.640869140625, -2.6923828125, -1.743896484375, -0.79541015625, 0.153076171875, 1.1015625, 2.050048828125, 2.99853515625, 3.947021484375, 4.8955078125, 5.843994140625, 6.79248046875, 7.740966796875, 8.689453125, 9.637939453125, 10.58642578125, 11.534912109375, 12.4833984375, 13.431884765625, 14.38037109375, 15.328857421875, 16.27734375, 17.225830078125, 18.17431640625, 19.122802734375, 20.0712890625, 21.019775390625, 21.96826171875, 22.916748046875, 23.865234375, 24.813720703125, 25.76220703125, 26.710693359375, 27.6591796875, 28.607666015625, 29.55615234375, 30.504638671875, 31.453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 12.0, 7.0, 7.0, 10.0, 17.0, 11.0, 19.0, 18.0, 12.0, 27.0, 37.0, 41.0, 45.0, 54.0, 65.0, 119.0, 179.0, 191.0, 267.0, 193.0, 155.0, 115.0, 102.0, 55.0, 40.0, 33.0, 28.0, 26.0, 20.0, 18.0, 17.0, 18.0, 12.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.3125, -38.1015625, -36.890625, -35.6796875, -34.46875, -33.2578125, -32.046875, -30.8359375, -29.625, -28.4140625, -27.203125, -25.9921875, -24.78125, -23.5703125, -22.359375, -21.1484375, -19.9375, -18.7265625, -17.515625, -16.3046875, -15.09375, -13.8828125, -12.671875, -11.4609375, -10.25, -9.0390625, -7.828125, -6.6171875, -5.40625, -4.1953125, -2.984375, -1.7734375, -0.5625, 0.6484375, 1.859375, 3.0703125, 4.28125, 5.4921875, 6.703125, 7.9140625, 9.125, 10.3359375, 11.546875, 12.7578125, 13.96875, 15.1796875, 16.390625, 17.6015625, 18.8125, 20.0234375, 21.234375, 22.4453125, 23.65625, 24.8671875, 26.078125, 27.2890625, 28.5, 29.7109375, 30.921875, 32.1328125, 33.34375, 34.5546875, 35.765625, 36.9765625, 38.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 1.0, 7.0, 3.0, 10.0, 7.0, 8.0, 16.0, 34.0, 44.0, 76.0, 93.0, 132.0, 217.0, 305.0, 444.0, 698.0, 1076.0, 1718.0, 2787.0, 4815.0, 8926.0, 16826.0, 34449.0, 78720.0, 334024.0, 5588492.0, 120772.0, 47326.0, 22306.0, 11699.0, 6159.0, 3337.0, 2180.0, 1319.0, 819.0, 490.0, 302.0, 228.0, 182.0, 121.0, 82.0, 57.0, 47.0, 21.0, 18.0, 16.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-123.5625, -120.052734375, -116.54296875, -113.033203125, -109.5234375, -106.013671875, -102.50390625, -98.994140625, -95.484375, -91.974609375, -88.46484375, -84.955078125, -81.4453125, -77.935546875, -74.42578125, -70.916015625, -67.40625, -63.896484375, -60.38671875, -56.876953125, -53.3671875, -49.857421875, -46.34765625, -42.837890625, -39.328125, -35.818359375, -32.30859375, -28.798828125, -25.2890625, -21.779296875, -18.26953125, -14.759765625, -11.25, -7.740234375, -4.23046875, -0.720703125, 2.7890625, 6.298828125, 9.80859375, 13.318359375, 16.828125, 20.337890625, 23.84765625, 27.357421875, 30.8671875, 34.376953125, 37.88671875, 41.396484375, 44.90625, 48.416015625, 51.92578125, 55.435546875, 58.9453125, 62.455078125, 65.96484375, 69.474609375, 72.984375, 76.494140625, 80.00390625, 83.513671875, 87.0234375, 90.533203125, 94.04296875, 97.552734375, 101.0625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 9.0, 7.0, 8.0, 16.0, 13.0, 16.0, 26.0, 24.0, 26.0, 38.0, 42.0, 40.0, 59.0, 92.0, 162.0, 339.0, 419.0, 186.0, 100.0, 61.0, 42.0, 45.0, 45.0, 34.0, 22.0, 18.0, 27.0, 19.0, 15.0, 12.0, 7.0, 12.0, 8.0, 6.0, 4.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4375, -65.0439453125, -62.650390625, -60.2568359375, -57.86328125, -55.4697265625, -53.076171875, -50.6826171875, -48.2890625, -45.8955078125, -43.501953125, -41.1083984375, -38.71484375, -36.3212890625, -33.927734375, -31.5341796875, -29.140625, -26.7470703125, -24.353515625, -21.9599609375, -19.56640625, -17.1728515625, -14.779296875, -12.3857421875, -9.9921875, -7.5986328125, -5.205078125, -2.8115234375, -0.41796875, 1.9755859375, 4.369140625, 6.7626953125, 9.15625, 11.5498046875, 13.943359375, 16.3369140625, 18.73046875, 21.1240234375, 23.517578125, 25.9111328125, 28.3046875, 30.6982421875, 33.091796875, 35.4853515625, 37.87890625, 40.2724609375, 42.666015625, 45.0595703125, 47.453125, 49.8466796875, 52.240234375, 54.6337890625, 57.02734375, 59.4208984375, 61.814453125, 64.2080078125, 66.6015625, 68.9951171875, 71.388671875, 73.7822265625, 76.17578125, 78.5693359375, 80.962890625, 83.3564453125, 85.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 3.0, 5.0, 3.0, 11.0, 18.0, 21.0, 14.0, 21.0, 29.0, 46.0, 85.0, 130.0, 236.0, 111.0, 64.0, 60.0, 30.0, 29.0, 25.0, 12.0, 22.0, 9.0, 3.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3233.22998046875, -3155.23974609375, -3077.24951171875, -2999.25927734375, -2921.26904296875, -2843.27880859375, -2765.28857421875, -2687.29833984375, -2609.30810546875, -2531.31787109375, -2453.32763671875, -2375.33740234375, -2297.34716796875, -2219.35693359375, -2141.36669921875, -2063.37646484375, -1985.386474609375, -1907.396240234375, -1829.406005859375, -1751.415771484375, -1673.425537109375, -1595.435302734375, -1517.4451904296875, -1439.4549560546875, -1361.4647216796875, -1283.4744873046875, -1205.4842529296875, -1127.4940185546875, -1049.50390625, -971.5136108398438, -893.5234375, -815.533203125, -737.5428466796875, -659.5526123046875, -581.5623779296875, -503.57220458984375, -425.58197021484375, -347.59173583984375, -269.6015319824219, -191.611328125, -113.62109375, -35.63087463378906, 42.359344482421875, 120.34956359863281, 198.33978271484375, 276.33001708984375, 354.3202209472656, 432.3104248046875, 510.3006591796875, 588.2908935546875, 666.2811279296875, 744.2713012695312, 822.2615356445312, 900.2517700195312, 978.241943359375, 1056.232177734375, 1134.222412109375, 1212.212646484375, 1290.202880859375, 1368.193115234375, 1446.183349609375, 1524.173583984375, 1602.1636962890625, 1680.1539306640625, 1758.1441650390625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 11.0, 7.0, 13.0, 13.0, 16.0, 11.0, 15.0, 18.0, 14.0, 24.0, 21.0, 24.0, 33.0, 45.0, 62.0, 126.0, 127.0, 78.0, 53.0, 35.0, 25.0, 13.0, 24.0, 18.0, 21.0, 22.0, 20.0, 12.0, 10.0, 14.0, 13.0, 7.0, 6.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2016.4866943359375, -1949.412841796875, -1882.3389892578125, -1815.26513671875, -1748.1912841796875, -1681.117431640625, -1614.04345703125, -1546.9697265625, -1479.895751953125, -1412.8218994140625, -1345.748046875, -1278.6741943359375, -1211.600341796875, -1144.5264892578125, -1077.45263671875, -1010.3787231445312, -943.304931640625, -876.2310791015625, -809.1572265625, -742.0833740234375, -675.009521484375, -607.9356689453125, -540.8617553710938, -473.78790283203125, -406.71405029296875, -339.64019775390625, -272.56634521484375, -205.49246215820312, -138.41860961914062, -71.34475708007812, -4.2708740234375, 62.802978515625, 129.876708984375, 196.9505615234375, 264.0244140625, 331.0982971191406, 398.1721496582031, 465.2460021972656, 532.3198852539062, 599.3937377929688, 666.4675903320312, 733.5414428710938, 800.6152954101562, 867.689208984375, 934.7630615234375, 1001.8369140625, 1068.9107666015625, 1135.984619140625, 1203.0584716796875, 1270.13232421875, 1337.2061767578125, 1404.280029296875, 1471.3538818359375, 1538.427734375, 1605.501708984375, 1672.575439453125, 1739.6494140625, 1806.7232666015625, 1873.797119140625, 1940.8709716796875, 2007.94482421875, 2075.018798828125, 2142.092529296875, 2209.16650390625, 2276.240234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 16.0, 22.0, 27.0, 30.0, 52.0, 69.0, 99.0, 152.0, 194.0, 328.0, 452.0, 650.0, 948.0, 1521.0, 2418.0, 3946.0, 6571.0, 11784.0, 24813.0, 66532.0, 313118.0, 3306225.0, 343523.0, 66571.0, 22076.0, 9760.0, 4925.0, 2857.0, 1711.0, 1023.0, 675.0, 407.0, 271.0, 175.0, 111.0, 69.0, 49.0, 31.0, 19.0, 14.0, 14.0, 11.0, 3.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.578125, -25.849853515625, -25.12158203125, -24.393310546875, -23.6650390625, -22.936767578125, -22.20849609375, -21.480224609375, -20.751953125, -20.023681640625, -19.29541015625, -18.567138671875, -17.8388671875, -17.110595703125, -16.38232421875, -15.654052734375, -14.92578125, -14.197509765625, -13.46923828125, -12.740966796875, -12.0126953125, -11.284423828125, -10.55615234375, -9.827880859375, -9.099609375, -8.371337890625, -7.64306640625, -6.914794921875, -6.1865234375, -5.458251953125, -4.72998046875, -4.001708984375, -3.2734375, -2.545166015625, -1.81689453125, -1.088623046875, -0.3603515625, 0.367919921875, 1.09619140625, 1.824462890625, 2.552734375, 3.281005859375, 4.00927734375, 4.737548828125, 5.4658203125, 6.194091796875, 6.92236328125, 7.650634765625, 8.37890625, 9.107177734375, 9.83544921875, 10.563720703125, 11.2919921875, 12.020263671875, 12.74853515625, 13.476806640625, 14.205078125, 14.933349609375, 15.66162109375, 16.389892578125, 17.1181640625, 17.846435546875, 18.57470703125, 19.302978515625, 20.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 14.0, 5.0, 18.0, 33.0, 50.0, 64.0, 97.0, 161.0, 194.0, 110.0, 78.0, 45.0, 36.0, 19.0, 13.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.568511962890625, -2.49053955078125, -2.412567138671875, -2.3345947265625, -2.256622314453125, -2.17864990234375, -2.100677490234375, -2.022705078125, -1.944732666015625, -1.86676025390625, -1.788787841796875, -1.7108154296875, -1.632843017578125, -1.55487060546875, -1.476898193359375, -1.39892578125, -1.320953369140625, -1.24298095703125, -1.165008544921875, -1.0870361328125, -1.009063720703125, -0.93109130859375, -0.853118896484375, -0.775146484375, -0.697174072265625, -0.61920166015625, -0.541229248046875, -0.4632568359375, -0.385284423828125, -0.30731201171875, -0.229339599609375, -0.1513671875, -0.073394775390625, 0.00457763671875, 0.082550048828125, 0.1605224609375, 0.238494873046875, 0.31646728515625, 0.394439697265625, 0.472412109375, 0.550384521484375, 0.62835693359375, 0.706329345703125, 0.7843017578125, 0.862274169921875, 0.94024658203125, 1.018218994140625, 1.09619140625, 1.174163818359375, 1.25213623046875, 1.330108642578125, 1.4080810546875, 1.486053466796875, 1.56402587890625, 1.641998291015625, 1.719970703125, 1.797943115234375, 1.87591552734375, 1.953887939453125, 2.0318603515625, 2.109832763671875, 2.18780517578125, 2.265777587890625, 2.34375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 12.0, 18.0, 27.0, 33.0, 45.0, 56.0, 77.0, 135.0, 245.0, 361.0, 666.0, 1241.0, 2568.0, 6071.0, 17541.0, 65625.0, 354826.0, 2721496.0, 847103.0, 129662.0, 29757.0, 9388.0, 3598.0, 1608.0, 863.0, 504.0, 253.0, 159.0, 115.0, 63.0, 47.0, 41.0, 23.0, 13.0, 11.0, 8.0, 10.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.109375, -27.275390625, -26.44140625, -25.607421875, -24.7734375, -23.939453125, -23.10546875, -22.271484375, -21.4375, -20.603515625, -19.76953125, -18.935546875, -18.1015625, -17.267578125, -16.43359375, -15.599609375, -14.765625, -13.931640625, -13.09765625, -12.263671875, -11.4296875, -10.595703125, -9.76171875, -8.927734375, -8.09375, -7.259765625, -6.42578125, -5.591796875, -4.7578125, -3.923828125, -3.08984375, -2.255859375, -1.421875, -0.587890625, 0.24609375, 1.080078125, 1.9140625, 2.748046875, 3.58203125, 4.416015625, 5.25, 6.083984375, 6.91796875, 7.751953125, 8.5859375, 9.419921875, 10.25390625, 11.087890625, 11.921875, 12.755859375, 13.58984375, 14.423828125, 15.2578125, 16.091796875, 16.92578125, 17.759765625, 18.59375, 19.427734375, 20.26171875, 21.095703125, 21.9296875, 22.763671875, 23.59765625, 24.431640625, 25.265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 4.0, 16.0, 13.0, 13.0, 18.0, 27.0, 36.0, 62.0, 45.0, 86.0, 110.0, 134.0, 165.0, 293.0, 367.0, 740.0, 508.0, 354.0, 265.0, 171.0, 135.0, 116.0, 93.0, 71.0, 51.0, 44.0, 28.0, 29.0, 19.0, 11.0, 6.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -4.993408203125, -4.78369140625, -4.573974609375, -4.3642578125, -4.154541015625, -3.94482421875, -3.735107421875, -3.525390625, -3.315673828125, -3.10595703125, -2.896240234375, -2.6865234375, -2.476806640625, -2.26708984375, -2.057373046875, -1.84765625, -1.637939453125, -1.42822265625, -1.218505859375, -1.0087890625, -0.799072265625, -0.58935546875, -0.379638671875, -0.169921875, 0.039794921875, 0.24951171875, 0.459228515625, 0.6689453125, 0.878662109375, 1.08837890625, 1.298095703125, 1.5078125, 1.717529296875, 1.92724609375, 2.136962890625, 2.3466796875, 2.556396484375, 2.76611328125, 2.975830078125, 3.185546875, 3.395263671875, 3.60498046875, 3.814697265625, 4.0244140625, 4.234130859375, 4.44384765625, 4.653564453125, 4.86328125, 5.072998046875, 5.28271484375, 5.492431640625, 5.7021484375, 5.911865234375, 6.12158203125, 6.331298828125, 6.541015625, 6.750732421875, 6.96044921875, 7.170166015625, 7.3798828125, 7.589599609375, 7.79931640625, 8.009033203125, 8.21875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 16.0, 25.0, 30.0, 53.0, 79.0, 124.0, 144.0, 141.0, 121.0, 88.0, 67.0, 34.0, 24.0, 16.0, 10.0, 6.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.24186706542969, -83.62004089355469, -80.99822235107422, -78.37639617919922, -75.75457763671875, -73.13275146484375, -70.51092529296875, -67.88910675048828, -65.26728057861328, -62.64545822143555, -60.02363586425781, -57.40180969238281, -54.77998733520508, -52.158164978027344, -49.53634262084961, -46.914520263671875, -44.29269790649414, -41.670875549316406, -39.04905319213867, -36.42723083496094, -33.80540466308594, -31.183582305908203, -28.56175994873047, -25.9399356842041, -23.318113327026367, -20.696290969848633, -18.074466705322266, -15.452644348144531, -12.83082103729248, -10.20899772644043, -7.587175369262695, -4.965351104736328, -2.3435287475585938, 0.27829432487487793, 2.9001173973083496, 5.521940231323242, 8.143763542175293, 10.765586853027344, 13.387409210205078, 16.009233474731445, 18.63105583190918, 21.252878189086914, 23.87470245361328, 26.496524810791016, 29.11834716796875, 31.740171432495117, 34.36199188232422, 36.98381805419922, 39.60564041137695, 42.22746276855469, 44.84928512573242, 47.471107482910156, 50.092933654785156, 52.71475601196289, 55.336578369140625, 57.958404541015625, 60.580223083496094, 63.20204544067383, 65.82386779785156, 68.44569396972656, 71.06751251220703, 73.68933868408203, 76.3111572265625, 78.9329833984375, 81.5548095703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 10.0, 11.0, 15.0, 41.0, 24.0, 33.0, 32.0, 49.0, 62.0, 42.0, 57.0, 50.0, 55.0, 68.0, 52.0, 69.0, 62.0, 51.0, 32.0, 40.0, 32.0, 27.0, 27.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.68160247802734, -74.87442779541016, -73.06725311279297, -71.26007843017578, -69.4529037475586, -67.6457290649414, -65.83855438232422, -64.03138732910156, -62.22420883178711, -60.41703414916992, -58.609859466552734, -56.80268478393555, -54.995513916015625, -53.18833923339844, -51.38116455078125, -49.57398986816406, -47.766815185546875, -45.95964050292969, -44.1524658203125, -42.34529113769531, -40.538116455078125, -38.73094177246094, -36.923770904541016, -35.11659622192383, -33.30942153930664, -31.502246856689453, -29.695072174072266, -27.88789939880371, -26.080724716186523, -24.273550033569336, -22.46637725830078, -20.659202575683594, -18.852027893066406, -17.04485321044922, -15.237679481506348, -13.430505752563477, -11.623331069946289, -9.816156387329102, -8.00898265838623, -6.201808929443359, -4.394634246826172, -2.5874600410461426, -0.7802858352661133, 1.026888370513916, 2.8340625762939453, 4.641237258911133, 6.448410987854004, 8.255584716796875, 10.062759399414062, 11.86993408203125, 13.677107810974121, 15.484281539916992, 17.29145622253418, 19.098630905151367, 20.905803680419922, 22.71297836303711, 24.520153045654297, 26.327327728271484, 28.134502410888672, 29.941675186157227, 31.748849868774414, 33.55602264404297, 35.363197326660156, 37.170372009277344, 38.97754669189453]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 9.0, 8.0, 13.0, 10.0, 17.0, 26.0, 42.0, 48.0, 84.0, 143.0, 196.0, 284.0, 430.0, 614.0, 1077.0, 1764.0, 3091.0, 6382.0, 15220.0, 40714.0, 141256.0, 559740.0, 192602.0, 50691.0, 18029.0, 7482.0, 3560.0, 1900.0, 1088.0, 721.0, 439.0, 271.0, 175.0, 119.0, 87.0, 73.0, 48.0, 28.0, 20.0, 27.0, 13.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.7208251953125, -15.238525390625, -14.7562255859375, -14.27392578125, -13.7916259765625, -13.309326171875, -12.8270263671875, -12.3447265625, -11.8624267578125, -11.380126953125, -10.8978271484375, -10.41552734375, -9.9332275390625, -9.450927734375, -8.9686279296875, -8.486328125, -8.0040283203125, -7.521728515625, -7.0394287109375, -6.55712890625, -6.0748291015625, -5.592529296875, -5.1102294921875, -4.6279296875, -4.1456298828125, -3.663330078125, -3.1810302734375, -2.69873046875, -2.2164306640625, -1.734130859375, -1.2518310546875, -0.76953125, -0.2872314453125, 0.195068359375, 0.6773681640625, 1.15966796875, 1.6419677734375, 2.124267578125, 2.6065673828125, 3.0888671875, 3.5711669921875, 4.053466796875, 4.5357666015625, 5.01806640625, 5.5003662109375, 5.982666015625, 6.4649658203125, 6.947265625, 7.4295654296875, 7.911865234375, 8.3941650390625, 8.87646484375, 9.3587646484375, 9.841064453125, 10.3233642578125, 10.8056640625, 11.2879638671875, 11.770263671875, 12.2525634765625, 12.73486328125, 13.2171630859375, 13.699462890625, 14.1817626953125, 14.6640625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 16.0, 16.0, 26.0, 31.0, 40.0, 46.0, 56.0, 86.0, 91.0, 89.0, 91.0, 83.0, 73.0, 53.0, 51.0, 33.0, 29.0, 18.0, 16.0, 10.0, 9.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.20416259765625, -2.1212158203125, -2.03826904296875, -1.955322265625, -1.87237548828125, -1.7894287109375, -1.70648193359375, -1.62353515625, -1.54058837890625, -1.4576416015625, -1.37469482421875, -1.291748046875, -1.20880126953125, -1.1258544921875, -1.04290771484375, -0.9599609375, -0.87701416015625, -0.7940673828125, -0.71112060546875, -0.628173828125, -0.54522705078125, -0.4622802734375, -0.37933349609375, -0.29638671875, -0.21343994140625, -0.1304931640625, -0.04754638671875, 0.035400390625, 0.11834716796875, 0.2012939453125, 0.28424072265625, 0.3671875, 0.45013427734375, 0.5330810546875, 0.61602783203125, 0.698974609375, 0.78192138671875, 0.8648681640625, 0.94781494140625, 1.03076171875, 1.11370849609375, 1.1966552734375, 1.27960205078125, 1.362548828125, 1.44549560546875, 1.5284423828125, 1.61138916015625, 1.6943359375, 1.77728271484375, 1.8602294921875, 1.94317626953125, 2.026123046875, 2.10906982421875, 2.1920166015625, 2.27496337890625, 2.35791015625, 2.44085693359375, 2.5238037109375, 2.60675048828125, 2.689697265625, 2.77264404296875, 2.8555908203125, 2.93853759765625, 3.021484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 8.0, 7.0, 17.0, 20.0, 25.0, 41.0, 56.0, 78.0, 112.0, 186.0, 242.0, 406.0, 636.0, 1081.0, 1674.0, 3289.0, 6143.0, 12354.0, 28694.0, 75426.0, 272453.0, 450254.0, 119193.0, 40872.0, 17284.0, 8038.0, 4154.0, 2277.0, 1310.0, 811.0, 496.0, 320.0, 200.0, 116.0, 94.0, 61.0, 39.0, 22.0, 24.0, 14.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-12.5078125, -12.14208984375, -11.7763671875, -11.41064453125, -11.044921875, -10.67919921875, -10.3134765625, -9.94775390625, -9.58203125, -9.21630859375, -8.8505859375, -8.48486328125, -8.119140625, -7.75341796875, -7.3876953125, -7.02197265625, -6.65625, -6.29052734375, -5.9248046875, -5.55908203125, -5.193359375, -4.82763671875, -4.4619140625, -4.09619140625, -3.73046875, -3.36474609375, -2.9990234375, -2.63330078125, -2.267578125, -1.90185546875, -1.5361328125, -1.17041015625, -0.8046875, -0.43896484375, -0.0732421875, 0.29248046875, 0.658203125, 1.02392578125, 1.3896484375, 1.75537109375, 2.12109375, 2.48681640625, 2.8525390625, 3.21826171875, 3.583984375, 3.94970703125, 4.3154296875, 4.68115234375, 5.046875, 5.41259765625, 5.7783203125, 6.14404296875, 6.509765625, 6.87548828125, 7.2412109375, 7.60693359375, 7.97265625, 8.33837890625, 8.7041015625, 9.06982421875, 9.435546875, 9.80126953125, 10.1669921875, 10.53271484375, 10.8984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 10.0, 6.0, 7.0, 11.0, 11.0, 22.0, 26.0, 23.0, 32.0, 29.0, 26.0, 29.0, 38.0, 34.0, 31.0, 38.0, 40.0, 49.0, 52.0, 52.0, 53.0, 43.0, 33.0, 50.0, 31.0, 30.0, 29.0, 28.0, 23.0, 21.0, 19.0, 12.0, 14.0, 19.0, 6.0, 11.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-12.5390625, -12.1859130859375, -11.832763671875, -11.4796142578125, -11.12646484375, -10.7733154296875, -10.420166015625, -10.0670166015625, -9.7138671875, -9.3607177734375, -9.007568359375, -8.6544189453125, -8.30126953125, -7.9481201171875, -7.594970703125, -7.2418212890625, -6.888671875, -6.5355224609375, -6.182373046875, -5.8292236328125, -5.47607421875, -5.1229248046875, -4.769775390625, -4.4166259765625, -4.0634765625, -3.7103271484375, -3.357177734375, -3.0040283203125, -2.65087890625, -2.2977294921875, -1.944580078125, -1.5914306640625, -1.23828125, -0.8851318359375, -0.531982421875, -0.1788330078125, 0.17431640625, 0.5274658203125, 0.880615234375, 1.2337646484375, 1.5869140625, 1.9400634765625, 2.293212890625, 2.6463623046875, 2.99951171875, 3.3526611328125, 3.705810546875, 4.0589599609375, 4.412109375, 4.7652587890625, 5.118408203125, 5.4715576171875, 5.82470703125, 6.1778564453125, 6.531005859375, 6.8841552734375, 7.2373046875, 7.5904541015625, 7.943603515625, 8.2967529296875, 8.64990234375, 9.0030517578125, 9.356201171875, 9.7093505859375, 10.0625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 11.0, 16.0, 36.0, 44.0, 101.0, 191.0, 423.0, 1140.0, 3612.0, 17816.0, 230767.0, 736416.0, 47968.0, 6956.0, 1821.0, 658.0, 251.0, 147.0, 54.0, 34.0, 21.0, 21.0, 13.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.109375, -13.626708984375, -13.14404296875, -12.661376953125, -12.1787109375, -11.696044921875, -11.21337890625, -10.730712890625, -10.248046875, -9.765380859375, -9.28271484375, -8.800048828125, -8.3173828125, -7.834716796875, -7.35205078125, -6.869384765625, -6.38671875, -5.904052734375, -5.42138671875, -4.938720703125, -4.4560546875, -3.973388671875, -3.49072265625, -3.008056640625, -2.525390625, -2.042724609375, -1.56005859375, -1.077392578125, -0.5947265625, -0.112060546875, 0.37060546875, 0.853271484375, 1.3359375, 1.818603515625, 2.30126953125, 2.783935546875, 3.2666015625, 3.749267578125, 4.23193359375, 4.714599609375, 5.197265625, 5.679931640625, 6.16259765625, 6.645263671875, 7.1279296875, 7.610595703125, 8.09326171875, 8.575927734375, 9.05859375, 9.541259765625, 10.02392578125, 10.506591796875, 10.9892578125, 11.471923828125, 11.95458984375, 12.437255859375, 12.919921875, 13.402587890625, 13.88525390625, 14.367919921875, 14.8505859375, 15.333251953125, 15.81591796875, 16.298583984375, 16.78125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 26.0, 32.0, 43.0, 93.0, 89.0, 157.0, 126.0, 142.0, 89.0, 73.0, 35.0, 28.0, 17.0, 16.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006003379821777344, -0.0005805566906929016, -0.0005607753992080688, -0.0005409941077232361, -0.0005212128162384033, -0.0005014315247535706, -0.0004816502332687378, -0.00046186894178390503, -0.00044208765029907227, -0.0004223063588142395, -0.00040252506732940674, -0.000382743775844574, -0.0003629624843597412, -0.00034318119287490845, -0.0003233999013900757, -0.0003036186099052429, -0.00028383731842041016, -0.0002640560269355774, -0.00024427473545074463, -0.00022449344396591187, -0.0002047121524810791, -0.00018493086099624634, -0.00016514956951141357, -0.0001453682780265808, -0.00012558698654174805, -0.00010580569505691528, -8.602440357208252e-05, -6.624311208724976e-05, -4.646182060241699e-05, -2.668052911758423e-05, -6.899237632751465e-06, 1.2882053852081299e-05, 3.266334533691406e-05, 5.2444636821746826e-05, 7.222592830657959e-05, 9.200721979141235e-05, 0.00011178851127624512, 0.00013156980276107788, 0.00015135109424591064, 0.0001711323857307434, 0.00019091367721557617, 0.00021069496870040894, 0.0002304762601852417, 0.00025025755167007446, 0.0002700388431549072, 0.00028982013463974, 0.00030960142612457275, 0.0003293827176094055, 0.0003491640090942383, 0.00036894530057907104, 0.0003887265920639038, 0.00040850788354873657, 0.00042828917503356934, 0.0004480704665184021, 0.00046785175800323486, 0.0004876330494880676, 0.0005074143409729004, 0.0005271956324577332, 0.0005469769239425659, 0.0005667582154273987, 0.0005865395069122314, 0.0006063207983970642, 0.000626102089881897, 0.0006458833813667297, 0.0006656646728515625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 8.0, 11.0, 4.0, 13.0, 18.0, 25.0, 30.0, 45.0, 92.0, 137.0, 226.0, 433.0, 860.0, 2021.0, 5727.0, 20902.0, 124671.0, 672890.0, 182277.0, 26647.0, 6908.0, 2471.0, 959.0, 466.0, 232.0, 174.0, 124.0, 56.0, 32.0, 27.0, 16.0, 12.0, 9.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.12646484375, -9.7841796875, -9.44189453125, -9.099609375, -8.75732421875, -8.4150390625, -8.07275390625, -7.73046875, -7.38818359375, -7.0458984375, -6.70361328125, -6.361328125, -6.01904296875, -5.6767578125, -5.33447265625, -4.9921875, -4.64990234375, -4.3076171875, -3.96533203125, -3.623046875, -3.28076171875, -2.9384765625, -2.59619140625, -2.25390625, -1.91162109375, -1.5693359375, -1.22705078125, -0.884765625, -0.54248046875, -0.2001953125, 0.14208984375, 0.484375, 0.82666015625, 1.1689453125, 1.51123046875, 1.853515625, 2.19580078125, 2.5380859375, 2.88037109375, 3.22265625, 3.56494140625, 3.9072265625, 4.24951171875, 4.591796875, 4.93408203125, 5.2763671875, 5.61865234375, 5.9609375, 6.30322265625, 6.6455078125, 6.98779296875, 7.330078125, 7.67236328125, 8.0146484375, 8.35693359375, 8.69921875, 9.04150390625, 9.3837890625, 9.72607421875, 10.068359375, 10.41064453125, 10.7529296875, 11.09521484375, 11.4375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 15.0, 14.0, 26.0, 35.0, 44.0, 69.0, 75.0, 102.0, 95.0, 131.0, 118.0, 75.0, 55.0, 45.0, 29.0, 22.0, 19.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.0133056640625, -6.760986328125, -6.5086669921875, -6.25634765625, -6.0040283203125, -5.751708984375, -5.4993896484375, -5.2470703125, -4.9947509765625, -4.742431640625, -4.4901123046875, -4.23779296875, -3.9854736328125, -3.733154296875, -3.4808349609375, -3.228515625, -2.9761962890625, -2.723876953125, -2.4715576171875, -2.21923828125, -1.9669189453125, -1.714599609375, -1.4622802734375, -1.2099609375, -0.9576416015625, -0.705322265625, -0.4530029296875, -0.20068359375, 0.0516357421875, 0.303955078125, 0.5562744140625, 0.80859375, 1.0609130859375, 1.313232421875, 1.5655517578125, 1.81787109375, 2.0701904296875, 2.322509765625, 2.5748291015625, 2.8271484375, 3.0794677734375, 3.331787109375, 3.5841064453125, 3.83642578125, 4.0887451171875, 4.341064453125, 4.5933837890625, 4.845703125, 5.0980224609375, 5.350341796875, 5.6026611328125, 5.85498046875, 6.1072998046875, 6.359619140625, 6.6119384765625, 6.8642578125, 7.1165771484375, 7.368896484375, 7.6212158203125, 7.87353515625, 8.1258544921875, 8.378173828125, 8.6304931640625, 8.8828125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 9.0, 7.0, 15.0, 22.0, 35.0, 51.0, 143.0, 269.0, 216.0, 103.0, 44.0, 25.0, 19.0, 9.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.60899353027344, -132.98910522460938, -128.36923217773438, -123.74935150146484, -119.12947082519531, -114.50958251953125, -109.88970184326172, -105.26982116699219, -100.64994049072266, -96.03005981445312, -91.4101791381836, -86.79029846191406, -82.17041015625, -77.550537109375, -72.93064880371094, -68.3107681274414, -63.690887451171875, -59.071006774902344, -54.45112609863281, -49.831241607666016, -45.211360931396484, -40.59148025512695, -35.971595764160156, -31.351715087890625, -26.731834411621094, -22.111953735351562, -17.4920711517334, -12.87218952178955, -8.252307891845703, -3.632427215576172, 0.9874553680419922, 5.607337951660156, 10.22723388671875, 14.847115516662598, 19.466997146606445, 24.08687973022461, 28.70676040649414, 33.32664108276367, 37.94652557373047, 42.56640625, 47.18628692626953, 51.80616760253906, 56.426048278808594, 61.04593276977539, 65.66581726074219, 70.28569030761719, 74.90557861328125, 79.52545928955078, 84.14533996582031, 88.76522064208984, 93.38510131835938, 98.0049819946289, 102.62486267089844, 107.2447509765625, 111.86463165283203, 116.48451232910156, 121.1043930053711, 125.72427368164062, 130.3441619873047, 134.9640350341797, 139.58392333984375, 144.20379638671875, 148.8236846923828, 153.44357299804688, 158.06344604492188]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 11.0, 6.0, 18.0, 22.0, 50.0, 82.0, 105.0, 137.0, 145.0, 136.0, 96.0, 56.0, 27.0, 21.0, 16.0, 11.0, 7.0, 9.0, 4.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-210.1232147216797, -204.0203399658203, -197.91744995117188, -191.8145751953125, -185.71168518066406, -179.6088104248047, -173.50592041015625, -167.40304565429688, -161.3001708984375, -155.19729614257812, -149.0944061279297, -142.9915313720703, -136.88864135742188, -130.7857666015625, -124.6828842163086, -118.58000183105469, -112.47711181640625, -106.37422943115234, -100.27134704589844, -94.16847229003906, -88.06558227539062, -81.96270751953125, -75.85982513427734, -69.75694274902344, -63.65406036376953, -57.551177978515625, -51.44829559326172, -45.34541702270508, -39.24253463745117, -33.139652252197266, -27.036773681640625, -20.93389129638672, -14.831024169921875, -8.728142738342285, -2.6252613067626953, 3.477619171142578, 9.580501556396484, 15.68338394165039, 21.78626251220703, 27.889144897460938, 33.992027282714844, 40.09490966796875, 46.197792053222656, 52.3006706237793, 58.4035530090332, 64.50643920898438, 70.60931396484375, 76.71219635009766, 82.81507873535156, 88.91796112060547, 95.02084350585938, 101.12371826171875, 107.22660827636719, 113.32948303222656, 119.43236541748047, 125.53524780273438, 131.63812255859375, 137.74099731445312, 143.84388732910156, 149.94676208496094, 156.04965209960938, 162.15252685546875, 168.25540161132812, 174.35829162597656, 180.461181640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 4.0, 9.0, 9.0, 10.0, 19.0, 37.0, 52.0, 93.0, 176.0, 299.0, 582.0, 1175.0, 2738.0, 7303.0, 24075.0, 124118.0, 3645417.0, 327120.0, 41793.0, 11115.0, 4023.0, 1818.0, 903.0, 532.0, 279.0, 159.0, 126.0, 81.0, 52.0, 39.0, 27.0, 20.0, 23.0, 13.0, 16.0, 4.0, 10.0, 1.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.6875, -35.2021484375, -33.716796875, -32.2314453125, -30.74609375, -29.2607421875, -27.775390625, -26.2900390625, -24.8046875, -23.3193359375, -21.833984375, -20.3486328125, -18.86328125, -17.3779296875, -15.892578125, -14.4072265625, -12.921875, -11.4365234375, -9.951171875, -8.4658203125, -6.98046875, -5.4951171875, -4.009765625, -2.5244140625, -1.0390625, 0.4462890625, 1.931640625, 3.4169921875, 4.90234375, 6.3876953125, 7.873046875, 9.3583984375, 10.84375, 12.3291015625, 13.814453125, 15.2998046875, 16.78515625, 18.2705078125, 19.755859375, 21.2412109375, 22.7265625, 24.2119140625, 25.697265625, 27.1826171875, 28.66796875, 30.1533203125, 31.638671875, 33.1240234375, 34.609375, 36.0947265625, 37.580078125, 39.0654296875, 40.55078125, 42.0361328125, 43.521484375, 45.0068359375, 46.4921875, 47.9775390625, 49.462890625, 50.9482421875, 52.43359375, 53.9189453125, 55.404296875, 56.8896484375, 58.375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 9.0, 10.0, 6.0, 18.0, 14.0, 27.0, 44.0, 43.0, 55.0, 63.0, 93.0, 75.0, 88.0, 80.0, 78.0, 70.0, 54.0, 38.0, 25.0, 33.0, 13.0, 7.0, 8.0, 13.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.880859375, -1.79681396484375, -1.7127685546875, -1.62872314453125, -1.544677734375, -1.46063232421875, -1.3765869140625, -1.29254150390625, -1.20849609375, -1.12445068359375, -1.0404052734375, -0.95635986328125, -0.872314453125, -0.78826904296875, -0.7042236328125, -0.62017822265625, -0.5361328125, -0.45208740234375, -0.3680419921875, -0.28399658203125, -0.199951171875, -0.11590576171875, -0.0318603515625, 0.05218505859375, 0.13623046875, 0.22027587890625, 0.3043212890625, 0.38836669921875, 0.472412109375, 0.55645751953125, 0.6405029296875, 0.72454833984375, 0.80859375, 0.89263916015625, 0.9766845703125, 1.06072998046875, 1.144775390625, 1.22882080078125, 1.3128662109375, 1.39691162109375, 1.48095703125, 1.56500244140625, 1.6490478515625, 1.73309326171875, 1.817138671875, 1.90118408203125, 1.9852294921875, 2.06927490234375, 2.1533203125, 2.23736572265625, 2.3214111328125, 2.40545654296875, 2.489501953125, 2.57354736328125, 2.6575927734375, 2.74163818359375, 2.82568359375, 2.90972900390625, 2.9937744140625, 3.07781982421875, 3.161865234375, 3.24591064453125, 3.3299560546875, 3.41400146484375, 3.498046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 13.0, 6.0, 12.0, 13.0, 20.0, 24.0, 44.0, 86.0, 83.0, 132.0, 217.0, 330.0, 532.0, 917.0, 1527.0, 3015.0, 6192.0, 14269.0, 37039.0, 115990.0, 528724.0, 2986614.0, 356639.0, 88909.0, 29769.0, 11808.0, 5148.0, 2556.0, 1441.0, 851.0, 445.0, 335.0, 191.0, 111.0, 84.0, 51.0, 33.0, 27.0, 24.0, 17.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.4375, -26.53466796875, -25.6318359375, -24.72900390625, -23.826171875, -22.92333984375, -22.0205078125, -21.11767578125, -20.21484375, -19.31201171875, -18.4091796875, -17.50634765625, -16.603515625, -15.70068359375, -14.7978515625, -13.89501953125, -12.9921875, -12.08935546875, -11.1865234375, -10.28369140625, -9.380859375, -8.47802734375, -7.5751953125, -6.67236328125, -5.76953125, -4.86669921875, -3.9638671875, -3.06103515625, -2.158203125, -1.25537109375, -0.3525390625, 0.55029296875, 1.453125, 2.35595703125, 3.2587890625, 4.16162109375, 5.064453125, 5.96728515625, 6.8701171875, 7.77294921875, 8.67578125, 9.57861328125, 10.4814453125, 11.38427734375, 12.287109375, 13.18994140625, 14.0927734375, 14.99560546875, 15.8984375, 16.80126953125, 17.7041015625, 18.60693359375, 19.509765625, 20.41259765625, 21.3154296875, 22.21826171875, 23.12109375, 24.02392578125, 24.9267578125, 25.82958984375, 26.732421875, 27.63525390625, 28.5380859375, 29.44091796875, 30.34375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 13.0, 16.0, 15.0, 37.0, 27.0, 64.0, 107.0, 191.0, 338.0, 809.0, 1535.0, 336.0, 205.0, 101.0, 116.0, 46.0, 40.0, 12.0, 17.0, 14.0, 6.0, 8.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.54052734375, -6.3232421875, -6.10595703125, -5.888671875, -5.67138671875, -5.4541015625, -5.23681640625, -5.01953125, -4.80224609375, -4.5849609375, -4.36767578125, -4.150390625, -3.93310546875, -3.7158203125, -3.49853515625, -3.28125, -3.06396484375, -2.8466796875, -2.62939453125, -2.412109375, -2.19482421875, -1.9775390625, -1.76025390625, -1.54296875, -1.32568359375, -1.1083984375, -0.89111328125, -0.673828125, -0.45654296875, -0.2392578125, -0.02197265625, 0.1953125, 0.41259765625, 0.6298828125, 0.84716796875, 1.064453125, 1.28173828125, 1.4990234375, 1.71630859375, 1.93359375, 2.15087890625, 2.3681640625, 2.58544921875, 2.802734375, 3.02001953125, 3.2373046875, 3.45458984375, 3.671875, 3.88916015625, 4.1064453125, 4.32373046875, 4.541015625, 4.75830078125, 4.9755859375, 5.19287109375, 5.41015625, 5.62744140625, 5.8447265625, 6.06201171875, 6.279296875, 6.49658203125, 6.7138671875, 6.93115234375, 7.1484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 11.0, 16.0, 25.0, 44.0, 71.0, 132.0, 181.0, 164.0, 132.0, 102.0, 55.0, 31.0, 15.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.51515579223633, -50.81681442260742, -49.11847686767578, -47.420135498046875, -45.721797943115234, -44.02345657348633, -42.32511901855469, -40.62677764892578, -38.928436279296875, -37.23009490966797, -35.53175735473633, -33.83341598510742, -32.13507843017578, -30.436737060546875, -28.7383975982666, -27.040058135986328, -25.341718673706055, -23.64337921142578, -21.945039749145508, -20.246700286865234, -18.548358917236328, -16.850019454956055, -15.151679992675781, -13.453339576721191, -11.755000114440918, -10.056660652160645, -8.358320236206055, -6.659980773925781, -4.96164083480835, -3.263300895690918, -1.5649614334106445, 0.1333789825439453, 1.8317184448242188, 3.5300583839416504, 5.228398323059082, 6.9267377853393555, 8.625078201293945, 10.323417663574219, 12.021757125854492, 13.720097541809082, 15.418437004089355, 17.116777420043945, 18.81511688232422, 20.513456344604492, 22.211795806884766, 23.910137176513672, 25.608474731445312, 27.30681610107422, 29.005155563354492, 30.703495025634766, 32.40183639526367, 34.10017395019531, 35.79851531982422, 37.496856689453125, 39.195194244384766, 40.89353561401367, 42.59187316894531, 44.29021453857422, 45.98855209350586, 47.686893463134766, 49.385231018066406, 51.08357238769531, 52.78191375732422, 54.48025131225586, 56.178592681884766]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 8.0, 8.0, 10.0, 15.0, 13.0, 17.0, 21.0, 29.0, 27.0, 42.0, 47.0, 56.0, 69.0, 90.0, 47.0, 69.0, 55.0, 61.0, 55.0, 46.0, 40.0, 36.0, 22.0, 25.0, 23.0, 15.0, 9.0, 10.0, 7.0, 10.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.689048767089844, -21.85130500793457, -21.013561248779297, -20.175819396972656, -19.338075637817383, -18.50033187866211, -17.66259002685547, -16.824846267700195, -15.987102508544922, -15.149358749389648, -14.311615943908691, -13.473873138427734, -12.636129379272461, -11.798385620117188, -10.96064281463623, -10.122900009155273, -9.28515625, -8.447412490844727, -7.6096696853637695, -6.771926403045654, -5.934183120727539, -5.096439838409424, -4.258696556091309, -3.4209532737731934, -2.583209991455078, -1.745466709136963, -0.9077234268188477, -0.06998014450073242, 0.7677631378173828, 1.605506420135498, 2.4432497024536133, 3.2809929847717285, 4.118736267089844, 4.956479549407959, 5.794222831726074, 6.6319661140441895, 7.469709396362305, 8.307453155517578, 9.145195960998535, 9.982938766479492, 10.820682525634766, 11.658426284790039, 12.496169090270996, 13.333911895751953, 14.171655654907227, 15.0093994140625, 15.847142219543457, 16.684885025024414, 17.522628784179688, 18.36037254333496, 19.198116302490234, 20.035858154296875, 20.87360191345215, 21.711345672607422, 22.549087524414062, 23.386831283569336, 24.22457504272461, 25.062318801879883, 25.900062561035156, 26.737804412841797, 27.57554817199707, 28.413291931152344, 29.251033782958984, 30.088777542114258, 30.92652130126953]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 12.0, 32.0, 41.0, 60.0, 102.0, 156.0, 291.0, 580.0, 973.0, 1994.0, 4499.0, 10806.0, 31788.0, 120404.0, 537246.0, 254247.0, 55803.0, 17091.0, 6581.0, 2801.0, 1383.0, 711.0, 369.0, 216.0, 125.0, 83.0, 43.0, 34.0, 15.0, 10.0, 9.0, 6.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.484375, -26.66943359375, -25.8544921875, -25.03955078125, -24.224609375, -23.40966796875, -22.5947265625, -21.77978515625, -20.96484375, -20.14990234375, -19.3349609375, -18.52001953125, -17.705078125, -16.89013671875, -16.0751953125, -15.26025390625, -14.4453125, -13.63037109375, -12.8154296875, -12.00048828125, -11.185546875, -10.37060546875, -9.5556640625, -8.74072265625, -7.92578125, -7.11083984375, -6.2958984375, -5.48095703125, -4.666015625, -3.85107421875, -3.0361328125, -2.22119140625, -1.40625, -0.59130859375, 0.2236328125, 1.03857421875, 1.853515625, 2.66845703125, 3.4833984375, 4.29833984375, 5.11328125, 5.92822265625, 6.7431640625, 7.55810546875, 8.373046875, 9.18798828125, 10.0029296875, 10.81787109375, 11.6328125, 12.44775390625, 13.2626953125, 14.07763671875, 14.892578125, 15.70751953125, 16.5224609375, 17.33740234375, 18.15234375, 18.96728515625, 19.7822265625, 20.59716796875, 21.412109375, 22.22705078125, 23.0419921875, 23.85693359375, 24.671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 8.0, 5.0, 13.0, 15.0, 26.0, 27.0, 26.0, 39.0, 52.0, 55.0, 58.0, 68.0, 54.0, 60.0, 79.0, 71.0, 56.0, 52.0, 42.0, 34.0, 33.0, 25.0, 26.0, 19.0, 12.0, 10.0, 6.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1875, -2.1134033203125, -2.039306640625, -1.9652099609375, -1.89111328125, -1.8170166015625, -1.742919921875, -1.6688232421875, -1.5947265625, -1.5206298828125, -1.446533203125, -1.3724365234375, -1.29833984375, -1.2242431640625, -1.150146484375, -1.0760498046875, -1.001953125, -0.9278564453125, -0.853759765625, -0.7796630859375, -0.70556640625, -0.6314697265625, -0.557373046875, -0.4832763671875, -0.4091796875, -0.3350830078125, -0.260986328125, -0.1868896484375, -0.11279296875, -0.0386962890625, 0.035400390625, 0.1094970703125, 0.18359375, 0.2576904296875, 0.331787109375, 0.4058837890625, 0.47998046875, 0.5540771484375, 0.628173828125, 0.7022705078125, 0.7763671875, 0.8504638671875, 0.924560546875, 0.9986572265625, 1.07275390625, 1.1468505859375, 1.220947265625, 1.2950439453125, 1.369140625, 1.4432373046875, 1.517333984375, 1.5914306640625, 1.66552734375, 1.7396240234375, 1.813720703125, 1.8878173828125, 1.9619140625, 2.0360107421875, 2.110107421875, 2.1842041015625, 2.25830078125, 2.3323974609375, 2.406494140625, 2.4805908203125, 2.5546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 25.0, 28.0, 45.0, 49.0, 85.0, 99.0, 159.0, 257.0, 451.0, 646.0, 1096.0, 1795.0, 3093.0, 5644.0, 11431.0, 25399.0, 67262.0, 220980.0, 439017.0, 174086.0, 54710.0, 21041.0, 9482.0, 4790.0, 2750.0, 1579.0, 927.0, 576.0, 358.0, 213.0, 163.0, 90.0, 71.0, 45.0, 26.0, 25.0, 15.0, 18.0, 6.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.3828125, -13.93896484375, -13.4951171875, -13.05126953125, -12.607421875, -12.16357421875, -11.7197265625, -11.27587890625, -10.83203125, -10.38818359375, -9.9443359375, -9.50048828125, -9.056640625, -8.61279296875, -8.1689453125, -7.72509765625, -7.28125, -6.83740234375, -6.3935546875, -5.94970703125, -5.505859375, -5.06201171875, -4.6181640625, -4.17431640625, -3.73046875, -3.28662109375, -2.8427734375, -2.39892578125, -1.955078125, -1.51123046875, -1.0673828125, -0.62353515625, -0.1796875, 0.26416015625, 0.7080078125, 1.15185546875, 1.595703125, 2.03955078125, 2.4833984375, 2.92724609375, 3.37109375, 3.81494140625, 4.2587890625, 4.70263671875, 5.146484375, 5.59033203125, 6.0341796875, 6.47802734375, 6.921875, 7.36572265625, 7.8095703125, 8.25341796875, 8.697265625, 9.14111328125, 9.5849609375, 10.02880859375, 10.47265625, 10.91650390625, 11.3603515625, 11.80419921875, 12.248046875, 12.69189453125, 13.1357421875, 13.57958984375, 14.0234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 8.0, 10.0, 12.0, 16.0, 19.0, 17.0, 21.0, 22.0, 31.0, 39.0, 40.0, 39.0, 41.0, 58.0, 62.0, 69.0, 42.0, 55.0, 50.0, 42.0, 55.0, 30.0, 43.0, 41.0, 32.0, 22.0, 12.0, 17.0, 11.0, 15.0, 6.0, 2.0, 7.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.849853515625, -9.54345703125, -9.237060546875, -8.9306640625, -8.624267578125, -8.31787109375, -8.011474609375, -7.705078125, -7.398681640625, -7.09228515625, -6.785888671875, -6.4794921875, -6.173095703125, -5.86669921875, -5.560302734375, -5.25390625, -4.947509765625, -4.64111328125, -4.334716796875, -4.0283203125, -3.721923828125, -3.41552734375, -3.109130859375, -2.802734375, -2.496337890625, -2.18994140625, -1.883544921875, -1.5771484375, -1.270751953125, -0.96435546875, -0.657958984375, -0.3515625, -0.045166015625, 0.26123046875, 0.567626953125, 0.8740234375, 1.180419921875, 1.48681640625, 1.793212890625, 2.099609375, 2.406005859375, 2.71240234375, 3.018798828125, 3.3251953125, 3.631591796875, 3.93798828125, 4.244384765625, 4.55078125, 4.857177734375, 5.16357421875, 5.469970703125, 5.7763671875, 6.082763671875, 6.38916015625, 6.695556640625, 7.001953125, 7.308349609375, 7.61474609375, 7.921142578125, 8.2275390625, 8.533935546875, 8.84033203125, 9.146728515625, 9.453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 18.0, 14.0, 16.0, 36.0, 46.0, 100.0, 145.0, 283.0, 485.0, 986.0, 2185.0, 5365.0, 14407.0, 45120.0, 163934.0, 421548.0, 276846.0, 79425.0, 23527.0, 8024.0, 3197.0, 1414.0, 619.0, 336.0, 183.0, 109.0, 72.0, 32.0, 24.0, 14.0, 11.0, 9.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9771728515625, -10.594970703125, -10.2127685546875, -9.83056640625, -9.4483642578125, -9.066162109375, -8.6839599609375, -8.3017578125, -7.9195556640625, -7.537353515625, -7.1551513671875, -6.77294921875, -6.3907470703125, -6.008544921875, -5.6263427734375, -5.244140625, -4.8619384765625, -4.479736328125, -4.0975341796875, -3.71533203125, -3.3331298828125, -2.950927734375, -2.5687255859375, -2.1865234375, -1.8043212890625, -1.422119140625, -1.0399169921875, -0.65771484375, -0.2755126953125, 0.106689453125, 0.4888916015625, 0.87109375, 1.2532958984375, 1.635498046875, 2.0177001953125, 2.39990234375, 2.7821044921875, 3.164306640625, 3.5465087890625, 3.9287109375, 4.3109130859375, 4.693115234375, 5.0753173828125, 5.45751953125, 5.8397216796875, 6.221923828125, 6.6041259765625, 6.986328125, 7.3685302734375, 7.750732421875, 8.1329345703125, 8.51513671875, 8.8973388671875, 9.279541015625, 9.6617431640625, 10.0439453125, 10.4261474609375, 10.808349609375, 11.1905517578125, 11.57275390625, 11.9549560546875, 12.337158203125, 12.7193603515625, 13.1015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 15.0, 34.0, 67.0, 179.0, 284.0, 199.0, 106.0, 42.0, 25.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015134811401367188, -0.001452133059501648, -0.0013907849788665771, -0.0013294368982315063, -0.0012680888175964355, -0.0012067407369613647, -0.001145392656326294, -0.0010840445756912231, -0.0010226964950561523, -0.0009613484144210815, -0.0009000003337860107, -0.0008386522531509399, -0.0007773041725158691, -0.0007159560918807983, -0.0006546080112457275, -0.0005932599306106567, -0.0005319118499755859, -0.00047056376934051514, -0.00040921568870544434, -0.00034786760807037354, -0.00028651952743530273, -0.00022517144680023193, -0.00016382336616516113, -0.00010247528553009033, -4.112720489501953e-05, 2.022087574005127e-05, 8.156895637512207e-05, 0.00014291703701019287, 0.00020426511764526367, 0.00026561319828033447, 0.0003269612789154053, 0.0003883093595504761, 0.0004496574401855469, 0.0005110055208206177, 0.0005723536014556885, 0.0006337016820907593, 0.0006950497627258301, 0.0007563978433609009, 0.0008177459239959717, 0.0008790940046310425, 0.0009404420852661133, 0.001001790165901184, 0.0010631382465362549, 0.0011244863271713257, 0.0011858344078063965, 0.0012471824884414673, 0.001308530569076538, 0.0013698786497116089, 0.0014312267303466797, 0.0014925748109817505, 0.0015539228916168213, 0.001615270972251892, 0.0016766190528869629, 0.0017379671335220337, 0.0017993152141571045, 0.0018606632947921753, 0.001922011375427246, 0.001983359456062317, 0.0020447075366973877, 0.0021060556173324585, 0.0021674036979675293, 0.0022287517786026, 0.002290099859237671, 0.0023514479398727417, 0.0024127960205078125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 27.0, 45.0, 32.0, 66.0, 126.0, 199.0, 355.0, 593.0, 1073.0, 1964.0, 3501.0, 6765.0, 13617.0, 28553.0, 63608.0, 137257.0, 247745.0, 259705.0, 151186.0, 69627.0, 31577.0, 15014.0, 7306.0, 3803.0, 2039.0, 1136.0, 655.0, 404.0, 209.0, 117.0, 89.0, 54.0, 30.0, 26.0, 8.0, 12.0, 6.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.72265625, -7.4818115234375, -7.240966796875, -7.0001220703125, -6.75927734375, -6.5184326171875, -6.277587890625, -6.0367431640625, -5.7958984375, -5.5550537109375, -5.314208984375, -5.0733642578125, -4.83251953125, -4.5916748046875, -4.350830078125, -4.1099853515625, -3.869140625, -3.6282958984375, -3.387451171875, -3.1466064453125, -2.90576171875, -2.6649169921875, -2.424072265625, -2.1832275390625, -1.9423828125, -1.7015380859375, -1.460693359375, -1.2198486328125, -0.97900390625, -0.7381591796875, -0.497314453125, -0.2564697265625, -0.015625, 0.2252197265625, 0.466064453125, 0.7069091796875, 0.94775390625, 1.1885986328125, 1.429443359375, 1.6702880859375, 1.9111328125, 2.1519775390625, 2.392822265625, 2.6336669921875, 2.87451171875, 3.1153564453125, 3.356201171875, 3.5970458984375, 3.837890625, 4.0787353515625, 4.319580078125, 4.5604248046875, 4.80126953125, 5.0421142578125, 5.282958984375, 5.5238037109375, 5.7646484375, 6.0054931640625, 6.246337890625, 6.4871826171875, 6.72802734375, 6.9688720703125, 7.209716796875, 7.4505615234375, 7.69140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 9.0, 8.0, 25.0, 17.0, 19.0, 22.0, 26.0, 37.0, 61.0, 48.0, 76.0, 59.0, 71.0, 53.0, 64.0, 54.0, 72.0, 46.0, 44.0, 33.0, 29.0, 27.0, 17.0, 17.0, 12.0, 11.0, 7.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.491455078125, -6.30322265625, -6.114990234375, -5.9267578125, -5.738525390625, -5.55029296875, -5.362060546875, -5.173828125, -4.985595703125, -4.79736328125, -4.609130859375, -4.4208984375, -4.232666015625, -4.04443359375, -3.856201171875, -3.66796875, -3.479736328125, -3.29150390625, -3.103271484375, -2.9150390625, -2.726806640625, -2.53857421875, -2.350341796875, -2.162109375, -1.973876953125, -1.78564453125, -1.597412109375, -1.4091796875, -1.220947265625, -1.03271484375, -0.844482421875, -0.65625, -0.468017578125, -0.27978515625, -0.091552734375, 0.0966796875, 0.284912109375, 0.47314453125, 0.661376953125, 0.849609375, 1.037841796875, 1.22607421875, 1.414306640625, 1.6025390625, 1.790771484375, 1.97900390625, 2.167236328125, 2.35546875, 2.543701171875, 2.73193359375, 2.920166015625, 3.1083984375, 3.296630859375, 3.48486328125, 3.673095703125, 3.861328125, 4.049560546875, 4.23779296875, 4.426025390625, 4.6142578125, 4.802490234375, 4.99072265625, 5.178955078125, 5.3671875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 16.0, 24.0, 56.0, 99.0, 154.0, 203.0, 167.0, 114.0, 72.0, 46.0, 20.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.61648559570312, -73.21717071533203, -68.81785583496094, -64.41854858398438, -60.01923370361328, -55.61991882324219, -51.22060775756836, -46.82129669189453, -42.42198181152344, -38.022666931152344, -33.623355865478516, -29.224042892456055, -24.824729919433594, -20.425416946411133, -16.026103973388672, -11.626791000366211, -7.22747802734375, -2.828165054321289, 1.5711479187011719, 5.970460891723633, 10.369773864746094, 14.769086837768555, 19.168399810791016, 23.567712783813477, 27.967025756835938, 32.36634063720703, 36.76565170288086, 41.16496276855469, 45.56427764892578, 49.963592529296875, 54.3629035949707, 58.76221466064453, 63.16154479980469, 67.56085968017578, 71.96017456054688, 76.35948181152344, 80.75879669189453, 85.15811157226562, 89.55741882324219, 93.95673370361328, 98.35604858398438, 102.75536346435547, 107.15467834472656, 111.55398559570312, 115.95330047607422, 120.35261535644531, 124.75192260742188, 129.1512451171875, 133.55055236816406, 137.94985961914062, 142.34918212890625, 146.7484893798828, 151.14779663085938, 155.547119140625, 159.94642639160156, 164.3457489013672, 168.74505615234375, 173.1443634033203, 177.54368591308594, 181.9429931640625, 186.34231567382812, 190.7416229248047, 195.14093017578125, 199.54025268554688, 203.93955993652344]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 14.0, 5.0, 16.0, 13.0, 25.0, 41.0, 40.0, 43.0, 50.0, 58.0, 67.0, 85.0, 79.0, 76.0, 77.0, 73.0, 50.0, 48.0, 43.0, 21.0, 23.0, 10.0, 8.0, 11.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.6422119140625, -83.86802673339844, -81.09383392333984, -78.31964874267578, -75.54545593261719, -72.77127075195312, -69.99708557128906, -67.22289276123047, -64.44869995117188, -61.67451095581055, -58.90032196044922, -56.126136779785156, -53.35194396972656, -50.5777587890625, -47.80356979370117, -45.029380798339844, -42.25519561767578, -39.48100662231445, -36.706817626953125, -33.93263244628906, -31.1584415435791, -28.384252548217773, -25.610065460205078, -22.83587646484375, -20.061687469482422, -17.287498474121094, -14.513310432434082, -11.73912239074707, -8.964933395385742, -6.190744400024414, -3.4165573120117188, -0.6423683166503906, 2.1318130493164062, 4.906001567840576, 7.680190086364746, 10.454378128051758, 13.228567123413086, 16.002756118774414, 18.77694320678711, 21.551132202148438, 24.325321197509766, 27.099510192871094, 29.873699188232422, 32.64788818359375, 35.42207336425781, 38.196266174316406, 40.97045135498047, 43.7446403503418, 46.518829345703125, 49.29301834106445, 52.06720733642578, 54.841392517089844, 57.61558532714844, 60.3897705078125, 63.16395950317383, 65.93814849853516, 68.71234130859375, 71.48652648925781, 74.2607192993164, 77.03490447998047, 79.80909729003906, 82.58328247070312, 85.35746765136719, 88.13166046142578, 90.90584564208984]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 17.0, 26.0, 40.0, 56.0, 92.0, 118.0, 174.0, 268.0, 392.0, 653.0, 1024.0, 1724.0, 2871.0, 4886.0, 8887.0, 16985.0, 36851.0, 101079.0, 596391.0, 3155171.0, 166823.0, 52073.0, 22255.0, 11055.0, 5760.0, 3353.0, 1957.0, 1217.0, 714.0, 453.0, 315.0, 176.0, 120.0, 89.0, 43.0, 47.0, 26.0, 29.0, 15.0, 8.0, 14.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.3125, -34.1025390625, -32.892578125, -31.6826171875, -30.47265625, -29.2626953125, -28.052734375, -26.8427734375, -25.6328125, -24.4228515625, -23.212890625, -22.0029296875, -20.79296875, -19.5830078125, -18.373046875, -17.1630859375, -15.953125, -14.7431640625, -13.533203125, -12.3232421875, -11.11328125, -9.9033203125, -8.693359375, -7.4833984375, -6.2734375, -5.0634765625, -3.853515625, -2.6435546875, -1.43359375, -0.2236328125, 0.986328125, 2.1962890625, 3.40625, 4.6162109375, 5.826171875, 7.0361328125, 8.24609375, 9.4560546875, 10.666015625, 11.8759765625, 13.0859375, 14.2958984375, 15.505859375, 16.7158203125, 17.92578125, 19.1357421875, 20.345703125, 21.5556640625, 22.765625, 23.9755859375, 25.185546875, 26.3955078125, 27.60546875, 28.8154296875, 30.025390625, 31.2353515625, 32.4453125, 33.6552734375, 34.865234375, 36.0751953125, 37.28515625, 38.4951171875, 39.705078125, 40.9150390625, 42.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 4.0, 8.0, 9.0, 20.0, 15.0, 16.0, 19.0, 21.0, 33.0, 33.0, 25.0, 26.0, 35.0, 38.0, 48.0, 59.0, 56.0, 63.0, 43.0, 53.0, 40.0, 43.0, 37.0, 40.0, 31.0, 21.0, 34.0, 23.0, 15.0, 8.0, 13.0, 16.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.787109375, -1.729949951171875, -1.67279052734375, -1.615631103515625, -1.5584716796875, -1.501312255859375, -1.44415283203125, -1.386993408203125, -1.329833984375, -1.272674560546875, -1.21551513671875, -1.158355712890625, -1.1011962890625, -1.044036865234375, -0.98687744140625, -0.929718017578125, -0.87255859375, -0.815399169921875, -0.75823974609375, -0.701080322265625, -0.6439208984375, -0.586761474609375, -0.52960205078125, -0.472442626953125, -0.415283203125, -0.358123779296875, -0.30096435546875, -0.243804931640625, -0.1866455078125, -0.129486083984375, -0.07232666015625, -0.015167236328125, 0.0419921875, 0.099151611328125, 0.15631103515625, 0.213470458984375, 0.2706298828125, 0.327789306640625, 0.38494873046875, 0.442108154296875, 0.499267578125, 0.556427001953125, 0.61358642578125, 0.670745849609375, 0.7279052734375, 0.785064697265625, 0.84222412109375, 0.899383544921875, 0.95654296875, 1.013702392578125, 1.07086181640625, 1.128021240234375, 1.1851806640625, 1.242340087890625, 1.29949951171875, 1.356658935546875, 1.413818359375, 1.470977783203125, 1.52813720703125, 1.585296630859375, 1.6424560546875, 1.699615478515625, 1.75677490234375, 1.813934326171875, 1.87109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 11.0, 16.0, 19.0, 36.0, 60.0, 82.0, 196.0, 284.0, 854.0, 4983.0, 97144.0, 3972283.0, 111388.0, 5386.0, 813.0, 300.0, 148.0, 89.0, 63.0, 42.0, 18.0, 19.0, 14.0, 9.0, 2.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-148.875, -144.296875, -139.71875, -135.140625, -130.5625, -125.984375, -121.40625, -116.828125, -112.25, -107.671875, -103.09375, -98.515625, -93.9375, -89.359375, -84.78125, -80.203125, -75.625, -71.046875, -66.46875, -61.890625, -57.3125, -52.734375, -48.15625, -43.578125, -39.0, -34.421875, -29.84375, -25.265625, -20.6875, -16.109375, -11.53125, -6.953125, -2.375, 2.203125, 6.78125, 11.359375, 15.9375, 20.515625, 25.09375, 29.671875, 34.25, 38.828125, 43.40625, 47.984375, 52.5625, 57.140625, 61.71875, 66.296875, 70.875, 75.453125, 80.03125, 84.609375, 89.1875, 93.765625, 98.34375, 102.921875, 107.5, 112.078125, 116.65625, 121.234375, 125.8125, 130.390625, 134.96875, 139.546875, 144.125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 5.0, 4.0, 13.0, 11.0, 13.0, 22.0, 34.0, 29.0, 45.0, 60.0, 92.0, 182.0, 281.0, 655.0, 1577.0, 430.0, 215.0, 113.0, 85.0, 64.0, 50.0, 33.0, 17.0, 13.0, 3.0, 7.0, 10.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.948486328125, -7.70166015625, -7.454833984375, -7.2080078125, -6.961181640625, -6.71435546875, -6.467529296875, -6.220703125, -5.973876953125, -5.72705078125, -5.480224609375, -5.2333984375, -4.986572265625, -4.73974609375, -4.492919921875, -4.24609375, -3.999267578125, -3.75244140625, -3.505615234375, -3.2587890625, -3.011962890625, -2.76513671875, -2.518310546875, -2.271484375, -2.024658203125, -1.77783203125, -1.531005859375, -1.2841796875, -1.037353515625, -0.79052734375, -0.543701171875, -0.296875, -0.050048828125, 0.19677734375, 0.443603515625, 0.6904296875, 0.937255859375, 1.18408203125, 1.430908203125, 1.677734375, 1.924560546875, 2.17138671875, 2.418212890625, 2.6650390625, 2.911865234375, 3.15869140625, 3.405517578125, 3.65234375, 3.899169921875, 4.14599609375, 4.392822265625, 4.6396484375, 4.886474609375, 5.13330078125, 5.380126953125, 5.626953125, 5.873779296875, 6.12060546875, 6.367431640625, 6.6142578125, 6.861083984375, 7.10791015625, 7.354736328125, 7.6015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 9.0, 11.0, 18.0, 30.0, 31.0, 34.0, 73.0, 94.0, 81.0, 112.0, 123.0, 103.0, 72.0, 63.0, 39.0, 42.0, 21.0, 14.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.46728515625, -58.737606048583984, -57.007930755615234, -55.27825164794922, -53.5485725402832, -51.81889343261719, -50.08921813964844, -48.35953903198242, -46.629859924316406, -44.90018081665039, -43.17050552368164, -41.440826416015625, -39.71114730834961, -37.981468200683594, -36.251792907714844, -34.52211380004883, -32.79243850708008, -31.062761306762695, -29.33308219909668, -27.603404998779297, -25.87372589111328, -24.1440486907959, -22.414371490478516, -20.6846923828125, -18.955015182495117, -17.225337982177734, -15.495658874511719, -13.765981674194336, -12.036303520202637, -10.306625366210938, -8.576948165893555, -6.8472700119018555, -5.117591857910156, -3.387913942337036, -1.658236026763916, 0.071441650390625, 1.8011198043823242, 3.5307979583740234, 5.260475158691406, 6.9901533126831055, 8.719831466674805, 10.449509620666504, 12.179187774658203, 13.908864974975586, 15.638543128967285, 17.368221282958984, 19.097898483276367, 20.82757568359375, 22.557254791259766, 24.28693199157715, 26.016611099243164, 27.746288299560547, 29.475967407226562, 31.205644607543945, 32.93532180786133, 34.665000915527344, 36.394676208496094, 38.12435531616211, 39.85403060913086, 41.583709716796875, 43.31338882446289, 45.043067932128906, 46.772743225097656, 48.50242233276367, 50.23210144042969]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 4.0, 14.0, 12.0, 12.0, 15.0, 21.0, 20.0, 35.0, 33.0, 34.0, 34.0, 45.0, 42.0, 44.0, 43.0, 45.0, 44.0, 53.0, 42.0, 64.0, 47.0, 39.0, 38.0, 35.0, 28.0, 35.0, 15.0, 19.0, 11.0, 22.0, 13.0, 5.0, 9.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.74311828613281, -36.74064254760742, -35.73816680908203, -34.735694885253906, -33.733219146728516, -32.730743408203125, -31.728269577026367, -30.72579574584961, -29.72332000732422, -28.720844268798828, -27.71837043762207, -26.715896606445312, -25.713420867919922, -24.71094512939453, -23.708471298217773, -22.705997467041016, -21.703521728515625, -20.701045989990234, -19.698572158813477, -18.69609832763672, -17.693622589111328, -16.691146850585938, -15.68867301940918, -14.686198234558105, -13.683723449707031, -12.681248664855957, -11.678773880004883, -10.676299095153809, -9.673824310302734, -8.67134952545166, -7.668874740600586, -6.666399955749512, -5.663928985595703, -4.661454200744629, -3.6589794158935547, -2.6565046310424805, -1.6540298461914062, -0.651555061340332, 0.3509197235107422, 1.3533945083618164, 2.3558692932128906, 3.358344078063965, 4.360818862915039, 5.363293647766113, 6.3657684326171875, 7.368243217468262, 8.370718002319336, 9.37319278717041, 10.375667572021484, 11.378142356872559, 12.380617141723633, 13.383091926574707, 14.385566711425781, 15.388041496276855, 16.39051628112793, 17.392990112304688, 18.395465850830078, 19.39794158935547, 20.400415420532227, 21.402889251708984, 22.405364990234375, 23.407840728759766, 24.410314559936523, 25.41278839111328, 26.415264129638672]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 16.0, 18.0, 39.0, 56.0, 66.0, 116.0, 116.0, 241.0, 316.0, 502.0, 690.0, 1103.0, 1670.0, 2628.0, 3822.0, 6118.0, 9319.0, 15378.0, 23997.0, 37458.0, 58637.0, 90336.0, 127972.0, 161209.0, 155587.0, 119964.0, 82488.0, 53889.0, 34565.0, 21601.0, 13559.0, 8912.0, 5556.0, 3642.0, 2373.0, 1516.0, 1035.0, 705.0, 439.0, 297.0, 201.0, 129.0, 83.0, 62.0, 35.0, 29.0, 16.0, 14.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.0390625, -11.6494140625, -11.259765625, -10.8701171875, -10.48046875, -10.0908203125, -9.701171875, -9.3115234375, -8.921875, -8.5322265625, -8.142578125, -7.7529296875, -7.36328125, -6.9736328125, -6.583984375, -6.1943359375, -5.8046875, -5.4150390625, -5.025390625, -4.6357421875, -4.24609375, -3.8564453125, -3.466796875, -3.0771484375, -2.6875, -2.2978515625, -1.908203125, -1.5185546875, -1.12890625, -0.7392578125, -0.349609375, 0.0400390625, 0.4296875, 0.8193359375, 1.208984375, 1.5986328125, 1.98828125, 2.3779296875, 2.767578125, 3.1572265625, 3.546875, 3.9365234375, 4.326171875, 4.7158203125, 5.10546875, 5.4951171875, 5.884765625, 6.2744140625, 6.6640625, 7.0537109375, 7.443359375, 7.8330078125, 8.22265625, 8.6123046875, 9.001953125, 9.3916015625, 9.78125, 10.1708984375, 10.560546875, 10.9501953125, 11.33984375, 11.7294921875, 12.119140625, 12.5087890625, 12.8984375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 9.0, 3.0, 7.0, 12.0, 7.0, 10.0, 16.0, 18.0, 17.0, 14.0, 27.0, 21.0, 40.0, 25.0, 28.0, 25.0, 34.0, 37.0, 34.0, 46.0, 40.0, 36.0, 46.0, 46.0, 40.0, 46.0, 54.0, 32.0, 32.0, 26.0, 27.0, 24.0, 15.0, 21.0, 17.0, 11.0, 9.0, 7.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.654296875, -1.5994720458984375, -1.544647216796875, -1.4898223876953125, -1.43499755859375, -1.3801727294921875, -1.325347900390625, -1.2705230712890625, -1.2156982421875, -1.1608734130859375, -1.106048583984375, -1.0512237548828125, -0.99639892578125, -0.9415740966796875, -0.886749267578125, -0.8319244384765625, -0.777099609375, -0.7222747802734375, -0.667449951171875, -0.6126251220703125, -0.55780029296875, -0.5029754638671875, -0.448150634765625, -0.3933258056640625, -0.3385009765625, -0.2836761474609375, -0.228851318359375, -0.1740264892578125, -0.11920166015625, -0.0643768310546875, -0.009552001953125, 0.0452728271484375, 0.10009765625, 0.1549224853515625, 0.209747314453125, 0.2645721435546875, 0.31939697265625, 0.3742218017578125, 0.429046630859375, 0.4838714599609375, 0.5386962890625, 0.5935211181640625, 0.648345947265625, 0.7031707763671875, 0.75799560546875, 0.8128204345703125, 0.867645263671875, 0.9224700927734375, 0.977294921875, 1.0321197509765625, 1.086944580078125, 1.1417694091796875, 1.19659423828125, 1.2514190673828125, 1.306243896484375, 1.3610687255859375, 1.4158935546875, 1.4707183837890625, 1.525543212890625, 1.5803680419921875, 1.63519287109375, 1.6900177001953125, 1.744842529296875, 1.7996673583984375, 1.8544921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 12.0, 17.0, 33.0, 78.0, 117.0, 217.0, 474.0, 921.0, 2161.0, 5920.0, 19335.0, 78743.0, 295138.0, 436053.0, 154275.0, 38271.0, 10418.0, 3493.0, 1456.0, 676.0, 355.0, 169.0, 75.0, 52.0, 24.0, 23.0, 11.0, 10.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.451171875, -37.08984375, -35.728515625, -34.3671875, -33.005859375, -31.64453125, -30.283203125, -28.921875, -27.560546875, -26.19921875, -24.837890625, -23.4765625, -22.115234375, -20.75390625, -19.392578125, -18.03125, -16.669921875, -15.30859375, -13.947265625, -12.5859375, -11.224609375, -9.86328125, -8.501953125, -7.140625, -5.779296875, -4.41796875, -3.056640625, -1.6953125, -0.333984375, 1.02734375, 2.388671875, 3.75, 5.111328125, 6.47265625, 7.833984375, 9.1953125, 10.556640625, 11.91796875, 13.279296875, 14.640625, 16.001953125, 17.36328125, 18.724609375, 20.0859375, 21.447265625, 22.80859375, 24.169921875, 25.53125, 26.892578125, 28.25390625, 29.615234375, 30.9765625, 32.337890625, 33.69921875, 35.060546875, 36.421875, 37.783203125, 39.14453125, 40.505859375, 41.8671875, 43.228515625, 44.58984375, 45.951171875, 47.3125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 10.0, 5.0, 4.0, 8.0, 14.0, 10.0, 14.0, 16.0, 15.0, 28.0, 23.0, 35.0, 29.0, 44.0, 40.0, 28.0, 44.0, 45.0, 47.0, 47.0, 53.0, 44.0, 42.0, 32.0, 48.0, 37.0, 29.0, 26.0, 44.0, 22.0, 19.0, 19.0, 13.0, 12.0, 10.0, 12.0, 7.0, 6.0, 7.0, 9.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.8984375, -13.4517822265625, -13.005126953125, -12.5584716796875, -12.11181640625, -11.6651611328125, -11.218505859375, -10.7718505859375, -10.3251953125, -9.8785400390625, -9.431884765625, -8.9852294921875, -8.53857421875, -8.0919189453125, -7.645263671875, -7.1986083984375, -6.751953125, -6.3052978515625, -5.858642578125, -5.4119873046875, -4.96533203125, -4.5186767578125, -4.072021484375, -3.6253662109375, -3.1787109375, -2.7320556640625, -2.285400390625, -1.8387451171875, -1.39208984375, -0.9454345703125, -0.498779296875, -0.0521240234375, 0.39453125, 0.8411865234375, 1.287841796875, 1.7344970703125, 2.18115234375, 2.6278076171875, 3.074462890625, 3.5211181640625, 3.9677734375, 4.4144287109375, 4.861083984375, 5.3077392578125, 5.75439453125, 6.2010498046875, 6.647705078125, 7.0943603515625, 7.541015625, 7.9876708984375, 8.434326171875, 8.8809814453125, 9.32763671875, 9.7742919921875, 10.220947265625, 10.6676025390625, 11.1142578125, 11.5609130859375, 12.007568359375, 12.4542236328125, 12.90087890625, 13.3475341796875, 13.794189453125, 14.2408447265625, 14.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 13.0, 16.0, 15.0, 22.0, 35.0, 63.0, 111.0, 136.0, 192.0, 285.0, 480.0, 852.0, 1476.0, 2860.0, 5851.0, 14101.0, 43576.0, 213277.0, 548535.0, 159010.0, 34637.0, 11927.0, 5161.0, 2532.0, 1331.0, 796.0, 431.0, 295.0, 171.0, 129.0, 60.0, 53.0, 30.0, 21.0, 21.0, 11.0, 15.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.21875, -34.09765625, -32.9765625, -31.85546875, -30.734375, -29.61328125, -28.4921875, -27.37109375, -26.25, -25.12890625, -24.0078125, -22.88671875, -21.765625, -20.64453125, -19.5234375, -18.40234375, -17.28125, -16.16015625, -15.0390625, -13.91796875, -12.796875, -11.67578125, -10.5546875, -9.43359375, -8.3125, -7.19140625, -6.0703125, -4.94921875, -3.828125, -2.70703125, -1.5859375, -0.46484375, 0.65625, 1.77734375, 2.8984375, 4.01953125, 5.140625, 6.26171875, 7.3828125, 8.50390625, 9.625, 10.74609375, 11.8671875, 12.98828125, 14.109375, 15.23046875, 16.3515625, 17.47265625, 18.59375, 19.71484375, 20.8359375, 21.95703125, 23.078125, 24.19921875, 25.3203125, 26.44140625, 27.5625, 28.68359375, 29.8046875, 30.92578125, 32.046875, 33.16796875, 34.2890625, 35.41015625, 36.53125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 4.0, 12.0, 12.0, 18.0, 25.0, 20.0, 41.0, 24.0, 48.0, 57.0, 101.0, 104.0, 95.0, 104.0, 83.0, 54.0, 49.0, 36.0, 26.0, 22.0, 11.0, 12.0, 11.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003467559814453125, -0.0033602118492126465, -0.003252863883972168, -0.0031455159187316895, -0.003038167953491211, -0.0029308199882507324, -0.002823472023010254, -0.0027161240577697754, -0.002608776092529297, -0.0025014281272888184, -0.00239408016204834, -0.0022867321968078613, -0.002179384231567383, -0.0020720362663269043, -0.0019646883010864258, -0.0018573403358459473, -0.0017499923706054688, -0.0016426444053649902, -0.0015352964401245117, -0.0014279484748840332, -0.0013206005096435547, -0.0012132525444030762, -0.0011059045791625977, -0.0009985566139221191, -0.0008912086486816406, -0.0007838606834411621, -0.0006765127182006836, -0.0005691647529602051, -0.00046181678771972656, -0.00035446882247924805, -0.00024712085723876953, -0.00013977289199829102, -3.24249267578125e-05, 7.492303848266602e-05, 0.00018227100372314453, 0.00028961896896362305, 0.00039696693420410156, 0.0005043148994445801, 0.0006116628646850586, 0.0007190108299255371, 0.0008263587951660156, 0.0009337067604064941, 0.0010410547256469727, 0.0011484026908874512, 0.0012557506561279297, 0.0013630986213684082, 0.0014704465866088867, 0.0015777945518493652, 0.0016851425170898438, 0.0017924904823303223, 0.0018998384475708008, 0.0020071864128112793, 0.002114534378051758, 0.0022218823432922363, 0.002329230308532715, 0.0024365782737731934, 0.002543926239013672, 0.0026512742042541504, 0.002758622169494629, 0.0028659701347351074, 0.002973318099975586, 0.0030806660652160645, 0.003188014030456543, 0.0032953619956970215, 0.0034027099609375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 12.0, 17.0, 14.0, 21.0, 39.0, 43.0, 75.0, 107.0, 167.0, 229.0, 337.0, 519.0, 784.0, 1233.0, 1957.0, 3273.0, 5628.0, 10962.0, 24009.0, 65414.0, 225534.0, 424839.0, 185259.0, 54398.0, 20570.0, 9696.0, 5193.0, 2972.0, 1837.0, 1150.0, 723.0, 481.0, 297.0, 229.0, 135.0, 128.0, 67.0, 44.0, 32.0, 39.0, 20.0, 14.0, 5.0, 5.0, 9.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-24.875, -24.130615234375, -23.38623046875, -22.641845703125, -21.8974609375, -21.153076171875, -20.40869140625, -19.664306640625, -18.919921875, -18.175537109375, -17.43115234375, -16.686767578125, -15.9423828125, -15.197998046875, -14.45361328125, -13.709228515625, -12.96484375, -12.220458984375, -11.47607421875, -10.731689453125, -9.9873046875, -9.242919921875, -8.49853515625, -7.754150390625, -7.009765625, -6.265380859375, -5.52099609375, -4.776611328125, -4.0322265625, -3.287841796875, -2.54345703125, -1.799072265625, -1.0546875, -0.310302734375, 0.43408203125, 1.178466796875, 1.9228515625, 2.667236328125, 3.41162109375, 4.156005859375, 4.900390625, 5.644775390625, 6.38916015625, 7.133544921875, 7.8779296875, 8.622314453125, 9.36669921875, 10.111083984375, 10.85546875, 11.599853515625, 12.34423828125, 13.088623046875, 13.8330078125, 14.577392578125, 15.32177734375, 16.066162109375, 16.810546875, 17.554931640625, 18.29931640625, 19.043701171875, 19.7880859375, 20.532470703125, 21.27685546875, 22.021240234375, 22.765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 0.0, 3.0, 4.0, 5.0, 10.0, 7.0, 5.0, 21.0, 14.0, 22.0, 44.0, 41.0, 50.0, 68.0, 78.0, 101.0, 99.0, 96.0, 81.0, 47.0, 48.0, 26.0, 26.0, 20.0, 18.0, 7.0, 14.0, 7.0, 6.0, 2.0, 5.0, 4.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.40625, -15.894287109375, -15.38232421875, -14.870361328125, -14.3583984375, -13.846435546875, -13.33447265625, -12.822509765625, -12.310546875, -11.798583984375, -11.28662109375, -10.774658203125, -10.2626953125, -9.750732421875, -9.23876953125, -8.726806640625, -8.21484375, -7.702880859375, -7.19091796875, -6.678955078125, -6.1669921875, -5.655029296875, -5.14306640625, -4.631103515625, -4.119140625, -3.607177734375, -3.09521484375, -2.583251953125, -2.0712890625, -1.559326171875, -1.04736328125, -0.535400390625, -0.0234375, 0.488525390625, 1.00048828125, 1.512451171875, 2.0244140625, 2.536376953125, 3.04833984375, 3.560302734375, 4.072265625, 4.584228515625, 5.09619140625, 5.608154296875, 6.1201171875, 6.632080078125, 7.14404296875, 7.656005859375, 8.16796875, 8.679931640625, 9.19189453125, 9.703857421875, 10.2158203125, 10.727783203125, 11.23974609375, 11.751708984375, 12.263671875, 12.775634765625, 13.28759765625, 13.799560546875, 14.3115234375, 14.823486328125, 15.33544921875, 15.847412109375, 16.359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 12.0, 18.0, 31.0, 87.0, 113.0, 168.0, 199.0, 177.0, 87.0, 53.0, 23.0, 11.0, 8.0, 4.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.0165252685547, -177.53866577148438, -166.06082153320312, -154.5829620361328, -143.10511779785156, -131.62725830078125, -120.14940643310547, -108.67155456542969, -97.1937026977539, -85.71585083007812, -74.23799896240234, -62.7601432800293, -51.282291412353516, -39.804439544677734, -28.326583862304688, -16.848731994628906, -5.370880126953125, 6.106972694396973, 17.58482551574707, 29.062679290771484, 40.540531158447266, 52.01838302612305, 63.496238708496094, 74.97409057617188, 86.45194244384766, 97.92979431152344, 109.40764617919922, 120.885498046875, 132.3633575439453, 143.84120178222656, 155.31906127929688, 166.79690551757812, 178.27474975585938, 189.7526092529297, 201.23045349121094, 212.70831298828125, 224.1861572265625, 235.6640167236328, 247.14187622070312, 258.6197204589844, 270.0975646972656, 281.5754089355469, 293.05328369140625, 304.5311279296875, 316.00897216796875, 327.48681640625, 338.9646911621094, 350.4425354003906, 361.92041015625, 373.39825439453125, 384.8761291503906, 396.3539733886719, 407.8318176269531, 419.3096618652344, 430.78753662109375, 442.265380859375, 453.74322509765625, 465.2210693359375, 476.6989440917969, 488.1767883300781, 499.6546325683594, 511.1324768066406, 522.6103515625, 534.0881958007812, 545.5660400390625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 13.0, 17.0, 19.0, 28.0, 38.0, 38.0, 47.0, 41.0, 65.0, 78.0, 71.0, 88.0, 65.0, 68.0, 64.0, 57.0, 43.0, 43.0, 29.0, 20.0, 16.0, 14.0, 9.0, 14.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.1793975830078, -173.3857421875, -167.59210205078125, -161.79844665527344, -156.0048065185547, -150.21115112304688, -144.41751098632812, -138.6238555908203, -132.8302001953125, -127.03655242919922, -121.24290466308594, -115.44924926757812, -109.65560913085938, -103.86195373535156, -98.06830596923828, -92.274658203125, -86.48101806640625, -80.68737030029297, -74.89372253417969, -69.10006713867188, -63.30642318725586, -57.51277542114258, -51.71912384033203, -45.92547607421875, -40.13182830810547, -34.33818054199219, -28.544530868530273, -22.75088119506836, -16.957233428955078, -11.163585662841797, -5.36993408203125, 0.42371368408203125, 6.21734619140625, 12.010994911193848, 17.804643630981445, 23.59829330444336, 29.39194107055664, 35.18558883666992, 40.97924041748047, 46.77288818359375, 52.56653594970703, 58.36018371582031, 64.1538314819336, 69.94747924804688, 75.74113464355469, 81.53477478027344, 87.32843017578125, 93.12207794189453, 98.91572570800781, 104.7093734741211, 110.50302124023438, 116.29667663574219, 122.09031677246094, 127.88397216796875, 133.6776123046875, 139.4712677001953, 145.26492309570312, 151.05857849121094, 156.8522186279297, 162.6458740234375, 168.43951416015625, 174.23316955566406, 180.02682495117188, 185.82046508789062, 191.61410522460938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 10.0, 17.0, 17.0, 33.0, 67.0, 88.0, 194.0, 597.0, 2413.0, 18610.0, 538328.0, 3598158.0, 31366.0, 3367.0, 572.0, 191.0, 89.0, 60.0, 40.0, 24.0, 17.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.125, -150.14453125, -144.1640625, -138.18359375, -132.203125, -126.22265625, -120.2421875, -114.26171875, -108.28125, -102.30078125, -96.3203125, -90.33984375, -84.359375, -78.37890625, -72.3984375, -66.41796875, -60.4375, -54.45703125, -48.4765625, -42.49609375, -36.515625, -30.53515625, -24.5546875, -18.57421875, -12.59375, -6.61328125, -0.6328125, 5.34765625, 11.328125, 17.30859375, 23.2890625, 29.26953125, 35.25, 41.23046875, 47.2109375, 53.19140625, 59.171875, 65.15234375, 71.1328125, 77.11328125, 83.09375, 89.07421875, 95.0546875, 101.03515625, 107.015625, 112.99609375, 118.9765625, 124.95703125, 130.9375, 136.91796875, 142.8984375, 148.87890625, 154.859375, 160.83984375, 166.8203125, 172.80078125, 178.78125, 184.76171875, 190.7421875, 196.72265625, 202.703125, 208.68359375, 214.6640625, 220.64453125, 226.625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 13.0, 16.0, 19.0, 25.0, 34.0, 55.0, 71.0, 65.0, 70.0, 107.0, 91.0, 82.0, 88.0, 64.0, 54.0, 37.0, 31.0, 27.0, 19.0, 9.0, 11.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.92889404296875, -4.7601318359375, -4.59136962890625, -4.422607421875, -4.25384521484375, -4.0850830078125, -3.91632080078125, -3.74755859375, -3.57879638671875, -3.4100341796875, -3.24127197265625, -3.072509765625, -2.90374755859375, -2.7349853515625, -2.56622314453125, -2.3974609375, -2.22869873046875, -2.0599365234375, -1.89117431640625, -1.722412109375, -1.55364990234375, -1.3848876953125, -1.21612548828125, -1.04736328125, -0.87860107421875, -0.7098388671875, -0.54107666015625, -0.372314453125, -0.20355224609375, -0.0347900390625, 0.13397216796875, 0.302734375, 0.47149658203125, 0.6402587890625, 0.80902099609375, 0.977783203125, 1.14654541015625, 1.3153076171875, 1.48406982421875, 1.65283203125, 1.82159423828125, 1.9903564453125, 2.15911865234375, 2.327880859375, 2.49664306640625, 2.6654052734375, 2.83416748046875, 3.0029296875, 3.17169189453125, 3.3404541015625, 3.50921630859375, 3.677978515625, 3.84674072265625, 4.0155029296875, 4.18426513671875, 4.35302734375, 4.52178955078125, 4.6905517578125, 4.85931396484375, 5.028076171875, 5.19683837890625, 5.3656005859375, 5.53436279296875, 5.703125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 7.0, 10.0, 10.0, 18.0, 11.0, 23.0, 24.0, 34.0, 37.0, 46.0, 69.0, 118.0, 435.0, 2520.0, 23020.0, 514919.0, 3570769.0, 75198.0, 5810.0, 768.0, 175.0, 44.0, 35.0, 37.0, 17.0, 23.0, 17.0, 20.0, 21.0, 10.0, 12.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.5, -177.724609375, -172.94921875, -168.173828125, -163.3984375, -158.623046875, -153.84765625, -149.072265625, -144.296875, -139.521484375, -134.74609375, -129.970703125, -125.1953125, -120.419921875, -115.64453125, -110.869140625, -106.09375, -101.318359375, -96.54296875, -91.767578125, -86.9921875, -82.216796875, -77.44140625, -72.666015625, -67.890625, -63.115234375, -58.33984375, -53.564453125, -48.7890625, -44.013671875, -39.23828125, -34.462890625, -29.6875, -24.912109375, -20.13671875, -15.361328125, -10.5859375, -5.810546875, -1.03515625, 3.740234375, 8.515625, 13.291015625, 18.06640625, 22.841796875, 27.6171875, 32.392578125, 37.16796875, 41.943359375, 46.71875, 51.494140625, 56.26953125, 61.044921875, 65.8203125, 70.595703125, 75.37109375, 80.146484375, 84.921875, 89.697265625, 94.47265625, 99.248046875, 104.0234375, 108.798828125, 113.57421875, 118.349609375, 123.125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 12.0, 25.0, 40.0, 59.0, 111.0, 190.0, 383.0, 1774.0, 823.0, 309.0, 169.0, 72.0, 43.0, 36.0, 13.0, 11.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-35.21875, -34.5260009765625, -33.833251953125, -33.1405029296875, -32.44775390625, -31.7550048828125, -31.062255859375, -30.3695068359375, -29.6767578125, -28.9840087890625, -28.291259765625, -27.5985107421875, -26.90576171875, -26.2130126953125, -25.520263671875, -24.8275146484375, -24.134765625, -23.4420166015625, -22.749267578125, -22.0565185546875, -21.36376953125, -20.6710205078125, -19.978271484375, -19.2855224609375, -18.5927734375, -17.9000244140625, -17.207275390625, -16.5145263671875, -15.82177734375, -15.1290283203125, -14.436279296875, -13.7435302734375, -13.05078125, -12.3580322265625, -11.665283203125, -10.9725341796875, -10.27978515625, -9.5870361328125, -8.894287109375, -8.2015380859375, -7.5087890625, -6.8160400390625, -6.123291015625, -5.4305419921875, -4.73779296875, -4.0450439453125, -3.352294921875, -2.6595458984375, -1.966796875, -1.2740478515625, -0.581298828125, 0.1114501953125, 0.80419921875, 1.4969482421875, 2.189697265625, 2.8824462890625, 3.5751953125, 4.2679443359375, 4.960693359375, 5.6534423828125, 6.34619140625, 7.0389404296875, 7.731689453125, 8.4244384765625, 9.1171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 11.0, 8.0, 22.0, 27.0, 58.0, 99.0, 129.0, 171.0, 157.0, 131.0, 84.0, 42.0, 27.0, 16.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.67965698242188, -86.5381088256836, -82.39656829833984, -78.25502014160156, -74.11347961425781, -69.97193145751953, -65.83038330078125, -61.6888427734375, -57.547298431396484, -53.40575408935547, -49.26420974731445, -45.12266540527344, -40.981117248535156, -36.839576721191406, -32.698028564453125, -28.55648422241211, -24.414939880371094, -20.273395538330078, -16.131851196289062, -11.990304946899414, -7.848760604858398, -3.707216262817383, 0.4343299865722656, 4.575874328613281, 8.717418670654297, 12.858963012695312, 17.000507354736328, 21.142053604125977, 25.283597946166992, 29.425142288208008, 33.566688537597656, 37.70823287963867, 41.84977722167969, 45.9913215637207, 50.13286590576172, 54.2744140625, 58.41595458984375, 62.55750274658203, 66.69905090332031, 70.84059143066406, 74.98213195800781, 79.1236801147461, 83.26522064208984, 87.40676879882812, 91.54830932617188, 95.68985748291016, 99.83140563964844, 103.97294616699219, 108.11449432373047, 112.25604248046875, 116.3975830078125, 120.53913116455078, 124.68067169189453, 128.8222198486328, 132.96376037597656, 137.10531616210938, 141.24685668945312, 145.38839721679688, 149.5299530029297, 153.67149353027344, 157.8130340576172, 161.95457458496094, 166.09613037109375, 170.2376708984375, 174.37921142578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 3.0, 8.0, 8.0, 12.0, 17.0, 13.0, 17.0, 17.0, 17.0, 21.0, 22.0, 33.0, 31.0, 32.0, 42.0, 41.0, 45.0, 56.0, 31.0, 37.0, 47.0, 59.0, 35.0, 39.0, 34.0, 29.0, 31.0, 27.0, 32.0, 23.0, 14.0, 20.0, 17.0, 11.0, 10.0, 11.0, 9.0, 9.0, 7.0, 6.0, 7.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-54.44488525390625, -52.906551361083984, -51.368221282958984, -49.82988739013672, -48.29155349731445, -46.75321960449219, -45.21488952636719, -43.67655563354492, -42.138221740722656, -40.59988784790039, -39.06155776977539, -37.523223876953125, -35.98488998413086, -34.446556091308594, -32.908226013183594, -31.369892120361328, -29.831560134887695, -28.293228149414062, -26.754894256591797, -25.216562271118164, -23.6782283782959, -22.139896392822266, -20.6015625, -19.063230514526367, -17.524898529052734, -15.986565589904785, -14.448232650756836, -12.909900665283203, -11.371566772460938, -9.833234786987305, -8.294901847839355, -6.756568908691406, -5.218235015869141, -3.6799020767211914, -2.1415693759918213, -0.6032366752624512, 0.935096263885498, 2.4734292030334473, 4.011761665344238, 5.5500946044921875, 7.088427543640137, 8.626760482788086, 10.165093421936035, 11.703426361083984, 13.241758346557617, 14.780092239379883, 16.318424224853516, 17.85675811767578, 19.395090103149414, 20.933422088623047, 22.471755981445312, 24.010087966918945, 25.54842185974121, 27.086753845214844, 28.62508773803711, 30.163419723510742, 31.701751708984375, 33.24008560180664, 34.77841567993164, 36.316749572753906, 37.85508346557617, 39.39341735839844, 40.93174743652344, 42.4700813293457, 44.00841522216797]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 12.0, 13.0, 24.0, 30.0, 39.0, 58.0, 89.0, 92.0, 139.0, 236.0, 350.0, 548.0, 976.0, 1898.0, 4173.0, 10338.0, 29336.0, 82643.0, 211275.0, 350419.0, 219420.0, 86185.0, 30455.0, 10877.0, 4211.0, 1929.0, 1027.0, 607.0, 334.0, 246.0, 167.0, 111.0, 72.0, 63.0, 43.0, 30.0, 20.0, 20.0, 12.0, 3.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.125, -34.044921875, -32.96484375, -31.884765625, -30.8046875, -29.724609375, -28.64453125, -27.564453125, -26.484375, -25.404296875, -24.32421875, -23.244140625, -22.1640625, -21.083984375, -20.00390625, -18.923828125, -17.84375, -16.763671875, -15.68359375, -14.603515625, -13.5234375, -12.443359375, -11.36328125, -10.283203125, -9.203125, -8.123046875, -7.04296875, -5.962890625, -4.8828125, -3.802734375, -2.72265625, -1.642578125, -0.5625, 0.517578125, 1.59765625, 2.677734375, 3.7578125, 4.837890625, 5.91796875, 6.998046875, 8.078125, 9.158203125, 10.23828125, 11.318359375, 12.3984375, 13.478515625, 14.55859375, 15.638671875, 16.71875, 17.798828125, 18.87890625, 19.958984375, 21.0390625, 22.119140625, 23.19921875, 24.279296875, 25.359375, 26.439453125, 27.51953125, 28.599609375, 29.6796875, 30.759765625, 31.83984375, 32.919921875, 34.0]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 7.0, 6.0, 8.0, 9.0, 20.0, 38.0, 40.0, 54.0, 54.0, 87.0, 71.0, 89.0, 79.0, 87.0, 62.0, 64.0, 52.0, 39.0, 36.0, 27.0, 25.0, 24.0, 10.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.16021728515625, -4.9844970703125, -4.80877685546875, -4.633056640625, -4.45733642578125, -4.2816162109375, -4.10589599609375, -3.93017578125, -3.75445556640625, -3.5787353515625, -3.40301513671875, -3.227294921875, -3.05157470703125, -2.8758544921875, -2.70013427734375, -2.5244140625, -2.34869384765625, -2.1729736328125, -1.99725341796875, -1.821533203125, -1.64581298828125, -1.4700927734375, -1.29437255859375, -1.11865234375, -0.94293212890625, -0.7672119140625, -0.59149169921875, -0.415771484375, -0.24005126953125, -0.0643310546875, 0.11138916015625, 0.287109375, 0.46282958984375, 0.6385498046875, 0.81427001953125, 0.989990234375, 1.16571044921875, 1.3414306640625, 1.51715087890625, 1.69287109375, 1.86859130859375, 2.0443115234375, 2.22003173828125, 2.395751953125, 2.57147216796875, 2.7471923828125, 2.92291259765625, 3.0986328125, 3.27435302734375, 3.4500732421875, 3.62579345703125, 3.801513671875, 3.97723388671875, 4.1529541015625, 4.32867431640625, 4.50439453125, 4.68011474609375, 4.8558349609375, 5.03155517578125, 5.207275390625, 5.38299560546875, 5.5587158203125, 5.73443603515625, 5.91015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 18.0, 26.0, 31.0, 66.0, 75.0, 139.0, 242.0, 419.0, 760.0, 1377.0, 3141.0, 8163.0, 25922.0, 91283.0, 296564.0, 405585.0, 150516.0, 42715.0, 12577.0, 4550.0, 1998.0, 1029.0, 509.0, 313.0, 209.0, 117.0, 78.0, 40.0, 25.0, 12.0, 14.0, 9.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.71435546875, -39.3662109375, -38.01806640625, -36.669921875, -35.32177734375, -33.9736328125, -32.62548828125, -31.27734375, -29.92919921875, -28.5810546875, -27.23291015625, -25.884765625, -24.53662109375, -23.1884765625, -21.84033203125, -20.4921875, -19.14404296875, -17.7958984375, -16.44775390625, -15.099609375, -13.75146484375, -12.4033203125, -11.05517578125, -9.70703125, -8.35888671875, -7.0107421875, -5.66259765625, -4.314453125, -2.96630859375, -1.6181640625, -0.27001953125, 1.078125, 2.42626953125, 3.7744140625, 5.12255859375, 6.470703125, 7.81884765625, 9.1669921875, 10.51513671875, 11.86328125, 13.21142578125, 14.5595703125, 15.90771484375, 17.255859375, 18.60400390625, 19.9521484375, 21.30029296875, 22.6484375, 23.99658203125, 25.3447265625, 26.69287109375, 28.041015625, 29.38916015625, 30.7373046875, 32.08544921875, 33.43359375, 34.78173828125, 36.1298828125, 37.47802734375, 38.826171875, 40.17431640625, 41.5224609375, 42.87060546875, 44.21875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 7.0, 4.0, 8.0, 7.0, 12.0, 19.0, 24.0, 20.0, 26.0, 34.0, 39.0, 42.0, 52.0, 50.0, 55.0, 54.0, 52.0, 47.0, 51.0, 48.0, 55.0, 40.0, 41.0, 37.0, 25.0, 34.0, 28.0, 15.0, 15.0, 9.0, 7.0, 7.0, 8.0, 7.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.114501953125, -19.38525390625, -18.656005859375, -17.9267578125, -17.197509765625, -16.46826171875, -15.739013671875, -15.009765625, -14.280517578125, -13.55126953125, -12.822021484375, -12.0927734375, -11.363525390625, -10.63427734375, -9.905029296875, -9.17578125, -8.446533203125, -7.71728515625, -6.988037109375, -6.2587890625, -5.529541015625, -4.80029296875, -4.071044921875, -3.341796875, -2.612548828125, -1.88330078125, -1.154052734375, -0.4248046875, 0.304443359375, 1.03369140625, 1.762939453125, 2.4921875, 3.221435546875, 3.95068359375, 4.679931640625, 5.4091796875, 6.138427734375, 6.86767578125, 7.596923828125, 8.326171875, 9.055419921875, 9.78466796875, 10.513916015625, 11.2431640625, 11.972412109375, 12.70166015625, 13.430908203125, 14.16015625, 14.889404296875, 15.61865234375, 16.347900390625, 17.0771484375, 17.806396484375, 18.53564453125, 19.264892578125, 19.994140625, 20.723388671875, 21.45263671875, 22.181884765625, 22.9111328125, 23.640380859375, 24.36962890625, 25.098876953125, 25.828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 11.0, 8.0, 4.0, 13.0, 14.0, 14.0, 29.0, 37.0, 63.0, 119.0, 181.0, 318.0, 522.0, 1147.0, 2438.0, 6281.0, 19911.0, 81039.0, 329669.0, 432661.0, 129229.0, 29805.0, 8774.0, 3298.0, 1437.0, 637.0, 336.0, 207.0, 127.0, 76.0, 35.0, 35.0, 34.0, 15.0, 7.0, 9.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.445068359375, -20.73388671875, -20.022705078125, -19.3115234375, -18.600341796875, -17.88916015625, -17.177978515625, -16.466796875, -15.755615234375, -15.04443359375, -14.333251953125, -13.6220703125, -12.910888671875, -12.19970703125, -11.488525390625, -10.77734375, -10.066162109375, -9.35498046875, -8.643798828125, -7.9326171875, -7.221435546875, -6.51025390625, -5.799072265625, -5.087890625, -4.376708984375, -3.66552734375, -2.954345703125, -2.2431640625, -1.531982421875, -0.82080078125, -0.109619140625, 0.6015625, 1.312744140625, 2.02392578125, 2.735107421875, 3.4462890625, 4.157470703125, 4.86865234375, 5.579833984375, 6.291015625, 7.002197265625, 7.71337890625, 8.424560546875, 9.1357421875, 9.846923828125, 10.55810546875, 11.269287109375, 11.98046875, 12.691650390625, 13.40283203125, 14.114013671875, 14.8251953125, 15.536376953125, 16.24755859375, 16.958740234375, 17.669921875, 18.381103515625, 19.09228515625, 19.803466796875, 20.5146484375, 21.225830078125, 21.93701171875, 22.648193359375, 23.359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 11.0, 9.0, 14.0, 15.0, 16.0, 26.0, 30.0, 38.0, 50.0, 68.0, 81.0, 76.0, 102.0, 79.0, 82.0, 73.0, 61.0, 31.0, 36.0, 21.0, 15.0, 11.0, 10.0, 7.0, 5.0, 8.0, 4.0, 0.0, 9.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0030155181884765625, -0.00293537974357605, -0.002855241298675537, -0.0027751028537750244, -0.0026949644088745117, -0.002614825963973999, -0.0025346875190734863, -0.0024545490741729736, -0.002374410629272461, -0.0022942721843719482, -0.0022141337394714355, -0.002133995294570923, -0.00205385684967041, -0.0019737184047698975, -0.0018935799598693848, -0.001813441514968872, -0.0017333030700683594, -0.0016531646251678467, -0.001573026180267334, -0.0014928877353668213, -0.0014127492904663086, -0.001332610845565796, -0.0012524724006652832, -0.0011723339557647705, -0.0010921955108642578, -0.0010120570659637451, -0.0009319186210632324, -0.0008517801761627197, -0.000771641731262207, -0.0006915032863616943, -0.0006113648414611816, -0.0005312263965606689, -0.00045108795166015625, -0.00037094950675964355, -0.00029081106185913086, -0.00021067261695861816, -0.00013053417205810547, -5.0395727157592773e-05, 2.9742717742919922e-05, 0.00010988116264343262, 0.0001900196075439453, 0.000270158052444458, 0.0003502964973449707, 0.0004304349422454834, 0.0005105733871459961, 0.0005907118320465088, 0.0006708502769470215, 0.0007509887218475342, 0.0008311271667480469, 0.0009112656116485596, 0.0009914040565490723, 0.001071542501449585, 0.0011516809463500977, 0.0012318193912506104, 0.001311957836151123, 0.0013920962810516357, 0.0014722347259521484, 0.0015523731708526611, 0.0016325116157531738, 0.0017126500606536865, 0.0017927885055541992, 0.001872926950454712, 0.0019530653953552246, 0.0020332038402557373, 0.00211334228515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 9.0, 15.0, 18.0, 23.0, 57.0, 65.0, 105.0, 192.0, 325.0, 673.0, 1548.0, 4115.0, 11891.0, 49518.0, 262732.0, 529896.0, 144874.0, 29223.0, 8018.0, 2760.0, 1158.0, 588.0, 282.0, 175.0, 102.0, 59.0, 43.0, 22.0, 18.0, 19.0, 10.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.15625, -31.317138671875, -30.47802734375, -29.638916015625, -28.7998046875, -27.960693359375, -27.12158203125, -26.282470703125, -25.443359375, -24.604248046875, -23.76513671875, -22.926025390625, -22.0869140625, -21.247802734375, -20.40869140625, -19.569580078125, -18.73046875, -17.891357421875, -17.05224609375, -16.213134765625, -15.3740234375, -14.534912109375, -13.69580078125, -12.856689453125, -12.017578125, -11.178466796875, -10.33935546875, -9.500244140625, -8.6611328125, -7.822021484375, -6.98291015625, -6.143798828125, -5.3046875, -4.465576171875, -3.62646484375, -2.787353515625, -1.9482421875, -1.109130859375, -0.27001953125, 0.569091796875, 1.408203125, 2.247314453125, 3.08642578125, 3.925537109375, 4.7646484375, 5.603759765625, 6.44287109375, 7.281982421875, 8.12109375, 8.960205078125, 9.79931640625, 10.638427734375, 11.4775390625, 12.316650390625, 13.15576171875, 13.994873046875, 14.833984375, 15.673095703125, 16.51220703125, 17.351318359375, 18.1904296875, 19.029541015625, 19.86865234375, 20.707763671875, 21.546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 17.0, 36.0, 35.0, 34.0, 55.0, 68.0, 69.0, 77.0, 92.0, 88.0, 90.0, 83.0, 54.0, 50.0, 37.0, 30.0, 15.0, 7.0, 16.0, 8.0, 7.0, 5.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.2769775390625, -9.843017578125, -9.4090576171875, -8.97509765625, -8.5411376953125, -8.107177734375, -7.6732177734375, -7.2392578125, -6.8052978515625, -6.371337890625, -5.9373779296875, -5.50341796875, -5.0694580078125, -4.635498046875, -4.2015380859375, -3.767578125, -3.3336181640625, -2.899658203125, -2.4656982421875, -2.03173828125, -1.5977783203125, -1.163818359375, -0.7298583984375, -0.2958984375, 0.1380615234375, 0.572021484375, 1.0059814453125, 1.43994140625, 1.8739013671875, 2.307861328125, 2.7418212890625, 3.17578125, 3.6097412109375, 4.043701171875, 4.4776611328125, 4.91162109375, 5.3455810546875, 5.779541015625, 6.2135009765625, 6.6474609375, 7.0814208984375, 7.515380859375, 7.9493408203125, 8.38330078125, 8.8172607421875, 9.251220703125, 9.6851806640625, 10.119140625, 10.5531005859375, 10.987060546875, 11.4210205078125, 11.85498046875, 12.2889404296875, 12.722900390625, 13.1568603515625, 13.5908203125, 14.0247802734375, 14.458740234375, 14.8927001953125, 15.32666015625, 15.7606201171875, 16.194580078125, 16.6285400390625, 17.0625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 15.0, 19.0, 27.0, 46.0, 66.0, 93.0, 125.0, 146.0, 116.0, 101.0, 75.0, 51.0, 30.0, 20.0, 20.0, 20.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.0174102783203, -228.56361389160156, -221.1098175048828, -213.65602111816406, -206.2022247314453, -198.74842834472656, -191.29461669921875, -183.8408203125, -176.38702392578125, -168.9332275390625, -161.47943115234375, -154.025634765625, -146.57183837890625, -139.1180419921875, -131.66424560546875, -124.21044158935547, -116.75665283203125, -109.3028564453125, -101.84906005859375, -94.395263671875, -86.94146728515625, -79.4876708984375, -72.03386688232422, -64.58007049560547, -57.12627410888672, -49.67247772216797, -42.21868133544922, -34.7648811340332, -27.311084747314453, -19.857288360595703, -12.403488159179688, -4.9496917724609375, 2.5041046142578125, 9.957901954650879, 17.411699295043945, 24.865497589111328, 32.31929397583008, 39.77309036254883, 47.226890563964844, 54.680686950683594, 62.134483337402344, 69.5882797241211, 77.04207611083984, 84.49588012695312, 91.94967651367188, 99.40347290039062, 106.85726928710938, 114.31106567382812, 121.76486206054688, 129.21865844726562, 136.67245483398438, 144.12625122070312, 151.58004760742188, 159.03384399414062, 166.48764038085938, 173.94143676757812, 181.39523315429688, 188.84902954101562, 196.30282592773438, 203.75662231445312, 211.21041870117188, 218.66421508789062, 226.11801147460938, 233.57180786132812, 241.02561950683594]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 5.0, 8.0, 7.0, 12.0, 25.0, 17.0, 22.0, 22.0, 41.0, 47.0, 43.0, 46.0, 50.0, 65.0, 58.0, 62.0, 68.0, 63.0, 66.0, 44.0, 55.0, 48.0, 31.0, 20.0, 18.0, 15.0, 14.0, 8.0, 10.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-195.95518493652344, -189.98155212402344, -184.00791931152344, -178.03427124023438, -172.06063842773438, -166.08700561523438, -160.11337280273438, -154.13973999023438, -148.16610717773438, -142.19247436523438, -136.21884155273438, -130.24520874023438, -124.27156066894531, -118.29792785644531, -112.32429504394531, -106.35066223144531, -100.37701416015625, -94.40338134765625, -88.42974090576172, -82.45610809326172, -76.48246765136719, -70.50883483886719, -64.53520202636719, -58.56156539916992, -52.587928771972656, -46.61429214477539, -40.640655517578125, -34.667022705078125, -28.69338607788086, -22.719749450683594, -16.746116638183594, -10.772480010986328, -4.798828125, 1.1748075485229492, 7.148443222045898, 13.122077941894531, 19.095714569091797, 25.069351196289062, 31.042984008789062, 37.01662063598633, 42.990257263183594, 48.96389389038086, 54.937530517578125, 60.911163330078125, 66.88479614257812, 72.85843658447266, 78.83206939697266, 84.80570983886719, 90.77934265136719, 96.75297546386719, 102.72661590576172, 108.70024871826172, 114.67388916015625, 120.64752197265625, 126.62115478515625, 132.59478759765625, 138.56842041015625, 144.54205322265625, 150.51568603515625, 156.48931884765625, 162.4629669189453, 168.4365997314453, 174.4102325439453, 180.3838653564453, 186.35751342773438]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 21.0, 20.0, 44.0, 71.0, 210.0, 625.0, 3059.0, 31976.0, 4023299.0, 127020.0, 6318.0, 988.0, 295.0, 148.0, 80.0, 41.0, 29.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.0, -185.744140625, -179.48828125, -173.232421875, -166.9765625, -160.720703125, -154.46484375, -148.208984375, -141.953125, -135.697265625, -129.44140625, -123.185546875, -116.9296875, -110.673828125, -104.41796875, -98.162109375, -91.90625, -85.650390625, -79.39453125, -73.138671875, -66.8828125, -60.626953125, -54.37109375, -48.115234375, -41.859375, -35.603515625, -29.34765625, -23.091796875, -16.8359375, -10.580078125, -4.32421875, 1.931640625, 8.1875, 14.443359375, 20.69921875, 26.955078125, 33.2109375, 39.466796875, 45.72265625, 51.978515625, 58.234375, 64.490234375, 70.74609375, 77.001953125, 83.2578125, 89.513671875, 95.76953125, 102.025390625, 108.28125, 114.537109375, 120.79296875, 127.048828125, 133.3046875, 139.560546875, 145.81640625, 152.072265625, 158.328125, 164.583984375, 170.83984375, 177.095703125, 183.3515625, 189.607421875, 195.86328125, 202.119140625, 208.375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 10.0, 18.0, 28.0, 45.0, 60.0, 79.0, 99.0, 111.0, 114.0, 113.0, 85.0, 79.0, 54.0, 36.0, 30.0, 16.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.58251953125, -8.2900390625, -7.99755859375, -7.705078125, -7.41259765625, -7.1201171875, -6.82763671875, -6.53515625, -6.24267578125, -5.9501953125, -5.65771484375, -5.365234375, -5.07275390625, -4.7802734375, -4.48779296875, -4.1953125, -3.90283203125, -3.6103515625, -3.31787109375, -3.025390625, -2.73291015625, -2.4404296875, -2.14794921875, -1.85546875, -1.56298828125, -1.2705078125, -0.97802734375, -0.685546875, -0.39306640625, -0.1005859375, 0.19189453125, 0.484375, 0.77685546875, 1.0693359375, 1.36181640625, 1.654296875, 1.94677734375, 2.2392578125, 2.53173828125, 2.82421875, 3.11669921875, 3.4091796875, 3.70166015625, 3.994140625, 4.28662109375, 4.5791015625, 4.87158203125, 5.1640625, 5.45654296875, 5.7490234375, 6.04150390625, 6.333984375, 6.62646484375, 6.9189453125, 7.21142578125, 7.50390625, 7.79638671875, 8.0888671875, 8.38134765625, 8.673828125, 8.96630859375, 9.2587890625, 9.55126953125, 9.84375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 10.0, 6.0, 15.0, 20.0, 30.0, 52.0, 79.0, 108.0, 182.0, 245.0, 397.0, 689.0, 1191.0, 2125.0, 3907.0, 7731.0, 17531.0, 43438.0, 128958.0, 611340.0, 2940878.0, 298710.0, 81984.0, 29459.0, 12331.0, 5629.0, 3019.0, 1599.0, 990.0, 563.0, 352.0, 228.0, 138.0, 116.0, 68.0, 47.0, 35.0, 23.0, 18.0, 11.0, 5.0, 4.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-41.25, -39.97314453125, -38.6962890625, -37.41943359375, -36.142578125, -34.86572265625, -33.5888671875, -32.31201171875, -31.03515625, -29.75830078125, -28.4814453125, -27.20458984375, -25.927734375, -24.65087890625, -23.3740234375, -22.09716796875, -20.8203125, -19.54345703125, -18.2666015625, -16.98974609375, -15.712890625, -14.43603515625, -13.1591796875, -11.88232421875, -10.60546875, -9.32861328125, -8.0517578125, -6.77490234375, -5.498046875, -4.22119140625, -2.9443359375, -1.66748046875, -0.390625, 0.88623046875, 2.1630859375, 3.43994140625, 4.716796875, 5.99365234375, 7.2705078125, 8.54736328125, 9.82421875, 11.10107421875, 12.3779296875, 13.65478515625, 14.931640625, 16.20849609375, 17.4853515625, 18.76220703125, 20.0390625, 21.31591796875, 22.5927734375, 23.86962890625, 25.146484375, 26.42333984375, 27.7001953125, 28.97705078125, 30.25390625, 31.53076171875, 32.8076171875, 34.08447265625, 35.361328125, 36.63818359375, 37.9150390625, 39.19189453125, 40.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 8.0, 16.0, 10.0, 25.0, 39.0, 43.0, 60.0, 83.0, 135.0, 251.0, 435.0, 1569.0, 580.0, 291.0, 162.0, 104.0, 74.0, 44.0, 29.0, 20.0, 17.0, 11.0, 5.0, 12.0, 4.0, 6.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.767333984375, -10.37841796875, -9.989501953125, -9.6005859375, -9.211669921875, -8.82275390625, -8.433837890625, -8.044921875, -7.656005859375, -7.26708984375, -6.878173828125, -6.4892578125, -6.100341796875, -5.71142578125, -5.322509765625, -4.93359375, -4.544677734375, -4.15576171875, -3.766845703125, -3.3779296875, -2.989013671875, -2.60009765625, -2.211181640625, -1.822265625, -1.433349609375, -1.04443359375, -0.655517578125, -0.2666015625, 0.122314453125, 0.51123046875, 0.900146484375, 1.2890625, 1.677978515625, 2.06689453125, 2.455810546875, 2.8447265625, 3.233642578125, 3.62255859375, 4.011474609375, 4.400390625, 4.789306640625, 5.17822265625, 5.567138671875, 5.9560546875, 6.344970703125, 6.73388671875, 7.122802734375, 7.51171875, 7.900634765625, 8.28955078125, 8.678466796875, 9.0673828125, 9.456298828125, 9.84521484375, 10.234130859375, 10.623046875, 11.011962890625, 11.40087890625, 11.789794921875, 12.1787109375, 12.567626953125, 12.95654296875, 13.345458984375, 13.734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 8.0, 9.0, 18.0, 20.0, 56.0, 99.0, 111.0, 143.0, 158.0, 141.0, 94.0, 66.0, 27.0, 13.0, 15.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-103.37364196777344, -100.0563735961914, -96.73910522460938, -93.42183685302734, -90.10456848144531, -86.78730010986328, -83.47003173828125, -80.15276336669922, -76.83549499511719, -73.51822662353516, -70.20095825195312, -66.8836898803711, -63.56642150878906, -60.24915313720703, -56.931884765625, -53.61461639404297, -50.29734802246094, -46.980079650878906, -43.662811279296875, -40.345542907714844, -37.02827453613281, -33.71100616455078, -30.39373779296875, -27.07646942138672, -23.759201049804688, -20.441932678222656, -17.124664306640625, -13.807395935058594, -10.490127563476562, -7.172859191894531, -3.8555908203125, -0.5383224487304688, 2.7789459228515625, 6.096214294433594, 9.413482666015625, 12.730751037597656, 16.048019409179688, 19.36528778076172, 22.68255615234375, 25.99982452392578, 29.317092895507812, 32.634361267089844, 35.951629638671875, 39.268898010253906, 42.58616638183594, 45.90343475341797, 49.220703125, 52.53797149658203, 55.85523986816406, 59.172508239746094, 62.489776611328125, 65.80704498291016, 69.12431335449219, 72.44158172607422, 75.75885009765625, 79.07611846923828, 82.39338684082031, 85.71065521240234, 89.02792358398438, 92.3451919555664, 95.66246032714844, 98.97972869873047, 102.2969970703125, 105.61426544189453, 108.93153381347656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 7.0, 22.0, 17.0, 29.0, 44.0, 45.0, 56.0, 55.0, 69.0, 76.0, 73.0, 80.0, 75.0, 56.0, 52.0, 61.0, 36.0, 39.0, 27.0, 20.0, 17.0, 11.0, 10.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.8619384765625, -69.64143371582031, -67.4209213256836, -65.2004165649414, -62.97990417480469, -60.7593994140625, -58.53889083862305, -56.318382263183594, -54.09787368774414, -51.87736511230469, -49.656856536865234, -47.43634796142578, -45.215843200683594, -42.995330810546875, -40.77482604980469, -38.554317474365234, -36.33380889892578, -34.11330032348633, -31.892791748046875, -29.672285079956055, -27.4517765045166, -25.23126792907715, -23.010761260986328, -20.790252685546875, -18.569744110107422, -16.34923553466797, -14.128727912902832, -11.908220291137695, -9.687711715698242, -7.467203140258789, -5.246695518493652, -3.0261878967285156, -0.8056716918945312, 1.4148364067077637, 3.6353445053100586, 5.8558526039123535, 8.076360702514648, 10.296869277954102, 12.517376899719238, 14.737884521484375, 16.958393096923828, 19.17890167236328, 21.399410247802734, 23.619916915893555, 25.840425491333008, 28.06093406677246, 30.28144073486328, 32.501949310302734, 34.72245788574219, 36.94296646118164, 39.163475036621094, 41.38398361206055, 43.6044921875, 45.82499694824219, 48.04550552368164, 50.266014099121094, 52.48652267456055, 54.70703125, 56.92753982543945, 59.148048400878906, 61.368553161621094, 63.58906555175781, 65.8095703125, 68.03007507324219, 70.2505874633789]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 11.0, 8.0, 14.0, 14.0, 27.0, 29.0, 45.0, 65.0, 93.0, 104.0, 148.0, 208.0, 295.0, 492.0, 760.0, 1259.0, 2359.0, 4772.0, 11018.0, 27549.0, 73853.0, 187845.0, 346620.0, 232535.0, 95748.0, 35971.0, 13954.0, 5791.0, 2806.0, 1495.0, 880.0, 555.0, 332.0, 225.0, 178.0, 114.0, 91.0, 61.0, 61.0, 41.0, 35.0, 22.0, 12.0, 19.0, 6.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.203125, -29.277587890625, -28.35205078125, -27.426513671875, -26.5009765625, -25.575439453125, -24.64990234375, -23.724365234375, -22.798828125, -21.873291015625, -20.94775390625, -20.022216796875, -19.0966796875, -18.171142578125, -17.24560546875, -16.320068359375, -15.39453125, -14.468994140625, -13.54345703125, -12.617919921875, -11.6923828125, -10.766845703125, -9.84130859375, -8.915771484375, -7.990234375, -7.064697265625, -6.13916015625, -5.213623046875, -4.2880859375, -3.362548828125, -2.43701171875, -1.511474609375, -0.5859375, 0.339599609375, 1.26513671875, 2.190673828125, 3.1162109375, 4.041748046875, 4.96728515625, 5.892822265625, 6.818359375, 7.743896484375, 8.66943359375, 9.594970703125, 10.5205078125, 11.446044921875, 12.37158203125, 13.297119140625, 14.22265625, 15.148193359375, 16.07373046875, 16.999267578125, 17.9248046875, 18.850341796875, 19.77587890625, 20.701416015625, 21.626953125, 22.552490234375, 23.47802734375, 24.403564453125, 25.3291015625, 26.254638671875, 27.18017578125, 28.105712890625, 29.03125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 13.0, 26.0, 23.0, 42.0, 65.0, 70.0, 92.0, 95.0, 123.0, 108.0, 90.0, 77.0, 56.0, 37.0, 21.0, 19.0, 12.0, 9.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1796875, -8.8953857421875, -8.611083984375, -8.3267822265625, -8.04248046875, -7.7581787109375, -7.473876953125, -7.1895751953125, -6.9052734375, -6.6209716796875, -6.336669921875, -6.0523681640625, -5.76806640625, -5.4837646484375, -5.199462890625, -4.9151611328125, -4.630859375, -4.3465576171875, -4.062255859375, -3.7779541015625, -3.49365234375, -3.2093505859375, -2.925048828125, -2.6407470703125, -2.3564453125, -2.0721435546875, -1.787841796875, -1.5035400390625, -1.21923828125, -0.9349365234375, -0.650634765625, -0.3663330078125, -0.08203125, 0.2022705078125, 0.486572265625, 0.7708740234375, 1.05517578125, 1.3394775390625, 1.623779296875, 1.9080810546875, 2.1923828125, 2.4766845703125, 2.760986328125, 3.0452880859375, 3.32958984375, 3.6138916015625, 3.898193359375, 4.1824951171875, 4.466796875, 4.7510986328125, 5.035400390625, 5.3197021484375, 5.60400390625, 5.8883056640625, 6.172607421875, 6.4569091796875, 6.7412109375, 7.0255126953125, 7.309814453125, 7.5941162109375, 7.87841796875, 8.1627197265625, 8.447021484375, 8.7313232421875, 9.015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 15.0, 13.0, 26.0, 38.0, 41.0, 64.0, 94.0, 153.0, 227.0, 323.0, 506.0, 787.0, 1282.0, 2132.0, 4017.0, 7553.0, 14868.0, 31739.0, 68965.0, 142422.0, 247907.0, 249001.0, 142870.0, 69079.0, 31918.0, 15283.0, 7623.0, 3934.0, 2177.0, 1278.0, 727.0, 495.0, 302.0, 212.0, 143.0, 98.0, 61.0, 54.0, 33.0, 33.0, 14.0, 13.0, 10.0, 7.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.015625, -21.3681640625, -20.720703125, -20.0732421875, -19.42578125, -18.7783203125, -18.130859375, -17.4833984375, -16.8359375, -16.1884765625, -15.541015625, -14.8935546875, -14.24609375, -13.5986328125, -12.951171875, -12.3037109375, -11.65625, -11.0087890625, -10.361328125, -9.7138671875, -9.06640625, -8.4189453125, -7.771484375, -7.1240234375, -6.4765625, -5.8291015625, -5.181640625, -4.5341796875, -3.88671875, -3.2392578125, -2.591796875, -1.9443359375, -1.296875, -0.6494140625, -0.001953125, 0.6455078125, 1.29296875, 1.9404296875, 2.587890625, 3.2353515625, 3.8828125, 4.5302734375, 5.177734375, 5.8251953125, 6.47265625, 7.1201171875, 7.767578125, 8.4150390625, 9.0625, 9.7099609375, 10.357421875, 11.0048828125, 11.65234375, 12.2998046875, 12.947265625, 13.5947265625, 14.2421875, 14.8896484375, 15.537109375, 16.1845703125, 16.83203125, 17.4794921875, 18.126953125, 18.7744140625, 19.421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 7.0, 7.0, 4.0, 7.0, 11.0, 12.0, 19.0, 16.0, 20.0, 16.0, 24.0, 23.0, 42.0, 27.0, 29.0, 32.0, 32.0, 32.0, 42.0, 55.0, 45.0, 34.0, 41.0, 34.0, 45.0, 37.0, 41.0, 35.0, 28.0, 25.0, 34.0, 30.0, 21.0, 16.0, 10.0, 13.0, 4.0, 8.0, 7.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.1875, -20.575439453125, -19.96337890625, -19.351318359375, -18.7392578125, -18.127197265625, -17.51513671875, -16.903076171875, -16.291015625, -15.678955078125, -15.06689453125, -14.454833984375, -13.8427734375, -13.230712890625, -12.61865234375, -12.006591796875, -11.39453125, -10.782470703125, -10.17041015625, -9.558349609375, -8.9462890625, -8.334228515625, -7.72216796875, -7.110107421875, -6.498046875, -5.885986328125, -5.27392578125, -4.661865234375, -4.0498046875, -3.437744140625, -2.82568359375, -2.213623046875, -1.6015625, -0.989501953125, -0.37744140625, 0.234619140625, 0.8466796875, 1.458740234375, 2.07080078125, 2.682861328125, 3.294921875, 3.906982421875, 4.51904296875, 5.131103515625, 5.7431640625, 6.355224609375, 6.96728515625, 7.579345703125, 8.19140625, 8.803466796875, 9.41552734375, 10.027587890625, 10.6396484375, 11.251708984375, 11.86376953125, 12.475830078125, 13.087890625, 13.699951171875, 14.31201171875, 14.924072265625, 15.5361328125, 16.148193359375, 16.76025390625, 17.372314453125, 17.984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 11.0, 5.0, 8.0, 18.0, 19.0, 28.0, 40.0, 44.0, 100.0, 119.0, 200.0, 341.0, 629.0, 1196.0, 2520.0, 5773.0, 14580.0, 42132.0, 136179.0, 366015.0, 316327.0, 107584.0, 33481.0, 11721.0, 4781.0, 2200.0, 1087.0, 555.0, 338.0, 172.0, 106.0, 68.0, 55.0, 33.0, 31.0, 13.0, 11.0, 10.0, 14.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.890625, -11.5291748046875, -11.167724609375, -10.8062744140625, -10.44482421875, -10.0833740234375, -9.721923828125, -9.3604736328125, -8.9990234375, -8.6375732421875, -8.276123046875, -7.9146728515625, -7.55322265625, -7.1917724609375, -6.830322265625, -6.4688720703125, -6.107421875, -5.7459716796875, -5.384521484375, -5.0230712890625, -4.66162109375, -4.3001708984375, -3.938720703125, -3.5772705078125, -3.2158203125, -2.8543701171875, -2.492919921875, -2.1314697265625, -1.77001953125, -1.4085693359375, -1.047119140625, -0.6856689453125, -0.32421875, 0.0372314453125, 0.398681640625, 0.7601318359375, 1.12158203125, 1.4830322265625, 1.844482421875, 2.2059326171875, 2.5673828125, 2.9288330078125, 3.290283203125, 3.6517333984375, 4.01318359375, 4.3746337890625, 4.736083984375, 5.0975341796875, 5.458984375, 5.8204345703125, 6.181884765625, 6.5433349609375, 6.90478515625, 7.2662353515625, 7.627685546875, 7.9891357421875, 8.3505859375, 8.7120361328125, 9.073486328125, 9.4349365234375, 9.79638671875, 10.1578369140625, 10.519287109375, 10.8807373046875, 11.2421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 11.0, 14.0, 12.0, 23.0, 23.0, 25.0, 39.0, 30.0, 35.0, 42.0, 41.0, 72.0, 75.0, 69.0, 76.0, 58.0, 69.0, 40.0, 36.0, 34.0, 33.0, 19.0, 11.0, 15.0, 10.0, 13.0, 5.0, 9.0, 3.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00146484375, -0.0014165490865707397, -0.0013682544231414795, -0.0013199597597122192, -0.001271665096282959, -0.0012233704328536987, -0.0011750757694244385, -0.0011267811059951782, -0.001078486442565918, -0.0010301917791366577, -0.0009818971157073975, -0.0009336024522781372, -0.000885307788848877, -0.0008370131254196167, -0.0007887184619903564, -0.0007404237985610962, -0.0006921291351318359, -0.0006438344717025757, -0.0005955398082733154, -0.0005472451448440552, -0.0004989504814147949, -0.00045065581798553467, -0.0004023611545562744, -0.00035406649112701416, -0.0003057718276977539, -0.00025747716426849365, -0.0002091825008392334, -0.00016088783740997314, -0.00011259317398071289, -6.429851055145264e-05, -1.6003847122192383e-05, 3.229081630706787e-05, 8.058547973632812e-05, 0.00012888014316558838, 0.00017717480659484863, 0.0002254694700241089, 0.00027376413345336914, 0.0003220587968826294, 0.00037035346031188965, 0.0004186481237411499, 0.00046694278717041016, 0.0005152374505996704, 0.0005635321140289307, 0.0006118267774581909, 0.0006601214408874512, 0.0007084161043167114, 0.0007567107677459717, 0.0008050054311752319, 0.0008533000946044922, 0.0009015947580337524, 0.0009498894214630127, 0.000998184084892273, 0.0010464787483215332, 0.0010947734117507935, 0.0011430680751800537, 0.001191362738609314, 0.0012396574020385742, 0.0012879520654678345, 0.0013362467288970947, 0.001384541392326355, 0.0014328360557556152, 0.0014811307191848755, 0.0015294253826141357, 0.001577720046043396, 0.0016260147094726562]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 17.0, 9.0, 25.0, 23.0, 46.0, 75.0, 119.0, 242.0, 379.0, 693.0, 1545.0, 3244.0, 8295.0, 23705.0, 80879.0, 314874.0, 430954.0, 128281.0, 35050.0, 11667.0, 4438.0, 2002.0, 895.0, 428.0, 244.0, 151.0, 95.0, 59.0, 32.0, 24.0, 17.0, 19.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.828125, -15.3905029296875, -14.952880859375, -14.5152587890625, -14.07763671875, -13.6400146484375, -13.202392578125, -12.7647705078125, -12.3271484375, -11.8895263671875, -11.451904296875, -11.0142822265625, -10.57666015625, -10.1390380859375, -9.701416015625, -9.2637939453125, -8.826171875, -8.3885498046875, -7.950927734375, -7.5133056640625, -7.07568359375, -6.6380615234375, -6.200439453125, -5.7628173828125, -5.3251953125, -4.8875732421875, -4.449951171875, -4.0123291015625, -3.57470703125, -3.1370849609375, -2.699462890625, -2.2618408203125, -1.82421875, -1.3865966796875, -0.948974609375, -0.5113525390625, -0.07373046875, 0.3638916015625, 0.801513671875, 1.2391357421875, 1.6767578125, 2.1143798828125, 2.552001953125, 2.9896240234375, 3.42724609375, 3.8648681640625, 4.302490234375, 4.7401123046875, 5.177734375, 5.6153564453125, 6.052978515625, 6.4906005859375, 6.92822265625, 7.3658447265625, 7.803466796875, 8.2410888671875, 8.6787109375, 9.1163330078125, 9.553955078125, 9.9915771484375, 10.42919921875, 10.8668212890625, 11.304443359375, 11.7420654296875, 12.1796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 6.0, 15.0, 18.0, 13.0, 27.0, 36.0, 40.0, 65.0, 68.0, 73.0, 95.0, 109.0, 84.0, 66.0, 61.0, 47.0, 38.0, 32.0, 17.0, 19.0, 12.0, 7.0, 6.0, 12.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.3541259765625, -6.052001953125, -5.7498779296875, -5.44775390625, -5.1456298828125, -4.843505859375, -4.5413818359375, -4.2392578125, -3.9371337890625, -3.635009765625, -3.3328857421875, -3.03076171875, -2.7286376953125, -2.426513671875, -2.1243896484375, -1.822265625, -1.5201416015625, -1.218017578125, -0.9158935546875, -0.61376953125, -0.3116455078125, -0.009521484375, 0.2926025390625, 0.5947265625, 0.8968505859375, 1.198974609375, 1.5010986328125, 1.80322265625, 2.1053466796875, 2.407470703125, 2.7095947265625, 3.01171875, 3.3138427734375, 3.615966796875, 3.9180908203125, 4.22021484375, 4.5223388671875, 4.824462890625, 5.1265869140625, 5.4287109375, 5.7308349609375, 6.032958984375, 6.3350830078125, 6.63720703125, 6.9393310546875, 7.241455078125, 7.5435791015625, 7.845703125, 8.1478271484375, 8.449951171875, 8.7520751953125, 9.05419921875, 9.3563232421875, 9.658447265625, 9.9605712890625, 10.2626953125, 10.5648193359375, 10.866943359375, 11.1690673828125, 11.47119140625, 11.7733154296875, 12.075439453125, 12.3775634765625, 12.6796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 11.0, 24.0, 40.0, 46.0, 90.0, 124.0, 138.0, 135.0, 127.0, 98.0, 66.0, 28.0, 32.0, 15.0, 9.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.49996948242188, -204.92770385742188, -198.35545349121094, -191.78318786621094, -185.21092224121094, -178.638671875, -172.06640625, -165.494140625, -158.921875, -152.349609375, -145.77735900878906, -139.20509338378906, -132.63282775878906, -126.0605697631836, -119.48831176757812, -112.91604614257812, -106.34378814697266, -99.77153015136719, -93.19926452636719, -86.62700653076172, -80.05474090576172, -73.48248291015625, -66.91021728515625, -60.33795928955078, -53.76569747924805, -47.19343566894531, -40.62117385864258, -34.048912048339844, -27.476652145385742, -20.90439224243164, -14.332130432128906, -7.759868621826172, -1.1876068115234375, 5.384654521942139, 11.956915855407715, 18.529176712036133, 25.101438522338867, 31.67369842529297, 38.2459602355957, 44.81822204589844, 51.39048385620117, 57.962745666503906, 64.53500366210938, 71.10726928710938, 77.67952728271484, 84.25178527832031, 90.82405090332031, 97.39631652832031, 103.96857452392578, 110.54083251953125, 117.11309814453125, 123.68535614013672, 130.2576141357422, 136.8298797607422, 143.4021453857422, 149.97439575195312, 156.54666137695312, 163.11892700195312, 169.69117736816406, 176.26344299316406, 182.83570861816406, 189.407958984375, 195.980224609375, 202.552490234375, 209.124755859375]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 8.0, 5.0, 8.0, 10.0, 22.0, 15.0, 19.0, 22.0, 28.0, 27.0, 41.0, 45.0, 45.0, 39.0, 58.0, 37.0, 43.0, 47.0, 48.0, 66.0, 41.0, 38.0, 36.0, 47.0, 31.0, 24.0, 27.0, 23.0, 13.0, 17.0, 13.0, 11.0, 11.0, 3.0, 4.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-120.724609375, -116.72987365722656, -112.73514556884766, -108.74040985107422, -104.74567413330078, -100.75094604492188, -96.75621032714844, -92.761474609375, -88.76673889160156, -84.77200317382812, -80.77727508544922, -76.78253936767578, -72.78780364990234, -68.79307556152344, -64.79833984375, -60.80360412597656, -56.808876037597656, -52.814144134521484, -48.81940841674805, -44.824676513671875, -40.82994079589844, -36.835208892822266, -32.840476989746094, -28.84574317932129, -24.851009368896484, -20.85627555847168, -16.861541748046875, -12.866809844970703, -8.872076034545898, -4.877342224121094, -0.8826103210449219, 3.112123489379883, 7.1068572998046875, 11.101591110229492, 15.09632396697998, 19.09105682373047, 23.085790634155273, 27.080524444580078, 31.07525634765625, 35.06999206542969, 39.06472396850586, 43.05945587158203, 47.05419158935547, 51.04892349243164, 55.04365539550781, 59.03839111328125, 63.03312301635742, 67.0278549194336, 71.02259063720703, 75.01732635498047, 79.01205444335938, 83.00679016113281, 87.00152587890625, 90.99626159667969, 94.9909896850586, 98.98572540283203, 102.98045349121094, 106.97518920898438, 110.96991729736328, 114.96465301513672, 118.95938873291016, 122.95411682128906, 126.9488525390625, 130.94358825683594, 134.93832397460938]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 21.0, 38.0, 34.0, 55.0, 58.0, 98.0, 180.0, 287.0, 493.0, 844.0, 1588.0, 3339.0, 7836.0, 22828.0, 102599.0, 3652070.0, 336811.0, 43053.0, 12459.0, 4885.0, 2190.0, 1008.0, 571.0, 320.0, 190.0, 110.0, 75.0, 48.0, 35.0, 27.0, 16.0, 11.0, 16.0, 18.0, 13.0, 5.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.625, -46.0234375, -44.421875, -42.8203125, -41.21875, -39.6171875, -38.015625, -36.4140625, -34.8125, -33.2109375, -31.609375, -30.0078125, -28.40625, -26.8046875, -25.203125, -23.6015625, -22.0, -20.3984375, -18.796875, -17.1953125, -15.59375, -13.9921875, -12.390625, -10.7890625, -9.1875, -7.5859375, -5.984375, -4.3828125, -2.78125, -1.1796875, 0.421875, 2.0234375, 3.625, 5.2265625, 6.828125, 8.4296875, 10.03125, 11.6328125, 13.234375, 14.8359375, 16.4375, 18.0390625, 19.640625, 21.2421875, 22.84375, 24.4453125, 26.046875, 27.6484375, 29.25, 30.8515625, 32.453125, 34.0546875, 35.65625, 37.2578125, 38.859375, 40.4609375, 42.0625, 43.6640625, 45.265625, 46.8671875, 48.46875, 50.0703125, 51.671875, 53.2734375, 54.875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 19.0, 15.0, 24.0, 43.0, 53.0, 65.0, 75.0, 69.0, 98.0, 100.0, 84.0, 77.0, 79.0, 58.0, 40.0, 26.0, 22.0, 9.0, 14.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.62493896484375, -7.3709716796875, -7.11700439453125, -6.863037109375, -6.60906982421875, -6.3551025390625, -6.10113525390625, -5.84716796875, -5.59320068359375, -5.3392333984375, -5.08526611328125, -4.831298828125, -4.57733154296875, -4.3233642578125, -4.06939697265625, -3.8154296875, -3.56146240234375, -3.3074951171875, -3.05352783203125, -2.799560546875, -2.54559326171875, -2.2916259765625, -2.03765869140625, -1.78369140625, -1.52972412109375, -1.2757568359375, -1.02178955078125, -0.767822265625, -0.51385498046875, -0.2598876953125, -0.00592041015625, 0.248046875, 0.50201416015625, 0.7559814453125, 1.00994873046875, 1.263916015625, 1.51788330078125, 1.7718505859375, 2.02581787109375, 2.27978515625, 2.53375244140625, 2.7877197265625, 3.04168701171875, 3.295654296875, 3.54962158203125, 3.8035888671875, 4.05755615234375, 4.3115234375, 4.56549072265625, 4.8194580078125, 5.07342529296875, 5.327392578125, 5.58135986328125, 5.8353271484375, 6.08929443359375, 6.34326171875, 6.59722900390625, 6.8511962890625, 7.10516357421875, 7.359130859375, 7.61309814453125, 7.8670654296875, 8.12103271484375, 8.375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 1.0, 5.0, 5.0, 8.0, 12.0, 12.0, 21.0, 27.0, 26.0, 36.0, 57.0, 69.0, 104.0, 166.0, 200.0, 307.0, 526.0, 922.0, 1665.0, 3151.0, 6965.0, 16274.0, 43733.0, 146577.0, 1279774.0, 2448249.0, 164017.0, 48090.0, 17865.0, 7693.0, 3468.0, 1797.0, 913.0, 546.0, 336.0, 188.0, 139.0, 95.0, 81.0, 41.0, 23.0, 25.0, 20.0, 8.0, 16.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.03125, -32.031494140625, -31.03173828125, -30.031982421875, -29.0322265625, -28.032470703125, -27.03271484375, -26.032958984375, -25.033203125, -24.033447265625, -23.03369140625, -22.033935546875, -21.0341796875, -20.034423828125, -19.03466796875, -18.034912109375, -17.03515625, -16.035400390625, -15.03564453125, -14.035888671875, -13.0361328125, -12.036376953125, -11.03662109375, -10.036865234375, -9.037109375, -8.037353515625, -7.03759765625, -6.037841796875, -5.0380859375, -4.038330078125, -3.03857421875, -2.038818359375, -1.0390625, -0.039306640625, 0.96044921875, 1.960205078125, 2.9599609375, 3.959716796875, 4.95947265625, 5.959228515625, 6.958984375, 7.958740234375, 8.95849609375, 9.958251953125, 10.9580078125, 11.957763671875, 12.95751953125, 13.957275390625, 14.95703125, 15.956787109375, 16.95654296875, 17.956298828125, 18.9560546875, 19.955810546875, 20.95556640625, 21.955322265625, 22.955078125, 23.954833984375, 24.95458984375, 25.954345703125, 26.9541015625, 27.953857421875, 28.95361328125, 29.953369140625, 30.953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 10.0, 18.0, 23.0, 32.0, 66.0, 101.0, 229.0, 555.0, 2145.0, 452.0, 155.0, 107.0, 58.0, 35.0, 29.0, 20.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.8953857421875, -16.431396484375, -15.9674072265625, -15.50341796875, -15.0394287109375, -14.575439453125, -14.1114501953125, -13.6474609375, -13.1834716796875, -12.719482421875, -12.2554931640625, -11.79150390625, -11.3275146484375, -10.863525390625, -10.3995361328125, -9.935546875, -9.4715576171875, -9.007568359375, -8.5435791015625, -8.07958984375, -7.6156005859375, -7.151611328125, -6.6876220703125, -6.2236328125, -5.7596435546875, -5.295654296875, -4.8316650390625, -4.36767578125, -3.9036865234375, -3.439697265625, -2.9757080078125, -2.51171875, -2.0477294921875, -1.583740234375, -1.1197509765625, -0.65576171875, -0.1917724609375, 0.272216796875, 0.7362060546875, 1.2001953125, 1.6641845703125, 2.128173828125, 2.5921630859375, 3.05615234375, 3.5201416015625, 3.984130859375, 4.4481201171875, 4.912109375, 5.3760986328125, 5.840087890625, 6.3040771484375, 6.76806640625, 7.2320556640625, 7.696044921875, 8.1600341796875, 8.6240234375, 9.0880126953125, 9.552001953125, 10.0159912109375, 10.47998046875, 10.9439697265625, 11.407958984375, 11.8719482421875, 12.3359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 17.0, 27.0, 53.0, 109.0, 153.0, 180.0, 155.0, 125.0, 82.0, 50.0, 18.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.70103454589844, -126.7995376586914, -123.89804077148438, -120.99653625488281, -118.09503936767578, -115.19354248046875, -112.29204559326172, -109.39054870605469, -106.48904418945312, -103.5875473022461, -100.68605041503906, -97.7845458984375, -94.88304901123047, -91.98155212402344, -89.0800552368164, -86.17855834960938, -83.27706146240234, -80.37556457519531, -77.47406768798828, -74.57257080078125, -71.67106628417969, -68.76956939697266, -65.86807250976562, -62.966575622558594, -60.0650749206543, -57.163578033447266, -54.26207733154297, -51.36058044433594, -48.459083557128906, -45.55758285522461, -42.65608596801758, -39.75458526611328, -36.85308074951172, -33.95158386230469, -31.05008316040039, -28.14858627319336, -25.247087478637695, -22.34558868408203, -19.444091796875, -16.542593002319336, -13.641094207763672, -10.739595413208008, -7.83809757232666, -4.9365997314453125, -2.0351009368896484, 0.8663978576660156, 3.767894744873047, 6.669393539428711, 9.570892333984375, 12.472391128540039, 15.373888969421387, 18.275386810302734, 21.1768856048584, 24.078384399414062, 26.979881286621094, 29.881380081176758, 32.78287887573242, 35.68437576293945, 38.58587646484375, 41.48737335205078, 44.38887023925781, 47.29037094116211, 50.19186782836914, 53.09336853027344, 55.99486541748047]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 13.0, 16.0, 22.0, 28.0, 17.0, 24.0, 22.0, 25.0, 29.0, 46.0, 33.0, 52.0, 52.0, 56.0, 53.0, 59.0, 37.0, 51.0, 39.0, 41.0, 38.0, 37.0, 38.0, 32.0, 27.0, 23.0, 14.0, 13.0, 16.0, 12.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.12269973754883, -40.94355010986328, -39.764404296875, -38.58525466918945, -37.40610885620117, -36.226959228515625, -35.047813415527344, -33.8686637878418, -32.68951416015625, -31.510366439819336, -30.331218719482422, -29.152070999145508, -27.972923278808594, -26.793773651123047, -25.614625930786133, -24.43547821044922, -23.256332397460938, -22.077184677124023, -20.89803695678711, -19.718889236450195, -18.53974151611328, -17.360591888427734, -16.18144416809082, -15.002296447753906, -13.823148727416992, -12.644001007080078, -11.464853286743164, -10.285704612731934, -9.10655689239502, -7.9274091720581055, -6.748260974884033, -5.569112777709961, -4.3899688720703125, -3.2108209133148193, -2.031672954559326, -0.852524995803833, 0.32662296295166016, 1.5057706832885742, 2.6849188804626465, 3.8640670776367188, 5.043214797973633, 6.222362518310547, 7.401510715484619, 8.580658912658691, 9.759806632995605, 10.93895435333252, 12.11810302734375, 13.297250747680664, 14.476398468017578, 15.655546188354492, 16.834693908691406, 18.01384162902832, 19.192989349365234, 20.37213897705078, 21.551286697387695, 22.73043441772461, 23.909582138061523, 25.088729858398438, 26.26787757873535, 27.447025299072266, 28.626174926757812, 29.805320739746094, 30.98447036743164, 32.16361999511719, 33.34276580810547]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 13.0, 12.0, 11.0, 22.0, 30.0, 42.0, 76.0, 109.0, 115.0, 193.0, 241.0, 374.0, 644.0, 1127.0, 2273.0, 5123.0, 13063.0, 37406.0, 111186.0, 299889.0, 355985.0, 143196.0, 48151.0, 16811.0, 6356.0, 2707.0, 1329.0, 727.0, 448.0, 239.0, 199.0, 136.0, 94.0, 62.0, 36.0, 33.0, 19.0, 19.0, 8.0, 10.0, 12.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.875, -30.882568359375, -29.89013671875, -28.897705078125, -27.9052734375, -26.912841796875, -25.92041015625, -24.927978515625, -23.935546875, -22.943115234375, -21.95068359375, -20.958251953125, -19.9658203125, -18.973388671875, -17.98095703125, -16.988525390625, -15.99609375, -15.003662109375, -14.01123046875, -13.018798828125, -12.0263671875, -11.033935546875, -10.04150390625, -9.049072265625, -8.056640625, -7.064208984375, -6.07177734375, -5.079345703125, -4.0869140625, -3.094482421875, -2.10205078125, -1.109619140625, -0.1171875, 0.875244140625, 1.86767578125, 2.860107421875, 3.8525390625, 4.844970703125, 5.83740234375, 6.829833984375, 7.822265625, 8.814697265625, 9.80712890625, 10.799560546875, 11.7919921875, 12.784423828125, 13.77685546875, 14.769287109375, 15.76171875, 16.754150390625, 17.74658203125, 18.739013671875, 19.7314453125, 20.723876953125, 21.71630859375, 22.708740234375, 23.701171875, 24.693603515625, 25.68603515625, 26.678466796875, 27.6708984375, 28.663330078125, 29.65576171875, 30.648193359375, 31.640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 6.0, 10.0, 7.0, 22.0, 28.0, 35.0, 47.0, 56.0, 75.0, 90.0, 102.0, 121.0, 88.0, 76.0, 76.0, 61.0, 38.0, 17.0, 22.0, 10.0, 7.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.34375, -8.0657958984375, -7.787841796875, -7.5098876953125, -7.23193359375, -6.9539794921875, -6.676025390625, -6.3980712890625, -6.1201171875, -5.8421630859375, -5.564208984375, -5.2862548828125, -5.00830078125, -4.7303466796875, -4.452392578125, -4.1744384765625, -3.896484375, -3.6185302734375, -3.340576171875, -3.0626220703125, -2.78466796875, -2.5067138671875, -2.228759765625, -1.9508056640625, -1.6728515625, -1.3948974609375, -1.116943359375, -0.8389892578125, -0.56103515625, -0.2830810546875, -0.005126953125, 0.2728271484375, 0.55078125, 0.8287353515625, 1.106689453125, 1.3846435546875, 1.66259765625, 1.9405517578125, 2.218505859375, 2.4964599609375, 2.7744140625, 3.0523681640625, 3.330322265625, 3.6082763671875, 3.88623046875, 4.1641845703125, 4.442138671875, 4.7200927734375, 4.998046875, 5.2760009765625, 5.553955078125, 5.8319091796875, 6.10986328125, 6.3878173828125, 6.665771484375, 6.9437255859375, 7.2216796875, 7.4996337890625, 7.777587890625, 8.0555419921875, 8.33349609375, 8.6114501953125, 8.889404296875, 9.1673583984375, 9.4453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 8.0, 18.0, 26.0, 30.0, 40.0, 68.0, 114.0, 155.0, 254.0, 395.0, 683.0, 1058.0, 1795.0, 3520.0, 6893.0, 15314.0, 36679.0, 87755.0, 193174.0, 316057.0, 211300.0, 98146.0, 41208.0, 17380.0, 7675.0, 3787.0, 1910.0, 1126.0, 720.0, 436.0, 279.0, 196.0, 111.0, 72.0, 61.0, 35.0, 19.0, 14.0, 14.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.71875, -20.08251953125, -19.4462890625, -18.81005859375, -18.173828125, -17.53759765625, -16.9013671875, -16.26513671875, -15.62890625, -14.99267578125, -14.3564453125, -13.72021484375, -13.083984375, -12.44775390625, -11.8115234375, -11.17529296875, -10.5390625, -9.90283203125, -9.2666015625, -8.63037109375, -7.994140625, -7.35791015625, -6.7216796875, -6.08544921875, -5.44921875, -4.81298828125, -4.1767578125, -3.54052734375, -2.904296875, -2.26806640625, -1.6318359375, -0.99560546875, -0.359375, 0.27685546875, 0.9130859375, 1.54931640625, 2.185546875, 2.82177734375, 3.4580078125, 4.09423828125, 4.73046875, 5.36669921875, 6.0029296875, 6.63916015625, 7.275390625, 7.91162109375, 8.5478515625, 9.18408203125, 9.8203125, 10.45654296875, 11.0927734375, 11.72900390625, 12.365234375, 13.00146484375, 13.6376953125, 14.27392578125, 14.91015625, 15.54638671875, 16.1826171875, 16.81884765625, 17.455078125, 18.09130859375, 18.7275390625, 19.36376953125, 20.0]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 9.0, 18.0, 23.0, 19.0, 18.0, 24.0, 39.0, 41.0, 41.0, 45.0, 49.0, 48.0, 44.0, 79.0, 55.0, 54.0, 45.0, 46.0, 44.0, 41.0, 26.0, 36.0, 28.0, 19.0, 13.0, 17.0, 15.0, 15.0, 11.0, 4.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.28076171875, -17.5927734375, -16.90478515625, -16.216796875, -15.52880859375, -14.8408203125, -14.15283203125, -13.46484375, -12.77685546875, -12.0888671875, -11.40087890625, -10.712890625, -10.02490234375, -9.3369140625, -8.64892578125, -7.9609375, -7.27294921875, -6.5849609375, -5.89697265625, -5.208984375, -4.52099609375, -3.8330078125, -3.14501953125, -2.45703125, -1.76904296875, -1.0810546875, -0.39306640625, 0.294921875, 0.98291015625, 1.6708984375, 2.35888671875, 3.046875, 3.73486328125, 4.4228515625, 5.11083984375, 5.798828125, 6.48681640625, 7.1748046875, 7.86279296875, 8.55078125, 9.23876953125, 9.9267578125, 10.61474609375, 11.302734375, 11.99072265625, 12.6787109375, 13.36669921875, 14.0546875, 14.74267578125, 15.4306640625, 16.11865234375, 16.806640625, 17.49462890625, 18.1826171875, 18.87060546875, 19.55859375, 20.24658203125, 20.9345703125, 21.62255859375, 22.310546875, 22.99853515625, 23.6865234375, 24.37451171875, 25.0625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 14.0, 32.0, 25.0, 54.0, 98.0, 181.0, 321.0, 690.0, 1609.0, 4611.0, 15995.0, 67960.0, 338909.0, 470499.0, 113143.0, 23813.0, 6600.0, 2194.0, 871.0, 385.0, 200.0, 109.0, 73.0, 39.0, 32.0, 15.0, 15.0, 11.0, 12.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.6015625, -15.1309814453125, -14.660400390625, -14.1898193359375, -13.71923828125, -13.2486572265625, -12.778076171875, -12.3074951171875, -11.8369140625, -11.3663330078125, -10.895751953125, -10.4251708984375, -9.95458984375, -9.4840087890625, -9.013427734375, -8.5428466796875, -8.072265625, -7.6016845703125, -7.131103515625, -6.6605224609375, -6.18994140625, -5.7193603515625, -5.248779296875, -4.7781982421875, -4.3076171875, -3.8370361328125, -3.366455078125, -2.8958740234375, -2.42529296875, -1.9547119140625, -1.484130859375, -1.0135498046875, -0.54296875, -0.0723876953125, 0.398193359375, 0.8687744140625, 1.33935546875, 1.8099365234375, 2.280517578125, 2.7510986328125, 3.2216796875, 3.6922607421875, 4.162841796875, 4.6334228515625, 5.10400390625, 5.5745849609375, 6.045166015625, 6.5157470703125, 6.986328125, 7.4569091796875, 7.927490234375, 8.3980712890625, 8.86865234375, 9.3392333984375, 9.809814453125, 10.2803955078125, 10.7509765625, 11.2215576171875, 11.692138671875, 12.1627197265625, 12.63330078125, 13.1038818359375, 13.574462890625, 14.0450439453125, 14.515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 11.0, 11.0, 17.0, 23.0, 41.0, 44.0, 54.0, 102.0, 120.0, 137.0, 118.0, 90.0, 55.0, 46.0, 31.0, 20.0, 18.0, 15.0, 11.0, 4.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00229644775390625, -0.0022152066230773926, -0.002133965492248535, -0.0020527243614196777, -0.0019714832305908203, -0.0018902420997619629, -0.0018090009689331055, -0.001727759838104248, -0.0016465187072753906, -0.0015652775764465332, -0.0014840364456176758, -0.0014027953147888184, -0.001321554183959961, -0.0012403130531311035, -0.001159071922302246, -0.0010778307914733887, -0.0009965896606445312, -0.0009153485298156738, -0.0008341073989868164, -0.000752866268157959, -0.0006716251373291016, -0.0005903840065002441, -0.0005091428756713867, -0.0004279017448425293, -0.0003466606140136719, -0.00026541948318481445, -0.00018417835235595703, -0.00010293722152709961, -2.1696090698242188e-05, 5.9545040130615234e-05, 0.00014078617095947266, 0.00022202730178833008, 0.0003032684326171875, 0.0003845095634460449, 0.00046575069427490234, 0.0005469918251037598, 0.0006282329559326172, 0.0007094740867614746, 0.000790715217590332, 0.0008719563484191895, 0.0009531974792480469, 0.0010344386100769043, 0.0011156797409057617, 0.0011969208717346191, 0.0012781620025634766, 0.001359403133392334, 0.0014406442642211914, 0.0015218853950500488, 0.0016031265258789062, 0.0016843676567077637, 0.001765608787536621, 0.0018468499183654785, 0.001928091049194336, 0.0020093321800231934, 0.0020905733108520508, 0.002171814441680908, 0.0022530555725097656, 0.002334296703338623, 0.0024155378341674805, 0.002496778964996338, 0.0025780200958251953, 0.0026592612266540527, 0.00274050235748291, 0.0028217434883117676, 0.002902984619140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 9.0, 10.0, 15.0, 20.0, 16.0, 29.0, 51.0, 88.0, 129.0, 193.0, 374.0, 660.0, 1385.0, 2882.0, 8303.0, 30649.0, 161063.0, 591567.0, 199003.0, 36291.0, 9456.0, 3253.0, 1396.0, 710.0, 406.0, 210.0, 119.0, 89.0, 52.0, 28.0, 26.0, 21.0, 12.0, 12.0, 1.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.390625, -16.8564453125, -16.322265625, -15.7880859375, -15.25390625, -14.7197265625, -14.185546875, -13.6513671875, -13.1171875, -12.5830078125, -12.048828125, -11.5146484375, -10.98046875, -10.4462890625, -9.912109375, -9.3779296875, -8.84375, -8.3095703125, -7.775390625, -7.2412109375, -6.70703125, -6.1728515625, -5.638671875, -5.1044921875, -4.5703125, -4.0361328125, -3.501953125, -2.9677734375, -2.43359375, -1.8994140625, -1.365234375, -0.8310546875, -0.296875, 0.2373046875, 0.771484375, 1.3056640625, 1.83984375, 2.3740234375, 2.908203125, 3.4423828125, 3.9765625, 4.5107421875, 5.044921875, 5.5791015625, 6.11328125, 6.6474609375, 7.181640625, 7.7158203125, 8.25, 8.7841796875, 9.318359375, 9.8525390625, 10.38671875, 10.9208984375, 11.455078125, 11.9892578125, 12.5234375, 13.0576171875, 13.591796875, 14.1259765625, 14.66015625, 15.1943359375, 15.728515625, 16.2626953125, 16.796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 7.0, 7.0, 8.0, 7.0, 8.0, 9.0, 14.0, 17.0, 28.0, 35.0, 43.0, 48.0, 62.0, 73.0, 67.0, 83.0, 80.0, 64.0, 80.0, 47.0, 57.0, 39.0, 25.0, 20.0, 16.0, 15.0, 12.0, 6.0, 6.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.92919921875, -6.6708984375, -6.41259765625, -6.154296875, -5.89599609375, -5.6376953125, -5.37939453125, -5.12109375, -4.86279296875, -4.6044921875, -4.34619140625, -4.087890625, -3.82958984375, -3.5712890625, -3.31298828125, -3.0546875, -2.79638671875, -2.5380859375, -2.27978515625, -2.021484375, -1.76318359375, -1.5048828125, -1.24658203125, -0.98828125, -0.72998046875, -0.4716796875, -0.21337890625, 0.044921875, 0.30322265625, 0.5615234375, 0.81982421875, 1.078125, 1.33642578125, 1.5947265625, 1.85302734375, 2.111328125, 2.36962890625, 2.6279296875, 2.88623046875, 3.14453125, 3.40283203125, 3.6611328125, 3.91943359375, 4.177734375, 4.43603515625, 4.6943359375, 4.95263671875, 5.2109375, 5.46923828125, 5.7275390625, 5.98583984375, 6.244140625, 6.50244140625, 6.7607421875, 7.01904296875, 7.27734375, 7.53564453125, 7.7939453125, 8.05224609375, 8.310546875, 8.56884765625, 8.8271484375, 9.08544921875, 9.34375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 11.0, 17.0, 26.0, 41.0, 51.0, 56.0, 64.0, 104.0, 106.0, 98.0, 94.0, 71.0, 84.0, 49.0, 42.0, 21.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.43487548828125, -136.9160919189453, -132.39732360839844, -127.8785400390625, -123.3597640991211, -118.84098815917969, -114.32220458984375, -109.80342864990234, -105.28465270996094, -100.76587677001953, -96.2470932006836, -91.72831726074219, -87.20954132080078, -82.69076538085938, -78.17198181152344, -73.65320587158203, -69.1344223022461, -64.61564636230469, -60.096866607666016, -55.578086853027344, -51.05931091308594, -46.540531158447266, -42.021751403808594, -37.50297546386719, -32.984195709228516, -28.465417861938477, -23.946640014648438, -19.427860260009766, -14.909082412719727, -10.390304565429688, -5.871524810791016, -1.3527469635009766, 3.1660308837890625, 7.68480920791626, 12.203587532043457, 16.722366333007812, 21.24114418029785, 25.75992202758789, 30.278701782226562, 34.79747772216797, 39.31625747680664, 43.83503723144531, 48.35381317138672, 52.87259292602539, 57.39137268066406, 61.91014862060547, 66.42892456054688, 70.94770812988281, 75.46648406982422, 79.98526000976562, 84.50404357910156, 89.02281951904297, 93.54159545898438, 98.06037902832031, 102.57915496826172, 107.09793090820312, 111.61671447753906, 116.13549041748047, 120.6542739868164, 125.17304992675781, 129.69183349609375, 134.21060180664062, 138.72938537597656, 143.2481689453125, 147.76693725585938]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 2.0, 8.0, 10.0, 9.0, 26.0, 14.0, 27.0, 23.0, 26.0, 31.0, 39.0, 37.0, 38.0, 45.0, 40.0, 34.0, 56.0, 33.0, 41.0, 34.0, 47.0, 55.0, 40.0, 34.0, 35.0, 34.0, 26.0, 23.0, 13.0, 20.0, 14.0, 16.0, 12.0, 10.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.88111877441406, -95.6190185546875, -92.35691833496094, -89.09481811523438, -85.83271026611328, -82.57061004638672, -79.30850982666016, -76.0464096069336, -72.7843017578125, -69.52220153808594, -66.26010131835938, -62.99799728393555, -59.73589324951172, -56.473793029785156, -53.211692810058594, -49.94959259033203, -46.68749237060547, -43.425392150878906, -40.16328811645508, -36.901187896728516, -33.63908386230469, -30.376983642578125, -27.114883422851562, -23.852781295776367, -20.590679168701172, -17.328577041625977, -14.066475868225098, -10.804374694824219, -7.542272567749023, -4.280170440673828, -1.0180702209472656, 2.2440319061279297, 5.506134033203125, 8.76823616027832, 12.0303373336792, 15.292438507080078, 18.554540634155273, 21.81664276123047, 25.07874298095703, 28.340845108032227, 31.602947235107422, 34.865047454833984, 38.12715148925781, 41.389251708984375, 44.65135192871094, 47.913455963134766, 51.17555618286133, 54.437660217285156, 57.69976043701172, 60.96186065673828, 64.22396087646484, 67.48606872558594, 70.7481689453125, 74.01026916503906, 77.27236938476562, 80.53446960449219, 83.79656982421875, 87.05867004394531, 90.32077026367188, 93.58287048339844, 96.84497833251953, 100.1070785522461, 103.36917877197266, 106.63127899169922, 109.89338684082031]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 11.0, 16.0, 21.0, 14.0, 30.0, 43.0, 57.0, 112.0, 164.0, 267.0, 478.0, 904.0, 1771.0, 3656.0, 8923.0, 26100.0, 107766.0, 2593141.0, 1314425.0, 97563.0, 23821.0, 8198.0, 3402.0, 1500.0, 750.0, 427.0, 225.0, 135.0, 92.0, 70.0, 37.0, 37.0, 27.0, 17.0, 13.0, 13.0, 11.0, 10.0, 8.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.6875, -40.29638671875, -38.9052734375, -37.51416015625, -36.123046875, -34.73193359375, -33.3408203125, -31.94970703125, -30.55859375, -29.16748046875, -27.7763671875, -26.38525390625, -24.994140625, -23.60302734375, -22.2119140625, -20.82080078125, -19.4296875, -18.03857421875, -16.6474609375, -15.25634765625, -13.865234375, -12.47412109375, -11.0830078125, -9.69189453125, -8.30078125, -6.90966796875, -5.5185546875, -4.12744140625, -2.736328125, -1.34521484375, 0.0458984375, 1.43701171875, 2.828125, 4.21923828125, 5.6103515625, 7.00146484375, 8.392578125, 9.78369140625, 11.1748046875, 12.56591796875, 13.95703125, 15.34814453125, 16.7392578125, 18.13037109375, 19.521484375, 20.91259765625, 22.3037109375, 23.69482421875, 25.0859375, 26.47705078125, 27.8681640625, 29.25927734375, 30.650390625, 32.04150390625, 33.4326171875, 34.82373046875, 36.21484375, 37.60595703125, 38.9970703125, 40.38818359375, 41.779296875, 43.17041015625, 44.5615234375, 45.95263671875, 47.34375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 3.0, 11.0, 18.0, 30.0, 29.0, 46.0, 66.0, 68.0, 93.0, 89.0, 109.0, 98.0, 72.0, 79.0, 71.0, 37.0, 36.0, 20.0, 11.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.591552734375, -8.31591796875, -8.040283203125, -7.7646484375, -7.489013671875, -7.21337890625, -6.937744140625, -6.662109375, -6.386474609375, -6.11083984375, -5.835205078125, -5.5595703125, -5.283935546875, -5.00830078125, -4.732666015625, -4.45703125, -4.181396484375, -3.90576171875, -3.630126953125, -3.3544921875, -3.078857421875, -2.80322265625, -2.527587890625, -2.251953125, -1.976318359375, -1.70068359375, -1.425048828125, -1.1494140625, -0.873779296875, -0.59814453125, -0.322509765625, -0.046875, 0.228759765625, 0.50439453125, 0.780029296875, 1.0556640625, 1.331298828125, 1.60693359375, 1.882568359375, 2.158203125, 2.433837890625, 2.70947265625, 2.985107421875, 3.2607421875, 3.536376953125, 3.81201171875, 4.087646484375, 4.36328125, 4.638916015625, 4.91455078125, 5.190185546875, 5.4658203125, 5.741455078125, 6.01708984375, 6.292724609375, 6.568359375, 6.843994140625, 7.11962890625, 7.395263671875, 7.6708984375, 7.946533203125, 8.22216796875, 8.497802734375, 8.7734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 15.0, 26.0, 46.0, 69.0, 103.0, 155.0, 264.0, 493.0, 983.0, 2519.0, 8486.0, 44795.0, 708405.0, 3302595.0, 103714.0, 14623.0, 3831.0, 1508.0, 703.0, 375.0, 219.0, 106.0, 94.0, 50.0, 29.0, 24.0, 11.0, 13.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.21875, -61.369140625, -59.51953125, -57.669921875, -55.8203125, -53.970703125, -52.12109375, -50.271484375, -48.421875, -46.572265625, -44.72265625, -42.873046875, -41.0234375, -39.173828125, -37.32421875, -35.474609375, -33.625, -31.775390625, -29.92578125, -28.076171875, -26.2265625, -24.376953125, -22.52734375, -20.677734375, -18.828125, -16.978515625, -15.12890625, -13.279296875, -11.4296875, -9.580078125, -7.73046875, -5.880859375, -4.03125, -2.181640625, -0.33203125, 1.517578125, 3.3671875, 5.216796875, 7.06640625, 8.916015625, 10.765625, 12.615234375, 14.46484375, 16.314453125, 18.1640625, 20.013671875, 21.86328125, 23.712890625, 25.5625, 27.412109375, 29.26171875, 31.111328125, 32.9609375, 34.810546875, 36.66015625, 38.509765625, 40.359375, 42.208984375, 44.05859375, 45.908203125, 47.7578125, 49.607421875, 51.45703125, 53.306640625, 55.15625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 14.0, 14.0, 32.0, 83.0, 133.0, 341.0, 1258.0, 1475.0, 376.0, 158.0, 82.0, 33.0, 27.0, 14.0, 11.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.742431640625, -18.95361328125, -18.164794921875, -17.3759765625, -16.587158203125, -15.79833984375, -15.009521484375, -14.220703125, -13.431884765625, -12.64306640625, -11.854248046875, -11.0654296875, -10.276611328125, -9.48779296875, -8.698974609375, -7.91015625, -7.121337890625, -6.33251953125, -5.543701171875, -4.7548828125, -3.966064453125, -3.17724609375, -2.388427734375, -1.599609375, -0.810791015625, -0.02197265625, 0.766845703125, 1.5556640625, 2.344482421875, 3.13330078125, 3.922119140625, 4.7109375, 5.499755859375, 6.28857421875, 7.077392578125, 7.8662109375, 8.655029296875, 9.44384765625, 10.232666015625, 11.021484375, 11.810302734375, 12.59912109375, 13.387939453125, 14.1767578125, 14.965576171875, 15.75439453125, 16.543212890625, 17.33203125, 18.120849609375, 18.90966796875, 19.698486328125, 20.4873046875, 21.276123046875, 22.06494140625, 22.853759765625, 23.642578125, 24.431396484375, 25.22021484375, 26.009033203125, 26.7978515625, 27.586669921875, 28.37548828125, 29.164306640625, 29.953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 9.0, 19.0, 29.0, 52.0, 81.0, 112.0, 134.0, 138.0, 126.0, 99.0, 81.0, 44.0, 28.0, 21.0, 12.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.51722717285156, -123.79232788085938, -120.06743621826172, -116.34253692626953, -112.61764526367188, -108.89274597167969, -105.1678466796875, -101.44294738769531, -97.71805572509766, -93.99315643310547, -90.26826477050781, -86.54336547851562, -82.81846618652344, -79.09357452392578, -75.3686752319336, -71.64378356933594, -67.91888427734375, -64.19398498535156, -60.469093322753906, -56.74419403076172, -53.0192985534668, -49.294403076171875, -45.56950378417969, -41.844608306884766, -38.119712829589844, -34.39481735229492, -30.669919967651367, -26.945022583007812, -23.22012710571289, -19.49523162841797, -15.770334243774414, -12.04543685913086, -8.320549011230469, -4.5956525802612305, -0.8707561492919922, 2.854140281677246, 6.579036712646484, 10.303932189941406, 14.028829574584961, 17.753726959228516, 21.478622436523438, 25.20351791381836, 28.928415298461914, 32.65331268310547, 36.37820816040039, 40.10310363769531, 43.8280029296875, 47.55289840698242, 51.277793884277344, 55.002689361572266, 58.72758483886719, 62.452484130859375, 66.17738342285156, 69.90227508544922, 73.6271743774414, 77.35206604003906, 81.07696533203125, 84.80186462402344, 88.5267562866211, 92.25165557861328, 95.97654724121094, 99.70144653320312, 103.42634582519531, 107.1512451171875, 110.87613677978516]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 13.0, 23.0, 24.0, 30.0, 54.0, 58.0, 63.0, 62.0, 68.0, 85.0, 96.0, 88.0, 61.0, 64.0, 48.0, 34.0, 35.0, 21.0, 17.0, 20.0, 13.0, 3.0, 1.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.40766143798828, -96.59231567382812, -93.77696228027344, -90.96161651611328, -88.14627075195312, -85.33092498779297, -82.51557922363281, -79.70022583007812, -76.88488006591797, -74.06953430175781, -71.25418090820312, -68.43883514404297, -65.62348937988281, -62.808143615722656, -59.992794036865234, -57.17744445800781, -54.362098693847656, -51.5467529296875, -48.73140335083008, -45.916053771972656, -43.1007080078125, -40.285362243652344, -37.47001266479492, -34.6546630859375, -31.839317321777344, -29.023969650268555, -26.208621978759766, -23.393274307250977, -20.577926635742188, -17.7625789642334, -14.94723129272461, -12.13188362121582, -9.3165283203125, -6.501180648803711, -3.685832977294922, -0.8704853057861328, 1.9448623657226562, 4.760210037231445, 7.575557708740234, 10.390905380249023, 13.206253051757812, 16.0216007232666, 18.83694839477539, 21.65229606628418, 24.46764373779297, 27.282991409301758, 30.098339080810547, 32.91368865966797, 35.729034423828125, 38.54438018798828, 41.3597297668457, 44.175079345703125, 46.99042510986328, 49.80577087402344, 52.62112045288086, 55.43647003173828, 58.25181579589844, 61.067161560058594, 63.882511138916016, 66.69786071777344, 69.5132064819336, 72.32855224609375, 75.14390563964844, 77.9592514038086, 80.77459716796875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 10.0, 15.0, 24.0, 50.0, 85.0, 106.0, 238.0, 374.0, 715.0, 1457.0, 3838.0, 16806.0, 112253.0, 629587.0, 239385.0, 33373.0, 6194.0, 1991.0, 934.0, 471.0, 267.0, 146.0, 90.0, 56.0, 31.0, 16.0, 7.0, 8.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-82.1875, -80.11669921875, -78.0458984375, -75.97509765625, -73.904296875, -71.83349609375, -69.7626953125, -67.69189453125, -65.62109375, -63.55029296875, -61.4794921875, -59.40869140625, -57.337890625, -55.26708984375, -53.1962890625, -51.12548828125, -49.0546875, -46.98388671875, -44.9130859375, -42.84228515625, -40.771484375, -38.70068359375, -36.6298828125, -34.55908203125, -32.48828125, -30.41748046875, -28.3466796875, -26.27587890625, -24.205078125, -22.13427734375, -20.0634765625, -17.99267578125, -15.921875, -13.85107421875, -11.7802734375, -9.70947265625, -7.638671875, -5.56787109375, -3.4970703125, -1.42626953125, 0.64453125, 2.71533203125, 4.7861328125, 6.85693359375, 8.927734375, 10.99853515625, 13.0693359375, 15.14013671875, 17.2109375, 19.28173828125, 21.3525390625, 23.42333984375, 25.494140625, 27.56494140625, 29.6357421875, 31.70654296875, 33.77734375, 35.84814453125, 37.9189453125, 39.98974609375, 42.060546875, 44.13134765625, 46.2021484375, 48.27294921875, 50.34375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 18.0, 17.0, 32.0, 54.0, 61.0, 93.0, 96.0, 113.0, 107.0, 94.0, 89.0, 69.0, 56.0, 32.0, 24.0, 19.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.3939208984375, -8.092529296875, -7.7911376953125, -7.48974609375, -7.1883544921875, -6.886962890625, -6.5855712890625, -6.2841796875, -5.9827880859375, -5.681396484375, -5.3800048828125, -5.07861328125, -4.7772216796875, -4.475830078125, -4.1744384765625, -3.873046875, -3.5716552734375, -3.270263671875, -2.9688720703125, -2.66748046875, -2.3660888671875, -2.064697265625, -1.7633056640625, -1.4619140625, -1.1605224609375, -0.859130859375, -0.5577392578125, -0.25634765625, 0.0450439453125, 0.346435546875, 0.6478271484375, 0.94921875, 1.2506103515625, 1.552001953125, 1.8533935546875, 2.15478515625, 2.4561767578125, 2.757568359375, 3.0589599609375, 3.3603515625, 3.6617431640625, 3.963134765625, 4.2645263671875, 4.56591796875, 4.8673095703125, 5.168701171875, 5.4700927734375, 5.771484375, 6.0728759765625, 6.374267578125, 6.6756591796875, 6.97705078125, 7.2784423828125, 7.579833984375, 7.8812255859375, 8.1826171875, 8.4840087890625, 8.785400390625, 9.0867919921875, 9.38818359375, 9.6895751953125, 9.990966796875, 10.2923583984375, 10.59375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 17.0, 17.0, 25.0, 53.0, 75.0, 135.0, 212.0, 336.0, 600.0, 1182.0, 2286.0, 4775.0, 11130.0, 26591.0, 64900.0, 156769.0, 342762.0, 254668.0, 106116.0, 43504.0, 17756.0, 7613.0, 3351.0, 1585.0, 868.0, 490.0, 274.0, 137.0, 111.0, 69.0, 43.0, 32.0, 23.0, 17.0, 9.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.691162109375, -17.05419921875, -16.417236328125, -15.7802734375, -15.143310546875, -14.50634765625, -13.869384765625, -13.232421875, -12.595458984375, -11.95849609375, -11.321533203125, -10.6845703125, -10.047607421875, -9.41064453125, -8.773681640625, -8.13671875, -7.499755859375, -6.86279296875, -6.225830078125, -5.5888671875, -4.951904296875, -4.31494140625, -3.677978515625, -3.041015625, -2.404052734375, -1.76708984375, -1.130126953125, -0.4931640625, 0.143798828125, 0.78076171875, 1.417724609375, 2.0546875, 2.691650390625, 3.32861328125, 3.965576171875, 4.6025390625, 5.239501953125, 5.87646484375, 6.513427734375, 7.150390625, 7.787353515625, 8.42431640625, 9.061279296875, 9.6982421875, 10.335205078125, 10.97216796875, 11.609130859375, 12.24609375, 12.883056640625, 13.52001953125, 14.156982421875, 14.7939453125, 15.430908203125, 16.06787109375, 16.704833984375, 17.341796875, 17.978759765625, 18.61572265625, 19.252685546875, 19.8896484375, 20.526611328125, 21.16357421875, 21.800537109375, 22.4375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 8.0, 13.0, 6.0, 15.0, 19.0, 21.0, 27.0, 12.0, 24.0, 15.0, 24.0, 33.0, 29.0, 29.0, 27.0, 35.0, 29.0, 48.0, 42.0, 35.0, 34.0, 43.0, 37.0, 28.0, 37.0, 35.0, 33.0, 33.0, 23.0, 21.0, 25.0, 11.0, 23.0, 22.0, 16.0, 8.0, 12.0, 14.0, 10.0, 2.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.359375, -13.9122314453125, -13.465087890625, -13.0179443359375, -12.57080078125, -12.1236572265625, -11.676513671875, -11.2293701171875, -10.7822265625, -10.3350830078125, -9.887939453125, -9.4407958984375, -8.99365234375, -8.5465087890625, -8.099365234375, -7.6522216796875, -7.205078125, -6.7579345703125, -6.310791015625, -5.8636474609375, -5.41650390625, -4.9693603515625, -4.522216796875, -4.0750732421875, -3.6279296875, -3.1807861328125, -2.733642578125, -2.2864990234375, -1.83935546875, -1.3922119140625, -0.945068359375, -0.4979248046875, -0.05078125, 0.3963623046875, 0.843505859375, 1.2906494140625, 1.73779296875, 2.1849365234375, 2.632080078125, 3.0792236328125, 3.5263671875, 3.9735107421875, 4.420654296875, 4.8677978515625, 5.31494140625, 5.7620849609375, 6.209228515625, 6.6563720703125, 7.103515625, 7.5506591796875, 7.997802734375, 8.4449462890625, 8.89208984375, 9.3392333984375, 9.786376953125, 10.2335205078125, 10.6806640625, 11.1278076171875, 11.574951171875, 12.0220947265625, 12.46923828125, 12.9163818359375, 13.363525390625, 13.8106689453125, 14.2578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 11.0, 4.0, 8.0, 15.0, 25.0, 31.0, 80.0, 110.0, 199.0, 406.0, 804.0, 1911.0, 5373.0, 19338.0, 98804.0, 519117.0, 331120.0, 52741.0, 12033.0, 3717.0, 1374.0, 624.0, 313.0, 152.0, 116.0, 58.0, 18.0, 21.0, 9.0, 8.0, 6.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.46875, -17.888427734375, -17.30810546875, -16.727783203125, -16.1474609375, -15.567138671875, -14.98681640625, -14.406494140625, -13.826171875, -13.245849609375, -12.66552734375, -12.085205078125, -11.5048828125, -10.924560546875, -10.34423828125, -9.763916015625, -9.18359375, -8.603271484375, -8.02294921875, -7.442626953125, -6.8623046875, -6.281982421875, -5.70166015625, -5.121337890625, -4.541015625, -3.960693359375, -3.38037109375, -2.800048828125, -2.2197265625, -1.639404296875, -1.05908203125, -0.478759765625, 0.1015625, 0.681884765625, 1.26220703125, 1.842529296875, 2.4228515625, 3.003173828125, 3.58349609375, 4.163818359375, 4.744140625, 5.324462890625, 5.90478515625, 6.485107421875, 7.0654296875, 7.645751953125, 8.22607421875, 8.806396484375, 9.38671875, 9.967041015625, 10.54736328125, 11.127685546875, 11.7080078125, 12.288330078125, 12.86865234375, 13.448974609375, 14.029296875, 14.609619140625, 15.18994140625, 15.770263671875, 16.3505859375, 16.930908203125, 17.51123046875, 18.091552734375, 18.671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 8.0, 3.0, 8.0, 15.0, 17.0, 15.0, 22.0, 29.0, 35.0, 62.0, 52.0, 89.0, 113.0, 117.0, 96.0, 56.0, 47.0, 46.0, 31.0, 17.0, 21.0, 16.0, 20.0, 13.0, 6.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002231597900390625, -0.0021696239709854126, -0.0021076500415802, -0.002045676112174988, -0.0019837021827697754, -0.001921728253364563, -0.0018597543239593506, -0.0017977803945541382, -0.0017358064651489258, -0.0016738325357437134, -0.001611858606338501, -0.0015498846769332886, -0.0014879107475280762, -0.0014259368181228638, -0.0013639628887176514, -0.001301988959312439, -0.0012400150299072266, -0.0011780411005020142, -0.0011160671710968018, -0.0010540932416915894, -0.000992119312286377, -0.0009301453828811646, -0.0008681714534759521, -0.0008061975240707397, -0.0007442235946655273, -0.0006822496652603149, -0.0006202757358551025, -0.0005583018064498901, -0.0004963278770446777, -0.00043435394763946533, -0.00037238001823425293, -0.00031040608882904053, -0.0002484321594238281, -0.00018645823001861572, -0.00012448430061340332, -6.251037120819092e-05, -5.364418029785156e-07, 6.143748760223389e-05, 0.0001234114170074463, 0.0001853853464126587, 0.0002473592758178711, 0.0003093332052230835, 0.0003713071346282959, 0.0004332810640335083, 0.0004952549934387207, 0.0005572289228439331, 0.0006192028522491455, 0.0006811767816543579, 0.0007431507110595703, 0.0008051246404647827, 0.0008670985698699951, 0.0009290724992752075, 0.00099104642868042, 0.0010530203580856323, 0.0011149942874908447, 0.0011769682168960571, 0.0012389421463012695, 0.001300916075706482, 0.0013628900051116943, 0.0014248639345169067, 0.0014868378639221191, 0.0015488117933273315, 0.001610785722732544, 0.0016727596521377563, 0.0017347335815429688]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 10.0, 11.0, 13.0, 23.0, 29.0, 51.0, 81.0, 146.0, 247.0, 455.0, 783.0, 1626.0, 3616.0, 9609.0, 31163.0, 131027.0, 484661.0, 292777.0, 63755.0, 17267.0, 6078.0, 2467.0, 1208.0, 574.0, 336.0, 203.0, 110.0, 73.0, 61.0, 27.0, 21.0, 18.0, 8.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-15.6328125, -15.1697998046875, -14.706787109375, -14.2437744140625, -13.78076171875, -13.3177490234375, -12.854736328125, -12.3917236328125, -11.9287109375, -11.4656982421875, -11.002685546875, -10.5396728515625, -10.07666015625, -9.6136474609375, -9.150634765625, -8.6876220703125, -8.224609375, -7.7615966796875, -7.298583984375, -6.8355712890625, -6.37255859375, -5.9095458984375, -5.446533203125, -4.9835205078125, -4.5205078125, -4.0574951171875, -3.594482421875, -3.1314697265625, -2.66845703125, -2.2054443359375, -1.742431640625, -1.2794189453125, -0.81640625, -0.3533935546875, 0.109619140625, 0.5726318359375, 1.03564453125, 1.4986572265625, 1.961669921875, 2.4246826171875, 2.8876953125, 3.3507080078125, 3.813720703125, 4.2767333984375, 4.73974609375, 5.2027587890625, 5.665771484375, 6.1287841796875, 6.591796875, 7.0548095703125, 7.517822265625, 7.9808349609375, 8.44384765625, 8.9068603515625, 9.369873046875, 9.8328857421875, 10.2958984375, 10.7589111328125, 11.221923828125, 11.6849365234375, 12.14794921875, 12.6109619140625, 13.073974609375, 13.5369873046875, 14.0]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 6.0, 15.0, 9.0, 15.0, 25.0, 33.0, 30.0, 41.0, 77.0, 65.0, 86.0, 74.0, 100.0, 60.0, 70.0, 50.0, 42.0, 28.0, 35.0, 15.0, 23.0, 23.0, 10.0, 10.0, 13.0, 10.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01171875, -6.74200439453125, -6.4722900390625, -6.20257568359375, -5.932861328125, -5.66314697265625, -5.3934326171875, -5.12371826171875, -4.85400390625, -4.58428955078125, -4.3145751953125, -4.04486083984375, -3.775146484375, -3.50543212890625, -3.2357177734375, -2.96600341796875, -2.6962890625, -2.42657470703125, -2.1568603515625, -1.88714599609375, -1.617431640625, -1.34771728515625, -1.0780029296875, -0.80828857421875, -0.53857421875, -0.26885986328125, 0.0008544921875, 0.27056884765625, 0.540283203125, 0.80999755859375, 1.0797119140625, 1.34942626953125, 1.619140625, 1.88885498046875, 2.1585693359375, 2.42828369140625, 2.697998046875, 2.96771240234375, 3.2374267578125, 3.50714111328125, 3.77685546875, 4.04656982421875, 4.3162841796875, 4.58599853515625, 4.855712890625, 5.12542724609375, 5.3951416015625, 5.66485595703125, 5.9345703125, 6.20428466796875, 6.4739990234375, 6.74371337890625, 7.013427734375, 7.28314208984375, 7.5528564453125, 7.82257080078125, 8.09228515625, 8.36199951171875, 8.6317138671875, 8.90142822265625, 9.171142578125, 9.44085693359375, 9.7105712890625, 9.98028564453125, 10.25]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 6.0, 5.0, 5.0, 9.0, 5.0, 17.0, 20.0, 25.0, 26.0, 45.0, 42.0, 51.0, 72.0, 63.0, 78.0, 90.0, 91.0, 70.0, 65.0, 50.0, 38.0, 36.0, 27.0, 16.0, 9.0, 13.0, 7.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-125.41755676269531, -121.87175750732422, -118.3259506225586, -114.7801513671875, -111.2343521118164, -107.68855285644531, -104.14274597167969, -100.5969467163086, -97.0511474609375, -93.5053482055664, -89.95954132080078, -86.41374206542969, -82.8679428100586, -79.3221435546875, -75.77633666992188, -72.23053741455078, -68.68473815917969, -65.1389389038086, -61.593135833740234, -58.047332763671875, -54.50153350830078, -50.95573043823242, -47.40992736816406, -43.86412811279297, -40.318321228027344, -36.772518157958984, -33.22671890258789, -29.68091583251953, -26.135116577148438, -22.589313507080078, -19.04351234436035, -15.497711181640625, -11.951911926269531, -8.406110763549805, -4.86030912399292, -1.3145074844360352, 2.2312936782836914, 5.777095794677734, 9.322896957397461, 12.868698120117188, 16.414499282836914, 19.96030044555664, 23.506101608276367, 27.051902770996094, 30.597705841064453, 34.14350891113281, 37.689308166503906, 41.235107421875, 44.78091049194336, 48.32671356201172, 51.87251281738281, 55.41831588745117, 58.964115142822266, 62.509918212890625, 66.05571746826172, 69.60151672363281, 73.14732360839844, 76.69312286376953, 80.23892974853516, 83.78472900390625, 87.33052825927734, 90.87632751464844, 94.42213439941406, 97.96793365478516, 101.51373291015625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 17.0, 15.0, 17.0, 26.0, 29.0, 29.0, 29.0, 54.0, 39.0, 54.0, 69.0, 53.0, 59.0, 66.0, 57.0, 56.0, 36.0, 35.0, 34.0, 33.0, 30.0, 30.0, 20.0, 22.0, 25.0, 12.0, 12.0, 13.0, 5.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.90045166015625, -116.26812744140625, -112.63581085205078, -109.00348663330078, -105.37116241455078, -101.73884582519531, -98.10652160644531, -94.47419738769531, -90.84187316894531, -87.20954895019531, -83.57723236083984, -79.94490814208984, -76.31258392333984, -72.68026733398438, -69.04794311523438, -65.41561889648438, -61.78329849243164, -58.150978088378906, -54.518653869628906, -50.88633346557617, -47.25400924682617, -43.62168884277344, -39.98936462402344, -36.3570442199707, -32.72472381591797, -29.0924015045166, -25.460079193115234, -21.8277587890625, -18.1954345703125, -14.563114166259766, -10.930791854858398, -7.298469543457031, -3.6661453247070312, -0.033823251724243164, 3.598498821258545, 7.230820655822754, 10.863142967224121, 14.495464324951172, 18.12778663635254, 21.760108947753906, 25.392431259155273, 29.02475357055664, 32.657073974609375, 36.289398193359375, 39.92171859741211, 43.554039001464844, 47.186363220214844, 50.818687438964844, 54.45100784301758, 58.08332824707031, 61.71565246582031, 65.34797668457031, 68.98029327392578, 72.61261749267578, 76.24494171142578, 79.87725830078125, 83.50958251953125, 87.14190673828125, 90.77422332763672, 94.40654754638672, 98.03887176513672, 101.67118835449219, 105.30351257324219, 108.93583679199219, 112.56816101074219]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 6.0, 6.0, 14.0, 18.0, 29.0, 48.0, 78.0, 135.0, 296.0, 572.0, 1656.0, 5785.0, 46577.0, 3968622.0, 156142.0, 10570.0, 2219.0, 761.0, 341.0, 174.0, 82.0, 46.0, 29.0, 16.0, 15.0, 11.0, 8.0, 6.0, 2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.5625, -62.5380859375, -59.513671875, -56.4892578125, -53.46484375, -50.4404296875, -47.416015625, -44.3916015625, -41.3671875, -38.3427734375, -35.318359375, -32.2939453125, -29.26953125, -26.2451171875, -23.220703125, -20.1962890625, -17.171875, -14.1474609375, -11.123046875, -8.0986328125, -5.07421875, -2.0498046875, 0.974609375, 3.9990234375, 7.0234375, 10.0478515625, 13.072265625, 16.0966796875, 19.12109375, 22.1455078125, 25.169921875, 28.1943359375, 31.21875, 34.2431640625, 37.267578125, 40.2919921875, 43.31640625, 46.3408203125, 49.365234375, 52.3896484375, 55.4140625, 58.4384765625, 61.462890625, 64.4873046875, 67.51171875, 70.5361328125, 73.560546875, 76.5849609375, 79.609375, 82.6337890625, 85.658203125, 88.6826171875, 91.70703125, 94.7314453125, 97.755859375, 100.7802734375, 103.8046875, 106.8291015625, 109.853515625, 112.8779296875, 115.90234375, 118.9267578125, 121.951171875, 124.9755859375, 128.0]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 22.0, 14.0, 21.0, 44.0, 52.0, 72.0, 71.0, 109.0, 109.0, 103.0, 87.0, 87.0, 48.0, 47.0, 46.0, 24.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.5072021484375, -8.209716796875, -7.9122314453125, -7.61474609375, -7.3172607421875, -7.019775390625, -6.7222900390625, -6.4248046875, -6.1273193359375, -5.829833984375, -5.5323486328125, -5.23486328125, -4.9373779296875, -4.639892578125, -4.3424072265625, -4.044921875, -3.7474365234375, -3.449951171875, -3.1524658203125, -2.85498046875, -2.5574951171875, -2.260009765625, -1.9625244140625, -1.6650390625, -1.3675537109375, -1.070068359375, -0.7725830078125, -0.47509765625, -0.1776123046875, 0.119873046875, 0.4173583984375, 0.71484375, 1.0123291015625, 1.309814453125, 1.6072998046875, 1.90478515625, 2.2022705078125, 2.499755859375, 2.7972412109375, 3.0947265625, 3.3922119140625, 3.689697265625, 3.9871826171875, 4.28466796875, 4.5821533203125, 4.879638671875, 5.1771240234375, 5.474609375, 5.7720947265625, 6.069580078125, 6.3670654296875, 6.66455078125, 6.9620361328125, 7.259521484375, 7.5570068359375, 7.8544921875, 8.1519775390625, 8.449462890625, 8.7469482421875, 9.04443359375, 9.3419189453125, 9.639404296875, 9.9368896484375, 10.234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 11.0, 10.0, 10.0, 15.0, 13.0, 19.0, 23.0, 28.0, 45.0, 93.0, 190.0, 383.0, 788.0, 1839.0, 4816.0, 14791.0, 57840.0, 363705.0, 3392602.0, 286309.0, 49689.0, 13083.0, 4485.0, 1735.0, 811.0, 384.0, 197.0, 111.0, 68.0, 56.0, 30.0, 23.0, 22.0, 17.0, 6.0, 3.0, 2.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.0625, -35.986572265625, -34.91064453125, -33.834716796875, -32.7587890625, -31.682861328125, -30.60693359375, -29.531005859375, -28.455078125, -27.379150390625, -26.30322265625, -25.227294921875, -24.1513671875, -23.075439453125, -21.99951171875, -20.923583984375, -19.84765625, -18.771728515625, -17.69580078125, -16.619873046875, -15.5439453125, -14.468017578125, -13.39208984375, -12.316162109375, -11.240234375, -10.164306640625, -9.08837890625, -8.012451171875, -6.9365234375, -5.860595703125, -4.78466796875, -3.708740234375, -2.6328125, -1.556884765625, -0.48095703125, 0.594970703125, 1.6708984375, 2.746826171875, 3.82275390625, 4.898681640625, 5.974609375, 7.050537109375, 8.12646484375, 9.202392578125, 10.2783203125, 11.354248046875, 12.43017578125, 13.506103515625, 14.58203125, 15.657958984375, 16.73388671875, 17.809814453125, 18.8857421875, 19.961669921875, 21.03759765625, 22.113525390625, 23.189453125, 24.265380859375, 25.34130859375, 26.417236328125, 27.4931640625, 28.569091796875, 29.64501953125, 30.720947265625, 31.796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 10.0, 21.0, 29.0, 44.0, 59.0, 69.0, 127.0, 210.0, 414.0, 1583.0, 703.0, 293.0, 171.0, 101.0, 62.0, 55.0, 35.0, 16.0, 12.0, 13.0, 7.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.6875, -10.3399658203125, -9.992431640625, -9.6448974609375, -9.29736328125, -8.9498291015625, -8.602294921875, -8.2547607421875, -7.9072265625, -7.5596923828125, -7.212158203125, -6.8646240234375, -6.51708984375, -6.1695556640625, -5.822021484375, -5.4744873046875, -5.126953125, -4.7794189453125, -4.431884765625, -4.0843505859375, -3.73681640625, -3.3892822265625, -3.041748046875, -2.6942138671875, -2.3466796875, -1.9991455078125, -1.651611328125, -1.3040771484375, -0.95654296875, -0.6090087890625, -0.261474609375, 0.0860595703125, 0.43359375, 0.7811279296875, 1.128662109375, 1.4761962890625, 1.82373046875, 2.1712646484375, 2.518798828125, 2.8663330078125, 3.2138671875, 3.5614013671875, 3.908935546875, 4.2564697265625, 4.60400390625, 4.9515380859375, 5.299072265625, 5.6466064453125, 5.994140625, 6.3416748046875, 6.689208984375, 7.0367431640625, 7.38427734375, 7.7318115234375, 8.079345703125, 8.4268798828125, 8.7744140625, 9.1219482421875, 9.469482421875, 9.8170166015625, 10.16455078125, 10.5120849609375, 10.859619140625, 11.2071533203125, 11.5546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 13.0, 15.0, 23.0, 45.0, 47.0, 71.0, 72.0, 88.0, 83.0, 110.0, 111.0, 72.0, 56.0, 41.0, 26.0, 35.0, 28.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.73387145996094, -69.87832641601562, -68.02277374267578, -66.16722869873047, -64.31168365478516, -62.45613098144531, -60.6005859375, -58.74503707885742, -56.889488220214844, -55.033939361572266, -53.17839431762695, -51.322845458984375, -49.4672966003418, -47.61174774169922, -45.756202697753906, -43.90065383911133, -42.04510498046875, -40.18955612182617, -38.33401107788086, -36.47846221923828, -34.6229133605957, -32.767364501953125, -30.911819458007812, -29.056270599365234, -27.200725555419922, -25.345178604125977, -23.4896297454834, -21.634082794189453, -19.778533935546875, -17.92298698425293, -16.067440032958984, -14.211891174316406, -12.356342315673828, -10.500794410705566, -8.645246505737305, -6.789699077606201, -4.9341511726379395, -3.078603744506836, -1.2230558395385742, 0.6324920654296875, 2.488039970397949, 4.343587875366211, 6.199135780334473, 8.054683685302734, 9.91023063659668, 11.765778541564941, 13.621326446533203, 15.476874351501465, 17.332422256469727, 19.187969207763672, 21.04351806640625, 22.899065017700195, 24.754613876342773, 26.61016082763672, 28.465709686279297, 30.321256637573242, 32.17680358886719, 34.032352447509766, 35.88789749145508, 37.743446350097656, 39.598995208740234, 41.45454406738281, 43.310089111328125, 45.1656379699707, 47.02118682861328]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 13.0, 12.0, 6.0, 13.0, 18.0, 22.0, 30.0, 31.0, 29.0, 39.0, 44.0, 47.0, 45.0, 44.0, 59.0, 44.0, 44.0, 63.0, 57.0, 43.0, 41.0, 36.0, 30.0, 46.0, 25.0, 23.0, 14.0, 17.0, 20.0, 9.0, 10.0, 8.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.77099609375, -45.430599212646484, -44.09020233154297, -42.74980545043945, -41.40940856933594, -40.069007873535156, -38.728614807128906, -37.388214111328125, -36.04781723022461, -34.707420349121094, -33.36702346801758, -32.02662658691406, -30.686227798461914, -29.3458309173584, -28.005434036254883, -26.665035247802734, -25.32464027404785, -23.984243392944336, -22.64384651184082, -21.303447723388672, -19.963050842285156, -18.62265396118164, -17.282257080078125, -15.941859245300293, -14.601462364196777, -13.261065483093262, -11.92066764831543, -10.580270767211914, -9.239873886108398, -7.899476051330566, -6.559079170227051, -5.218681335449219, -3.878284454345703, -2.5378870964050293, -1.1974899768829346, 0.14290714263916016, 1.483304500579834, 2.823701858520508, 4.164098739624023, 5.5044965744018555, 6.844893455505371, 8.185290336608887, 9.525688171386719, 10.866085052490234, 12.20648193359375, 13.546879768371582, 14.887276649475098, 16.22767448425293, 17.568071365356445, 18.90846824645996, 20.248865127563477, 21.589263916015625, 22.92966079711914, 24.270057678222656, 25.610454559326172, 26.950851440429688, 28.291248321533203, 29.63164520263672, 30.972042083740234, 32.31243896484375, 33.652835845947266, 34.99323272705078, 36.33363342285156, 37.67403030395508, 39.014427185058594]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 25.0, 26.0, 28.0, 44.0, 76.0, 123.0, 169.0, 278.0, 425.0, 720.0, 1303.0, 2895.0, 7398.0, 24327.0, 93599.0, 355478.0, 406300.0, 111195.0, 28773.0, 8646.0, 3161.0, 1444.0, 800.0, 469.0, 260.0, 176.0, 111.0, 78.0, 55.0, 35.0, 30.0, 27.0, 19.0, 10.0, 2.0, 5.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.21875, -45.8720703125, -44.525390625, -43.1787109375, -41.83203125, -40.4853515625, -39.138671875, -37.7919921875, -36.4453125, -35.0986328125, -33.751953125, -32.4052734375, -31.05859375, -29.7119140625, -28.365234375, -27.0185546875, -25.671875, -24.3251953125, -22.978515625, -21.6318359375, -20.28515625, -18.9384765625, -17.591796875, -16.2451171875, -14.8984375, -13.5517578125, -12.205078125, -10.8583984375, -9.51171875, -8.1650390625, -6.818359375, -5.4716796875, -4.125, -2.7783203125, -1.431640625, -0.0849609375, 1.26171875, 2.6083984375, 3.955078125, 5.3017578125, 6.6484375, 7.9951171875, 9.341796875, 10.6884765625, 12.03515625, 13.3818359375, 14.728515625, 16.0751953125, 17.421875, 18.7685546875, 20.115234375, 21.4619140625, 22.80859375, 24.1552734375, 25.501953125, 26.8486328125, 28.1953125, 29.5419921875, 30.888671875, 32.2353515625, 33.58203125, 34.9287109375, 36.275390625, 37.6220703125, 38.96875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 11.0, 19.0, 27.0, 30.0, 58.0, 56.0, 60.0, 90.0, 101.0, 103.0, 97.0, 89.0, 64.0, 51.0, 42.0, 37.0, 21.0, 13.0, 10.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2462158203125, -7.953369140625, -7.6605224609375, -7.36767578125, -7.0748291015625, -6.781982421875, -6.4891357421875, -6.1962890625, -5.9034423828125, -5.610595703125, -5.3177490234375, -5.02490234375, -4.7320556640625, -4.439208984375, -4.1463623046875, -3.853515625, -3.5606689453125, -3.267822265625, -2.9749755859375, -2.68212890625, -2.3892822265625, -2.096435546875, -1.8035888671875, -1.5107421875, -1.2178955078125, -0.925048828125, -0.6322021484375, -0.33935546875, -0.0465087890625, 0.246337890625, 0.5391845703125, 0.83203125, 1.1248779296875, 1.417724609375, 1.7105712890625, 2.00341796875, 2.2962646484375, 2.589111328125, 2.8819580078125, 3.1748046875, 3.4676513671875, 3.760498046875, 4.0533447265625, 4.34619140625, 4.6390380859375, 4.931884765625, 5.2247314453125, 5.517578125, 5.8104248046875, 6.103271484375, 6.3961181640625, 6.68896484375, 6.9818115234375, 7.274658203125, 7.5675048828125, 7.8603515625, 8.1531982421875, 8.446044921875, 8.7388916015625, 9.03173828125, 9.3245849609375, 9.617431640625, 9.9102783203125, 10.203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 5.0, 11.0, 12.0, 18.0, 25.0, 34.0, 53.0, 87.0, 113.0, 167.0, 300.0, 499.0, 805.0, 1496.0, 3393.0, 8820.0, 25753.0, 78945.0, 239478.0, 417237.0, 180677.0, 58892.0, 19119.0, 6725.0, 2698.0, 1305.0, 666.0, 409.0, 250.0, 175.0, 110.0, 78.0, 51.0, 47.0, 19.0, 18.0, 17.0, 13.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0], "bins": [-26.984375, -26.242431640625, -25.50048828125, -24.758544921875, -24.0166015625, -23.274658203125, -22.53271484375, -21.790771484375, -21.048828125, -20.306884765625, -19.56494140625, -18.822998046875, -18.0810546875, -17.339111328125, -16.59716796875, -15.855224609375, -15.11328125, -14.371337890625, -13.62939453125, -12.887451171875, -12.1455078125, -11.403564453125, -10.66162109375, -9.919677734375, -9.177734375, -8.435791015625, -7.69384765625, -6.951904296875, -6.2099609375, -5.468017578125, -4.72607421875, -3.984130859375, -3.2421875, -2.500244140625, -1.75830078125, -1.016357421875, -0.2744140625, 0.467529296875, 1.20947265625, 1.951416015625, 2.693359375, 3.435302734375, 4.17724609375, 4.919189453125, 5.6611328125, 6.403076171875, 7.14501953125, 7.886962890625, 8.62890625, 9.370849609375, 10.11279296875, 10.854736328125, 11.5966796875, 12.338623046875, 13.08056640625, 13.822509765625, 14.564453125, 15.306396484375, 16.04833984375, 16.790283203125, 17.5322265625, 18.274169921875, 19.01611328125, 19.758056640625, 20.5]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 7.0, 5.0, 8.0, 13.0, 22.0, 15.0, 26.0, 26.0, 28.0, 24.0, 33.0, 47.0, 56.0, 51.0, 48.0, 39.0, 52.0, 56.0, 53.0, 71.0, 60.0, 41.0, 31.0, 42.0, 32.0, 27.0, 15.0, 18.0, 12.0, 16.0, 8.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 3.0], "bins": [-29.546875, -28.8427734375, -28.138671875, -27.4345703125, -26.73046875, -26.0263671875, -25.322265625, -24.6181640625, -23.9140625, -23.2099609375, -22.505859375, -21.8017578125, -21.09765625, -20.3935546875, -19.689453125, -18.9853515625, -18.28125, -17.5771484375, -16.873046875, -16.1689453125, -15.46484375, -14.7607421875, -14.056640625, -13.3525390625, -12.6484375, -11.9443359375, -11.240234375, -10.5361328125, -9.83203125, -9.1279296875, -8.423828125, -7.7197265625, -7.015625, -6.3115234375, -5.607421875, -4.9033203125, -4.19921875, -3.4951171875, -2.791015625, -2.0869140625, -1.3828125, -0.6787109375, 0.025390625, 0.7294921875, 1.43359375, 2.1376953125, 2.841796875, 3.5458984375, 4.25, 4.9541015625, 5.658203125, 6.3623046875, 7.06640625, 7.7705078125, 8.474609375, 9.1787109375, 9.8828125, 10.5869140625, 11.291015625, 11.9951171875, 12.69921875, 13.4033203125, 14.107421875, 14.8115234375, 15.515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 9.0, 17.0, 12.0, 15.0, 34.0, 48.0, 86.0, 142.0, 242.0, 428.0, 790.0, 1482.0, 2993.0, 6450.0, 15348.0, 39694.0, 115507.0, 311611.0, 342234.0, 134087.0, 45586.0, 17540.0, 7444.0, 3211.0, 1611.0, 816.0, 460.0, 235.0, 147.0, 92.0, 62.0, 31.0, 33.0, 17.0, 11.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.2734375, -9.9627685546875, -9.652099609375, -9.3414306640625, -9.03076171875, -8.7200927734375, -8.409423828125, -8.0987548828125, -7.7880859375, -7.4774169921875, -7.166748046875, -6.8560791015625, -6.54541015625, -6.2347412109375, -5.924072265625, -5.6134033203125, -5.302734375, -4.9920654296875, -4.681396484375, -4.3707275390625, -4.06005859375, -3.7493896484375, -3.438720703125, -3.1280517578125, -2.8173828125, -2.5067138671875, -2.196044921875, -1.8853759765625, -1.57470703125, -1.2640380859375, -0.953369140625, -0.6427001953125, -0.33203125, -0.0213623046875, 0.289306640625, 0.5999755859375, 0.91064453125, 1.2213134765625, 1.531982421875, 1.8426513671875, 2.1533203125, 2.4639892578125, 2.774658203125, 3.0853271484375, 3.39599609375, 3.7066650390625, 4.017333984375, 4.3280029296875, 4.638671875, 4.9493408203125, 5.260009765625, 5.5706787109375, 5.88134765625, 6.1920166015625, 6.502685546875, 6.8133544921875, 7.1240234375, 7.4346923828125, 7.745361328125, 8.0560302734375, 8.36669921875, 8.6773681640625, 8.988037109375, 9.2987060546875, 9.609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 7.0, 5.0, 2.0, 15.0, 19.0, 16.0, 32.0, 34.0, 60.0, 60.0, 98.0, 144.0, 126.0, 86.0, 61.0, 57.0, 39.0, 30.0, 24.0, 22.0, 17.0, 9.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00200653076171875, -0.0019353926181793213, -0.0018642544746398926, -0.0017931163311004639, -0.0017219781875610352, -0.0016508400440216064, -0.0015797019004821777, -0.001508563756942749, -0.0014374256134033203, -0.0013662874698638916, -0.0012951493263244629, -0.0012240111827850342, -0.0011528730392456055, -0.0010817348957061768, -0.001010596752166748, -0.0009394586086273193, -0.0008683204650878906, -0.0007971823215484619, -0.0007260441780090332, -0.0006549060344696045, -0.0005837678909301758, -0.0005126297473907471, -0.00044149160385131836, -0.00037035346031188965, -0.00029921531677246094, -0.00022807717323303223, -0.00015693902969360352, -8.58008861541748e-05, -1.4662742614746094e-05, 5.647540092468262e-05, 0.00012761354446411133, 0.00019875168800354004, 0.00026988983154296875, 0.00034102797508239746, 0.00041216611862182617, 0.0004833042621612549, 0.0005544424057006836, 0.0006255805492401123, 0.000696718692779541, 0.0007678568363189697, 0.0008389949798583984, 0.0009101331233978271, 0.0009812712669372559, 0.0010524094104766846, 0.0011235475540161133, 0.001194685697555542, 0.0012658238410949707, 0.0013369619846343994, 0.0014081001281738281, 0.0014792382717132568, 0.0015503764152526855, 0.0016215145587921143, 0.001692652702331543, 0.0017637908458709717, 0.0018349289894104004, 0.001906067132949829, 0.001977205276489258, 0.0020483434200286865, 0.0021194815635681152, 0.002190619707107544, 0.0022617578506469727, 0.0023328959941864014, 0.00240403413772583, 0.002475172281265259, 0.0025463104248046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 5.0, 3.0, 13.0, 19.0, 29.0, 49.0, 75.0, 114.0, 186.0, 304.0, 525.0, 1016.0, 2023.0, 4722.0, 12580.0, 39430.0, 156911.0, 477326.0, 260012.0, 62935.0, 18077.0, 6471.0, 2760.0, 1305.0, 685.0, 384.0, 215.0, 139.0, 75.0, 62.0, 31.0, 25.0, 14.0, 12.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-15.484375, -15.0941162109375, -14.703857421875, -14.3135986328125, -13.92333984375, -13.5330810546875, -13.142822265625, -12.7525634765625, -12.3623046875, -11.9720458984375, -11.581787109375, -11.1915283203125, -10.80126953125, -10.4110107421875, -10.020751953125, -9.6304931640625, -9.240234375, -8.8499755859375, -8.459716796875, -8.0694580078125, -7.67919921875, -7.2889404296875, -6.898681640625, -6.5084228515625, -6.1181640625, -5.7279052734375, -5.337646484375, -4.9473876953125, -4.55712890625, -4.1668701171875, -3.776611328125, -3.3863525390625, -2.99609375, -2.6058349609375, -2.215576171875, -1.8253173828125, -1.43505859375, -1.0447998046875, -0.654541015625, -0.2642822265625, 0.1259765625, 0.5162353515625, 0.906494140625, 1.2967529296875, 1.68701171875, 2.0772705078125, 2.467529296875, 2.8577880859375, 3.248046875, 3.6383056640625, 4.028564453125, 4.4188232421875, 4.80908203125, 5.1993408203125, 5.589599609375, 5.9798583984375, 6.3701171875, 6.7603759765625, 7.150634765625, 7.5408935546875, 7.93115234375, 8.3214111328125, 8.711669921875, 9.1019287109375, 9.4921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 2.0, 10.0, 6.0, 9.0, 18.0, 17.0, 24.0, 34.0, 31.0, 64.0, 62.0, 61.0, 95.0, 85.0, 78.0, 80.0, 80.0, 62.0, 38.0, 29.0, 20.0, 24.0, 16.0, 10.0, 7.0, 12.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.3046875, -8.01611328125, -7.7275390625, -7.43896484375, -7.150390625, -6.86181640625, -6.5732421875, -6.28466796875, -5.99609375, -5.70751953125, -5.4189453125, -5.13037109375, -4.841796875, -4.55322265625, -4.2646484375, -3.97607421875, -3.6875, -3.39892578125, -3.1103515625, -2.82177734375, -2.533203125, -2.24462890625, -1.9560546875, -1.66748046875, -1.37890625, -1.09033203125, -0.8017578125, -0.51318359375, -0.224609375, 0.06396484375, 0.3525390625, 0.64111328125, 0.9296875, 1.21826171875, 1.5068359375, 1.79541015625, 2.083984375, 2.37255859375, 2.6611328125, 2.94970703125, 3.23828125, 3.52685546875, 3.8154296875, 4.10400390625, 4.392578125, 4.68115234375, 4.9697265625, 5.25830078125, 5.546875, 5.83544921875, 6.1240234375, 6.41259765625, 6.701171875, 6.98974609375, 7.2783203125, 7.56689453125, 7.85546875, 8.14404296875, 8.4326171875, 8.72119140625, 9.009765625, 9.29833984375, 9.5869140625, 9.87548828125, 10.1640625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 9.0, 8.0, 11.0, 14.0, 23.0, 36.0, 60.0, 76.0, 73.0, 93.0, 92.0, 96.0, 108.0, 82.0, 60.0, 42.0, 36.0, 19.0, 16.0, 14.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.5966339111328, -152.22000122070312, -147.84336853027344, -143.46673583984375, -139.09010314941406, -134.71347045898438, -130.3368377685547, -125.960205078125, -121.58357238769531, -117.20693969726562, -112.83030700683594, -108.45367431640625, -104.07704162597656, -99.70040893554688, -95.32377624511719, -90.9471435546875, -86.57051849365234, -82.19388580322266, -77.81725311279297, -73.44062042236328, -69.0639877319336, -64.6873550415039, -60.310726165771484, -55.9340934753418, -51.55746078491211, -47.18082809448242, -42.804195404052734, -38.42756652832031, -34.050933837890625, -29.674299240112305, -25.29766845703125, -20.921035766601562, -16.544403076171875, -12.167770385742188, -7.791138648986816, -3.4145069122314453, 0.9621257781982422, 5.33875846862793, 9.715389251708984, 14.092021942138672, 18.46865463256836, 22.845287322998047, 27.221920013427734, 31.59855079650879, 35.975181579589844, 40.35181427001953, 44.72844696044922, 49.105079650878906, 53.481712341308594, 57.85834503173828, 62.23497772216797, 66.61161041259766, 70.98824310302734, 75.36487579345703, 79.74150085449219, 84.11813354492188, 88.49476623535156, 92.87139892578125, 97.24803161621094, 101.62466430664062, 106.00129699707031, 110.3779296875, 114.75456237792969, 119.13119506835938, 123.50782775878906]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 14.0, 10.0, 8.0, 16.0, 11.0, 21.0, 14.0, 21.0, 17.0, 24.0, 25.0, 31.0, 24.0, 47.0, 48.0, 33.0, 41.0, 35.0, 45.0, 40.0, 39.0, 35.0, 46.0, 43.0, 39.0, 27.0, 18.0, 39.0, 30.0, 15.0, 19.0, 11.0, 13.0, 14.0, 10.0, 9.0, 10.0, 7.0, 7.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.59815979003906, -82.72219848632812, -79.84624481201172, -76.97028350830078, -74.09432220458984, -71.21836853027344, -68.3424072265625, -65.46644592285156, -62.590492248535156, -59.714534759521484, -56.83857345581055, -53.962615966796875, -51.0866584777832, -48.21070098876953, -45.334739685058594, -42.45878219604492, -39.582820892333984, -36.70686340332031, -33.830902099609375, -30.954944610595703, -28.07898712158203, -25.203027725219727, -22.327068328857422, -19.45111083984375, -16.575151443481445, -13.699193000793457, -10.823234558105469, -7.947275161743164, -5.071316719055176, -2.1953582763671875, 0.6806011199951172, 3.556558609008789, 6.432518005371094, 9.308476448059082, 12.18443489074707, 15.060394287109375, 17.936351776123047, 20.81231117248535, 23.688270568847656, 26.564228057861328, 29.440187454223633, 32.31614685058594, 35.19210433959961, 38.06806182861328, 40.94402313232422, 43.81998062133789, 46.69593811035156, 49.5718994140625, 52.44785690307617, 55.323814392089844, 58.19977569580078, 61.07573318481445, 63.951690673828125, 66.82765197753906, 69.70361328125, 72.5795669555664, 75.45552825927734, 78.33148956298828, 81.20744323730469, 84.08340454101562, 86.95936584472656, 89.83531951904297, 92.7112808227539, 95.58723449707031, 98.46319580078125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 5.0, 8.0, 4.0, 8.0, 14.0, 16.0, 16.0, 25.0, 37.0, 44.0, 64.0, 98.0, 143.0, 223.0, 327.0, 535.0, 957.0, 1731.0, 3550.0, 8124.0, 21890.0, 79635.0, 665378.0, 3222135.0, 137535.0, 31867.0, 10620.0, 4370.0, 2143.0, 1080.0, 554.0, 346.0, 227.0, 151.0, 110.0, 65.0, 50.0, 35.0, 24.0, 23.0, 26.0, 14.0, 16.0, 18.0, 11.0, 6.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-33.28125, -32.00927734375, -30.7373046875, -29.46533203125, -28.193359375, -26.92138671875, -25.6494140625, -24.37744140625, -23.10546875, -21.83349609375, -20.5615234375, -19.28955078125, -18.017578125, -16.74560546875, -15.4736328125, -14.20166015625, -12.9296875, -11.65771484375, -10.3857421875, -9.11376953125, -7.841796875, -6.56982421875, -5.2978515625, -4.02587890625, -2.75390625, -1.48193359375, -0.2099609375, 1.06201171875, 2.333984375, 3.60595703125, 4.8779296875, 6.14990234375, 7.421875, 8.69384765625, 9.9658203125, 11.23779296875, 12.509765625, 13.78173828125, 15.0537109375, 16.32568359375, 17.59765625, 18.86962890625, 20.1416015625, 21.41357421875, 22.685546875, 23.95751953125, 25.2294921875, 26.50146484375, 27.7734375, 29.04541015625, 30.3173828125, 31.58935546875, 32.861328125, 34.13330078125, 35.4052734375, 36.67724609375, 37.94921875, 39.22119140625, 40.4931640625, 41.76513671875, 43.037109375, 44.30908203125, 45.5810546875, 46.85302734375, 48.125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 13.0, 21.0, 28.0, 44.0, 36.0, 65.0, 70.0, 79.0, 94.0, 86.0, 79.0, 67.0, 75.0, 58.0, 44.0, 48.0, 28.0, 12.0, 11.0, 5.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8416748046875, -7.573974609375, -7.3062744140625, -7.03857421875, -6.7708740234375, -6.503173828125, -6.2354736328125, -5.9677734375, -5.7000732421875, -5.432373046875, -5.1646728515625, -4.89697265625, -4.6292724609375, -4.361572265625, -4.0938720703125, -3.826171875, -3.5584716796875, -3.290771484375, -3.0230712890625, -2.75537109375, -2.4876708984375, -2.219970703125, -1.9522705078125, -1.6845703125, -1.4168701171875, -1.149169921875, -0.8814697265625, -0.61376953125, -0.3460693359375, -0.078369140625, 0.1893310546875, 0.45703125, 0.7247314453125, 0.992431640625, 1.2601318359375, 1.52783203125, 1.7955322265625, 2.063232421875, 2.3309326171875, 2.5986328125, 2.8663330078125, 3.134033203125, 3.4017333984375, 3.66943359375, 3.9371337890625, 4.204833984375, 4.4725341796875, 4.740234375, 5.0079345703125, 5.275634765625, 5.5433349609375, 5.81103515625, 6.0787353515625, 6.346435546875, 6.6141357421875, 6.8818359375, 7.1495361328125, 7.417236328125, 7.6849365234375, 7.95263671875, 8.2203369140625, 8.488037109375, 8.7557373046875, 9.0234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 10.0, 16.0, 12.0, 19.0, 32.0, 32.0, 37.0, 72.0, 122.0, 199.0, 439.0, 1012.0, 3718.0, 24234.0, 417907.0, 3630769.0, 102526.0, 9873.0, 1911.0, 604.0, 268.0, 159.0, 88.0, 55.0, 46.0, 36.0, 30.0, 16.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-71.25, -69.3388671875, -67.427734375, -65.5166015625, -63.60546875, -61.6943359375, -59.783203125, -57.8720703125, -55.9609375, -54.0498046875, -52.138671875, -50.2275390625, -48.31640625, -46.4052734375, -44.494140625, -42.5830078125, -40.671875, -38.7607421875, -36.849609375, -34.9384765625, -33.02734375, -31.1162109375, -29.205078125, -27.2939453125, -25.3828125, -23.4716796875, -21.560546875, -19.6494140625, -17.73828125, -15.8271484375, -13.916015625, -12.0048828125, -10.09375, -8.1826171875, -6.271484375, -4.3603515625, -2.44921875, -0.5380859375, 1.373046875, 3.2841796875, 5.1953125, 7.1064453125, 9.017578125, 10.9287109375, 12.83984375, 14.7509765625, 16.662109375, 18.5732421875, 20.484375, 22.3955078125, 24.306640625, 26.2177734375, 28.12890625, 30.0400390625, 31.951171875, 33.8623046875, 35.7734375, 37.6845703125, 39.595703125, 41.5068359375, 43.41796875, 45.3291015625, 47.240234375, 49.1513671875, 51.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 20.0, 25.0, 75.0, 207.0, 557.0, 2189.0, 632.0, 213.0, 81.0, 36.0, 17.0, 12.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.053955078125, -19.12353515625, -18.193115234375, -17.2626953125, -16.332275390625, -15.40185546875, -14.471435546875, -13.541015625, -12.610595703125, -11.68017578125, -10.749755859375, -9.8193359375, -8.888916015625, -7.95849609375, -7.028076171875, -6.09765625, -5.167236328125, -4.23681640625, -3.306396484375, -2.3759765625, -1.445556640625, -0.51513671875, 0.415283203125, 1.345703125, 2.276123046875, 3.20654296875, 4.136962890625, 5.0673828125, 5.997802734375, 6.92822265625, 7.858642578125, 8.7890625, 9.719482421875, 10.64990234375, 11.580322265625, 12.5107421875, 13.441162109375, 14.37158203125, 15.302001953125, 16.232421875, 17.162841796875, 18.09326171875, 19.023681640625, 19.9541015625, 20.884521484375, 21.81494140625, 22.745361328125, 23.67578125, 24.606201171875, 25.53662109375, 26.467041015625, 27.3974609375, 28.327880859375, 29.25830078125, 30.188720703125, 31.119140625, 32.049560546875, 32.97998046875, 33.910400390625, 34.8408203125, 35.771240234375, 36.70166015625, 37.632080078125, 38.5625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 13.0, 13.0, 27.0, 37.0, 80.0, 81.0, 98.0, 109.0, 94.0, 106.0, 92.0, 88.0, 40.0, 32.0, 29.0, 16.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-86.02826690673828, -83.38094329833984, -80.73361206054688, -78.08628845214844, -75.43896484375, -72.79164123535156, -70.14431762695312, -67.49698638916016, -64.84966278076172, -62.20233917236328, -59.55501174926758, -56.907684326171875, -54.26036071777344, -51.613037109375, -48.9657096862793, -46.318382263183594, -43.671058654785156, -41.02373504638672, -38.376407623291016, -35.72908020019531, -33.081756591796875, -30.434431076049805, -27.787105560302734, -25.139780044555664, -22.492454528808594, -19.845129013061523, -17.197803497314453, -14.550477981567383, -11.903152465820312, -9.255826950073242, -6.608501434326172, -3.9611759185791016, -1.3138427734375, 1.3334827423095703, 3.9808082580566406, 6.628133773803711, 9.275459289550781, 11.922784805297852, 14.570110321044922, 17.217435836791992, 19.864761352539062, 22.512086868286133, 25.159412384033203, 27.806737899780273, 30.454063415527344, 33.10138702392578, 35.748714447021484, 38.39604187011719, 41.043365478515625, 43.69068908691406, 46.338016510009766, 48.98534393310547, 51.632667541503906, 54.279991149902344, 56.92731857299805, 59.57464599609375, 62.22196960449219, 64.86929321289062, 67.51661682128906, 70.16394805908203, 72.81127166748047, 75.4585952758789, 78.10592651367188, 80.75325012207031, 83.40057373046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 10.0, 3.0, 4.0, 7.0, 11.0, 6.0, 17.0, 27.0, 25.0, 24.0, 32.0, 35.0, 42.0, 47.0, 51.0, 60.0, 69.0, 55.0, 44.0, 66.0, 60.0, 36.0, 40.0, 46.0, 43.0, 27.0, 26.0, 22.0, 15.0, 16.0, 13.0, 10.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-68.8824234008789, -67.05390167236328, -65.22537994384766, -63.39685821533203, -61.568336486816406, -59.73981475830078, -57.91129684448242, -56.0827751159668, -54.25425338745117, -52.42573165893555, -50.59720993041992, -48.7686882019043, -46.94017028808594, -45.11164855957031, -43.28312683105469, -41.45460510253906, -39.62608337402344, -37.79756164550781, -35.96903991699219, -34.14051818847656, -32.31199645996094, -30.483476638793945, -28.654956817626953, -26.826435089111328, -24.997913360595703, -23.169391632080078, -21.340869903564453, -19.51235008239746, -17.683828353881836, -15.855306625366211, -14.026785850524902, -12.198265075683594, -10.369743347167969, -8.541221618652344, -6.712700843811035, -4.884179592132568, -3.0556583404541016, -1.2271366119384766, 0.601384162902832, 2.4299049377441406, 4.258426666259766, 6.086947917938232, 7.915469169616699, 9.743989944458008, 11.572511672973633, 13.401033401489258, 15.229554176330566, 17.058074951171875, 18.8865966796875, 20.715118408203125, 22.54364013671875, 24.372159957885742, 26.200681686401367, 28.029203414916992, 29.857723236083984, 31.68624496459961, 33.514766693115234, 35.34328842163086, 37.171810150146484, 39.00033187866211, 40.82884979248047, 42.657371520996094, 44.48589324951172, 46.314414978027344, 48.14293670654297]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 9.0, 21.0, 8.0, 13.0, 30.0, 45.0, 67.0, 90.0, 152.0, 280.0, 482.0, 973.0, 2125.0, 5638.0, 18178.0, 86124.0, 594388.0, 277085.0, 44899.0, 11167.0, 3626.0, 1495.0, 677.0, 384.0, 204.0, 111.0, 86.0, 63.0, 30.0, 31.0, 19.0, 6.0, 14.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.90625, -46.298828125, -44.69140625, -43.083984375, -41.4765625, -39.869140625, -38.26171875, -36.654296875, -35.046875, -33.439453125, -31.83203125, -30.224609375, -28.6171875, -27.009765625, -25.40234375, -23.794921875, -22.1875, -20.580078125, -18.97265625, -17.365234375, -15.7578125, -14.150390625, -12.54296875, -10.935546875, -9.328125, -7.720703125, -6.11328125, -4.505859375, -2.8984375, -1.291015625, 0.31640625, 1.923828125, 3.53125, 5.138671875, 6.74609375, 8.353515625, 9.9609375, 11.568359375, 13.17578125, 14.783203125, 16.390625, 17.998046875, 19.60546875, 21.212890625, 22.8203125, 24.427734375, 26.03515625, 27.642578125, 29.25, 30.857421875, 32.46484375, 34.072265625, 35.6796875, 37.287109375, 38.89453125, 40.501953125, 42.109375, 43.716796875, 45.32421875, 46.931640625, 48.5390625, 50.146484375, 51.75390625, 53.361328125, 54.96875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 16.0, 32.0, 34.0, 53.0, 45.0, 98.0, 102.0, 103.0, 88.0, 76.0, 85.0, 68.0, 60.0, 38.0, 30.0, 18.0, 8.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.1021728515625, -8.798095703125, -8.4940185546875, -8.18994140625, -7.8858642578125, -7.581787109375, -7.2777099609375, -6.9736328125, -6.6695556640625, -6.365478515625, -6.0614013671875, -5.75732421875, -5.4532470703125, -5.149169921875, -4.8450927734375, -4.541015625, -4.2369384765625, -3.932861328125, -3.6287841796875, -3.32470703125, -3.0206298828125, -2.716552734375, -2.4124755859375, -2.1083984375, -1.8043212890625, -1.500244140625, -1.1961669921875, -0.89208984375, -0.5880126953125, -0.283935546875, 0.0201416015625, 0.32421875, 0.6282958984375, 0.932373046875, 1.2364501953125, 1.54052734375, 1.8446044921875, 2.148681640625, 2.4527587890625, 2.7568359375, 3.0609130859375, 3.364990234375, 3.6690673828125, 3.97314453125, 4.2772216796875, 4.581298828125, 4.8853759765625, 5.189453125, 5.4935302734375, 5.797607421875, 6.1016845703125, 6.40576171875, 6.7098388671875, 7.013916015625, 7.3179931640625, 7.6220703125, 7.9261474609375, 8.230224609375, 8.5343017578125, 8.83837890625, 9.1424560546875, 9.446533203125, 9.7506103515625, 10.0546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 13.0, 13.0, 16.0, 17.0, 18.0, 42.0, 48.0, 84.0, 126.0, 146.0, 264.0, 395.0, 615.0, 1152.0, 2411.0, 5648.0, 15564.0, 47542.0, 159908.0, 506126.0, 214542.0, 61121.0, 19361.0, 7126.0, 2872.0, 1407.0, 666.0, 408.0, 262.0, 176.0, 154.0, 99.0, 42.0, 50.0, 27.0, 36.0, 27.0, 10.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0], "bins": [-30.921875, -30.14111328125, -29.3603515625, -28.57958984375, -27.798828125, -27.01806640625, -26.2373046875, -25.45654296875, -24.67578125, -23.89501953125, -23.1142578125, -22.33349609375, -21.552734375, -20.77197265625, -19.9912109375, -19.21044921875, -18.4296875, -17.64892578125, -16.8681640625, -16.08740234375, -15.306640625, -14.52587890625, -13.7451171875, -12.96435546875, -12.18359375, -11.40283203125, -10.6220703125, -9.84130859375, -9.060546875, -8.27978515625, -7.4990234375, -6.71826171875, -5.9375, -5.15673828125, -4.3759765625, -3.59521484375, -2.814453125, -2.03369140625, -1.2529296875, -0.47216796875, 0.30859375, 1.08935546875, 1.8701171875, 2.65087890625, 3.431640625, 4.21240234375, 4.9931640625, 5.77392578125, 6.5546875, 7.33544921875, 8.1162109375, 8.89697265625, 9.677734375, 10.45849609375, 11.2392578125, 12.02001953125, 12.80078125, 13.58154296875, 14.3623046875, 15.14306640625, 15.923828125, 16.70458984375, 17.4853515625, 18.26611328125, 19.046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 10.0, 8.0, 10.0, 19.0, 11.0, 22.0, 21.0, 13.0, 32.0, 22.0, 31.0, 42.0, 37.0, 45.0, 53.0, 41.0, 35.0, 44.0, 46.0, 46.0, 44.0, 38.0, 38.0, 40.0, 31.0, 25.0, 27.0, 22.0, 28.0, 21.0, 12.0, 7.0, 12.0, 12.0, 12.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-20.53125, -19.943359375, -19.35546875, -18.767578125, -18.1796875, -17.591796875, -17.00390625, -16.416015625, -15.828125, -15.240234375, -14.65234375, -14.064453125, -13.4765625, -12.888671875, -12.30078125, -11.712890625, -11.125, -10.537109375, -9.94921875, -9.361328125, -8.7734375, -8.185546875, -7.59765625, -7.009765625, -6.421875, -5.833984375, -5.24609375, -4.658203125, -4.0703125, -3.482421875, -2.89453125, -2.306640625, -1.71875, -1.130859375, -0.54296875, 0.044921875, 0.6328125, 1.220703125, 1.80859375, 2.396484375, 2.984375, 3.572265625, 4.16015625, 4.748046875, 5.3359375, 5.923828125, 6.51171875, 7.099609375, 7.6875, 8.275390625, 8.86328125, 9.451171875, 10.0390625, 10.626953125, 11.21484375, 11.802734375, 12.390625, 12.978515625, 13.56640625, 14.154296875, 14.7421875, 15.330078125, 15.91796875, 16.505859375, 17.09375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 4.0, 13.0, 19.0, 23.0, 41.0, 78.0, 174.0, 296.0, 667.0, 1737.0, 5365.0, 20974.0, 124121.0, 667856.0, 188768.0, 27814.0, 6913.0, 2198.0, 754.0, 344.0, 186.0, 84.0, 46.0, 24.0, 20.0, 16.0, 8.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.421875, -13.91748046875, -13.4130859375, -12.90869140625, -12.404296875, -11.89990234375, -11.3955078125, -10.89111328125, -10.38671875, -9.88232421875, -9.3779296875, -8.87353515625, -8.369140625, -7.86474609375, -7.3603515625, -6.85595703125, -6.3515625, -5.84716796875, -5.3427734375, -4.83837890625, -4.333984375, -3.82958984375, -3.3251953125, -2.82080078125, -2.31640625, -1.81201171875, -1.3076171875, -0.80322265625, -0.298828125, 0.20556640625, 0.7099609375, 1.21435546875, 1.71875, 2.22314453125, 2.7275390625, 3.23193359375, 3.736328125, 4.24072265625, 4.7451171875, 5.24951171875, 5.75390625, 6.25830078125, 6.7626953125, 7.26708984375, 7.771484375, 8.27587890625, 8.7802734375, 9.28466796875, 9.7890625, 10.29345703125, 10.7978515625, 11.30224609375, 11.806640625, 12.31103515625, 12.8154296875, 13.31982421875, 13.82421875, 14.32861328125, 14.8330078125, 15.33740234375, 15.841796875, 16.34619140625, 16.8505859375, 17.35498046875, 17.859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 16.0, 10.0, 12.0, 19.0, 12.0, 17.0, 23.0, 34.0, 62.0, 98.0, 121.0, 149.0, 127.0, 74.0, 35.0, 31.0, 24.0, 19.0, 9.0, 12.0, 7.0, 9.0, 5.0, 11.0, 6.0, 5.0, 3.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0021076202392578125, -0.0020460784435272217, -0.001984536647796631, -0.00192299485206604, -0.0018614530563354492, -0.0017999112606048584, -0.0017383694648742676, -0.0016768276691436768, -0.001615285873413086, -0.0015537440776824951, -0.0014922022819519043, -0.0014306604862213135, -0.0013691186904907227, -0.0013075768947601318, -0.001246035099029541, -0.0011844933032989502, -0.0011229515075683594, -0.0010614097118377686, -0.0009998679161071777, -0.0009383261203765869, -0.0008767843246459961, -0.0008152425289154053, -0.0007537007331848145, -0.0006921589374542236, -0.0006306171417236328, -0.000569075345993042, -0.0005075335502624512, -0.00044599175453186035, -0.00038444995880126953, -0.0003229081630706787, -0.0002613663673400879, -0.00019982457160949707, -0.00013828277587890625, -7.674098014831543e-05, -1.519918441772461e-05, 4.634261131286621e-05, 0.00010788440704345703, 0.00016942620277404785, 0.00023096799850463867, 0.0002925097942352295, 0.0003540515899658203, 0.00041559338569641113, 0.00047713518142700195, 0.0005386769771575928, 0.0006002187728881836, 0.0006617605686187744, 0.0007233023643493652, 0.0007848441600799561, 0.0008463859558105469, 0.0009079277515411377, 0.0009694695472717285, 0.0010310113430023193, 0.0010925531387329102, 0.001154094934463501, 0.0012156367301940918, 0.0012771785259246826, 0.0013387203216552734, 0.0014002621173858643, 0.001461803913116455, 0.001523345708847046, 0.0015848875045776367, 0.0016464293003082275, 0.0017079710960388184, 0.0017695128917694092, 0.0018310546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 9.0, 20.0, 23.0, 26.0, 43.0, 74.0, 103.0, 188.0, 308.0, 526.0, 1256.0, 2833.0, 7497.0, 23110.0, 87234.0, 490591.0, 345013.0, 61801.0, 17429.0, 5939.0, 2270.0, 1032.0, 525.0, 285.0, 149.0, 90.0, 72.0, 35.0, 24.0, 14.0, 11.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0780029296875, -11.710693359375, -11.3433837890625, -10.97607421875, -10.6087646484375, -10.241455078125, -9.8741455078125, -9.5068359375, -9.1395263671875, -8.772216796875, -8.4049072265625, -8.03759765625, -7.6702880859375, -7.302978515625, -6.9356689453125, -6.568359375, -6.2010498046875, -5.833740234375, -5.4664306640625, -5.09912109375, -4.7318115234375, -4.364501953125, -3.9971923828125, -3.6298828125, -3.2625732421875, -2.895263671875, -2.5279541015625, -2.16064453125, -1.7933349609375, -1.426025390625, -1.0587158203125, -0.69140625, -0.3240966796875, 0.043212890625, 0.4105224609375, 0.77783203125, 1.1451416015625, 1.512451171875, 1.8797607421875, 2.2470703125, 2.6143798828125, 2.981689453125, 3.3489990234375, 3.71630859375, 4.0836181640625, 4.450927734375, 4.8182373046875, 5.185546875, 5.5528564453125, 5.920166015625, 6.2874755859375, 6.65478515625, 7.0220947265625, 7.389404296875, 7.7567138671875, 8.1240234375, 8.4913330078125, 8.858642578125, 9.2259521484375, 9.59326171875, 9.9605712890625, 10.327880859375, 10.6951904296875, 11.0625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 4.0, 8.0, 9.0, 6.0, 13.0, 16.0, 16.0, 16.0, 28.0, 30.0, 44.0, 42.0, 48.0, 70.0, 78.0, 58.0, 73.0, 81.0, 54.0, 50.0, 36.0, 40.0, 41.0, 19.0, 23.0, 9.0, 11.0, 14.0, 6.0, 8.0, 8.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.30859375, -6.1268310546875, -5.945068359375, -5.7633056640625, -5.58154296875, -5.3997802734375, -5.218017578125, -5.0362548828125, -4.8544921875, -4.6727294921875, -4.490966796875, -4.3092041015625, -4.12744140625, -3.9456787109375, -3.763916015625, -3.5821533203125, -3.400390625, -3.2186279296875, -3.036865234375, -2.8551025390625, -2.67333984375, -2.4915771484375, -2.309814453125, -2.1280517578125, -1.9462890625, -1.7645263671875, -1.582763671875, -1.4010009765625, -1.21923828125, -1.0374755859375, -0.855712890625, -0.6739501953125, -0.4921875, -0.3104248046875, -0.128662109375, 0.0531005859375, 0.23486328125, 0.4166259765625, 0.598388671875, 0.7801513671875, 0.9619140625, 1.1436767578125, 1.325439453125, 1.5072021484375, 1.68896484375, 1.8707275390625, 2.052490234375, 2.2342529296875, 2.416015625, 2.5977783203125, 2.779541015625, 2.9613037109375, 3.14306640625, 3.3248291015625, 3.506591796875, 3.6883544921875, 3.8701171875, 4.0518798828125, 4.233642578125, 4.4154052734375, 4.59716796875, 4.7789306640625, 4.960693359375, 5.1424560546875, 5.32421875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 9.0, 23.0, 24.0, 55.0, 72.0, 119.0, 180.0, 150.0, 151.0, 87.0, 49.0, 33.0, 25.0, 9.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.94160461425781, -120.88534545898438, -113.8290786743164, -106.77281188964844, -99.716552734375, -92.66029357910156, -85.6040267944336, -78.54776000976562, -71.49150085449219, -64.43524169921875, -57.37897491455078, -50.32271194458008, -43.266448974609375, -36.21018600463867, -29.15392303466797, -22.097660064697266, -15.041397094726562, -7.985134124755859, -0.9288711547851562, 6.127391815185547, 13.18365478515625, 20.239917755126953, 27.296180725097656, 34.35244369506836, 41.40870666503906, 48.464969635009766, 55.52123260498047, 62.57749557495117, 69.63375854492188, 76.69001770019531, 83.74628448486328, 90.80255126953125, 97.85879516601562, 104.91505432128906, 111.97132110595703, 119.027587890625, 126.08384704589844, 133.14010620117188, 140.19638061523438, 147.2526397705078, 154.30889892578125, 161.3651580810547, 168.42141723632812, 175.47769165039062, 182.53395080566406, 189.5902099609375, 196.646484375, 203.70274353027344, 210.75900268554688, 217.8152618408203, 224.87152099609375, 231.92779541015625, 238.9840545654297, 246.04031372070312, 253.09658813476562, 260.15283203125, 267.2091064453125, 274.265380859375, 281.3216247558594, 288.3778991699219, 295.43414306640625, 302.49041748046875, 309.54669189453125, 316.6029357910156, 323.6592102050781]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 12.0, 13.0, 13.0, 8.0, 17.0, 23.0, 19.0, 21.0, 21.0, 23.0, 29.0, 29.0, 37.0, 31.0, 45.0, 31.0, 37.0, 30.0, 42.0, 44.0, 36.0, 56.0, 46.0, 32.0, 25.0, 26.0, 35.0, 30.0, 28.0, 21.0, 20.0, 20.0, 12.0, 25.0, 15.0, 12.0, 5.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-89.68400573730469, -86.8517837524414, -84.01956176757812, -81.18733978271484, -78.35511779785156, -75.52288818359375, -72.690673828125, -69.85844421386719, -67.0262222290039, -64.19400024414062, -61.361778259277344, -58.52955627441406, -55.697330474853516, -52.865108489990234, -50.03288650512695, -47.200660705566406, -44.36844253540039, -41.53622055053711, -38.70399856567383, -35.87177276611328, -33.03955078125, -30.20732879638672, -27.375106811523438, -24.542882919311523, -21.710660934448242, -18.87843894958496, -16.046215057373047, -13.213993072509766, -10.381770133972168, -7.54954719543457, -4.717325210571289, -1.885101318359375, 0.9471206665039062, 3.779343366622925, 6.611566066741943, 9.443788528442383, 12.27601146697998, 15.108234405517578, 17.94045639038086, 20.772680282592773, 23.604902267456055, 26.437124252319336, 29.26934814453125, 32.10157012939453, 34.93379211425781, 37.766014099121094, 40.598236083984375, 43.43046188354492, 46.2626838684082, 49.094905853271484, 51.927127838134766, 54.75935363769531, 57.591575622558594, 60.423797607421875, 63.256019592285156, 66.08824157714844, 68.92046356201172, 71.752685546875, 74.58490753173828, 77.41712951660156, 80.24935150146484, 83.08157348632812, 85.91380310058594, 88.74602508544922, 91.5782470703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 8.0, 10.0, 12.0, 22.0, 25.0, 31.0, 53.0, 66.0, 80.0, 122.0, 194.0, 321.0, 494.0, 979.0, 1712.0, 3741.0, 9044.0, 26926.0, 120348.0, 3460724.0, 483472.0, 58187.0, 16135.0, 5936.0, 2666.0, 1165.0, 645.0, 402.0, 196.0, 164.0, 78.0, 57.0, 47.0, 41.0, 39.0, 29.0, 23.0, 12.0, 11.0, 14.0, 8.0, 10.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-39.6875, -38.20556640625, -36.7236328125, -35.24169921875, -33.759765625, -32.27783203125, -30.7958984375, -29.31396484375, -27.83203125, -26.35009765625, -24.8681640625, -23.38623046875, -21.904296875, -20.42236328125, -18.9404296875, -17.45849609375, -15.9765625, -14.49462890625, -13.0126953125, -11.53076171875, -10.048828125, -8.56689453125, -7.0849609375, -5.60302734375, -4.12109375, -2.63916015625, -1.1572265625, 0.32470703125, 1.806640625, 3.28857421875, 4.7705078125, 6.25244140625, 7.734375, 9.21630859375, 10.6982421875, 12.18017578125, 13.662109375, 15.14404296875, 16.6259765625, 18.10791015625, 19.58984375, 21.07177734375, 22.5537109375, 24.03564453125, 25.517578125, 26.99951171875, 28.4814453125, 29.96337890625, 31.4453125, 32.92724609375, 34.4091796875, 35.89111328125, 37.373046875, 38.85498046875, 40.3369140625, 41.81884765625, 43.30078125, 44.78271484375, 46.2646484375, 47.74658203125, 49.228515625, 50.71044921875, 52.1923828125, 53.67431640625, 55.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 12.0, 22.0, 24.0, 39.0, 50.0, 52.0, 78.0, 77.0, 112.0, 95.0, 88.0, 80.0, 55.0, 55.0, 39.0, 40.0, 21.0, 18.0, 9.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.7315673828125, -8.431884765625, -8.1322021484375, -7.83251953125, -7.5328369140625, -7.233154296875, -6.9334716796875, -6.6337890625, -6.3341064453125, -6.034423828125, -5.7347412109375, -5.43505859375, -5.1353759765625, -4.835693359375, -4.5360107421875, -4.236328125, -3.9366455078125, -3.636962890625, -3.3372802734375, -3.03759765625, -2.7379150390625, -2.438232421875, -2.1385498046875, -1.8388671875, -1.5391845703125, -1.239501953125, -0.9398193359375, -0.64013671875, -0.3404541015625, -0.040771484375, 0.2589111328125, 0.55859375, 0.8582763671875, 1.157958984375, 1.4576416015625, 1.75732421875, 2.0570068359375, 2.356689453125, 2.6563720703125, 2.9560546875, 3.2557373046875, 3.555419921875, 3.8551025390625, 4.15478515625, 4.4544677734375, 4.754150390625, 5.0538330078125, 5.353515625, 5.6531982421875, 5.952880859375, 6.2525634765625, 6.55224609375, 6.8519287109375, 7.151611328125, 7.4512939453125, 7.7509765625, 8.0506591796875, 8.350341796875, 8.6500244140625, 8.94970703125, 9.2493896484375, 9.549072265625, 9.8487548828125, 10.1484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 8.0, 16.0, 29.0, 35.0, 51.0, 57.0, 106.0, 159.0, 214.0, 316.0, 545.0, 856.0, 1348.0, 2615.0, 4986.0, 11256.0, 29239.0, 89735.0, 421608.0, 3144900.0, 356061.0, 80996.0, 27285.0, 10784.0, 4909.0, 2534.0, 1338.0, 815.0, 468.0, 312.0, 225.0, 134.0, 86.0, 74.0, 48.0, 42.0, 18.0, 17.0, 11.0, 7.0, 6.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -24.043212890625, -23.22705078125, -22.410888671875, -21.5947265625, -20.778564453125, -19.96240234375, -19.146240234375, -18.330078125, -17.513916015625, -16.69775390625, -15.881591796875, -15.0654296875, -14.249267578125, -13.43310546875, -12.616943359375, -11.80078125, -10.984619140625, -10.16845703125, -9.352294921875, -8.5361328125, -7.719970703125, -6.90380859375, -6.087646484375, -5.271484375, -4.455322265625, -3.63916015625, -2.822998046875, -2.0068359375, -1.190673828125, -0.37451171875, 0.441650390625, 1.2578125, 2.073974609375, 2.89013671875, 3.706298828125, 4.5224609375, 5.338623046875, 6.15478515625, 6.970947265625, 7.787109375, 8.603271484375, 9.41943359375, 10.235595703125, 11.0517578125, 11.867919921875, 12.68408203125, 13.500244140625, 14.31640625, 15.132568359375, 15.94873046875, 16.764892578125, 17.5810546875, 18.397216796875, 19.21337890625, 20.029541015625, 20.845703125, 21.661865234375, 22.47802734375, 23.294189453125, 24.1103515625, 24.926513671875, 25.74267578125, 26.558837890625, 27.375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 9.0, 15.0, 22.0, 33.0, 49.0, 75.0, 124.0, 199.0, 447.0, 1476.0, 874.0, 281.0, 159.0, 89.0, 56.0, 48.0, 31.0, 17.0, 17.0, 8.0, 7.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.6640625, -15.2503662109375, -14.836669921875, -14.4229736328125, -14.00927734375, -13.5955810546875, -13.181884765625, -12.7681884765625, -12.3544921875, -11.9407958984375, -11.527099609375, -11.1134033203125, -10.69970703125, -10.2860107421875, -9.872314453125, -9.4586181640625, -9.044921875, -8.6312255859375, -8.217529296875, -7.8038330078125, -7.39013671875, -6.9764404296875, -6.562744140625, -6.1490478515625, -5.7353515625, -5.3216552734375, -4.907958984375, -4.4942626953125, -4.08056640625, -3.6668701171875, -3.253173828125, -2.8394775390625, -2.42578125, -2.0120849609375, -1.598388671875, -1.1846923828125, -0.77099609375, -0.3572998046875, 0.056396484375, 0.4700927734375, 0.8837890625, 1.2974853515625, 1.711181640625, 2.1248779296875, 2.53857421875, 2.9522705078125, 3.365966796875, 3.7796630859375, 4.193359375, 4.6070556640625, 5.020751953125, 5.4344482421875, 5.84814453125, 6.2618408203125, 6.675537109375, 7.0892333984375, 7.5029296875, 7.9166259765625, 8.330322265625, 8.7440185546875, 9.15771484375, 9.5714111328125, 9.985107421875, 10.3988037109375, 10.8125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 9.0, 19.0, 45.0, 69.0, 88.0, 107.0, 124.0, 144.0, 133.0, 86.0, 60.0, 55.0, 32.0, 13.0, 11.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.95199584960938, -114.00220489501953, -111.05241394042969, -108.10262298583984, -105.15283203125, -102.20304107666016, -99.25325012207031, -96.303466796875, -93.35366821289062, -90.40387725830078, -87.45408630371094, -84.5042953491211, -81.55450439453125, -78.6047134399414, -75.65492248535156, -72.70513916015625, -69.7553482055664, -66.80555725097656, -63.85576629638672, -60.905975341796875, -57.95618438720703, -55.00639343261719, -52.05660629272461, -49.106815338134766, -46.15702438354492, -43.20723342895508, -40.257442474365234, -37.307655334472656, -34.35786437988281, -31.408071517944336, -28.458282470703125, -25.50849151611328, -22.558692932128906, -19.608901977539062, -16.65911102294922, -13.709321975708008, -10.759531021118164, -7.80974006652832, -4.859951019287109, -1.9101600646972656, 1.0396308898925781, 3.9894213676452637, 6.939211845397949, 9.889001846313477, 12.83879280090332, 15.788583755493164, 18.738372802734375, 21.68816375732422, 24.637954711914062, 27.587745666503906, 30.53753662109375, 33.487327575683594, 36.43711853027344, 39.38690948486328, 42.33669662475586, 45.2864875793457, 48.23627853393555, 51.18606948852539, 54.135860443115234, 57.08564758300781, 60.035438537597656, 62.9852294921875, 65.93502044677734, 68.88481140136719, 71.83460235595703]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 4.0, 6.0, 11.0, 11.0, 12.0, 31.0, 24.0, 26.0, 33.0, 32.0, 31.0, 30.0, 39.0, 34.0, 40.0, 56.0, 51.0, 59.0, 66.0, 40.0, 36.0, 44.0, 40.0, 35.0, 32.0, 26.0, 27.0, 27.0, 16.0, 9.0, 16.0, 12.0, 12.0, 11.0, 5.0, 1.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.68795394897461, -47.32981872558594, -45.971683502197266, -44.613548278808594, -43.255409240722656, -41.897274017333984, -40.53913879394531, -39.18100357055664, -37.82286834716797, -36.4647331237793, -35.106597900390625, -33.74846267700195, -32.39032745361328, -31.032190322875977, -29.674053192138672, -28.31591796875, -26.957782745361328, -25.599647521972656, -24.241512298583984, -22.88337516784668, -21.525239944458008, -20.167104721069336, -18.80896759033203, -17.45083236694336, -16.092697143554688, -14.734561920166016, -13.376425743103027, -12.018289566040039, -10.660154342651367, -9.302019119262695, -7.943882942199707, -6.585746765136719, -5.2276153564453125, -3.8694796562194824, -2.5113439559936523, -1.1532082557678223, 0.2049274444580078, 1.563063144683838, 2.921198844909668, 4.279335021972656, 5.637470245361328, 6.995605945587158, 8.353741645812988, 9.711877822875977, 11.070013046264648, 12.42814826965332, 13.786284446716309, 15.144420623779297, 16.50255584716797, 17.86069107055664, 19.218826293945312, 20.576963424682617, 21.93509864807129, 23.29323387145996, 24.651371002197266, 26.009506225585938, 27.36764144897461, 28.72577667236328, 30.083911895751953, 31.442049026489258, 32.80018615722656, 34.158321380615234, 35.516456604003906, 36.87459182739258, 38.23272705078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 10.0, 11.0, 7.0, 15.0, 16.0, 26.0, 59.0, 87.0, 205.0, 362.0, 899.0, 2617.0, 12639.0, 90632.0, 775945.0, 141516.0, 18174.0, 3385.0, 1002.0, 442.0, 216.0, 129.0, 70.0, 43.0, 21.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.75, -54.6162109375, -52.482421875, -50.3486328125, -48.21484375, -46.0810546875, -43.947265625, -41.8134765625, -39.6796875, -37.5458984375, -35.412109375, -33.2783203125, -31.14453125, -29.0107421875, -26.876953125, -24.7431640625, -22.609375, -20.4755859375, -18.341796875, -16.2080078125, -14.07421875, -11.9404296875, -9.806640625, -7.6728515625, -5.5390625, -3.4052734375, -1.271484375, 0.8623046875, 2.99609375, 5.1298828125, 7.263671875, 9.3974609375, 11.53125, 13.6650390625, 15.798828125, 17.9326171875, 20.06640625, 22.2001953125, 24.333984375, 26.4677734375, 28.6015625, 30.7353515625, 32.869140625, 35.0029296875, 37.13671875, 39.2705078125, 41.404296875, 43.5380859375, 45.671875, 47.8056640625, 49.939453125, 52.0732421875, 54.20703125, 56.3408203125, 58.474609375, 60.6083984375, 62.7421875, 64.8759765625, 67.009765625, 69.1435546875, 71.27734375, 73.4111328125, 75.544921875, 77.6787109375, 79.8125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 12.0, 22.0, 28.0, 40.0, 47.0, 51.0, 76.0, 86.0, 100.0, 76.0, 94.0, 71.0, 58.0, 57.0, 39.0, 42.0, 29.0, 25.0, 7.0, 11.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.724853515625, -8.42626953125, -8.127685546875, -7.8291015625, -7.530517578125, -7.23193359375, -6.933349609375, -6.634765625, -6.336181640625, -6.03759765625, -5.739013671875, -5.4404296875, -5.141845703125, -4.84326171875, -4.544677734375, -4.24609375, -3.947509765625, -3.64892578125, -3.350341796875, -3.0517578125, -2.753173828125, -2.45458984375, -2.156005859375, -1.857421875, -1.558837890625, -1.26025390625, -0.961669921875, -0.6630859375, -0.364501953125, -0.06591796875, 0.232666015625, 0.53125, 0.829833984375, 1.12841796875, 1.427001953125, 1.7255859375, 2.024169921875, 2.32275390625, 2.621337890625, 2.919921875, 3.218505859375, 3.51708984375, 3.815673828125, 4.1142578125, 4.412841796875, 4.71142578125, 5.010009765625, 5.30859375, 5.607177734375, 5.90576171875, 6.204345703125, 6.5029296875, 6.801513671875, 7.10009765625, 7.398681640625, 7.697265625, 7.995849609375, 8.29443359375, 8.593017578125, 8.8916015625, 9.190185546875, 9.48876953125, 9.787353515625, 10.0859375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 19.0, 15.0, 37.0, 35.0, 52.0, 106.0, 156.0, 271.0, 511.0, 1000.0, 2241.0, 5576.0, 14518.0, 40184.0, 145566.0, 588157.0, 177380.0, 45304.0, 16314.0, 6149.0, 2483.0, 1098.0, 552.0, 311.0, 172.0, 105.0, 66.0, 54.0, 35.0, 17.0, 10.0, 8.0, 10.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.796875, -22.933349609375, -22.06982421875, -21.206298828125, -20.3427734375, -19.479248046875, -18.61572265625, -17.752197265625, -16.888671875, -16.025146484375, -15.16162109375, -14.298095703125, -13.4345703125, -12.571044921875, -11.70751953125, -10.843994140625, -9.98046875, -9.116943359375, -8.25341796875, -7.389892578125, -6.5263671875, -5.662841796875, -4.79931640625, -3.935791015625, -3.072265625, -2.208740234375, -1.34521484375, -0.481689453125, 0.3818359375, 1.245361328125, 2.10888671875, 2.972412109375, 3.8359375, 4.699462890625, 5.56298828125, 6.426513671875, 7.2900390625, 8.153564453125, 9.01708984375, 9.880615234375, 10.744140625, 11.607666015625, 12.47119140625, 13.334716796875, 14.1982421875, 15.061767578125, 15.92529296875, 16.788818359375, 17.65234375, 18.515869140625, 19.37939453125, 20.242919921875, 21.1064453125, 21.969970703125, 22.83349609375, 23.697021484375, 24.560546875, 25.424072265625, 26.28759765625, 27.151123046875, 28.0146484375, 28.878173828125, 29.74169921875, 30.605224609375, 31.46875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 8.0, 8.0, 13.0, 15.0, 15.0, 14.0, 35.0, 37.0, 28.0, 42.0, 44.0, 36.0, 52.0, 61.0, 55.0, 55.0, 52.0, 50.0, 65.0, 39.0, 47.0, 32.0, 32.0, 27.0, 23.0, 18.0, 18.0, 14.0, 12.0, 7.0, 11.0, 8.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.65625, -27.8466796875, -27.037109375, -26.2275390625, -25.41796875, -24.6083984375, -23.798828125, -22.9892578125, -22.1796875, -21.3701171875, -20.560546875, -19.7509765625, -18.94140625, -18.1318359375, -17.322265625, -16.5126953125, -15.703125, -14.8935546875, -14.083984375, -13.2744140625, -12.46484375, -11.6552734375, -10.845703125, -10.0361328125, -9.2265625, -8.4169921875, -7.607421875, -6.7978515625, -5.98828125, -5.1787109375, -4.369140625, -3.5595703125, -2.75, -1.9404296875, -1.130859375, -0.3212890625, 0.48828125, 1.2978515625, 2.107421875, 2.9169921875, 3.7265625, 4.5361328125, 5.345703125, 6.1552734375, 6.96484375, 7.7744140625, 8.583984375, 9.3935546875, 10.203125, 11.0126953125, 11.822265625, 12.6318359375, 13.44140625, 14.2509765625, 15.060546875, 15.8701171875, 16.6796875, 17.4892578125, 18.298828125, 19.1083984375, 19.91796875, 20.7275390625, 21.537109375, 22.3466796875, 23.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 3.0, 6.0, 2.0, 5.0, 23.0, 10.0, 11.0, 18.0, 28.0, 37.0, 46.0, 69.0, 116.0, 232.0, 455.0, 992.0, 2346.0, 5643.0, 17021.0, 69443.0, 530978.0, 351053.0, 48587.0, 13022.0, 4706.0, 1956.0, 830.0, 354.0, 184.0, 109.0, 60.0, 41.0, 39.0, 25.0, 16.0, 12.0, 15.0, 13.0, 7.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3046875, -12.900146484375, -12.49560546875, -12.091064453125, -11.6865234375, -11.281982421875, -10.87744140625, -10.472900390625, -10.068359375, -9.663818359375, -9.25927734375, -8.854736328125, -8.4501953125, -8.045654296875, -7.64111328125, -7.236572265625, -6.83203125, -6.427490234375, -6.02294921875, -5.618408203125, -5.2138671875, -4.809326171875, -4.40478515625, -4.000244140625, -3.595703125, -3.191162109375, -2.78662109375, -2.382080078125, -1.9775390625, -1.572998046875, -1.16845703125, -0.763916015625, -0.359375, 0.045166015625, 0.44970703125, 0.854248046875, 1.2587890625, 1.663330078125, 2.06787109375, 2.472412109375, 2.876953125, 3.281494140625, 3.68603515625, 4.090576171875, 4.4951171875, 4.899658203125, 5.30419921875, 5.708740234375, 6.11328125, 6.517822265625, 6.92236328125, 7.326904296875, 7.7314453125, 8.135986328125, 8.54052734375, 8.945068359375, 9.349609375, 9.754150390625, 10.15869140625, 10.563232421875, 10.9677734375, 11.372314453125, 11.77685546875, 12.181396484375, 12.5859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 13.0, 13.0, 15.0, 24.0, 34.0, 60.0, 112.0, 270.0, 220.0, 86.0, 44.0, 22.0, 24.0, 4.0, 17.0, 12.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026397705078125, -0.0025512278079986572, -0.0024626851081848145, -0.0023741424083709717, -0.002285599708557129, -0.002197057008743286, -0.0021085143089294434, -0.0020199716091156006, -0.0019314289093017578, -0.001842886209487915, -0.0017543435096740723, -0.0016658008098602295, -0.0015772581100463867, -0.001488715410232544, -0.0014001727104187012, -0.0013116300106048584, -0.0012230873107910156, -0.0011345446109771729, -0.00104600191116333, -0.0009574592113494873, -0.0008689165115356445, -0.0007803738117218018, -0.000691831111907959, -0.0006032884120941162, -0.0005147457122802734, -0.00042620301246643066, -0.0003376603126525879, -0.0002491176128387451, -0.00016057491302490234, -7.203221321105957e-05, 1.6510486602783203e-05, 0.00010505318641662598, 0.00019359588623046875, 0.0002821385860443115, 0.0003706812858581543, 0.00045922398567199707, 0.0005477666854858398, 0.0006363093852996826, 0.0007248520851135254, 0.0008133947849273682, 0.0009019374847412109, 0.0009904801845550537, 0.0010790228843688965, 0.0011675655841827393, 0.001256108283996582, 0.0013446509838104248, 0.0014331936836242676, 0.0015217363834381104, 0.0016102790832519531, 0.001698821783065796, 0.0017873644828796387, 0.0018759071826934814, 0.0019644498825073242, 0.002052992582321167, 0.0021415352821350098, 0.0022300779819488525, 0.0023186206817626953, 0.002407163381576538, 0.002495706081390381, 0.0025842487812042236, 0.0026727914810180664, 0.002761334180831909, 0.002849876880645752, 0.0029384195804595947, 0.0030269622802734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 8.0, 10.0, 14.0, 14.0, 13.0, 20.0, 39.0, 43.0, 46.0, 72.0, 112.0, 213.0, 397.0, 796.0, 1730.0, 4344.0, 12930.0, 45471.0, 302210.0, 575828.0, 74439.0, 19134.0, 6040.0, 2370.0, 1073.0, 478.0, 230.0, 135.0, 78.0, 67.0, 34.0, 23.0, 26.0, 22.0, 20.0, 14.0, 7.0, 3.0, 7.0, 7.0, 9.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.4888916015625, -11.094970703125, -10.7010498046875, -10.30712890625, -9.9132080078125, -9.519287109375, -9.1253662109375, -8.7314453125, -8.3375244140625, -7.943603515625, -7.5496826171875, -7.15576171875, -6.7618408203125, -6.367919921875, -5.9739990234375, -5.580078125, -5.1861572265625, -4.792236328125, -4.3983154296875, -4.00439453125, -3.6104736328125, -3.216552734375, -2.8226318359375, -2.4287109375, -2.0347900390625, -1.640869140625, -1.2469482421875, -0.85302734375, -0.4591064453125, -0.065185546875, 0.3287353515625, 0.72265625, 1.1165771484375, 1.510498046875, 1.9044189453125, 2.29833984375, 2.6922607421875, 3.086181640625, 3.4801025390625, 3.8740234375, 4.2679443359375, 4.661865234375, 5.0557861328125, 5.44970703125, 5.8436279296875, 6.237548828125, 6.6314697265625, 7.025390625, 7.4193115234375, 7.813232421875, 8.2071533203125, 8.60107421875, 8.9949951171875, 9.388916015625, 9.7828369140625, 10.1767578125, 10.5706787109375, 10.964599609375, 11.3585205078125, 11.75244140625, 12.1463623046875, 12.540283203125, 12.9342041015625, 13.328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 0.0, 3.0, 5.0, 9.0, 8.0, 13.0, 21.0, 31.0, 28.0, 67.0, 93.0, 120.0, 119.0, 136.0, 102.0, 85.0, 40.0, 27.0, 27.0, 14.0, 11.0, 11.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.6640625, -10.356201171875, -10.04833984375, -9.740478515625, -9.4326171875, -9.124755859375, -8.81689453125, -8.509033203125, -8.201171875, -7.893310546875, -7.58544921875, -7.277587890625, -6.9697265625, -6.661865234375, -6.35400390625, -6.046142578125, -5.73828125, -5.430419921875, -5.12255859375, -4.814697265625, -4.5068359375, -4.198974609375, -3.89111328125, -3.583251953125, -3.275390625, -2.967529296875, -2.65966796875, -2.351806640625, -2.0439453125, -1.736083984375, -1.42822265625, -1.120361328125, -0.8125, -0.504638671875, -0.19677734375, 0.111083984375, 0.4189453125, 0.726806640625, 1.03466796875, 1.342529296875, 1.650390625, 1.958251953125, 2.26611328125, 2.573974609375, 2.8818359375, 3.189697265625, 3.49755859375, 3.805419921875, 4.11328125, 4.421142578125, 4.72900390625, 5.036865234375, 5.3447265625, 5.652587890625, 5.96044921875, 6.268310546875, 6.576171875, 6.884033203125, 7.19189453125, 7.499755859375, 7.8076171875, 8.115478515625, 8.42333984375, 8.731201171875, 9.0390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 6.0, 5.0, 17.0, 26.0, 33.0, 48.0, 63.0, 72.0, 92.0, 103.0, 105.0, 94.0, 85.0, 67.0, 57.0, 43.0, 28.0, 17.0, 13.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.11668395996094, -98.92745971679688, -94.73824310302734, -90.54901885986328, -86.35980224609375, -82.17057800292969, -77.98135375976562, -73.79212951660156, -69.60291290283203, -65.41368865966797, -61.22447204589844, -57.035247802734375, -52.84602737426758, -48.65680694580078, -44.46758270263672, -40.27836227416992, -36.089141845703125, -31.899921417236328, -27.7106990814209, -23.52147674560547, -19.332256317138672, -15.143035888671875, -10.953813552856445, -6.764591217041016, -2.5753707885742188, 1.6138505935668945, 5.803071975708008, 9.992293357849121, 14.181514739990234, 18.37073516845703, 22.55995750427246, 26.74917984008789, 30.93841552734375, 35.12763595581055, 39.316856384277344, 43.506080627441406, 47.6953010559082, 51.884521484375, 56.07374572753906, 60.26296615600586, 64.45218658447266, 68.64141082763672, 72.83062744140625, 77.01985168457031, 81.20907592773438, 85.3982925415039, 89.58751678466797, 93.7767333984375, 97.96595764160156, 102.15518188476562, 106.34439849853516, 110.53362274169922, 114.72283935546875, 118.91206359863281, 123.10128784179688, 127.29051208496094, 131.479736328125, 135.66896057128906, 139.85818481445312, 144.04739379882812, 148.2366180419922, 152.42584228515625, 156.6150665283203, 160.80429077148438, 164.99349975585938]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 21.0, 7.0, 20.0, 22.0, 25.0, 26.0, 39.0, 35.0, 42.0, 47.0, 41.0, 48.0, 42.0, 49.0, 51.0, 49.0, 51.0, 42.0, 44.0, 42.0, 41.0, 37.0, 32.0, 31.0, 20.0, 12.0, 15.0, 12.0, 13.0, 6.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.07212829589844, -126.45592498779297, -122.8397216796875, -119.22351837158203, -115.60731506347656, -111.9911117553711, -108.37490844726562, -104.75871276855469, -101.14250183105469, -97.52629852294922, -93.91009521484375, -90.29389190673828, -86.67768859863281, -83.06148529052734, -79.44528198242188, -75.82908630371094, -72.21288299560547, -68.5966796875, -64.98047637939453, -61.36427307128906, -57.748069763183594, -54.131866455078125, -50.51566696166992, -46.89946365356445, -43.283260345458984, -39.667057037353516, -36.05085372924805, -32.434654235839844, -28.818449020385742, -25.202245712280273, -21.586044311523438, -17.96984100341797, -14.3536376953125, -10.737434387207031, -7.121232032775879, -3.5050296783447266, 0.11117362976074219, 3.727376937866211, 7.343578338623047, 10.959781646728516, 14.575984954833984, 18.192188262939453, 21.808391571044922, 25.424592971801758, 29.040796279907227, 32.65699768066406, 36.27320098876953, 39.889404296875, 43.50560760498047, 47.12181091308594, 50.738014221191406, 54.354217529296875, 57.970420837402344, 61.58662414550781, 65.20281982421875, 68.81903076171875, 72.43522644042969, 76.05142974853516, 79.66763305664062, 83.2838363647461, 86.90003967285156, 90.51624298095703, 94.1324462890625, 97.74864196777344, 101.36485290527344]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 16.0, 14.0, 17.0, 16.0, 35.0, 54.0, 68.0, 118.0, 201.0, 316.0, 504.0, 967.0, 1782.0, 4095.0, 10683.0, 35673.0, 191447.0, 3658232.0, 229882.0, 40058.0, 11787.0, 4291.0, 1806.0, 881.0, 465.0, 268.0, 178.0, 116.0, 81.0, 56.0, 39.0, 36.0, 15.0, 15.0, 18.0, 8.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-48.21875, -46.40185546875, -44.5849609375, -42.76806640625, -40.951171875, -39.13427734375, -37.3173828125, -35.50048828125, -33.68359375, -31.86669921875, -30.0498046875, -28.23291015625, -26.416015625, -24.59912109375, -22.7822265625, -20.96533203125, -19.1484375, -17.33154296875, -15.5146484375, -13.69775390625, -11.880859375, -10.06396484375, -8.2470703125, -6.43017578125, -4.61328125, -2.79638671875, -0.9794921875, 0.83740234375, 2.654296875, 4.47119140625, 6.2880859375, 8.10498046875, 9.921875, 11.73876953125, 13.5556640625, 15.37255859375, 17.189453125, 19.00634765625, 20.8232421875, 22.64013671875, 24.45703125, 26.27392578125, 28.0908203125, 29.90771484375, 31.724609375, 33.54150390625, 35.3583984375, 37.17529296875, 38.9921875, 40.80908203125, 42.6259765625, 44.44287109375, 46.259765625, 48.07666015625, 49.8935546875, 51.71044921875, 53.52734375, 55.34423828125, 57.1611328125, 58.97802734375, 60.794921875, 62.61181640625, 64.4287109375, 66.24560546875, 68.0625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 14.0, 19.0, 13.0, 36.0, 48.0, 66.0, 57.0, 67.0, 97.0, 94.0, 76.0, 75.0, 61.0, 62.0, 47.0, 41.0, 32.0, 31.0, 15.0, 9.0, 6.0, 7.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.5616455078125, -8.263916015625, -7.9661865234375, -7.66845703125, -7.3707275390625, -7.072998046875, -6.7752685546875, -6.4775390625, -6.1798095703125, -5.882080078125, -5.5843505859375, -5.28662109375, -4.9888916015625, -4.691162109375, -4.3934326171875, -4.095703125, -3.7979736328125, -3.500244140625, -3.2025146484375, -2.90478515625, -2.6070556640625, -2.309326171875, -2.0115966796875, -1.7138671875, -1.4161376953125, -1.118408203125, -0.8206787109375, -0.52294921875, -0.2252197265625, 0.072509765625, 0.3702392578125, 0.66796875, 0.9656982421875, 1.263427734375, 1.5611572265625, 1.85888671875, 2.1566162109375, 2.454345703125, 2.7520751953125, 3.0498046875, 3.3475341796875, 3.645263671875, 3.9429931640625, 4.24072265625, 4.5384521484375, 4.836181640625, 5.1339111328125, 5.431640625, 5.7293701171875, 6.027099609375, 6.3248291015625, 6.62255859375, 6.9202880859375, 7.218017578125, 7.5157470703125, 7.8134765625, 8.1112060546875, 8.408935546875, 8.7066650390625, 9.00439453125, 9.3021240234375, 9.599853515625, 9.8975830078125, 10.1953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 11.0, 10.0, 12.0, 11.0, 22.0, 24.0, 28.0, 49.0, 83.0, 113.0, 152.0, 256.0, 394.0, 709.0, 1246.0, 2579.0, 5635.0, 14125.0, 40219.0, 147741.0, 1880327.0, 1886183.0, 148099.0, 40433.0, 14105.0, 5833.0, 2636.0, 1315.0, 724.0, 417.0, 225.0, 163.0, 92.0, 83.0, 40.0, 55.0, 36.0, 24.0, 19.0, 10.0, 12.0, 14.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-33.375, -32.33203125, -31.2890625, -30.24609375, -29.203125, -28.16015625, -27.1171875, -26.07421875, -25.03125, -23.98828125, -22.9453125, -21.90234375, -20.859375, -19.81640625, -18.7734375, -17.73046875, -16.6875, -15.64453125, -14.6015625, -13.55859375, -12.515625, -11.47265625, -10.4296875, -9.38671875, -8.34375, -7.30078125, -6.2578125, -5.21484375, -4.171875, -3.12890625, -2.0859375, -1.04296875, 0.0, 1.04296875, 2.0859375, 3.12890625, 4.171875, 5.21484375, 6.2578125, 7.30078125, 8.34375, 9.38671875, 10.4296875, 11.47265625, 12.515625, 13.55859375, 14.6015625, 15.64453125, 16.6875, 17.73046875, 18.7734375, 19.81640625, 20.859375, 21.90234375, 22.9453125, 23.98828125, 25.03125, 26.07421875, 27.1171875, 28.16015625, 29.203125, 30.24609375, 31.2890625, 32.33203125, 33.375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 12.0, 4.0, 10.0, 28.0, 53.0, 78.0, 161.0, 382.0, 1948.0, 842.0, 272.0, 116.0, 71.0, 31.0, 18.0, 12.0, 12.0, 10.0, 5.0, 6.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.75, -23.048095703125, -22.34619140625, -21.644287109375, -20.9423828125, -20.240478515625, -19.53857421875, -18.836669921875, -18.134765625, -17.432861328125, -16.73095703125, -16.029052734375, -15.3271484375, -14.625244140625, -13.92333984375, -13.221435546875, -12.51953125, -11.817626953125, -11.11572265625, -10.413818359375, -9.7119140625, -9.010009765625, -8.30810546875, -7.606201171875, -6.904296875, -6.202392578125, -5.50048828125, -4.798583984375, -4.0966796875, -3.394775390625, -2.69287109375, -1.990966796875, -1.2890625, -0.587158203125, 0.11474609375, 0.816650390625, 1.5185546875, 2.220458984375, 2.92236328125, 3.624267578125, 4.326171875, 5.028076171875, 5.72998046875, 6.431884765625, 7.1337890625, 7.835693359375, 8.53759765625, 9.239501953125, 9.94140625, 10.643310546875, 11.34521484375, 12.047119140625, 12.7490234375, 13.450927734375, 14.15283203125, 14.854736328125, 15.556640625, 16.258544921875, 16.96044921875, 17.662353515625, 18.3642578125, 19.066162109375, 19.76806640625, 20.469970703125, 21.171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 14.0, 18.0, 52.0, 74.0, 133.0, 140.0, 173.0, 146.0, 127.0, 46.0, 33.0, 19.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-133.68490600585938, -130.12982177734375, -126.57474517822266, -123.01966094970703, -119.4645767211914, -115.90950012207031, -112.35441589355469, -108.79933166503906, -105.24425506591797, -101.68917083740234, -98.13409423828125, -94.57901000976562, -91.02392578125, -87.4688491821289, -83.91376495361328, -80.35868835449219, -76.80360412597656, -73.24851989746094, -69.69344329833984, -66.13835906982422, -62.58327865600586, -59.0281982421875, -55.473114013671875, -51.918033599853516, -48.362945556640625, -44.807865142822266, -41.25278091430664, -37.69770050048828, -34.14262008666992, -30.58753776550293, -27.032455444335938, -23.477375030517578, -19.92229461669922, -16.367212295532227, -12.812131881713867, -9.257049560546875, -5.701968193054199, -2.1468868255615234, 1.4081954956054688, 4.963275909423828, 8.51835823059082, 12.073439598083496, 15.628520965576172, 19.183603286743164, 22.738685607910156, 26.293766021728516, 29.848848342895508, 33.4039306640625, 36.95901107788086, 40.51409149169922, 44.069175720214844, 47.6242561340332, 51.17933654785156, 54.73442077636719, 58.28950119018555, 61.844581604003906, 65.39966583251953, 68.95475006103516, 72.50982666015625, 76.06491088867188, 79.6199951171875, 83.1750717163086, 86.73015594482422, 90.28523254394531, 93.84031677246094]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 12.0, 11.0, 13.0, 9.0, 14.0, 15.0, 19.0, 25.0, 20.0, 30.0, 22.0, 37.0, 45.0, 39.0, 44.0, 31.0, 45.0, 44.0, 33.0, 37.0, 31.0, 41.0, 37.0, 22.0, 50.0, 28.0, 28.0, 26.0, 22.0, 22.0, 20.0, 25.0, 12.0, 14.0, 9.0, 9.0, 5.0, 7.0, 3.0, 10.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.03485107421875, -39.71956253051758, -38.404273986816406, -37.08898162841797, -35.7736930847168, -34.458404541015625, -33.14311218261719, -31.827823638916016, -30.512535095214844, -29.197246551513672, -27.881956100463867, -26.566665649414062, -25.25137710571289, -23.93608856201172, -22.620798110961914, -21.30550765991211, -19.990219116210938, -18.674930572509766, -17.35964012145996, -16.044349670410156, -14.729061126708984, -13.413771629333496, -12.098482131958008, -10.78319263458252, -9.467903137207031, -8.152613639831543, -6.837324142456055, -5.522034645080566, -4.206745147705078, -2.89145565032959, -1.5761661529541016, -0.2608766555786133, 1.054412841796875, 2.3697023391723633, 3.6849918365478516, 5.00028133392334, 6.315570831298828, 7.630860328674316, 8.946149826049805, 10.261439323425293, 11.576728820800781, 12.89201831817627, 14.207307815551758, 15.522597312927246, 16.837886810302734, 18.153175354003906, 19.46846580505371, 20.783756256103516, 22.099044799804688, 23.41433334350586, 24.729623794555664, 26.04491424560547, 27.36020278930664, 28.675491333007812, 29.990781784057617, 31.306072235107422, 32.621360778808594, 33.936649322509766, 35.25193786621094, 36.567230224609375, 37.88251876831055, 39.19780731201172, 40.513099670410156, 41.82838821411133, 43.1436767578125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 15.0, 28.0, 40.0, 72.0, 120.0, 211.0, 427.0, 935.0, 2487.0, 8846.0, 43809.0, 255632.0, 601362.0, 107369.0, 19781.0, 4585.0, 1484.0, 645.0, 310.0, 148.0, 85.0, 57.0, 34.0, 26.0, 5.0, 11.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-61.3125, -59.7099609375, -58.107421875, -56.5048828125, -54.90234375, -53.2998046875, -51.697265625, -50.0947265625, -48.4921875, -46.8896484375, -45.287109375, -43.6845703125, -42.08203125, -40.4794921875, -38.876953125, -37.2744140625, -35.671875, -34.0693359375, -32.466796875, -30.8642578125, -29.26171875, -27.6591796875, -26.056640625, -24.4541015625, -22.8515625, -21.2490234375, -19.646484375, -18.0439453125, -16.44140625, -14.8388671875, -13.236328125, -11.6337890625, -10.03125, -8.4287109375, -6.826171875, -5.2236328125, -3.62109375, -2.0185546875, -0.416015625, 1.1865234375, 2.7890625, 4.3916015625, 5.994140625, 7.5966796875, 9.19921875, 10.8017578125, 12.404296875, 14.0068359375, 15.609375, 17.2119140625, 18.814453125, 20.4169921875, 22.01953125, 23.6220703125, 25.224609375, 26.8271484375, 28.4296875, 30.0322265625, 31.634765625, 33.2373046875, 34.83984375, 36.4423828125, 38.044921875, 39.6474609375, 41.25]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 18.0, 20.0, 24.0, 33.0, 34.0, 49.0, 57.0, 70.0, 91.0, 76.0, 87.0, 79.0, 65.0, 56.0, 47.0, 46.0, 36.0, 27.0, 18.0, 13.0, 14.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5684814453125, -8.261962890625, -7.9554443359375, -7.64892578125, -7.3424072265625, -7.035888671875, -6.7293701171875, -6.4228515625, -6.1163330078125, -5.809814453125, -5.5032958984375, -5.19677734375, -4.8902587890625, -4.583740234375, -4.2772216796875, -3.970703125, -3.6641845703125, -3.357666015625, -3.0511474609375, -2.74462890625, -2.4381103515625, -2.131591796875, -1.8250732421875, -1.5185546875, -1.2120361328125, -0.905517578125, -0.5989990234375, -0.29248046875, 0.0140380859375, 0.320556640625, 0.6270751953125, 0.93359375, 1.2401123046875, 1.546630859375, 1.8531494140625, 2.15966796875, 2.4661865234375, 2.772705078125, 3.0792236328125, 3.3857421875, 3.6922607421875, 3.998779296875, 4.3052978515625, 4.61181640625, 4.9183349609375, 5.224853515625, 5.5313720703125, 5.837890625, 6.1444091796875, 6.450927734375, 6.7574462890625, 7.06396484375, 7.3704833984375, 7.677001953125, 7.9835205078125, 8.2900390625, 8.5965576171875, 8.903076171875, 9.2095947265625, 9.51611328125, 9.8226318359375, 10.129150390625, 10.4356689453125, 10.7421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 8.0, 18.0, 34.0, 31.0, 55.0, 97.0, 171.0, 227.0, 471.0, 719.0, 1618.0, 4875.0, 20270.0, 100310.0, 545024.0, 301977.0, 55220.0, 11668.0, 3112.0, 1193.0, 573.0, 347.0, 211.0, 131.0, 70.0, 49.0, 22.0, 18.0, 11.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.125, -25.072265625, -24.01953125, -22.966796875, -21.9140625, -20.861328125, -19.80859375, -18.755859375, -17.703125, -16.650390625, -15.59765625, -14.544921875, -13.4921875, -12.439453125, -11.38671875, -10.333984375, -9.28125, -8.228515625, -7.17578125, -6.123046875, -5.0703125, -4.017578125, -2.96484375, -1.912109375, -0.859375, 0.193359375, 1.24609375, 2.298828125, 3.3515625, 4.404296875, 5.45703125, 6.509765625, 7.5625, 8.615234375, 9.66796875, 10.720703125, 11.7734375, 12.826171875, 13.87890625, 14.931640625, 15.984375, 17.037109375, 18.08984375, 19.142578125, 20.1953125, 21.248046875, 22.30078125, 23.353515625, 24.40625, 25.458984375, 26.51171875, 27.564453125, 28.6171875, 29.669921875, 30.72265625, 31.775390625, 32.828125, 33.880859375, 34.93359375, 35.986328125, 37.0390625, 38.091796875, 39.14453125, 40.197265625, 41.25]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 2.0, 2.0, 5.0, 6.0, 9.0, 16.0, 19.0, 17.0, 13.0, 23.0, 35.0, 29.0, 34.0, 34.0, 34.0, 40.0, 40.0, 53.0, 60.0, 55.0, 52.0, 51.0, 41.0, 43.0, 37.0, 49.0, 38.0, 21.0, 29.0, 25.0, 21.0, 7.0, 14.0, 13.0, 10.0, 10.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.609375, -26.7568359375, -25.904296875, -25.0517578125, -24.19921875, -23.3466796875, -22.494140625, -21.6416015625, -20.7890625, -19.9365234375, -19.083984375, -18.2314453125, -17.37890625, -16.5263671875, -15.673828125, -14.8212890625, -13.96875, -13.1162109375, -12.263671875, -11.4111328125, -10.55859375, -9.7060546875, -8.853515625, -8.0009765625, -7.1484375, -6.2958984375, -5.443359375, -4.5908203125, -3.73828125, -2.8857421875, -2.033203125, -1.1806640625, -0.328125, 0.5244140625, 1.376953125, 2.2294921875, 3.08203125, 3.9345703125, 4.787109375, 5.6396484375, 6.4921875, 7.3447265625, 8.197265625, 9.0498046875, 9.90234375, 10.7548828125, 11.607421875, 12.4599609375, 13.3125, 14.1650390625, 15.017578125, 15.8701171875, 16.72265625, 17.5751953125, 18.427734375, 19.2802734375, 20.1328125, 20.9853515625, 21.837890625, 22.6904296875, 23.54296875, 24.3955078125, 25.248046875, 26.1005859375, 26.953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 14.0, 17.0, 26.0, 45.0, 89.0, 135.0, 339.0, 781.0, 2145.0, 6073.0, 20639.0, 79764.0, 390713.0, 427740.0, 87528.0, 22209.0, 6541.0, 2131.0, 858.0, 376.0, 167.0, 78.0, 51.0, 38.0, 13.0, 9.0, 12.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.375, -11.9761962890625, -11.577392578125, -11.1785888671875, -10.77978515625, -10.3809814453125, -9.982177734375, -9.5833740234375, -9.1845703125, -8.7857666015625, -8.386962890625, -7.9881591796875, -7.58935546875, -7.1905517578125, -6.791748046875, -6.3929443359375, -5.994140625, -5.5953369140625, -5.196533203125, -4.7977294921875, -4.39892578125, -4.0001220703125, -3.601318359375, -3.2025146484375, -2.8037109375, -2.4049072265625, -2.006103515625, -1.6072998046875, -1.20849609375, -0.8096923828125, -0.410888671875, -0.0120849609375, 0.38671875, 0.7855224609375, 1.184326171875, 1.5831298828125, 1.98193359375, 2.3807373046875, 2.779541015625, 3.1783447265625, 3.5771484375, 3.9759521484375, 4.374755859375, 4.7735595703125, 5.17236328125, 5.5711669921875, 5.969970703125, 6.3687744140625, 6.767578125, 7.1663818359375, 7.565185546875, 7.9639892578125, 8.36279296875, 8.7615966796875, 9.160400390625, 9.5592041015625, 9.9580078125, 10.3568115234375, 10.755615234375, 11.1544189453125, 11.55322265625, 11.9520263671875, 12.350830078125, 12.7496337890625, 13.1484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 6.0, 14.0, 10.0, 25.0, 23.0, 23.0, 22.0, 27.0, 57.0, 72.0, 92.0, 117.0, 132.0, 89.0, 60.0, 43.0, 41.0, 28.0, 17.0, 17.0, 15.0, 15.0, 7.0, 2.0, 3.0, 6.0, 4.0, 9.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015287399291992188, -0.0014649778604507446, -0.0014012157917022705, -0.0013374537229537964, -0.0012736916542053223, -0.0012099295854568481, -0.001146167516708374, -0.0010824054479599, -0.0010186433792114258, -0.0009548813104629517, -0.0008911192417144775, -0.0008273571729660034, -0.0007635951042175293, -0.0006998330354690552, -0.0006360709667205811, -0.0005723088979721069, -0.0005085468292236328, -0.0004447847604751587, -0.00038102269172668457, -0.00031726062297821045, -0.00025349855422973633, -0.0001897364854812622, -0.00012597441673278809, -6.221234798431396e-05, 1.5497207641601562e-06, 6.531178951263428e-05, 0.0001290738582611084, 0.00019283592700958252, 0.00025659799575805664, 0.00032036006450653076, 0.0003841221332550049, 0.000447884202003479, 0.0005116462707519531, 0.0005754083395004272, 0.0006391704082489014, 0.0007029324769973755, 0.0007666945457458496, 0.0008304566144943237, 0.0008942186832427979, 0.000957980751991272, 0.001021742820739746, 0.0010855048894882202, 0.0011492669582366943, 0.0012130290269851685, 0.0012767910957336426, 0.0013405531644821167, 0.0014043152332305908, 0.001468077301979065, 0.001531839370727539, 0.0015956014394760132, 0.0016593635082244873, 0.0017231255769729614, 0.0017868876457214355, 0.0018506497144699097, 0.0019144117832183838, 0.001978173851966858, 0.002041935920715332, 0.002105697989463806, 0.0021694600582122803, 0.0022332221269607544, 0.0022969841957092285, 0.0023607462644577026, 0.0024245083332061768, 0.002488270401954651, 0.002552032470703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 9.0, 12.0, 34.0, 44.0, 63.0, 101.0, 208.0, 409.0, 862.0, 2255.0, 8471.0, 44792.0, 311958.0, 564835.0, 92587.0, 15821.0, 3727.0, 1217.0, 523.0, 231.0, 167.0, 79.0, 45.0, 35.0, 32.0, 14.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.24560546875, -16.7099609375, -16.17431640625, -15.638671875, -15.10302734375, -14.5673828125, -14.03173828125, -13.49609375, -12.96044921875, -12.4248046875, -11.88916015625, -11.353515625, -10.81787109375, -10.2822265625, -9.74658203125, -9.2109375, -8.67529296875, -8.1396484375, -7.60400390625, -7.068359375, -6.53271484375, -5.9970703125, -5.46142578125, -4.92578125, -4.39013671875, -3.8544921875, -3.31884765625, -2.783203125, -2.24755859375, -1.7119140625, -1.17626953125, -0.640625, -0.10498046875, 0.4306640625, 0.96630859375, 1.501953125, 2.03759765625, 2.5732421875, 3.10888671875, 3.64453125, 4.18017578125, 4.7158203125, 5.25146484375, 5.787109375, 6.32275390625, 6.8583984375, 7.39404296875, 7.9296875, 8.46533203125, 9.0009765625, 9.53662109375, 10.072265625, 10.60791015625, 11.1435546875, 11.67919921875, 12.21484375, 12.75048828125, 13.2861328125, 13.82177734375, 14.357421875, 14.89306640625, 15.4287109375, 15.96435546875, 16.5]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 19.0, 21.0, 27.0, 49.0, 73.0, 97.0, 105.0, 132.0, 139.0, 116.0, 80.0, 44.0, 37.0, 30.0, 18.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.484375, -24.927490234375, -24.37060546875, -23.813720703125, -23.2568359375, -22.699951171875, -22.14306640625, -21.586181640625, -21.029296875, -20.472412109375, -19.91552734375, -19.358642578125, -18.8017578125, -18.244873046875, -17.68798828125, -17.131103515625, -16.57421875, -16.017333984375, -15.46044921875, -14.903564453125, -14.3466796875, -13.789794921875, -13.23291015625, -12.676025390625, -12.119140625, -11.562255859375, -11.00537109375, -10.448486328125, -9.8916015625, -9.334716796875, -8.77783203125, -8.220947265625, -7.6640625, -7.107177734375, -6.55029296875, -5.993408203125, -5.4365234375, -4.879638671875, -4.32275390625, -3.765869140625, -3.208984375, -2.652099609375, -2.09521484375, -1.538330078125, -0.9814453125, -0.424560546875, 0.13232421875, 0.689208984375, 1.24609375, 1.802978515625, 2.35986328125, 2.916748046875, 3.4736328125, 4.030517578125, 4.58740234375, 5.144287109375, 5.701171875, 6.258056640625, 6.81494140625, 7.371826171875, 7.9287109375, 8.485595703125, 9.04248046875, 9.599365234375, 10.15625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 18.0, 30.0, 40.0, 72.0, 96.0, 116.0, 153.0, 147.0, 86.0, 79.0, 58.0, 35.0, 23.0, 13.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-294.32867431640625, -288.0148010253906, -281.700927734375, -275.3870544433594, -269.07318115234375, -262.7593078613281, -256.4454345703125, -250.1315460205078, -243.8176727294922, -237.50379943847656, -231.18992614746094, -224.8760528564453, -218.5621795654297, -212.248291015625, -205.93441772460938, -199.62054443359375, -193.30667114257812, -186.9927978515625, -180.67892456054688, -174.36505126953125, -168.05117797851562, -161.7373046875, -155.42343139648438, -149.1095428466797, -142.79568481445312, -136.4818115234375, -130.16793823242188, -123.85406494140625, -117.5401840209961, -111.22631072998047, -104.91243743896484, -98.59855651855469, -92.28468322753906, -85.97080993652344, -79.65693664550781, -73.34306335449219, -67.02918243408203, -60.715309143066406, -54.40143585205078, -48.08755874633789, -41.773685455322266, -35.45981216430664, -29.14593505859375, -22.832061767578125, -16.518186569213867, -10.20431137084961, -3.8904380798339844, 2.4234390258789062, 8.737312316894531, 15.051187515258789, 21.365062713623047, 27.678936004638672, 33.99281311035156, 40.30668640136719, 46.62055969238281, 52.9344367980957, 59.24831008911133, 65.56218719482422, 71.87606048583984, 78.18993377685547, 84.5038070678711, 90.81768798828125, 97.13156127929688, 103.4454345703125, 109.75930786132812]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 8.0, 10.0, 9.0, 24.0, 18.0, 18.0, 22.0, 28.0, 31.0, 34.0, 49.0, 39.0, 34.0, 44.0, 32.0, 55.0, 42.0, 53.0, 40.0, 47.0, 47.0, 39.0, 40.0, 35.0, 28.0, 21.0, 21.0, 16.0, 16.0, 10.0, 17.0, 13.0, 9.0, 6.0, 8.0, 4.0, 5.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-133.0745849609375, -128.9332275390625, -124.79186248779297, -120.65050506591797, -116.50914001464844, -112.36778259277344, -108.22642517089844, -104.08506774902344, -99.9437026977539, -95.8023452758789, -91.66098022460938, -87.51962280273438, -83.37826538085938, -79.23690032958984, -75.09554290771484, -70.95417785644531, -66.81282043457031, -62.67145919799805, -58.53009796142578, -54.38874053955078, -50.247379302978516, -46.10601806640625, -41.96466064453125, -37.823299407958984, -33.68193817138672, -29.540576934814453, -25.39921760559082, -21.257858276367188, -17.116497039794922, -12.975135803222656, -8.833776473999023, -4.692417144775391, -0.551055908203125, 3.590304374694824, 7.731664657592773, 11.873024940490723, 16.014385223388672, 20.155746459960938, 24.29710578918457, 28.438465118408203, 32.57982635498047, 36.721187591552734, 40.862548828125, 45.00390625, 49.145267486572266, 53.28662872314453, 57.42798614501953, 61.5693473815918, 65.71070861816406, 69.85206604003906, 73.9934310913086, 78.1347885131836, 82.27615356445312, 86.41751098632812, 90.55886840820312, 94.70022583007812, 98.84159088134766, 102.98294830322266, 107.12431335449219, 111.26567077636719, 115.40702819824219, 119.54839324951172, 123.68975067138672, 127.83111572265625, 131.97247314453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 3.0, 14.0, 19.0, 42.0, 52.0, 68.0, 107.0, 156.0, 215.0, 377.0, 597.0, 1003.0, 1843.0, 3618.0, 8034.0, 20951.0, 65184.0, 288100.0, 3277238.0, 402636.0, 81518.0, 24644.0, 9131.0, 3936.0, 1935.0, 1016.0, 569.0, 375.0, 249.0, 173.0, 113.0, 77.0, 76.0, 45.0, 41.0, 27.0, 22.0, 28.0, 18.0, 9.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.3125, -34.99609375, -33.6796875, -32.36328125, -31.046875, -29.73046875, -28.4140625, -27.09765625, -25.78125, -24.46484375, -23.1484375, -21.83203125, -20.515625, -19.19921875, -17.8828125, -16.56640625, -15.25, -13.93359375, -12.6171875, -11.30078125, -9.984375, -8.66796875, -7.3515625, -6.03515625, -4.71875, -3.40234375, -2.0859375, -0.76953125, 0.546875, 1.86328125, 3.1796875, 4.49609375, 5.8125, 7.12890625, 8.4453125, 9.76171875, 11.078125, 12.39453125, 13.7109375, 15.02734375, 16.34375, 17.66015625, 18.9765625, 20.29296875, 21.609375, 22.92578125, 24.2421875, 25.55859375, 26.875, 28.19140625, 29.5078125, 30.82421875, 32.140625, 33.45703125, 34.7734375, 36.08984375, 37.40625, 38.72265625, 40.0390625, 41.35546875, 42.671875, 43.98828125, 45.3046875, 46.62109375, 47.9375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 10.0, 6.0, 16.0, 20.0, 29.0, 19.0, 39.0, 52.0, 76.0, 62.0, 73.0, 78.0, 65.0, 86.0, 81.0, 54.0, 42.0, 56.0, 35.0, 26.0, 15.0, 19.0, 14.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.386474609375, -8.07763671875, -7.768798828125, -7.4599609375, -7.151123046875, -6.84228515625, -6.533447265625, -6.224609375, -5.915771484375, -5.60693359375, -5.298095703125, -4.9892578125, -4.680419921875, -4.37158203125, -4.062744140625, -3.75390625, -3.445068359375, -3.13623046875, -2.827392578125, -2.5185546875, -2.209716796875, -1.90087890625, -1.592041015625, -1.283203125, -0.974365234375, -0.66552734375, -0.356689453125, -0.0478515625, 0.260986328125, 0.56982421875, 0.878662109375, 1.1875, 1.496337890625, 1.80517578125, 2.114013671875, 2.4228515625, 2.731689453125, 3.04052734375, 3.349365234375, 3.658203125, 3.967041015625, 4.27587890625, 4.584716796875, 4.8935546875, 5.202392578125, 5.51123046875, 5.820068359375, 6.12890625, 6.437744140625, 6.74658203125, 7.055419921875, 7.3642578125, 7.673095703125, 7.98193359375, 8.290771484375, 8.599609375, 8.908447265625, 9.21728515625, 9.526123046875, 9.8349609375, 10.143798828125, 10.45263671875, 10.761474609375, 11.0703125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 7.0, 8.0, 15.0, 15.0, 25.0, 36.0, 51.0, 49.0, 65.0, 92.0, 129.0, 197.0, 322.0, 533.0, 1119.0, 3519.0, 16001.0, 113731.0, 2854035.0, 1110489.0, 76723.0, 11887.0, 2822.0, 973.0, 480.0, 257.0, 200.0, 134.0, 98.0, 62.0, 56.0, 47.0, 23.0, 16.0, 13.0, 11.0, 13.0, 11.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-54.5625, -52.99951171875, -51.4365234375, -49.87353515625, -48.310546875, -46.74755859375, -45.1845703125, -43.62158203125, -42.05859375, -40.49560546875, -38.9326171875, -37.36962890625, -35.806640625, -34.24365234375, -32.6806640625, -31.11767578125, -29.5546875, -27.99169921875, -26.4287109375, -24.86572265625, -23.302734375, -21.73974609375, -20.1767578125, -18.61376953125, -17.05078125, -15.48779296875, -13.9248046875, -12.36181640625, -10.798828125, -9.23583984375, -7.6728515625, -6.10986328125, -4.546875, -2.98388671875, -1.4208984375, 0.14208984375, 1.705078125, 3.26806640625, 4.8310546875, 6.39404296875, 7.95703125, 9.52001953125, 11.0830078125, 12.64599609375, 14.208984375, 15.77197265625, 17.3349609375, 18.89794921875, 20.4609375, 22.02392578125, 23.5869140625, 25.14990234375, 26.712890625, 28.27587890625, 29.8388671875, 31.40185546875, 32.96484375, 34.52783203125, 36.0908203125, 37.65380859375, 39.216796875, 40.77978515625, 42.3427734375, 43.90576171875, 45.46875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 12.0, 27.0, 54.0, 166.0, 563.0, 2286.0, 618.0, 219.0, 75.0, 31.0, 11.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.1875, -37.90283203125, -36.6181640625, -35.33349609375, -34.048828125, -32.76416015625, -31.4794921875, -30.19482421875, -28.91015625, -27.62548828125, -26.3408203125, -25.05615234375, -23.771484375, -22.48681640625, -21.2021484375, -19.91748046875, -18.6328125, -17.34814453125, -16.0634765625, -14.77880859375, -13.494140625, -12.20947265625, -10.9248046875, -9.64013671875, -8.35546875, -7.07080078125, -5.7861328125, -4.50146484375, -3.216796875, -1.93212890625, -0.6474609375, 0.63720703125, 1.921875, 3.20654296875, 4.4912109375, 5.77587890625, 7.060546875, 8.34521484375, 9.6298828125, 10.91455078125, 12.19921875, 13.48388671875, 14.7685546875, 16.05322265625, 17.337890625, 18.62255859375, 19.9072265625, 21.19189453125, 22.4765625, 23.76123046875, 25.0458984375, 26.33056640625, 27.615234375, 28.89990234375, 30.1845703125, 31.46923828125, 32.75390625, 34.03857421875, 35.3232421875, 36.60791015625, 37.892578125, 39.17724609375, 40.4619140625, 41.74658203125, 43.03125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 22.0, 100.0, 194.0, 230.0, 216.0, 122.0, 55.0, 36.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.0732727050781, -260.47442626953125, -252.87559509277344, -245.27674865722656, -237.6779022216797, -230.07907104492188, -222.480224609375, -214.88137817382812, -207.28253173828125, -199.68368530273438, -192.08485412597656, -184.4860076904297, -176.8871612548828, -169.288330078125, -161.68948364257812, -154.09063720703125, -146.49180603027344, -138.89295959472656, -131.29412841796875, -123.69528198242188, -116.096435546875, -108.49759674072266, -100.89875793457031, -93.29991149902344, -85.7010726928711, -78.10223388671875, -70.50338745117188, -62.90454864501953, -55.30570602416992, -47.70686340332031, -40.10802459716797, -32.50918197631836, -24.910354614257812, -17.311511993408203, -9.712671279907227, -2.11383056640625, 5.485012054443359, 13.083854675292969, 20.682693481445312, 28.281536102294922, 35.88037872314453, 43.47922134399414, 51.07806396484375, 58.676902770996094, 66.27574157714844, 73.87458801269531, 81.47342681884766, 89.072265625, 96.67111206054688, 104.26995086669922, 111.8687973022461, 119.46763610839844, 127.06648254394531, 134.66531372070312, 142.26416015625, 149.86300659179688, 157.46185302734375, 165.06069946289062, 172.65953063964844, 180.2583770751953, 187.8572235107422, 195.4560546875, 203.05490112304688, 210.65374755859375, 218.25257873535156]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 5.0, 18.0, 16.0, 16.0, 26.0, 30.0, 31.0, 32.0, 58.0, 53.0, 45.0, 69.0, 59.0, 62.0, 59.0, 57.0, 49.0, 54.0, 45.0, 37.0, 28.0, 33.0, 26.0, 17.0, 16.0, 17.0, 8.0, 7.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.58464050292969, -78.99730682373047, -76.40998077392578, -73.82264709472656, -71.23532104492188, -68.64798736572266, -66.06065368652344, -63.47332763671875, -60.88599395751953, -58.29866409301758, -55.711334228515625, -53.124000549316406, -50.53667068481445, -47.9493408203125, -45.36201095581055, -42.774681091308594, -40.18735122680664, -37.60002136230469, -35.012691497802734, -32.42536163330078, -29.838027954101562, -27.25069808959961, -24.663368225097656, -22.07603645324707, -19.488706588745117, -16.901376724243164, -14.314044952392578, -11.726715087890625, -9.139384269714355, -6.552053451538086, -3.964723587036133, -1.3773918151855469, 1.2099380493164062, 3.7972686290740967, 6.384599208831787, 8.971929550170898, 11.559260368347168, 14.146591186523438, 16.73392105102539, 19.321252822875977, 21.90858268737793, 24.495912551879883, 27.08324432373047, 29.670574188232422, 32.257904052734375, 34.845237731933594, 37.43256378173828, 40.0198974609375, 42.60722732543945, 45.194557189941406, 47.78188705444336, 50.36921691894531, 52.95655059814453, 55.543880462646484, 58.13121032714844, 60.718544006347656, 63.305870056152344, 65.89320373535156, 68.48052978515625, 71.06786346435547, 73.65518951416016, 76.24252319335938, 78.82984924316406, 81.41718292236328, 84.0045166015625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 9.0, 8.0, 7.0, 12.0, 29.0, 30.0, 53.0, 91.0, 119.0, 237.0, 391.0, 747.0, 1712.0, 4204.0, 13426.0, 55198.0, 269865.0, 514934.0, 143085.0, 30768.0, 8171.0, 2808.0, 1260.0, 610.0, 300.0, 175.0, 115.0, 61.0, 37.0, 40.0, 14.0, 11.0, 9.0, 7.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.205078125, -34.87890625, -33.552734375, -32.2265625, -30.900390625, -29.57421875, -28.248046875, -26.921875, -25.595703125, -24.26953125, -22.943359375, -21.6171875, -20.291015625, -18.96484375, -17.638671875, -16.3125, -14.986328125, -13.66015625, -12.333984375, -11.0078125, -9.681640625, -8.35546875, -7.029296875, -5.703125, -4.376953125, -3.05078125, -1.724609375, -0.3984375, 0.927734375, 2.25390625, 3.580078125, 4.90625, 6.232421875, 7.55859375, 8.884765625, 10.2109375, 11.537109375, 12.86328125, 14.189453125, 15.515625, 16.841796875, 18.16796875, 19.494140625, 20.8203125, 22.146484375, 23.47265625, 24.798828125, 26.125, 27.451171875, 28.77734375, 30.103515625, 31.4296875, 32.755859375, 34.08203125, 35.408203125, 36.734375, 38.060546875, 39.38671875, 40.712890625, 42.0390625, 43.365234375, 44.69140625, 46.017578125, 47.34375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 4.0, 8.0, 20.0, 21.0, 31.0, 37.0, 32.0, 54.0, 57.0, 60.0, 74.0, 70.0, 86.0, 79.0, 67.0, 62.0, 42.0, 45.0, 27.0, 30.0, 24.0, 18.0, 12.0, 9.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.6712646484375, -8.350341796875, -8.0294189453125, -7.70849609375, -7.3875732421875, -7.066650390625, -6.7457275390625, -6.4248046875, -6.1038818359375, -5.782958984375, -5.4620361328125, -5.14111328125, -4.8201904296875, -4.499267578125, -4.1783447265625, -3.857421875, -3.5364990234375, -3.215576171875, -2.8946533203125, -2.57373046875, -2.2528076171875, -1.931884765625, -1.6109619140625, -1.2900390625, -0.9691162109375, -0.648193359375, -0.3272705078125, -0.00634765625, 0.3145751953125, 0.635498046875, 0.9564208984375, 1.27734375, 1.5982666015625, 1.919189453125, 2.2401123046875, 2.56103515625, 2.8819580078125, 3.202880859375, 3.5238037109375, 3.8447265625, 4.1656494140625, 4.486572265625, 4.8074951171875, 5.12841796875, 5.4493408203125, 5.770263671875, 6.0911865234375, 6.412109375, 6.7330322265625, 7.053955078125, 7.3748779296875, 7.69580078125, 8.0167236328125, 8.337646484375, 8.6585693359375, 8.9794921875, 9.3004150390625, 9.621337890625, 9.9422607421875, 10.26318359375, 10.5841064453125, 10.905029296875, 11.2259521484375, 11.546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 18.0, 11.0, 26.0, 34.0, 63.0, 86.0, 148.0, 197.0, 321.0, 489.0, 923.0, 1886.0, 4660.0, 15092.0, 58549.0, 280797.0, 511765.0, 129135.0, 29636.0, 8566.0, 3003.0, 1394.0, 649.0, 375.0, 250.0, 163.0, 103.0, 61.0, 39.0, 30.0, 26.0, 13.0, 8.0, 8.0, 5.0, 3.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.28125, -32.309814453125, -31.33837890625, -30.366943359375, -29.3955078125, -28.424072265625, -27.45263671875, -26.481201171875, -25.509765625, -24.538330078125, -23.56689453125, -22.595458984375, -21.6240234375, -20.652587890625, -19.68115234375, -18.709716796875, -17.73828125, -16.766845703125, -15.79541015625, -14.823974609375, -13.8525390625, -12.881103515625, -11.90966796875, -10.938232421875, -9.966796875, -8.995361328125, -8.02392578125, -7.052490234375, -6.0810546875, -5.109619140625, -4.13818359375, -3.166748046875, -2.1953125, -1.223876953125, -0.25244140625, 0.718994140625, 1.6904296875, 2.661865234375, 3.63330078125, 4.604736328125, 5.576171875, 6.547607421875, 7.51904296875, 8.490478515625, 9.4619140625, 10.433349609375, 11.40478515625, 12.376220703125, 13.34765625, 14.319091796875, 15.29052734375, 16.261962890625, 17.2333984375, 18.204833984375, 19.17626953125, 20.147705078125, 21.119140625, 22.090576171875, 23.06201171875, 24.033447265625, 25.0048828125, 25.976318359375, 26.94775390625, 27.919189453125, 28.890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 13.0, 10.0, 9.0, 24.0, 27.0, 27.0, 56.0, 52.0, 63.0, 67.0, 69.0, 77.0, 71.0, 73.0, 65.0, 65.0, 58.0, 40.0, 37.0, 22.0, 19.0, 14.0, 12.0, 6.0, 7.0, 3.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.90625, -49.4580078125, -48.009765625, -46.5615234375, -45.11328125, -43.6650390625, -42.216796875, -40.7685546875, -39.3203125, -37.8720703125, -36.423828125, -34.9755859375, -33.52734375, -32.0791015625, -30.630859375, -29.1826171875, -27.734375, -26.2861328125, -24.837890625, -23.3896484375, -21.94140625, -20.4931640625, -19.044921875, -17.5966796875, -16.1484375, -14.7001953125, -13.251953125, -11.8037109375, -10.35546875, -8.9072265625, -7.458984375, -6.0107421875, -4.5625, -3.1142578125, -1.666015625, -0.2177734375, 1.23046875, 2.6787109375, 4.126953125, 5.5751953125, 7.0234375, 8.4716796875, 9.919921875, 11.3681640625, 12.81640625, 14.2646484375, 15.712890625, 17.1611328125, 18.609375, 20.0576171875, 21.505859375, 22.9541015625, 24.40234375, 25.8505859375, 27.298828125, 28.7470703125, 30.1953125, 31.6435546875, 33.091796875, 34.5400390625, 35.98828125, 37.4365234375, 38.884765625, 40.3330078125, 41.78125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 11.0, 20.0, 28.0, 50.0, 70.0, 131.0, 273.0, 492.0, 1127.0, 3129.0, 10531.0, 46155.0, 211390.0, 493313.0, 217507.0, 47823.0, 11025.0, 3174.0, 1121.0, 515.0, 289.0, 153.0, 77.0, 43.0, 26.0, 26.0, 16.0, 12.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.90625, -11.5028076171875, -11.099365234375, -10.6959228515625, -10.29248046875, -9.8890380859375, -9.485595703125, -9.0821533203125, -8.6787109375, -8.2752685546875, -7.871826171875, -7.4683837890625, -7.06494140625, -6.6614990234375, -6.258056640625, -5.8546142578125, -5.451171875, -5.0477294921875, -4.644287109375, -4.2408447265625, -3.83740234375, -3.4339599609375, -3.030517578125, -2.6270751953125, -2.2236328125, -1.8201904296875, -1.416748046875, -1.0133056640625, -0.60986328125, -0.2064208984375, 0.197021484375, 0.6004638671875, 1.00390625, 1.4073486328125, 1.810791015625, 2.2142333984375, 2.61767578125, 3.0211181640625, 3.424560546875, 3.8280029296875, 4.2314453125, 4.6348876953125, 5.038330078125, 5.4417724609375, 5.84521484375, 6.2486572265625, 6.652099609375, 7.0555419921875, 7.458984375, 7.8624267578125, 8.265869140625, 8.6693115234375, 9.07275390625, 9.4761962890625, 9.879638671875, 10.2830810546875, 10.6865234375, 11.0899658203125, 11.493408203125, 11.8968505859375, 12.30029296875, 12.7037353515625, 13.107177734375, 13.5106201171875, 13.9140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 9.0, 5.0, 6.0, 4.0, 16.0, 11.0, 22.0, 34.0, 48.0, 57.0, 68.0, 87.0, 101.0, 105.0, 99.0, 82.0, 62.0, 45.0, 33.0, 33.0, 17.0, 17.0, 19.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0024433135986328125, -0.002375677227973938, -0.0023080408573150635, -0.002240404486656189, -0.0021727681159973145, -0.00210513174533844, -0.0020374953746795654, -0.001969859004020691, -0.0019022226333618164, -0.001834586262702942, -0.0017669498920440674, -0.0016993135213851929, -0.0016316771507263184, -0.0015640407800674438, -0.0014964044094085693, -0.0014287680387496948, -0.0013611316680908203, -0.0012934952974319458, -0.0012258589267730713, -0.0011582225561141968, -0.0010905861854553223, -0.0010229498147964478, -0.0009553134441375732, -0.0008876770734786987, -0.0008200407028198242, -0.0007524043321609497, -0.0006847679615020752, -0.0006171315908432007, -0.0005494952201843262, -0.00048185884952545166, -0.00041422247886657715, -0.00034658610820770264, -0.0002789497375488281, -0.0002113133668899536, -0.0001436769962310791, -7.604062557220459e-05, -8.404254913330078e-06, 5.9232115745544434e-05, 0.00012686848640441895, 0.00019450485706329346, 0.00026214122772216797, 0.0003297775983810425, 0.000397413969039917, 0.0004650503396987915, 0.000532686710357666, 0.0006003230810165405, 0.000667959451675415, 0.0007355958223342896, 0.0008032321929931641, 0.0008708685636520386, 0.0009385049343109131, 0.0010061413049697876, 0.0010737776756286621, 0.0011414140462875366, 0.0012090504169464111, 0.0012766867876052856, 0.0013443231582641602, 0.0014119595289230347, 0.0014795958995819092, 0.0015472322702407837, 0.0016148686408996582, 0.0016825050115585327, 0.0017501413822174072, 0.0018177777528762817, 0.0018854141235351562]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 12.0, 11.0, 27.0, 42.0, 68.0, 105.0, 193.0, 402.0, 834.0, 2343.0, 8385.0, 49269.0, 328292.0, 530738.0, 105891.0, 15986.0, 3665.0, 1222.0, 528.0, 245.0, 131.0, 66.0, 31.0, 25.0, 17.0, 6.0, 3.0, 1.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.75, -19.218994140625, -18.68798828125, -18.156982421875, -17.6259765625, -17.094970703125, -16.56396484375, -16.032958984375, -15.501953125, -14.970947265625, -14.43994140625, -13.908935546875, -13.3779296875, -12.846923828125, -12.31591796875, -11.784912109375, -11.25390625, -10.722900390625, -10.19189453125, -9.660888671875, -9.1298828125, -8.598876953125, -8.06787109375, -7.536865234375, -7.005859375, -6.474853515625, -5.94384765625, -5.412841796875, -4.8818359375, -4.350830078125, -3.81982421875, -3.288818359375, -2.7578125, -2.226806640625, -1.69580078125, -1.164794921875, -0.6337890625, -0.102783203125, 0.42822265625, 0.959228515625, 1.490234375, 2.021240234375, 2.55224609375, 3.083251953125, 3.6142578125, 4.145263671875, 4.67626953125, 5.207275390625, 5.73828125, 6.269287109375, 6.80029296875, 7.331298828125, 7.8623046875, 8.393310546875, 8.92431640625, 9.455322265625, 9.986328125, 10.517333984375, 11.04833984375, 11.579345703125, 12.1103515625, 12.641357421875, 13.17236328125, 13.703369140625, 14.234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 7.0, 11.0, 14.0, 25.0, 21.0, 27.0, 46.0, 45.0, 57.0, 65.0, 74.0, 87.0, 86.0, 80.0, 82.0, 66.0, 46.0, 44.0, 24.0, 23.0, 22.0, 10.0, 11.0, 8.0, 6.0, 3.0, 6.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.765625, -15.3804931640625, -14.995361328125, -14.6102294921875, -14.22509765625, -13.8399658203125, -13.454833984375, -13.0697021484375, -12.6845703125, -12.2994384765625, -11.914306640625, -11.5291748046875, -11.14404296875, -10.7589111328125, -10.373779296875, -9.9886474609375, -9.603515625, -9.2183837890625, -8.833251953125, -8.4481201171875, -8.06298828125, -7.6778564453125, -7.292724609375, -6.9075927734375, -6.5224609375, -6.1373291015625, -5.752197265625, -5.3670654296875, -4.98193359375, -4.5968017578125, -4.211669921875, -3.8265380859375, -3.44140625, -3.0562744140625, -2.671142578125, -2.2860107421875, -1.90087890625, -1.5157470703125, -1.130615234375, -0.7454833984375, -0.3603515625, 0.0247802734375, 0.409912109375, 0.7950439453125, 1.18017578125, 1.5653076171875, 1.950439453125, 2.3355712890625, 2.720703125, 3.1058349609375, 3.490966796875, 3.8760986328125, 4.26123046875, 4.6463623046875, 5.031494140625, 5.4166259765625, 5.8017578125, 6.1868896484375, 6.572021484375, 6.9571533203125, 7.34228515625, 7.7274169921875, 8.112548828125, 8.4976806640625, 8.8828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 16.0, 27.0, 53.0, 150.0, 198.0, 237.0, 153.0, 92.0, 38.0, 22.0, 11.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-533.4025268554688, -522.0223388671875, -510.64215087890625, -499.2619934082031, -487.8818054199219, -476.5016174316406, -465.1214294433594, -453.74127197265625, -442.361083984375, -430.98089599609375, -419.6007080078125, -408.2205505371094, -396.8403625488281, -385.4601745605469, -374.0799865722656, -362.6998291015625, -351.31964111328125, -339.939453125, -328.55926513671875, -317.1791076660156, -305.7989196777344, -294.4187316894531, -283.0385437011719, -271.65838623046875, -260.2781677246094, -248.89797973632812, -237.51780700683594, -226.1376190185547, -214.7574462890625, -203.37725830078125, -191.9970703125, -180.6168975830078, -169.23672485351562, -157.85653686523438, -146.4763641357422, -135.09617614746094, -123.71600341796875, -112.3358154296875, -100.95563507080078, -89.57545471191406, -78.19527435302734, -66.81509399414062, -55.434913635253906, -44.05472946166992, -32.6745491027832, -21.294368743896484, -9.9141845703125, 1.4659957885742188, 12.846176147460938, 24.226356506347656, 35.606536865234375, 46.98672103881836, 58.36690139770508, 69.74708557128906, 81.12726593017578, 92.5074462890625, 103.88762664794922, 115.26780700683594, 126.64798736572266, 138.02816772460938, 149.40835571289062, 160.7885284423828, 172.16871643066406, 183.54888916015625, 194.9290771484375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 9.0, 10.0, 16.0, 15.0, 18.0, 11.0, 21.0, 26.0, 23.0, 32.0, 36.0, 31.0, 32.0, 46.0, 51.0, 44.0, 42.0, 50.0, 40.0, 32.0, 39.0, 43.0, 34.0, 33.0, 28.0, 25.0, 31.0, 24.0, 29.0, 17.0, 16.0, 11.0, 17.0, 11.0, 9.0, 14.0, 7.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0], "bins": [-155.40689086914062, -151.18545532226562, -146.9640350341797, -142.74261474609375, -138.52117919921875, -134.29974365234375, -130.0783233642578, -125.85689544677734, -121.63546752929688, -117.4140396118164, -113.19261169433594, -108.97118377685547, -104.749755859375, -100.52832794189453, -96.30690002441406, -92.0854721069336, -87.86404418945312, -83.64261627197266, -79.42118835449219, -75.19976043701172, -70.97833251953125, -66.75690460205078, -62.53547668457031, -58.314048767089844, -54.092620849609375, -49.871192932128906, -45.64976501464844, -41.42833709716797, -37.2069091796875, -32.98548126220703, -28.764053344726562, -24.542625427246094, -20.321197509765625, -16.099769592285156, -11.878341674804688, -7.656913757324219, -3.43548583984375, 0.7859420776367188, 5.0073699951171875, 9.228797912597656, 13.450225830078125, 17.671653747558594, 21.893081665039062, 26.11450958251953, 30.3359375, 34.55736541748047, 38.77879333496094, 43.000221252441406, 47.221649169921875, 51.443077087402344, 55.66450500488281, 59.88593292236328, 64.10736083984375, 68.32878875732422, 72.55021667480469, 76.77164459228516, 80.99307250976562, 85.2145004272461, 89.43592834472656, 93.65735626220703, 97.8787841796875, 102.10021209716797, 106.32164001464844, 110.5430679321289, 114.76449584960938]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 8.0, 13.0, 11.0, 16.0, 24.0, 48.0, 42.0, 65.0, 94.0, 151.0, 241.0, 421.0, 580.0, 1130.0, 2224.0, 4987.0, 13776.0, 61908.0, 3994759.0, 86150.0, 16382.0, 5662.0, 2518.0, 1253.0, 621.0, 424.0, 242.0, 164.0, 107.0, 47.0, 45.0, 32.0, 38.0, 23.0, 12.0, 12.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.59375, -52.68310546875, -50.7724609375, -48.86181640625, -46.951171875, -45.04052734375, -43.1298828125, -41.21923828125, -39.30859375, -37.39794921875, -35.4873046875, -33.57666015625, -31.666015625, -29.75537109375, -27.8447265625, -25.93408203125, -24.0234375, -22.11279296875, -20.2021484375, -18.29150390625, -16.380859375, -14.47021484375, -12.5595703125, -10.64892578125, -8.73828125, -6.82763671875, -4.9169921875, -3.00634765625, -1.095703125, 0.81494140625, 2.7255859375, 4.63623046875, 6.546875, 8.45751953125, 10.3681640625, 12.27880859375, 14.189453125, 16.10009765625, 18.0107421875, 19.92138671875, 21.83203125, 23.74267578125, 25.6533203125, 27.56396484375, 29.474609375, 31.38525390625, 33.2958984375, 35.20654296875, 37.1171875, 39.02783203125, 40.9384765625, 42.84912109375, 44.759765625, 46.67041015625, 48.5810546875, 50.49169921875, 52.40234375, 54.31298828125, 56.2236328125, 58.13427734375, 60.044921875, 61.95556640625, 63.8662109375, 65.77685546875, 67.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 14.0, 12.0, 12.0, 24.0, 20.0, 15.0, 26.0, 31.0, 45.0, 54.0, 52.0, 66.0, 75.0, 67.0, 80.0, 59.0, 69.0, 46.0, 52.0, 39.0, 39.0, 20.0, 22.0, 15.0, 12.0, 14.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.3966064453125, -10.043212890625, -9.6898193359375, -9.33642578125, -8.9830322265625, -8.629638671875, -8.2762451171875, -7.9228515625, -7.5694580078125, -7.216064453125, -6.8626708984375, -6.50927734375, -6.1558837890625, -5.802490234375, -5.4490966796875, -5.095703125, -4.7423095703125, -4.388916015625, -4.0355224609375, -3.68212890625, -3.3287353515625, -2.975341796875, -2.6219482421875, -2.2685546875, -1.9151611328125, -1.561767578125, -1.2083740234375, -0.85498046875, -0.5015869140625, -0.148193359375, 0.2052001953125, 0.55859375, 0.9119873046875, 1.265380859375, 1.6187744140625, 1.97216796875, 2.3255615234375, 2.678955078125, 3.0323486328125, 3.3857421875, 3.7391357421875, 4.092529296875, 4.4459228515625, 4.79931640625, 5.1527099609375, 5.506103515625, 5.8594970703125, 6.212890625, 6.5662841796875, 6.919677734375, 7.2730712890625, 7.62646484375, 7.9798583984375, 8.333251953125, 8.6866455078125, 9.0400390625, 9.3934326171875, 9.746826171875, 10.1002197265625, 10.45361328125, 10.8070068359375, 11.160400390625, 11.5137939453125, 11.8671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 12.0, 19.0, 25.0, 44.0, 65.0, 117.0, 181.0, 302.0, 490.0, 805.0, 1431.0, 2386.0, 4594.0, 9377.0, 21949.0, 70700.0, 3549525.0, 441991.0, 54236.0, 18287.0, 8235.0, 4132.0, 2214.0, 1235.0, 745.0, 452.0, 267.0, 166.0, 102.0, 59.0, 42.0, 28.0, 18.0, 16.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.224609375, -27.33984375, -26.455078125, -25.5703125, -24.685546875, -23.80078125, -22.916015625, -22.03125, -21.146484375, -20.26171875, -19.376953125, -18.4921875, -17.607421875, -16.72265625, -15.837890625, -14.953125, -14.068359375, -13.18359375, -12.298828125, -11.4140625, -10.529296875, -9.64453125, -8.759765625, -7.875, -6.990234375, -6.10546875, -5.220703125, -4.3359375, -3.451171875, -2.56640625, -1.681640625, -0.796875, 0.087890625, 0.97265625, 1.857421875, 2.7421875, 3.626953125, 4.51171875, 5.396484375, 6.28125, 7.166015625, 8.05078125, 8.935546875, 9.8203125, 10.705078125, 11.58984375, 12.474609375, 13.359375, 14.244140625, 15.12890625, 16.013671875, 16.8984375, 17.783203125, 18.66796875, 19.552734375, 20.4375, 21.322265625, 22.20703125, 23.091796875, 23.9765625, 24.861328125, 25.74609375, 26.630859375, 27.515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 9.0, 10.0, 2.0, 12.0, 12.0, 21.0, 40.0, 71.0, 132.0, 404.0, 2924.0, 168.0, 72.0, 63.0, 23.0, 29.0, 15.0, 9.0, 11.0, 6.0, 9.0, 8.0, 10.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.98046875, -5.7889404296875, -5.597412109375, -5.4058837890625, -5.21435546875, -5.0228271484375, -4.831298828125, -4.6397705078125, -4.4482421875, -4.2567138671875, -4.065185546875, -3.8736572265625, -3.68212890625, -3.4906005859375, -3.299072265625, -3.1075439453125, -2.916015625, -2.7244873046875, -2.532958984375, -2.3414306640625, -2.14990234375, -1.9583740234375, -1.766845703125, -1.5753173828125, -1.3837890625, -1.1922607421875, -1.000732421875, -0.8092041015625, -0.61767578125, -0.4261474609375, -0.234619140625, -0.0430908203125, 0.1484375, 0.3399658203125, 0.531494140625, 0.7230224609375, 0.91455078125, 1.1060791015625, 1.297607421875, 1.4891357421875, 1.6806640625, 1.8721923828125, 2.063720703125, 2.2552490234375, 2.44677734375, 2.6383056640625, 2.829833984375, 3.0213623046875, 3.212890625, 3.4044189453125, 3.595947265625, 3.7874755859375, 3.97900390625, 4.1705322265625, 4.362060546875, 4.5535888671875, 4.7451171875, 4.9366455078125, 5.128173828125, 5.3197021484375, 5.51123046875, 5.7027587890625, 5.894287109375, 6.0858154296875, 6.27734375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 12.0, 13.0, 33.0, 63.0, 101.0, 160.0, 159.0, 167.0, 124.0, 94.0, 36.0, 14.0, 19.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.821247100830078, -20.340980529785156, -18.860713958740234, -17.38044548034668, -15.900178909301758, -14.419912338256836, -12.939644813537598, -11.45937728881836, -9.979110717773438, -8.498844146728516, -7.018576622009277, -5.538309574127197, -4.058042526245117, -2.577775478363037, -1.097508430480957, 0.38275909423828125, 1.8630256652832031, 3.343292713165283, 4.823559761047363, 6.303826808929443, 7.784093856811523, 9.264360427856445, 10.744627952575684, 12.224895477294922, 13.705162048339844, 15.185428619384766, 16.665695190429688, 18.145963668823242, 19.626230239868164, 21.106496810913086, 22.58676528930664, 24.067031860351562, 25.54730224609375, 27.027568817138672, 28.507835388183594, 29.98810386657715, 31.46837043762207, 32.948638916015625, 34.42890548706055, 35.90917205810547, 37.38943862915039, 38.86970520019531, 40.349971771240234, 41.830238342285156, 43.310508728027344, 44.790775299072266, 46.27104187011719, 47.75130844116211, 49.23157501220703, 50.71184158325195, 52.192108154296875, 53.6723747253418, 55.15264129638672, 56.632911682128906, 58.11317825317383, 59.59344482421875, 61.07371139526367, 62.553977966308594, 64.03424835205078, 65.51451110839844, 66.99478149414062, 68.47504425048828, 69.95531463623047, 71.43557739257812, 72.91584777832031]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 7.0, 6.0, 11.0, 22.0, 13.0, 19.0, 15.0, 21.0, 26.0, 25.0, 37.0, 36.0, 35.0, 40.0, 40.0, 56.0, 36.0, 46.0, 40.0, 58.0, 32.0, 33.0, 35.0, 42.0, 38.0, 38.0, 25.0, 24.0, 29.0, 15.0, 12.0, 18.0, 12.0, 16.0, 4.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.061873435974121, -14.571001052856445, -14.080129623413086, -13.58925724029541, -13.098384857177734, -12.607513427734375, -12.1166410446167, -11.625768661499023, -11.134897232055664, -10.644024848937988, -10.153153419494629, -9.662281036376953, -9.171408653259277, -8.680536270141602, -8.189664840698242, -7.698792457580566, -7.207920074462891, -6.717048168182373, -6.226175785064697, -5.73530387878418, -5.244431495666504, -4.753559589385986, -4.262687683105469, -3.771815538406372, -3.2809433937072754, -2.7900712490081787, -2.299199104309082, -1.8083271980285645, -1.3174550533294678, -0.8265829086303711, -0.3357110023498535, 0.15516114234924316, 0.6460323333740234, 1.1369044780731201, 1.6277765035629272, 2.1186485290527344, 2.609520673751831, 3.1003928184509277, 3.5912647247314453, 4.082137107849121, 4.573009014129639, 5.063880920410156, 5.554753303527832, 6.04562520980835, 6.536497116088867, 7.027369499206543, 7.5182414054870605, 8.009113311767578, 8.499985694885254, 8.99085807800293, 9.481729507446289, 9.972601890563965, 10.46347427368164, 10.954345703125, 11.445218086242676, 11.936090469360352, 12.426961898803711, 12.917834281921387, 13.408705711364746, 13.899578094482422, 14.390450477600098, 14.881322860717773, 15.372194290161133, 15.863066673278809, 16.353939056396484]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 12.0, 14.0, 38.0, 39.0, 109.0, 150.0, 249.0, 477.0, 1059.0, 2420.0, 6828.0, 22608.0, 83682.0, 313563.0, 429174.0, 136043.0, 35465.0, 10477.0, 3481.0, 1266.0, 647.0, 313.0, 160.0, 89.0, 65.0, 33.0, 32.0, 18.0, 12.0, 8.0, 8.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -37.281982421875, -36.25146484375, -35.220947265625, -34.1904296875, -33.159912109375, -32.12939453125, -31.098876953125, -30.068359375, -29.037841796875, -28.00732421875, -26.976806640625, -25.9462890625, -24.915771484375, -23.88525390625, -22.854736328125, -21.82421875, -20.793701171875, -19.76318359375, -18.732666015625, -17.7021484375, -16.671630859375, -15.64111328125, -14.610595703125, -13.580078125, -12.549560546875, -11.51904296875, -10.488525390625, -9.4580078125, -8.427490234375, -7.39697265625, -6.366455078125, -5.3359375, -4.305419921875, -3.27490234375, -2.244384765625, -1.2138671875, -0.183349609375, 0.84716796875, 1.877685546875, 2.908203125, 3.938720703125, 4.96923828125, 5.999755859375, 7.0302734375, 8.060791015625, 9.09130859375, 10.121826171875, 11.15234375, 12.182861328125, 13.21337890625, 14.243896484375, 15.2744140625, 16.304931640625, 17.33544921875, 18.365966796875, 19.396484375, 20.427001953125, 21.45751953125, 22.488037109375, 23.5185546875, 24.549072265625, 25.57958984375, 26.610107421875, 27.640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 5.0, 17.0, 7.0, 7.0, 18.0, 16.0, 22.0, 23.0, 33.0, 37.0, 32.0, 54.0, 54.0, 47.0, 69.0, 60.0, 70.0, 65.0, 55.0, 47.0, 44.0, 47.0, 35.0, 29.0, 25.0, 17.0, 19.0, 11.0, 12.0, 4.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.4317626953125, -9.090087890625, -8.7484130859375, -8.40673828125, -8.0650634765625, -7.723388671875, -7.3817138671875, -7.0400390625, -6.6983642578125, -6.356689453125, -6.0150146484375, -5.67333984375, -5.3316650390625, -4.989990234375, -4.6483154296875, -4.306640625, -3.9649658203125, -3.623291015625, -3.2816162109375, -2.93994140625, -2.5982666015625, -2.256591796875, -1.9149169921875, -1.5732421875, -1.2315673828125, -0.889892578125, -0.5482177734375, -0.20654296875, 0.1351318359375, 0.476806640625, 0.8184814453125, 1.16015625, 1.5018310546875, 1.843505859375, 2.1851806640625, 2.52685546875, 2.8685302734375, 3.210205078125, 3.5518798828125, 3.8935546875, 4.2352294921875, 4.576904296875, 4.9185791015625, 5.26025390625, 5.6019287109375, 5.943603515625, 6.2852783203125, 6.626953125, 6.9686279296875, 7.310302734375, 7.6519775390625, 7.99365234375, 8.3353271484375, 8.677001953125, 9.0186767578125, 9.3603515625, 9.7020263671875, 10.043701171875, 10.3853759765625, 10.72705078125, 11.0687255859375, 11.410400390625, 11.7520751953125, 12.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 12.0, 18.0, 31.0, 35.0, 51.0, 107.0, 163.0, 248.0, 408.0, 705.0, 1337.0, 3571.0, 13932.0, 79777.0, 539730.0, 345493.0, 48394.0, 9225.0, 2643.0, 1149.0, 611.0, 357.0, 188.0, 139.0, 82.0, 42.0, 42.0, 21.0, 10.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-45.375, -44.20751953125, -43.0400390625, -41.87255859375, -40.705078125, -39.53759765625, -38.3701171875, -37.20263671875, -36.03515625, -34.86767578125, -33.7001953125, -32.53271484375, -31.365234375, -30.19775390625, -29.0302734375, -27.86279296875, -26.6953125, -25.52783203125, -24.3603515625, -23.19287109375, -22.025390625, -20.85791015625, -19.6904296875, -18.52294921875, -17.35546875, -16.18798828125, -15.0205078125, -13.85302734375, -12.685546875, -11.51806640625, -10.3505859375, -9.18310546875, -8.015625, -6.84814453125, -5.6806640625, -4.51318359375, -3.345703125, -2.17822265625, -1.0107421875, 0.15673828125, 1.32421875, 2.49169921875, 3.6591796875, 4.82666015625, 5.994140625, 7.16162109375, 8.3291015625, 9.49658203125, 10.6640625, 11.83154296875, 12.9990234375, 14.16650390625, 15.333984375, 16.50146484375, 17.6689453125, 18.83642578125, 20.00390625, 21.17138671875, 22.3388671875, 23.50634765625, 24.673828125, 25.84130859375, 27.0087890625, 28.17626953125, 29.34375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 9.0, 5.0, 9.0, 11.0, 20.0, 22.0, 25.0, 37.0, 45.0, 53.0, 57.0, 58.0, 74.0, 70.0, 58.0, 72.0, 71.0, 57.0, 73.0, 45.0, 37.0, 21.0, 19.0, 15.0, 8.0, 10.0, 5.0, 9.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.5, -43.7412109375, -41.982421875, -40.2236328125, -38.46484375, -36.7060546875, -34.947265625, -33.1884765625, -31.4296875, -29.6708984375, -27.912109375, -26.1533203125, -24.39453125, -22.6357421875, -20.876953125, -19.1181640625, -17.359375, -15.6005859375, -13.841796875, -12.0830078125, -10.32421875, -8.5654296875, -6.806640625, -5.0478515625, -3.2890625, -1.5302734375, 0.228515625, 1.9873046875, 3.74609375, 5.5048828125, 7.263671875, 9.0224609375, 10.78125, 12.5400390625, 14.298828125, 16.0576171875, 17.81640625, 19.5751953125, 21.333984375, 23.0927734375, 24.8515625, 26.6103515625, 28.369140625, 30.1279296875, 31.88671875, 33.6455078125, 35.404296875, 37.1630859375, 38.921875, 40.6806640625, 42.439453125, 44.1982421875, 45.95703125, 47.7158203125, 49.474609375, 51.2333984375, 52.9921875, 54.7509765625, 56.509765625, 58.2685546875, 60.02734375, 61.7861328125, 63.544921875, 65.3037109375, 67.0625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 24.0, 20.0, 48.0, 80.0, 141.0, 240.0, 594.0, 1889.0, 7727.0, 55964.0, 666447.0, 285193.0, 23915.0, 4171.0, 1212.0, 426.0, 190.0, 88.0, 52.0, 48.0, 25.0, 13.0, 7.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15625, -19.45654296875, -18.7568359375, -18.05712890625, -17.357421875, -16.65771484375, -15.9580078125, -15.25830078125, -14.55859375, -13.85888671875, -13.1591796875, -12.45947265625, -11.759765625, -11.06005859375, -10.3603515625, -9.66064453125, -8.9609375, -8.26123046875, -7.5615234375, -6.86181640625, -6.162109375, -5.46240234375, -4.7626953125, -4.06298828125, -3.36328125, -2.66357421875, -1.9638671875, -1.26416015625, -0.564453125, 0.13525390625, 0.8349609375, 1.53466796875, 2.234375, 2.93408203125, 3.6337890625, 4.33349609375, 5.033203125, 5.73291015625, 6.4326171875, 7.13232421875, 7.83203125, 8.53173828125, 9.2314453125, 9.93115234375, 10.630859375, 11.33056640625, 12.0302734375, 12.72998046875, 13.4296875, 14.12939453125, 14.8291015625, 15.52880859375, 16.228515625, 16.92822265625, 17.6279296875, 18.32763671875, 19.02734375, 19.72705078125, 20.4267578125, 21.12646484375, 21.826171875, 22.52587890625, 23.2255859375, 23.92529296875, 24.625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 7.0, 12.0, 19.0, 16.0, 25.0, 35.0, 42.0, 61.0, 57.0, 100.0, 90.0, 97.0, 100.0, 81.0, 66.0, 47.0, 29.0, 21.0, 16.0, 10.0, 5.0, 7.0, 8.0, 6.0, 7.0, 2.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0017881393432617188, -0.0017286986112594604, -0.0016692578792572021, -0.0016098171472549438, -0.0015503764152526855, -0.0014909356832504272, -0.001431494951248169, -0.0013720542192459106, -0.0013126134872436523, -0.001253172755241394, -0.0011937320232391357, -0.0011342912912368774, -0.0010748505592346191, -0.0010154098272323608, -0.0009559690952301025, -0.0008965283632278442, -0.0008370876312255859, -0.0007776468992233276, -0.0007182061672210693, -0.000658765435218811, -0.0005993247032165527, -0.0005398839712142944, -0.00048044323921203613, -0.00042100250720977783, -0.00036156177520751953, -0.00030212104320526123, -0.00024268031120300293, -0.00018323957920074463, -0.00012379884719848633, -6.435811519622803e-05, -4.9173831939697266e-06, 5.4523348808288574e-05, 0.00011396408081054688, 0.00017340481281280518, 0.00023284554481506348, 0.0002922862768173218, 0.0003517270088195801, 0.0004111677408218384, 0.0004706084728240967, 0.000530049204826355, 0.0005894899368286133, 0.0006489306688308716, 0.0007083714008331299, 0.0007678121328353882, 0.0008272528648376465, 0.0008866935968399048, 0.0009461343288421631, 0.0010055750608444214, 0.0010650157928466797, 0.001124456524848938, 0.0011838972568511963, 0.0012433379888534546, 0.0013027787208557129, 0.0013622194528579712, 0.0014216601848602295, 0.0014811009168624878, 0.001540541648864746, 0.0015999823808670044, 0.0016594231128692627, 0.001718863844871521, 0.0017783045768737793, 0.0018377453088760376, 0.001897186040878296, 0.001956626772880554, 0.0020160675048828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 8.0, 17.0, 18.0, 35.0, 60.0, 104.0, 236.0, 576.0, 1799.0, 9962.0, 183686.0, 807592.0, 38576.0, 4129.0, 985.0, 369.0, 183.0, 81.0, 47.0, 29.0, 22.0, 10.0, 3.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.38720703125, -18.4306640625, -17.47412109375, -16.517578125, -15.56103515625, -14.6044921875, -13.64794921875, -12.69140625, -11.73486328125, -10.7783203125, -9.82177734375, -8.865234375, -7.90869140625, -6.9521484375, -5.99560546875, -5.0390625, -4.08251953125, -3.1259765625, -2.16943359375, -1.212890625, -0.25634765625, 0.7001953125, 1.65673828125, 2.61328125, 3.56982421875, 4.5263671875, 5.48291015625, 6.439453125, 7.39599609375, 8.3525390625, 9.30908203125, 10.265625, 11.22216796875, 12.1787109375, 13.13525390625, 14.091796875, 15.04833984375, 16.0048828125, 16.96142578125, 17.91796875, 18.87451171875, 19.8310546875, 20.78759765625, 21.744140625, 22.70068359375, 23.6572265625, 24.61376953125, 25.5703125, 26.52685546875, 27.4833984375, 28.43994140625, 29.396484375, 30.35302734375, 31.3095703125, 32.26611328125, 33.22265625, 34.17919921875, 35.1357421875, 36.09228515625, 37.048828125, 38.00537109375, 38.9619140625, 39.91845703125, 40.875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 21.0, 29.0, 58.0, 138.0, 291.0, 230.0, 114.0, 62.0, 18.0, 21.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.78125, -57.52490234375, -56.2685546875, -55.01220703125, -53.755859375, -52.49951171875, -51.2431640625, -49.98681640625, -48.73046875, -47.47412109375, -46.2177734375, -44.96142578125, -43.705078125, -42.44873046875, -41.1923828125, -39.93603515625, -38.6796875, -37.42333984375, -36.1669921875, -34.91064453125, -33.654296875, -32.39794921875, -31.1416015625, -29.88525390625, -28.62890625, -27.37255859375, -26.1162109375, -24.85986328125, -23.603515625, -22.34716796875, -21.0908203125, -19.83447265625, -18.578125, -17.32177734375, -16.0654296875, -14.80908203125, -13.552734375, -12.29638671875, -11.0400390625, -9.78369140625, -8.52734375, -7.27099609375, -6.0146484375, -4.75830078125, -3.501953125, -2.24560546875, -0.9892578125, 0.26708984375, 1.5234375, 2.77978515625, 4.0361328125, 5.29248046875, 6.548828125, 7.80517578125, 9.0615234375, 10.31787109375, 11.57421875, 12.83056640625, 14.0869140625, 15.34326171875, 16.599609375, 17.85595703125, 19.1123046875, 20.36865234375, 21.625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 27.0, 27.0, 83.0, 122.0, 200.0, 208.0, 154.0, 85.0, 46.0, 23.0, 17.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.73980712890625, -273.4122009277344, -261.0846252441406, -248.75701904296875, -236.42942810058594, -224.10183715820312, -211.77423095703125, -199.44664001464844, -187.11904907226562, -174.7914581298828, -162.4638671875, -150.13626098632812, -137.8086700439453, -125.4810791015625, -113.15348052978516, -100.82588195800781, -88.498291015625, -76.17070007324219, -63.843101501464844, -51.515506744384766, -39.18791198730469, -26.86031723022461, -14.532722473144531, -2.2051239013671875, 10.122467041015625, 22.450061798095703, 34.77765655517578, 47.10525131225586, 59.43284606933594, 71.76043701171875, 84.0880355834961, 96.41563415527344, 108.74325561523438, 121.07084655761719, 133.3984375, 145.72604370117188, 158.0536346435547, 170.3812255859375, 182.70883178710938, 195.0364227294922, 207.364013671875, 219.6916046142578, 232.01919555664062, 244.3468017578125, 256.67437744140625, 269.0019836425781, 281.32958984375, 293.65716552734375, 305.9847717285156, 318.3123779296875, 330.63995361328125, 342.9675598144531, 355.295166015625, 367.62274169921875, 379.9503479003906, 392.2779541015625, 404.60552978515625, 416.9331359863281, 429.2607116699219, 441.58831787109375, 453.9158935546875, 466.2434997558594, 478.57110595703125, 490.898681640625, 503.2262878417969]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 9.0, 16.0, 6.0, 16.0, 13.0, 21.0, 26.0, 24.0, 32.0, 24.0, 36.0, 42.0, 50.0, 45.0, 53.0, 42.0, 50.0, 49.0, 45.0, 42.0, 41.0, 38.0, 40.0, 33.0, 35.0, 22.0, 18.0, 17.0, 26.0, 15.0, 11.0, 11.0, 8.0, 2.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.52256774902344, -165.47189331054688, -159.42120361328125, -153.37051391601562, -147.31983947753906, -141.2691650390625, -135.21847534179688, -129.16778564453125, -123.11711120605469, -117.0664291381836, -111.0157470703125, -104.9650650024414, -98.91438293457031, -92.86370086669922, -86.81301879882812, -80.76233673095703, -74.71165466308594, -68.66097259521484, -62.61029052734375, -56.559608459472656, -50.50892639160156, -44.45824432373047, -38.407562255859375, -32.35688018798828, -26.306198120117188, -20.255516052246094, -14.204833984375, -8.154151916503906, -2.1034698486328125, 3.9472122192382812, 9.997894287109375, 16.04857635498047, 22.099273681640625, 28.14995574951172, 34.20063781738281, 40.251319885253906, 46.302001953125, 52.352684020996094, 58.40336608886719, 64.45404815673828, 70.50473022460938, 76.55541229248047, 82.60609436035156, 88.65677642822266, 94.70745849609375, 100.75814056396484, 106.80882263183594, 112.85950469970703, 118.91018676757812, 124.96086883544922, 131.0115509033203, 137.06222534179688, 143.1129150390625, 149.16360473632812, 155.2142791748047, 161.26495361328125, 167.31564331054688, 173.3663330078125, 179.41700744628906, 185.46768188476562, 191.51837158203125, 197.56906127929688, 203.61973571777344, 209.67041015625, 215.72109985351562]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 6.0, 18.0, 23.0, 29.0, 56.0, 75.0, 113.0, 158.0, 316.0, 474.0, 897.0, 1705.0, 4105.0, 12298.0, 62134.0, 3975148.0, 110311.0, 16735.0, 5137.0, 2082.0, 975.0, 528.0, 323.0, 204.0, 121.0, 80.0, 46.0, 36.0, 30.0, 26.0, 15.0, 15.0, 8.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-61.65625, -59.822265625, -57.98828125, -56.154296875, -54.3203125, -52.486328125, -50.65234375, -48.818359375, -46.984375, -45.150390625, -43.31640625, -41.482421875, -39.6484375, -37.814453125, -35.98046875, -34.146484375, -32.3125, -30.478515625, -28.64453125, -26.810546875, -24.9765625, -23.142578125, -21.30859375, -19.474609375, -17.640625, -15.806640625, -13.97265625, -12.138671875, -10.3046875, -8.470703125, -6.63671875, -4.802734375, -2.96875, -1.134765625, 0.69921875, 2.533203125, 4.3671875, 6.201171875, 8.03515625, 9.869140625, 11.703125, 13.537109375, 15.37109375, 17.205078125, 19.0390625, 20.873046875, 22.70703125, 24.541015625, 26.375, 28.208984375, 30.04296875, 31.876953125, 33.7109375, 35.544921875, 37.37890625, 39.212890625, 41.046875, 42.880859375, 44.71484375, 46.548828125, 48.3828125, 50.216796875, 52.05078125, 53.884765625, 55.71875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 15.0, 10.0, 11.0, 23.0, 20.0, 19.0, 29.0, 27.0, 39.0, 47.0, 53.0, 61.0, 51.0, 56.0, 67.0, 61.0, 55.0, 55.0, 42.0, 46.0, 43.0, 34.0, 24.0, 19.0, 24.0, 14.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9609375, -9.616455078125, -9.27197265625, -8.927490234375, -8.5830078125, -8.238525390625, -7.89404296875, -7.549560546875, -7.205078125, -6.860595703125, -6.51611328125, -6.171630859375, -5.8271484375, -5.482666015625, -5.13818359375, -4.793701171875, -4.44921875, -4.104736328125, -3.76025390625, -3.415771484375, -3.0712890625, -2.726806640625, -2.38232421875, -2.037841796875, -1.693359375, -1.348876953125, -1.00439453125, -0.659912109375, -0.3154296875, 0.029052734375, 0.37353515625, 0.718017578125, 1.0625, 1.406982421875, 1.75146484375, 2.095947265625, 2.4404296875, 2.784912109375, 3.12939453125, 3.473876953125, 3.818359375, 4.162841796875, 4.50732421875, 4.851806640625, 5.1962890625, 5.540771484375, 5.88525390625, 6.229736328125, 6.57421875, 6.918701171875, 7.26318359375, 7.607666015625, 7.9521484375, 8.296630859375, 8.64111328125, 8.985595703125, 9.330078125, 9.674560546875, 10.01904296875, 10.363525390625, 10.7080078125, 11.052490234375, 11.39697265625, 11.741455078125, 12.0859375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 6.0, 9.0, 15.0, 18.0, 29.0, 48.0, 50.0, 76.0, 110.0, 142.0, 224.0, 317.0, 523.0, 815.0, 1351.0, 2556.0, 5226.0, 12386.0, 36958.0, 172228.0, 3738484.0, 163419.0, 35970.0, 12142.0, 5092.0, 2525.0, 1257.0, 761.0, 507.0, 321.0, 215.0, 144.0, 93.0, 78.0, 52.0, 35.0, 31.0, 18.0, 15.0, 6.0, 7.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.21875, -24.30126953125, -23.3837890625, -22.46630859375, -21.548828125, -20.63134765625, -19.7138671875, -18.79638671875, -17.87890625, -16.96142578125, -16.0439453125, -15.12646484375, -14.208984375, -13.29150390625, -12.3740234375, -11.45654296875, -10.5390625, -9.62158203125, -8.7041015625, -7.78662109375, -6.869140625, -5.95166015625, -5.0341796875, -4.11669921875, -3.19921875, -2.28173828125, -1.3642578125, -0.44677734375, 0.470703125, 1.38818359375, 2.3056640625, 3.22314453125, 4.140625, 5.05810546875, 5.9755859375, 6.89306640625, 7.810546875, 8.72802734375, 9.6455078125, 10.56298828125, 11.48046875, 12.39794921875, 13.3154296875, 14.23291015625, 15.150390625, 16.06787109375, 16.9853515625, 17.90283203125, 18.8203125, 19.73779296875, 20.6552734375, 21.57275390625, 22.490234375, 23.40771484375, 24.3251953125, 25.24267578125, 26.16015625, 27.07763671875, 27.9951171875, 28.91259765625, 29.830078125, 30.74755859375, 31.6650390625, 32.58251953125, 33.5]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 15.0, 11.0, 21.0, 34.0, 63.0, 108.0, 203.0, 2800.0, 440.0, 145.0, 66.0, 53.0, 30.0, 23.0, 13.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.59521484375, -7.3310546875, -7.06689453125, -6.802734375, -6.53857421875, -6.2744140625, -6.01025390625, -5.74609375, -5.48193359375, -5.2177734375, -4.95361328125, -4.689453125, -4.42529296875, -4.1611328125, -3.89697265625, -3.6328125, -3.36865234375, -3.1044921875, -2.84033203125, -2.576171875, -2.31201171875, -2.0478515625, -1.78369140625, -1.51953125, -1.25537109375, -0.9912109375, -0.72705078125, -0.462890625, -0.19873046875, 0.0654296875, 0.32958984375, 0.59375, 0.85791015625, 1.1220703125, 1.38623046875, 1.650390625, 1.91455078125, 2.1787109375, 2.44287109375, 2.70703125, 2.97119140625, 3.2353515625, 3.49951171875, 3.763671875, 4.02783203125, 4.2919921875, 4.55615234375, 4.8203125, 5.08447265625, 5.3486328125, 5.61279296875, 5.876953125, 6.14111328125, 6.4052734375, 6.66943359375, 6.93359375, 7.19775390625, 7.4619140625, 7.72607421875, 7.990234375, 8.25439453125, 8.5185546875, 8.78271484375, 9.046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 13.0, 14.0, 28.0, 20.0, 45.0, 37.0, 57.0, 67.0, 74.0, 79.0, 78.0, 91.0, 74.0, 83.0, 56.0, 43.0, 34.0, 21.0, 19.0, 19.0, 15.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.86351776123047, -22.810800552368164, -21.75808334350586, -20.705366134643555, -19.65264892578125, -18.599933624267578, -17.547216415405273, -16.49449920654297, -15.441781997680664, -14.38906478881836, -13.336347579956055, -12.283631324768066, -11.230914115905762, -10.178196907043457, -9.125480651855469, -8.072763442993164, -7.020046234130859, -5.967329025268555, -4.914612293243408, -3.8618953227996826, -2.809178352355957, -1.7564611434936523, -0.7037444114685059, 0.3489723205566406, 1.4016895294189453, 2.454406499862671, 3.5071234703063965, 4.559840202331543, 5.612557411193848, 6.665274620056152, 7.717991352081299, 8.770708084106445, 9.82342529296875, 10.876142501831055, 11.92885971069336, 12.981575965881348, 14.034293174743652, 15.087010383605957, 16.139726638793945, 17.19244384765625, 18.245161056518555, 19.29787826538086, 20.350595474243164, 21.40331268310547, 22.45602798461914, 23.508747100830078, 24.56146240234375, 25.614179611206055, 26.66689682006836, 27.719614028930664, 28.77233123779297, 29.825048446655273, 30.877765655517578, 31.93048095703125, 32.98320007324219, 34.03591537475586, 35.08863067626953, 36.1413459777832, 37.19406509399414, 38.24678039550781, 39.29949951171875, 40.35221481323242, 41.40493392944336, 42.45764923095703, 43.51036834716797]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 6.0, 3.0, 7.0, 8.0, 8.0, 13.0, 20.0, 17.0, 19.0, 17.0, 20.0, 18.0, 28.0, 23.0, 39.0, 28.0, 33.0, 36.0, 27.0, 35.0, 40.0, 33.0, 41.0, 41.0, 47.0, 33.0, 34.0, 36.0, 31.0, 34.0, 27.0, 35.0, 24.0, 27.0, 15.0, 17.0, 19.0, 10.0, 8.0, 7.0, 11.0, 7.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-20.44688606262207, -19.838655471801758, -19.230424880981445, -18.6221923828125, -18.013961791992188, -17.405731201171875, -16.797500610351562, -16.18927001953125, -15.581038475036621, -14.972807884216309, -14.36457633972168, -13.756345748901367, -13.148115158081055, -12.539883613586426, -11.931653022766113, -11.323421478271484, -10.715190887451172, -10.10696029663086, -9.49872875213623, -8.890498161315918, -8.282266616821289, -7.674036026000977, -7.065805435180664, -6.457574367523193, -5.849343299865723, -5.241112232208252, -4.632881164550781, -4.024650573730469, -3.416419506072998, -2.8081884384155273, -2.1999576091766357, -1.5917267799377441, -0.9834938049316406, -0.3752628564834595, 0.23296809196472168, 0.8411990404129028, 1.449429988861084, 2.0576610565185547, 2.6658918857574463, 3.274122714996338, 3.8823537826538086, 4.490584850311279, 5.09881591796875, 5.7070465087890625, 6.315277576446533, 6.923508644104004, 7.531739234924316, 8.139970779418945, 8.748201370239258, 9.35643196105957, 9.9646635055542, 10.572894096374512, 11.18112564086914, 11.789356231689453, 12.397586822509766, 13.005817413330078, 13.614048957824707, 14.22227954864502, 14.830511093139648, 15.438741683959961, 16.046972274780273, 16.65520477294922, 17.26343536376953, 17.871665954589844, 18.479896545410156]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 13.0, 23.0, 35.0, 33.0, 54.0, 98.0, 163.0, 226.0, 386.0, 714.0, 1307.0, 2392.0, 4898.0, 10575.0, 24868.0, 61761.0, 160364.0, 330136.0, 265697.0, 109294.0, 42368.0, 17463.0, 7788.0, 3700.0, 1773.0, 954.0, 549.0, 328.0, 171.0, 138.0, 83.0, 58.0, 45.0, 23.0, 12.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 5.0], "bins": [-23.265625, -22.6810302734375, -22.096435546875, -21.5118408203125, -20.92724609375, -20.3426513671875, -19.758056640625, -19.1734619140625, -18.5888671875, -18.0042724609375, -17.419677734375, -16.8350830078125, -16.25048828125, -15.6658935546875, -15.081298828125, -14.4967041015625, -13.912109375, -13.3275146484375, -12.742919921875, -12.1583251953125, -11.57373046875, -10.9891357421875, -10.404541015625, -9.8199462890625, -9.2353515625, -8.6507568359375, -8.066162109375, -7.4815673828125, -6.89697265625, -6.3123779296875, -5.727783203125, -5.1431884765625, -4.55859375, -3.9739990234375, -3.389404296875, -2.8048095703125, -2.22021484375, -1.6356201171875, -1.051025390625, -0.4664306640625, 0.1181640625, 0.7027587890625, 1.287353515625, 1.8719482421875, 2.45654296875, 3.0411376953125, 3.625732421875, 4.2103271484375, 4.794921875, 5.3795166015625, 5.964111328125, 6.5487060546875, 7.13330078125, 7.7178955078125, 8.302490234375, 8.8870849609375, 9.4716796875, 10.0562744140625, 10.640869140625, 11.2254638671875, 11.81005859375, 12.3946533203125, 12.979248046875, 13.5638427734375, 14.1484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 13.0, 14.0, 17.0, 13.0, 18.0, 43.0, 23.0, 32.0, 40.0, 44.0, 43.0, 38.0, 49.0, 55.0, 71.0, 56.0, 53.0, 52.0, 45.0, 46.0, 49.0, 30.0, 30.0, 29.0, 17.0, 13.0, 12.0, 13.0, 4.0, 4.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.671875, -10.3175048828125, -9.963134765625, -9.6087646484375, -9.25439453125, -8.9000244140625, -8.545654296875, -8.1912841796875, -7.8369140625, -7.4825439453125, -7.128173828125, -6.7738037109375, -6.41943359375, -6.0650634765625, -5.710693359375, -5.3563232421875, -5.001953125, -4.6475830078125, -4.293212890625, -3.9388427734375, -3.58447265625, -3.2301025390625, -2.875732421875, -2.5213623046875, -2.1669921875, -1.8126220703125, -1.458251953125, -1.1038818359375, -0.74951171875, -0.3951416015625, -0.040771484375, 0.3135986328125, 0.66796875, 1.0223388671875, 1.376708984375, 1.7310791015625, 2.08544921875, 2.4398193359375, 2.794189453125, 3.1485595703125, 3.5029296875, 3.8572998046875, 4.211669921875, 4.5660400390625, 4.92041015625, 5.2747802734375, 5.629150390625, 5.9835205078125, 6.337890625, 6.6922607421875, 7.046630859375, 7.4010009765625, 7.75537109375, 8.1097412109375, 8.464111328125, 8.8184814453125, 9.1728515625, 9.5272216796875, 9.881591796875, 10.2359619140625, 10.59033203125, 10.9447021484375, 11.299072265625, 11.6534423828125, 12.0078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 14.0, 17.0, 25.0, 38.0, 51.0, 109.0, 154.0, 286.0, 443.0, 807.0, 1514.0, 3996.0, 20550.0, 223846.0, 708073.0, 74141.0, 9319.0, 2496.0, 1097.0, 609.0, 362.0, 222.0, 130.0, 85.0, 58.0, 32.0, 19.0, 18.0, 15.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.77001953125, -37.4462890625, -36.12255859375, -34.798828125, -33.47509765625, -32.1513671875, -30.82763671875, -29.50390625, -28.18017578125, -26.8564453125, -25.53271484375, -24.208984375, -22.88525390625, -21.5615234375, -20.23779296875, -18.9140625, -17.59033203125, -16.2666015625, -14.94287109375, -13.619140625, -12.29541015625, -10.9716796875, -9.64794921875, -8.32421875, -7.00048828125, -5.6767578125, -4.35302734375, -3.029296875, -1.70556640625, -0.3818359375, 0.94189453125, 2.265625, 3.58935546875, 4.9130859375, 6.23681640625, 7.560546875, 8.88427734375, 10.2080078125, 11.53173828125, 12.85546875, 14.17919921875, 15.5029296875, 16.82666015625, 18.150390625, 19.47412109375, 20.7978515625, 22.12158203125, 23.4453125, 24.76904296875, 26.0927734375, 27.41650390625, 28.740234375, 30.06396484375, 31.3876953125, 32.71142578125, 34.03515625, 35.35888671875, 36.6826171875, 38.00634765625, 39.330078125, 40.65380859375, 41.9775390625, 43.30126953125, 44.625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 10.0, 15.0, 11.0, 24.0, 28.0, 36.0, 47.0, 68.0, 68.0, 81.0, 97.0, 92.0, 82.0, 74.0, 74.0, 60.0, 46.0, 39.0, 12.0, 19.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.125, -94.6435546875, -92.162109375, -89.6806640625, -87.19921875, -84.7177734375, -82.236328125, -79.7548828125, -77.2734375, -74.7919921875, -72.310546875, -69.8291015625, -67.34765625, -64.8662109375, -62.384765625, -59.9033203125, -57.421875, -54.9404296875, -52.458984375, -49.9775390625, -47.49609375, -45.0146484375, -42.533203125, -40.0517578125, -37.5703125, -35.0888671875, -32.607421875, -30.1259765625, -27.64453125, -25.1630859375, -22.681640625, -20.2001953125, -17.71875, -15.2373046875, -12.755859375, -10.2744140625, -7.79296875, -5.3115234375, -2.830078125, -0.3486328125, 2.1328125, 4.6142578125, 7.095703125, 9.5771484375, 12.05859375, 14.5400390625, 17.021484375, 19.5029296875, 21.984375, 24.4658203125, 26.947265625, 29.4287109375, 31.91015625, 34.3916015625, 36.873046875, 39.3544921875, 41.8359375, 44.3173828125, 46.798828125, 49.2802734375, 51.76171875, 54.2431640625, 56.724609375, 59.2060546875, 61.6875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 9.0, 20.0, 24.0, 36.0, 33.0, 46.0, 87.0, 165.0, 320.0, 830.0, 2377.0, 10241.0, 72716.0, 685320.0, 244919.0, 24460.0, 4593.0, 1227.0, 469.0, 236.0, 130.0, 79.0, 62.0, 28.0, 20.0, 23.0, 16.0, 12.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.90625, -14.4366455078125, -13.967041015625, -13.4974365234375, -13.02783203125, -12.5582275390625, -12.088623046875, -11.6190185546875, -11.1494140625, -10.6798095703125, -10.210205078125, -9.7406005859375, -9.27099609375, -8.8013916015625, -8.331787109375, -7.8621826171875, -7.392578125, -6.9229736328125, -6.453369140625, -5.9837646484375, -5.51416015625, -5.0445556640625, -4.574951171875, -4.1053466796875, -3.6357421875, -3.1661376953125, -2.696533203125, -2.2269287109375, -1.75732421875, -1.2877197265625, -0.818115234375, -0.3485107421875, 0.12109375, 0.5906982421875, 1.060302734375, 1.5299072265625, 1.99951171875, 2.4691162109375, 2.938720703125, 3.4083251953125, 3.8779296875, 4.3475341796875, 4.817138671875, 5.2867431640625, 5.75634765625, 6.2259521484375, 6.695556640625, 7.1651611328125, 7.634765625, 8.1043701171875, 8.573974609375, 9.0435791015625, 9.51318359375, 9.9827880859375, 10.452392578125, 10.9219970703125, 11.3916015625, 11.8612060546875, 12.330810546875, 12.8004150390625, 13.27001953125, 13.7396240234375, 14.209228515625, 14.6788330078125, 15.1484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 12.0, 14.0, 14.0, 23.0, 23.0, 26.0, 38.0, 49.0, 61.0, 86.0, 92.0, 97.0, 77.0, 94.0, 74.0, 52.0, 40.0, 21.0, 15.0, 27.0, 12.0, 6.0, 3.0, 7.0, 7.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015344619750976562, -0.001486077904701233, -0.0014376938343048096, -0.0013893097639083862, -0.0013409256935119629, -0.0012925416231155396, -0.0012441575527191162, -0.0011957734823226929, -0.0011473894119262695, -0.0010990053415298462, -0.0010506212711334229, -0.0010022372007369995, -0.0009538531303405762, -0.0009054690599441528, -0.0008570849895477295, -0.0008087009191513062, -0.0007603168487548828, -0.0007119327783584595, -0.0006635487079620361, -0.0006151646375656128, -0.0005667805671691895, -0.0005183964967727661, -0.0004700124263763428, -0.00042162835597991943, -0.0003732442855834961, -0.00032486021518707275, -0.0002764761447906494, -0.00022809207439422607, -0.00017970800399780273, -0.0001313239336013794, -8.293986320495605e-05, -3.4555792808532715e-05, 1.3828277587890625e-05, 6.221234798431396e-05, 0.0001105964183807373, 0.00015898048877716064, 0.00020736455917358398, 0.0002557486295700073, 0.00030413269996643066, 0.000352516770362854, 0.00040090084075927734, 0.0004492849111557007, 0.000497668981552124, 0.0005460530519485474, 0.0005944371223449707, 0.000642821192741394, 0.0006912052631378174, 0.0007395893335342407, 0.0007879734039306641, 0.0008363574743270874, 0.0008847415447235107, 0.0009331256151199341, 0.0009815096855163574, 0.0010298937559127808, 0.001078277826309204, 0.0011266618967056274, 0.0011750459671020508, 0.0012234300374984741, 0.0012718141078948975, 0.0013201981782913208, 0.0013685822486877441, 0.0014169663190841675, 0.0014653503894805908, 0.0015137344598770142, 0.0015621185302734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 12.0, 18.0, 39.0, 64.0, 96.0, 148.0, 340.0, 870.0, 2642.0, 15790.0, 292222.0, 693800.0, 35941.0, 4480.0, 1144.0, 420.0, 207.0, 125.0, 66.0, 45.0, 22.0, 17.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.365966796875, -21.74755859375, -21.129150390625, -20.5107421875, -19.892333984375, -19.27392578125, -18.655517578125, -18.037109375, -17.418701171875, -16.80029296875, -16.181884765625, -15.5634765625, -14.945068359375, -14.32666015625, -13.708251953125, -13.08984375, -12.471435546875, -11.85302734375, -11.234619140625, -10.6162109375, -9.997802734375, -9.37939453125, -8.760986328125, -8.142578125, -7.524169921875, -6.90576171875, -6.287353515625, -5.6689453125, -5.050537109375, -4.43212890625, -3.813720703125, -3.1953125, -2.576904296875, -1.95849609375, -1.340087890625, -0.7216796875, -0.103271484375, 0.51513671875, 1.133544921875, 1.751953125, 2.370361328125, 2.98876953125, 3.607177734375, 4.2255859375, 4.843994140625, 5.46240234375, 6.080810546875, 6.69921875, 7.317626953125, 7.93603515625, 8.554443359375, 9.1728515625, 9.791259765625, 10.40966796875, 11.028076171875, 11.646484375, 12.264892578125, 12.88330078125, 13.501708984375, 14.1201171875, 14.738525390625, 15.35693359375, 15.975341796875, 16.59375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 16.0, 18.0, 29.0, 62.0, 116.0, 174.0, 212.0, 161.0, 82.0, 46.0, 35.0, 18.0, 11.0, 10.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -12.74658203125, -11.9619140625, -11.17724609375, -10.392578125, -9.60791015625, -8.8232421875, -8.03857421875, -7.25390625, -6.46923828125, -5.6845703125, -4.89990234375, -4.115234375, -3.33056640625, -2.5458984375, -1.76123046875, -0.9765625, -0.19189453125, 0.5927734375, 1.37744140625, 2.162109375, 2.94677734375, 3.7314453125, 4.51611328125, 5.30078125, 6.08544921875, 6.8701171875, 7.65478515625, 8.439453125, 9.22412109375, 10.0087890625, 10.79345703125, 11.578125, 12.36279296875, 13.1474609375, 13.93212890625, 14.716796875, 15.50146484375, 16.2861328125, 17.07080078125, 17.85546875, 18.64013671875, 19.4248046875, 20.20947265625, 20.994140625, 21.77880859375, 22.5634765625, 23.34814453125, 24.1328125, 24.91748046875, 25.7021484375, 26.48681640625, 27.271484375, 28.05615234375, 28.8408203125, 29.62548828125, 30.41015625, 31.19482421875, 31.9794921875, 32.76416015625, 33.548828125, 34.33349609375, 35.1181640625, 35.90283203125, 36.6875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 10.0, 25.0, 62.0, 113.0, 178.0, 186.0, 198.0, 104.0, 67.0, 29.0, 16.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.80343627929688, -229.04330444335938, -219.28317260742188, -209.52304077148438, -199.76290893554688, -190.00277709960938, -180.24266052246094, -170.48252868652344, -160.72239685058594, -150.96226501464844, -141.20213317871094, -131.44200134277344, -121.68187713623047, -111.92174530029297, -102.16162109375, -92.4014892578125, -82.641357421875, -72.8812255859375, -63.121097564697266, -53.36096954345703, -43.60083770751953, -33.84070587158203, -24.080577850341797, -14.320449829101562, -4.5603179931640625, 5.199811935424805, 14.959941864013672, 24.72007179260254, 34.480201721191406, 44.240333557128906, 54.00046157836914, 63.760589599609375, 73.520751953125, 83.2808837890625, 93.041015625, 102.80113983154297, 112.56127166748047, 122.32140350341797, 132.08152770996094, 141.84165954589844, 151.60179138183594, 161.36192321777344, 171.12205505371094, 180.88218688964844, 190.64230346679688, 200.40243530273438, 210.16256713867188, 219.92269897460938, 229.68283081054688, 239.44296264648438, 249.20309448242188, 258.9632263183594, 268.7233581542969, 278.4834899902344, 288.2436218261719, 298.00372314453125, 307.76385498046875, 317.52398681640625, 327.28411865234375, 337.04425048828125, 346.80438232421875, 356.56451416015625, 366.32464599609375, 376.08477783203125, 385.84490966796875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 7.0, 6.0, 6.0, 9.0, 14.0, 20.0, 18.0, 19.0, 16.0, 25.0, 30.0, 30.0, 35.0, 39.0, 38.0, 69.0, 42.0, 46.0, 42.0, 49.0, 42.0, 61.0, 54.0, 39.0, 30.0, 26.0, 27.0, 29.0, 21.0, 22.0, 18.0, 14.0, 13.0, 6.0, 10.0, 4.0, 1.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.62432861328125, -136.12173461914062, -130.619140625, -125.11654663085938, -119.61395263671875, -114.11135864257812, -108.60877227783203, -103.1061782836914, -97.60358428955078, -92.10099029541016, -86.59839630126953, -81.09580993652344, -75.59321594238281, -70.09062194824219, -64.58802795410156, -59.08543395996094, -53.58283996582031, -48.08024597167969, -42.57765197753906, -37.0750617980957, -31.572467803955078, -26.069873809814453, -20.567283630371094, -15.064689636230469, -9.562095642089844, -4.059502601623535, 1.4430904388427734, 6.945682525634766, 12.44827651977539, 17.950870513916016, 23.453460693359375, 28.9560546875, 34.458648681640625, 39.96124267578125, 45.463836669921875, 50.966426849365234, 56.46902084350586, 61.971614837646484, 67.47420501708984, 72.97679901123047, 78.4793930053711, 83.98198699951172, 89.48458099365234, 94.98716735839844, 100.48976135253906, 105.99235534667969, 111.49494934082031, 116.99754333496094, 122.50013732910156, 128.0027313232422, 133.5053253173828, 139.00791931152344, 144.51051330566406, 150.0131072998047, 155.51568603515625, 161.01828002929688, 166.5208740234375, 172.02346801757812, 177.52606201171875, 183.02865600585938, 188.53125, 194.03384399414062, 199.53643798828125, 205.03903198242188, 210.5416259765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 14.0, 26.0, 29.0, 53.0, 47.0, 66.0, 127.0, 218.0, 303.0, 536.0, 921.0, 1679.0, 3633.0, 9746.0, 70909.0, 4076140.0, 19210.0, 5362.0, 2359.0, 1141.0, 627.0, 378.0, 244.0, 152.0, 105.0, 77.0, 44.0, 35.0, 20.0, 20.0, 19.0, 9.0, 13.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.28125, -57.54931640625, -55.8173828125, -54.08544921875, -52.353515625, -50.62158203125, -48.8896484375, -47.15771484375, -45.42578125, -43.69384765625, -41.9619140625, -40.22998046875, -38.498046875, -36.76611328125, -35.0341796875, -33.30224609375, -31.5703125, -29.83837890625, -28.1064453125, -26.37451171875, -24.642578125, -22.91064453125, -21.1787109375, -19.44677734375, -17.71484375, -15.98291015625, -14.2509765625, -12.51904296875, -10.787109375, -9.05517578125, -7.3232421875, -5.59130859375, -3.859375, -2.12744140625, -0.3955078125, 1.33642578125, 3.068359375, 4.80029296875, 6.5322265625, 8.26416015625, 9.99609375, 11.72802734375, 13.4599609375, 15.19189453125, 16.923828125, 18.65576171875, 20.3876953125, 22.11962890625, 23.8515625, 25.58349609375, 27.3154296875, 29.04736328125, 30.779296875, 32.51123046875, 34.2431640625, 35.97509765625, 37.70703125, 39.43896484375, 41.1708984375, 42.90283203125, 44.634765625, 46.36669921875, 48.0986328125, 49.83056640625, 51.5625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 6.0, 8.0, 11.0, 13.0, 24.0, 18.0, 25.0, 22.0, 32.0, 36.0, 58.0, 46.0, 48.0, 62.0, 69.0, 57.0, 66.0, 54.0, 45.0, 51.0, 46.0, 38.0, 28.0, 32.0, 25.0, 20.0, 14.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.859375, -11.4774169921875, -11.095458984375, -10.7135009765625, -10.33154296875, -9.9495849609375, -9.567626953125, -9.1856689453125, -8.8037109375, -8.4217529296875, -8.039794921875, -7.6578369140625, -7.27587890625, -6.8939208984375, -6.511962890625, -6.1300048828125, -5.748046875, -5.3660888671875, -4.984130859375, -4.6021728515625, -4.22021484375, -3.8382568359375, -3.456298828125, -3.0743408203125, -2.6923828125, -2.3104248046875, -1.928466796875, -1.5465087890625, -1.16455078125, -0.7825927734375, -0.400634765625, -0.0186767578125, 0.36328125, 0.7452392578125, 1.127197265625, 1.5091552734375, 1.89111328125, 2.2730712890625, 2.655029296875, 3.0369873046875, 3.4189453125, 3.8009033203125, 4.182861328125, 4.5648193359375, 4.94677734375, 5.3287353515625, 5.710693359375, 6.0926513671875, 6.474609375, 6.8565673828125, 7.238525390625, 7.6204833984375, 8.00244140625, 8.3843994140625, 8.766357421875, 9.1483154296875, 9.5302734375, 9.9122314453125, 10.294189453125, 10.6761474609375, 11.05810546875, 11.4400634765625, 11.822021484375, 12.2039794921875, 12.5859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 8.0, 15.0, 11.0, 26.0, 52.0, 42.0, 104.0, 135.0, 170.0, 258.0, 414.0, 679.0, 1214.0, 2261.0, 4717.0, 11633.0, 54635.0, 4044434.0, 52344.0, 11318.0, 4549.0, 2177.0, 1162.0, 696.0, 424.0, 248.0, 175.0, 103.0, 95.0, 68.0, 39.0, 24.0, 18.0, 17.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.25, -38.0419921875, -36.833984375, -35.6259765625, -34.41796875, -33.2099609375, -32.001953125, -30.7939453125, -29.5859375, -28.3779296875, -27.169921875, -25.9619140625, -24.75390625, -23.5458984375, -22.337890625, -21.1298828125, -19.921875, -18.7138671875, -17.505859375, -16.2978515625, -15.08984375, -13.8818359375, -12.673828125, -11.4658203125, -10.2578125, -9.0498046875, -7.841796875, -6.6337890625, -5.42578125, -4.2177734375, -3.009765625, -1.8017578125, -0.59375, 0.6142578125, 1.822265625, 3.0302734375, 4.23828125, 5.4462890625, 6.654296875, 7.8623046875, 9.0703125, 10.2783203125, 11.486328125, 12.6943359375, 13.90234375, 15.1103515625, 16.318359375, 17.5263671875, 18.734375, 19.9423828125, 21.150390625, 22.3583984375, 23.56640625, 24.7744140625, 25.982421875, 27.1904296875, 28.3984375, 29.6064453125, 30.814453125, 32.0224609375, 33.23046875, 34.4384765625, 35.646484375, 36.8544921875, 38.0625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 3.0, 11.0, 10.0, 10.0, 19.0, 34.0, 50.0, 169.0, 3543.0, 112.0, 38.0, 21.0, 14.0, 8.0, 4.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.1163330078125, -6.865478515625, -6.6146240234375, -6.36376953125, -6.1129150390625, -5.862060546875, -5.6112060546875, -5.3603515625, -5.1094970703125, -4.858642578125, -4.6077880859375, -4.35693359375, -4.1060791015625, -3.855224609375, -3.6043701171875, -3.353515625, -3.1026611328125, -2.851806640625, -2.6009521484375, -2.35009765625, -2.0992431640625, -1.848388671875, -1.5975341796875, -1.3466796875, -1.0958251953125, -0.844970703125, -0.5941162109375, -0.34326171875, -0.0924072265625, 0.158447265625, 0.4093017578125, 0.66015625, 0.9110107421875, 1.161865234375, 1.4127197265625, 1.66357421875, 1.9144287109375, 2.165283203125, 2.4161376953125, 2.6669921875, 2.9178466796875, 3.168701171875, 3.4195556640625, 3.67041015625, 3.9212646484375, 4.172119140625, 4.4229736328125, 4.673828125, 4.9246826171875, 5.175537109375, 5.4263916015625, 5.67724609375, 5.9281005859375, 6.178955078125, 6.4298095703125, 6.6806640625, 6.9315185546875, 7.182373046875, 7.4332275390625, 7.68408203125, 7.9349365234375, 8.185791015625, 8.4366455078125, 8.6875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 9.0, 7.0, 21.0, 32.0, 52.0, 76.0, 99.0, 165.0, 156.0, 145.0, 80.0, 56.0, 48.0, 21.0, 10.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.23912811279297, -28.971227645874023, -27.703327178955078, -26.435426712036133, -25.167526245117188, -23.89962387084961, -22.631723403930664, -21.36382293701172, -20.095922470092773, -18.828022003173828, -17.560121536254883, -16.292221069335938, -15.024319648742676, -13.75641918182373, -12.488517761230469, -11.220617294311523, -9.952716827392578, -8.684816360473633, -7.416915416717529, -6.149014472961426, -4.8811140060424805, -3.613213539123535, -2.3453125953674316, -1.0774116516113281, 0.1904888153076172, 1.4583895206451416, 2.726290225982666, 3.9941909313201904, 5.262091636657715, 6.52999210357666, 7.797893047332764, 9.065793991088867, 10.333694458007812, 11.601594924926758, 12.869495391845703, 14.137396812438965, 15.40529727935791, 16.673198699951172, 17.941099166870117, 19.208999633789062, 20.476900100708008, 21.744800567626953, 23.0127010345459, 24.280601501464844, 25.548503875732422, 26.816402435302734, 28.084304809570312, 29.352205276489258, 30.620105743408203, 31.88800621032715, 33.155906677246094, 34.42380905151367, 35.691707611083984, 36.95960998535156, 38.227508544921875, 39.49541091918945, 40.76331329345703, 42.03121566772461, 43.29911422729492, 44.5670166015625, 45.83491516113281, 47.10281753540039, 48.3707160949707, 49.63861846923828, 50.906517028808594]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 5.0, 9.0, 12.0, 11.0, 24.0, 30.0, 36.0, 24.0, 44.0, 34.0, 48.0, 51.0, 34.0, 55.0, 45.0, 49.0, 48.0, 48.0, 44.0, 56.0, 40.0, 34.0, 37.0, 38.0, 27.0, 19.0, 17.0, 21.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.48516845703125, -16.885601043701172, -16.286035537719727, -15.686468124389648, -15.086901664733887, -14.487335205078125, -13.887767791748047, -13.288201332092285, -12.688634872436523, -12.089068412780762, -11.489500999450684, -10.889934539794922, -10.29036808013916, -9.690801620483398, -9.09123420715332, -8.491667747497559, -7.8921003341674805, -7.2925333976745605, -6.692966938018799, -6.093400001525879, -5.493833541870117, -4.894266605377197, -4.294699668884277, -3.6951332092285156, -3.0955662727355957, -2.495999574661255, -1.8964327573776245, -1.2968659400939941, -0.6972992420196533, -0.0977325439453125, 0.5018343925476074, 1.1014008522033691, 1.700967788696289, 2.30053448677063, 2.9001011848449707, 3.4996681213378906, 4.099234580993652, 4.698801517486572, 5.298368453979492, 5.897934913635254, 6.497501850128174, 7.097068786621094, 7.6966352462768555, 8.296201705932617, 8.895769119262695, 9.495335578918457, 10.094902038574219, 10.694469451904297, 11.294035911560059, 11.89360237121582, 12.493169784545898, 13.09273624420166, 13.692302703857422, 14.2918701171875, 14.891436576843262, 15.491003036499023, 16.0905704498291, 16.69013786315918, 17.289703369140625, 17.889270782470703, 18.48883819580078, 19.088403701782227, 19.687971115112305, 20.28753662109375, 20.887104034423828]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 14.0, 13.0, 24.0, 22.0, 35.0, 50.0, 69.0, 98.0, 165.0, 271.0, 370.0, 609.0, 992.0, 1791.0, 3120.0, 5748.0, 10670.0, 21807.0, 44177.0, 91865.0, 181555.0, 271511.0, 203803.0, 106014.0, 51348.0, 24798.0, 12461.0, 6518.0, 3571.0, 1976.0, 1129.0, 670.0, 427.0, 283.0, 193.0, 122.0, 87.0, 41.0, 32.0, 27.0, 20.0, 18.0, 9.0, 10.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-13.5078125, -13.117431640625, -12.72705078125, -12.336669921875, -11.9462890625, -11.555908203125, -11.16552734375, -10.775146484375, -10.384765625, -9.994384765625, -9.60400390625, -9.213623046875, -8.8232421875, -8.432861328125, -8.04248046875, -7.652099609375, -7.26171875, -6.871337890625, -6.48095703125, -6.090576171875, -5.7001953125, -5.309814453125, -4.91943359375, -4.529052734375, -4.138671875, -3.748291015625, -3.35791015625, -2.967529296875, -2.5771484375, -2.186767578125, -1.79638671875, -1.406005859375, -1.015625, -0.625244140625, -0.23486328125, 0.155517578125, 0.5458984375, 0.936279296875, 1.32666015625, 1.717041015625, 2.107421875, 2.497802734375, 2.88818359375, 3.278564453125, 3.6689453125, 4.059326171875, 4.44970703125, 4.840087890625, 5.23046875, 5.620849609375, 6.01123046875, 6.401611328125, 6.7919921875, 7.182373046875, 7.57275390625, 7.963134765625, 8.353515625, 8.743896484375, 9.13427734375, 9.524658203125, 9.9150390625, 10.305419921875, 10.69580078125, 11.086181640625, 11.4765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 5.0, 11.0, 12.0, 14.0, 12.0, 25.0, 32.0, 23.0, 37.0, 40.0, 29.0, 55.0, 57.0, 65.0, 69.0, 59.0, 61.0, 59.0, 46.0, 53.0, 50.0, 28.0, 40.0, 31.0, 18.0, 13.0, 11.0, 18.0, 7.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6640625, -12.268310546875, -11.87255859375, -11.476806640625, -11.0810546875, -10.685302734375, -10.28955078125, -9.893798828125, -9.498046875, -9.102294921875, -8.70654296875, -8.310791015625, -7.9150390625, -7.519287109375, -7.12353515625, -6.727783203125, -6.33203125, -5.936279296875, -5.54052734375, -5.144775390625, -4.7490234375, -4.353271484375, -3.95751953125, -3.561767578125, -3.166015625, -2.770263671875, -2.37451171875, -1.978759765625, -1.5830078125, -1.187255859375, -0.79150390625, -0.395751953125, 0.0, 0.395751953125, 0.79150390625, 1.187255859375, 1.5830078125, 1.978759765625, 2.37451171875, 2.770263671875, 3.166015625, 3.561767578125, 3.95751953125, 4.353271484375, 4.7490234375, 5.144775390625, 5.54052734375, 5.936279296875, 6.33203125, 6.727783203125, 7.12353515625, 7.519287109375, 7.9150390625, 8.310791015625, 8.70654296875, 9.102294921875, 9.498046875, 9.893798828125, 10.28955078125, 10.685302734375, 11.0810546875, 11.476806640625, 11.87255859375, 12.268310546875, 12.6640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 16.0, 22.0, 22.0, 31.0, 48.0, 68.0, 110.0, 122.0, 163.0, 213.0, 293.0, 414.0, 591.0, 893.0, 1678.0, 4011.0, 16330.0, 101031.0, 630230.0, 245837.0, 33594.0, 6824.0, 2324.0, 1179.0, 727.0, 509.0, 328.0, 242.0, 203.0, 122.0, 97.0, 64.0, 56.0, 29.0, 48.0, 21.0, 15.0, 13.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.0, -26.120849609375, -25.24169921875, -24.362548828125, -23.4833984375, -22.604248046875, -21.72509765625, -20.845947265625, -19.966796875, -19.087646484375, -18.20849609375, -17.329345703125, -16.4501953125, -15.571044921875, -14.69189453125, -13.812744140625, -12.93359375, -12.054443359375, -11.17529296875, -10.296142578125, -9.4169921875, -8.537841796875, -7.65869140625, -6.779541015625, -5.900390625, -5.021240234375, -4.14208984375, -3.262939453125, -2.3837890625, -1.504638671875, -0.62548828125, 0.253662109375, 1.1328125, 2.011962890625, 2.89111328125, 3.770263671875, 4.6494140625, 5.528564453125, 6.40771484375, 7.286865234375, 8.166015625, 9.045166015625, 9.92431640625, 10.803466796875, 11.6826171875, 12.561767578125, 13.44091796875, 14.320068359375, 15.19921875, 16.078369140625, 16.95751953125, 17.836669921875, 18.7158203125, 19.594970703125, 20.47412109375, 21.353271484375, 22.232421875, 23.111572265625, 23.99072265625, 24.869873046875, 25.7490234375, 26.628173828125, 27.50732421875, 28.386474609375, 29.265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 11.0, 6.0, 8.0, 11.0, 15.0, 23.0, 18.0, 24.0, 44.0, 32.0, 38.0, 40.0, 50.0, 46.0, 43.0, 55.0, 60.0, 51.0, 50.0, 47.0, 46.0, 41.0, 34.0, 29.0, 30.0, 27.0, 22.0, 20.0, 17.0, 16.0, 9.0, 8.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-53.03125, -51.62548828125, -50.2197265625, -48.81396484375, -47.408203125, -46.00244140625, -44.5966796875, -43.19091796875, -41.78515625, -40.37939453125, -38.9736328125, -37.56787109375, -36.162109375, -34.75634765625, -33.3505859375, -31.94482421875, -30.5390625, -29.13330078125, -27.7275390625, -26.32177734375, -24.916015625, -23.51025390625, -22.1044921875, -20.69873046875, -19.29296875, -17.88720703125, -16.4814453125, -15.07568359375, -13.669921875, -12.26416015625, -10.8583984375, -9.45263671875, -8.046875, -6.64111328125, -5.2353515625, -3.82958984375, -2.423828125, -1.01806640625, 0.3876953125, 1.79345703125, 3.19921875, 4.60498046875, 6.0107421875, 7.41650390625, 8.822265625, 10.22802734375, 11.6337890625, 13.03955078125, 14.4453125, 15.85107421875, 17.2568359375, 18.66259765625, 20.068359375, 21.47412109375, 22.8798828125, 24.28564453125, 25.69140625, 27.09716796875, 28.5029296875, 29.90869140625, 31.314453125, 32.72021484375, 34.1259765625, 35.53173828125, 36.9375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 8.0, 9.0, 10.0, 13.0, 15.0, 23.0, 32.0, 48.0, 54.0, 80.0, 168.0, 350.0, 797.0, 2456.0, 10813.0, 120345.0, 844161.0, 58879.0, 7101.0, 1822.0, 648.0, 317.0, 161.0, 80.0, 53.0, 26.0, 23.0, 12.0, 11.0, 12.0, 10.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.275146484375, -16.70654296875, -16.137939453125, -15.5693359375, -15.000732421875, -14.43212890625, -13.863525390625, -13.294921875, -12.726318359375, -12.15771484375, -11.589111328125, -11.0205078125, -10.451904296875, -9.88330078125, -9.314697265625, -8.74609375, -8.177490234375, -7.60888671875, -7.040283203125, -6.4716796875, -5.903076171875, -5.33447265625, -4.765869140625, -4.197265625, -3.628662109375, -3.06005859375, -2.491455078125, -1.9228515625, -1.354248046875, -0.78564453125, -0.217041015625, 0.3515625, 0.920166015625, 1.48876953125, 2.057373046875, 2.6259765625, 3.194580078125, 3.76318359375, 4.331787109375, 4.900390625, 5.468994140625, 6.03759765625, 6.606201171875, 7.1748046875, 7.743408203125, 8.31201171875, 8.880615234375, 9.44921875, 10.017822265625, 10.58642578125, 11.155029296875, 11.7236328125, 12.292236328125, 12.86083984375, 13.429443359375, 13.998046875, 14.566650390625, 15.13525390625, 15.703857421875, 16.2724609375, 16.841064453125, 17.40966796875, 17.978271484375, 18.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 11.0, 11.0, 21.0, 25.0, 30.0, 64.0, 81.0, 104.0, 127.0, 141.0, 104.0, 82.0, 46.0, 35.0, 32.0, 23.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015468597412109375, -0.001484990119934082, -0.0014231204986572266, -0.001361250877380371, -0.0012993812561035156, -0.0012375116348266602, -0.0011756420135498047, -0.0011137723922729492, -0.0010519027709960938, -0.0009900331497192383, -0.0009281635284423828, -0.0008662939071655273, -0.0008044242858886719, -0.0007425546646118164, -0.0006806850433349609, -0.0006188154220581055, -0.00055694580078125, -0.0004950761795043945, -0.00043320655822753906, -0.0003713369369506836, -0.0003094673156738281, -0.00024759769439697266, -0.0001857280731201172, -0.00012385845184326172, -6.198883056640625e-05, -1.1920928955078125e-07, 6.175041198730469e-05, 0.00012362003326416016, 0.00018548965454101562, 0.0002473592758178711, 0.00030922889709472656, 0.00037109851837158203, 0.0004329681396484375, 0.000494837760925293, 0.0005567073822021484, 0.0006185770034790039, 0.0006804466247558594, 0.0007423162460327148, 0.0008041858673095703, 0.0008660554885864258, 0.0009279251098632812, 0.0009897947311401367, 0.0010516643524169922, 0.0011135339736938477, 0.0011754035949707031, 0.0012372732162475586, 0.001299142837524414, 0.0013610124588012695, 0.001422882080078125, 0.0014847517013549805, 0.001546621322631836, 0.0016084909439086914, 0.0016703605651855469, 0.0017322301864624023, 0.0017940998077392578, 0.0018559694290161133, 0.0019178390502929688, 0.0019797086715698242, 0.0020415782928466797, 0.002103447914123535, 0.0021653175354003906, 0.002227187156677246, 0.0022890567779541016, 0.002350926399230957, 0.0024127960205078125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 24.0, 27.0, 69.0, 81.0, 123.0, 245.0, 426.0, 873.0, 2245.0, 7613.0, 40742.0, 548306.0, 404706.0, 32699.0, 6515.0, 2045.0, 803.0, 373.0, 208.0, 151.0, 86.0, 64.0, 37.0, 19.0, 12.0, 10.0, 3.0, 8.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.246337890625, -8.75830078125, -8.270263671875, -7.7822265625, -7.294189453125, -6.80615234375, -6.318115234375, -5.830078125, -5.342041015625, -4.85400390625, -4.365966796875, -3.8779296875, -3.389892578125, -2.90185546875, -2.413818359375, -1.92578125, -1.437744140625, -0.94970703125, -0.461669921875, 0.0263671875, 0.514404296875, 1.00244140625, 1.490478515625, 1.978515625, 2.466552734375, 2.95458984375, 3.442626953125, 3.9306640625, 4.418701171875, 4.90673828125, 5.394775390625, 5.8828125, 6.370849609375, 6.85888671875, 7.346923828125, 7.8349609375, 8.322998046875, 8.81103515625, 9.299072265625, 9.787109375, 10.275146484375, 10.76318359375, 11.251220703125, 11.7392578125, 12.227294921875, 12.71533203125, 13.203369140625, 13.69140625, 14.179443359375, 14.66748046875, 15.155517578125, 15.6435546875, 16.131591796875, 16.61962890625, 17.107666015625, 17.595703125, 18.083740234375, 18.57177734375, 19.059814453125, 19.5478515625, 20.035888671875, 20.52392578125, 21.011962890625, 21.5]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 9.0, 14.0, 26.0, 30.0, 40.0, 61.0, 116.0, 142.0, 163.0, 131.0, 76.0, 50.0, 44.0, 25.0, 11.0, 14.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.453125, -10.8818359375, -10.310546875, -9.7392578125, -9.16796875, -8.5966796875, -8.025390625, -7.4541015625, -6.8828125, -6.3115234375, -5.740234375, -5.1689453125, -4.59765625, -4.0263671875, -3.455078125, -2.8837890625, -2.3125, -1.7412109375, -1.169921875, -0.5986328125, -0.02734375, 0.5439453125, 1.115234375, 1.6865234375, 2.2578125, 2.8291015625, 3.400390625, 3.9716796875, 4.54296875, 5.1142578125, 5.685546875, 6.2568359375, 6.828125, 7.3994140625, 7.970703125, 8.5419921875, 9.11328125, 9.6845703125, 10.255859375, 10.8271484375, 11.3984375, 11.9697265625, 12.541015625, 13.1123046875, 13.68359375, 14.2548828125, 14.826171875, 15.3974609375, 15.96875, 16.5400390625, 17.111328125, 17.6826171875, 18.25390625, 18.8251953125, 19.396484375, 19.9677734375, 20.5390625, 21.1103515625, 21.681640625, 22.2529296875, 22.82421875, 23.3955078125, 23.966796875, 24.5380859375, 25.109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 12.0, 21.0, 37.0, 94.0, 211.0, 248.0, 191.0, 113.0, 44.0, 16.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-439.4387512207031, -428.66754150390625, -417.89630126953125, -407.1250915527344, -396.3538818359375, -385.5826416015625, -374.8114318847656, -364.04022216796875, -353.26898193359375, -342.4977722167969, -331.7265319824219, -320.955322265625, -310.18408203125, -299.4128723144531, -288.64166259765625, -277.87042236328125, -267.0992126464844, -256.3280029296875, -245.5567626953125, -234.78555297851562, -224.0143280029297, -213.24310302734375, -202.47189331054688, -191.70066833496094, -180.929443359375, -170.15821838378906, -159.38699340820312, -148.61578369140625, -137.8445587158203, -127.07333374023438, -116.30211639404297, -105.53089904785156, -94.7596435546875, -83.98841857910156, -73.21720123291016, -62.445980072021484, -51.67475891113281, -40.90353775024414, -30.13231658935547, -19.361099243164062, -8.589874267578125, 2.181346893310547, 12.952568054199219, 23.72378921508789, 34.49501037597656, 45.266231536865234, 56.037452697753906, 66.80867004394531, 77.57989501953125, 88.35111999511719, 99.1223373413086, 109.8935546875, 120.66477966308594, 131.43600463867188, 142.20721435546875, 152.9784393310547, 163.74966430664062, 174.52088928222656, 185.2921142578125, 196.06332397460938, 206.8345489501953, 217.60577392578125, 228.37698364257812, 239.14820861816406, 249.91943359375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 5.0, 8.0, 10.0, 11.0, 19.0, 20.0, 20.0, 28.0, 20.0, 31.0, 48.0, 41.0, 45.0, 56.0, 53.0, 51.0, 61.0, 50.0, 43.0, 56.0, 37.0, 43.0, 48.0, 38.0, 32.0, 23.0, 19.0, 10.0, 16.0, 9.0, 10.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.14907836914062, -163.138427734375, -157.12777709960938, -151.11712646484375, -145.10647583007812, -139.0958251953125, -133.08517456054688, -127.07450866699219, -121.06385803222656, -115.05320739746094, -109.04255676269531, -103.03190612792969, -97.02124786376953, -91.0105972290039, -84.99994659423828, -78.98928833007812, -72.97864532470703, -66.9679946899414, -60.957340240478516, -54.94668960571289, -48.93603515625, -42.925384521484375, -36.91473388671875, -30.90407943725586, -24.893428802490234, -18.882776260375977, -12.872124671936035, -6.861473083496094, -0.8508205413818359, 5.159832000732422, 11.170482635498047, 17.181137084960938, 23.191787719726562, 29.20244026184082, 35.21309280395508, 41.2237434387207, 47.234397888183594, 53.24504852294922, 59.255699157714844, 65.266357421875, 71.27700805664062, 77.28765869140625, 83.29830932617188, 89.3089599609375, 95.31961822509766, 101.33026885986328, 107.3409194946289, 113.35157775878906, 119.36222076416016, 125.37287139892578, 131.38352966308594, 137.39418029785156, 143.4048309326172, 149.4154815673828, 155.42613220214844, 161.43678283691406, 167.4474334716797, 173.4580841064453, 179.46873474121094, 185.47938537597656, 191.4900360107422, 197.50070190429688, 203.5113525390625, 209.52200317382812, 215.53265380859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 8.0, 20.0, 13.0, 21.0, 35.0, 44.0, 71.0, 143.0, 194.0, 419.0, 885.0, 1903.0, 5232.0, 20951.0, 360612.0, 3768590.0, 25309.0, 5836.0, 1995.0, 898.0, 471.0, 245.0, 116.0, 85.0, 52.0, 36.0, 28.0, 16.0, 17.0, 10.0, 11.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -34.888671875, -33.49609375, -32.103515625, -30.7109375, -29.318359375, -27.92578125, -26.533203125, -25.140625, -23.748046875, -22.35546875, -20.962890625, -19.5703125, -18.177734375, -16.78515625, -15.392578125, -14.0, -12.607421875, -11.21484375, -9.822265625, -8.4296875, -7.037109375, -5.64453125, -4.251953125, -2.859375, -1.466796875, -0.07421875, 1.318359375, 2.7109375, 4.103515625, 5.49609375, 6.888671875, 8.28125, 9.673828125, 11.06640625, 12.458984375, 13.8515625, 15.244140625, 16.63671875, 18.029296875, 19.421875, 20.814453125, 22.20703125, 23.599609375, 24.9921875, 26.384765625, 27.77734375, 29.169921875, 30.5625, 31.955078125, 33.34765625, 34.740234375, 36.1328125, 37.525390625, 38.91796875, 40.310546875, 41.703125, 43.095703125, 44.48828125, 45.880859375, 47.2734375, 48.666015625, 50.05859375, 51.451171875, 52.84375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 12.0, 8.0, 9.0, 18.0, 33.0, 47.0, 65.0, 80.0, 94.0, 92.0, 88.0, 96.0, 94.0, 82.0, 52.0, 43.0, 24.0, 24.0, 10.0, 6.0, 9.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.33203125, -20.7265625, -20.12109375, -19.515625, -18.91015625, -18.3046875, -17.69921875, -17.09375, -16.48828125, -15.8828125, -15.27734375, -14.671875, -14.06640625, -13.4609375, -12.85546875, -12.25, -11.64453125, -11.0390625, -10.43359375, -9.828125, -9.22265625, -8.6171875, -8.01171875, -7.40625, -6.80078125, -6.1953125, -5.58984375, -4.984375, -4.37890625, -3.7734375, -3.16796875, -2.5625, -1.95703125, -1.3515625, -0.74609375, -0.140625, 0.46484375, 1.0703125, 1.67578125, 2.28125, 2.88671875, 3.4921875, 4.09765625, 4.703125, 5.30859375, 5.9140625, 6.51953125, 7.125, 7.73046875, 8.3359375, 8.94140625, 9.546875, 10.15234375, 10.7578125, 11.36328125, 11.96875, 12.57421875, 13.1796875, 13.78515625, 14.390625, 14.99609375, 15.6015625, 16.20703125, 16.8125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 3.0, 7.0, 15.0, 17.0, 23.0, 42.0, 52.0, 70.0, 158.0, 240.0, 388.0, 725.0, 1497.0, 3144.0, 8743.0, 38268.0, 3855783.0, 251240.0, 22400.0, 6307.0, 2453.0, 1164.0, 603.0, 325.0, 195.0, 129.0, 86.0, 42.0, 34.0, 36.0, 24.0, 19.0, 9.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.875, -40.7685546875, -39.662109375, -38.5556640625, -37.44921875, -36.3427734375, -35.236328125, -34.1298828125, -33.0234375, -31.9169921875, -30.810546875, -29.7041015625, -28.59765625, -27.4912109375, -26.384765625, -25.2783203125, -24.171875, -23.0654296875, -21.958984375, -20.8525390625, -19.74609375, -18.6396484375, -17.533203125, -16.4267578125, -15.3203125, -14.2138671875, -13.107421875, -12.0009765625, -10.89453125, -9.7880859375, -8.681640625, -7.5751953125, -6.46875, -5.3623046875, -4.255859375, -3.1494140625, -2.04296875, -0.9365234375, 0.169921875, 1.2763671875, 2.3828125, 3.4892578125, 4.595703125, 5.7021484375, 6.80859375, 7.9150390625, 9.021484375, 10.1279296875, 11.234375, 12.3408203125, 13.447265625, 14.5537109375, 15.66015625, 16.7666015625, 17.873046875, 18.9794921875, 20.0859375, 21.1923828125, 22.298828125, 23.4052734375, 24.51171875, 25.6181640625, 26.724609375, 27.8310546875, 28.9375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 11.0, 11.0, 13.0, 16.0, 23.0, 37.0, 71.0, 126.0, 646.0, 2746.0, 152.0, 59.0, 38.0, 33.0, 21.0, 9.0, 11.0, 4.0, 8.0, 4.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-12.3671875, -12.06622314453125, -11.7652587890625, -11.46429443359375, -11.163330078125, -10.86236572265625, -10.5614013671875, -10.26043701171875, -9.95947265625, -9.65850830078125, -9.3575439453125, -9.05657958984375, -8.755615234375, -8.45465087890625, -8.1536865234375, -7.85272216796875, -7.5517578125, -7.25079345703125, -6.9498291015625, -6.64886474609375, -6.347900390625, -6.04693603515625, -5.7459716796875, -5.44500732421875, -5.14404296875, -4.84307861328125, -4.5421142578125, -4.24114990234375, -3.940185546875, -3.63922119140625, -3.3382568359375, -3.03729248046875, -2.736328125, -2.43536376953125, -2.1343994140625, -1.83343505859375, -1.532470703125, -1.23150634765625, -0.9305419921875, -0.62957763671875, -0.32861328125, -0.02764892578125, 0.2733154296875, 0.57427978515625, 0.875244140625, 1.17620849609375, 1.4771728515625, 1.77813720703125, 2.0791015625, 2.38006591796875, 2.6810302734375, 2.98199462890625, 3.282958984375, 3.58392333984375, 3.8848876953125, 4.18585205078125, 4.48681640625, 4.78778076171875, 5.0887451171875, 5.38970947265625, 5.690673828125, 5.99163818359375, 6.2926025390625, 6.59356689453125, 6.89453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 17.0, 32.0, 59.0, 74.0, 131.0, 154.0, 161.0, 141.0, 95.0, 62.0, 29.0, 13.0, 9.0, 7.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.1380844116211, -75.88655853271484, -73.63502502441406, -71.38349914550781, -69.13196563720703, -66.88043975830078, -64.62890625, -62.37738037109375, -60.125850677490234, -57.87432098388672, -55.6227912902832, -53.37126159667969, -51.11973571777344, -48.868202209472656, -46.616676330566406, -44.36514663696289, -42.113616943359375, -39.86208724975586, -37.610557556152344, -35.35902786254883, -33.10749816894531, -30.85597038269043, -28.604442596435547, -26.35291290283203, -24.101383209228516, -21.849853515625, -19.598323822021484, -17.3467960357666, -15.095266342163086, -12.84373664855957, -10.592207908630371, -8.340679168701172, -6.0891571044921875, -3.83762788772583, -1.5860986709594727, 0.6654305458068848, 2.916959762573242, 5.168489456176758, 7.420018196105957, 9.671546936035156, 11.923076629638672, 14.174606323242188, 16.426136016845703, 18.677663803100586, 20.9291934967041, 23.180723190307617, 25.4322509765625, 27.683780670166016, 29.93531036376953, 32.18684005737305, 34.43836975097656, 36.68989944458008, 38.941429138183594, 41.192955017089844, 43.44448471069336, 45.696014404296875, 47.94754409790039, 50.199073791503906, 52.45060348510742, 54.70213317871094, 56.95365905761719, 59.20519256591797, 61.45671844482422, 63.708248138427734, 65.95977783203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 8.0, 6.0, 12.0, 19.0, 13.0, 21.0, 24.0, 28.0, 33.0, 35.0, 52.0, 34.0, 36.0, 49.0, 31.0, 45.0, 46.0, 46.0, 36.0, 40.0, 38.0, 37.0, 43.0, 24.0, 32.0, 35.0, 32.0, 18.0, 15.0, 19.0, 23.0, 8.0, 6.0, 9.0, 6.0, 5.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.679134368896484, -23.871896743774414, -23.06465721130371, -22.25741958618164, -21.450180053710938, -20.642942428588867, -19.835704803466797, -19.028465270996094, -18.221227645874023, -17.413990020751953, -16.60675048828125, -15.79951286315918, -14.992274284362793, -14.185035705566406, -13.37779712677002, -12.570558547973633, -11.763319969177246, -10.95608139038086, -10.148842811584473, -9.341604232788086, -8.534366607666016, -7.727128028869629, -6.919889450073242, -6.112651348114014, -5.305412769317627, -4.49817419052124, -3.6909360885620117, -2.883697509765625, -2.0764591693878174, -1.2692208290100098, -0.46198225021362305, 0.34525585174560547, 1.1524944305419922, 1.9597327709197998, 2.7669711112976074, 3.574209690093994, 4.381447792053223, 5.188686370849609, 5.995924949645996, 6.803163051605225, 7.610401630401611, 8.41763973236084, 9.224878311157227, 10.032116889953613, 10.83935546875, 11.64659309387207, 12.453832626342773, 13.261070251464844, 14.06830883026123, 14.875547409057617, 15.682785987854004, 16.49002456665039, 17.29726219177246, 18.10449981689453, 18.911739349365234, 19.718976974487305, 20.526216506958008, 21.333454132080078, 22.14069366455078, 22.94793128967285, 23.755170822143555, 24.562408447265625, 25.369647979736328, 26.1768856048584, 26.98412322998047]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 15.0, 12.0, 10.0, 22.0, 45.0, 52.0, 76.0, 103.0, 173.0, 262.0, 445.0, 811.0, 1405.0, 2711.0, 5983.0, 13357.0, 33453.0, 84438.0, 211461.0, 366751.0, 194291.0, 78263.0, 30621.0, 12460.0, 5443.0, 2571.0, 1351.0, 767.0, 415.0, 275.0, 142.0, 116.0, 70.0, 43.0, 39.0, 30.0, 18.0, 15.0, 11.0, 0.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.40625, -20.703369140625, -20.00048828125, -19.297607421875, -18.5947265625, -17.891845703125, -17.18896484375, -16.486083984375, -15.783203125, -15.080322265625, -14.37744140625, -13.674560546875, -12.9716796875, -12.268798828125, -11.56591796875, -10.863037109375, -10.16015625, -9.457275390625, -8.75439453125, -8.051513671875, -7.3486328125, -6.645751953125, -5.94287109375, -5.239990234375, -4.537109375, -3.834228515625, -3.13134765625, -2.428466796875, -1.7255859375, -1.022705078125, -0.31982421875, 0.383056640625, 1.0859375, 1.788818359375, 2.49169921875, 3.194580078125, 3.8974609375, 4.600341796875, 5.30322265625, 6.006103515625, 6.708984375, 7.411865234375, 8.11474609375, 8.817626953125, 9.5205078125, 10.223388671875, 10.92626953125, 11.629150390625, 12.33203125, 13.034912109375, 13.73779296875, 14.440673828125, 15.1435546875, 15.846435546875, 16.54931640625, 17.252197265625, 17.955078125, 18.657958984375, 19.36083984375, 20.063720703125, 20.7666015625, 21.469482421875, 22.17236328125, 22.875244140625, 23.578125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 6.0, 11.0, 10.0, 15.0, 24.0, 28.0, 49.0, 60.0, 73.0, 72.0, 77.0, 96.0, 72.0, 84.0, 76.0, 52.0, 43.0, 38.0, 27.0, 22.0, 21.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-19.953125, -19.436279296875, -18.91943359375, -18.402587890625, -17.8857421875, -17.368896484375, -16.85205078125, -16.335205078125, -15.818359375, -15.301513671875, -14.78466796875, -14.267822265625, -13.7509765625, -13.234130859375, -12.71728515625, -12.200439453125, -11.68359375, -11.166748046875, -10.64990234375, -10.133056640625, -9.6162109375, -9.099365234375, -8.58251953125, -8.065673828125, -7.548828125, -7.031982421875, -6.51513671875, -5.998291015625, -5.4814453125, -4.964599609375, -4.44775390625, -3.930908203125, -3.4140625, -2.897216796875, -2.38037109375, -1.863525390625, -1.3466796875, -0.829833984375, -0.31298828125, 0.203857421875, 0.720703125, 1.237548828125, 1.75439453125, 2.271240234375, 2.7880859375, 3.304931640625, 3.82177734375, 4.338623046875, 4.85546875, 5.372314453125, 5.88916015625, 6.406005859375, 6.9228515625, 7.439697265625, 7.95654296875, 8.473388671875, 8.990234375, 9.507080078125, 10.02392578125, 10.540771484375, 11.0576171875, 11.574462890625, 12.09130859375, 12.608154296875, 13.125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 7.0, 16.0, 20.0, 22.0, 33.0, 59.0, 74.0, 102.0, 144.0, 207.0, 353.0, 629.0, 1192.0, 2735.0, 9321.0, 56398.0, 520188.0, 399974.0, 44054.0, 8010.0, 2440.0, 1062.0, 562.0, 341.0, 197.0, 122.0, 79.0, 67.0, 37.0, 34.0, 13.0, 11.0, 12.0, 14.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.1875, -42.9580078125, -41.728515625, -40.4990234375, -39.26953125, -38.0400390625, -36.810546875, -35.5810546875, -34.3515625, -33.1220703125, -31.892578125, -30.6630859375, -29.43359375, -28.2041015625, -26.974609375, -25.7451171875, -24.515625, -23.2861328125, -22.056640625, -20.8271484375, -19.59765625, -18.3681640625, -17.138671875, -15.9091796875, -14.6796875, -13.4501953125, -12.220703125, -10.9912109375, -9.76171875, -8.5322265625, -7.302734375, -6.0732421875, -4.84375, -3.6142578125, -2.384765625, -1.1552734375, 0.07421875, 1.3037109375, 2.533203125, 3.7626953125, 4.9921875, 6.2216796875, 7.451171875, 8.6806640625, 9.91015625, 11.1396484375, 12.369140625, 13.5986328125, 14.828125, 16.0576171875, 17.287109375, 18.5166015625, 19.74609375, 20.9755859375, 22.205078125, 23.4345703125, 24.6640625, 25.8935546875, 27.123046875, 28.3525390625, 29.58203125, 30.8115234375, 32.041015625, 33.2705078125, 34.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 8.0, 8.0, 8.0, 5.0, 10.0, 10.0, 11.0, 22.0, 16.0, 25.0, 21.0, 37.0, 30.0, 33.0, 48.0, 48.0, 57.0, 49.0, 43.0, 54.0, 56.0, 48.0, 46.0, 46.0, 49.0, 34.0, 24.0, 30.0, 24.0, 20.0, 15.0, 18.0, 9.0, 16.0, 5.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.5146484375, -33.248046875, -31.9814453125, -30.71484375, -29.4482421875, -28.181640625, -26.9150390625, -25.6484375, -24.3818359375, -23.115234375, -21.8486328125, -20.58203125, -19.3154296875, -18.048828125, -16.7822265625, -15.515625, -14.2490234375, -12.982421875, -11.7158203125, -10.44921875, -9.1826171875, -7.916015625, -6.6494140625, -5.3828125, -4.1162109375, -2.849609375, -1.5830078125, -0.31640625, 0.9501953125, 2.216796875, 3.4833984375, 4.75, 6.0166015625, 7.283203125, 8.5498046875, 9.81640625, 11.0830078125, 12.349609375, 13.6162109375, 14.8828125, 16.1494140625, 17.416015625, 18.6826171875, 19.94921875, 21.2158203125, 22.482421875, 23.7490234375, 25.015625, 26.2822265625, 27.548828125, 28.8154296875, 30.08203125, 31.3486328125, 32.615234375, 33.8818359375, 35.1484375, 36.4150390625, 37.681640625, 38.9482421875, 40.21484375, 41.4814453125, 42.748046875, 44.0146484375, 45.28125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 13.0, 29.0, 46.0, 56.0, 99.0, 161.0, 263.0, 574.0, 1259.0, 3455.0, 13267.0, 72578.0, 498860.0, 384502.0, 57273.0, 10977.0, 3026.0, 1000.0, 476.0, 246.0, 130.0, 94.0, 53.0, 36.0, 19.0, 17.0, 7.0, 8.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.015625, -6.709716796875, -6.40380859375, -6.097900390625, -5.7919921875, -5.486083984375, -5.18017578125, -4.874267578125, -4.568359375, -4.262451171875, -3.95654296875, -3.650634765625, -3.3447265625, -3.038818359375, -2.73291015625, -2.427001953125, -2.12109375, -1.815185546875, -1.50927734375, -1.203369140625, -0.8974609375, -0.591552734375, -0.28564453125, 0.020263671875, 0.326171875, 0.632080078125, 0.93798828125, 1.243896484375, 1.5498046875, 1.855712890625, 2.16162109375, 2.467529296875, 2.7734375, 3.079345703125, 3.38525390625, 3.691162109375, 3.9970703125, 4.302978515625, 4.60888671875, 4.914794921875, 5.220703125, 5.526611328125, 5.83251953125, 6.138427734375, 6.4443359375, 6.750244140625, 7.05615234375, 7.362060546875, 7.66796875, 7.973876953125, 8.27978515625, 8.585693359375, 8.8916015625, 9.197509765625, 9.50341796875, 9.809326171875, 10.115234375, 10.421142578125, 10.72705078125, 11.032958984375, 11.3388671875, 11.644775390625, 11.95068359375, 12.256591796875, 12.5625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 4.0, 15.0, 12.0, 12.0, 15.0, 19.0, 20.0, 35.0, 41.0, 63.0, 59.0, 87.0, 121.0, 102.0, 95.0, 65.0, 50.0, 37.0, 27.0, 22.0, 21.0, 16.0, 6.0, 8.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002079010009765625, -0.002019554376602173, -0.0019600987434387207, -0.0019006431102752686, -0.0018411874771118164, -0.0017817318439483643, -0.0017222762107849121, -0.00166282057762146, -0.0016033649444580078, -0.0015439093112945557, -0.0014844536781311035, -0.0014249980449676514, -0.0013655424118041992, -0.001306086778640747, -0.001246631145477295, -0.0011871755123138428, -0.0011277198791503906, -0.0010682642459869385, -0.0010088086128234863, -0.0009493529796600342, -0.000889897346496582, -0.0008304417133331299, -0.0007709860801696777, -0.0007115304470062256, -0.0006520748138427734, -0.0005926191806793213, -0.0005331635475158691, -0.000473707914352417, -0.00041425228118896484, -0.0003547966480255127, -0.00029534101486206055, -0.0002358853816986084, -0.00017642974853515625, -0.0001169741153717041, -5.751848220825195e-05, 1.9371509552001953e-06, 6.139278411865234e-05, 0.00012084841728210449, 0.00018030405044555664, 0.0002397596836090088, 0.00029921531677246094, 0.0003586709499359131, 0.00041812658309936523, 0.0004775822162628174, 0.0005370378494262695, 0.0005964934825897217, 0.0006559491157531738, 0.000715404748916626, 0.0007748603820800781, 0.0008343160152435303, 0.0008937716484069824, 0.0009532272815704346, 0.0010126829147338867, 0.0010721385478973389, 0.001131594181060791, 0.0011910498142242432, 0.0012505054473876953, 0.0013099610805511475, 0.0013694167137145996, 0.0014288723468780518, 0.001488327980041504, 0.001547783613204956, 0.0016072392463684082, 0.0016666948795318604, 0.0017261505126953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 11.0, 26.0, 37.0, 78.0, 189.0, 454.0, 1234.0, 5123.0, 58338.0, 833656.0, 138192.0, 8523.0, 1689.0, 545.0, 226.0, 110.0, 43.0, 36.0, 13.0, 11.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.078125, -19.498291015625, -18.91845703125, -18.338623046875, -17.7587890625, -17.178955078125, -16.59912109375, -16.019287109375, -15.439453125, -14.859619140625, -14.27978515625, -13.699951171875, -13.1201171875, -12.540283203125, -11.96044921875, -11.380615234375, -10.80078125, -10.220947265625, -9.64111328125, -9.061279296875, -8.4814453125, -7.901611328125, -7.32177734375, -6.741943359375, -6.162109375, -5.582275390625, -5.00244140625, -4.422607421875, -3.8427734375, -3.262939453125, -2.68310546875, -2.103271484375, -1.5234375, -0.943603515625, -0.36376953125, 0.216064453125, 0.7958984375, 1.375732421875, 1.95556640625, 2.535400390625, 3.115234375, 3.695068359375, 4.27490234375, 4.854736328125, 5.4345703125, 6.014404296875, 6.59423828125, 7.174072265625, 7.75390625, 8.333740234375, 8.91357421875, 9.493408203125, 10.0732421875, 10.653076171875, 11.23291015625, 11.812744140625, 12.392578125, 12.972412109375, 13.55224609375, 14.132080078125, 14.7119140625, 15.291748046875, 15.87158203125, 16.451416015625, 17.03125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 15.0, 35.0, 28.0, 50.0, 53.0, 94.0, 91.0, 96.0, 101.0, 99.0, 91.0, 74.0, 43.0, 36.0, 21.0, 19.0, 16.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1328125, -7.7264404296875, -7.320068359375, -6.9136962890625, -6.50732421875, -6.1009521484375, -5.694580078125, -5.2882080078125, -4.8818359375, -4.4754638671875, -4.069091796875, -3.6627197265625, -3.25634765625, -2.8499755859375, -2.443603515625, -2.0372314453125, -1.630859375, -1.2244873046875, -0.818115234375, -0.4117431640625, -0.00537109375, 0.4010009765625, 0.807373046875, 1.2137451171875, 1.6201171875, 2.0264892578125, 2.432861328125, 2.8392333984375, 3.24560546875, 3.6519775390625, 4.058349609375, 4.4647216796875, 4.87109375, 5.2774658203125, 5.683837890625, 6.0902099609375, 6.49658203125, 6.9029541015625, 7.309326171875, 7.7156982421875, 8.1220703125, 8.5284423828125, 8.934814453125, 9.3411865234375, 9.74755859375, 10.1539306640625, 10.560302734375, 10.9666748046875, 11.373046875, 11.7794189453125, 12.185791015625, 12.5921630859375, 12.99853515625, 13.4049072265625, 13.811279296875, 14.2176513671875, 14.6240234375, 15.0303955078125, 15.436767578125, 15.8431396484375, 16.24951171875, 16.6558837890625, 17.062255859375, 17.4686279296875, 17.875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 15.0, 12.0, 24.0, 27.0, 45.0, 62.0, 82.0, 93.0, 88.0, 123.0, 112.0, 82.0, 76.0, 57.0, 22.0, 20.0, 18.0, 7.0, 4.0, 0.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.87744140625, -189.8155975341797, -183.75375366210938, -177.69190979003906, -171.63006591796875, -165.56820678710938, -159.50637817382812, -153.44451904296875, -147.38267517089844, -141.32083129882812, -135.2589874267578, -129.1971435546875, -123.13529205322266, -117.07344818115234, -111.01160430908203, -104.94975280761719, -98.8879165649414, -92.8260726928711, -86.76422882080078, -80.70237731933594, -74.64053344726562, -68.57868957519531, -62.516845703125, -56.45499801635742, -50.39315414428711, -44.3313102722168, -38.26946258544922, -32.207618713378906, -26.14577293395996, -20.083927154541016, -14.022083282470703, -7.960235595703125, -1.8983917236328125, 4.163453578948975, 10.225298881530762, 16.28714370727539, 22.348989486694336, 28.41083526611328, 34.472679138183594, 40.53452682495117, 46.596370697021484, 52.6582145690918, 58.720062255859375, 64.78190612792969, 70.84375, 76.90559387207031, 82.96743774414062, 89.02928924560547, 95.09113311767578, 101.1529769897461, 107.2148208618164, 113.27667236328125, 119.33851623535156, 125.40036010742188, 131.4622039794922, 137.5240478515625, 143.5858917236328, 149.64773559570312, 155.70957946777344, 161.77142333984375, 167.83326721191406, 173.89511108398438, 179.95697021484375, 186.01881408691406, 192.08065795898438]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 19.0, 4.0, 13.0, 20.0, 28.0, 30.0, 27.0, 37.0, 42.0, 42.0, 55.0, 39.0, 70.0, 53.0, 61.0, 73.0, 53.0, 44.0, 42.0, 48.0, 35.0, 37.0, 20.0, 24.0, 19.0, 16.0, 9.0, 13.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.36550903320312, -168.04466247558594, -161.7238311767578, -155.40298461914062, -149.0821533203125, -142.7613067626953, -136.44046020507812, -130.11962890625, -123.79878997802734, -117.47795104980469, -111.15711212158203, -104.83627319335938, -98.51542663574219, -92.19459533691406, -85.87374877929688, -79.55290985107422, -73.23207092285156, -66.9112319946289, -60.59039306640625, -54.26955032348633, -47.94871139526367, -41.627872467041016, -35.307029724121094, -28.986190795898438, -22.66535186767578, -16.344512939453125, -10.023672103881836, -3.702831268310547, 2.6180076599121094, 8.938846588134766, 15.259689331054688, 21.580528259277344, 27.9013671875, 34.222206115722656, 40.54304504394531, 46.863887786865234, 53.18472671508789, 59.50556564331055, 65.82640838623047, 72.14724731445312, 78.46808624267578, 84.78892517089844, 91.1097640991211, 97.43060302734375, 103.75144958496094, 110.07228088378906, 116.39312744140625, 122.7139663696289, 129.03480529785156, 135.35565185546875, 141.67648315429688, 147.99732971191406, 154.3181610107422, 160.63900756835938, 166.9598388671875, 173.2806854248047, 179.60153198242188, 185.92237854003906, 192.2432098388672, 198.56405639648438, 204.8848876953125, 211.2057342529297, 217.52658081054688, 223.847412109375, 230.16824340820312]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 9.0, 15.0, 11.0, 28.0, 39.0, 47.0, 84.0, 149.0, 217.0, 383.0, 621.0, 1054.0, 2076.0, 3858.0, 8071.0, 18163.0, 47180.0, 167764.0, 1662907.0, 2010443.0, 185059.0, 49489.0, 18966.0, 8336.0, 4118.0, 2178.0, 1191.0, 675.0, 420.0, 235.0, 160.0, 101.0, 58.0, 46.0, 40.0, 11.0, 14.0, 10.0, 11.0, 2.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.62109375, -13.1171875, -12.61328125, -12.109375, -11.60546875, -11.1015625, -10.59765625, -10.09375, -9.58984375, -9.0859375, -8.58203125, -8.078125, -7.57421875, -7.0703125, -6.56640625, -6.0625, -5.55859375, -5.0546875, -4.55078125, -4.046875, -3.54296875, -3.0390625, -2.53515625, -2.03125, -1.52734375, -1.0234375, -0.51953125, -0.015625, 0.48828125, 0.9921875, 1.49609375, 2.0, 2.50390625, 3.0078125, 3.51171875, 4.015625, 4.51953125, 5.0234375, 5.52734375, 6.03125, 6.53515625, 7.0390625, 7.54296875, 8.046875, 8.55078125, 9.0546875, 9.55859375, 10.0625, 10.56640625, 11.0703125, 11.57421875, 12.078125, 12.58203125, 13.0859375, 13.58984375, 14.09375, 14.59765625, 15.1015625, 15.60546875, 16.109375, 16.61328125, 17.1171875, 17.62109375, 18.125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 4.0, 3.0, 14.0, 14.0, 20.0, 18.0, 32.0, 19.0, 35.0, 47.0, 55.0, 64.0, 61.0, 64.0, 68.0, 72.0, 55.0, 48.0, 47.0, 45.0, 49.0, 33.0, 22.0, 24.0, 21.0, 8.0, 9.0, 8.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.9197998046875, -8.581787109375, -8.2437744140625, -7.90576171875, -7.5677490234375, -7.229736328125, -6.8917236328125, -6.5537109375, -6.2156982421875, -5.877685546875, -5.5396728515625, -5.20166015625, -4.8636474609375, -4.525634765625, -4.1876220703125, -3.849609375, -3.5115966796875, -3.173583984375, -2.8355712890625, -2.49755859375, -2.1595458984375, -1.821533203125, -1.4835205078125, -1.1455078125, -0.8074951171875, -0.469482421875, -0.1314697265625, 0.20654296875, 0.5445556640625, 0.882568359375, 1.2205810546875, 1.55859375, 1.8966064453125, 2.234619140625, 2.5726318359375, 2.91064453125, 3.2486572265625, 3.586669921875, 3.9246826171875, 4.2626953125, 4.6007080078125, 4.938720703125, 5.2767333984375, 5.61474609375, 5.9527587890625, 6.290771484375, 6.6287841796875, 6.966796875, 7.3048095703125, 7.642822265625, 7.9808349609375, 8.31884765625, 8.6568603515625, 8.994873046875, 9.3328857421875, 9.6708984375, 10.0089111328125, 10.346923828125, 10.6849365234375, 11.02294921875, 11.3609619140625, 11.698974609375, 12.0369873046875, 12.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 2.0, 4.0, 9.0, 6.0, 13.0, 18.0, 38.0, 43.0, 63.0, 128.0, 243.0, 455.0, 1178.0, 2871.0, 8084.0, 27439.0, 142782.0, 3095730.0, 818667.0, 70819.0, 16977.0, 5269.0, 1870.0, 785.0, 331.0, 172.0, 85.0, 52.0, 41.0, 23.0, 15.0, 10.0, 7.0, 5.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.2529296875, -24.458984375, -23.6650390625, -22.87109375, -22.0771484375, -21.283203125, -20.4892578125, -19.6953125, -18.9013671875, -18.107421875, -17.3134765625, -16.51953125, -15.7255859375, -14.931640625, -14.1376953125, -13.34375, -12.5498046875, -11.755859375, -10.9619140625, -10.16796875, -9.3740234375, -8.580078125, -7.7861328125, -6.9921875, -6.1982421875, -5.404296875, -4.6103515625, -3.81640625, -3.0224609375, -2.228515625, -1.4345703125, -0.640625, 0.1533203125, 0.947265625, 1.7412109375, 2.53515625, 3.3291015625, 4.123046875, 4.9169921875, 5.7109375, 6.5048828125, 7.298828125, 8.0927734375, 8.88671875, 9.6806640625, 10.474609375, 11.2685546875, 12.0625, 12.8564453125, 13.650390625, 14.4443359375, 15.23828125, 16.0322265625, 16.826171875, 17.6201171875, 18.4140625, 19.2080078125, 20.001953125, 20.7958984375, 21.58984375, 22.3837890625, 23.177734375, 23.9716796875, 24.765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 9.0, 8.0, 23.0, 23.0, 39.0, 50.0, 113.0, 191.0, 415.0, 932.0, 1104.0, 494.0, 247.0, 142.0, 89.0, 51.0, 32.0, 21.0, 23.0, 13.0, 6.0, 4.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.9375, -27.068359375, -26.19921875, -25.330078125, -24.4609375, -23.591796875, -22.72265625, -21.853515625, -20.984375, -20.115234375, -19.24609375, -18.376953125, -17.5078125, -16.638671875, -15.76953125, -14.900390625, -14.03125, -13.162109375, -12.29296875, -11.423828125, -10.5546875, -9.685546875, -8.81640625, -7.947265625, -7.078125, -6.208984375, -5.33984375, -4.470703125, -3.6015625, -2.732421875, -1.86328125, -0.994140625, -0.125, 0.744140625, 1.61328125, 2.482421875, 3.3515625, 4.220703125, 5.08984375, 5.958984375, 6.828125, 7.697265625, 8.56640625, 9.435546875, 10.3046875, 11.173828125, 12.04296875, 12.912109375, 13.78125, 14.650390625, 15.51953125, 16.388671875, 17.2578125, 18.126953125, 18.99609375, 19.865234375, 20.734375, 21.603515625, 22.47265625, 23.341796875, 24.2109375, 25.080078125, 25.94921875, 26.818359375, 27.6875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 15.0, 39.0, 88.0, 143.0, 199.0, 206.0, 152.0, 77.0, 21.0, 19.0, 12.0, 8.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-301.9026794433594, -292.92535400390625, -283.947998046875, -274.9706726074219, -265.99334716796875, -257.0159912109375, -248.03866577148438, -239.06134033203125, -230.08399963378906, -221.10665893554688, -212.12933349609375, -203.15199279785156, -194.17465209960938, -185.19732666015625, -176.21998596191406, -167.24264526367188, -158.26531982421875, -149.28797912597656, -140.31065368652344, -131.33331298828125, -122.3559799194336, -113.37864685058594, -104.40130615234375, -95.4239730834961, -86.44664001464844, -77.46930694580078, -68.49197387695312, -59.51463317871094, -50.53730010986328, -41.559967041015625, -32.5826301574707, -23.60529327392578, -14.6279296875, -5.650594711303711, 3.326740264892578, 12.304075241088867, 21.281410217285156, 30.258743286132812, 39.236080169677734, 48.213417053222656, 57.19075012207031, 66.16808319091797, 75.14541625976562, 84.12275695800781, 93.10009002685547, 102.07742309570312, 111.05476379394531, 120.03209686279297, 129.00942993164062, 137.9867706298828, 146.96409606933594, 155.94143676757812, 164.91876220703125, 173.89610290527344, 182.87344360351562, 191.85076904296875, 200.82810974121094, 209.80545043945312, 218.78277587890625, 227.76011657714844, 236.73745727539062, 245.71478271484375, 254.69212341308594, 263.6694641113281, 272.64678955078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 10.0, 17.0, 19.0, 14.0, 29.0, 31.0, 26.0, 33.0, 38.0, 27.0, 43.0, 52.0, 57.0, 40.0, 59.0, 45.0, 37.0, 48.0, 53.0, 41.0, 28.0, 46.0, 37.0, 24.0, 20.0, 19.0, 22.0, 15.0, 9.0, 10.0, 15.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.10187530517578, -110.51746368408203, -106.93305969238281, -103.34864807128906, -99.76424407958984, -96.1798324584961, -92.59542846679688, -89.01101684570312, -85.42660522460938, -81.84219360351562, -78.2577896118164, -74.67337799072266, -71.08897399902344, -67.50456237792969, -63.9201545715332, -60.33574676513672, -56.751338958740234, -53.16693115234375, -49.582523345947266, -45.99811553955078, -42.41370391845703, -38.82929611206055, -35.24488830566406, -31.660478591918945, -28.07607078552246, -24.491662979125977, -20.90725326538086, -17.322845458984375, -13.738436698913574, -10.154027938842773, -6.569620132446289, -2.985210418701172, 0.5991973876953125, 4.183606147766113, 7.768014430999756, 11.352422714233398, 14.9368314743042, 18.521240234375, 22.105648040771484, 25.6900577545166, 29.274465560913086, 32.8588752746582, 36.44328308105469, 40.02769088745117, 43.612098693847656, 47.196510314941406, 50.780914306640625, 54.365325927734375, 57.94973373413086, 61.534141540527344, 65.1185531616211, 68.70295715332031, 72.28736877441406, 75.87178039550781, 79.45618438720703, 83.04059600830078, 86.625, 90.20941162109375, 93.79381561279297, 97.37822723388672, 100.96263122558594, 104.54704284667969, 108.13145446777344, 111.71585845947266, 115.3002700805664]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 13.0, 14.0, 10.0, 21.0, 32.0, 57.0, 88.0, 135.0, 249.0, 359.0, 620.0, 1065.0, 1764.0, 3469.0, 6736.0, 13940.0, 31028.0, 70192.0, 173650.0, 367271.0, 219828.0, 86220.0, 37702.0, 17084.0, 7905.0, 3950.0, 2142.0, 1234.0, 667.0, 359.0, 242.0, 180.0, 111.0, 55.0, 48.0, 37.0, 25.0, 17.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.984375, -17.449462890625, -16.91455078125, -16.379638671875, -15.8447265625, -15.309814453125, -14.77490234375, -14.239990234375, -13.705078125, -13.170166015625, -12.63525390625, -12.100341796875, -11.5654296875, -11.030517578125, -10.49560546875, -9.960693359375, -9.42578125, -8.890869140625, -8.35595703125, -7.821044921875, -7.2861328125, -6.751220703125, -6.21630859375, -5.681396484375, -5.146484375, -4.611572265625, -4.07666015625, -3.541748046875, -3.0068359375, -2.471923828125, -1.93701171875, -1.402099609375, -0.8671875, -0.332275390625, 0.20263671875, 0.737548828125, 1.2724609375, 1.807373046875, 2.34228515625, 2.877197265625, 3.412109375, 3.947021484375, 4.48193359375, 5.016845703125, 5.5517578125, 6.086669921875, 6.62158203125, 7.156494140625, 7.69140625, 8.226318359375, 8.76123046875, 9.296142578125, 9.8310546875, 10.365966796875, 10.90087890625, 11.435791015625, 11.970703125, 12.505615234375, 13.04052734375, 13.575439453125, 14.1103515625, 14.645263671875, 15.18017578125, 15.715087890625, 16.25]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 12.0, 7.0, 17.0, 17.0, 23.0, 28.0, 19.0, 29.0, 33.0, 47.0, 52.0, 53.0, 59.0, 64.0, 72.0, 65.0, 59.0, 43.0, 53.0, 37.0, 40.0, 31.0, 28.0, 26.0, 21.0, 16.0, 8.0, 9.0, 8.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.9705810546875, -8.628662109375, -8.2867431640625, -7.94482421875, -7.6029052734375, -7.260986328125, -6.9190673828125, -6.5771484375, -6.2352294921875, -5.893310546875, -5.5513916015625, -5.20947265625, -4.8675537109375, -4.525634765625, -4.1837158203125, -3.841796875, -3.4998779296875, -3.157958984375, -2.8160400390625, -2.47412109375, -2.1322021484375, -1.790283203125, -1.4483642578125, -1.1064453125, -0.7645263671875, -0.422607421875, -0.0806884765625, 0.26123046875, 0.6031494140625, 0.945068359375, 1.2869873046875, 1.62890625, 1.9708251953125, 2.312744140625, 2.6546630859375, 2.99658203125, 3.3385009765625, 3.680419921875, 4.0223388671875, 4.3642578125, 4.7061767578125, 5.048095703125, 5.3900146484375, 5.73193359375, 6.0738525390625, 6.415771484375, 6.7576904296875, 7.099609375, 7.4415283203125, 7.783447265625, 8.1253662109375, 8.46728515625, 8.8092041015625, 9.151123046875, 9.4930419921875, 9.8349609375, 10.1768798828125, 10.518798828125, 10.8607177734375, 11.20263671875, 11.5445556640625, 11.886474609375, 12.2283935546875, 12.5703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 16.0, 20.0, 22.0, 45.0, 60.0, 111.0, 178.0, 354.0, 711.0, 1603.0, 4796.0, 32380.0, 682445.0, 301532.0, 18270.0, 3380.0, 1215.0, 614.0, 290.0, 176.0, 94.0, 83.0, 51.0, 36.0, 19.0, 12.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.0693359375, -45.544921875, -44.0205078125, -42.49609375, -40.9716796875, -39.447265625, -37.9228515625, -36.3984375, -34.8740234375, -33.349609375, -31.8251953125, -30.30078125, -28.7763671875, -27.251953125, -25.7275390625, -24.203125, -22.6787109375, -21.154296875, -19.6298828125, -18.10546875, -16.5810546875, -15.056640625, -13.5322265625, -12.0078125, -10.4833984375, -8.958984375, -7.4345703125, -5.91015625, -4.3857421875, -2.861328125, -1.3369140625, 0.1875, 1.7119140625, 3.236328125, 4.7607421875, 6.28515625, 7.8095703125, 9.333984375, 10.8583984375, 12.3828125, 13.9072265625, 15.431640625, 16.9560546875, 18.48046875, 20.0048828125, 21.529296875, 23.0537109375, 24.578125, 26.1025390625, 27.626953125, 29.1513671875, 30.67578125, 32.2001953125, 33.724609375, 35.2490234375, 36.7734375, 38.2978515625, 39.822265625, 41.3466796875, 42.87109375, 44.3955078125, 45.919921875, 47.4443359375, 48.96875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 12.0, 15.0, 22.0, 18.0, 24.0, 23.0, 26.0, 40.0, 37.0, 53.0, 49.0, 48.0, 60.0, 48.0, 62.0, 55.0, 51.0, 50.0, 50.0, 48.0, 25.0, 37.0, 32.0, 24.0, 18.0, 14.0, 20.0, 10.0, 8.0, 6.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.53125, -41.2861328125, -40.041015625, -38.7958984375, -37.55078125, -36.3056640625, -35.060546875, -33.8154296875, -32.5703125, -31.3251953125, -30.080078125, -28.8349609375, -27.58984375, -26.3447265625, -25.099609375, -23.8544921875, -22.609375, -21.3642578125, -20.119140625, -18.8740234375, -17.62890625, -16.3837890625, -15.138671875, -13.8935546875, -12.6484375, -11.4033203125, -10.158203125, -8.9130859375, -7.66796875, -6.4228515625, -5.177734375, -3.9326171875, -2.6875, -1.4423828125, -0.197265625, 1.0478515625, 2.29296875, 3.5380859375, 4.783203125, 6.0283203125, 7.2734375, 8.5185546875, 9.763671875, 11.0087890625, 12.25390625, 13.4990234375, 14.744140625, 15.9892578125, 17.234375, 18.4794921875, 19.724609375, 20.9697265625, 22.21484375, 23.4599609375, 24.705078125, 25.9501953125, 27.1953125, 28.4404296875, 29.685546875, 30.9306640625, 32.17578125, 33.4208984375, 34.666015625, 35.9111328125, 37.15625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 8.0, 6.0, 15.0, 19.0, 33.0, 46.0, 74.0, 133.0, 242.0, 621.0, 2135.0, 12394.0, 185781.0, 800742.0, 39773.0, 4548.0, 1122.0, 419.0, 165.0, 88.0, 57.0, 38.0, 26.0, 18.0, 16.0, 5.0, 5.0, 4.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.15087890625, -15.5986328125, -15.04638671875, -14.494140625, -13.94189453125, -13.3896484375, -12.83740234375, -12.28515625, -11.73291015625, -11.1806640625, -10.62841796875, -10.076171875, -9.52392578125, -8.9716796875, -8.41943359375, -7.8671875, -7.31494140625, -6.7626953125, -6.21044921875, -5.658203125, -5.10595703125, -4.5537109375, -4.00146484375, -3.44921875, -2.89697265625, -2.3447265625, -1.79248046875, -1.240234375, -0.68798828125, -0.1357421875, 0.41650390625, 0.96875, 1.52099609375, 2.0732421875, 2.62548828125, 3.177734375, 3.72998046875, 4.2822265625, 4.83447265625, 5.38671875, 5.93896484375, 6.4912109375, 7.04345703125, 7.595703125, 8.14794921875, 8.7001953125, 9.25244140625, 9.8046875, 10.35693359375, 10.9091796875, 11.46142578125, 12.013671875, 12.56591796875, 13.1181640625, 13.67041015625, 14.22265625, 14.77490234375, 15.3271484375, 15.87939453125, 16.431640625, 16.98388671875, 17.5361328125, 18.08837890625, 18.640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 4.0, 3.0, 8.0, 9.0, 7.0, 7.0, 14.0, 13.0, 10.0, 15.0, 15.0, 25.0, 27.0, 42.0, 59.0, 74.0, 96.0, 120.0, 124.0, 65.0, 55.0, 31.0, 33.0, 20.0, 21.0, 19.0, 7.0, 9.0, 5.0, 17.0, 9.0, 9.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016498565673828125, -0.0015919506549835205, -0.0015340447425842285, -0.0014761388301849365, -0.0014182329177856445, -0.0013603270053863525, -0.0013024210929870605, -0.0012445151805877686, -0.0011866092681884766, -0.0011287033557891846, -0.0010707974433898926, -0.0010128915309906006, -0.0009549856185913086, -0.0008970797061920166, -0.0008391737937927246, -0.0007812678813934326, -0.0007233619689941406, -0.0006654560565948486, -0.0006075501441955566, -0.0005496442317962646, -0.0004917383193969727, -0.00043383240699768066, -0.00037592649459838867, -0.0003180205821990967, -0.0002601146697998047, -0.0002022087574005127, -0.0001443028450012207, -8.639693260192871e-05, -2.849102020263672e-05, 2.9414892196655273e-05, 8.732080459594727e-05, 0.00014522671699523926, 0.00020313262939453125, 0.00026103854179382324, 0.00031894445419311523, 0.0003768503665924072, 0.0004347562789916992, 0.0004926621913909912, 0.0005505681037902832, 0.0006084740161895752, 0.0006663799285888672, 0.0007242858409881592, 0.0007821917533874512, 0.0008400976657867432, 0.0008980035781860352, 0.0009559094905853271, 0.0010138154029846191, 0.0010717213153839111, 0.0011296272277832031, 0.0011875331401824951, 0.0012454390525817871, 0.001303344964981079, 0.001361250877380371, 0.001419156789779663, 0.001477062702178955, 0.001534968614578247, 0.001592874526977539, 0.001650780439376831, 0.001708686351776123, 0.001766592264175415, 0.001824498176574707, 0.001882404088973999, 0.001940310001373291, 0.001998215913772583, 0.002056121826171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 7.0, 16.0, 19.0, 33.0, 41.0, 54.0, 95.0, 150.0, 281.0, 485.0, 991.0, 2321.0, 7314.0, 44921.0, 604526.0, 348179.0, 29451.0, 5822.0, 1909.0, 900.0, 430.0, 216.0, 142.0, 69.0, 48.0, 31.0, 23.0, 15.0, 11.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5703125, -11.1556396484375, -10.740966796875, -10.3262939453125, -9.91162109375, -9.4969482421875, -9.082275390625, -8.6676025390625, -8.2529296875, -7.8382568359375, -7.423583984375, -7.0089111328125, -6.59423828125, -6.1795654296875, -5.764892578125, -5.3502197265625, -4.935546875, -4.5208740234375, -4.106201171875, -3.6915283203125, -3.27685546875, -2.8621826171875, -2.447509765625, -2.0328369140625, -1.6181640625, -1.2034912109375, -0.788818359375, -0.3741455078125, 0.04052734375, 0.4552001953125, 0.869873046875, 1.2845458984375, 1.69921875, 2.1138916015625, 2.528564453125, 2.9432373046875, 3.35791015625, 3.7725830078125, 4.187255859375, 4.6019287109375, 5.0166015625, 5.4312744140625, 5.845947265625, 6.2606201171875, 6.67529296875, 7.0899658203125, 7.504638671875, 7.9193115234375, 8.333984375, 8.7486572265625, 9.163330078125, 9.5780029296875, 9.99267578125, 10.4073486328125, 10.822021484375, 11.2366943359375, 11.6513671875, 12.0660400390625, 12.480712890625, 12.8953857421875, 13.31005859375, 13.7247314453125, 14.139404296875, 14.5540771484375, 14.96875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 6.0, 14.0, 18.0, 27.0, 37.0, 35.0, 74.0, 86.0, 101.0, 123.0, 112.0, 103.0, 78.0, 50.0, 44.0, 30.0, 22.0, 10.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.0625, -15.6256103515625, -15.188720703125, -14.7518310546875, -14.31494140625, -13.8780517578125, -13.441162109375, -13.0042724609375, -12.5673828125, -12.1304931640625, -11.693603515625, -11.2567138671875, -10.81982421875, -10.3829345703125, -9.946044921875, -9.5091552734375, -9.072265625, -8.6353759765625, -8.198486328125, -7.7615966796875, -7.32470703125, -6.8878173828125, -6.450927734375, -6.0140380859375, -5.5771484375, -5.1402587890625, -4.703369140625, -4.2664794921875, -3.82958984375, -3.3927001953125, -2.955810546875, -2.5189208984375, -2.08203125, -1.6451416015625, -1.208251953125, -0.7713623046875, -0.33447265625, 0.1024169921875, 0.539306640625, 0.9761962890625, 1.4130859375, 1.8499755859375, 2.286865234375, 2.7237548828125, 3.16064453125, 3.5975341796875, 4.034423828125, 4.4713134765625, 4.908203125, 5.3450927734375, 5.781982421875, 6.2188720703125, 6.65576171875, 7.0926513671875, 7.529541015625, 7.9664306640625, 8.4033203125, 8.8402099609375, 9.277099609375, 9.7139892578125, 10.15087890625, 10.5877685546875, 11.024658203125, 11.4615478515625, 11.8984375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 18.0, 22.0, 62.0, 81.0, 126.0, 159.0, 170.0, 131.0, 91.0, 48.0, 28.0, 11.0, 14.0, 12.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-216.178466796875, -209.62818908691406, -203.07791137695312, -196.5276336669922, -189.97735595703125, -183.42709350585938, -176.87680053710938, -170.3265380859375, -163.77626037597656, -157.22598266601562, -150.6757049560547, -144.12542724609375, -137.5751495361328, -131.02487182617188, -124.47460174560547, -117.92433166503906, -111.3740463256836, -104.82376861572266, -98.27349090576172, -91.72322082519531, -85.17294311523438, -78.62266540527344, -72.0723876953125, -65.52210998535156, -58.97183609008789, -52.42155838012695, -45.87128448486328, -39.321006774902344, -32.770729064941406, -26.220455169677734, -19.670177459716797, -13.119903564453125, -6.5696258544921875, -0.01934957504272461, 6.530926704406738, 13.08120346069336, 19.631479263305664, 26.18175506591797, 32.732032775878906, 39.28230667114258, 45.832584381103516, 52.38286209106445, 58.933135986328125, 65.48341369628906, 72.03369140625, 78.58396911621094, 85.13424682617188, 91.68451690673828, 98.23479461669922, 104.78507232666016, 111.3353500366211, 117.8856201171875, 124.43589782714844, 130.98617553710938, 137.5364532470703, 144.08673095703125, 150.6370086669922, 157.18728637695312, 163.73756408691406, 170.287841796875, 176.83811950683594, 183.38839721679688, 189.93865966796875, 196.4889373779297, 203.03921508789062]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 6.0, 11.0, 18.0, 16.0, 25.0, 26.0, 38.0, 43.0, 41.0, 48.0, 64.0, 69.0, 81.0, 73.0, 76.0, 63.0, 57.0, 41.0, 41.0, 33.0, 32.0, 22.0, 15.0, 13.0, 12.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.09713745117188, -134.03933715820312, -127.98152160644531, -121.92372131347656, -115.86591339111328, -109.80810546875, -103.75030517578125, -97.69249725341797, -91.63468933105469, -85.5768814086914, -79.51907348632812, -73.46127319335938, -67.4034652709961, -61.34565734863281, -55.2878532409668, -49.23004913330078, -43.1722412109375, -37.11443328857422, -31.056629180908203, -24.998823165893555, -18.941017150878906, -12.883211135864258, -6.825405120849609, -0.7676010131835938, 5.2902069091796875, 11.348012924194336, 17.405818939208984, 23.463624954223633, 29.52143096923828, 35.57923889160156, 41.63704299926758, 47.694847106933594, 53.752655029296875, 59.810462951660156, 65.86827087402344, 71.92607116699219, 77.98387908935547, 84.04168701171875, 90.0994873046875, 96.15729522705078, 102.21510314941406, 108.27291107177734, 114.33071899414062, 120.38851928710938, 126.44632720947266, 132.50413513183594, 138.5619354248047, 144.6197509765625, 150.67755126953125, 156.7353515625, 162.7931671142578, 168.85096740722656, 174.90878295898438, 180.96658325195312, 187.02438354492188, 193.08218383789062, 199.13999938964844, 205.1977996826172, 211.255615234375, 217.31341552734375, 223.3712158203125, 229.4290313720703, 235.48683166503906, 241.54464721679688, 247.60244750976562]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 2.0, 7.0, 10.0, 14.0, 27.0, 39.0, 63.0, 119.0, 250.0, 505.0, 1063.0, 2503.0, 6068.0, 17955.0, 66859.0, 721727.0, 3155161.0, 173419.0, 31791.0, 9914.0, 3668.0, 1574.0, 705.0, 313.0, 190.0, 126.0, 65.0, 35.0, 25.0, 17.0, 23.0, 8.0, 13.0, 9.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.703125, -10.147216796875, -9.59130859375, -9.035400390625, -8.4794921875, -7.923583984375, -7.36767578125, -6.811767578125, -6.255859375, -5.699951171875, -5.14404296875, -4.588134765625, -4.0322265625, -3.476318359375, -2.92041015625, -2.364501953125, -1.80859375, -1.252685546875, -0.69677734375, -0.140869140625, 0.4150390625, 0.970947265625, 1.52685546875, 2.082763671875, 2.638671875, 3.194580078125, 3.75048828125, 4.306396484375, 4.8623046875, 5.418212890625, 5.97412109375, 6.530029296875, 7.0859375, 7.641845703125, 8.19775390625, 8.753662109375, 9.3095703125, 9.865478515625, 10.42138671875, 10.977294921875, 11.533203125, 12.089111328125, 12.64501953125, 13.200927734375, 13.7568359375, 14.312744140625, 14.86865234375, 15.424560546875, 15.98046875, 16.536376953125, 17.09228515625, 17.648193359375, 18.2041015625, 18.760009765625, 19.31591796875, 19.871826171875, 20.427734375, 20.983642578125, 21.53955078125, 22.095458984375, 22.6513671875, 23.207275390625, 23.76318359375, 24.319091796875, 24.875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 12.0, 25.0, 33.0, 37.0, 73.0, 64.0, 94.0, 88.0, 101.0, 91.0, 90.0, 73.0, 74.0, 44.0, 36.0, 15.0, 11.0, 10.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.77880859375, -8.2451171875, -7.71142578125, -7.177734375, -6.64404296875, -6.1103515625, -5.57666015625, -5.04296875, -4.50927734375, -3.9755859375, -3.44189453125, -2.908203125, -2.37451171875, -1.8408203125, -1.30712890625, -0.7734375, -0.23974609375, 0.2939453125, 0.82763671875, 1.361328125, 1.89501953125, 2.4287109375, 2.96240234375, 3.49609375, 4.02978515625, 4.5634765625, 5.09716796875, 5.630859375, 6.16455078125, 6.6982421875, 7.23193359375, 7.765625, 8.29931640625, 8.8330078125, 9.36669921875, 9.900390625, 10.43408203125, 10.9677734375, 11.50146484375, 12.03515625, 12.56884765625, 13.1025390625, 13.63623046875, 14.169921875, 14.70361328125, 15.2373046875, 15.77099609375, 16.3046875, 16.83837890625, 17.3720703125, 17.90576171875, 18.439453125, 18.97314453125, 19.5068359375, 20.04052734375, 20.57421875, 21.10791015625, 21.6416015625, 22.17529296875, 22.708984375, 23.24267578125, 23.7763671875, 24.31005859375, 24.84375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 5.0, 7.0, 11.0, 10.0, 27.0, 32.0, 40.0, 51.0, 97.0, 192.0, 334.0, 730.0, 1574.0, 3764.0, 9842.0, 32750.0, 175578.0, 3078958.0, 789752.0, 72434.0, 17892.0, 5961.0, 2314.0, 1001.0, 439.0, 218.0, 107.0, 51.0, 36.0, 27.0, 22.0, 10.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.375, -24.720458984375, -24.06591796875, -23.411376953125, -22.7568359375, -22.102294921875, -21.44775390625, -20.793212890625, -20.138671875, -19.484130859375, -18.82958984375, -18.175048828125, -17.5205078125, -16.865966796875, -16.21142578125, -15.556884765625, -14.90234375, -14.247802734375, -13.59326171875, -12.938720703125, -12.2841796875, -11.629638671875, -10.97509765625, -10.320556640625, -9.666015625, -9.011474609375, -8.35693359375, -7.702392578125, -7.0478515625, -6.393310546875, -5.73876953125, -5.084228515625, -4.4296875, -3.775146484375, -3.12060546875, -2.466064453125, -1.8115234375, -1.156982421875, -0.50244140625, 0.152099609375, 0.806640625, 1.461181640625, 2.11572265625, 2.770263671875, 3.4248046875, 4.079345703125, 4.73388671875, 5.388427734375, 6.04296875, 6.697509765625, 7.35205078125, 8.006591796875, 8.6611328125, 9.315673828125, 9.97021484375, 10.624755859375, 11.279296875, 11.933837890625, 12.58837890625, 13.242919921875, 13.8974609375, 14.552001953125, 15.20654296875, 15.861083984375, 16.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 3.0, 10.0, 5.0, 11.0, 16.0, 15.0, 37.0, 60.0, 116.0, 179.0, 379.0, 835.0, 1163.0, 605.0, 275.0, 135.0, 81.0, 45.0, 32.0, 21.0, 11.0, 6.0, 14.0, 9.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.65625, -31.88427734375, -31.1123046875, -30.34033203125, -29.568359375, -28.79638671875, -28.0244140625, -27.25244140625, -26.48046875, -25.70849609375, -24.9365234375, -24.16455078125, -23.392578125, -22.62060546875, -21.8486328125, -21.07666015625, -20.3046875, -19.53271484375, -18.7607421875, -17.98876953125, -17.216796875, -16.44482421875, -15.6728515625, -14.90087890625, -14.12890625, -13.35693359375, -12.5849609375, -11.81298828125, -11.041015625, -10.26904296875, -9.4970703125, -8.72509765625, -7.953125, -7.18115234375, -6.4091796875, -5.63720703125, -4.865234375, -4.09326171875, -3.3212890625, -2.54931640625, -1.77734375, -1.00537109375, -0.2333984375, 0.53857421875, 1.310546875, 2.08251953125, 2.8544921875, 3.62646484375, 4.3984375, 5.17041015625, 5.9423828125, 6.71435546875, 7.486328125, 8.25830078125, 9.0302734375, 9.80224609375, 10.57421875, 11.34619140625, 12.1181640625, 12.89013671875, 13.662109375, 14.43408203125, 15.2060546875, 15.97802734375, 16.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 12.0, 17.0, 54.0, 94.0, 191.0, 230.0, 183.0, 118.0, 53.0, 26.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.417236328125, -202.32986450195312, -195.24249267578125, -188.15512084960938, -181.0677490234375, -173.98037719726562, -166.89300537109375, -159.80563354492188, -152.71826171875, -145.63088989257812, -138.54351806640625, -131.45614624023438, -124.3687744140625, -117.28140258789062, -110.19403076171875, -103.10665893554688, -96.019287109375, -88.93191528320312, -81.84454345703125, -74.75717163085938, -67.6697998046875, -60.582427978515625, -53.49505615234375, -46.407684326171875, -39.3203125, -32.232940673828125, -25.14556884765625, -18.058197021484375, -10.9708251953125, -3.883453369140625, 3.20391845703125, 10.291290283203125, 17.378662109375, 24.466033935546875, 31.55340576171875, 38.640777587890625, 45.7281494140625, 52.815521240234375, 59.90289306640625, 66.99026489257812, 74.07763671875, 81.16500854492188, 88.25238037109375, 95.33975219726562, 102.4271240234375, 109.51449584960938, 116.60186767578125, 123.68923950195312, 130.776611328125, 137.86398315429688, 144.95135498046875, 152.03872680664062, 159.1260986328125, 166.21347045898438, 173.30084228515625, 180.38821411132812, 187.4755859375, 194.56295776367188, 201.65032958984375, 208.73770141601562, 215.8250732421875, 222.91244506835938, 229.99981689453125, 237.08718872070312, 244.174560546875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 11.0, 8.0, 15.0, 19.0, 23.0, 22.0, 39.0, 39.0, 36.0, 52.0, 56.0, 68.0, 72.0, 58.0, 72.0, 67.0, 59.0, 45.0, 42.0, 42.0, 23.0, 24.0, 28.0, 18.0, 14.0, 12.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.9265365600586, -117.66624450683594, -114.40595245361328, -111.14566040039062, -107.8853759765625, -104.62508392333984, -101.36479187011719, -98.10449981689453, -94.84420776367188, -91.58391571044922, -88.32362365722656, -85.06333923339844, -81.80304718017578, -78.54275512695312, -75.28246307373047, -72.02217102050781, -68.76188659667969, -65.50159454345703, -62.24130630493164, -58.981014251708984, -55.720726013183594, -52.46043395996094, -49.20014190673828, -45.939849853515625, -42.679561614990234, -39.41926956176758, -36.15898132324219, -32.89868927001953, -29.638399124145508, -26.378108978271484, -23.117816925048828, -19.857526779174805, -16.597244262695312, -13.336954116821289, -10.07666301727295, -6.816371917724609, -3.556081771850586, -0.2957916259765625, 2.9645004272460938, 6.224790573120117, 9.48508071899414, 12.745370864868164, 16.005661010742188, 19.265953063964844, 22.526243209838867, 25.78653335571289, 29.046825408935547, 32.30711364746094, 35.567405700683594, 38.82769775390625, 42.08798599243164, 45.3482780456543, 48.60856628417969, 51.868858337402344, 55.129150390625, 58.389442443847656, 61.64973068237305, 64.91001892089844, 68.1703109741211, 71.43060302734375, 74.6908950805664, 77.95118713378906, 81.21147155761719, 84.47176361083984, 87.7320556640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 7.0, 14.0, 32.0, 34.0, 63.0, 98.0, 167.0, 292.0, 486.0, 855.0, 1618.0, 3098.0, 6175.0, 12384.0, 26965.0, 62128.0, 160510.0, 367629.0, 243384.0, 91021.0, 37652.0, 17175.0, 7991.0, 4000.0, 2184.0, 1112.0, 609.0, 365.0, 176.0, 120.0, 78.0, 49.0, 22.0, 21.0, 8.0, 7.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-19.046875, -18.541748046875, -18.03662109375, -17.531494140625, -17.0263671875, -16.521240234375, -16.01611328125, -15.510986328125, -15.005859375, -14.500732421875, -13.99560546875, -13.490478515625, -12.9853515625, -12.480224609375, -11.97509765625, -11.469970703125, -10.96484375, -10.459716796875, -9.95458984375, -9.449462890625, -8.9443359375, -8.439208984375, -7.93408203125, -7.428955078125, -6.923828125, -6.418701171875, -5.91357421875, -5.408447265625, -4.9033203125, -4.398193359375, -3.89306640625, -3.387939453125, -2.8828125, -2.377685546875, -1.87255859375, -1.367431640625, -0.8623046875, -0.357177734375, 0.14794921875, 0.653076171875, 1.158203125, 1.663330078125, 2.16845703125, 2.673583984375, 3.1787109375, 3.683837890625, 4.18896484375, 4.694091796875, 5.19921875, 5.704345703125, 6.20947265625, 6.714599609375, 7.2197265625, 7.724853515625, 8.22998046875, 8.735107421875, 9.240234375, 9.745361328125, 10.25048828125, 10.755615234375, 11.2607421875, 11.765869140625, 12.27099609375, 12.776123046875, 13.28125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 7.0, 15.0, 11.0, 16.0, 16.0, 17.0, 19.0, 37.0, 55.0, 38.0, 42.0, 47.0, 56.0, 61.0, 66.0, 68.0, 61.0, 63.0, 51.0, 49.0, 40.0, 44.0, 23.0, 19.0, 17.0, 15.0, 13.0, 12.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4140625, -9.0723876953125, -8.730712890625, -8.3890380859375, -8.04736328125, -7.7056884765625, -7.364013671875, -7.0223388671875, -6.6806640625, -6.3389892578125, -5.997314453125, -5.6556396484375, -5.31396484375, -4.9722900390625, -4.630615234375, -4.2889404296875, -3.947265625, -3.6055908203125, -3.263916015625, -2.9222412109375, -2.58056640625, -2.2388916015625, -1.897216796875, -1.5555419921875, -1.2138671875, -0.8721923828125, -0.530517578125, -0.1888427734375, 0.15283203125, 0.4945068359375, 0.836181640625, 1.1778564453125, 1.51953125, 1.8612060546875, 2.202880859375, 2.5445556640625, 2.88623046875, 3.2279052734375, 3.569580078125, 3.9112548828125, 4.2529296875, 4.5946044921875, 4.936279296875, 5.2779541015625, 5.61962890625, 5.9613037109375, 6.302978515625, 6.6446533203125, 6.986328125, 7.3280029296875, 7.669677734375, 8.0113525390625, 8.35302734375, 8.6947021484375, 9.036376953125, 9.3780517578125, 9.7197265625, 10.0614013671875, 10.403076171875, 10.7447509765625, 11.08642578125, 11.4281005859375, 11.769775390625, 12.1114501953125, 12.453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 7.0, 10.0, 15.0, 17.0, 24.0, 38.0, 35.0, 58.0, 101.0, 129.0, 168.0, 286.0, 509.0, 850.0, 1675.0, 3610.0, 9543.0, 30482.0, 126131.0, 606141.0, 202810.0, 44058.0, 12770.0, 4489.0, 1931.0, 996.0, 584.0, 348.0, 223.0, 156.0, 106.0, 73.0, 46.0, 36.0, 25.0, 22.0, 11.0, 8.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.984375, -23.226318359375, -22.46826171875, -21.710205078125, -20.9521484375, -20.194091796875, -19.43603515625, -18.677978515625, -17.919921875, -17.161865234375, -16.40380859375, -15.645751953125, -14.8876953125, -14.129638671875, -13.37158203125, -12.613525390625, -11.85546875, -11.097412109375, -10.33935546875, -9.581298828125, -8.8232421875, -8.065185546875, -7.30712890625, -6.549072265625, -5.791015625, -5.032958984375, -4.27490234375, -3.516845703125, -2.7587890625, -2.000732421875, -1.24267578125, -0.484619140625, 0.2734375, 1.031494140625, 1.78955078125, 2.547607421875, 3.3056640625, 4.063720703125, 4.82177734375, 5.579833984375, 6.337890625, 7.095947265625, 7.85400390625, 8.612060546875, 9.3701171875, 10.128173828125, 10.88623046875, 11.644287109375, 12.40234375, 13.160400390625, 13.91845703125, 14.676513671875, 15.4345703125, 16.192626953125, 16.95068359375, 17.708740234375, 18.466796875, 19.224853515625, 19.98291015625, 20.740966796875, 21.4990234375, 22.257080078125, 23.01513671875, 23.773193359375, 24.53125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 8.0, 7.0, 5.0, 5.0, 13.0, 11.0, 10.0, 13.0, 20.0, 22.0, 29.0, 38.0, 52.0, 60.0, 59.0, 43.0, 61.0, 45.0, 70.0, 57.0, 54.0, 43.0, 45.0, 32.0, 51.0, 36.0, 18.0, 23.0, 18.0, 5.0, 10.0, 5.0, 7.0, 4.0, 6.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.65087890625, -35.4892578125, -34.32763671875, -33.166015625, -32.00439453125, -30.8427734375, -29.68115234375, -28.51953125, -27.35791015625, -26.1962890625, -25.03466796875, -23.873046875, -22.71142578125, -21.5498046875, -20.38818359375, -19.2265625, -18.06494140625, -16.9033203125, -15.74169921875, -14.580078125, -13.41845703125, -12.2568359375, -11.09521484375, -9.93359375, -8.77197265625, -7.6103515625, -6.44873046875, -5.287109375, -4.12548828125, -2.9638671875, -1.80224609375, -0.640625, 0.52099609375, 1.6826171875, 2.84423828125, 4.005859375, 5.16748046875, 6.3291015625, 7.49072265625, 8.65234375, 9.81396484375, 10.9755859375, 12.13720703125, 13.298828125, 14.46044921875, 15.6220703125, 16.78369140625, 17.9453125, 19.10693359375, 20.2685546875, 21.43017578125, 22.591796875, 23.75341796875, 24.9150390625, 26.07666015625, 27.23828125, 28.39990234375, 29.5615234375, 30.72314453125, 31.884765625, 33.04638671875, 34.2080078125, 35.36962890625, 36.53125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 7.0, 12.0, 20.0, 25.0, 43.0, 107.0, 325.0, 1028.0, 7801.0, 287122.0, 735056.0, 14669.0, 1614.0, 416.0, 138.0, 69.0, 31.0, 18.0, 9.0, 10.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.1875, -20.459716796875, -19.73193359375, -19.004150390625, -18.2763671875, -17.548583984375, -16.82080078125, -16.093017578125, -15.365234375, -14.637451171875, -13.90966796875, -13.181884765625, -12.4541015625, -11.726318359375, -10.99853515625, -10.270751953125, -9.54296875, -8.815185546875, -8.08740234375, -7.359619140625, -6.6318359375, -5.904052734375, -5.17626953125, -4.448486328125, -3.720703125, -2.992919921875, -2.26513671875, -1.537353515625, -0.8095703125, -0.081787109375, 0.64599609375, 1.373779296875, 2.1015625, 2.829345703125, 3.55712890625, 4.284912109375, 5.0126953125, 5.740478515625, 6.46826171875, 7.196044921875, 7.923828125, 8.651611328125, 9.37939453125, 10.107177734375, 10.8349609375, 11.562744140625, 12.29052734375, 13.018310546875, 13.74609375, 14.473876953125, 15.20166015625, 15.929443359375, 16.6572265625, 17.385009765625, 18.11279296875, 18.840576171875, 19.568359375, 20.296142578125, 21.02392578125, 21.751708984375, 22.4794921875, 23.207275390625, 23.93505859375, 24.662841796875, 25.390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 8.0, 6.0, 9.0, 18.0, 18.0, 25.0, 16.0, 19.0, 31.0, 38.0, 56.0, 63.0, 82.0, 82.0, 79.0, 76.0, 68.0, 46.0, 50.0, 29.0, 25.0, 24.0, 21.0, 14.0, 11.0, 16.0, 9.0, 7.0, 7.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017986297607421875, -0.0017469674348831177, -0.0016953051090240479, -0.001643642783164978, -0.0015919804573059082, -0.0015403181314468384, -0.0014886558055877686, -0.0014369934797286987, -0.001385331153869629, -0.001333668828010559, -0.0012820065021514893, -0.0012303441762924194, -0.0011786818504333496, -0.0011270195245742798, -0.00107535719871521, -0.0010236948728561401, -0.0009720325469970703, -0.0009203702211380005, -0.0008687078952789307, -0.0008170455694198608, -0.000765383243560791, -0.0007137209177017212, -0.0006620585918426514, -0.0006103962659835815, -0.0005587339401245117, -0.0005070716142654419, -0.00045540928840637207, -0.00040374696254730225, -0.0003520846366882324, -0.0003004223108291626, -0.0002487599849700928, -0.00019709765911102295, -0.00014543533325195312, -9.37730073928833e-05, -4.2110681533813477e-05, 9.551644325256348e-06, 6.121397018432617e-05, 0.000112876296043396, 0.00016453862190246582, 0.00021620094776153564, 0.00026786327362060547, 0.0003195255994796753, 0.0003711879253387451, 0.00042285025119781494, 0.00047451257705688477, 0.0005261749029159546, 0.0005778372287750244, 0.0006294995546340942, 0.0006811618804931641, 0.0007328242063522339, 0.0007844865322113037, 0.0008361488580703735, 0.0008878111839294434, 0.0009394735097885132, 0.000991135835647583, 0.0010427981615066528, 0.0010944604873657227, 0.0011461228132247925, 0.0011977851390838623, 0.0012494474649429321, 0.001301109790802002, 0.0013527721166610718, 0.0014044344425201416, 0.0014560967683792114, 0.0015077590942382812]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 13.0, 20.0, 25.0, 51.0, 79.0, 133.0, 247.0, 440.0, 1042.0, 2641.0, 9569.0, 60542.0, 634637.0, 298529.0, 30936.0, 6091.0, 1897.0, 763.0, 384.0, 209.0, 109.0, 53.0, 41.0, 37.0, 17.0, 10.0, 4.0, 6.0, 2.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.7578125, -10.384765625, -10.01171875, -9.638671875, -9.265625, -8.892578125, -8.51953125, -8.146484375, -7.7734375, -7.400390625, -7.02734375, -6.654296875, -6.28125, -5.908203125, -5.53515625, -5.162109375, -4.7890625, -4.416015625, -4.04296875, -3.669921875, -3.296875, -2.923828125, -2.55078125, -2.177734375, -1.8046875, -1.431640625, -1.05859375, -0.685546875, -0.3125, 0.060546875, 0.43359375, 0.806640625, 1.1796875, 1.552734375, 1.92578125, 2.298828125, 2.671875, 3.044921875, 3.41796875, 3.791015625, 4.1640625, 4.537109375, 4.91015625, 5.283203125, 5.65625, 6.029296875, 6.40234375, 6.775390625, 7.1484375, 7.521484375, 7.89453125, 8.267578125, 8.640625, 9.013671875, 9.38671875, 9.759765625, 10.1328125, 10.505859375, 10.87890625, 11.251953125, 11.625, 11.998046875, 12.37109375, 12.744140625, 13.1171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 13.0, 23.0, 31.0, 38.0, 66.0, 77.0, 95.0, 106.0, 139.0, 103.0, 87.0, 60.0, 39.0, 31.0, 17.0, 22.0, 12.0, 14.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -7.959716796875, -7.58349609375, -7.207275390625, -6.8310546875, -6.454833984375, -6.07861328125, -5.702392578125, -5.326171875, -4.949951171875, -4.57373046875, -4.197509765625, -3.8212890625, -3.445068359375, -3.06884765625, -2.692626953125, -2.31640625, -1.940185546875, -1.56396484375, -1.187744140625, -0.8115234375, -0.435302734375, -0.05908203125, 0.317138671875, 0.693359375, 1.069580078125, 1.44580078125, 1.822021484375, 2.1982421875, 2.574462890625, 2.95068359375, 3.326904296875, 3.703125, 4.079345703125, 4.45556640625, 4.831787109375, 5.2080078125, 5.584228515625, 5.96044921875, 6.336669921875, 6.712890625, 7.089111328125, 7.46533203125, 7.841552734375, 8.2177734375, 8.593994140625, 8.97021484375, 9.346435546875, 9.72265625, 10.098876953125, 10.47509765625, 10.851318359375, 11.2275390625, 11.603759765625, 11.97998046875, 12.356201171875, 12.732421875, 13.108642578125, 13.48486328125, 13.861083984375, 14.2373046875, 14.613525390625, 14.98974609375, 15.365966796875, 15.7421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 9.0, 30.0, 78.0, 149.0, 309.0, 214.0, 118.0, 53.0, 22.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-381.7818908691406, -371.64874267578125, -361.515625, -351.38250732421875, -341.2493591308594, -331.1162109375, -320.98309326171875, -310.8499755859375, -300.7168273925781, -290.58367919921875, -280.4505615234375, -270.31744384765625, -260.1842956542969, -250.05116271972656, -239.91802978515625, -229.78489685058594, -219.65176391601562, -209.5186309814453, -199.385498046875, -189.2523651123047, -179.11923217773438, -168.98609924316406, -158.85296630859375, -148.71983337402344, -138.58670043945312, -128.4535675048828, -118.3204345703125, -108.18730163574219, -98.05416870117188, -87.92103576660156, -77.78790283203125, -67.65476989746094, -57.52166748046875, -47.38853454589844, -37.255401611328125, -27.122268676757812, -16.9891357421875, -6.8560028076171875, 3.277130126953125, 13.410263061523438, 23.54339599609375, 33.67652893066406, 43.809661865234375, 53.94279479980469, 64.075927734375, 74.20906066894531, 84.34219360351562, 94.47532653808594, 104.60845947265625, 114.74159240722656, 124.87472534179688, 135.0078582763672, 145.1409912109375, 155.2741241455078, 165.40725708007812, 175.54039001464844, 185.67352294921875, 195.80665588378906, 205.93978881835938, 216.0729217529297, 226.2060546875, 236.3391876220703, 246.47232055664062, 256.60546875, 266.73858642578125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 5.0, 5.0, 11.0, 8.0, 15.0, 21.0, 29.0, 32.0, 30.0, 30.0, 28.0, 38.0, 49.0, 57.0, 60.0, 67.0, 69.0, 60.0, 62.0, 49.0, 41.0, 43.0, 40.0, 31.0, 24.0, 28.0, 21.0, 11.0, 10.0, 6.0, 2.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-198.1376495361328, -192.92897033691406, -187.7202911376953, -182.51161193847656, -177.3029327392578, -172.09425354003906, -166.8855743408203, -161.67689514160156, -156.4682159423828, -151.25953674316406, -146.0508575439453, -140.84217834472656, -135.6334991455078, -130.42481994628906, -125.21614074707031, -120.00746154785156, -114.79878234863281, -109.59010314941406, -104.38142395019531, -99.17274475097656, -93.96406555175781, -88.75538635253906, -83.54670715332031, -78.33802795410156, -73.12934875488281, -67.92066955566406, -62.71199035644531, -57.50331115722656, -52.29463195800781, -47.08595275878906, -41.87727355957031, -36.66859436035156, -31.45989990234375, -26.251220703125, -21.04254150390625, -15.8338623046875, -10.62518310546875, -5.41650390625, -0.20782470703125, 5.0008544921875, 10.20953369140625, 15.418212890625, 20.62689208984375, 25.8355712890625, 31.04425048828125, 36.2529296875, 41.46160888671875, 46.6702880859375, 51.87896728515625, 57.087646484375, 62.29632568359375, 67.5050048828125, 72.71368408203125, 77.92236328125, 83.13104248046875, 88.3397216796875, 93.54840087890625, 98.757080078125, 103.96575927734375, 109.1744384765625, 114.38311767578125, 119.591796875, 124.80047607421875, 130.0091552734375, 135.21783447265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 5.0, 6.0, 11.0, 8.0, 18.0, 23.0, 23.0, 46.0, 89.0, 119.0, 235.0, 517.0, 972.0, 2392.0, 6096.0, 17196.0, 59320.0, 286144.0, 2010203.0, 1526092.0, 213865.0, 47577.0, 14299.0, 5121.0, 2048.0, 929.0, 425.0, 203.0, 126.0, 59.0, 46.0, 13.0, 20.0, 13.0, 5.0, 6.0, 1.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-15.34375, -14.949462890625, -14.55517578125, -14.160888671875, -13.7666015625, -13.372314453125, -12.97802734375, -12.583740234375, -12.189453125, -11.795166015625, -11.40087890625, -11.006591796875, -10.6123046875, -10.218017578125, -9.82373046875, -9.429443359375, -9.03515625, -8.640869140625, -8.24658203125, -7.852294921875, -7.4580078125, -7.063720703125, -6.66943359375, -6.275146484375, -5.880859375, -5.486572265625, -5.09228515625, -4.697998046875, -4.3037109375, -3.909423828125, -3.51513671875, -3.120849609375, -2.7265625, -2.332275390625, -1.93798828125, -1.543701171875, -1.1494140625, -0.755126953125, -0.36083984375, 0.033447265625, 0.427734375, 0.822021484375, 1.21630859375, 1.610595703125, 2.0048828125, 2.399169921875, 2.79345703125, 3.187744140625, 3.58203125, 3.976318359375, 4.37060546875, 4.764892578125, 5.1591796875, 5.553466796875, 5.94775390625, 6.342041015625, 6.736328125, 7.130615234375, 7.52490234375, 7.919189453125, 8.3134765625, 8.707763671875, 9.10205078125, 9.496337890625, 9.890625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 9.0, 5.0, 15.0, 21.0, 29.0, 34.0, 46.0, 59.0, 80.0, 113.0, 107.0, 91.0, 85.0, 71.0, 71.0, 53.0, 39.0, 34.0, 18.0, 12.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.734375, -18.2535400390625, -17.772705078125, -17.2918701171875, -16.81103515625, -16.3302001953125, -15.849365234375, -15.3685302734375, -14.8876953125, -14.4068603515625, -13.926025390625, -13.4451904296875, -12.96435546875, -12.4835205078125, -12.002685546875, -11.5218505859375, -11.041015625, -10.5601806640625, -10.079345703125, -9.5985107421875, -9.11767578125, -8.6368408203125, -8.156005859375, -7.6751708984375, -7.1943359375, -6.7135009765625, -6.232666015625, -5.7518310546875, -5.27099609375, -4.7901611328125, -4.309326171875, -3.8284912109375, -3.34765625, -2.8668212890625, -2.385986328125, -1.9051513671875, -1.42431640625, -0.9434814453125, -0.462646484375, 0.0181884765625, 0.4990234375, 0.9798583984375, 1.460693359375, 1.9415283203125, 2.42236328125, 2.9031982421875, 3.384033203125, 3.8648681640625, 4.345703125, 4.8265380859375, 5.307373046875, 5.7882080078125, 6.26904296875, 6.7498779296875, 7.230712890625, 7.7115478515625, 8.1923828125, 8.6732177734375, 9.154052734375, 9.6348876953125, 10.11572265625, 10.5965576171875, 11.077392578125, 11.5582275390625, 12.0390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 1.0, 6.0, 8.0, 22.0, 23.0, 14.0, 34.0, 63.0, 79.0, 106.0, 196.0, 352.0, 630.0, 1044.0, 2184.0, 4654.0, 10877.0, 28988.0, 93930.0, 455404.0, 2632134.0, 770028.0, 134387.0, 36985.0, 12671.0, 5001.0, 2147.0, 1004.0, 497.0, 298.0, 181.0, 110.0, 70.0, 52.0, 27.0, 17.0, 20.0, 8.0, 7.0, 8.0, 5.0, 0.0, 7.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.7890625, -15.35791015625, -14.9267578125, -14.49560546875, -14.064453125, -13.63330078125, -13.2021484375, -12.77099609375, -12.33984375, -11.90869140625, -11.4775390625, -11.04638671875, -10.615234375, -10.18408203125, -9.7529296875, -9.32177734375, -8.890625, -8.45947265625, -8.0283203125, -7.59716796875, -7.166015625, -6.73486328125, -6.3037109375, -5.87255859375, -5.44140625, -5.01025390625, -4.5791015625, -4.14794921875, -3.716796875, -3.28564453125, -2.8544921875, -2.42333984375, -1.9921875, -1.56103515625, -1.1298828125, -0.69873046875, -0.267578125, 0.16357421875, 0.5947265625, 1.02587890625, 1.45703125, 1.88818359375, 2.3193359375, 2.75048828125, 3.181640625, 3.61279296875, 4.0439453125, 4.47509765625, 4.90625, 5.33740234375, 5.7685546875, 6.19970703125, 6.630859375, 7.06201171875, 7.4931640625, 7.92431640625, 8.35546875, 8.78662109375, 9.2177734375, 9.64892578125, 10.080078125, 10.51123046875, 10.9423828125, 11.37353515625, 11.8046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 5.0, 13.0, 19.0, 31.0, 25.0, 23.0, 36.0, 40.0, 61.0, 65.0, 114.0, 156.0, 258.0, 377.0, 502.0, 565.0, 488.0, 370.0, 264.0, 179.0, 108.0, 85.0, 65.0, 52.0, 42.0, 20.0, 25.0, 14.0, 13.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0], "bins": [-20.359375, -19.8297119140625, -19.300048828125, -18.7703857421875, -18.24072265625, -17.7110595703125, -17.181396484375, -16.6517333984375, -16.1220703125, -15.5924072265625, -15.062744140625, -14.5330810546875, -14.00341796875, -13.4737548828125, -12.944091796875, -12.4144287109375, -11.884765625, -11.3551025390625, -10.825439453125, -10.2957763671875, -9.76611328125, -9.2364501953125, -8.706787109375, -8.1771240234375, -7.6474609375, -7.1177978515625, -6.588134765625, -6.0584716796875, -5.52880859375, -4.9991455078125, -4.469482421875, -3.9398193359375, -3.41015625, -2.8804931640625, -2.350830078125, -1.8211669921875, -1.29150390625, -0.7618408203125, -0.232177734375, 0.2974853515625, 0.8271484375, 1.3568115234375, 1.886474609375, 2.4161376953125, 2.94580078125, 3.4754638671875, 4.005126953125, 4.5347900390625, 5.064453125, 5.5941162109375, 6.123779296875, 6.6534423828125, 7.18310546875, 7.7127685546875, 8.242431640625, 8.7720947265625, 9.3017578125, 9.8314208984375, 10.361083984375, 10.8907470703125, 11.42041015625, 11.9500732421875, 12.479736328125, 13.0093994140625, 13.5390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 7.0, 14.0, 20.0, 67.0, 149.0, 299.0, 247.0, 124.0, 43.0, 16.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.4140625, -224.6109619140625, -213.807861328125, -203.0047607421875, -192.20166015625, -181.3985595703125, -170.59544372558594, -159.79234313964844, -148.98924255371094, -138.18614196777344, -127.38304138183594, -116.5799331665039, -105.7768325805664, -94.9737319946289, -84.17062377929688, -73.36752319335938, -62.564422607421875, -51.761322021484375, -40.95821762084961, -30.155113220214844, -19.352012634277344, -8.548912048339844, 2.2541961669921875, 13.057296752929688, 23.860397338867188, 34.66349792480469, 45.46660232543945, 56.26970672607422, 67.07280731201172, 77.87590789794922, 88.67901611328125, 99.48211669921875, 110.28518676757812, 121.08828735351562, 131.89138793945312, 142.69448852539062, 153.49758911132812, 164.30068969726562, 175.1038055419922, 185.9069061279297, 196.7100067138672, 207.5131072998047, 218.3162078857422, 229.11932373046875, 239.92242431640625, 250.72552490234375, 261.52862548828125, 272.33172607421875, 283.13482666015625, 293.93792724609375, 304.74102783203125, 315.54412841796875, 326.34722900390625, 337.15032958984375, 347.95343017578125, 358.75653076171875, 369.55963134765625, 380.36273193359375, 391.16583251953125, 401.96893310546875, 412.77203369140625, 423.57513427734375, 434.37823486328125, 445.18133544921875, 455.9844665527344]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 10.0, 19.0, 10.0, 26.0, 21.0, 32.0, 48.0, 50.0, 54.0, 67.0, 61.0, 75.0, 53.0, 87.0, 56.0, 55.0, 50.0, 52.0, 31.0, 21.0, 25.0, 33.0, 21.0, 11.0, 9.0, 9.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.06410217285156, -92.57223510742188, -88.08036041259766, -83.58848571777344, -79.09661865234375, -74.60475158691406, -70.11287689208984, -65.62100219726562, -61.12913513183594, -56.637264251708984, -52.14539337158203, -47.65352249145508, -43.161651611328125, -38.66978073120117, -34.17790985107422, -29.686038970947266, -25.194168090820312, -20.70229721069336, -16.210426330566406, -11.718555450439453, -7.2266845703125, -2.734813690185547, 1.7570571899414062, 6.248928070068359, 10.740798950195312, 15.232669830322266, 19.72454071044922, 24.216411590576172, 28.708282470703125, 33.20015335083008, 37.69202423095703, 42.183895111083984, 46.67578125, 51.16765213012695, 55.659523010253906, 60.15139389038086, 64.64326477050781, 69.1351318359375, 73.62700653076172, 78.11888122558594, 82.61074829101562, 87.10261535644531, 91.59449005126953, 96.08636474609375, 100.57823181152344, 105.07009887695312, 109.56197357177734, 114.05384826660156, 118.54571533203125, 123.03758239746094, 127.52945709228516, 132.02133178710938, 136.51319885253906, 141.00506591796875, 145.4969482421875, 149.9888153076172, 154.48068237304688, 158.97254943847656, 163.46441650390625, 167.956298828125, 172.4481658935547, 176.94003295898438, 181.43191528320312, 185.9237823486328, 190.4156494140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 9.0, 7.0, 24.0, 15.0, 27.0, 32.0, 60.0, 61.0, 101.0, 157.0, 216.0, 373.0, 584.0, 942.0, 1725.0, 3162.0, 5898.0, 11932.0, 25070.0, 51958.0, 107479.0, 224456.0, 299694.0, 162129.0, 77564.0, 37724.0, 18106.0, 8868.0, 4389.0, 2356.0, 1294.0, 803.0, 432.0, 316.0, 201.0, 131.0, 72.0, 48.0, 47.0, 23.0, 17.0, 22.0, 8.0, 8.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.1640625, -13.7508544921875, -13.337646484375, -12.9244384765625, -12.51123046875, -12.0980224609375, -11.684814453125, -11.2716064453125, -10.8583984375, -10.4451904296875, -10.031982421875, -9.6187744140625, -9.20556640625, -8.7923583984375, -8.379150390625, -7.9659423828125, -7.552734375, -7.1395263671875, -6.726318359375, -6.3131103515625, -5.89990234375, -5.4866943359375, -5.073486328125, -4.6602783203125, -4.2470703125, -3.8338623046875, -3.420654296875, -3.0074462890625, -2.59423828125, -2.1810302734375, -1.767822265625, -1.3546142578125, -0.94140625, -0.5281982421875, -0.114990234375, 0.2982177734375, 0.71142578125, 1.1246337890625, 1.537841796875, 1.9510498046875, 2.3642578125, 2.7774658203125, 3.190673828125, 3.6038818359375, 4.01708984375, 4.4302978515625, 4.843505859375, 5.2567138671875, 5.669921875, 6.0831298828125, 6.496337890625, 6.9095458984375, 7.32275390625, 7.7359619140625, 8.149169921875, 8.5623779296875, 8.9755859375, 9.3887939453125, 9.802001953125, 10.2152099609375, 10.62841796875, 11.0416259765625, 11.454833984375, 11.8680419921875, 12.28125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 11.0, 16.0, 20.0, 18.0, 14.0, 49.0, 48.0, 38.0, 51.0, 68.0, 68.0, 65.0, 82.0, 65.0, 64.0, 49.0, 45.0, 36.0, 36.0, 29.0, 29.0, 20.0, 16.0, 15.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4140625, -9.0787353515625, -8.743408203125, -8.4080810546875, -8.07275390625, -7.7374267578125, -7.402099609375, -7.0667724609375, -6.7314453125, -6.3961181640625, -6.060791015625, -5.7254638671875, -5.39013671875, -5.0548095703125, -4.719482421875, -4.3841552734375, -4.048828125, -3.7135009765625, -3.378173828125, -3.0428466796875, -2.70751953125, -2.3721923828125, -2.036865234375, -1.7015380859375, -1.3662109375, -1.0308837890625, -0.695556640625, -0.3602294921875, -0.02490234375, 0.3104248046875, 0.645751953125, 0.9810791015625, 1.31640625, 1.6517333984375, 1.987060546875, 2.3223876953125, 2.65771484375, 2.9930419921875, 3.328369140625, 3.6636962890625, 3.9990234375, 4.3343505859375, 4.669677734375, 5.0050048828125, 5.34033203125, 5.6756591796875, 6.010986328125, 6.3463134765625, 6.681640625, 7.0169677734375, 7.352294921875, 7.6876220703125, 8.02294921875, 8.3582763671875, 8.693603515625, 9.0289306640625, 9.3642578125, 9.6995849609375, 10.034912109375, 10.3702392578125, 10.70556640625, 11.0408935546875, 11.376220703125, 11.7115478515625, 12.046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 8.0, 16.0, 9.0, 16.0, 20.0, 34.0, 61.0, 62.0, 102.0, 178.0, 253.0, 377.0, 629.0, 1044.0, 1921.0, 4267.0, 15119.0, 112119.0, 757066.0, 129376.0, 16702.0, 4307.0, 1935.0, 1094.0, 657.0, 410.0, 257.0, 172.0, 121.0, 61.0, 47.0, 29.0, 19.0, 18.0, 7.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.0, -36.86669921875, -35.7333984375, -34.60009765625, -33.466796875, -32.33349609375, -31.2001953125, -30.06689453125, -28.93359375, -27.80029296875, -26.6669921875, -25.53369140625, -24.400390625, -23.26708984375, -22.1337890625, -21.00048828125, -19.8671875, -18.73388671875, -17.6005859375, -16.46728515625, -15.333984375, -14.20068359375, -13.0673828125, -11.93408203125, -10.80078125, -9.66748046875, -8.5341796875, -7.40087890625, -6.267578125, -5.13427734375, -4.0009765625, -2.86767578125, -1.734375, -0.60107421875, 0.5322265625, 1.66552734375, 2.798828125, 3.93212890625, 5.0654296875, 6.19873046875, 7.33203125, 8.46533203125, 9.5986328125, 10.73193359375, 11.865234375, 12.99853515625, 14.1318359375, 15.26513671875, 16.3984375, 17.53173828125, 18.6650390625, 19.79833984375, 20.931640625, 22.06494140625, 23.1982421875, 24.33154296875, 25.46484375, 26.59814453125, 27.7314453125, 28.86474609375, 29.998046875, 31.13134765625, 32.2646484375, 33.39794921875, 34.53125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 10.0, 12.0, 12.0, 10.0, 11.0, 22.0, 20.0, 37.0, 30.0, 37.0, 47.0, 40.0, 54.0, 50.0, 56.0, 49.0, 49.0, 48.0, 42.0, 37.0, 30.0, 41.0, 32.0, 43.0, 22.0, 23.0, 23.0, 28.0, 16.0, 10.0, 10.0, 10.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.69677734375, -32.6435546875, -31.59033203125, -30.537109375, -29.48388671875, -28.4306640625, -27.37744140625, -26.32421875, -25.27099609375, -24.2177734375, -23.16455078125, -22.111328125, -21.05810546875, -20.0048828125, -18.95166015625, -17.8984375, -16.84521484375, -15.7919921875, -14.73876953125, -13.685546875, -12.63232421875, -11.5791015625, -10.52587890625, -9.47265625, -8.41943359375, -7.3662109375, -6.31298828125, -5.259765625, -4.20654296875, -3.1533203125, -2.10009765625, -1.046875, 0.00634765625, 1.0595703125, 2.11279296875, 3.166015625, 4.21923828125, 5.2724609375, 6.32568359375, 7.37890625, 8.43212890625, 9.4853515625, 10.53857421875, 11.591796875, 12.64501953125, 13.6982421875, 14.75146484375, 15.8046875, 16.85791015625, 17.9111328125, 18.96435546875, 20.017578125, 21.07080078125, 22.1240234375, 23.17724609375, 24.23046875, 25.28369140625, 26.3369140625, 27.39013671875, 28.443359375, 29.49658203125, 30.5498046875, 31.60302734375, 32.65625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 10.0, 15.0, 12.0, 22.0, 48.0, 85.0, 138.0, 383.0, 1035.0, 6214.0, 105058.0, 875517.0, 54526.0, 4073.0, 795.0, 290.0, 132.0, 89.0, 55.0, 19.0, 13.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.1175537109375, -13.602294921875, -13.0870361328125, -12.57177734375, -12.0565185546875, -11.541259765625, -11.0260009765625, -10.5107421875, -9.9954833984375, -9.480224609375, -8.9649658203125, -8.44970703125, -7.9344482421875, -7.419189453125, -6.9039306640625, -6.388671875, -5.8734130859375, -5.358154296875, -4.8428955078125, -4.32763671875, -3.8123779296875, -3.297119140625, -2.7818603515625, -2.2666015625, -1.7513427734375, -1.236083984375, -0.7208251953125, -0.20556640625, 0.3096923828125, 0.824951171875, 1.3402099609375, 1.85546875, 2.3707275390625, 2.885986328125, 3.4012451171875, 3.91650390625, 4.4317626953125, 4.947021484375, 5.4622802734375, 5.9775390625, 6.4927978515625, 7.008056640625, 7.5233154296875, 8.03857421875, 8.5538330078125, 9.069091796875, 9.5843505859375, 10.099609375, 10.6148681640625, 11.130126953125, 11.6453857421875, 12.16064453125, 12.6759033203125, 13.191162109375, 13.7064208984375, 14.2216796875, 14.7369384765625, 15.252197265625, 15.7674560546875, 16.28271484375, 16.7979736328125, 17.313232421875, 17.8284912109375, 18.34375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 4.0, 11.0, 8.0, 10.0, 13.0, 14.0, 19.0, 21.0, 18.0, 19.0, 24.0, 20.0, 35.0, 28.0, 51.0, 78.0, 84.0, 110.0, 99.0, 54.0, 41.0, 25.0, 28.0, 25.0, 24.0, 19.0, 14.0, 13.0, 11.0, 12.0, 9.0, 8.0, 10.0, 4.0, 6.0, 7.0, 4.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.0017766952514648438, -0.0017218589782714844, -0.001667022705078125, -0.0016121864318847656, -0.0015573501586914062, -0.0015025138854980469, -0.0014476776123046875, -0.0013928413391113281, -0.0013380050659179688, -0.0012831687927246094, -0.00122833251953125, -0.0011734962463378906, -0.0011186599731445312, -0.0010638236999511719, -0.0010089874267578125, -0.0009541511535644531, -0.0008993148803710938, -0.0008444786071777344, -0.000789642333984375, -0.0007348060607910156, -0.0006799697875976562, -0.0006251335144042969, -0.0005702972412109375, -0.0005154609680175781, -0.00046062469482421875, -0.0004057884216308594, -0.0003509521484375, -0.0002961158752441406, -0.00024127960205078125, -0.00018644332885742188, -0.0001316070556640625, -7.677078247070312e-05, -2.193450927734375e-05, 3.2901763916015625e-05, 8.7738037109375e-05, 0.00014257431030273438, 0.00019741058349609375, 0.0002522468566894531, 0.0003070831298828125, 0.0003619194030761719, 0.00041675567626953125, 0.0004715919494628906, 0.00052642822265625, 0.0005812644958496094, 0.0006361007690429688, 0.0006909370422363281, 0.0007457733154296875, 0.0008006095886230469, 0.0008554458618164062, 0.0009102821350097656, 0.000965118408203125, 0.0010199546813964844, 0.0010747909545898438, 0.0011296272277832031, 0.0011844635009765625, 0.0012392997741699219, 0.0012941360473632812, 0.0013489723205566406, 0.00140380859375, 0.0014586448669433594, 0.0015134811401367188, 0.0015683174133300781, 0.0016231536865234375, 0.0016779899597167969, 0.0017328262329101562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 11.0, 28.0, 61.0, 84.0, 168.0, 426.0, 959.0, 2873.0, 13586.0, 212112.0, 774183.0, 36348.0, 5124.0, 1485.0, 568.0, 236.0, 141.0, 66.0, 30.0, 17.0, 16.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9765625, -14.55126953125, -14.1259765625, -13.70068359375, -13.275390625, -12.85009765625, -12.4248046875, -11.99951171875, -11.57421875, -11.14892578125, -10.7236328125, -10.29833984375, -9.873046875, -9.44775390625, -9.0224609375, -8.59716796875, -8.171875, -7.74658203125, -7.3212890625, -6.89599609375, -6.470703125, -6.04541015625, -5.6201171875, -5.19482421875, -4.76953125, -4.34423828125, -3.9189453125, -3.49365234375, -3.068359375, -2.64306640625, -2.2177734375, -1.79248046875, -1.3671875, -0.94189453125, -0.5166015625, -0.09130859375, 0.333984375, 0.75927734375, 1.1845703125, 1.60986328125, 2.03515625, 2.46044921875, 2.8857421875, 3.31103515625, 3.736328125, 4.16162109375, 4.5869140625, 5.01220703125, 5.4375, 5.86279296875, 6.2880859375, 6.71337890625, 7.138671875, 7.56396484375, 7.9892578125, 8.41455078125, 8.83984375, 9.26513671875, 9.6904296875, 10.11572265625, 10.541015625, 10.96630859375, 11.3916015625, 11.81689453125, 12.2421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 2.0, 7.0, 9.0, 16.0, 16.0, 11.0, 23.0, 18.0, 42.0, 41.0, 48.0, 54.0, 71.0, 71.0, 84.0, 84.0, 63.0, 68.0, 45.0, 50.0, 33.0, 34.0, 25.0, 25.0, 15.0, 15.0, 6.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7109375, -6.48797607421875, -6.2650146484375, -6.04205322265625, -5.819091796875, -5.59613037109375, -5.3731689453125, -5.15020751953125, -4.92724609375, -4.70428466796875, -4.4813232421875, -4.25836181640625, -4.035400390625, -3.81243896484375, -3.5894775390625, -3.36651611328125, -3.1435546875, -2.92059326171875, -2.6976318359375, -2.47467041015625, -2.251708984375, -2.02874755859375, -1.8057861328125, -1.58282470703125, -1.35986328125, -1.13690185546875, -0.9139404296875, -0.69097900390625, -0.468017578125, -0.24505615234375, -0.0220947265625, 0.20086669921875, 0.423828125, 0.64678955078125, 0.8697509765625, 1.09271240234375, 1.315673828125, 1.53863525390625, 1.7615966796875, 1.98455810546875, 2.20751953125, 2.43048095703125, 2.6534423828125, 2.87640380859375, 3.099365234375, 3.32232666015625, 3.5452880859375, 3.76824951171875, 3.9912109375, 4.21417236328125, 4.4371337890625, 4.66009521484375, 4.883056640625, 5.10601806640625, 5.3289794921875, 5.55194091796875, 5.77490234375, 5.99786376953125, 6.2208251953125, 6.44378662109375, 6.666748046875, 6.88970947265625, 7.1126708984375, 7.33563232421875, 7.55859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 7.0, 13.0, 31.0, 66.0, 102.0, 165.0, 231.0, 147.0, 76.0, 70.0, 32.0, 16.0, 10.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.60125732421875, -212.82029724121094, -206.0393524169922, -199.25839233398438, -192.47744750976562, -185.6964874267578, -178.91554260253906, -172.13458251953125, -165.3536376953125, -158.5726776123047, -151.79173278808594, -145.01077270507812, -138.22982788085938, -131.44886779785156, -124.66792297363281, -117.886962890625, -111.10601043701172, -104.32505798339844, -97.54410552978516, -90.76315307617188, -83.9822006225586, -77.20124816894531, -70.4202880859375, -63.639339447021484, -56.8583869934082, -50.07743453979492, -43.29648208618164, -36.515525817871094, -29.734575271606445, -22.95362091064453, -16.17266845703125, -9.391716003417969, -2.6107635498046875, 4.170189380645752, 10.951142311096191, 17.73209571838379, 24.51304817199707, 31.294002532958984, 38.074954986572266, 44.85590744018555, 51.63685989379883, 58.41781234741211, 65.19876861572266, 71.97972106933594, 78.76067352294922, 85.5416259765625, 92.32257843017578, 99.10353088378906, 105.88448333740234, 112.66543579101562, 119.4463882446289, 126.22734069824219, 133.00830078125, 139.78924560546875, 146.57020568847656, 153.3511505126953, 160.13211059570312, 166.91307067871094, 173.6940155029297, 180.4749755859375, 187.25592041015625, 194.03688049316406, 200.8178253173828, 207.59878540039062, 214.37973022460938]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 3.0, 9.0, 9.0, 12.0, 17.0, 24.0, 19.0, 21.0, 27.0, 28.0, 37.0, 26.0, 35.0, 37.0, 43.0, 58.0, 81.0, 76.0, 52.0, 45.0, 60.0, 42.0, 34.0, 28.0, 29.0, 26.0, 17.0, 22.0, 15.0, 11.0, 6.0, 11.0, 10.0, 3.0, 3.0, 3.0, 8.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-145.24365234375, -140.96322631835938, -136.6827850341797, -132.40235900878906, -128.12193298339844, -123.84149932861328, -119.56106567382812, -115.2806396484375, -111.00021362304688, -106.71977996826172, -102.4393539428711, -98.15892028808594, -93.87849426269531, -89.59806060791016, -85.317626953125, -81.03720092773438, -76.75676727294922, -72.47633361816406, -68.19590759277344, -63.91547393798828, -59.635047912597656, -55.3546142578125, -51.07418441772461, -46.79375457763672, -42.51332473754883, -38.23289489746094, -33.95246505737305, -29.672033309936523, -25.391603469848633, -21.111173629760742, -16.83074188232422, -12.550312042236328, -8.269882202148438, -3.9894518852233887, 0.29097843170166016, 4.571409225463867, 8.851839065551758, 13.132268905639648, 17.412700653076172, 21.693130493164062, 25.973560333251953, 30.253990173339844, 34.534420013427734, 38.814849853515625, 43.09528350830078, 47.375709533691406, 51.65614318847656, 55.93657302856445, 60.217002868652344, 64.4974365234375, 68.77786254882812, 73.05829620361328, 77.3387222290039, 81.61915588378906, 85.89958190917969, 90.18001556396484, 94.46044921875, 98.74088287353516, 103.02130889892578, 107.30174255371094, 111.58216857910156, 115.86260223388672, 120.14303588867188, 124.4234619140625, 128.70388793945312]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 9.0, 15.0, 13.0, 17.0, 34.0, 51.0, 84.0, 107.0, 217.0, 436.0, 767.0, 1524.0, 3615.0, 8955.0, 26043.0, 92947.0, 566098.0, 2564079.0, 765033.0, 117773.0, 29447.0, 9750.0, 3832.0, 1630.0, 745.0, 428.0, 229.0, 123.0, 91.0, 60.0, 48.0, 21.0, 16.0, 7.0, 7.0, 4.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.921875, -9.5745849609375, -9.227294921875, -8.8800048828125, -8.53271484375, -8.1854248046875, -7.838134765625, -7.4908447265625, -7.1435546875, -6.7962646484375, -6.448974609375, -6.1016845703125, -5.75439453125, -5.4071044921875, -5.059814453125, -4.7125244140625, -4.365234375, -4.0179443359375, -3.670654296875, -3.3233642578125, -2.97607421875, -2.6287841796875, -2.281494140625, -1.9342041015625, -1.5869140625, -1.2396240234375, -0.892333984375, -0.5450439453125, -0.19775390625, 0.1495361328125, 0.496826171875, 0.8441162109375, 1.19140625, 1.5386962890625, 1.885986328125, 2.2332763671875, 2.58056640625, 2.9278564453125, 3.275146484375, 3.6224365234375, 3.9697265625, 4.3170166015625, 4.664306640625, 5.0115966796875, 5.35888671875, 5.7061767578125, 6.053466796875, 6.4007568359375, 6.748046875, 7.0953369140625, 7.442626953125, 7.7899169921875, 8.13720703125, 8.4844970703125, 8.831787109375, 9.1790771484375, 9.5263671875, 9.8736572265625, 10.220947265625, 10.5682373046875, 10.91552734375, 11.2628173828125, 11.610107421875, 11.9573974609375, 12.3046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 6.0, 15.0, 14.0, 15.0, 19.0, 22.0, 27.0, 44.0, 41.0, 64.0, 49.0, 69.0, 64.0, 60.0, 62.0, 62.0, 65.0, 59.0, 49.0, 44.0, 33.0, 21.0, 24.0, 19.0, 9.0, 12.0, 10.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.6356201171875, -8.310302734375, -7.9849853515625, -7.65966796875, -7.3343505859375, -7.009033203125, -6.6837158203125, -6.3583984375, -6.0330810546875, -5.707763671875, -5.3824462890625, -5.05712890625, -4.7318115234375, -4.406494140625, -4.0811767578125, -3.755859375, -3.4305419921875, -3.105224609375, -2.7799072265625, -2.45458984375, -2.1292724609375, -1.803955078125, -1.4786376953125, -1.1533203125, -0.8280029296875, -0.502685546875, -0.1773681640625, 0.14794921875, 0.4732666015625, 0.798583984375, 1.1239013671875, 1.44921875, 1.7745361328125, 2.099853515625, 2.4251708984375, 2.75048828125, 3.0758056640625, 3.401123046875, 3.7264404296875, 4.0517578125, 4.3770751953125, 4.702392578125, 5.0277099609375, 5.35302734375, 5.6783447265625, 6.003662109375, 6.3289794921875, 6.654296875, 6.9796142578125, 7.304931640625, 7.6302490234375, 7.95556640625, 8.2808837890625, 8.606201171875, 8.9315185546875, 9.2568359375, 9.5821533203125, 9.907470703125, 10.2327880859375, 10.55810546875, 10.8834228515625, 11.208740234375, 11.5340576171875, 11.859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 7.0, 6.0, 10.0, 18.0, 36.0, 38.0, 58.0, 106.0, 186.0, 359.0, 742.0, 1878.0, 5512.0, 18748.0, 86441.0, 1010641.0, 2862775.0, 169224.0, 27368.0, 6617.0, 2064.0, 759.0, 343.0, 172.0, 70.0, 42.0, 22.0, 13.0, 14.0, 9.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.296875, -25.673583984375, -25.05029296875, -24.427001953125, -23.8037109375, -23.180419921875, -22.55712890625, -21.933837890625, -21.310546875, -20.687255859375, -20.06396484375, -19.440673828125, -18.8173828125, -18.194091796875, -17.57080078125, -16.947509765625, -16.32421875, -15.700927734375, -15.07763671875, -14.454345703125, -13.8310546875, -13.207763671875, -12.58447265625, -11.961181640625, -11.337890625, -10.714599609375, -10.09130859375, -9.468017578125, -8.8447265625, -8.221435546875, -7.59814453125, -6.974853515625, -6.3515625, -5.728271484375, -5.10498046875, -4.481689453125, -3.8583984375, -3.235107421875, -2.61181640625, -1.988525390625, -1.365234375, -0.741943359375, -0.11865234375, 0.504638671875, 1.1279296875, 1.751220703125, 2.37451171875, 2.997802734375, 3.62109375, 4.244384765625, 4.86767578125, 5.490966796875, 6.1142578125, 6.737548828125, 7.36083984375, 7.984130859375, 8.607421875, 9.230712890625, 9.85400390625, 10.477294921875, 11.1005859375, 11.723876953125, 12.34716796875, 12.970458984375, 13.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 4.0, 12.0, 6.0, 12.0, 13.0, 22.0, 20.0, 28.0, 41.0, 44.0, 65.0, 103.0, 170.0, 296.0, 513.0, 755.0, 749.0, 472.0, 311.0, 148.0, 94.0, 54.0, 35.0, 31.0, 19.0, 17.0, 14.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.828125, -26.156494140625, -25.48486328125, -24.813232421875, -24.1416015625, -23.469970703125, -22.79833984375, -22.126708984375, -21.455078125, -20.783447265625, -20.11181640625, -19.440185546875, -18.7685546875, -18.096923828125, -17.42529296875, -16.753662109375, -16.08203125, -15.410400390625, -14.73876953125, -14.067138671875, -13.3955078125, -12.723876953125, -12.05224609375, -11.380615234375, -10.708984375, -10.037353515625, -9.36572265625, -8.694091796875, -8.0224609375, -7.350830078125, -6.67919921875, -6.007568359375, -5.3359375, -4.664306640625, -3.99267578125, -3.321044921875, -2.6494140625, -1.977783203125, -1.30615234375, -0.634521484375, 0.037109375, 0.708740234375, 1.38037109375, 2.052001953125, 2.7236328125, 3.395263671875, 4.06689453125, 4.738525390625, 5.41015625, 6.081787109375, 6.75341796875, 7.425048828125, 8.0966796875, 8.768310546875, 9.43994140625, 10.111572265625, 10.783203125, 11.454833984375, 12.12646484375, 12.798095703125, 13.4697265625, 14.141357421875, 14.81298828125, 15.484619140625, 16.15625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 15.0, 32.0, 82.0, 195.0, 280.0, 214.0, 100.0, 36.0, 16.0, 5.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-180.15786743164062, -171.47311401367188, -162.78836059570312, -154.10360717773438, -145.41885375976562, -136.73410034179688, -128.0493621826172, -119.36460876464844, -110.67985534667969, -101.99510192871094, -93.31034851074219, -84.62560272216797, -75.94084930419922, -67.25609588623047, -58.571346282958984, -49.8865966796875, -41.20184326171875, -32.51708984375, -23.832340240478516, -15.147588729858398, -6.462837219238281, 2.2219161987304688, 10.906665802001953, 19.591415405273438, 28.276168823242188, 36.96092224121094, 45.64567184448242, 54.330421447753906, 63.015174865722656, 71.6999282836914, 80.38467407226562, 89.06942749023438, 97.75421142578125, 106.43896484375, 115.12371826171875, 123.80846405029297, 132.49322509765625, 141.177978515625, 149.8627166748047, 158.54747009277344, 167.2322235107422, 175.91697692871094, 184.6017303466797, 193.28648376464844, 201.97122192382812, 210.65597534179688, 219.34072875976562, 228.02548217773438, 236.71023559570312, 245.39498901367188, 254.07974243164062, 262.7644958496094, 271.4492492675781, 280.1340026855469, 288.8187561035156, 297.50347900390625, 306.188232421875, 314.87298583984375, 323.5577392578125, 332.24249267578125, 340.92724609375, 349.61199951171875, 358.2967529296875, 366.98150634765625, 375.666259765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 11.0, 18.0, 20.0, 24.0, 25.0, 40.0, 38.0, 35.0, 49.0, 52.0, 59.0, 45.0, 46.0, 55.0, 77.0, 45.0, 51.0, 46.0, 46.0, 38.0, 30.0, 22.0, 22.0, 23.0, 17.0, 15.0, 9.0, 9.0, 12.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.65245819091797, -122.11328125, -118.57410430908203, -115.03492736816406, -111.49575805664062, -107.95658111572266, -104.41740417480469, -100.87822723388672, -97.33905029296875, -93.79987335205078, -90.26069641113281, -86.72152709960938, -83.1823501586914, -79.64317321777344, -76.10399627685547, -72.5648193359375, -69.02565002441406, -65.4864730834961, -61.94729995727539, -58.40812301635742, -54.86894989013672, -51.32977294921875, -47.79059600830078, -44.25141906738281, -40.71224594116211, -37.17306900024414, -33.63389587402344, -30.09471893310547, -26.555543899536133, -23.016368865966797, -19.477191925048828, -15.938016891479492, -12.398834228515625, -8.859659194946289, -5.320483207702637, -1.7813072204589844, 1.7578678131103516, 5.2970428466796875, 8.836219787597656, 12.375394821166992, 15.914569854736328, 19.453744888305664, 22.992919921875, 26.53209686279297, 30.071271896362305, 33.61044692993164, 37.14962387084961, 40.68879699707031, 44.22797393798828, 47.76715087890625, 51.30632400512695, 54.84550094604492, 58.384674072265625, 61.923851013183594, 65.46302795410156, 69.00220489501953, 72.5413818359375, 76.08055877685547, 79.61973571777344, 83.15890502929688, 86.69808197021484, 90.23725891113281, 93.77643585205078, 97.31561279296875, 100.85478210449219]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 11.0, 26.0, 28.0, 55.0, 74.0, 86.0, 185.0, 228.0, 379.0, 556.0, 902.0, 1479.0, 2428.0, 3966.0, 6731.0, 11830.0, 21297.0, 38661.0, 74579.0, 155603.0, 282237.0, 222408.0, 106181.0, 52859.0, 28181.0, 15573.0, 8714.0, 5136.0, 3059.0, 1880.0, 1148.0, 753.0, 434.0, 267.0, 184.0, 131.0, 81.0, 63.0, 37.0, 27.0, 16.0, 17.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.0828857421875, -9.743896484375, -9.4049072265625, -9.06591796875, -8.7269287109375, -8.387939453125, -8.0489501953125, -7.7099609375, -7.3709716796875, -7.031982421875, -6.6929931640625, -6.35400390625, -6.0150146484375, -5.676025390625, -5.3370361328125, -4.998046875, -4.6590576171875, -4.320068359375, -3.9810791015625, -3.64208984375, -3.3031005859375, -2.964111328125, -2.6251220703125, -2.2861328125, -1.9471435546875, -1.608154296875, -1.2691650390625, -0.93017578125, -0.5911865234375, -0.252197265625, 0.0867919921875, 0.42578125, 0.7647705078125, 1.103759765625, 1.4427490234375, 1.78173828125, 2.1207275390625, 2.459716796875, 2.7987060546875, 3.1376953125, 3.4766845703125, 3.815673828125, 4.1546630859375, 4.49365234375, 4.8326416015625, 5.171630859375, 5.5106201171875, 5.849609375, 6.1885986328125, 6.527587890625, 6.8665771484375, 7.20556640625, 7.5445556640625, 7.883544921875, 8.2225341796875, 8.5615234375, 8.9005126953125, 9.239501953125, 9.5784912109375, 9.91748046875, 10.2564697265625, 10.595458984375, 10.9344482421875, 11.2734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 7.0, 10.0, 18.0, 15.0, 28.0, 26.0, 37.0, 47.0, 46.0, 51.0, 47.0, 57.0, 59.0, 58.0, 56.0, 58.0, 39.0, 60.0, 44.0, 41.0, 37.0, 32.0, 21.0, 22.0, 10.0, 13.0, 13.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.171875, -8.86767578125, -8.5634765625, -8.25927734375, -7.955078125, -7.65087890625, -7.3466796875, -7.04248046875, -6.73828125, -6.43408203125, -6.1298828125, -5.82568359375, -5.521484375, -5.21728515625, -4.9130859375, -4.60888671875, -4.3046875, -4.00048828125, -3.6962890625, -3.39208984375, -3.087890625, -2.78369140625, -2.4794921875, -2.17529296875, -1.87109375, -1.56689453125, -1.2626953125, -0.95849609375, -0.654296875, -0.35009765625, -0.0458984375, 0.25830078125, 0.5625, 0.86669921875, 1.1708984375, 1.47509765625, 1.779296875, 2.08349609375, 2.3876953125, 2.69189453125, 2.99609375, 3.30029296875, 3.6044921875, 3.90869140625, 4.212890625, 4.51708984375, 4.8212890625, 5.12548828125, 5.4296875, 5.73388671875, 6.0380859375, 6.34228515625, 6.646484375, 6.95068359375, 7.2548828125, 7.55908203125, 7.86328125, 8.16748046875, 8.4716796875, 8.77587890625, 9.080078125, 9.38427734375, 9.6884765625, 9.99267578125, 10.296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 3.0, 16.0, 16.0, 23.0, 45.0, 52.0, 70.0, 106.0, 163.0, 236.0, 339.0, 619.0, 1016.0, 1801.0, 4431.0, 16592.0, 110744.0, 769012.0, 116949.0, 17181.0, 4565.0, 1786.0, 1015.0, 591.0, 372.0, 261.0, 176.0, 98.0, 93.0, 47.0, 41.0, 28.0, 20.0, 15.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-41.125, -40.05712890625, -38.9892578125, -37.92138671875, -36.853515625, -35.78564453125, -34.7177734375, -33.64990234375, -32.58203125, -31.51416015625, -30.4462890625, -29.37841796875, -28.310546875, -27.24267578125, -26.1748046875, -25.10693359375, -24.0390625, -22.97119140625, -21.9033203125, -20.83544921875, -19.767578125, -18.69970703125, -17.6318359375, -16.56396484375, -15.49609375, -14.42822265625, -13.3603515625, -12.29248046875, -11.224609375, -10.15673828125, -9.0888671875, -8.02099609375, -6.953125, -5.88525390625, -4.8173828125, -3.74951171875, -2.681640625, -1.61376953125, -0.5458984375, 0.52197265625, 1.58984375, 2.65771484375, 3.7255859375, 4.79345703125, 5.861328125, 6.92919921875, 7.9970703125, 9.06494140625, 10.1328125, 11.20068359375, 12.2685546875, 13.33642578125, 14.404296875, 15.47216796875, 16.5400390625, 17.60791015625, 18.67578125, 19.74365234375, 20.8115234375, 21.87939453125, 22.947265625, 24.01513671875, 25.0830078125, 26.15087890625, 27.21875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 16.0, 16.0, 19.0, 29.0, 27.0, 28.0, 32.0, 40.0, 44.0, 52.0, 50.0, 58.0, 63.0, 58.0, 57.0, 50.0, 50.0, 41.0, 44.0, 30.0, 25.0, 27.0, 23.0, 20.0, 11.0, 15.0, 13.0, 6.0, 8.0, 0.0, 3.0, 3.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.734375, -29.636474609375, -28.53857421875, -27.440673828125, -26.3427734375, -25.244873046875, -24.14697265625, -23.049072265625, -21.951171875, -20.853271484375, -19.75537109375, -18.657470703125, -17.5595703125, -16.461669921875, -15.36376953125, -14.265869140625, -13.16796875, -12.070068359375, -10.97216796875, -9.874267578125, -8.7763671875, -7.678466796875, -6.58056640625, -5.482666015625, -4.384765625, -3.286865234375, -2.18896484375, -1.091064453125, 0.0068359375, 1.104736328125, 2.20263671875, 3.300537109375, 4.3984375, 5.496337890625, 6.59423828125, 7.692138671875, 8.7900390625, 9.887939453125, 10.98583984375, 12.083740234375, 13.181640625, 14.279541015625, 15.37744140625, 16.475341796875, 17.5732421875, 18.671142578125, 19.76904296875, 20.866943359375, 21.96484375, 23.062744140625, 24.16064453125, 25.258544921875, 26.3564453125, 27.454345703125, 28.55224609375, 29.650146484375, 30.748046875, 31.845947265625, 32.94384765625, 34.041748046875, 35.1396484375, 36.237548828125, 37.33544921875, 38.433349609375, 39.53125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 6.0, 11.0, 29.0, 42.0, 91.0, 162.0, 486.0, 2137.0, 33712.0, 945882.0, 62081.0, 2959.0, 571.0, 193.0, 79.0, 47.0, 23.0, 17.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.3310546875, -16.724609375, -16.1181640625, -15.51171875, -14.9052734375, -14.298828125, -13.6923828125, -13.0859375, -12.4794921875, -11.873046875, -11.2666015625, -10.66015625, -10.0537109375, -9.447265625, -8.8408203125, -8.234375, -7.6279296875, -7.021484375, -6.4150390625, -5.80859375, -5.2021484375, -4.595703125, -3.9892578125, -3.3828125, -2.7763671875, -2.169921875, -1.5634765625, -0.95703125, -0.3505859375, 0.255859375, 0.8623046875, 1.46875, 2.0751953125, 2.681640625, 3.2880859375, 3.89453125, 4.5009765625, 5.107421875, 5.7138671875, 6.3203125, 6.9267578125, 7.533203125, 8.1396484375, 8.74609375, 9.3525390625, 9.958984375, 10.5654296875, 11.171875, 11.7783203125, 12.384765625, 12.9912109375, 13.59765625, 14.2041015625, 14.810546875, 15.4169921875, 16.0234375, 16.6298828125, 17.236328125, 17.8427734375, 18.44921875, 19.0556640625, 19.662109375, 20.2685546875, 20.875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 1.0, 10.0, 6.0, 12.0, 15.0, 17.0, 15.0, 21.0, 22.0, 34.0, 49.0, 46.0, 80.0, 87.0, 96.0, 82.0, 85.0, 57.0, 54.0, 34.0, 29.0, 19.0, 21.0, 13.0, 15.0, 13.0, 12.0, 10.0, 10.0, 4.0, 8.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016641616821289062, -0.0016119331121444702, -0.0015597045421600342, -0.0015074759721755981, -0.0014552474021911621, -0.001403018832206726, -0.00135079026222229, -0.001298561692237854, -0.001246333122253418, -0.001194104552268982, -0.001141875982284546, -0.0010896474123001099, -0.0010374188423156738, -0.0009851902723312378, -0.0009329617023468018, -0.0008807331323623657, -0.0008285045623779297, -0.0007762759923934937, -0.0007240474224090576, -0.0006718188524246216, -0.0006195902824401855, -0.0005673617124557495, -0.0005151331424713135, -0.00046290457248687744, -0.0004106760025024414, -0.00035844743251800537, -0.00030621886253356934, -0.0002539902925491333, -0.00020176172256469727, -0.00014953315258026123, -9.73045825958252e-05, -4.507601261138916e-05, 7.152557373046875e-06, 5.938112735748291e-05, 0.00011160969734191895, 0.00016383826732635498, 0.00021606683731079102, 0.00026829540729522705, 0.0003205239772796631, 0.0003727525472640991, 0.00042498111724853516, 0.0004772096872329712, 0.0005294382572174072, 0.0005816668272018433, 0.0006338953971862793, 0.0006861239671707153, 0.0007383525371551514, 0.0007905811071395874, 0.0008428096771240234, 0.0008950382471084595, 0.0009472668170928955, 0.0009994953870773315, 0.0010517239570617676, 0.0011039525270462036, 0.0011561810970306396, 0.0012084096670150757, 0.0012606382369995117, 0.0013128668069839478, 0.0013650953769683838, 0.0014173239469528198, 0.0014695525169372559, 0.001521781086921692, 0.001574009656906128, 0.001626238226890564, 0.001678466796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 11.0, 6.0, 14.0, 9.0, 28.0, 27.0, 60.0, 88.0, 141.0, 287.0, 567.0, 1206.0, 2936.0, 9110.0, 54995.0, 718321.0, 230033.0, 21752.0, 5215.0, 1971.0, 850.0, 420.0, 202.0, 104.0, 80.0, 35.0, 30.0, 17.0, 14.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.8934326171875, -5.622802734375, -5.3521728515625, -5.08154296875, -4.8109130859375, -4.540283203125, -4.2696533203125, -3.9990234375, -3.7283935546875, -3.457763671875, -3.1871337890625, -2.91650390625, -2.6458740234375, -2.375244140625, -2.1046142578125, -1.833984375, -1.5633544921875, -1.292724609375, -1.0220947265625, -0.75146484375, -0.4808349609375, -0.210205078125, 0.0604248046875, 0.3310546875, 0.6016845703125, 0.872314453125, 1.1429443359375, 1.41357421875, 1.6842041015625, 1.954833984375, 2.2254638671875, 2.49609375, 2.7667236328125, 3.037353515625, 3.3079833984375, 3.57861328125, 3.8492431640625, 4.119873046875, 4.3905029296875, 4.6611328125, 4.9317626953125, 5.202392578125, 5.4730224609375, 5.74365234375, 6.0142822265625, 6.284912109375, 6.5555419921875, 6.826171875, 7.0968017578125, 7.367431640625, 7.6380615234375, 7.90869140625, 8.1793212890625, 8.449951171875, 8.7205810546875, 8.9912109375, 9.2618408203125, 9.532470703125, 9.8031005859375, 10.07373046875, 10.3443603515625, 10.614990234375, 10.8856201171875, 11.15625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 8.0, 6.0, 14.0, 11.0, 18.0, 28.0, 26.0, 34.0, 43.0, 67.0, 55.0, 65.0, 89.0, 91.0, 82.0, 89.0, 58.0, 46.0, 39.0, 27.0, 20.0, 21.0, 11.0, 9.0, 7.0, 9.0, 3.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.398681640625, -5.21923828125, -5.039794921875, -4.8603515625, -4.680908203125, -4.50146484375, -4.322021484375, -4.142578125, -3.963134765625, -3.78369140625, -3.604248046875, -3.4248046875, -3.245361328125, -3.06591796875, -2.886474609375, -2.70703125, -2.527587890625, -2.34814453125, -2.168701171875, -1.9892578125, -1.809814453125, -1.63037109375, -1.450927734375, -1.271484375, -1.092041015625, -0.91259765625, -0.733154296875, -0.5537109375, -0.374267578125, -0.19482421875, -0.015380859375, 0.1640625, 0.343505859375, 0.52294921875, 0.702392578125, 0.8818359375, 1.061279296875, 1.24072265625, 1.420166015625, 1.599609375, 1.779052734375, 1.95849609375, 2.137939453125, 2.3173828125, 2.496826171875, 2.67626953125, 2.855712890625, 3.03515625, 3.214599609375, 3.39404296875, 3.573486328125, 3.7529296875, 3.932373046875, 4.11181640625, 4.291259765625, 4.470703125, 4.650146484375, 4.82958984375, 5.009033203125, 5.1884765625, 5.367919921875, 5.54736328125, 5.726806640625, 5.90625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 16.0, 34.0, 99.0, 244.0, 348.0, 146.0, 64.0, 19.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.90438842773438, -203.83253479003906, -193.76068115234375, -183.68882751464844, -173.61697387695312, -163.5451202392578, -153.4732666015625, -143.40142822265625, -133.32955932617188, -123.25770568847656, -113.18585205078125, -103.11399841308594, -93.04214477539062, -82.97029113769531, -72.89844512939453, -62.82659149169922, -52.75474548339844, -42.682891845703125, -32.61103820800781, -22.539188385009766, -12.467334747314453, -2.3954811096191406, 7.676368713378906, 17.74822235107422, 27.82007598876953, 37.891929626464844, 47.963783264160156, 58.0356330871582, 68.10748291015625, 78.17933654785156, 88.25119018554688, 98.32304382324219, 108.3948974609375, 118.46675109863281, 128.53860473632812, 138.61045837402344, 148.68231201171875, 158.75416564941406, 168.82601928710938, 178.89785766601562, 188.9697265625, 199.0415802001953, 209.11343383789062, 219.18528747558594, 229.25714111328125, 239.32899475097656, 249.40084838867188, 259.4726867675781, 269.5445556640625, 279.61639404296875, 289.6882629394531, 299.7601013183594, 309.83197021484375, 319.90380859375, 329.9756774902344, 340.0475158691406, 350.1193542480469, 360.1911926269531, 370.2630615234375, 380.33489990234375, 390.4067687988281, 400.4786071777344, 410.55047607421875, 420.622314453125, 430.6941833496094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 14.0, 8.0, 15.0, 14.0, 24.0, 10.0, 10.0, 19.0, 22.0, 30.0, 21.0, 23.0, 26.0, 30.0, 40.0, 48.0, 59.0, 69.0, 53.0, 51.0, 54.0, 28.0, 41.0, 50.0, 31.0, 25.0, 15.0, 23.0, 16.0, 18.0, 16.0, 12.0, 16.0, 9.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0], "bins": [-128.56396484375, -125.0047836303711, -121.44560241699219, -117.88642120361328, -114.32723999023438, -110.76805877685547, -107.20887756347656, -103.64969635009766, -100.09051513671875, -96.53133392333984, -92.97215270996094, -89.41297149658203, -85.85379028320312, -82.29460906982422, -78.73542785644531, -75.1762466430664, -71.6170654296875, -68.0578842163086, -64.49870300292969, -60.93952178955078, -57.380340576171875, -53.82115936279297, -50.26197814941406, -46.702796936035156, -43.14362335205078, -39.584442138671875, -36.02526092529297, -32.46607971191406, -28.906898498535156, -25.347719192504883, -21.788537979125977, -18.22935676574707, -14.670173645019531, -11.110992431640625, -7.551811695098877, -3.992630958557129, -0.43344974517822266, 3.125730514526367, 6.684911727905273, 10.24409294128418, 13.803274154663086, 17.362455368041992, 20.9216365814209, 24.480815887451172, 28.039997100830078, 31.599178314208984, 35.15835952758789, 38.7175407409668, 42.2767219543457, 45.83590316772461, 49.395084381103516, 52.95426559448242, 56.51344680786133, 60.07262420654297, 63.631805419921875, 67.19098663330078, 70.75016784667969, 74.3093490600586, 77.8685302734375, 81.4277114868164, 84.98689270019531, 88.54607391357422, 92.10525512695312, 95.66443634033203, 99.22361755371094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 10.0, 18.0, 21.0, 43.0, 75.0, 112.0, 162.0, 279.0, 492.0, 1068.0, 2122.0, 5110.0, 15876.0, 69730.0, 753155.0, 2873665.0, 406002.0, 47325.0, 11280.0, 4038.0, 1717.0, 857.0, 451.0, 242.0, 139.0, 94.0, 67.0, 40.0, 26.0, 17.0, 9.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.1875, -11.772705078125, -11.35791015625, -10.943115234375, -10.5283203125, -10.113525390625, -9.69873046875, -9.283935546875, -8.869140625, -8.454345703125, -8.03955078125, -7.624755859375, -7.2099609375, -6.795166015625, -6.38037109375, -5.965576171875, -5.55078125, -5.135986328125, -4.72119140625, -4.306396484375, -3.8916015625, -3.476806640625, -3.06201171875, -2.647216796875, -2.232421875, -1.817626953125, -1.40283203125, -0.988037109375, -0.5732421875, -0.158447265625, 0.25634765625, 0.671142578125, 1.0859375, 1.500732421875, 1.91552734375, 2.330322265625, 2.7451171875, 3.159912109375, 3.57470703125, 3.989501953125, 4.404296875, 4.819091796875, 5.23388671875, 5.648681640625, 6.0634765625, 6.478271484375, 6.89306640625, 7.307861328125, 7.72265625, 8.137451171875, 8.55224609375, 8.967041015625, 9.3818359375, 9.796630859375, 10.21142578125, 10.626220703125, 11.041015625, 11.455810546875, 11.87060546875, 12.285400390625, 12.7001953125, 13.114990234375, 13.52978515625, 13.944580078125, 14.359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 8.0, 5.0, 14.0, 13.0, 15.0, 18.0, 25.0, 29.0, 33.0, 46.0, 48.0, 60.0, 57.0, 71.0, 50.0, 57.0, 57.0, 38.0, 53.0, 60.0, 43.0, 43.0, 38.0, 27.0, 20.0, 20.0, 11.0, 5.0, 12.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0625, -8.7608642578125, -8.459228515625, -8.1575927734375, -7.85595703125, -7.5543212890625, -7.252685546875, -6.9510498046875, -6.6494140625, -6.3477783203125, -6.046142578125, -5.7445068359375, -5.44287109375, -5.1412353515625, -4.839599609375, -4.5379638671875, -4.236328125, -3.9346923828125, -3.633056640625, -3.3314208984375, -3.02978515625, -2.7281494140625, -2.426513671875, -2.1248779296875, -1.8232421875, -1.5216064453125, -1.219970703125, -0.9183349609375, -0.61669921875, -0.3150634765625, -0.013427734375, 0.2882080078125, 0.58984375, 0.8914794921875, 1.193115234375, 1.4947509765625, 1.79638671875, 2.0980224609375, 2.399658203125, 2.7012939453125, 3.0029296875, 3.3045654296875, 3.606201171875, 3.9078369140625, 4.20947265625, 4.5111083984375, 4.812744140625, 5.1143798828125, 5.416015625, 5.7176513671875, 6.019287109375, 6.3209228515625, 6.62255859375, 6.9241943359375, 7.225830078125, 7.5274658203125, 7.8291015625, 8.1307373046875, 8.432373046875, 8.7340087890625, 9.03564453125, 9.3372802734375, 9.638916015625, 9.9405517578125, 10.2421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 11.0, 10.0, 21.0, 38.0, 42.0, 84.0, 150.0, 312.0, 782.0, 1974.0, 6371.0, 25541.0, 192882.0, 3356710.0, 547018.0, 46153.0, 10565.0, 3205.0, 1294.0, 488.0, 248.0, 150.0, 73.0, 45.0, 25.0, 23.0, 13.0, 10.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.90625, -19.277587890625, -18.64892578125, -18.020263671875, -17.3916015625, -16.762939453125, -16.13427734375, -15.505615234375, -14.876953125, -14.248291015625, -13.61962890625, -12.990966796875, -12.3623046875, -11.733642578125, -11.10498046875, -10.476318359375, -9.84765625, -9.218994140625, -8.59033203125, -7.961669921875, -7.3330078125, -6.704345703125, -6.07568359375, -5.447021484375, -4.818359375, -4.189697265625, -3.56103515625, -2.932373046875, -2.3037109375, -1.675048828125, -1.04638671875, -0.417724609375, 0.2109375, 0.839599609375, 1.46826171875, 2.096923828125, 2.7255859375, 3.354248046875, 3.98291015625, 4.611572265625, 5.240234375, 5.868896484375, 6.49755859375, 7.126220703125, 7.7548828125, 8.383544921875, 9.01220703125, 9.640869140625, 10.26953125, 10.898193359375, 11.52685546875, 12.155517578125, 12.7841796875, 13.412841796875, 14.04150390625, 14.670166015625, 15.298828125, 15.927490234375, 16.55615234375, 17.184814453125, 17.8134765625, 18.442138671875, 19.07080078125, 19.699462890625, 20.328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 6.0, 12.0, 17.0, 28.0, 21.0, 48.0, 68.0, 113.0, 172.0, 300.0, 494.0, 739.0, 705.0, 469.0, 322.0, 169.0, 122.0, 86.0, 38.0, 34.0, 19.0, 13.0, 13.0, 10.0, 7.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.6201171875, -18.037109375, -17.4541015625, -16.87109375, -16.2880859375, -15.705078125, -15.1220703125, -14.5390625, -13.9560546875, -13.373046875, -12.7900390625, -12.20703125, -11.6240234375, -11.041015625, -10.4580078125, -9.875, -9.2919921875, -8.708984375, -8.1259765625, -7.54296875, -6.9599609375, -6.376953125, -5.7939453125, -5.2109375, -4.6279296875, -4.044921875, -3.4619140625, -2.87890625, -2.2958984375, -1.712890625, -1.1298828125, -0.546875, 0.0361328125, 0.619140625, 1.2021484375, 1.78515625, 2.3681640625, 2.951171875, 3.5341796875, 4.1171875, 4.7001953125, 5.283203125, 5.8662109375, 6.44921875, 7.0322265625, 7.615234375, 8.1982421875, 8.78125, 9.3642578125, 9.947265625, 10.5302734375, 11.11328125, 11.6962890625, 12.279296875, 12.8623046875, 13.4453125, 14.0283203125, 14.611328125, 15.1943359375, 15.77734375, 16.3603515625, 16.943359375, 17.5263671875, 18.109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 15.0, 53.0, 211.0, 466.0, 187.0, 50.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-395.7889404296875, -381.8563232421875, -367.9237365722656, -353.9911193847656, -340.05853271484375, -326.12591552734375, -312.19329833984375, -298.2607116699219, -284.328125, -270.3955078125, -256.4629211425781, -242.53030395507812, -228.59771728515625, -214.66510009765625, -200.7324981689453, -186.79989624023438, -172.86727905273438, -158.93467712402344, -145.0020751953125, -131.0694580078125, -117.1368637084961, -103.20426177978516, -89.27165222167969, -75.33905029296875, -61.40644836425781, -47.473846435546875, -33.54124069213867, -19.60863494873047, -5.676033020019531, 8.256568908691406, 22.189178466796875, 36.12178039550781, 50.054412841796875, 63.98701477050781, 77.91961669921875, 91.85222625732422, 105.78482818603516, 119.7174301147461, 133.65003967285156, 147.5826416015625, 161.51524353027344, 175.44784545898438, 189.3804473876953, 203.31304931640625, 217.24566650390625, 231.17825317382812, 245.11087036132812, 259.04345703125, 272.97607421875, 286.90869140625, 300.8412780761719, 314.7738952636719, 328.70648193359375, 342.63909912109375, 356.57171630859375, 370.5043029785156, 384.4368896484375, 398.3695068359375, 412.3020935058594, 426.2347106933594, 440.16729736328125, 454.09991455078125, 468.03253173828125, 481.9651184082031, 495.8977355957031]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 8.0, 10.0, 9.0, 10.0, 27.0, 16.0, 12.0, 37.0, 28.0, 39.0, 44.0, 38.0, 38.0, 52.0, 45.0, 51.0, 52.0, 52.0, 50.0, 53.0, 37.0, 37.0, 36.0, 29.0, 44.0, 30.0, 25.0, 17.0, 13.0, 5.0, 15.0, 7.0, 8.0, 4.0, 3.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-95.1252670288086, -92.31668853759766, -89.50811004638672, -86.69953918457031, -83.89096069335938, -81.08238220214844, -78.2738037109375, -75.46522521972656, -72.65664672851562, -69.84806823730469, -67.03948974609375, -64.23091125488281, -61.422340393066406, -58.61376190185547, -55.80518341064453, -52.996604919433594, -50.18803405761719, -47.37945556640625, -44.57088088989258, -41.76230239868164, -38.95372772216797, -36.14514923095703, -33.336570739746094, -30.52799415588379, -27.719417572021484, -24.91084098815918, -22.102264404296875, -19.293685913085938, -16.485109329223633, -13.676532745361328, -10.86795425415039, -8.059377670288086, -5.2508087158203125, -2.4422316551208496, 0.3663454055786133, 3.1749229431152344, 5.983499526977539, 8.792076110839844, 11.600654602050781, 14.409231185913086, 17.21780776977539, 20.026384353637695, 22.8349609375, 25.643539428710938, 28.452116012573242, 31.260692596435547, 34.069271087646484, 36.877845764160156, 39.686424255371094, 42.49500274658203, 45.3035774230957, 48.11215591430664, 50.92073059082031, 53.72930908203125, 56.53788757324219, 59.346466064453125, 62.1550407409668, 64.96361541748047, 67.7721939086914, 70.58077239990234, 73.38935089111328, 76.19792175292969, 79.00650024414062, 81.81507873535156, 84.6236572265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 8.0, 9.0, 10.0, 29.0, 33.0, 45.0, 75.0, 110.0, 164.0, 305.0, 521.0, 800.0, 1407.0, 2541.0, 4910.0, 9540.0, 20308.0, 46357.0, 110041.0, 235925.0, 298216.0, 176768.0, 77195.0, 32541.0, 14838.0, 7143.0, 3735.0, 1960.0, 1190.0, 703.0, 393.0, 252.0, 162.0, 99.0, 68.0, 52.0, 31.0, 22.0, 11.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.046875, -9.75390625, -9.4609375, -9.16796875, -8.875, -8.58203125, -8.2890625, -7.99609375, -7.703125, -7.41015625, -7.1171875, -6.82421875, -6.53125, -6.23828125, -5.9453125, -5.65234375, -5.359375, -5.06640625, -4.7734375, -4.48046875, -4.1875, -3.89453125, -3.6015625, -3.30859375, -3.015625, -2.72265625, -2.4296875, -2.13671875, -1.84375, -1.55078125, -1.2578125, -0.96484375, -0.671875, -0.37890625, -0.0859375, 0.20703125, 0.5, 0.79296875, 1.0859375, 1.37890625, 1.671875, 1.96484375, 2.2578125, 2.55078125, 2.84375, 3.13671875, 3.4296875, 3.72265625, 4.015625, 4.30859375, 4.6015625, 4.89453125, 5.1875, 5.48046875, 5.7734375, 6.06640625, 6.359375, 6.65234375, 6.9453125, 7.23828125, 7.53125, 7.82421875, 8.1171875, 8.41015625, 8.703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 8.0, 19.0, 14.0, 10.0, 27.0, 17.0, 19.0, 36.0, 35.0, 49.0, 42.0, 53.0, 61.0, 50.0, 64.0, 58.0, 49.0, 57.0, 42.0, 45.0, 38.0, 54.0, 29.0, 19.0, 22.0, 18.0, 10.0, 11.0, 11.0, 9.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8984375, -8.600830078125, -8.30322265625, -8.005615234375, -7.7080078125, -7.410400390625, -7.11279296875, -6.815185546875, -6.517578125, -6.219970703125, -5.92236328125, -5.624755859375, -5.3271484375, -5.029541015625, -4.73193359375, -4.434326171875, -4.13671875, -3.839111328125, -3.54150390625, -3.243896484375, -2.9462890625, -2.648681640625, -2.35107421875, -2.053466796875, -1.755859375, -1.458251953125, -1.16064453125, -0.863037109375, -0.5654296875, -0.267822265625, 0.02978515625, 0.327392578125, 0.625, 0.922607421875, 1.22021484375, 1.517822265625, 1.8154296875, 2.113037109375, 2.41064453125, 2.708251953125, 3.005859375, 3.303466796875, 3.60107421875, 3.898681640625, 4.1962890625, 4.493896484375, 4.79150390625, 5.089111328125, 5.38671875, 5.684326171875, 5.98193359375, 6.279541015625, 6.5771484375, 6.874755859375, 7.17236328125, 7.469970703125, 7.767578125, 8.065185546875, 8.36279296875, 8.660400390625, 8.9580078125, 9.255615234375, 9.55322265625, 9.850830078125, 10.1484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 16.0, 20.0, 27.0, 30.0, 56.0, 80.0, 162.0, 291.0, 664.0, 1642.0, 4895.0, 18732.0, 105401.0, 687303.0, 189633.0, 28814.0, 6902.0, 2157.0, 848.0, 361.0, 172.0, 116.0, 70.0, 36.0, 28.0, 13.0, 11.0, 13.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.156982421875, -23.43896484375, -22.720947265625, -22.0029296875, -21.284912109375, -20.56689453125, -19.848876953125, -19.130859375, -18.412841796875, -17.69482421875, -16.976806640625, -16.2587890625, -15.540771484375, -14.82275390625, -14.104736328125, -13.38671875, -12.668701171875, -11.95068359375, -11.232666015625, -10.5146484375, -9.796630859375, -9.07861328125, -8.360595703125, -7.642578125, -6.924560546875, -6.20654296875, -5.488525390625, -4.7705078125, -4.052490234375, -3.33447265625, -2.616455078125, -1.8984375, -1.180419921875, -0.46240234375, 0.255615234375, 0.9736328125, 1.691650390625, 2.40966796875, 3.127685546875, 3.845703125, 4.563720703125, 5.28173828125, 5.999755859375, 6.7177734375, 7.435791015625, 8.15380859375, 8.871826171875, 9.58984375, 10.307861328125, 11.02587890625, 11.743896484375, 12.4619140625, 13.179931640625, 13.89794921875, 14.615966796875, 15.333984375, 16.052001953125, 16.77001953125, 17.488037109375, 18.2060546875, 18.924072265625, 19.64208984375, 20.360107421875, 21.078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 13.0, 7.0, 7.0, 14.0, 14.0, 21.0, 32.0, 26.0, 31.0, 37.0, 44.0, 39.0, 46.0, 45.0, 54.0, 58.0, 53.0, 33.0, 41.0, 58.0, 40.0, 31.0, 30.0, 29.0, 17.0, 29.0, 20.0, 19.0, 16.0, 9.0, 11.0, 7.0, 8.0, 8.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-27.53125, -26.6123046875, -25.693359375, -24.7744140625, -23.85546875, -22.9365234375, -22.017578125, -21.0986328125, -20.1796875, -19.2607421875, -18.341796875, -17.4228515625, -16.50390625, -15.5849609375, -14.666015625, -13.7470703125, -12.828125, -11.9091796875, -10.990234375, -10.0712890625, -9.15234375, -8.2333984375, -7.314453125, -6.3955078125, -5.4765625, -4.5576171875, -3.638671875, -2.7197265625, -1.80078125, -0.8818359375, 0.037109375, 0.9560546875, 1.875, 2.7939453125, 3.712890625, 4.6318359375, 5.55078125, 6.4697265625, 7.388671875, 8.3076171875, 9.2265625, 10.1455078125, 11.064453125, 11.9833984375, 12.90234375, 13.8212890625, 14.740234375, 15.6591796875, 16.578125, 17.4970703125, 18.416015625, 19.3349609375, 20.25390625, 21.1728515625, 22.091796875, 23.0107421875, 23.9296875, 24.8486328125, 25.767578125, 26.6865234375, 27.60546875, 28.5244140625, 29.443359375, 30.3623046875, 31.28125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 13.0, 9.0, 12.0, 22.0, 31.0, 49.0, 100.0, 146.0, 267.0, 432.0, 983.0, 2235.0, 6011.0, 18059.0, 63369.0, 261488.0, 553748.0, 100501.0, 27031.0, 8411.0, 3090.0, 1236.0, 520.0, 305.0, 132.0, 103.0, 76.0, 52.0, 30.0, 18.0, 13.0, 11.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.744140625, -3.620025634765625, -3.49591064453125, -3.371795654296875, -3.2476806640625, -3.123565673828125, -2.99945068359375, -2.875335693359375, -2.751220703125, -2.627105712890625, -2.50299072265625, -2.378875732421875, -2.2547607421875, -2.130645751953125, -2.00653076171875, -1.882415771484375, -1.75830078125, -1.634185791015625, -1.51007080078125, -1.385955810546875, -1.2618408203125, -1.137725830078125, -1.01361083984375, -0.889495849609375, -0.765380859375, -0.641265869140625, -0.51715087890625, -0.393035888671875, -0.2689208984375, -0.144805908203125, -0.02069091796875, 0.103424072265625, 0.2275390625, 0.351654052734375, 0.47576904296875, 0.599884033203125, 0.7239990234375, 0.848114013671875, 0.97222900390625, 1.096343994140625, 1.220458984375, 1.344573974609375, 1.46868896484375, 1.592803955078125, 1.7169189453125, 1.841033935546875, 1.96514892578125, 2.089263916015625, 2.21337890625, 2.337493896484375, 2.46160888671875, 2.585723876953125, 2.7098388671875, 2.833953857421875, 2.95806884765625, 3.082183837890625, 3.206298828125, 3.330413818359375, 3.45452880859375, 3.578643798828125, 3.7027587890625, 3.826873779296875, 3.95098876953125, 4.075103759765625, 4.19921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 5.0, 17.0, 26.0, 45.0, 40.0, 76.0, 109.0, 133.0, 105.0, 116.0, 71.0, 56.0, 52.0, 37.0, 17.0, 17.0, 17.0, 11.0, 4.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0016069412231445312, -0.0015649795532226562, -0.0015230178833007812, -0.0014810562133789062, -0.0014390945434570312, -0.0013971328735351562, -0.0013551712036132812, -0.0013132095336914062, -0.0012712478637695312, -0.0012292861938476562, -0.0011873245239257812, -0.0011453628540039062, -0.0011034011840820312, -0.0010614395141601562, -0.0010194778442382812, -0.0009775161743164062, -0.0009355545043945312, -0.0008935928344726562, -0.0008516311645507812, -0.0008096694946289062, -0.0007677078247070312, -0.0007257461547851562, -0.0006837844848632812, -0.0006418228149414062, -0.0005998611450195312, -0.0005578994750976562, -0.0005159378051757812, -0.00047397613525390625, -0.00043201446533203125, -0.00039005279541015625, -0.00034809112548828125, -0.00030612945556640625, -0.00026416778564453125, -0.00022220611572265625, -0.00018024444580078125, -0.00013828277587890625, -9.632110595703125e-05, -5.435943603515625e-05, -1.239776611328125e-05, 2.956390380859375e-05, 7.152557373046875e-05, 0.00011348724365234375, 0.00015544891357421875, 0.00019741058349609375, 0.00023937225341796875, 0.00028133392333984375, 0.00032329559326171875, 0.00036525726318359375, 0.00040721893310546875, 0.00044918060302734375, 0.0004911422729492188, 0.0005331039428710938, 0.0005750656127929688, 0.0006170272827148438, 0.0006589889526367188, 0.0007009506225585938, 0.0007429122924804688, 0.0007848739624023438, 0.0008268356323242188, 0.0008687973022460938, 0.0009107589721679688, 0.0009527206420898438, 0.0009946823120117188, 0.0010366439819335938, 0.0010786056518554688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 2.0, 1.0, 6.0, 17.0, 14.0, 28.0, 55.0, 112.0, 198.0, 417.0, 946.0, 2824.0, 11237.0, 70192.0, 669841.0, 252526.0, 31086.0, 6070.0, 1741.0, 623.0, 299.0, 125.0, 78.0, 45.0, 26.0, 15.0, 14.0, 5.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.86279296875, -5.6591796875, -5.45556640625, -5.251953125, -5.04833984375, -4.8447265625, -4.64111328125, -4.4375, -4.23388671875, -4.0302734375, -3.82666015625, -3.623046875, -3.41943359375, -3.2158203125, -3.01220703125, -2.80859375, -2.60498046875, -2.4013671875, -2.19775390625, -1.994140625, -1.79052734375, -1.5869140625, -1.38330078125, -1.1796875, -0.97607421875, -0.7724609375, -0.56884765625, -0.365234375, -0.16162109375, 0.0419921875, 0.24560546875, 0.44921875, 0.65283203125, 0.8564453125, 1.06005859375, 1.263671875, 1.46728515625, 1.6708984375, 1.87451171875, 2.078125, 2.28173828125, 2.4853515625, 2.68896484375, 2.892578125, 3.09619140625, 3.2998046875, 3.50341796875, 3.70703125, 3.91064453125, 4.1142578125, 4.31787109375, 4.521484375, 4.72509765625, 4.9287109375, 5.13232421875, 5.3359375, 5.53955078125, 5.7431640625, 5.94677734375, 6.150390625, 6.35400390625, 6.5576171875, 6.76123046875, 6.96484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 9.0, 9.0, 11.0, 17.0, 24.0, 38.0, 57.0, 63.0, 92.0, 99.0, 129.0, 122.0, 90.0, 65.0, 60.0, 34.0, 23.0, 17.0, 15.0, 9.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5078125, -7.28411865234375, -7.0604248046875, -6.83673095703125, -6.613037109375, -6.38934326171875, -6.1656494140625, -5.94195556640625, -5.71826171875, -5.49456787109375, -5.2708740234375, -5.04718017578125, -4.823486328125, -4.59979248046875, -4.3760986328125, -4.15240478515625, -3.9287109375, -3.70501708984375, -3.4813232421875, -3.25762939453125, -3.033935546875, -2.81024169921875, -2.5865478515625, -2.36285400390625, -2.13916015625, -1.91546630859375, -1.6917724609375, -1.46807861328125, -1.244384765625, -1.02069091796875, -0.7969970703125, -0.57330322265625, -0.349609375, -0.12591552734375, 0.0977783203125, 0.32147216796875, 0.545166015625, 0.76885986328125, 0.9925537109375, 1.21624755859375, 1.43994140625, 1.66363525390625, 1.8873291015625, 2.11102294921875, 2.334716796875, 2.55841064453125, 2.7821044921875, 3.00579833984375, 3.2294921875, 3.45318603515625, 3.6768798828125, 3.90057373046875, 4.124267578125, 4.34796142578125, 4.5716552734375, 4.79534912109375, 5.01904296875, 5.24273681640625, 5.4664306640625, 5.69012451171875, 5.913818359375, 6.13751220703125, 6.3612060546875, 6.58489990234375, 6.80859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 25.0, 42.0, 94.0, 206.0, 330.0, 145.0, 72.0, 39.0, 15.0, 9.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.6329650878906, -267.60498046875, -261.5769958496094, -255.5490264892578, -249.5210418701172, -243.49307250976562, -237.465087890625, -231.43710327148438, -225.4091339111328, -219.3811492919922, -213.35317993164062, -207.3251953125, -201.29721069335938, -195.2692413330078, -189.2412567138672, -183.21328735351562, -177.185302734375, -171.15731811523438, -165.1293487548828, -159.1013641357422, -153.07337951660156, -147.04541015625, -141.01742553710938, -134.98944091796875, -128.96145629882812, -122.93347930908203, -116.9054946899414, -110.87751770019531, -104.84954071044922, -98.82156372070312, -92.7935791015625, -86.7656021118164, -80.73762512207031, -74.70964813232422, -68.6816635131836, -62.6536865234375, -56.625709533691406, -50.59772872924805, -44.56974792480469, -38.541770935058594, -32.513790130615234, -26.485811233520508, -20.45783233642578, -14.429851531982422, -8.401872634887695, -2.3738937377929688, 3.6540870666503906, 9.682064056396484, 15.710044860839844, 21.73802375793457, 27.766002655029297, 33.793983459472656, 39.82196044921875, 45.84994125366211, 51.87792205810547, 57.90589904785156, 63.93387985229492, 69.96186065673828, 75.98983764648438, 82.017822265625, 88.0457992553711, 94.07377624511719, 100.10176086425781, 106.12973022460938, 112.15771484375]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 3.0, 7.0, 9.0, 12.0, 10.0, 16.0, 21.0, 16.0, 17.0, 26.0, 21.0, 19.0, 33.0, 36.0, 41.0, 62.0, 72.0, 67.0, 51.0, 68.0, 46.0, 40.0, 34.0, 38.0, 22.0, 27.0, 23.0, 22.0, 16.0, 21.0, 12.0, 14.0, 7.0, 8.0, 8.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-108.47959899902344, -105.140380859375, -101.80115509033203, -98.4619369506836, -95.12271118164062, -91.78349304199219, -88.44427490234375, -85.10505676269531, -81.76583099365234, -78.4266128540039, -75.08738708496094, -71.7481689453125, -68.40895080566406, -65.0697250366211, -61.730506896972656, -58.39128494262695, -55.05206298828125, -51.71284103393555, -48.373619079589844, -45.034400939941406, -41.6951789855957, -38.35595703125, -35.01673889160156, -31.67751693725586, -28.338294982910156, -24.999073028564453, -21.659852981567383, -18.320632934570312, -14.98141098022461, -11.642189025878906, -8.302968978881836, -4.963748931884766, -1.6245269775390625, 1.7146940231323242, 5.053915023803711, 8.393136024475098, 11.732357025146484, 15.071578979492188, 18.410799026489258, 21.750019073486328, 25.08924102783203, 28.428462982177734, 31.767683029174805, 35.106903076171875, 38.44612503051758, 41.78534698486328, 45.12456512451172, 48.46378707885742, 51.803009033203125, 55.14223098754883, 58.48145294189453, 61.82067108154297, 65.15989685058594, 68.49911499023438, 71.83833312988281, 75.17755126953125, 78.51677703857422, 81.85599517822266, 85.19522094726562, 88.53443908691406, 91.8736572265625, 95.21288299560547, 98.5521011352539, 101.89132690429688, 105.23054504394531]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 14.0, 18.0, 25.0, 27.0, 30.0, 63.0, 91.0, 134.0, 223.0, 373.0, 592.0, 1019.0, 2001.0, 4411.0, 9859.0, 25493.0, 83961.0, 340662.0, 1289639.0, 1707301.0, 540164.0, 128724.0, 36343.0, 12671.0, 4990.0, 2342.0, 1216.0, 695.0, 412.0, 268.0, 150.0, 99.0, 75.0, 63.0, 37.0, 23.0, 12.0, 10.0, 6.0, 11.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.24090576171875, -5.0325927734375, -4.82427978515625, -4.615966796875, -4.40765380859375, -4.1993408203125, -3.99102783203125, -3.78271484375, -3.57440185546875, -3.3660888671875, -3.15777587890625, -2.949462890625, -2.74114990234375, -2.5328369140625, -2.32452392578125, -2.1162109375, -1.90789794921875, -1.6995849609375, -1.49127197265625, -1.282958984375, -1.07464599609375, -0.8663330078125, -0.65802001953125, -0.44970703125, -0.24139404296875, -0.0330810546875, 0.17523193359375, 0.383544921875, 0.59185791015625, 0.8001708984375, 1.00848388671875, 1.216796875, 1.42510986328125, 1.6334228515625, 1.84173583984375, 2.050048828125, 2.25836181640625, 2.4666748046875, 2.67498779296875, 2.88330078125, 3.09161376953125, 3.2999267578125, 3.50823974609375, 3.716552734375, 3.92486572265625, 4.1331787109375, 4.34149169921875, 4.5498046875, 4.75811767578125, 4.9664306640625, 5.17474365234375, 5.383056640625, 5.59136962890625, 5.7996826171875, 6.00799560546875, 6.21630859375, 6.42462158203125, 6.6329345703125, 6.84124755859375, 7.049560546875, 7.25787353515625, 7.4661865234375, 7.67449951171875, 7.8828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 9.0, 10.0, 11.0, 17.0, 24.0, 28.0, 32.0, 54.0, 41.0, 45.0, 46.0, 59.0, 53.0, 55.0, 48.0, 50.0, 42.0, 55.0, 51.0, 45.0, 37.0, 35.0, 39.0, 20.0, 22.0, 12.0, 18.0, 5.0, 13.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.984375, -8.68798828125, -8.3916015625, -8.09521484375, -7.798828125, -7.50244140625, -7.2060546875, -6.90966796875, -6.61328125, -6.31689453125, -6.0205078125, -5.72412109375, -5.427734375, -5.13134765625, -4.8349609375, -4.53857421875, -4.2421875, -3.94580078125, -3.6494140625, -3.35302734375, -3.056640625, -2.76025390625, -2.4638671875, -2.16748046875, -1.87109375, -1.57470703125, -1.2783203125, -0.98193359375, -0.685546875, -0.38916015625, -0.0927734375, 0.20361328125, 0.5, 0.79638671875, 1.0927734375, 1.38916015625, 1.685546875, 1.98193359375, 2.2783203125, 2.57470703125, 2.87109375, 3.16748046875, 3.4638671875, 3.76025390625, 4.056640625, 4.35302734375, 4.6494140625, 4.94580078125, 5.2421875, 5.53857421875, 5.8349609375, 6.13134765625, 6.427734375, 6.72412109375, 7.0205078125, 7.31689453125, 7.61328125, 7.90966796875, 8.2060546875, 8.50244140625, 8.798828125, 9.09521484375, 9.3916015625, 9.68798828125, 9.984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 9.0, 5.0, 4.0, 9.0, 17.0, 16.0, 39.0, 35.0, 88.0, 144.0, 277.0, 792.0, 2901.0, 16450.0, 260780.0, 3720156.0, 175190.0, 13492.0, 2549.0, 716.0, 279.0, 125.0, 83.0, 35.0, 32.0, 17.0, 7.0, 14.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -17.916259765625, -17.23876953125, -16.561279296875, -15.8837890625, -15.206298828125, -14.52880859375, -13.851318359375, -13.173828125, -12.496337890625, -11.81884765625, -11.141357421875, -10.4638671875, -9.786376953125, -9.10888671875, -8.431396484375, -7.75390625, -7.076416015625, -6.39892578125, -5.721435546875, -5.0439453125, -4.366455078125, -3.68896484375, -3.011474609375, -2.333984375, -1.656494140625, -0.97900390625, -0.301513671875, 0.3759765625, 1.053466796875, 1.73095703125, 2.408447265625, 3.0859375, 3.763427734375, 4.44091796875, 5.118408203125, 5.7958984375, 6.473388671875, 7.15087890625, 7.828369140625, 8.505859375, 9.183349609375, 9.86083984375, 10.538330078125, 11.2158203125, 11.893310546875, 12.57080078125, 13.248291015625, 13.92578125, 14.603271484375, 15.28076171875, 15.958251953125, 16.6357421875, 17.313232421875, 17.99072265625, 18.668212890625, 19.345703125, 20.023193359375, 20.70068359375, 21.378173828125, 22.0556640625, 22.733154296875, 23.41064453125, 24.088134765625, 24.765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 6.0, 14.0, 17.0, 43.0, 38.0, 73.0, 138.0, 238.0, 371.0, 634.0, 803.0, 628.0, 451.0, 226.0, 138.0, 80.0, 49.0, 37.0, 25.0, 19.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8125, -20.258056640625, -19.70361328125, -19.149169921875, -18.5947265625, -18.040283203125, -17.48583984375, -16.931396484375, -16.376953125, -15.822509765625, -15.26806640625, -14.713623046875, -14.1591796875, -13.604736328125, -13.05029296875, -12.495849609375, -11.94140625, -11.386962890625, -10.83251953125, -10.278076171875, -9.7236328125, -9.169189453125, -8.61474609375, -8.060302734375, -7.505859375, -6.951416015625, -6.39697265625, -5.842529296875, -5.2880859375, -4.733642578125, -4.17919921875, -3.624755859375, -3.0703125, -2.515869140625, -1.96142578125, -1.406982421875, -0.8525390625, -0.298095703125, 0.25634765625, 0.810791015625, 1.365234375, 1.919677734375, 2.47412109375, 3.028564453125, 3.5830078125, 4.137451171875, 4.69189453125, 5.246337890625, 5.80078125, 6.355224609375, 6.90966796875, 7.464111328125, 8.0185546875, 8.572998046875, 9.12744140625, 9.681884765625, 10.236328125, 10.790771484375, 11.34521484375, 11.899658203125, 12.4541015625, 13.008544921875, 13.56298828125, 14.117431640625, 14.671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 15.0, 21.0, 96.0, 226.0, 299.0, 217.0, 74.0, 32.0, 9.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-325.6950988769531, -318.8290100097656, -311.9629211425781, -305.0968322753906, -298.2307434082031, -291.3646545410156, -284.4985656738281, -277.6324768066406, -270.7663879394531, -263.9002990722656, -257.0342102050781, -250.16812133789062, -243.30203247070312, -236.43594360351562, -229.56985473632812, -222.70376586914062, -215.83766174316406, -208.97157287597656, -202.10548400878906, -195.23939514160156, -188.37330627441406, -181.50721740722656, -174.64111328125, -167.7750244140625, -160.908935546875, -154.0428466796875, -147.1767578125, -140.3106689453125, -133.444580078125, -126.5784912109375, -119.71239471435547, -112.84630584716797, -105.980224609375, -99.1141357421875, -92.248046875, -85.3819580078125, -78.515869140625, -71.6497802734375, -64.78368377685547, -57.91759490966797, -51.05150604248047, -44.18541717529297, -37.31932830810547, -30.453235626220703, -23.587146759033203, -16.721057891845703, -9.854965209960938, -2.9888763427734375, 3.8772125244140625, 10.743302345275879, 17.609392166137695, 24.475482940673828, 31.341571807861328, 38.20766067504883, 45.073753356933594, 51.939842224121094, 58.805931091308594, 65.6720199584961, 72.5381088256836, 79.40420532226562, 86.27029418945312, 93.13638305664062, 100.00247192382812, 106.86856079101562, 113.73464965820312]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 11.0, 14.0, 11.0, 15.0, 20.0, 21.0, 20.0, 32.0, 30.0, 36.0, 40.0, 44.0, 48.0, 43.0, 55.0, 56.0, 32.0, 45.0, 50.0, 53.0, 46.0, 38.0, 34.0, 29.0, 16.0, 21.0, 17.0, 17.0, 19.0, 14.0, 11.0, 14.0, 8.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.91127014160156, -55.9961051940918, -54.080936431884766, -52.165771484375, -50.250606536865234, -48.33544158935547, -46.42027282714844, -44.50510787963867, -42.589942932128906, -40.67477798461914, -38.75960922241211, -36.844444274902344, -34.92927932739258, -33.01411437988281, -31.09894561767578, -29.183780670166016, -27.268611907958984, -25.353445053100586, -23.43828010559082, -21.523113250732422, -19.607948303222656, -17.692781448364258, -15.77761459350586, -13.862448692321777, -11.947282791137695, -10.032116889953613, -8.116950988769531, -6.201784133911133, -4.286618232727051, -2.3714523315429688, -0.4562854766845703, 1.4588804244995117, 3.3740463256835938, 5.289212226867676, 7.204378604888916, 9.119544982910156, 11.034710884094238, 12.94987678527832, 14.865043640136719, 16.780208587646484, 18.695375442504883, 20.61054229736328, 22.525707244873047, 24.440874099731445, 26.356040954589844, 28.27120590209961, 30.186372756958008, 32.101539611816406, 34.01670455932617, 35.93186950683594, 37.84703826904297, 39.762203216552734, 41.6773681640625, 43.59253692626953, 45.5077018737793, 47.42286682128906, 49.338035583496094, 51.25320053100586, 53.16836929321289, 55.083534240722656, 56.99869918823242, 58.91386413574219, 60.82903289794922, 62.744197845458984, 64.65936279296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 16.0, 29.0, 42.0, 72.0, 99.0, 213.0, 342.0, 656.0, 1280.0, 2586.0, 5932.0, 14303.0, 39920.0, 121516.0, 337337.0, 336265.0, 121899.0, 39984.0, 14728.0, 5977.0, 2577.0, 1213.0, 687.0, 338.0, 203.0, 127.0, 68.0, 43.0, 33.0, 17.0, 12.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.661376953125, -8.31494140625, -7.968505859375, -7.6220703125, -7.275634765625, -6.92919921875, -6.582763671875, -6.236328125, -5.889892578125, -5.54345703125, -5.197021484375, -4.8505859375, -4.504150390625, -4.15771484375, -3.811279296875, -3.46484375, -3.118408203125, -2.77197265625, -2.425537109375, -2.0791015625, -1.732666015625, -1.38623046875, -1.039794921875, -0.693359375, -0.346923828125, -0.00048828125, 0.345947265625, 0.6923828125, 1.038818359375, 1.38525390625, 1.731689453125, 2.078125, 2.424560546875, 2.77099609375, 3.117431640625, 3.4638671875, 3.810302734375, 4.15673828125, 4.503173828125, 4.849609375, 5.196044921875, 5.54248046875, 5.888916015625, 6.2353515625, 6.581787109375, 6.92822265625, 7.274658203125, 7.62109375, 7.967529296875, 8.31396484375, 8.660400390625, 9.0068359375, 9.353271484375, 9.69970703125, 10.046142578125, 10.392578125, 10.739013671875, 11.08544921875, 11.431884765625, 11.7783203125, 12.124755859375, 12.47119140625, 12.817626953125, 13.1640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 9.0, 9.0, 7.0, 10.0, 12.0, 22.0, 23.0, 28.0, 30.0, 29.0, 40.0, 50.0, 45.0, 59.0, 41.0, 52.0, 64.0, 60.0, 56.0, 46.0, 39.0, 50.0, 42.0, 37.0, 28.0, 25.0, 21.0, 13.0, 12.0, 12.0, 5.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0546875, -8.75732421875, -8.4599609375, -8.16259765625, -7.865234375, -7.56787109375, -7.2705078125, -6.97314453125, -6.67578125, -6.37841796875, -6.0810546875, -5.78369140625, -5.486328125, -5.18896484375, -4.8916015625, -4.59423828125, -4.296875, -3.99951171875, -3.7021484375, -3.40478515625, -3.107421875, -2.81005859375, -2.5126953125, -2.21533203125, -1.91796875, -1.62060546875, -1.3232421875, -1.02587890625, -0.728515625, -0.43115234375, -0.1337890625, 0.16357421875, 0.4609375, 0.75830078125, 1.0556640625, 1.35302734375, 1.650390625, 1.94775390625, 2.2451171875, 2.54248046875, 2.83984375, 3.13720703125, 3.4345703125, 3.73193359375, 4.029296875, 4.32666015625, 4.6240234375, 4.92138671875, 5.21875, 5.51611328125, 5.8134765625, 6.11083984375, 6.408203125, 6.70556640625, 7.0029296875, 7.30029296875, 7.59765625, 7.89501953125, 8.1923828125, 8.48974609375, 8.787109375, 9.08447265625, 9.3818359375, 9.67919921875, 9.9765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 7.0, 14.0, 12.0, 19.0, 32.0, 39.0, 71.0, 127.0, 173.0, 290.0, 432.0, 800.0, 1654.0, 4609.0, 18706.0, 122638.0, 740826.0, 130261.0, 19539.0, 4582.0, 1669.0, 788.0, 457.0, 293.0, 173.0, 111.0, 69.0, 52.0, 37.0, 19.0, 22.0, 16.0, 6.0, 3.0, 8.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.5789794921875, -13.931396484375, -13.2838134765625, -12.63623046875, -11.9886474609375, -11.341064453125, -10.6934814453125, -10.0458984375, -9.3983154296875, -8.750732421875, -8.1031494140625, -7.45556640625, -6.8079833984375, -6.160400390625, -5.5128173828125, -4.865234375, -4.2176513671875, -3.570068359375, -2.9224853515625, -2.27490234375, -1.6273193359375, -0.979736328125, -0.3321533203125, 0.3154296875, 0.9630126953125, 1.610595703125, 2.2581787109375, 2.90576171875, 3.5533447265625, 4.200927734375, 4.8485107421875, 5.49609375, 6.1436767578125, 6.791259765625, 7.4388427734375, 8.08642578125, 8.7340087890625, 9.381591796875, 10.0291748046875, 10.6767578125, 11.3243408203125, 11.971923828125, 12.6195068359375, 13.26708984375, 13.9146728515625, 14.562255859375, 15.2098388671875, 15.857421875, 16.5050048828125, 17.152587890625, 17.8001708984375, 18.44775390625, 19.0953369140625, 19.742919921875, 20.3905029296875, 21.0380859375, 21.6856689453125, 22.333251953125, 22.9808349609375, 23.62841796875, 24.2760009765625, 24.923583984375, 25.5711669921875, 26.21875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 10.0, 7.0, 16.0, 15.0, 23.0, 22.0, 28.0, 34.0, 31.0, 47.0, 40.0, 43.0, 41.0, 54.0, 42.0, 60.0, 61.0, 50.0, 49.0, 47.0, 41.0, 35.0, 28.0, 26.0, 32.0, 23.0, 20.0, 15.0, 16.0, 10.0, 8.0, 5.0, 1.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -21.690673828125, -20.77197265625, -19.853271484375, -18.9345703125, -18.015869140625, -17.09716796875, -16.178466796875, -15.259765625, -14.341064453125, -13.42236328125, -12.503662109375, -11.5849609375, -10.666259765625, -9.74755859375, -8.828857421875, -7.91015625, -6.991455078125, -6.07275390625, -5.154052734375, -4.2353515625, -3.316650390625, -2.39794921875, -1.479248046875, -0.560546875, 0.358154296875, 1.27685546875, 2.195556640625, 3.1142578125, 4.032958984375, 4.95166015625, 5.870361328125, 6.7890625, 7.707763671875, 8.62646484375, 9.545166015625, 10.4638671875, 11.382568359375, 12.30126953125, 13.219970703125, 14.138671875, 15.057373046875, 15.97607421875, 16.894775390625, 17.8134765625, 18.732177734375, 19.65087890625, 20.569580078125, 21.48828125, 22.406982421875, 23.32568359375, 24.244384765625, 25.1630859375, 26.081787109375, 27.00048828125, 27.919189453125, 28.837890625, 29.756591796875, 30.67529296875, 31.593994140625, 32.5126953125, 33.431396484375, 34.35009765625, 35.268798828125, 36.1875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 1.0, 4.0, 6.0, 8.0, 15.0, 16.0, 21.0, 36.0, 91.0, 158.0, 345.0, 842.0, 2101.0, 6178.0, 23996.0, 151029.0, 762978.0, 78377.0, 15215.0, 4357.0, 1558.0, 611.0, 280.0, 130.0, 84.0, 37.0, 23.0, 9.0, 14.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.62109375, -5.4705810546875, -5.320068359375, -5.1695556640625, -5.01904296875, -4.8685302734375, -4.718017578125, -4.5675048828125, -4.4169921875, -4.2664794921875, -4.115966796875, -3.9654541015625, -3.81494140625, -3.6644287109375, -3.513916015625, -3.3634033203125, -3.212890625, -3.0623779296875, -2.911865234375, -2.7613525390625, -2.61083984375, -2.4603271484375, -2.309814453125, -2.1593017578125, -2.0087890625, -1.8582763671875, -1.707763671875, -1.5572509765625, -1.40673828125, -1.2562255859375, -1.105712890625, -0.9552001953125, -0.8046875, -0.6541748046875, -0.503662109375, -0.3531494140625, -0.20263671875, -0.0521240234375, 0.098388671875, 0.2489013671875, 0.3994140625, 0.5499267578125, 0.700439453125, 0.8509521484375, 1.00146484375, 1.1519775390625, 1.302490234375, 1.4530029296875, 1.603515625, 1.7540283203125, 1.904541015625, 2.0550537109375, 2.20556640625, 2.3560791015625, 2.506591796875, 2.6571044921875, 2.8076171875, 2.9581298828125, 3.108642578125, 3.2591552734375, 3.40966796875, 3.5601806640625, 3.710693359375, 3.8612060546875, 4.01171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 8.0, 2.0, 8.0, 13.0, 18.0, 33.0, 38.0, 50.0, 72.0, 131.0, 148.0, 133.0, 106.0, 67.0, 41.0, 25.0, 17.0, 19.0, 17.0, 6.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0014715194702148438, -0.0014325082302093506, -0.0013934969902038574, -0.0013544857501983643, -0.001315474510192871, -0.001276463270187378, -0.0012374520301818848, -0.0011984407901763916, -0.0011594295501708984, -0.0011204183101654053, -0.0010814070701599121, -0.001042395830154419, -0.0010033845901489258, -0.0009643733501434326, -0.0009253621101379395, -0.0008863508701324463, -0.0008473396301269531, -0.00080832839012146, -0.0007693171501159668, -0.0007303059101104736, -0.0006912946701049805, -0.0006522834300994873, -0.0006132721900939941, -0.000574260950088501, -0.0005352497100830078, -0.0004962384700775146, -0.0004572272300720215, -0.0004182159900665283, -0.00037920475006103516, -0.000340193510055542, -0.00030118227005004883, -0.00026217103004455566, -0.0002231597900390625, -0.00018414855003356934, -0.00014513731002807617, -0.00010612607002258301, -6.711483001708984e-05, -2.810359001159668e-05, 1.0907649993896484e-05, 4.991888999938965e-05, 8.893013000488281e-05, 0.00012794137001037598, 0.00016695261001586914, 0.0002059638500213623, 0.00024497509002685547, 0.00028398633003234863, 0.0003229975700378418, 0.00036200881004333496, 0.0004010200500488281, 0.0004400312900543213, 0.00047904253005981445, 0.0005180537700653076, 0.0005570650100708008, 0.0005960762500762939, 0.0006350874900817871, 0.0006740987300872803, 0.0007131099700927734, 0.0007521212100982666, 0.0007911324501037598, 0.0008301436901092529, 0.0008691549301147461, 0.0009081661701202393, 0.0009471774101257324, 0.0009861886501312256, 0.0010251998901367188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 24.0, 28.0, 46.0, 51.0, 113.0, 153.0, 276.0, 493.0, 994.0, 2118.0, 5259.0, 16172.0, 61946.0, 561915.0, 320710.0, 54478.0, 14680.0, 4921.0, 2018.0, 921.0, 518.0, 264.0, 160.0, 97.0, 59.0, 38.0, 30.0, 16.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.33984375, -4.2156982421875, -4.091552734375, -3.9674072265625, -3.84326171875, -3.7191162109375, -3.594970703125, -3.4708251953125, -3.3466796875, -3.2225341796875, -3.098388671875, -2.9742431640625, -2.85009765625, -2.7259521484375, -2.601806640625, -2.4776611328125, -2.353515625, -2.2293701171875, -2.105224609375, -1.9810791015625, -1.85693359375, -1.7327880859375, -1.608642578125, -1.4844970703125, -1.3603515625, -1.2362060546875, -1.112060546875, -0.9879150390625, -0.86376953125, -0.7396240234375, -0.615478515625, -0.4913330078125, -0.3671875, -0.2430419921875, -0.118896484375, 0.0052490234375, 0.12939453125, 0.2535400390625, 0.377685546875, 0.5018310546875, 0.6259765625, 0.7501220703125, 0.874267578125, 0.9984130859375, 1.12255859375, 1.2467041015625, 1.370849609375, 1.4949951171875, 1.619140625, 1.7432861328125, 1.867431640625, 1.9915771484375, 2.11572265625, 2.2398681640625, 2.364013671875, 2.4881591796875, 2.6123046875, 2.7364501953125, 2.860595703125, 2.9847412109375, 3.10888671875, 3.2330322265625, 3.357177734375, 3.4813232421875, 3.60546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 1.0, 4.0, 8.0, 9.0, 23.0, 28.0, 33.0, 56.0, 85.0, 115.0, 146.0, 136.0, 109.0, 81.0, 48.0, 39.0, 23.0, 9.0, 7.0, 9.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.703125, -6.525390625, -6.34765625, -6.169921875, -5.9921875, -5.814453125, -5.63671875, -5.458984375, -5.28125, -5.103515625, -4.92578125, -4.748046875, -4.5703125, -4.392578125, -4.21484375, -4.037109375, -3.859375, -3.681640625, -3.50390625, -3.326171875, -3.1484375, -2.970703125, -2.79296875, -2.615234375, -2.4375, -2.259765625, -2.08203125, -1.904296875, -1.7265625, -1.548828125, -1.37109375, -1.193359375, -1.015625, -0.837890625, -0.66015625, -0.482421875, -0.3046875, -0.126953125, 0.05078125, 0.228515625, 0.40625, 0.583984375, 0.76171875, 0.939453125, 1.1171875, 1.294921875, 1.47265625, 1.650390625, 1.828125, 2.005859375, 2.18359375, 2.361328125, 2.5390625, 2.716796875, 2.89453125, 3.072265625, 3.25, 3.427734375, 3.60546875, 3.783203125, 3.9609375, 4.138671875, 4.31640625, 4.494140625, 4.671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 4.0, 9.0, 8.0, 21.0, 34.0, 43.0, 67.0, 95.0, 224.0, 182.0, 96.0, 65.0, 52.0, 27.0, 13.0, 12.0, 6.0, 12.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-89.23074340820312, -86.33560943603516, -83.44047546386719, -80.54533386230469, -77.65019989013672, -74.75506591796875, -71.85993194580078, -68.96479797363281, -66.06965637207031, -63.174522399902344, -60.27938461303711, -57.38425064086914, -54.489112854003906, -51.59397888183594, -48.69884490966797, -45.803707122802734, -42.908573150634766, -40.0134391784668, -37.11830139160156, -34.223167419433594, -31.32802963256836, -28.43289566040039, -25.53775978088379, -22.642623901367188, -19.747488021850586, -16.852352142333984, -13.957216262817383, -11.062081336975098, -8.166945457458496, -5.2718095779418945, -2.3766746520996094, 0.5184612274169922, 3.4135971069335938, 6.308732986450195, 9.203868865966797, 12.099003791809082, 14.994139671325684, 17.88927459716797, 20.78441047668457, 23.679546356201172, 26.574682235717773, 29.469818115234375, 32.364952087402344, 35.26008987426758, 38.15522384643555, 41.05036163330078, 43.94549560546875, 46.84062957763672, 49.73576736450195, 52.63090133666992, 55.526039123535156, 58.421173095703125, 61.31631088256836, 64.2114486694336, 67.10658264160156, 70.00171661376953, 72.8968505859375, 75.79198455810547, 78.68711853027344, 81.58226013183594, 84.4773941040039, 87.37252807617188, 90.26766204833984, 93.16279602050781, 96.05793762207031]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 2.0, 9.0, 8.0, 13.0, 17.0, 16.0, 43.0, 35.0, 42.0, 33.0, 52.0, 39.0, 87.0, 128.0, 104.0, 61.0, 52.0, 37.0, 36.0, 38.0, 21.0, 27.0, 20.0, 16.0, 12.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-130.162353515625, -126.38253784179688, -122.60272216796875, -118.82291412353516, -115.04309844970703, -111.2632827758789, -107.48346710205078, -103.70365905761719, -99.92384338378906, -96.14402770996094, -92.36421203613281, -88.58440399169922, -84.8045883178711, -81.02477264404297, -77.24495697021484, -73.46514892578125, -69.68533325195312, -65.905517578125, -62.12570571899414, -58.345890045166016, -54.566078186035156, -50.78626251220703, -47.006446838378906, -43.22663497924805, -39.446815490722656, -35.66699981689453, -31.887187957763672, -28.107372283935547, -24.327560424804688, -20.547744750976562, -16.76793098449707, -12.988117218017578, -9.208305358886719, -5.428491592407227, -1.6486773490905762, 2.131136894226074, 5.910950660705566, 9.690765380859375, 13.470579147338867, 17.25039291381836, 21.03020668029785, 24.810020446777344, 28.589834213256836, 32.36964797973633, 36.14946365356445, 39.92927551269531, 43.70909118652344, 47.48890686035156, 51.26871871948242, 55.04853439331055, 58.828346252441406, 62.60816192626953, 66.38797760009766, 70.16778564453125, 73.94760131835938, 77.7274169921875, 81.50723266601562, 85.28704833984375, 89.06686401367188, 92.84667205810547, 96.6264877319336, 100.40630340576172, 104.18611907958984, 107.96592712402344, 111.74574279785156]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 15.0, 16.0, 18.0, 29.0, 47.0, 83.0, 123.0, 172.0, 304.0, 535.0, 943.0, 1585.0, 2923.0, 5735.0, 11126.0, 23505.0, 55470.0, 152259.0, 467652.0, 1228336.0, 1364614.0, 571907.0, 190445.0, 65875.0, 26120.0, 11771.0, 5710.0, 2974.0, 1621.0, 857.0, 580.0, 314.0, 204.0, 139.0, 89.0, 60.0, 39.0, 24.0, 18.0, 11.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.921875, -4.74664306640625, -4.5714111328125, -4.39617919921875, -4.220947265625, -4.04571533203125, -3.8704833984375, -3.69525146484375, -3.52001953125, -3.34478759765625, -3.1695556640625, -2.99432373046875, -2.819091796875, -2.64385986328125, -2.4686279296875, -2.29339599609375, -2.1181640625, -1.94293212890625, -1.7677001953125, -1.59246826171875, -1.417236328125, -1.24200439453125, -1.0667724609375, -0.89154052734375, -0.71630859375, -0.54107666015625, -0.3658447265625, -0.19061279296875, -0.015380859375, 0.15985107421875, 0.3350830078125, 0.51031494140625, 0.685546875, 0.86077880859375, 1.0360107421875, 1.21124267578125, 1.386474609375, 1.56170654296875, 1.7369384765625, 1.91217041015625, 2.08740234375, 2.26263427734375, 2.4378662109375, 2.61309814453125, 2.788330078125, 2.96356201171875, 3.1387939453125, 3.31402587890625, 3.4892578125, 3.66448974609375, 3.8397216796875, 4.01495361328125, 4.190185546875, 4.36541748046875, 4.5406494140625, 4.71588134765625, 4.89111328125, 5.06634521484375, 5.2415771484375, 5.41680908203125, 5.592041015625, 5.76727294921875, 5.9425048828125, 6.11773681640625, 6.29296875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 8.0, 4.0, 5.0, 10.0, 17.0, 18.0, 15.0, 29.0, 31.0, 38.0, 45.0, 47.0, 52.0, 61.0, 67.0, 59.0, 49.0, 55.0, 44.0, 59.0, 63.0, 48.0, 37.0, 40.0, 20.0, 27.0, 14.0, 13.0, 10.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8153076171875, -8.513427734375, -8.2115478515625, -7.90966796875, -7.6077880859375, -7.305908203125, -7.0040283203125, -6.7021484375, -6.4002685546875, -6.098388671875, -5.7965087890625, -5.49462890625, -5.1927490234375, -4.890869140625, -4.5889892578125, -4.287109375, -3.9852294921875, -3.683349609375, -3.3814697265625, -3.07958984375, -2.7777099609375, -2.475830078125, -2.1739501953125, -1.8720703125, -1.5701904296875, -1.268310546875, -0.9664306640625, -0.66455078125, -0.3626708984375, -0.060791015625, 0.2410888671875, 0.54296875, 0.8448486328125, 1.146728515625, 1.4486083984375, 1.75048828125, 2.0523681640625, 2.354248046875, 2.6561279296875, 2.9580078125, 3.2598876953125, 3.561767578125, 3.8636474609375, 4.16552734375, 4.4674072265625, 4.769287109375, 5.0711669921875, 5.373046875, 5.6749267578125, 5.976806640625, 6.2786865234375, 6.58056640625, 6.8824462890625, 7.184326171875, 7.4862060546875, 7.7880859375, 8.0899658203125, 8.391845703125, 8.6937255859375, 8.99560546875, 9.2974853515625, 9.599365234375, 9.9012451171875, 10.203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 11.0, 9.0, 10.0, 21.0, 27.0, 41.0, 51.0, 93.0, 99.0, 211.0, 424.0, 1111.0, 4124.0, 21850.0, 278432.0, 3553116.0, 305204.0, 23229.0, 4138.0, 1098.0, 406.0, 221.0, 86.0, 79.0, 57.0, 35.0, 21.0, 19.0, 17.0, 5.0, 3.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-20.328125, -19.7862548828125, -19.244384765625, -18.7025146484375, -18.16064453125, -17.6187744140625, -17.076904296875, -16.5350341796875, -15.9931640625, -15.4512939453125, -14.909423828125, -14.3675537109375, -13.82568359375, -13.2838134765625, -12.741943359375, -12.2000732421875, -11.658203125, -11.1163330078125, -10.574462890625, -10.0325927734375, -9.49072265625, -8.9488525390625, -8.406982421875, -7.8651123046875, -7.3232421875, -6.7813720703125, -6.239501953125, -5.6976318359375, -5.15576171875, -4.6138916015625, -4.072021484375, -3.5301513671875, -2.98828125, -2.4464111328125, -1.904541015625, -1.3626708984375, -0.82080078125, -0.2789306640625, 0.262939453125, 0.8048095703125, 1.3466796875, 1.8885498046875, 2.430419921875, 2.9722900390625, 3.51416015625, 4.0560302734375, 4.597900390625, 5.1397705078125, 5.681640625, 6.2235107421875, 6.765380859375, 7.3072509765625, 7.84912109375, 8.3909912109375, 8.932861328125, 9.4747314453125, 10.0166015625, 10.5584716796875, 11.100341796875, 11.6422119140625, 12.18408203125, 12.7259521484375, 13.267822265625, 13.8096923828125, 14.3515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 5.0, 9.0, 18.0, 9.0, 10.0, 21.0, 35.0, 51.0, 55.0, 79.0, 101.0, 150.0, 197.0, 358.0, 436.0, 516.0, 505.0, 416.0, 340.0, 226.0, 149.0, 93.0, 68.0, 64.0, 35.0, 24.0, 23.0, 8.0, 19.0, 6.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.046875, -13.6575927734375, -13.268310546875, -12.8790283203125, -12.48974609375, -12.1004638671875, -11.711181640625, -11.3218994140625, -10.9326171875, -10.5433349609375, -10.154052734375, -9.7647705078125, -9.37548828125, -8.9862060546875, -8.596923828125, -8.2076416015625, -7.818359375, -7.4290771484375, -7.039794921875, -6.6505126953125, -6.26123046875, -5.8719482421875, -5.482666015625, -5.0933837890625, -4.7041015625, -4.3148193359375, -3.925537109375, -3.5362548828125, -3.14697265625, -2.7576904296875, -2.368408203125, -1.9791259765625, -1.58984375, -1.2005615234375, -0.811279296875, -0.4219970703125, -0.03271484375, 0.3565673828125, 0.745849609375, 1.1351318359375, 1.5244140625, 1.9136962890625, 2.302978515625, 2.6922607421875, 3.08154296875, 3.4708251953125, 3.860107421875, 4.2493896484375, 4.638671875, 5.0279541015625, 5.417236328125, 5.8065185546875, 6.19580078125, 6.5850830078125, 6.974365234375, 7.3636474609375, 7.7529296875, 8.1422119140625, 8.531494140625, 8.9207763671875, 9.31005859375, 9.6993408203125, 10.088623046875, 10.4779052734375, 10.8671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 5.0, 14.0, 17.0, 50.0, 206.0, 360.0, 232.0, 74.0, 24.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-430.3618469238281, -422.3433532714844, -414.3248291015625, -406.30633544921875, -398.2878112792969, -390.2693176269531, -382.25079345703125, -374.2322998046875, -366.21380615234375, -358.1953125, -350.1767883300781, -342.1582946777344, -334.1397705078125, -326.12127685546875, -318.102783203125, -310.0842590332031, -302.06573486328125, -294.0472412109375, -286.0287170410156, -278.0102233886719, -269.99169921875, -261.97320556640625, -253.95469665527344, -245.93618774414062, -237.91769409179688, -229.89918518066406, -221.88067626953125, -213.8621826171875, -205.8436737060547, -197.82516479492188, -189.80665588378906, -181.78814697265625, -173.76963806152344, -165.75112915039062, -157.7326202392578, -149.714111328125, -141.69561767578125, -133.67710876464844, -125.65859985351562, -117.64009094238281, -109.62158966064453, -101.60308074951172, -93.58457946777344, -85.56607055664062, -77.54756164550781, -69.52906036376953, -61.51055145263672, -53.49204635620117, -45.473541259765625, -37.45503616333008, -29.4365291595459, -21.41802215576172, -13.399517059326172, -5.381011962890625, 2.6374969482421875, 10.656002044677734, 18.67450714111328, 26.693012237548828, 34.711517333984375, 42.73002624511719, 50.748531341552734, 58.76703643798828, 66.7855453491211, 74.80404663085938, 82.82255554199219]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 2.0, 4.0, 13.0, 9.0, 15.0, 14.0, 17.0, 16.0, 24.0, 30.0, 30.0, 32.0, 34.0, 30.0, 39.0, 40.0, 50.0, 47.0, 43.0, 31.0, 53.0, 48.0, 42.0, 43.0, 42.0, 34.0, 41.0, 28.0, 28.0, 18.0, 19.0, 19.0, 12.0, 6.0, 11.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.16143798828125, -67.0321044921875, -64.90277099609375, -62.773441314697266, -60.644107818603516, -58.514774322509766, -56.38544464111328, -54.25611114501953, -52.12677764892578, -49.99744415283203, -47.86811065673828, -45.7387809753418, -43.60944747924805, -41.4801139831543, -39.35078430175781, -37.22145080566406, -35.09211730957031, -32.96278381347656, -30.833452224731445, -28.704120635986328, -26.574787139892578, -24.445453643798828, -22.31612205505371, -20.186790466308594, -18.057456970214844, -15.92812442779541, -13.798791885375977, -11.669459342956543, -9.54012680053711, -7.410794258117676, -5.281461715698242, -3.1521291732788086, -1.022796630859375, 1.1065359115600586, 3.235868453979492, 5.365200996398926, 7.494533538818359, 9.623866081237793, 11.753198623657227, 13.88253116607666, 16.011863708496094, 18.141197204589844, 20.27052879333496, 22.399860382080078, 24.529193878173828, 26.658527374267578, 28.787858963012695, 30.917190551757812, 33.04652404785156, 35.17585754394531, 37.30519104003906, 39.43452072143555, 41.5638542175293, 43.69318771362305, 45.82251739501953, 47.95185089111328, 50.08118438720703, 52.21051788330078, 54.33985137939453, 56.469181060791016, 58.598514556884766, 60.727848052978516, 62.857177734375, 64.98651123046875, 67.1158447265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 3.0, 12.0, 22.0, 36.0, 35.0, 64.0, 109.0, 167.0, 294.0, 521.0, 956.0, 1841.0, 3736.0, 7966.0, 17899.0, 43648.0, 113997.0, 301374.0, 334631.0, 132835.0, 50285.0, 20670.0, 8907.0, 4131.0, 1932.0, 1073.0, 590.0, 289.0, 181.0, 135.0, 69.0, 54.0, 33.0, 18.0, 18.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.1129150390625, -8.788330078125, -8.4637451171875, -8.13916015625, -7.8145751953125, -7.489990234375, -7.1654052734375, -6.8408203125, -6.5162353515625, -6.191650390625, -5.8670654296875, -5.54248046875, -5.2178955078125, -4.893310546875, -4.5687255859375, -4.244140625, -3.9195556640625, -3.594970703125, -3.2703857421875, -2.94580078125, -2.6212158203125, -2.296630859375, -1.9720458984375, -1.6474609375, -1.3228759765625, -0.998291015625, -0.6737060546875, -0.34912109375, -0.0245361328125, 0.300048828125, 0.6246337890625, 0.94921875, 1.2738037109375, 1.598388671875, 1.9229736328125, 2.24755859375, 2.5721435546875, 2.896728515625, 3.2213134765625, 3.5458984375, 3.8704833984375, 4.195068359375, 4.5196533203125, 4.84423828125, 5.1688232421875, 5.493408203125, 5.8179931640625, 6.142578125, 6.4671630859375, 6.791748046875, 7.1163330078125, 7.44091796875, 7.7655029296875, 8.090087890625, 8.4146728515625, 8.7392578125, 9.0638427734375, 9.388427734375, 9.7130126953125, 10.03759765625, 10.3621826171875, 10.686767578125, 11.0113525390625, 11.3359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 6.0, 5.0, 10.0, 11.0, 14.0, 21.0, 21.0, 33.0, 32.0, 45.0, 50.0, 41.0, 45.0, 66.0, 64.0, 74.0, 48.0, 53.0, 53.0, 44.0, 38.0, 34.0, 45.0, 32.0, 21.0, 28.0, 14.0, 12.0, 10.0, 6.0, 5.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.88720703125, -8.5869140625, -8.28662109375, -7.986328125, -7.68603515625, -7.3857421875, -7.08544921875, -6.78515625, -6.48486328125, -6.1845703125, -5.88427734375, -5.583984375, -5.28369140625, -4.9833984375, -4.68310546875, -4.3828125, -4.08251953125, -3.7822265625, -3.48193359375, -3.181640625, -2.88134765625, -2.5810546875, -2.28076171875, -1.98046875, -1.68017578125, -1.3798828125, -1.07958984375, -0.779296875, -0.47900390625, -0.1787109375, 0.12158203125, 0.421875, 0.72216796875, 1.0224609375, 1.32275390625, 1.623046875, 1.92333984375, 2.2236328125, 2.52392578125, 2.82421875, 3.12451171875, 3.4248046875, 3.72509765625, 4.025390625, 4.32568359375, 4.6259765625, 4.92626953125, 5.2265625, 5.52685546875, 5.8271484375, 6.12744140625, 6.427734375, 6.72802734375, 7.0283203125, 7.32861328125, 7.62890625, 7.92919921875, 8.2294921875, 8.52978515625, 8.830078125, 9.13037109375, 9.4306640625, 9.73095703125, 10.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 14.0, 14.0, 26.0, 27.0, 51.0, 62.0, 96.0, 115.0, 165.0, 254.0, 410.0, 633.0, 1105.0, 1989.0, 4755.0, 15513.0, 89334.0, 778773.0, 125332.0, 19513.0, 5398.0, 2080.0, 1050.0, 598.0, 401.0, 262.0, 152.0, 110.0, 94.0, 66.0, 42.0, 32.0, 16.0, 15.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.03125, -21.39404296875, -20.7568359375, -20.11962890625, -19.482421875, -18.84521484375, -18.2080078125, -17.57080078125, -16.93359375, -16.29638671875, -15.6591796875, -15.02197265625, -14.384765625, -13.74755859375, -13.1103515625, -12.47314453125, -11.8359375, -11.19873046875, -10.5615234375, -9.92431640625, -9.287109375, -8.64990234375, -8.0126953125, -7.37548828125, -6.73828125, -6.10107421875, -5.4638671875, -4.82666015625, -4.189453125, -3.55224609375, -2.9150390625, -2.27783203125, -1.640625, -1.00341796875, -0.3662109375, 0.27099609375, 0.908203125, 1.54541015625, 2.1826171875, 2.81982421875, 3.45703125, 4.09423828125, 4.7314453125, 5.36865234375, 6.005859375, 6.64306640625, 7.2802734375, 7.91748046875, 8.5546875, 9.19189453125, 9.8291015625, 10.46630859375, 11.103515625, 11.74072265625, 12.3779296875, 13.01513671875, 13.65234375, 14.28955078125, 14.9267578125, 15.56396484375, 16.201171875, 16.83837890625, 17.4755859375, 18.11279296875, 18.75]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 5.0, 15.0, 15.0, 14.0, 18.0, 32.0, 25.0, 39.0, 49.0, 60.0, 64.0, 60.0, 57.0, 49.0, 62.0, 68.0, 70.0, 54.0, 41.0, 37.0, 25.0, 25.0, 21.0, 17.0, 14.0, 13.0, 12.0, 6.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.90625, -35.849609375, -34.79296875, -33.736328125, -32.6796875, -31.623046875, -30.56640625, -29.509765625, -28.453125, -27.396484375, -26.33984375, -25.283203125, -24.2265625, -23.169921875, -22.11328125, -21.056640625, -20.0, -18.943359375, -17.88671875, -16.830078125, -15.7734375, -14.716796875, -13.66015625, -12.603515625, -11.546875, -10.490234375, -9.43359375, -8.376953125, -7.3203125, -6.263671875, -5.20703125, -4.150390625, -3.09375, -2.037109375, -0.98046875, 0.076171875, 1.1328125, 2.189453125, 3.24609375, 4.302734375, 5.359375, 6.416015625, 7.47265625, 8.529296875, 9.5859375, 10.642578125, 11.69921875, 12.755859375, 13.8125, 14.869140625, 15.92578125, 16.982421875, 18.0390625, 19.095703125, 20.15234375, 21.208984375, 22.265625, 23.322265625, 24.37890625, 25.435546875, 26.4921875, 27.548828125, 28.60546875, 29.662109375, 30.71875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 12.0, 13.0, 15.0, 24.0, 22.0, 37.0, 37.0, 62.0, 77.0, 102.0, 148.0, 257.0, 426.0, 704.0, 1405.0, 2967.0, 7148.0, 21369.0, 87257.0, 731170.0, 147576.0, 30481.0, 9523.0, 3735.0, 1696.0, 887.0, 480.0, 278.0, 176.0, 115.0, 68.0, 70.0, 44.0, 41.0, 34.0, 18.0, 16.0, 10.0, 8.0, 9.0, 4.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.93359375, -2.843719482421875, -2.75384521484375, -2.663970947265625, -2.5740966796875, -2.484222412109375, -2.39434814453125, -2.304473876953125, -2.214599609375, -2.124725341796875, -2.03485107421875, -1.944976806640625, -1.8551025390625, -1.765228271484375, -1.67535400390625, -1.585479736328125, -1.49560546875, -1.405731201171875, -1.31585693359375, -1.225982666015625, -1.1361083984375, -1.046234130859375, -0.95635986328125, -0.866485595703125, -0.776611328125, -0.686737060546875, -0.59686279296875, -0.506988525390625, -0.4171142578125, -0.327239990234375, -0.23736572265625, -0.147491455078125, -0.0576171875, 0.032257080078125, 0.12213134765625, 0.212005615234375, 0.3018798828125, 0.391754150390625, 0.48162841796875, 0.571502685546875, 0.661376953125, 0.751251220703125, 0.84112548828125, 0.930999755859375, 1.0208740234375, 1.110748291015625, 1.20062255859375, 1.290496826171875, 1.38037109375, 1.470245361328125, 1.56011962890625, 1.649993896484375, 1.7398681640625, 1.829742431640625, 1.91961669921875, 2.009490966796875, 2.099365234375, 2.189239501953125, 2.27911376953125, 2.368988037109375, 2.4588623046875, 2.548736572265625, 2.63861083984375, 2.728485107421875, 2.818359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 6.0, 11.0, 14.0, 27.0, 28.0, 40.0, 58.0, 102.0, 136.0, 143.0, 128.0, 65.0, 51.0, 31.0, 27.0, 18.0, 19.0, 8.0, 9.0, 6.0, 8.0, 4.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008645057678222656, -0.0008338764309883118, -0.0008032470941543579, -0.000772617757320404, -0.0007419884204864502, -0.0007113590836524963, -0.0006807297468185425, -0.0006501004099845886, -0.0006194710731506348, -0.0005888417363166809, -0.000558212399482727, -0.0005275830626487732, -0.0004969537258148193, -0.0004663243889808655, -0.0004356950521469116, -0.00040506571531295776, -0.0003744363784790039, -0.00034380704164505005, -0.0003131777048110962, -0.00028254836797714233, -0.0002519190311431885, -0.00022128969430923462, -0.00019066035747528076, -0.0001600310206413269, -0.00012940168380737305, -9.877234697341919e-05, -6.814301013946533e-05, -3.7513673305511475e-05, -6.884336471557617e-06, 2.374500036239624e-05, 5.43743371963501e-05, 8.500367403030396e-05, 0.00011563301086425781, 0.00014626234769821167, 0.00017689168453216553, 0.00020752102136611938, 0.00023815035820007324, 0.0002687796950340271, 0.00029940903186798096, 0.0003300383687019348, 0.00036066770553588867, 0.00039129704236984253, 0.0004219263792037964, 0.00045255571603775024, 0.0004831850528717041, 0.000513814389705658, 0.0005444437265396118, 0.0005750730633735657, 0.0006057024002075195, 0.0006363317370414734, 0.0006669610738754272, 0.0006975904107093811, 0.000728219747543335, 0.0007588490843772888, 0.0007894784212112427, 0.0008201077580451965, 0.0008507370948791504, 0.0008813664317131042, 0.0009119957685470581, 0.000942625105381012, 0.0009732544422149658, 0.0010038837790489197, 0.0010345131158828735, 0.0010651424527168274, 0.0010957717895507812]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 13.0, 27.0, 41.0, 52.0, 85.0, 87.0, 135.0, 210.0, 301.0, 552.0, 964.0, 1802.0, 3889.0, 9427.0, 29483.0, 134686.0, 706339.0, 117205.0, 26585.0, 8697.0, 3673.0, 1814.0, 993.0, 549.0, 329.0, 183.0, 136.0, 76.0, 62.0, 40.0, 28.0, 16.0, 18.0, 6.0, 7.0, 10.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.201171875, -3.113372802734375, -3.02557373046875, -2.937774658203125, -2.8499755859375, -2.762176513671875, -2.67437744140625, -2.586578369140625, -2.498779296875, -2.410980224609375, -2.32318115234375, -2.235382080078125, -2.1475830078125, -2.059783935546875, -1.97198486328125, -1.884185791015625, -1.79638671875, -1.708587646484375, -1.62078857421875, -1.532989501953125, -1.4451904296875, -1.357391357421875, -1.26959228515625, -1.181793212890625, -1.093994140625, -1.006195068359375, -0.91839599609375, -0.830596923828125, -0.7427978515625, -0.654998779296875, -0.56719970703125, -0.479400634765625, -0.3916015625, -0.303802490234375, -0.21600341796875, -0.128204345703125, -0.0404052734375, 0.047393798828125, 0.13519287109375, 0.222991943359375, 0.310791015625, 0.398590087890625, 0.48638916015625, 0.574188232421875, 0.6619873046875, 0.749786376953125, 0.83758544921875, 0.925384521484375, 1.01318359375, 1.100982666015625, 1.18878173828125, 1.276580810546875, 1.3643798828125, 1.452178955078125, 1.53997802734375, 1.627777099609375, 1.715576171875, 1.803375244140625, 1.89117431640625, 1.978973388671875, 2.0667724609375, 2.154571533203125, 2.24237060546875, 2.330169677734375, 2.41796875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 1.0, 8.0, 15.0, 11.0, 23.0, 19.0, 27.0, 39.0, 41.0, 55.0, 53.0, 65.0, 94.0, 88.0, 72.0, 58.0, 62.0, 43.0, 29.0, 35.0, 31.0, 28.0, 17.0, 14.0, 16.0, 9.0, 5.0, 10.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.14105224609375, -3.0438232421875, -2.94659423828125, -2.849365234375, -2.75213623046875, -2.6549072265625, -2.55767822265625, -2.46044921875, -2.36322021484375, -2.2659912109375, -2.16876220703125, -2.071533203125, -1.97430419921875, -1.8770751953125, -1.77984619140625, -1.6826171875, -1.58538818359375, -1.4881591796875, -1.39093017578125, -1.293701171875, -1.19647216796875, -1.0992431640625, -1.00201416015625, -0.90478515625, -0.80755615234375, -0.7103271484375, -0.61309814453125, -0.515869140625, -0.41864013671875, -0.3214111328125, -0.22418212890625, -0.126953125, -0.02972412109375, 0.0675048828125, 0.16473388671875, 0.261962890625, 0.35919189453125, 0.4564208984375, 0.55364990234375, 0.65087890625, 0.74810791015625, 0.8453369140625, 0.94256591796875, 1.039794921875, 1.13702392578125, 1.2342529296875, 1.33148193359375, 1.4287109375, 1.52593994140625, 1.6231689453125, 1.72039794921875, 1.817626953125, 1.91485595703125, 2.0120849609375, 2.10931396484375, 2.20654296875, 2.30377197265625, 2.4010009765625, 2.49822998046875, 2.595458984375, 2.69268798828125, 2.7899169921875, 2.88714599609375, 2.984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 8.0, 23.0, 48.0, 128.0, 373.0, 262.0, 93.0, 34.0, 16.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.67706298828125, -138.86956787109375, -133.06207275390625, -127.25458526611328, -121.44709777832031, -115.63960266113281, -109.83210754394531, -104.02461242675781, -98.21712493896484, -92.40962982177734, -86.60214233398438, -80.79464721679688, -74.98715209960938, -69.1796646118164, -63.372169494628906, -57.56467819213867, -51.75718688964844, -45.9496955871582, -40.14220428466797, -34.33470916748047, -28.527217864990234, -22.7197265625, -16.9122314453125, -11.104740142822266, -5.297248840332031, 0.5102434158325195, 6.31773567199707, 12.125228881835938, 17.932720184326172, 23.740211486816406, 29.547706604003906, 35.35519790649414, 41.162689208984375, 46.97018051147461, 52.777671813964844, 58.585166931152344, 64.39265441894531, 70.20014953613281, 76.00764465332031, 81.81513977050781, 87.62262725830078, 93.43012237548828, 99.23760986328125, 105.04510498046875, 110.85260009765625, 116.66008758544922, 122.46758270263672, 128.2750701904297, 134.0825653076172, 139.8900604248047, 145.6975555419922, 151.50503540039062, 157.31253051757812, 163.12002563476562, 168.92752075195312, 174.73501586914062, 180.54251098632812, 186.35000610351562, 192.15750122070312, 197.96499633789062, 203.77247619628906, 209.57997131347656, 215.38746643066406, 221.19496154785156, 227.00244140625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 13.0, 8.0, 15.0, 12.0, 22.0, 24.0, 38.0, 31.0, 32.0, 46.0, 47.0, 80.0, 123.0, 123.0, 78.0, 45.0, 47.0, 38.0, 21.0, 26.0, 20.0, 18.0, 12.0, 13.0, 12.0, 9.0, 6.0, 4.0, 8.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-124.669677734375, -121.20639038085938, -117.74310302734375, -114.27981567382812, -110.8165283203125, -107.35324096679688, -103.88995361328125, -100.42666625976562, -96.96337890625, -93.50009155273438, -90.03680419921875, -86.57351684570312, -83.1102294921875, -79.64694213867188, -76.18365478515625, -72.72036743164062, -69.257080078125, -65.79379272460938, -62.33050537109375, -58.867218017578125, -55.4039306640625, -51.940643310546875, -48.47735595703125, -45.014068603515625, -41.55078125, -38.087493896484375, -34.62420654296875, -31.160919189453125, -27.6976318359375, -24.234344482421875, -20.77105712890625, -17.307769775390625, -13.844490051269531, -10.381202697753906, -6.917915344238281, -3.4546279907226562, 0.00865936279296875, 3.4719467163085938, 6.935234069824219, 10.398521423339844, 13.861808776855469, 17.325096130371094, 20.78838348388672, 24.251670837402344, 27.71495819091797, 31.178245544433594, 34.64153289794922, 38.104820251464844, 41.56810760498047, 45.031394958496094, 48.49468231201172, 51.957969665527344, 55.42125701904297, 58.884544372558594, 62.34783172607422, 65.81111907958984, 69.27440643310547, 72.7376937866211, 76.20098114013672, 79.66426849365234, 83.12755584716797, 86.5908432006836, 90.05413055419922, 93.51741790771484, 96.98070526123047]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 2.0, 6.0, 21.0, 19.0, 19.0, 31.0, 39.0, 71.0, 97.0, 151.0, 187.0, 361.0, 581.0, 1122.0, 2499.0, 7288.0, 23337.0, 114692.0, 714617.0, 2202311.0, 931879.0, 156166.0, 26354.0, 7059.0, 2476.0, 1150.0, 676.0, 376.0, 200.0, 153.0, 98.0, 55.0, 63.0, 40.0, 22.0, 17.0, 10.0, 10.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7421875, -10.390869140625, -10.03955078125, -9.688232421875, -9.3369140625, -8.985595703125, -8.63427734375, -8.282958984375, -7.931640625, -7.580322265625, -7.22900390625, -6.877685546875, -6.5263671875, -6.175048828125, -5.82373046875, -5.472412109375, -5.12109375, -4.769775390625, -4.41845703125, -4.067138671875, -3.7158203125, -3.364501953125, -3.01318359375, -2.661865234375, -2.310546875, -1.959228515625, -1.60791015625, -1.256591796875, -0.9052734375, -0.553955078125, -0.20263671875, 0.148681640625, 0.5, 0.851318359375, 1.20263671875, 1.553955078125, 1.9052734375, 2.256591796875, 2.60791015625, 2.959228515625, 3.310546875, 3.661865234375, 4.01318359375, 4.364501953125, 4.7158203125, 5.067138671875, 5.41845703125, 5.769775390625, 6.12109375, 6.472412109375, 6.82373046875, 7.175048828125, 7.5263671875, 7.877685546875, 8.22900390625, 8.580322265625, 8.931640625, 9.282958984375, 9.63427734375, 9.985595703125, 10.3369140625, 10.688232421875, 11.03955078125, 11.390869140625, 11.7421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 10.0, 11.0, 13.0, 22.0, 16.0, 28.0, 26.0, 43.0, 49.0, 45.0, 57.0, 60.0, 67.0, 78.0, 49.0, 57.0, 54.0, 59.0, 58.0, 37.0, 35.0, 20.0, 29.0, 17.0, 9.0, 14.0, 8.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.8955078125, -8.595703125, -8.2958984375, -7.99609375, -7.6962890625, -7.396484375, -7.0966796875, -6.796875, -6.4970703125, -6.197265625, -5.8974609375, -5.59765625, -5.2978515625, -4.998046875, -4.6982421875, -4.3984375, -4.0986328125, -3.798828125, -3.4990234375, -3.19921875, -2.8994140625, -2.599609375, -2.2998046875, -2.0, -1.7001953125, -1.400390625, -1.1005859375, -0.80078125, -0.5009765625, -0.201171875, 0.0986328125, 0.3984375, 0.6982421875, 0.998046875, 1.2978515625, 1.59765625, 1.8974609375, 2.197265625, 2.4970703125, 2.796875, 3.0966796875, 3.396484375, 3.6962890625, 3.99609375, 4.2958984375, 4.595703125, 4.8955078125, 5.1953125, 5.4951171875, 5.794921875, 6.0947265625, 6.39453125, 6.6943359375, 6.994140625, 7.2939453125, 7.59375, 7.8935546875, 8.193359375, 8.4931640625, 8.79296875, 9.0927734375, 9.392578125, 9.6923828125, 9.9921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 5.0, 5.0, 12.0, 20.0, 14.0, 35.0, 80.0, 140.0, 244.0, 512.0, 1594.0, 7881.0, 439948.0, 3722576.0, 17075.0, 2566.0, 827.0, 323.0, 170.0, 80.0, 58.0, 37.0, 25.0, 16.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.28125, -36.87109375, -35.4609375, -34.05078125, -32.640625, -31.23046875, -29.8203125, -28.41015625, -27.0, -25.58984375, -24.1796875, -22.76953125, -21.359375, -19.94921875, -18.5390625, -17.12890625, -15.71875, -14.30859375, -12.8984375, -11.48828125, -10.078125, -8.66796875, -7.2578125, -5.84765625, -4.4375, -3.02734375, -1.6171875, -0.20703125, 1.203125, 2.61328125, 4.0234375, 5.43359375, 6.84375, 8.25390625, 9.6640625, 11.07421875, 12.484375, 13.89453125, 15.3046875, 16.71484375, 18.125, 19.53515625, 20.9453125, 22.35546875, 23.765625, 25.17578125, 26.5859375, 27.99609375, 29.40625, 30.81640625, 32.2265625, 33.63671875, 35.046875, 36.45703125, 37.8671875, 39.27734375, 40.6875, 42.09765625, 43.5078125, 44.91796875, 46.328125, 47.73828125, 49.1484375, 50.55859375, 51.96875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 4.0, 3.0, 6.0, 11.0, 16.0, 20.0, 24.0, 40.0, 72.0, 99.0, 173.0, 316.0, 533.0, 709.0, 754.0, 475.0, 304.0, 174.0, 111.0, 74.0, 44.0, 39.0, 20.0, 11.0, 7.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.47216796875, -19.7099609375, -18.94775390625, -18.185546875, -17.42333984375, -16.6611328125, -15.89892578125, -15.13671875, -14.37451171875, -13.6123046875, -12.85009765625, -12.087890625, -11.32568359375, -10.5634765625, -9.80126953125, -9.0390625, -8.27685546875, -7.5146484375, -6.75244140625, -5.990234375, -5.22802734375, -4.4658203125, -3.70361328125, -2.94140625, -2.17919921875, -1.4169921875, -0.65478515625, 0.107421875, 0.86962890625, 1.6318359375, 2.39404296875, 3.15625, 3.91845703125, 4.6806640625, 5.44287109375, 6.205078125, 6.96728515625, 7.7294921875, 8.49169921875, 9.25390625, 10.01611328125, 10.7783203125, 11.54052734375, 12.302734375, 13.06494140625, 13.8271484375, 14.58935546875, 15.3515625, 16.11376953125, 16.8759765625, 17.63818359375, 18.400390625, 19.16259765625, 19.9248046875, 20.68701171875, 21.44921875, 22.21142578125, 22.9736328125, 23.73583984375, 24.498046875, 25.26025390625, 26.0224609375, 26.78466796875, 27.546875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 10.0, 4.0, 29.0, 49.0, 110.0, 234.0, 265.0, 158.0, 68.0, 23.0, 26.0, 8.0, 7.0, 4.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.176513671875, -169.78628540039062, -160.39605712890625, -151.00582885742188, -141.6156005859375, -132.22537231445312, -122.83515930175781, -113.44493103027344, -104.05470275878906, -94.66447448730469, -85.27424621582031, -75.88402557373047, -66.4937973022461, -57.10356903076172, -47.71334457397461, -38.3231201171875, -28.932891845703125, -19.542665481567383, -10.15243911743164, -0.7622127532958984, 8.628013610839844, 18.01824188232422, 27.408466339111328, 36.79869079589844, 46.18891906738281, 55.57914733886719, 64.96937561035156, 74.3595962524414, 83.74982452392578, 93.14005279541016, 102.5302734375, 111.92050170898438, 121.31072998046875, 130.70095825195312, 140.0911865234375, 149.48141479492188, 158.87164306640625, 168.26187133789062, 177.65208435058594, 187.0423126220703, 196.4325408935547, 205.82276916503906, 215.21299743652344, 224.6032257080078, 233.99343872070312, 243.3836669921875, 252.77389526367188, 262.16412353515625, 271.5543518066406, 280.944580078125, 290.3348083496094, 299.72503662109375, 309.1152648925781, 318.5054931640625, 327.8957214355469, 337.28594970703125, 346.6761474609375, 356.0663757324219, 365.45660400390625, 374.8468322753906, 384.237060546875, 393.6272888183594, 403.01751708984375, 412.40771484375, 421.7979736328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 3.0, 5.0, 6.0, 12.0, 10.0, 9.0, 14.0, 25.0, 24.0, 13.0, 23.0, 20.0, 34.0, 41.0, 34.0, 45.0, 41.0, 43.0, 48.0, 63.0, 63.0, 54.0, 50.0, 43.0, 33.0, 37.0, 43.0, 27.0, 19.0, 31.0, 10.0, 21.0, 14.0, 8.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-120.64923095703125, -117.22179412841797, -113.79436492919922, -110.36692810058594, -106.93949890136719, -103.5120620727539, -100.08462524414062, -96.65719604492188, -93.22976684570312, -89.80233001708984, -86.3749008178711, -82.94746398925781, -79.52003479003906, -76.09259796142578, -72.6651611328125, -69.23773193359375, -65.81029510498047, -62.38286209106445, -58.95542907714844, -55.527992248535156, -52.100563049316406, -48.673126220703125, -45.24569320678711, -41.818260192871094, -38.39082717895508, -34.96339416503906, -31.535961151123047, -28.1085262298584, -24.681093215942383, -21.253660202026367, -17.82622528076172, -14.398792266845703, -10.971359252929688, -7.543925762176514, -4.11649227142334, -0.6890583038330078, 2.738374710083008, 6.165807723999023, 9.593242645263672, 13.020675659179688, 16.448108673095703, 19.87554168701172, 23.302974700927734, 26.730409622192383, 30.1578426361084, 33.58527374267578, 37.01271057128906, 40.44014358520508, 43.867576599121094, 47.29500961303711, 50.722442626953125, 54.149879455566406, 57.577308654785156, 61.00474548339844, 64.43217468261719, 67.85961151123047, 71.28704833984375, 74.71448516845703, 78.14191436767578, 81.56935119628906, 84.99678039550781, 88.4242172241211, 91.85165405273438, 95.27908325195312, 98.70651245117188]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 20.0, 31.0, 44.0, 55.0, 88.0, 144.0, 208.0, 358.0, 535.0, 980.0, 1788.0, 3626.0, 7714.0, 19449.0, 55368.0, 186300.0, 480831.0, 196207.0, 58528.0, 19964.0, 8097.0, 3801.0, 1881.0, 1035.0, 527.0, 362.0, 183.0, 125.0, 83.0, 54.0, 40.0, 19.0, 19.0, 12.0, 5.0, 15.0, 10.0, 5.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.2890625, -9.962646484375, -9.63623046875, -9.309814453125, -8.9833984375, -8.656982421875, -8.33056640625, -8.004150390625, -7.677734375, -7.351318359375, -7.02490234375, -6.698486328125, -6.3720703125, -6.045654296875, -5.71923828125, -5.392822265625, -5.06640625, -4.739990234375, -4.41357421875, -4.087158203125, -3.7607421875, -3.434326171875, -3.10791015625, -2.781494140625, -2.455078125, -2.128662109375, -1.80224609375, -1.475830078125, -1.1494140625, -0.822998046875, -0.49658203125, -0.170166015625, 0.15625, 0.482666015625, 0.80908203125, 1.135498046875, 1.4619140625, 1.788330078125, 2.11474609375, 2.441162109375, 2.767578125, 3.093994140625, 3.42041015625, 3.746826171875, 4.0732421875, 4.399658203125, 4.72607421875, 5.052490234375, 5.37890625, 5.705322265625, 6.03173828125, 6.358154296875, 6.6845703125, 7.010986328125, 7.33740234375, 7.663818359375, 7.990234375, 8.316650390625, 8.64306640625, 8.969482421875, 9.2958984375, 9.622314453125, 9.94873046875, 10.275146484375, 10.6015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 8.0, 9.0, 12.0, 13.0, 15.0, 34.0, 17.0, 19.0, 34.0, 42.0, 56.0, 48.0, 45.0, 57.0, 43.0, 57.0, 66.0, 55.0, 46.0, 58.0, 61.0, 35.0, 34.0, 27.0, 30.0, 19.0, 18.0, 11.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.3314208984375, -8.037841796875, -7.7442626953125, -7.45068359375, -7.1571044921875, -6.863525390625, -6.5699462890625, -6.2763671875, -5.9827880859375, -5.689208984375, -5.3956298828125, -5.10205078125, -4.8084716796875, -4.514892578125, -4.2213134765625, -3.927734375, -3.6341552734375, -3.340576171875, -3.0469970703125, -2.75341796875, -2.4598388671875, -2.166259765625, -1.8726806640625, -1.5791015625, -1.2855224609375, -0.991943359375, -0.6983642578125, -0.40478515625, -0.1112060546875, 0.182373046875, 0.4759521484375, 0.76953125, 1.0631103515625, 1.356689453125, 1.6502685546875, 1.94384765625, 2.2374267578125, 2.531005859375, 2.8245849609375, 3.1181640625, 3.4117431640625, 3.705322265625, 3.9989013671875, 4.29248046875, 4.5860595703125, 4.879638671875, 5.1732177734375, 5.466796875, 5.7603759765625, 6.053955078125, 6.3475341796875, 6.64111328125, 6.9346923828125, 7.228271484375, 7.5218505859375, 7.8154296875, 8.1090087890625, 8.402587890625, 8.6961669921875, 8.98974609375, 9.2833251953125, 9.576904296875, 9.8704833984375, 10.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 7.0, 14.0, 16.0, 33.0, 41.0, 44.0, 86.0, 122.0, 159.0, 284.0, 526.0, 1114.0, 2999.0, 14886.0, 227806.0, 755578.0, 36545.0, 4992.0, 1568.0, 677.0, 373.0, 201.0, 140.0, 77.0, 57.0, 53.0, 36.0, 24.0, 11.0, 17.0, 14.0, 10.0, 4.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-19.046875, -18.5609130859375, -18.074951171875, -17.5889892578125, -17.10302734375, -16.6170654296875, -16.131103515625, -15.6451416015625, -15.1591796875, -14.6732177734375, -14.187255859375, -13.7012939453125, -13.21533203125, -12.7293701171875, -12.243408203125, -11.7574462890625, -11.271484375, -10.7855224609375, -10.299560546875, -9.8135986328125, -9.32763671875, -8.8416748046875, -8.355712890625, -7.8697509765625, -7.3837890625, -6.8978271484375, -6.411865234375, -5.9259033203125, -5.43994140625, -4.9539794921875, -4.468017578125, -3.9820556640625, -3.49609375, -3.0101318359375, -2.524169921875, -2.0382080078125, -1.55224609375, -1.0662841796875, -0.580322265625, -0.0943603515625, 0.3916015625, 0.8775634765625, 1.363525390625, 1.8494873046875, 2.33544921875, 2.8214111328125, 3.307373046875, 3.7933349609375, 4.279296875, 4.7652587890625, 5.251220703125, 5.7371826171875, 6.22314453125, 6.7091064453125, 7.195068359375, 7.6810302734375, 8.1669921875, 8.6529541015625, 9.138916015625, 9.6248779296875, 10.11083984375, 10.5968017578125, 11.082763671875, 11.5687255859375, 12.0546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 6.0, 4.0, 9.0, 11.0, 7.0, 16.0, 13.0, 15.0, 15.0, 19.0, 18.0, 29.0, 24.0, 35.0, 38.0, 38.0, 51.0, 56.0, 66.0, 69.0, 61.0, 54.0, 42.0, 38.0, 36.0, 42.0, 20.0, 36.0, 18.0, 17.0, 12.0, 11.0, 14.0, 9.0, 11.0, 8.0, 7.0, 6.0, 7.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.0625, -25.207763671875, -24.35302734375, -23.498291015625, -22.6435546875, -21.788818359375, -20.93408203125, -20.079345703125, -19.224609375, -18.369873046875, -17.51513671875, -16.660400390625, -15.8056640625, -14.950927734375, -14.09619140625, -13.241455078125, -12.38671875, -11.531982421875, -10.67724609375, -9.822509765625, -8.9677734375, -8.113037109375, -7.25830078125, -6.403564453125, -5.548828125, -4.694091796875, -3.83935546875, -2.984619140625, -2.1298828125, -1.275146484375, -0.42041015625, 0.434326171875, 1.2890625, 2.143798828125, 2.99853515625, 3.853271484375, 4.7080078125, 5.562744140625, 6.41748046875, 7.272216796875, 8.126953125, 8.981689453125, 9.83642578125, 10.691162109375, 11.5458984375, 12.400634765625, 13.25537109375, 14.110107421875, 14.96484375, 15.819580078125, 16.67431640625, 17.529052734375, 18.3837890625, 19.238525390625, 20.09326171875, 20.947998046875, 21.802734375, 22.657470703125, 23.51220703125, 24.366943359375, 25.2216796875, 26.076416015625, 26.93115234375, 27.785888671875, 28.640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 12.0, 18.0, 18.0, 30.0, 48.0, 86.0, 154.0, 312.0, 829.0, 3101.0, 18170.0, 839739.0, 171347.0, 11164.0, 2213.0, 690.0, 282.0, 125.0, 64.0, 44.0, 27.0, 19.0, 10.0, 13.0, 7.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.205078125, -3.113189697265625, -3.02130126953125, -2.929412841796875, -2.8375244140625, -2.745635986328125, -2.65374755859375, -2.561859130859375, -2.469970703125, -2.378082275390625, -2.28619384765625, -2.194305419921875, -2.1024169921875, -2.010528564453125, -1.91864013671875, -1.826751708984375, -1.73486328125, -1.642974853515625, -1.55108642578125, -1.459197998046875, -1.3673095703125, -1.275421142578125, -1.18353271484375, -1.091644287109375, -0.999755859375, -0.907867431640625, -0.81597900390625, -0.724090576171875, -0.6322021484375, -0.540313720703125, -0.44842529296875, -0.356536865234375, -0.2646484375, -0.172760009765625, -0.08087158203125, 0.011016845703125, 0.1029052734375, 0.194793701171875, 0.28668212890625, 0.378570556640625, 0.470458984375, 0.562347412109375, 0.65423583984375, 0.746124267578125, 0.8380126953125, 0.929901123046875, 1.02178955078125, 1.113677978515625, 1.20556640625, 1.297454833984375, 1.38934326171875, 1.481231689453125, 1.5731201171875, 1.665008544921875, 1.75689697265625, 1.848785400390625, 1.940673828125, 2.032562255859375, 2.12445068359375, 2.216339111328125, 2.3082275390625, 2.400115966796875, 2.49200439453125, 2.583892822265625, 2.67578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 5.0, 15.0, 14.0, 27.0, 30.0, 41.0, 60.0, 99.0, 111.0, 134.0, 128.0, 81.0, 62.0, 35.0, 24.0, 26.0, 21.0, 14.0, 9.0, 10.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006089210510253906, -0.0005906447768211365, -0.0005723685026168823, -0.0005540922284126282, -0.000535815954208374, -0.0005175396800041199, -0.0004992634057998657, -0.00048098713159561157, -0.0004627108573913574, -0.00044443458318710327, -0.0004261583089828491, -0.00040788203477859497, -0.0003896057605743408, -0.00037132948637008667, -0.0003530532121658325, -0.00033477693796157837, -0.0003165006637573242, -0.00029822438955307007, -0.0002799481153488159, -0.00026167184114456177, -0.00024339556694030762, -0.00022511929273605347, -0.00020684301853179932, -0.00018856674432754517, -0.00017029047012329102, -0.00015201419591903687, -0.00013373792171478271, -0.00011546164751052856, -9.718537330627441e-05, -7.890909910202026e-05, -6.063282489776611e-05, -4.235655069351196e-05, -2.4080276489257812e-05, -5.804002285003662e-06, 1.2472271919250488e-05, 3.074854612350464e-05, 4.902482032775879e-05, 6.730109453201294e-05, 8.557736873626709e-05, 0.00010385364294052124, 0.0001221299171447754, 0.00014040619134902954, 0.0001586824655532837, 0.00017695873975753784, 0.000195235013961792, 0.00021351128816604614, 0.0002317875623703003, 0.00025006383657455444, 0.0002683401107788086, 0.00028661638498306274, 0.0003048926591873169, 0.00032316893339157104, 0.0003414452075958252, 0.00035972148180007935, 0.0003779977560043335, 0.00039627403020858765, 0.0004145503044128418, 0.00043282657861709595, 0.0004511028528213501, 0.00046937912702560425, 0.0004876554012298584, 0.0005059316754341125, 0.0005242079496383667, 0.0005424842238426208, 0.000560760498046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 13.0, 9.0, 15.0, 27.0, 35.0, 42.0, 65.0, 102.0, 151.0, 262.0, 449.0, 869.0, 1586.0, 3482.0, 8536.0, 24401.0, 106493.0, 766216.0, 97161.0, 23578.0, 8107.0, 3332.0, 1629.0, 765.0, 498.0, 236.0, 173.0, 86.0, 68.0, 36.0, 29.0, 30.0, 18.0, 8.0, 6.0, 9.0, 9.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2571563720703125, -1.214508056640625, -1.1718597412109375, -1.12921142578125, -1.0865631103515625, -1.043914794921875, -1.0012664794921875, -0.9586181640625, -0.9159698486328125, -0.873321533203125, -0.8306732177734375, -0.78802490234375, -0.7453765869140625, -0.702728271484375, -0.6600799560546875, -0.617431640625, -0.5747833251953125, -0.532135009765625, -0.4894866943359375, -0.44683837890625, -0.4041900634765625, -0.361541748046875, -0.3188934326171875, -0.2762451171875, -0.2335968017578125, -0.190948486328125, -0.1483001708984375, -0.10565185546875, -0.0630035400390625, -0.020355224609375, 0.0222930908203125, 0.06494140625, 0.1075897216796875, 0.150238037109375, 0.1928863525390625, 0.23553466796875, 0.2781829833984375, 0.320831298828125, 0.3634796142578125, 0.4061279296875, 0.4487762451171875, 0.491424560546875, 0.5340728759765625, 0.57672119140625, 0.6193695068359375, 0.662017822265625, 0.7046661376953125, 0.747314453125, 0.7899627685546875, 0.832611083984375, 0.8752593994140625, 0.91790771484375, 0.9605560302734375, 1.003204345703125, 1.0458526611328125, 1.0885009765625, 1.1311492919921875, 1.173797607421875, 1.2164459228515625, 1.25909423828125, 1.3017425537109375, 1.344390869140625, 1.3870391845703125, 1.4296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 7.0, 2.0, 4.0, 6.0, 10.0, 13.0, 13.0, 22.0, 23.0, 38.0, 42.0, 72.0, 133.0, 129.0, 111.0, 97.0, 85.0, 52.0, 32.0, 25.0, 19.0, 16.0, 13.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.337890625, -2.270416259765625, -2.20294189453125, -2.135467529296875, -2.0679931640625, -2.000518798828125, -1.93304443359375, -1.865570068359375, -1.798095703125, -1.730621337890625, -1.66314697265625, -1.595672607421875, -1.5281982421875, -1.460723876953125, -1.39324951171875, -1.325775146484375, -1.25830078125, -1.190826416015625, -1.12335205078125, -1.055877685546875, -0.9884033203125, -0.920928955078125, -0.85345458984375, -0.785980224609375, -0.718505859375, -0.651031494140625, -0.58355712890625, -0.516082763671875, -0.4486083984375, -0.381134033203125, -0.31365966796875, -0.246185302734375, -0.1787109375, -0.111236572265625, -0.04376220703125, 0.023712158203125, 0.0911865234375, 0.158660888671875, 0.22613525390625, 0.293609619140625, 0.361083984375, 0.428558349609375, 0.49603271484375, 0.563507080078125, 0.6309814453125, 0.698455810546875, 0.76593017578125, 0.833404541015625, 0.90087890625, 0.968353271484375, 1.03582763671875, 1.103302001953125, 1.1707763671875, 1.238250732421875, 1.30572509765625, 1.373199462890625, 1.440673828125, 1.508148193359375, 1.57562255859375, 1.643096923828125, 1.7105712890625, 1.778045654296875, 1.84552001953125, 1.912994384765625, 1.98046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 13.0, 24.0, 49.0, 106.0, 476.0, 137.0, 70.0, 45.0, 21.0, 14.0, 15.0, 3.0, 5.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.92178344726562, -66.52570343017578, -63.12963104248047, -59.733551025390625, -56.33747863769531, -52.94139862060547, -49.54532241821289, -46.14924621582031, -42.753170013427734, -39.357093811035156, -35.96101760864258, -32.56494140625, -29.16886329650879, -25.77278709411621, -22.376708984375, -18.980632781982422, -15.584556579589844, -12.188480377197266, -8.792403221130371, -5.396326065063477, -2.0002498626708984, 1.3958263397216797, 4.791904449462891, 8.187980651855469, 11.584056854248047, 14.980133056640625, 18.376209259033203, 21.772287368774414, 25.168363571166992, 28.56443977355957, 31.96051788330078, 35.35659408569336, 38.75267028808594, 42.148746490478516, 45.544822692871094, 48.94090270996094, 52.33697509765625, 55.733055114746094, 59.12913131713867, 62.52520751953125, 65.92127990722656, 69.3173599243164, 72.71343231201172, 76.10951232910156, 79.50558471679688, 82.90166473388672, 86.29774475097656, 89.69381713867188, 93.08989715576172, 96.48597717285156, 99.88204956054688, 103.27812957763672, 106.67420196533203, 110.07028198242188, 113.46635437011719, 116.86243438720703, 120.25851440429688, 123.65459442138672, 127.05066680908203, 130.44674682617188, 133.8428192138672, 137.2388916015625, 140.63497924804688, 144.0310516357422, 147.4271240234375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 3.0, 9.0, 6.0, 6.0, 17.0, 10.0, 10.0, 19.0, 21.0, 20.0, 21.0, 18.0, 27.0, 56.0, 143.0, 168.0, 148.0, 49.0, 29.0, 29.0, 19.0, 16.0, 16.0, 14.0, 17.0, 16.0, 5.0, 12.0, 12.0, 6.0, 10.0, 3.0, 8.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.87934112548828, -67.33285522460938, -64.786376953125, -62.23989486694336, -59.69341278076172, -57.14692687988281, -54.60044479370117, -52.05396270751953, -49.50748062133789, -46.96099853515625, -44.41451644897461, -41.86803436279297, -39.32154846191406, -36.77507019042969, -34.22858428955078, -31.68210220336914, -29.1356201171875, -26.58913803100586, -24.04265594482422, -21.496171951293945, -18.949689865112305, -16.403207778930664, -13.856724739074707, -11.31024169921875, -8.76375961303711, -6.2172770500183105, -3.6707944869995117, -1.124311923980713, 1.422170639038086, 3.9686527252197266, 6.515135765075684, 9.06161880493164, 11.60809326171875, 14.15457534790039, 16.70105743408203, 19.247541427612305, 21.794023513793945, 24.340505599975586, 26.88698959350586, 29.4334716796875, 31.97995376586914, 34.52643585205078, 37.07291793823242, 39.61940002441406, 42.16588592529297, 44.712364196777344, 47.25885009765625, 49.80533218383789, 52.35181427001953, 54.89829635620117, 57.44477844238281, 59.99126052856445, 62.537742614746094, 65.084228515625, 67.63070678710938, 70.17719268798828, 72.72367858886719, 75.2701644897461, 77.81664276123047, 80.36312866210938, 82.90960693359375, 85.45609283447266, 88.00257110595703, 90.54905700683594, 93.09553527832031]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 4.0, 4.0, 11.0, 8.0, 10.0, 13.0, 16.0, 21.0, 26.0, 23.0, 37.0, 24.0, 44.0, 59.0, 179.0, 229.0, 62.0, 46.0, 31.0, 28.0, 27.0, 17.0, 16.0, 7.0, 17.0, 7.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.90625, -9.6236572265625, -9.341064453125, -9.0584716796875, -8.77587890625, -8.4932861328125, -8.210693359375, -7.9281005859375, -7.6455078125, -7.3629150390625, -7.080322265625, -6.7977294921875, -6.51513671875, -6.2325439453125, -5.949951171875, -5.6673583984375, -5.384765625, -5.1021728515625, -4.819580078125, -4.5369873046875, -4.25439453125, -3.9718017578125, -3.689208984375, -3.4066162109375, -3.1240234375, -2.8414306640625, -2.558837890625, -2.2762451171875, -1.99365234375, -1.7110595703125, -1.428466796875, -1.1458740234375, -0.86328125, -0.5806884765625, -0.298095703125, -0.0155029296875, 0.26708984375, 0.5496826171875, 0.832275390625, 1.1148681640625, 1.3974609375, 1.6800537109375, 1.962646484375, 2.2452392578125, 2.52783203125, 2.8104248046875, 3.093017578125, 3.3756103515625, 3.658203125, 3.9407958984375, 4.223388671875, 4.5059814453125, 4.78857421875, 5.0711669921875, 5.353759765625, 5.6363525390625, 5.9189453125, 6.2015380859375, 6.484130859375, 6.7667236328125, 7.04931640625, 7.3319091796875, 7.614501953125, 7.8970947265625, 8.1796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 2.0, 0.0, 4.0, 1.0, 9.0, 5.0, 17.0, 19.0, 29.0, 78.0, 122.0, 285.0, 807.0, 4174.0, 7604836.0, 773051.0, 3835.0, 776.0, 263.0, 108.0, 47.0, 41.0, 19.0, 19.0, 14.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.76966857910156, -107.41175079345703, -104.0538330078125, -100.69591522216797, -97.33799743652344, -93.9800796508789, -90.62216186523438, -87.26423645019531, -83.90632629394531, -80.54840850830078, -77.19049072265625, -73.83257293701172, -70.47465515136719, -67.11673736572266, -63.75881576538086, -60.40089797973633, -57.04297637939453, -53.68505859375, -50.32714080810547, -46.96922302246094, -43.611305236816406, -40.253387451171875, -36.89546585083008, -33.53754806518555, -30.179630279541016, -26.821712493896484, -23.463794708251953, -20.10587501525879, -16.747957229614258, -13.390039443969727, -10.032119750976562, -6.674201965332031, -3.3162841796875, 0.04163408279418945, 3.399552345275879, 6.757471084594727, 10.115388870239258, 13.473306655883789, 16.831226348876953, 20.189144134521484, 23.547061920166016, 26.904979705810547, 30.262897491455078, 33.620819091796875, 36.978736877441406, 40.33665466308594, 43.69457244873047, 47.052490234375, 50.41040802001953, 53.76832580566406, 57.126243591308594, 60.484161376953125, 63.842079162597656, 67.19999694824219, 70.55792236328125, 73.91583251953125, 77.27375793457031, 80.63167572021484, 83.98959350585938, 87.3475112915039, 90.70542907714844, 94.06334686279297, 97.4212646484375, 100.77919006347656, 104.13710021972656]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 5.0, 1.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.20687103271484, -77.32122802734375, -74.43557739257812, -71.54993438720703, -68.6642837524414, -65.77864074707031, -62.89299392700195, -60.007347106933594, -57.1217041015625, -54.23605728149414, -51.35041046142578, -48.46476745605469, -45.57912063598633, -42.69347381591797, -39.80782699584961, -36.92218017578125, -34.03653335571289, -31.15088653564453, -28.265241622924805, -25.379594802856445, -22.49394989013672, -19.60830307006836, -16.72265625, -13.837011337280273, -10.951364517211914, -8.065718650817871, -5.18007230758667, -2.2944259643554688, 0.5912199020385742, 3.476865768432617, 6.362512588500977, 9.248157501220703, 12.133804321289062, 15.019450187683105, 17.90509605407715, 20.790742874145508, 23.676387786865234, 26.562034606933594, 29.447681427001953, 32.33332824707031, 35.218971252441406, 38.104618072509766, 40.990264892578125, 43.87590789794922, 46.76155471801758, 49.64720153808594, 52.5328483581543, 55.418495178222656, 58.304141998291016, 61.189788818359375, 64.07543182373047, 66.9610824584961, 69.84672546386719, 72.73237609863281, 75.6180191040039, 78.503662109375, 81.38931274414062, 84.27495574951172, 87.16060638427734, 90.04624938964844, 92.93190002441406, 95.81754302978516, 98.70318603515625, 101.58883666992188, 104.47447967529297]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 10.0, 29.0, 48.0, 78.0, 133.0, 303.0, 585.0, 1293.0, 2864.0, 6498.0, 15555.0, 36810.0, 89011.0, 167120.0, 116824.0, 49659.0, 21010.0, 9070.0, 3810.0, 1808.0, 827.0, 411.0, 204.0, 104.0, 71.0, 45.0, 17.0, 20.0, 10.0, 13.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.5, -35.02001953125, -33.5400390625, -32.06005859375, -30.580078125, -29.10009765625, -27.6201171875, -26.14013671875, -24.66015625, -23.18017578125, -21.7001953125, -20.22021484375, -18.740234375, -17.26025390625, -15.7802734375, -14.30029296875, -12.8203125, -11.34033203125, -9.8603515625, -8.38037109375, -6.900390625, -5.42041015625, -3.9404296875, -2.46044921875, -0.98046875, 0.49951171875, 1.9794921875, 3.45947265625, 4.939453125, 6.41943359375, 7.8994140625, 9.37939453125, 10.859375, 12.33935546875, 13.8193359375, 15.29931640625, 16.779296875, 18.25927734375, 19.7392578125, 21.21923828125, 22.69921875, 24.17919921875, 25.6591796875, 27.13916015625, 28.619140625, 30.09912109375, 31.5791015625, 33.05908203125, 34.5390625, 36.01904296875, 37.4990234375, 38.97900390625, 40.458984375, 41.93896484375, 43.4189453125, 44.89892578125, 46.37890625, 47.85888671875, 49.3388671875, 50.81884765625, 52.298828125, 53.77880859375, 55.2587890625, 56.73876953125, 58.21875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 2.0, 9.0, 10.0, 7.0, 11.0, 16.0, 23.0, 22.0, 20.0, 32.0, 29.0, 37.0, 50.0, 66.0, 54.0, 53.0, 67.0, 71.0, 56.0, 58.0, 48.0, 37.0, 34.0, 37.0, 30.0, 24.0, 8.0, 10.0, 16.0, 14.0, 8.0, 2.0, 8.0, 3.0, 5.0, 5.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.94775390625, -7.6845703125, -7.42138671875, -7.158203125, -6.89501953125, -6.6318359375, -6.36865234375, -6.10546875, -5.84228515625, -5.5791015625, -5.31591796875, -5.052734375, -4.78955078125, -4.5263671875, -4.26318359375, -4.0, -3.73681640625, -3.4736328125, -3.21044921875, -2.947265625, -2.68408203125, -2.4208984375, -2.15771484375, -1.89453125, -1.63134765625, -1.3681640625, -1.10498046875, -0.841796875, -0.57861328125, -0.3154296875, -0.05224609375, 0.2109375, 0.47412109375, 0.7373046875, 1.00048828125, 1.263671875, 1.52685546875, 1.7900390625, 2.05322265625, 2.31640625, 2.57958984375, 2.8427734375, 3.10595703125, 3.369140625, 3.63232421875, 3.8955078125, 4.15869140625, 4.421875, 4.68505859375, 4.9482421875, 5.21142578125, 5.474609375, 5.73779296875, 6.0009765625, 6.26416015625, 6.52734375, 6.79052734375, 7.0537109375, 7.31689453125, 7.580078125, 7.84326171875, 8.1064453125, 8.36962890625, 8.6328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 9.0, 9.0, 20.0, 41.0, 76.0, 102.0, 87.0, 67.0, 21.0, 20.0, 9.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.8221435546875, -34.45989227294922, -32.09764099121094, -29.735387802124023, -27.373136520385742, -25.01088523864746, -22.648632049560547, -20.286380767822266, -17.924129486083984, -15.561878204345703, -13.199625968933105, -10.837373733520508, -8.475122451782227, -6.112871170043945, -3.7506189346313477, -1.38836669921875, 0.9738845825195312, 3.3361363410949707, 5.69838809967041, 8.060640335083008, 10.422891616821289, 12.78514289855957, 15.147395133972168, 17.509647369384766, 19.871898651123047, 22.234149932861328, 24.59640121459961, 26.958654403686523, 29.320905685424805, 31.683156967163086, 34.04541015625, 36.40766143798828, 38.76990509033203, 41.13215637207031, 43.494407653808594, 45.856658935546875, 48.218910217285156, 50.58116149902344, 52.943416595458984, 55.305667877197266, 57.66791915893555, 60.03017044067383, 62.39242172241211, 64.75467681884766, 67.11692810058594, 69.47917938232422, 71.8414306640625, 74.20368194580078, 76.56593322753906, 78.92818450927734, 81.29043579101562, 83.6526870727539, 86.01493835449219, 88.37718963623047, 90.73944091796875, 93.10169982910156, 95.46394348144531, 97.8261947631836, 100.18844604492188, 102.55069732666016, 104.91294860839844, 107.27519989013672, 109.637451171875, 111.99971008300781, 114.3619613647461]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 8.0, 10.0, 6.0, 13.0, 35.0, 58.0, 66.0, 72.0, 62.0, 35.0, 26.0, 21.0, 10.0, 15.0, 2.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15165710449219, -38.915802001953125, -37.67994689941406, -36.444087982177734, -35.20823287963867, -33.97237777709961, -32.73651885986328, -31.50066375732422, -30.264808654785156, -29.028953552246094, -27.7930965423584, -26.557239532470703, -25.32138442993164, -24.085529327392578, -22.849672317504883, -21.613815307617188, -20.377960205078125, -19.142105102539062, -17.906248092651367, -16.670391082763672, -15.43453598022461, -14.19867992401123, -12.962823867797852, -11.726967811584473, -10.491111755371094, -9.255255699157715, -8.019399642944336, -6.783543586730957, -5.547687530517578, -4.311831474304199, -3.0759754180908203, -1.8401193618774414, -0.6042633056640625, 0.6315927505493164, 1.8674488067626953, 3.103304862976074, 4.339160919189453, 5.575016975402832, 6.810873031616211, 8.04672908782959, 9.282585144042969, 10.518441200256348, 11.754297256469727, 12.990153312683105, 14.226009368896484, 15.461865425109863, 16.697721481323242, 17.933578491210938, 19.16943359375, 20.405288696289062, 21.641145706176758, 22.877002716064453, 24.112857818603516, 25.348712921142578, 26.584569931030273, 27.82042694091797, 29.05628204345703, 30.292137145996094, 31.52799415588379, 32.763851165771484, 33.99970626831055, 35.23556137084961, 36.47142028808594, 37.707275390625, 38.94313049316406]}, "eval/loss": 0.9598673582077026, "eval/wer": 0.14415540607575847, "eval/runtime": 868.6571, "eval/samples_per_second": 3.041, "eval/steps_per_second": 0.381} \ No newline at end of file